DoctrineMigrations/Version20140129151724.php
author cavaliet
Tue, 08 Apr 2014 13:13:23 +0200
changeset 127 fafde037c661
parent 123 d48100e2fead
child 129 65c12455ce74
permissions -rw-r--r--
Removed tag V00.15
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
116
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     1
<?php
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     2
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     3
namespace Application\Migrations;
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     4
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     5
use Doctrine\DBAL\Migrations\AbstractMigration,
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     6
    Doctrine\DBAL\Schema\Schema,
123
d48100e2fead enhance fr.dbpedia migration for production
cavaliet
parents: 118
diff changeset
     7
	IRI\Bundle\WikiTagBundle\Utils\WikiTagUtils,
d48100e2fead enhance fr.dbpedia migration for production
cavaliet
parents: 118
diff changeset
     8
	IRI\Bundle\WikiTagBundle\Listener\DocumentListener;
116
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     9
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    10
/**
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    11
 * Migration for WikiTagBundle <= V00.13
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    12
 * This migration takes every tag label and searches for the real DBpedia URI associated with this label.
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    13
 * Before, the dbpedia uri was manually generated by http://dbpedia.org/resource/ + english_label.
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    14
 * Now we get the dbpedia uri by requesting http://LANG_CODE.dbpedia.org/sparql with the current label.
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    15
 * 
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    16
 */
a023e0185a02 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    17
class Version20140129151724 extends AbstractMigration
{
    /**
     * Number of processed tags between two intermediate flushes.
     */
    const FLUSH_BATCH_SIZE = 50;

    /**
     * Re-computes the DBpedia URI of the WikiTag tags in three successive passes:
     * by Wikipedia page id, then by Wikipedia URL, then by label.
     *
     * The DocumentListener is detached from the entity manager while the passes run
     * (only Tag entities are modified) and re-attached afterwards, including when a
     * pass fails.
     *
     * @param Schema $schema Unused: this migration only updates data.
     *
     * @throws \Exception Whatever a lookup or a flush throws is re-thrown once the
     *                    listener has been restored.
     */
    public function up(Schema $schema)
    {
        $this->abortIf(
            $this->connection->getDatabasePlatform()->getName() !== 'mysql',
            'Migration can only be executed safely on \'mysql\'.'
        );

        $em = $GLOBALS['kernel']->getContainer()->get('doctrine.orm.entity_manager');
        // Disable SQL logging to avoid memory build-up during this long-running migration.
        $em->getConnection()->getConfiguration()->setSQLLogger(null);

        // Detach the document listener to avoid useless SQL queries: only WikiTag's Tags are modified.
        $evm = $em->getEventManager();
        $detachedEvents = array('onFlush', 'preRemove', 'postPersist', 'postUpdate', 'postRemove');
        $listenerInst = null;
        $attachedEvents = array();
        foreach ($evm->getListeners() as $event => $listeners) {
            foreach ($listeners as $listener) {
                if (!($listener instanceof DocumentListener)) {
                    continue;
                }
                if ($listenerInst === null) {
                    // Same choice as before: the first DocumentListener found is the one detached.
                    $listenerInst = $listener;
                }
                // Remember where that instance was registered so exactly those
                // registrations can be restored afterwards.
                if ($listener === $listenerInst && in_array($event, $detachedEvents, true)) {
                    $attachedEvents[] = $event;
                }
            }
        }
        // Abort through the migration API instead of killing the PHP process.
        $this->abortIf($listenerInst === null, 'Listener is not registered in the event manager');
        $evm->removeEventListener($detachedEvents, $listenerInst);

        // try/catch + rethrow rather than "finally", which requires PHP >= 5.5.
        try {
            $this->runLookupSteps($em);
        } catch (\Exception $e) {
            $this->restoreListener($evm, $attachedEvents, $listenerInst);
            throw $e;
        }
        $this->restoreListener($evm, $attachedEvents, $listenerInst);
    }

    /**
     * Only checks the database platform: the data migration done by up() is not reverted.
     *
     * @param Schema $schema Unused.
     */
    public function down(Schema $schema)
    {
        $this->abortIf(
            $this->connection->getDatabasePlatform()->getName() !== 'mysql',
            'Migration can only be executed safely on \'mysql\'.'
        );
    }

    /**
     * Runs the three lookup passes in order.
     *
     * @param mixed $em The 'doctrine.orm.entity_manager' service.
     */
    private function runLookupSteps($em)
    {
        // Tags which have a Wikipedia URL but still no DBpedia URI.
        $missingUriDql = 'SELECT t FROM WikiTagBundle:Tag t WHERE (t.wikipediaUrl!=\'\' AND t.wikipediaUrl IS NOT NULL AND (t.dbpediaUri=\'\' OR t.dbpediaUri IS NULL)) ORDER BY t.label ASC';

        // First step: populate the DBpedia URIs thanks to the dbpedia-owl:wikiPageID.
        $this->populateDbpediaUris(
            $em,
            'FIRST STEP',
            'SELECT t FROM WikiTagBundle:Tag t WHERE t.wikipediaPageId IS NOT NULL ORDER BY t.label ASC',
            function ($tag) {
                return WikiTagUtils::getDbpediaUri($tag->getWikipediaPageId(), [], false, "pageid");
            }
        );

        // Second step: populate the DBpedia URIs not found thanks to the foaf:isPrimaryTopicOf.
        $this->populateDbpediaUris(
            $em,
            'SECOND STEP',
            $missingUriDql,
            function ($tag) {
                return WikiTagUtils::getDbpediaUri($tag->getWikipediaUrl(), [], false, "wikiurl");
            }
        );

        // Third step: populate the DBpedia URIs still not found thanks to the rdfs:label.
        // NOTE(review): this pass keeps the original selection, which is restricted to tags
        // having a Wikipedia URL even though the lookup uses the label - confirm it is intended.
        $this->populateDbpediaUris(
            $em,
            'THIRD STEP',
            $missingUriDql,
            function ($tag) {
                return WikiTagUtils::getDbpediaUri($tag->getLabel(), [], false);
            }
        );
    }

    /**
     * Runs one lookup pass: selects tags with $dql, stores the URI returned by $lookup
     * on each of them (even when the lookup returned nothing) and flushes every
     * FLUSH_BATCH_SIZE tags plus once at the end. Progress is echoed to the output.
     *
     * @param mixed    $em       The 'doctrine.orm.entity_manager' service.
     * @param string   $stepName Label echoed before and after the pass.
     * @param string   $dql      DQL query selecting the tags to process.
     * @param callable $lookup   Receives a tag and returns its DBpedia URI.
     *
     * @return int Number of tags for which a non-empty URI was returned.
     */
    private function populateDbpediaUris($em, $stepName, $dql, callable $lookup)
    {
        echo "\n$stepName";
        $tags = $em->createQuery($dql)->getResult();
        echo "\n".count($tags)." tags to search.";

        $processed = 0;
        $nbSet = 0;
        foreach ($tags as $tag) {
            $label = $tag->getLabel();
            $uri = $lookup($tag);
            $tag->setDbpediaUri($uri);
            $em->persist($tag);
            // Loose comparisons kept on purpose: the exact "nothing found" value returned
            // by the lookup is not visible from this file.
            if ($uri != null && $uri != '') {
                $nbSet++;
            }

            // Count first, then print, so the displayed index is the real position of
            // the tag (it used to start at 2).
            $processed++;
            echo "\n$processed : $label \t\t: $uri";

            if ($processed % self::FLUSH_BATCH_SIZE === 0) {
                $em->flush();
                echo "\n    FLUSH";
            }
        }
        $em->flush();
        echo "\n$stepName : $nbSet uris found";

        return $nbSet;
    }

    /**
     * Re-registers the detached listener on the events it was attached to.
     *
     * @param mixed  $evm      The event manager the listener was removed from.
     * @param array  $events   Event names to re-register the listener on.
     * @param object $listener The listener instance to restore.
     */
    private function restoreListener($evm, array $events, $listener)
    {
        if (count($events) > 0) {
            $evm->addEventListener($events, $listener);
        }
    }
}