app/DoctrineMigrations/Version20140129151724.php
author cavaliet
Wed, 02 Apr 2014 14:35:17 +0200
changeset 113 e4f8c2479e78
parent 110 7602e5ca9c30
child 118 c3f9a6086f52
permissions -rw-r--r--
enhance fr.dbpedia migration for production
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
108
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     1
<?php
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     2
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     3
namespace Application\Migrations;
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     4
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     5
use Doctrine\DBAL\Migrations\AbstractMigration,
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     6
    Doctrine\DBAL\Schema\Schema,
113
e4f8c2479e78 enhance fr.dbpedia migration for production
cavaliet
parents: 110
diff changeset
     7
	IRI\Bundle\WikiTagBundle\Utils\WikiTagUtils,
e4f8c2479e78 enhance fr.dbpedia migration for production
cavaliet
parents: 110
diff changeset
     8
	IRI\Bundle\WikiTagBundle\Listener\DocumentListener;
108
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
     9
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    10
/**
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    11
 * Migration for WikiTagBundle <= V00.13
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    12
 * This migration takes every tag label and searches for the REAL dbpedia uri associated with this label.
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    13
 * Before, the dbpedia uri was manually generated by http://dbpedia.org/resource/ + english_label.
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    14
 * Now we get the dbpedia uri by requesting http://LANG_CODE.dbpedia.org/sparql with the current label.
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    15
 * 
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    16
 */
48af4fad8a44 migration to real dbpedia uri
cavaliet
parents:
diff changeset
    17
class Version20140129151724 extends AbstractMigration
{
    /**
     * Number of tags processed between two intermediate flushes.
     */
    const FLUSH_BATCH_SIZE = 50;

    /**
     * Recomputes the dbpedia uri of the WikiTag tags in three successive passes.
     *
     * Each pass asks WikiTagUtils::getDbpediaUri() for a uri using a different
     * piece of tag data (wikipedia page id, then wikipedia url, then label) and
     * stores whatever comes back on the tag. Passes two and three only look at
     * tags that have a wikipedia url and still have an empty dbpedia uri.
     *
     * @param Schema $schema Unused: this migration only touches data, not the schema.
     */
    public function up(Schema $schema)
    {
        $this->abortIf(
            $this->connection->getDatabasePlatform()->getName() != "mysql",
            "Migration can only be executed safely on 'mysql'."
        );

        // NOTE(review): the entity manager is fetched through the global kernel;
        // this only works when the migration is run from the Symfony console.
        $em = $GLOBALS["kernel"]->getContainer()->get( 'doctrine.orm.entity_manager' );
        // Avoid php annoying memory leaks
        $em->getConnection()->getConfiguration()->setSQLLogger(null);

        // Remove event listener to avoid useless sql queries. Only WikiTag's Tags are modified
        $this->detachDocumentListener($em);

        // First step : we populate the dbpedia uris thanks to the dbpedia-owl:wikiPageID
        $this->populateDbpediaUris(
            $em,
            'FIRST STEP',
            'SELECT t FROM WikiTagBundle:Tag t WHERE t.wikipediaPageId IS NOT NULL ORDER BY t.label ASC',
            function ($tag) {
                return WikiTagUtils::getDbpediaUri($tag->getWikipediaPageId(), [], false, "pageid");
            }
        );

        // Second step : we populate the dbpedia uris not found thanks to the foaf:isPrimaryTopicOf
        $this->populateDbpediaUris(
            $em,
            'SECOND STEP',
            'SELECT t FROM WikiTagBundle:Tag t WHERE (t.wikipediaUrl!=\'\' AND t.wikipediaUrl IS NOT NULL AND (t.dbpediaUri=\'\' OR t.dbpediaUri IS NULL)) ORDER BY t.label ASC',
            function ($tag) {
                return WikiTagUtils::getDbpediaUri($tag->getWikipediaUrl(), [], false, "wikiurl");
            }
        );

        // Third step : we populate the dbpedia uris not found thanks to the rdfs:label
        // NOTE(review): this selection is identical to the second step's one
        // (tags with a wikipedia url and no dbpedia uri) - confirm it is intended.
        $this->populateDbpediaUris(
            $em,
            'THIRD STEP',
            'SELECT t FROM WikiTagBundle:Tag t WHERE (t.wikipediaUrl!=\'\' AND t.wikipediaUrl IS NOT NULL AND (t.dbpediaUri=\'\' OR t.dbpediaUri IS NULL)) ORDER BY t.label ASC',
            function ($tag) {
                return WikiTagUtils::getDbpediaUri($tag->getLabel(), [], false);
            }
        );
    }

    /**
     * Does not restore anything: the previous dbpedia uris are not kept by up(),
     * so this method only performs the platform check.
     *
     * @param Schema $schema Unused.
     */
    public function down(Schema $schema)
    {
        $this->abortIf(
            $this->connection->getDatabasePlatform()->getName() != "mysql",
            "Migration can only be executed safely on 'mysql'."
        );
    }

    /**
     * Finds the registered DocumentListener and unregisters it from the
     * entity manager's event manager for the events listed below.
     *
     * Aborts the migration when no DocumentListener is registered. abortIf()
     * is used instead of die() so that the failure is reported as a failure
     * (die() with a message ends the process with exit status 0).
     *
     * @param object $em The entity manager (doctrine.orm.entity_manager service).
     */
    private function detachDocumentListener($em)
    {
        $evm = $em->getEventManager();

        $documentListener = null;
        foreach ($evm->getListeners() as $listeners) {
            foreach ($listeners as $listener) {
                if ($listener instanceof DocumentListener) {
                    $documentListener = $listener;
                    break 2;
                }
            }
        }

        $this->abortIf($documentListener === null, 'Listener is not registered in the event manager');

        $evm->removeEventListener(
            array('onFlush', 'preRemove', 'postPersist', 'postUpdate', 'postRemove'),
            $documentListener
        );
    }

    /**
     * Runs one pass: loads the tags selected by $dql, assigns each of them the
     * uri returned by $resolveUri, and flushes every FLUSH_BATCH_SIZE tags and
     * once more at the end. Progress is echoed to the standard output.
     *
     * The returned uri is stored on the tag even when it is empty, exactly as
     * the value comes back from $resolveUri.
     *
     * @param object   $em         The entity manager.
     * @param string   $stepName   Label used in the progress output (e.g. "FIRST STEP").
     * @param string   $dql        DQL query selecting the tags to process.
     * @param callable $resolveUri Receives a tag, returns the dbpedia uri to store.
     */
    private function populateDbpediaUris($em, $stepName, $dql, callable $resolveUri)
    {
        echo "\n$stepName";

        $tags = $em->createQuery($dql)->getResult();
        echo "\n".count($tags)." tags to search.";

        $position = 0;
        $nbSet = 0;
        foreach ($tags as $tag) {
            $position++;
            $label = $tag->getLabel();
            $uri = $resolveUri($tag);

            $tag->setDbpediaUri($uri);
            $em->persist($tag);

            // Loose comparison kept on purpose: the exact "not found" value
            // returned by WikiTagUtils::getDbpediaUri() is not visible here.
            if ($uri != null && $uri != "") {
                $nbSet++;
            }

            if ($position % self::FLUSH_BATCH_SIZE == 0) {
                $em->flush();
                echo "\n    FLUSH";
            }

            // The counter is printed after being incremented exactly once, so
            // the first tag is reported as 1 (it used to be reported as 2).
            echo "\n$position : $label \t\t: $uri";
        }

        $em->flush();
        echo "\n$stepName : $nbSet uris found";
    }
}