src/p4l/mapping/parsers.py
author ymh <ymh.work@gmail.com>
Wed, 02 Oct 2013 05:30:06 +0200
changeset 135 c9f22e2987ea
parent 131 f1854630734f
child 137 bb8bf2688d7e
permissions -rw-r--r--
Add a reminder that the application needs sesame
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
107
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
     1
# -*- coding: utf-8 -*-
126
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
     2
#
131
f1854630734f change copyright notice
ymh <ymh.work@gmail.com>
parents: 126
diff changeset
     3
# Copyright IRI (c) 2013
126
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
     4
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
     5
# contact@iri.centrepompidou.fr
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
     6
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
     7
# This software is governed by the CeCILL-B license under French law and
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
     8
# abiding by the rules of distribution of free software.  You can  use, 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
     9
# modify and/ or redistribute the software under the terms of the CeCILL-B
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    10
# license as circulated by CEA, CNRS and INRIA at the following URL
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    11
# "http://www.cecill.info". 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    12
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    13
# As a counterpart to the access to the source code and  rights to copy,
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    14
# modify and redistribute granted by the license, users are provided only
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    15
# with a limited warranty  and the software's author,  the holder of the
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    16
# economic rights,  and the successive licensors  have only  limited
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    17
# liability. 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    18
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    19
# In this respect, the user's attention is drawn to the risks associated
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    20
# with loading,  using,  modifying and/or developing or reproducing the
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    21
# software by the user in light of its specific status of free software,
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    22
# that may mean  that it is complicated to manipulate,  and  that  also
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    23
# therefore means  that it is reserved for developers  and  experienced
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    24
# professionals having in-depth computer knowledge. Users are therefore
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    25
# encouraged to load and test the software's suitability as regards their
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    26
# requirements in conditions enabling the security of their systems and/or 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    27
# data to be ensured and,  more generally, to use and operate it in the 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    28
# same conditions as regards security. 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    29
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    30
# The fact that you are presently reading this means that you have had
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    31
# knowledge of the CeCILL-B license and that you accept its terms.
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 119
diff changeset
    32
#
107
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    33
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    34
from rdflib.plugins.sparql.processor import prepareQuery
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    35
from rdflib.term import URIRef
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    36
from p4l.models.data import Language, Record
119
ece69ca3ac24 - correct import pour indexation
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    37
from p4l.models import signals
107
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    38
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    39
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    40
class QueryCache(object):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    41
    def __init__(self, *args, **kwargs):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    42
        self.__query_cache = {}
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    43
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    44
    def get_sparql_query(self, query, namespaces_dict):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    45
        return self.__query_cache.get(query, False) \
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    46
            or self.__query_cache.setdefault(query, prepareQuery(query, initNs=namespaces_dict))
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    47
    
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    48
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    49
def convert_bool(val):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    50
    if val == True or val == False:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    51
        return val
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    52
    if val is None:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    53
        return False
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    54
    if isinstance(val, basestring):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    55
        if len(val) == 0:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    56
            return False
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    57
        if val[0].lower() in ['t','y','1','o']:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    58
            return True
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    59
        else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    60
            return False        
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    61
    return bool(val)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    62
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    63
class RecordParser(object):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    64
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    65
    
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    66
    def __init__(self, query_cache = None):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    67
        self.query_cache = None
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    68
        if self.query_cache is None:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    69
            self.query_cache = QueryCache()        
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    70
    
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    71
    def extract_single_value_form_graph(self, graph, q, bindings={}, index=0, convert=lambda v:unicode(v) if v is not None else None, default=None):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    72
        return next(self.extract_multiple_values_from_graph(graph, q, bindings, index, convert), default)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    73
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    74
    def extract_multiple_values_from_graph(self, graph, q, bindings={}, index=0, convert=lambda v:unicode(v) if v is not None else None):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    75
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    76
        index_list = index
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    77
        if isinstance(index, int):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    78
            index_list = range(index+1)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    79
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    80
        if hasattr(convert, '__call__'):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    81
            convert_dict = dict((k, convert) for k in index_list)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    82
        else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    83
            convert_dict = convert
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    84
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    85
        convert_dict = dict((k, f if hasattr(f,'__call__') else lambda v:unicode(v) if v is not None else None) for k,f in convert_dict.iteritems())
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    86
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    87
        for row in graph.query(self.query_cache.get_sparql_query(q, dict(graph.namespaces())), initBindings=bindings):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    88
            if len(row) < len(index_list):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    89
                break
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    90
            else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    91
                res = dict([ (k, convert_dict.get(k, lambda v:unicode(v) if v is not None else None)(v)) for k, v in zip(index_list, row)])
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    92
                if isinstance(index, int):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    93
                    yield res[index]
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    94
                else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    95
                    yield res
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    96
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    97
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    98
    def convert_bool(self, val):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
    99
        if val == True or val == False:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   100
            return val
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   101
        if val is None:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   102
            return False
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   103
        if isinstance(val, basestring):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   104
            if len(val) == 0:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   105
                return False
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   106
            if val[0].lower() in ['t','y','1','o']:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   107
                return True
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   108
            else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   109
                return False        
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   110
        return bool(val)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   111
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   112
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   113
    def add_to_related_collection(self, coll, graph, fields, q, bindings={},  convert=lambda v: unicode(v) if v is not None else None, through_fields=None):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   114
        
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   115
        for val in self.extract_multiple_values_from_graph(graph, q, bindings=bindings, index=fields, convert=convert):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   116
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   117
            if through_fields:                
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   118
                new_obj_val = dict([(k,v) for k,v in val.iteritems() if k not in through_fields])
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   119
            else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   120
                new_obj_val = val
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   121
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   122
            if hasattr(coll, 'through'):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   123
                new_obj_rel, _ = coll.model.objects.get_or_create(**new_obj_val)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   124
                if through_fields:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   125
                    through_vals = {coll.source_field_name: coll.instance, coll.target_field_name: new_obj_rel}
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   126
                    through_vals.update(dict([(k,v) for k,v in val.iteritems() if k in through_fields]))
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   127
                    coll.through.objects.create(**through_vals)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   128
                    new_obj = None
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   129
                else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   130
                    new_obj = new_obj_rel
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   131
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   132
            else:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   133
                new_obj = coll.create(**new_obj_val)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   134
            
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   135
            if new_obj:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   136
                coll.add(new_obj)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   137
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   138
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   139
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   140
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   141
    def build_record(self, graph, delete=True):
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   142
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   143
        record_uri = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?s WHERE { ?s rdf:type iiep:Record .}")
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   144
        record_identifier = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s dct:identifier ?o .}", bindings={'s':URIRef(record_uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   145
        
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   146
        if delete:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   147
            Record.objects.filter(identifier=record_identifier).delete()
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   148
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   149
        record = Record()
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   150
        record.uri = record_uri
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   151
        record.identifier = record_identifier
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   152
        record.notes = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s iiep:notes ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   153
        record.recordType = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s dct:type ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   154
        record.isDocumentPart = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s iiep:isDocumentPart ?o .}", bindings={'s':URIRef(record.uri)}, convert=self.convert_bool, default=False)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   155
        record.hidden = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s iiep:hidden ?o .}", bindings={'s':URIRef(record.uri)}, convert=self.convert_bool, default=False)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   156
        record.restricted = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s iiep:restricted ?o .}", bindings={'s':URIRef(record.uri)}, convert=self.convert_bool, default=False)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   157
        record.editionStatement = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s iiep:editionStatement ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   158
        record.corporateAuthorLabel = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s iiep:corporateAuthorLabel ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   159
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   160
        language = self.extract_single_value_form_graph(graph,"SELECT DISTINCT ?o WHERE { ?s dct:language ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   161
        if language:
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   162
            record.language, _ = Language.objects.get_or_create(uri=language)
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   163
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   164
        record.save()
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   165
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   166
        self.add_to_related_collection(record.otherLanguages, graph,  ['uri'], "SELECT ?o WHERE { ?s iiep:otherLanguage ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   167
        self.add_to_related_collection(record.subjects, graph, ['uri'], "SELECT ?o WHERE { ?s dct:subject ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   168
        self.add_to_related_collection(record.themes, graph, ['uri'], "SELECT ?o WHERE { ?s iiep:theme ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   169
        self.add_to_related_collection(record.countries, graph,  ['uri'], "SELECT ?o WHERE { ?s iiep:country ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   170
        self.add_to_related_collection(record.authors, graph, ['name'], "SELECT ?o WHERE { ?s iiep:author ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   171
        self.add_to_related_collection(record.subjectPersons, graph, ['name'], "SELECT ?o WHERE { ?s iiep:subjectPerson ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   172
        self.add_to_related_collection(record.projectNames, graph, ['uri'], "SELECT ?o WHERE { ?s iiep:projectName ?o . }")
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   173
        self.add_to_related_collection(record.audiences, graph,  ['uri'], "SELECT ?o WHERE { ?s dct:audience ?o .}", bindings={'s':URIRef(record.uri)})
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   174
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   175
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   176
            record.periodicals,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   177
            graph, 
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   178
            ['label','lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   179
            "SELECT DISTINCT ?o  ( lang(?o) as ?l) WHERE { ?s iiep:periodical ?o .}",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   180
            bindings={'s':URIRef(record.uri)}
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   181
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   182
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   183
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   184
            record.meetings,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   185
            graph, 
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   186
            ['label', 'meetingNumber', 'meetingPlace', 'meetingDate', 'meetingYear', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   187
            "SELECT ?l ?mn ?mp ?md ?my (lang(COALESCE(?l,?nm, ?mp,?md,?my)) as ?lang) WHERE { [iiep:meeting ?bnode]. OPTIONAL { ?bnode rdfs:label ?l }. OPTIONAL { ?bnode iiep:meetingNumber ?mn }. OPTIONAL { ?bnode iiep:meetingPlace ?mp }.  OPTIONAL { ?bnode iiep:meetingDate ?md }. OPTIONAL { ?bnode iiep:meetingYear ?my }}",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   188
            convert={'meetingYear' : lambda y: int(y) if y is not None else None}
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   189
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   190
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   191
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   192
            record.series,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   193
            graph, 
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   194
            ['title', 'volume', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   195
            "SELECT ?t ?vol (lang(COALESCE(?t,?vol)) as ?lang) WHERE { [iiep:serie ?bnode]. OPTIONAL { ?bnode dct:title ?t }. OPTIONAL { ?bnode iiep:volume ?vol } }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   196
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   197
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   198
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   199
            record.subjectCorporateBodies,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   200
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   201
            ['uri'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   202
            "SELECT ?o WHERE { ?s iiep:subjectCorporateBody ?o. }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   203
            bindings={'s':URIRef(record.uri)}
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   204
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   205
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   206
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   207
            record.subjectMeetings,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   208
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   209
            ['label', 'meetingNumber', 'meetingPlace', 'meetingDate', 'meetingYear'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   210
            "SELECT ?l ?mn ?mp ?md ?my WHERE { [iiep:subjectMeeting ?bnode]. OPTIONAL { ?bnode rdfs:label ?l }. OPTIONAL { ?bnode iiep:meetingNumber ?mn }. OPTIONAL { ?bnode iiep:meetingPlace ?mp }.  OPTIONAL { ?bnode iiep:meetingDate ?md }. OPTIONAL { ?bnode iiep:meetingYear ?my }}",            
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   211
            convert={'meetingYear' : lambda y: int(y) if y is not None else None}
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   212
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   213
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   214
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   215
            record.corporateAuthors,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   216
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   217
            ['uri'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   218
            "SELECT ?o WHERE { ?s iiep:corporateAuthor ?o.}",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   219
            bindings={'s':URIRef(record.uri)}            
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   220
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   221
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   222
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   223
            record.issns,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   224
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   225
            ['issn', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   226
            "SELECT ?issn (lang(COALESCE(?issn)) as ?lang) WHERE { ?s iiep:issn ?issn . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   227
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   228
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   229
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   230
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   231
            record.isbns,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   232
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   233
            ['isbn', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   234
            "SELECT ?isbn (lang(COALESCE(?isbn)) as ?lang) WHERE { ?s iiep:isbn ?isbn . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   235
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   236
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   237
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   238
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   239
            record.documentCodes,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   240
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   241
            ['documentCode', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   242
            "SELECT ?c (lang(COALESCE(?c)) as ?lang) WHERE { ?s iiep:documentCode ?c . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   243
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   244
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   245
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   246
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   247
            record.titles,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   248
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   249
            ['title', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   250
            "SELECT ?t (lang(COALESCE(?t)) as ?lang) WHERE { ?s dct:title ?t . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   251
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   252
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   253
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   254
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   255
            record.abstracts,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   256
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   257
            ['abstract', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   258
            "SELECT ?t (lang(COALESCE(?t)) as ?lang) WHERE { ?s dct:abstract ?t . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   259
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   260
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   261
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   262
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   263
            record.addedTitles,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   264
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   265
            ['title', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   266
            "SELECT ?t (lang(COALESCE(?t)) as ?lang) WHERE { ?s iiep:addedTitle ?t . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   267
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   268
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   269
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   270
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   271
            record.titlesMainDocument,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   272
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   273
            ['title', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   274
            "SELECT ?t (lang(COALESCE(?t)) as ?lang) WHERE { ?s iiep:titleMainDocument ?t . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   275
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   276
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   277
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   278
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   279
            record.imprints,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   280
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   281
            ['imprintCity', 'publisher', 'imprintDate', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   282
            "SELECT ?c ?p ?d (lang(COALESCE(?c, ?p, ?d)) as ?lang) WHERE { [ iiep:imprint ?bnode ]. OPTIONAL { ?bnode iiep:imprintCity ?c }. OPTIONAL { ?bnode dct:publisher ?p }. OPTIONAL { ?bnode iiep:imprintDate ?d }}",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   283
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   284
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   285
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   286
            record.collations,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   287
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   288
            ['collation', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   289
            "SELECT ?c (lang(COALESCE(?c)) as ?lang) WHERE { ?s iiep:collation ?c . }",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   290
            bindings={'s':URIRef(record.uri)},
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   291
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   292
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   293
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   294
            record.volumeIssues,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   295
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   296
            ['volume', 'number', 'lang'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   297
            "SELECT ?v ?n (lang(COALESCE(?v, ?n)) as ?lang) WHERE { [ iiep:volumeIssue ?bnode ]. OPTIONAL { ?bnode iiep:volume ?v }. OPTIONAL { ?bnode iiep:number ?n }}",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   298
        )
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   299
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   300
        self.add_to_related_collection(
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   301
            record.urls,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   302
            graph,
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   303
            ['address', 'display'],
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   304
            "SELECT ?a ?d WHERE { [ iiep:url ?bnode ]. OPTIONAL { ?bnode iiep:address ?a }. OPTIONAL { ?bnode iiep:display ?d }.}",
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   305
        )
119
ece69ca3ac24 - correct import pour indexation
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
   306
        
ece69ca3ac24 - correct import pour indexation
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
   307
        signals.record_saved.send(Record, instance=record, created=True)
107
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   308
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents:
diff changeset
   309
        return record