src/p4l/management/commands/dump_record.py
author ymh <ymh.work@gmail.com>
Mon, 07 Oct 2013 14:28:31 +0200
changeset 142 c365a6e23a56
parent 132 b23fae63f732
child 145 7c6fe1dab213
permissions -rw-r--r--
Correct dump_record, ensure that ref fields are exported as resources. Correct bug https://github.com/IRI-Research/plan4learning/issues/1
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
     1
# -*- coding: utf-8 -*-
126
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
     2
#
131
f1854630734f change copyright notice
ymh <ymh.work@gmail.com>
parents: 126
diff changeset
     3
# Copyright IRI (c) 2013
126
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
     4
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
     5
# contact@iri.centrepompidou.fr
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
     6
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
     7
# This software is governed by the CeCILL-B license under French law and
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
     8
# abiding by the rules of distribution of free software.  You can  use, 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
     9
# modify and/ or redistribute the software under the terms of the CeCILL-B
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    10
# license as circulated by CEA, CNRS and INRIA at the following URL
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    11
# "http://www.cecill.info". 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    12
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    13
# As a counterpart to the access to the source code and  rights to copy,
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    14
# modify and redistribute granted by the license, users are provided only
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    15
# with a limited warranty  and the software's author,  the holder of the
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    16
# economic rights,  and the successive licensors  have only  limited
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    17
# liability. 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    18
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    19
# In this respect, the user's attention is drawn to the risks associated
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    20
# with loading,  using,  modifying and/or developing or reproducing the
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    21
# software by the user in light of its specific status of free software,
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    22
# that may mean  that it is complicated to manipulate,  and  that  also
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    23
# therefore means  that it is reserved for developers  and  experienced
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    24
# professionals having in-depth computer knowledge. Users are therefore
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    25
# encouraged to load and test the software's suitability as regards their
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    26
# requirements in conditions enabling the security of their systems and/or 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    27
# data to be ensured and,  more generally, to use and operate it in the 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    28
# same conditions as regards security. 
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    29
#
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    30
# The fact that you are presently reading this means that you have had
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    31
# knowledge of the CeCILL-B license and that you accept its terms.
a345f1a67bf1 Python licence headers
ymh <ymh.work@gmail.com>
parents: 107
diff changeset
    32
#
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    33
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    34
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    35
import bz2
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    36
import codecs
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    37
import gzip
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    38
import logging
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    39
from optparse import make_option
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    40
from xml.sax.saxutils import XMLGenerator
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    41
from xml.sax.xmlreader import AttributesNSImpl
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    42
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    43
from django.core.management import BaseCommand
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    44
from django.core.management.base import CommandError
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    45
from django.db.models.fields.related import ForeignKey
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    46
107
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents: 103
diff changeset
    47
from p4l.mapping.constants import GRAPH_NAMESPACES, RDF, get_empty_graph
48440ff95906 small code reorg
ymh <ymh.work@gmail.com>
parents: 103
diff changeset
    48
from p4l.mapping import RecordSerializer
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    49
from p4l.models.data import Record
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    50
from p4l.utils import show_progress
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    51
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    52
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    53
logger = logging.getLogger(__name__)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    54
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    55
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    56
class Command(BaseCommand):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    57
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    58
    args = "file_path..."
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    59
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    60
    help = "Export p4l record rdf format"
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    61
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    62
    option_list = BaseCommand.option_list + (
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    63
        make_option('-l', '--limit',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    64
            dest= 'limit',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    65
            type='int',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    66
            default=-1,
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    67
            help= 'number of record to export. -1 is all (default)' 
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    68
        ),
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    69
        make_option('-s', '--skip',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    70
            dest= 'skip',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    71
            type='int',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    72
            default=0,
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    73
            help= 'number of record to skip before export. default 0.' 
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    74
        ),
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    75
        make_option('-b', '--batch',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    76
            dest= 'batch',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    77
            type='int',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    78
            default=100,
132
b23fae63f732 - correction on documentation
ymh <ymh.work@gmail.com>
parents: 131
diff changeset
    79
            help= 'query batch default 100.' 
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    80
        ),
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    81
        make_option('-j', '--bzip2',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    82
            dest= 'bzip2',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    83
            action='store_true',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    84
            default=False,
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    85
            help= 'bz2 compress' 
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    86
        ),
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    87
        make_option('-z', '--gzip',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    88
            dest= 'gzip',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    89
            action='store_true',
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    90
            default=False,
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    91
            help= 'gzip compress' 
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    92
        ),
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    93
    )
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    94
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    95
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    96
    def get_graph_from_object(self, obj):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    97
        g = get_empty_graph()
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    98
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
    99
        serializer = RecordSerializer()        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   100
        serializer.to_graph(None, obj, None, g)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   101
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   102
        return g
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   103
    
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   104
    
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   105
    def handle(self, *args, **options):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   106
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   107
        if len(args) != 1:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   108
            raise CommandError("This command takes exactly one argument")
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   109
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   110
        filepath = args[0]
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   111
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   112
        bzip2 = options.get('bzip2', False)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   113
        gzip_opt = options.get('gzip', False)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   114
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   115
        if bzip2 and not filepath.endswith(".bz2"):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   116
            filepath += ".bz2"
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   117
        elif gzip_opt and not filepath.endswith(".gz"):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   118
            filepath += ".gz"            
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   119
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   120
        limit = options.get("limit", -1)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   121
        skip = options.get("skip", 0)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   122
        batch = options.get("batch", 100)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   123
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   124
        qs = Record.objects.all().select_related(*[field.name for field in Record._meta.fields if isinstance(field, ForeignKey)]).prefetch_related(*([field.name for field in Record._meta.many_to_many] + [obj.get_accessor_name() for obj in Record._meta.get_all_related_objects()])).order_by('identifier')  # @UndefinedVariable
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   125
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   126
        if limit>=0:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   127
            qs = qs[skip:skip+limit]
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   128
        else:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   129
            qs = qs[skip:]
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   130
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   131
        open_method = None
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   132
        open_args = []
132
b23fae63f732 - correction on documentation
ymh <ymh.work@gmail.com>
parents: 131
diff changeset
   133
        decode_method = lambda s: s
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   134
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   135
        if bzip2:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   136
            open_method = bz2.BZ2File
132
b23fae63f732 - correction on documentation
ymh <ymh.work@gmail.com>
parents: 131
diff changeset
   137
            open_args = [filepath, 'wb', 9]
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   138
        elif gzip_opt:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   139
            open_method = gzip.GzipFile
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   140
            open_args = [filepath, 'wb', 9]
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   141
        else:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   142
            open_method = codecs.open
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   143
            open_args = [filepath, 'wb', "utf-8"]
132
b23fae63f732 - correction on documentation
ymh <ymh.work@gmail.com>
parents: 131
diff changeset
   144
            decode_method = lambda s: s.decode("utf-8")
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   145
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   146
        total_records = qs.count()
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   147
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   148
        print("Total record to export : %d" % total_records)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   149
        progress_writer = None
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   150
        
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   151
        with open_method(*open_args) as dest_file:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   152
            writer = XMLGenerator(dest_file, "UTF-8")
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   153
            writer.startDocument()
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   154
            for prefix,uri in GRAPH_NAMESPACES.items():
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   155
                writer.startPrefixMapping(prefix, uri)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   156
            writer.startElementNS((RDF, 'RDF'), 'RDF', AttributesNSImpl({}, {}))
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   157
            writer.characters("\n")
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   158
            for n in range((total_records/batch)+1):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   159
                for i,r in enumerate(qs[n*batch:((n+1)*batch)]):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   160
                    progress_writer = show_progress(i+(n*batch)+1, total_records, "Exporting record %s" % r.identifier, 50, progress_writer) 
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   161
                    graph = self.get_graph_from_object(r)
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   162
                    do_write = False
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   163
                    for line in graph.serialize(format="pretty-xml", encoding="utf-8").splitlines(True):
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   164
                        if "<iiep:Record" in line:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   165
                            do_write = True
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   166
                        if do_write:
132
b23fae63f732 - correction on documentation
ymh <ymh.work@gmail.com>
parents: 131
diff changeset
   167
                            dest_file.write(decode_method(line))
101
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   168
                        if "</iiep:Record>" in line:
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   169
                            break
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   170
                
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   171
            writer.endElementNS((RDF, 'RDF'), 'RDF')
71532a54d1c4 update virtualenv + implement record serialization
ymh <ymh.work@gmail.com>
parents:
diff changeset
   172
            writer.endDocument()
142
c365a6e23a56 Correct dump_record, ensure that ref fields are exported as resources. Correct bug https://github.com/IRI-Research/plan4learning/issues/1
ymh <ymh.work@gmail.com>
parents: 132
diff changeset
   173
            dest_file.write("\n")