web/ldt/ldt_utils/fileimport.py
author ymh <ymh.work@gmail.com>
Thu, 28 Oct 2010 00:37:07 +0200
changeset 19 cbc514bab5bf
parent 1 eb9188f2ee4f
permissions -rw-r--r--
Added tag V00.06 for changeset b9c2a90029e7
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
1
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     1
from copy import deepcopy
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     2
from django.conf import settings
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     3
from django.core.exceptions import ObjectDoesNotExist
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     4
from ldt.utils import zipfileext
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     5
from models import Content, Media
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     6
import fnmatch
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     7
import lxml.etree
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     8
import os.path
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
     9
import shutil
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    10
import tempfile
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    11
import urllib
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    12
import uuid
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    13
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    14
class FileImportError(Exception):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    15
    def __init__(self, value):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    16
        self.value = value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    17
    def __str__(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    18
        return repr(self.value)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    19
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    20
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    21
def Property(func):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    22
    return property(**func()) 
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    23
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    24
class IriInfo(object):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    25
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    26
    
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    27
    def __init__(self, id, order, titledesc, basepath="", videopath=settings.STREAM_URL, decoupage_blacklist = settings.DECOUPAGE_BLACKLIST, flatten = True):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    28
        self.id = id
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    29
        self.basepath = basepath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    30
        self.order = order
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    31
        self.src = ""
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    32
        self.annotations = None
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    33
        self.videopath = videopath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    34
        self.videourl = ""
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    35
        self.title = None
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    36
        self.desc = None
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    37
        self.duration = None
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    38
        self.created = False
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    39
        self.content = None
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    40
        self.decoupage_blacklist = decoupage_blacklist
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    41
        if self.decoupage_blacklist is None:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    42
            self.decoupage_blacklist = ()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    43
        self.flatten = flatten
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    44
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    45
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    46
    
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    47
    def processIri(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    48
        # for just import a file ldt and get the title for every media
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    49
        if 'http' in self.src:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    50
            #url = urllib.urlopen(self.src)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    51
            path = url
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    52
            #doc = xml.dom.minidom.parse(url)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    53
        #for import a zip, get title and copy file .iri in the media directory
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    54
        else:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    55
            path = os.path.join(self.basepath, self.src)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    56
            #doc = xml.dom.minidom.parse(path)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    57
            
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    58
        doc = lxml.etree.parse(path)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    59
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    60
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    61
        #doc = Ft.Xml.Domlette.ConvertDocument(doc) 
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    62
        #con = xml.xpath.Context.Context(doc, 1, 1, None)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    63
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    64
        res = doc.xpath("/iri/head/meta[@name='title']/@content")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    65
        #res = xml.xpath.Evaluate("/iri/head/meta[@name='title']/@content", context=con)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    66
        #self.title = res[0].value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    67
        self.title = res[0]
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    68
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    69
            
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    70
        #res = xml.xpath.Evaluate("/iri/body/ensembles",context=con)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    71
        res = doc.xpath("/iri/body/ensembles")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    72
        ensemblesnode = res[0]
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    73
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    74
        ensembleids = []
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    75
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    76
        for node in ensemblesnode: #ensemblesnode.childNodes:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    77
            #if node.nodeType == xml.dom.Node.ELEMENT_NODE and node.tagName == "ensemble":
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    78
            if node.tag == "ensemble":
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    79
                #id = node.getAttributeNS(None,u"id")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    80
                id = node.attrib["id"]
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    81
                if id not in ensembleids:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    82
                    ensembleids.append(id)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    83
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    84
        if self.annotations is not None:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    85
            newEnsemble = None
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    86
            #for cnode in self.annotations.childNodes:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    87
            for cnode in self.annotations:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    88
                #if cnode.nodeType == xml.dom.Node.ELEMENT_NODE and cnode.tagName == "decoupage":
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    89
                if cnode.tag == "decoupage":
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    90
                    if newEnsemble is None:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    91
                        #newensemble = doc.createElementNS(None,'ensemble')
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    92
                        ensembleid = self.id+"_"+str(uuid.uuid1())
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    93
                        newensemble = lxml.etree.SubElement(ensemblesnode,
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    94
                                                            'ensemble',
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    95
                                                            {'id' : ensembleid,
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    96
                                                             'title' : self.annotations.get('title') or "",
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    97
                                                             'author' : self.annotations.get('author') or "",
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    98
                                                             'date' : self.annotations.get('date') or "",
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
    99
                                                             'abstract' : self.annotations.get('abstract') or ""
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   100
                                                             }
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   101
                                                            )                        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   102
                        ensembleids.append(ensembleid)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   103
                    newDecoupageNode = deepcopy(cnode)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   104
                    newensemble.append(newDecoupageNode)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   105
                #elif cnode.nodeType == xml.dom.Node.ELEMENT_NODE and cnode.tagName == "ensemble":
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   106
                elif cnode.tag == "ensemble":
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   107
                    #ensembleid = cnode.getAttribute(u"id")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   108
                    ensembleid = cnode.attrib['id']
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   109
                    cloneNode = deepcopy(cnode)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   110
                    if ensembleid in ensembleids:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   111
                        ensembleid = self.id+"_"+str(uuid.uuid1())
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   112
                        cloneNode.set(u"id", ensembleid)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   113
                    ensembleids.append(ensembleid)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   114
                    ensemblesnode.append(cloneNode)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   115
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   116
        res = doc.xpath("/iri/body/medias/media[@id='video']/video")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   117
        if self.flatten:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   118
            src_video = res[0].get('src')
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   119
            self.videourl = os.path.basename(src_video)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   120
            res[0].set('src', self.videourl)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   121
        self.duration = res[0].get(u'dur')
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   122
            
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   123
        f = open(path, "w")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   124
        try:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   125
            #etree = lxml.etree.ElementTree(doc)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   126
            doc.write(f, encoding="UTF-8", pretty_print=True, xml_declaration=True)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   127
#            xml.dom.ext.Print(doc, stream=f)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   128
        finally:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   129
            f.close()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   130
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   131
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   132
        destPath = os.path.join(os.path.join(os.path.join(settings.MEDIA_ROOT, "media"), "ldt"), self.id);
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   133
        if not os.path.exists(destPath):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   134
            os.makedirs(destPath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   135
        shutil.move(os.path.join(self.basepath, self.src), os.path.join(destPath, os.path.basename(self.src)))
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   136
        self.src = self.id + u"/" + os.path.basename(self.src)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   137
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   138
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   139
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   140
    def saveContent(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   141
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   142
        defaults_media = {'src':unicode(self.videourl), 'title':unicode(self.title), 'description':unicode(self.desc), 'videopath': unicode(self.videopath.rstrip("/") + "/")}
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   143
        media, media_created = Media.objects.get_or_create(src=unicode(self.videourl), defaults = defaults_media)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   144
        if not media_created:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   145
            for key, value in defaults_media.items():
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   146
                setattr(media, key, value)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   147
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   148
        media.save()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   149
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   150
        defaults_content = { 
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   151
            'iriurl': unicode(self.src), 
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   152
            'title':unicode(self.title),
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   153
            'description':unicode(self.desc),
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   154
            'media':media,
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   155
            'iri':unicode(self.id + u"/" + os.path.basename(self.src)),
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   156
            'duration':int(self.duration)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   157
        }
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   158
        content, self.created = Content.objects.get_or_create(iri_id=self.id, defaults = defaults_content)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   159
        if not self.created:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   160
            for key, value in defaults_content.items():
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   161
                setattr(content, key, value)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   162
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   163
        content.save()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   164
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   165
        self.content = content
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   166
            
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   167
    def process(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   168
        self.processIri()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   169
        self.saveContent()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   170
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   171
class BaseFileImport(object):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   172
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   173
    def __init__(self, filepath, videopath):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   174
        self.__filepath = filepath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   175
        self.__tempdir = ""
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   176
        self.__videopath = videopath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   177
        self.__author = None
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   178
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   179
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   180
    def filepath(): #@NoSelf
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   181
        doc = """Docstring""" #@UnusedVariable
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   182
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   183
        def fget(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   184
            return self.__filepath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   185
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   186
        def fset(self, value):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   187
            self.__filepath = value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   188
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   189
        def fdel(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   190
            del self.__filepath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   191
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   192
        return locals()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   193
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   194
    filepath = property(**filepath())
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   195
    
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   196
    def videopath(): #@NoSelf
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   197
        doc = """Docstring""" #@UnusedVariable
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   198
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   199
        def fget(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   200
            return self.__videopath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   201
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   202
        def fset(self, value):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   203
            self.__videopath = value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   204
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   205
        def fdel(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   206
            del self.__videopath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   207
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   208
        return locals()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   209
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   210
    videopath = property(**videopath())
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   211
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   212
    def author(): #@NoSelf
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   213
        doc = """Docstring""" #@UnusedVariable
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   214
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   215
        def fget(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   216
            return self.__author
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   217
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   218
        def fset(self, value):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   219
            self.__author = value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   220
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   221
        def fdel(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   222
            del self.__author
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   223
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   224
        return locals()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   225
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   226
    author = property(**author())
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   227
    
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   228
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   229
class FileImport(BaseFileImport):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   230
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   231
    def __init__(self, filepath, videopath, flatten):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   232
        BaseFileImport.__init__(self, filepath, videopath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   233
        self.__checkExistingMedia = False
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   234
        self.__flatten = flatten
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   235
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   236
    def checkExistingMedia(): #@NoSelf
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   237
        doc = """Docstring""" #@UnusedVariable
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   238
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   239
        def fget(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   240
            return self.__checkExistingMedia
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   241
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   242
        def fset(self, value):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   243
            self.__checkExistingMedia = value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   244
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   245
        def fdel(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   246
            del self.__checkExistingMedia
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   247
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   248
        return locals()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   249
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   250
    checkExistingMedia = property(**checkExistingMedia())    
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   251
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   252
    def flatten(): #@NoSelf
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   253
        doc = """Docstring""" #@UnusedVariable
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   254
       
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   255
        def fget(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   256
            return self.__flatten
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   257
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   258
        def fset(self, value):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   259
            self.__flatten = value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   260
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   261
        def fdel(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   262
            del self.__flatten
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   263
           
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   264
        return locals()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   265
    flatten = property(**flatten())
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   266
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   267
    def processLdt(self, ldtpath=None):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   268
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   269
        # list iri
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   270
        # see if there is some comments
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   271
        # inject comment in iri
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   272
        # copy iri in folder
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   273
        # create or update content
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   274
        contents = {}
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   275
        filepath = ldtpath if ldtpath else self.filepath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   276
        doc = lxml.etree.parse(filepath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   277
        #if ldtpath:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   278
            #doc = xml.dom.minidom.parse(ldtpath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   279
        #    doc = lxml.etree.parse(ldtpath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   280
        #else:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   281
            #doc = xml.dom.minidom.parse(self.filepath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   282
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   283
        #con = xml.xpath.Context.Context(doc, 1, 1, None)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   284
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   285
        #get author from file ldt
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   286
        #result = xml.xpath.Evaluate("/iri/project", context=con)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   287
        result = doc.xpath("/iri/project")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   288
        for pnode in result:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   289
            #author = pnode.getAttributeNS(None,u"user")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   290
            author = pnode.attrib[u"user"]
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   291
            if author:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   292
                self.author = unicode(author)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   293
                break 
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   294
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   295
        result = doc.xpath("/iri/medias/media")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   296
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   297
        for i, medianode in  enumerate(result):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   298
        # get iri file's id from file ldt
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   299
            #id = medianode.attributes['id'].value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   300
            id = medianode.attrib['id']
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   301
            if self.checkExistingMedia:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   302
                try:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   303
                    Content.objects.get(iri_id=id)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   304
                    do_pass = True
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   305
                except ObjectDoesNotExist: #Content.DoesNotExist
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   306
                    do_pass = False
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   307
            else:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   308
                    do_pass = False
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   309
            if not do_pass:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   310
                if not (contents.has_key(id)):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   311
                    # Create instance iriInfo(id, order, titledesc, basepath="", videopath=settings.STREAM_URL)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   312
                    if ldtpath:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   313
                        contents[id] = IriInfo(id, i, "", os.path.dirname(ldtpath), flatten=self.flatten)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   314
                    else: 
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   315
                        contents[id] = IriInfo(id, i, "", flatten=self.flatten)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   316
                    # Get iri file's url from ldt. This url can be relative path or absolute path.
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   317
                #contents[id].src = medianode.attributes['src'].value
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   318
                contents[id].src = medianode.attrib['src']
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   319
                if medianode.attrib['video'] !="":
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   320
                    contents[id].videopath = medianode.attrib['video']
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   321
                elif self.videopath !="" or self.videopath:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   322
                    contents[id].videopath = self.videopath
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   323
                else:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   324
                    contents[id].videopath =settings.STREAM_URL
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   325
                    
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   326
                
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   327
        #get annotation of file ldt
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   328
        result = doc.xpath("/iri/annotations/content")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   329
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   330
        for contentnode in result:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   331
            id = contentnode.attrib['id']
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   332
            if contents.has_key(id):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   333
                if self.author:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   334
                    contentnode.set("author", unicode(self.author))
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   335
                contents[id].annotations = contentnode
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   336
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   337
        #go throught values
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   338
        for iriinfo in contents.values():
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   339
            
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   340
            iriinfo.process()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   341
            
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   342
            # if yes update
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   343
            # if no create
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   344
            # move iri file to the proper place
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   345
            #return list of iriInfo
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   346
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   347
    def processFile(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   348
        if self.filepath.name.endswith(".ldt"):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   349
            self.processLdt()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   350
        elif self.filepath.name.endswith(".zip"):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   351
            self.processZip()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   352
        else:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   353
            raise FileImportError("Bad file type")
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   354
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   355
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   356
    def processZip(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   357
    # """ extraire .zip, pass to method processLdt"""
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   358
        # create temp directory
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   359
        self.__tempdir = tempfile.mkdtemp()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   360
        openfiles = []
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   361
        flvfiles = []
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   362
        processedids = []
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   363
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   364
        try:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   365
            zipfile = zipfileext.ZipFileExt(self.filepath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   366
            zipfile.unzip_into_dir(self.__tempdir)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   367
            #load ldt
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   368
            foldersToProcess = [self.__tempdir]
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   369
            while len(foldersToProcess):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   370
                currentFolder = foldersToProcess.pop()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   371
                for entry in os.listdir(currentFolder):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   372
                    if entry in settings.ZIP_BLACKLIST:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   373
                        continue
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   374
                    entryPath = os.path.join(currentFolder, entry)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   375
                    if(os.path.isdir(entryPath)):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   376
                        foldersToProcess.append(entryPath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   377
                    elif fnmatch.fnmatch(entry, "*.ldt"):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   378
                        ldtid = self.processLdt(entryPath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   379
                        processedids.append(ldtid)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   380
                    elif fnmatch.fnmatch(entry, "*.flv"):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   381
                        flvfiles.append(entryPath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   382
             
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   383
            if settings.CONTENT_ROOT and os.path.exists(settings.CONTENT_ROOT): 
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   384
                for entry in flvfiles:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   385
                    shutil.copy(entry, settings.CONTENT_ROOT)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   386
                    
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   387
        finally:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   388
            for f in openfiles:
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   389
                f.close()
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   390
            shutil.rmtree(self.__tempdir)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   391
        # delete directory
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   392
        return processedids
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   393
        
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   394
    # def processFileLdt(self):
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   395
        # processedids = []
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   396
        # ldtid = self.processLdt(self.filepath)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   397
        # processedids.append(ldtid)
eb9188f2ee4f first commit
wakimd
parents:
diff changeset
   398
        # return processedids