script/lib/iri_tweet/export_twitter_alchemy.py
changeset 22 3823611919ef
parent 21 8003bcd8d9a2
child 23 2b17b26ca153
equal deleted inserted replaced
21:8003bcd8d9a2 22:3823611919ef
   203                         if entity.type == u'entity_hashtag': 
   203                         if entity.type == u'entity_hashtag': 
   204                             etree.SubElement(tags_node,u"tag").text = entity.hashtag.text
   204                             etree.SubElement(tags_node,u"tag").text = entity.hashtag.text
   205                             
   205                             
   206                     meta_element = etree.SubElement(element, u'meta')
   206                     meta_element = etree.SubElement(element, u'meta')
   207                     
   207                     
   208                     m = re.search("(\+\+|\-\-|\?\?|\=\=)",tw.text)
   208                     polemics_element = etree.Element(u'polemics')
   209                     if m:
   209                     polemic_added = False
       
   210                     for m in re.finditer("(\+\+|\-\-|\?\?|\=\=)",tw.text):
       
   211                         polemic_added = True
   210                         pol_link = {
   212                         pol_link = {
   211                             '++' : u'OK',
   213                             '++' : u'OK',
   212                             '--' : u'KO',
   214                             '--' : u'KO',
   213                             '??' : u'Q',
   215                             '??' : u'Q',
   214                             '==' : u'REF'}[m.group(1)]
   216                             '==' : u'REF'}[m.group(1)]
   215                         etree.SubElement(meta_element, u'polemic').text = pol_link
   217                         etree.SubElement(polemics_element, u'polemic').text = pol_link
       
   218                     if polemic_added:
       
   219                         meta_element.append(polemics_element)
   216                     
   220                     
   217                     etree.SubElement(meta_element, u"twitter").text = etree.CDATA(unicode(tw.original_json))
   221                     etree.SubElement(meta_element, u"twitter").text = etree.CDATA(unicode(tw.original_json))
   218                     
   222                     
   219                 
   223                 
   220                 if content_file and os.path.exists(content_file):
   224                 if content_file and os.path.exists(content_file):