tweet_live: comparison script/lib/iri

equal deleted inserted replaced

-:514e0ee0c68a
+:e6b328970ee8
 ts_copy["user_id"] = ts_copy["user"].id
 ts_copy["original_json"] = self.json_txt
 self.tweet = Tweet(**ts_copy)
 self.session.add(self.tweet)
-self.session.flush()
 # get entities
-for ind_type, entity_list in self.json_dict["entities"].items():
+if "entities" in self.json_dict:
-for ind in entity_list:
+for ind_type, entity_list in self.json_dict["entities"].items():
-self.__process_entity(ind, ind_type)
+for ind in entity_list:
+self.__process_entity(ind, ind_type)
+else:
+extractor = twitter_text.Extractor(self.tweet.text)
+for ind in extractor.extract_hashtags_with_indices():
+self.__process_entity(ind, "hashtags")
+for ind in extractor.extract_mentioned_screen_names_with_indices():
+self.__process_entity(ind, "user_mentions")
+for ind in extractor.extract_urls_with_indices():
+self.__process_entity(ind, "urls")
+self.session.flush()
 def __process_twitter_rest(self):
 tweet_nb = self.session.query(Tweet).filter(Tweet.id == self.json_dict["id"]).count()
 if tweet_nb > 0: