src/core/wp_utils.py
changeset 4 ae066d797a66
parent 3 221af1052ec4
child 33 61c3ffd94f11
equal deleted inserted replaced
3:221af1052ec4 4:ae066d797a66
   128 
   128 
   129     return { 'new_label': new_label, 'alternative_label': alternative_label, 'status': status, 'wikipedia_url': url, 'pageid': pageid, 'alternative_wikipedia_url': alternative_url, 'alternative_pageid': alternative_pageid, 'dbpedia_uri': dbpedia_uri, 'revision_id': revision_id, 'response': original_response }
   129     return { 'new_label': new_label, 'alternative_label': alternative_label, 'status': status, 'wikipedia_url': url, 'pageid': pageid, 'alternative_wikipedia_url': alternative_url, 'alternative_pageid': alternative_pageid, 'dbpedia_uri': dbpedia_uri, 'revision_id': revision_id, 'response': original_response }
   130 
   130 
   131 
   131 
   132 
   132 
   133 def get_or_create_term(term_label, term_uri, term_lang, thesaurus, wp_label_transform=(lambda l:l)):
   133 def get_or_create_term(term_label, term_uri, term_lang, thesaurus, wp_label_transform=(lambda l:l), skip_wp_query=False):
   134     
   134     
   135     term_label_normalized = normalize_term(term_label)
   135     term_label_normalized = normalize_term(term_label)
   136     # We get the wikipedia references for the tag_label
   136     # We get the wikipedia references for the tag_label
   137     # We get or create the tag object
   137     # We get or create the tag object
   138     
   138     
   159         wikipedia_revision_id = process_term(site, term, label=wp_label_transform(term_label_normalized))
   159         wikipedia_revision_id = process_term(site, term, label=wp_label_transform(term_label_normalized))
   160 
   160 
   161         term_label_obj = TermLabel(label=term_label, term=term, lang=term_lang)
   161         term_label_obj = TermLabel(label=term_label, term=term, lang=term_lang)
   162         term_label_obj.save()
   162         term_label_obj.save()
   163         
   163         
   164     elif term.wikipedia_pageid:
   164     elif term.wikipedia_pageid and not skip_wp_query:
   165         wp_res = query_wikipedia_title(site, pageid=term.wikipedia_pageid)
   165         wp_res = query_wikipedia_title(site, pageid=term.wikipedia_pageid)
   166         wikipedia_revision_id = wp_res['revision_id']
   166         wikipedia_revision_id = wp_res['revision_id']
   167         term.wikipedia_revision_id = wikipedia_revision_id
   167         term.wikipedia_revision_id = wikipedia_revision_id
   168         term.save()
   168         term.save()
   169     else:
   169     else: