|
|
-
-
- import os
-
- import yaml
- import json
-
-
-
- class WikidataPEP(object):
-
- def __init__(self, configFile):
-
- with open(configFile, "r") as stream:
- try:
- self.config = yaml.safe_load(stream)
- except yaml.YAMLError as exc:
- print(exc)
-
-
- def importMembersOfParliamentDict(self, listOfCountries):
-
- self.fullDictionaryMemberLists = {}
-
- for country in listOfCountries:
-
- print('started to parse data of members of ' + country + ' ..')
-
- f = open('crawlers/output/' + country +'MemberList.txt')
- text = f.read()
-
- self.fullDictionaryMemberLists[country] = eval(text)
-
- #print(self.fullDictionaryMemberLists)
-
-
- def checkForEntityIds(self, listOfCountries):
-
- from wikibaseintegrator import WikibaseIntegrator
- from wikibaseintegrator import wbi_helpers
-
- fullDictionaryMemberLists = self.fullDictionaryMemberLists
-
- for country in listOfCountries:
-
- for memberId in fullDictionaryMemberLists[country].keys():
-
- name = fullDictionaryMemberLists[country][memberId]['name']
-
- results = wbi_helpers.search_entities(search_string=name)
-
-
- for entityId in results:
-
- wbi = WikibaseIntegrator()
- wikidata_item = wbi.item.get(entity_id=entityId)
-
- for claimkey in wikidata_item.get_json()['claims'].keys():
-
- if claimkey == 'P31':
-
- if wikidata_item.get_json()['claims'][claimkey][0]['mainsnak']['datavalue']['value']['id'] == 'Q5':
-
- print(entityId)
- print('---------')
- print(name)
- print('is a human')
-
-
-
-
- def createMemberOnWikidata(self):
-
- from wikibaseintegrator import wbi_login, WikibaseIntegrator
- from wikibaseintegrator.datatypes import ExternalID, Item
- from wikibaseintegrator.wbi_config import config as wbi_config
-
- wbi_config['USER_AGENT'] = 'PEPimport/1.0 (https://www.wikidata.org/wiki/User:Username)'
-
- # login object
- login_instance = wbi_login.OAuth2(consumer_token='', consumer_secret='')
-
- wbi = WikibaseIntegrator(login=login_instance)
-
- # data type object, e.g. for a NCBI gene entrez ID
- isHuman = Item(value='Q5', prop_nr='P31')
- occupationPolitician = ExternalID(value='Q82955', prop_nr='P106')
- occupationDeputy = ExternalID(value='Q1055894', prop_nr='P106')
- #referenceURL = URL(value='http://legislacion.asamblea.gob.ni/Tablas%20Generales.nsf/InfoDiputado.xsp?documentId=3D4CFDC4B3006D70062587C5007C29E1&action=openDocument&SessionID=1868803A06AB73D50B7F89BD0AB', prop_nr='P106')
-
- # print(isHuman)
- # print(referenceURL)
-
- # data goes into a list, because many data objects can be provided to
- data1 = [isHuman]
- data2 = [occupationDeputy]
- data3 = [occupationPolitician]
-
- # Create a new item
- item = wbi.item.new()
-
- # Set an english label
- item.labels.set(language='en', value='Carlos Humberto Ruíz')
-
- # Set a French description
- item.descriptions.set(language='en', value='Nicaraguan National Assembly Deputy')
-
- item.claims.add(data1)
- #item.claims.add(data2)
- #item.claims.add(data3)
- print(item.write())
-
|