|
|
- import os
-
- import yaml
- import json
-
-
- class WikidataPEP(object):
- def __init__(self, configFile):
- with open(configFile, "r") as stream:
- try:
- self.config = yaml.safe_load(stream)
- except yaml.YAMLError as exc:
- print(exc)
-
- def importMembersOfParliamentDict(self, listOfCountries):
- self.fullDictionaryMemberLists = {}
-
- for country in listOfCountries:
- print("started to parse data of members of " + country + " ..")
-
- f = open("crawlers/output/" + country + "MemberList.txt")
- text = f.read()
-
- self.fullDictionaryMemberLists[country] = eval(text)
-
- # print(self.fullDictionaryMemberLists)
-
- def checkForEntityIds(self, listOfCountries):
- from wikibaseintegrator import WikibaseIntegrator
- from wikibaseintegrator import wbi_helpers
-
- fullDictionaryMemberLists = self.fullDictionaryMemberLists
-
- for country in listOfCountries:
- for memberId in fullDictionaryMemberLists[country].keys():
- name = fullDictionaryMemberLists[country][memberId]["name"]
-
- results = wbi_helpers.search_entities(search_string=name)
-
- for entityId in results:
- wbi = WikibaseIntegrator()
- wikidata_item = wbi.item.get(entity_id=entityId)
-
- for claimkey in wikidata_item.get_json()["claims"].keys():
- if claimkey == "P31":
- if (
- wikidata_item.get_json()["claims"][claimkey][0][
- "mainsnak"
- ]["datavalue"]["value"]["id"]
- == "Q5"
- ):
- print(entityId)
- print("---------")
- print(name)
- print("is a human")
-
- def createMemberOnWikidata(self):
- from wikibaseintegrator import wbi_login, WikibaseIntegrator
- from wikibaseintegrator.datatypes import ExternalID, Item
- from wikibaseintegrator.wbi_config import config as wbi_config
-
- wbi_config["USER_AGENT"] = "PEPimport/1.0 (https://www.wikidata.org/wiki/User:)"
-
- # login object
- login_instance = wbi_login.OAuth2(consumer_token="", consumer_secret="")
-
- wbi = WikibaseIntegrator(login=login_instance)
-
- # data type object, e.g. for a NCBI gene entrez ID
- isHuman = Item(value="Q5", prop_nr="P31")
- occupationPolitician = ExternalID(value="Q82955", prop_nr="P106")
- occupationDeputy = ExternalID(value="Q1055894", prop_nr="P106")
- # referenceURL = URL(value='http://legislacion.asamblea.gob.ni/Tablas%20Generales.nsf/InfoDiputado.xsp?documentId=3D4CFDC4B3006D70062587C5007C29E1&action=openDocument&SessionID=1868803A06AB73D50B7F89BD0AB', prop_nr='P106')
-
- # print(isHuman)
- # print(referenceURL)
-
- # data goes into a list, because many data objects can be provided to
- data1 = [isHuman]
- data2 = [occupationDeputy]
- data3 = [occupationPolitician]
-
- # Create a new item
- item = wbi.item.new()
-
- # Set an english label
- item.labels.set(language="en", value="Carlos Humberto Ruíz")
-
- # Carlos Humberto Ruiz has the Qid Q116918332
-
- # Set a French description
- item.descriptions.set(
- language="en", value="Nicaraguan National Assembly Deputy"
- )
-
- item.claims.add(data1)
- # item.claims.add(data2)
- # item.claims.add(data3)
- print(item.write())
-
- def editMemberOnWikidata(self, Qid):
- from wikibaseintegrator import wbi_login, WikibaseIntegrator
- from wikibaseintegrator.datatypes import ExternalID, Item, Time, String
- from wikibaseintegrator.wbi_config import config as wbi_config
- from wikibaseintegrator.wbi_enums import ActionIfExists
- from wikibaseintegrator.wbi_enums import WikibaseDatePrecision
-
- wbi_config[
- "USER_AGENT"
- ] = "PEPimport/1.0 (https://www.wikidata.org/wiki/User:Alpcentaur)"
-
- # login object
- login_instance = wbi_login.OAuth2(consumer_token="", consumer_secret="")
-
- wbi = WikibaseIntegrator(login=login_instance)
-
- # data type object, e.g. for a NCBI gene entrez ID
- # isHuman = Item(value='Q5', prop_nr='P31')
- # occupationPolitician = Item(value='Q82955', prop_nr='P106')
- # occupationDeputy = Item(value='Q1055894', prop_nr='P106')
- # referenceURL = ExternalID(value='http://legislacion.asamblea.gob.ni/Tablas%20Generales.nsf/InfoDiputado.xsp?documentId=3D4CFDC4B3006D70062587C5007C29E1&action=openDocument&SessionID=1868803A06AB73D50B7F89BD0AB', prop_nr='P854')
-
- # print(isHuman)
- # print(referenceURL)
-
- references = [
- [
- ExternalID(
- value="http://legislacion.asamblea.gob.ni/Tablas%20Generales.nsf/InfoDiputado.xsp?documentId=3D4CFDC4B3006D70062587C5007C29E1&action=openDocument&SessionID=1868803A06AB73D50B7F89BD0AB",
- prop_nr="P854",
- ),
- Time(
- time="+2023-02-27T00:00:00Z",
- prop_nr="P813",
- precision=WikibaseDatePrecision.DAY,
- ),
- ]
- ]
-
- occupationDeputy = Item(value="Q1055894", prop_nr="P106", references=references)
-
- ## data goes into a list, because many data objects can be provided to
- # data1 = [isHuman]
- data2 = [occupationDeputy]
- # data3 = [occupationPolitician]
- # data4 = [referenceURL]
- ## get item for Qid
- item = wbi.item.get(entity_id=Qid)
-
- # print(item.claims)
-
- # Set an english label
- # item.labels.set(language='en', value='Carlos Humberto Ruíz', action_if_exists=ActionIfExists.KEEP)
-
- # Set a French description
- # item.descriptions.set(language='en', value='Nicaraguan National Assembly Deputy', action_if_exists=ActionIfExists.KEEP)
-
- # item.claims.add(data4)
- item.claims.add(data2)
- # item.claims.add(data3)
- print(item.write())
|