Browse Source

update to config.yaml

onlinkgen
alpcentaur 1 year ago
parent
commit
7aa903883b
2 changed files with 9 additions and 6 deletions
  1. +8
    -5
      spiders/config.yaml
  2. +1
    -1
      spiders/fdb_spider.py

+ 8
- 5
spiders/config.yaml View File

@@ -6,11 +6,14 @@
foerderinfo.bund.de: foerderinfo.bund.de:
domain: 'http://foerderinfo.bund.de' domain: 'http://foerderinfo.bund.de'
entryList:
link: ''
parent: '//html//body//form//table//tr//td//table//tr'
child-name: '//td//a/text()'
child-link: '//td//a/@href'
entry-list:
link1: 'https://www.foerderinfo.bund.de/SiteGlobals/Forms/foerderinfo/expertensuche/Servicesuche_Formular.html#searchResults'
link2: 'https://www.foerderinfo.bund.de/SiteGlobals/Forms/foerderinfo/expertensuche/Servicesuche_Formular.html?gtp=33498_list%253D2#searchResults'
link3: 'https://www.foerderinfo.bund.de/SiteGlobals/Forms/foerderinfo/expertensuche/Servicesuche_Formular.html?gtp=33498_list%253D3#searchResults'
iteration-var-list: [1,1
parent: '//html//body//form//table//tr//td//table//tr'
child-name: '//td//a/text()'
child-link: '//td//a/@href'
member: member:
info-1: info-1:
parent: '//html//body//form//table' parent: '//html//body//form//table'

+ 1
- 1
spiders/fdb_spider.py View File

@@ -35,7 +35,7 @@ class fdb_spider(object):
) )
try: try:
entry_list_link = entry_list.get("link") entry_list_link = entry_list.get("link")
except Exception as e:
except Exception as e:
print( print(
"No entryListLink defined in config.yaml - the original error message is:", "No entryListLink defined in config.yaml - the original error message is:",
e, e,

Loading…
Cancel
Save