Add initial syntax for the per-country general settings YAML

This commit is contained in:
corsaronero 2023-02-24 18:29:55 +00:00
parent 2e46df3260
commit b4223bca30

15
crawlers/countries.yaml Normal file
View file

@ -0,0 +1,15 @@
# Settings for the PEP crawler, with one top-level entry per country to crawl.
# Follow the syntax of the existing entries when adding a new country.
# Crawl settings for Nicaragua.
# NOTE(review): the nesting below is reconstructed from the key names
# (memberList and member under the country, info-1 under member) — confirm
# against the crawler that consumes this file.
# NOTE(review): the `.N` suffixes (tr.0, td.1, label.1) look like positional
# indices and `.text` / `.href` like the value to extract — TODO confirm.
nicaragua:
  # Start URL of the member listing plus the element paths used on that page.
  # Presumably `parent` is the container and each `child-*` path locates one
  # field inside it — verify against the crawler.
  memberList:
    link: 'http://legislacion.asamblea.gob.ni/Tablas%20Generales.nsf/Main.xsp'
    parent: [html, body, form, table, tbody, tr, td, table, tbody]
    # `td.null` is the plain string "td.null", not a YAML null.
    child-name: [html, body, form, table, tbody, tr, td, table, tbody, tr, td.null, a.text]
    child-link: [html, body, form, table, tbody, tr, td, table, tbody, tr, td.null, a.href]
  # Element paths for an individual member's page (presumably the page
  # reached through `child-link` above — TODO confirm).
  member:
    info-1:
      parent: [html, body, form, table, tbody]
      child-name: [html, body, form, table, tbody, tr.0, td.1, span]
      child-image: [html, body, form, table, tbody, tr.1, td.0, span, img]
      # Quoted so the element containing spaces and `+` reads as one string.
      child-role: [html, body, form, table, tbody, tr.1, td.2, 'span + label.1']