From a867b069f27b74c52be8c550d38b27ecda89dafb Mon Sep 17 00:00:00 2001 From: Tony Bowden Date: Tue, 14 Aug 2018 08:58:03 +0100 Subject: [PATCH] Also find via Wikidata P39s --- scraper.rb | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/scraper.rb b/scraper.rb index 53b15b0..6218d44 100644 --- a/scraper.rb +++ b/scraper.rb @@ -4,7 +4,6 @@ require 'pry' require 'wikidata/fetcher' - column_header = 'النائب' ar_names = EveryPolitician::Wikidata.wikipedia_xpath( url: 'https://ar.wikipedia.org/wiki/مجلس_النواب_اللبناني', @@ -13,7 +12,9 @@ ) en_names = EveryPolitician::Wikidata.morph_wikinames(source: 'tmtmtmtm/lebanese-parliament-2009', column: 'wikiname') - en_names2 = WikiData::Category.new( 'Category:Members of the Parliament of Lebanon', 'en').member_titles -EveryPolitician::Wikidata.scrape_wikidata(names: { en: en_names | en_names2, ar: ar_names }, output: false) +sparq = 'SELECT DISTINCT ?item WHERE { ?item p:P39/ps:P39 wd:Q21328581 }' +ids = EveryPolitician::Wikidata.sparql(sparq) + +EveryPolitician::Wikidata.scrape_wikidata(ids: ids, names: { en: en_names | en_names2, ar: ar_names })