From 9389af99ba7b66c5bec99d8986444bbcc60d608e Mon Sep 17 00:00:00 2001 From: RTB Date: Fri, 18 Apr 2014 13:17:24 +0200 Subject: [PATCH] removed manual Requests for Wikipedia URLs, as the Wikipedia parser handles those through synonyms --- FourmiCrawler/parsers/ChemSpider.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/FourmiCrawler/parsers/ChemSpider.py b/FourmiCrawler/parsers/ChemSpider.py index 3b22ce4..cf4bae7 100644 --- a/FourmiCrawler/parsers/ChemSpider.py +++ b/FourmiCrawler/parsers/ChemSpider.py @@ -26,8 +26,6 @@ class ChemSpider(Parser): requests.extend(requests_synonyms) requests_properties = self.parse_properties(sel) requests.extend(requests_properties) - for wiki_url in sel.xpath('.//p[@class="syn"][strong]/a[@title="Wiki"]/@href').extract(): - requests.append( Request(url=wiki_url) ) return requests