diff --git a/FourmiCrawler/parsers/ChemSpider.py b/FourmiCrawler/parsers/ChemSpider.py index 7141839..98f0c05 100644 --- a/FourmiCrawler/parsers/ChemSpider.py +++ b/FourmiCrawler/parsers/ChemSpider.py @@ -94,13 +94,20 @@ class ChemSpider(Parser): return requests - def new_synonym(self, sel, name, reliability): - log.msg('CS synonym: %s (%s)' % (name, reliability), level=log.DEBUG) + def new_synonym(self, sel, name, category): self.ignore_list.append(name) + language = sel.xpath('span[@class="synonym_language"]/text()').extract() + if language: + language = language[0][1:-1] + else: + language = 'English' synonym = { 'name': name, 'category': category, + 'language': language } + log.msg('CS synonym: %s (%s) (%s)' % (name, category, language), + level=log.DEBUG) return synonym def parse_extendedinfo(self, response):