Added scraping of synonym language
This commit is contained in:
parent
4f2c046c9c
commit
ce5eeb56a6
@ -94,13 +94,20 @@ class ChemSpider(Parser):
|
|||||||
|
|
||||||
return requests
|
return requests
|
||||||
|
|
||||||
def new_synonym(self, sel, name, reliability):
|
def new_synonym(self, sel, name, category):
|
||||||
log.msg('CS synonym: %s (%s)' % (name, reliability), level=log.DEBUG)
|
|
||||||
self.ignore_list.append(name)
|
self.ignore_list.append(name)
|
||||||
|
language = sel.xpath('span[@class="synonym_language"]/text()').extract()
|
||||||
|
if language:
|
||||||
|
language = language[0][1:-1]
|
||||||
|
else:
|
||||||
|
language = 'English'
|
||||||
synonym = {
|
synonym = {
|
||||||
'name': name,
|
'name': name,
|
||||||
'category': category,
|
'category': category,
|
||||||
|
'language': language
|
||||||
}
|
}
|
||||||
|
log.msg('CS synonym: %s (%s) (%s)' % (name, category, language),
|
||||||
|
level=log.DEBUG)
|
||||||
return synonym
|
return synonym
|
||||||
|
|
||||||
def parse_extendedinfo(self, response):
|
def parse_extendedinfo(self, response):
|
||||||
|
Reference in New Issue
Block a user