Synonyms are now scraped from the "Other names:" entry of the NIST source.
This commit is contained in:
parent
b46c7a309d
commit
472aae86be
@ -79,6 +79,12 @@ class NIST(Source):
|
|||||||
ul = sel.xpath('body/ul[li/strong="IUPAC Standard InChI:"]')
|
ul = sel.xpath('body/ul[li/strong="IUPAC Standard InChI:"]')
|
||||||
li = ul.xpath('li')
|
li = ul.xpath('li')
|
||||||
|
|
||||||
|
raw_synonyms = ul.xpath('li[strong="Other names:"]/text()').extract()
|
||||||
|
for synonym in raw_synonyms[0].strip().split(';\n'):
|
||||||
|
log.msg('NIST synonym: %s' % synonym, level=log.DEBUG)
|
||||||
|
self.ignore_list.update(synonym)
|
||||||
|
self._spider.get_synonym_requests(synonym)
|
||||||
|
|
||||||
data = {}
|
data = {}
|
||||||
|
|
||||||
raw_formula = ul.xpath('li[strong/a="Formula"]//text()').extract()
|
raw_formula = ul.xpath('li[strong/a="Formula"]//text()').extract()
|
||||||
|
Reference in New Issue
Block a user