Archived
1
0

Able to parse the weblinks to other databases, one example done

This commit is contained in:
Bas Vb 2014-04-16 10:37:57 +02:00
parent cd1637b0fe
commit d778050f36

View File

@ -23,7 +23,7 @@ class WikipediaParser(Parser):
meltingpoint = self.getmeltingpoint(sel)
items.append(meltingpoint)
boilingpoint = self.getboilingpoint(sel)
print boilingpoint
chemlink = self.getchemspider(sel)
items.append(boilingpoint)
return items
@ -43,3 +43,8 @@ class WikipediaParser(Parser):
item['value']= sel.xpath('//tr/td/a[@title="Boiling point"]/../../td[2]/text()').extract() # ('//tr[contains(@href, "/wiki/Melting_point")]/text()').extract()
item['source']= "Wikipedia"
return item
def getchemspider(self, sel):
    """Extract the ChemSpider link target(s) from the parsed page.

    The query locates an anchor titled "ChemSpider" that sits directly in a
    table cell, climbs back up to the enclosing row, and collects the
    ``href`` attribute of every ``span/a`` found in that row's second cell.

    Args:
        sel: Object exposing ``xpath(query)`` whose result provides
            ``extract()`` (presumably a Scrapy selector -- confirm
            against the caller).

    Returns:
        Whatever ``extract()`` yields for the matched ``href`` attributes,
        unmodified (presumably a list of URL strings, empty when the page
        has no ChemSpider row).
    """
    chemspider_href_xpath = (
        '//tr/td/a[@title="ChemSpider"]/../../td[2]/span/a/@href'
    )
    item = sel.xpath(chemspider_href_xpath).extract()
    # Debug output of the extracted links. The single-argument call form
    # prints exactly what the Python 2 print statement did, while also
    # being valid syntax on Python 3.
    print(item)
    return item