From 22c765b6e567132d0b43b5a5d2dfe3d601e24ebb Mon Sep 17 00:00:00 2001 From: RTB Date: Fri, 18 Apr 2014 14:08:48 +0200 Subject: [PATCH] simplified setting of Results for Predicted ACD/Labs tab --- FourmiCrawler/parsers/ChemSpider.py | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/FourmiCrawler/parsers/ChemSpider.py b/FourmiCrawler/parsers/ChemSpider.py index afae427..a15daaf 100644 --- a/FourmiCrawler/parsers/ChemSpider.py +++ b/FourmiCrawler/parsers/ChemSpider.py @@ -3,6 +3,7 @@ from scrapy import log from scrapy.http import Request from scrapy.selector import Selector from FourmiCrawler.items import Result +import re """ This parser will manage searching for chemicals through the ChemsSpider API, @@ -37,9 +38,12 @@ class ChemSpider(Parser): prop_names = td_list[::2] prop_values = td_list[1::2] for (prop_name, prop_value) in zip(prop_names, prop_values): + prop_name = prop_name.extract().encode('utf-8') + prop_value = prop_value.extract().encode('utf-8') + new_prop = Result({ - 'attribute': prop_name.extract().encode('utf-8'), - 'value': prop_value.extract().encode('utf-8'), + 'attribute': prop_name, + 'value': prop_value, 'source': 'ChemSpider Predicted - ACD/Labs Tab', 'reliability': 'Unknown', 'conditions': ''