regex
This commit is contained in:
parent
873231439c
commit
be63315ca2
@ -2,6 +2,7 @@ from scrapy.http import Request
|
|||||||
from parser import Parser
|
from parser import Parser
|
||||||
from scrapy.selector import Selector
|
from scrapy.selector import Selector
|
||||||
from FourmiCrawler.items import Result
|
from FourmiCrawler.items import Result
|
||||||
|
import re
|
||||||
|
|
||||||
class WikipediaParser(Parser):
|
class WikipediaParser(Parser):
|
||||||
|
|
||||||
@ -45,7 +46,9 @@ class WikipediaParser(Parser):
|
|||||||
|
|
||||||
def cleanitems(self, items):
|
def cleanitems(self, items):
|
||||||
for item in items:
|
for item in items:
|
||||||
print item['value']
|
value=item['value']
|
||||||
|
if re.match('3(...)', value):
|
||||||
|
print value
|
||||||
return items
|
return items
|
||||||
|
|
||||||
def getboilingpoint(self, sel):
|
def getboilingpoint(self, sel):
|
||||||
|
Reference in New Issue
Block a user