from __future__ import unicode_literals
import requests
from scrapy.selector import Selector
def fetch_page(url):
r = requests.get(url)
return r.text
def upso_list_from_listpage(url):
html = fetch_page(url)
sel = Selector(text=html)
upso_lists = []
for i in range ( 1, 31 ):
upso_list = sel.xpath ( '//*[@id="List_['"+i+"']"]/div[4]/span/a/text()').extract()
upso_list.append ( upso_lists )
#upso_list = sel.xpath('//*[@id="List_0"]/div[4]/span/a/text()').extract()
#upso_list = sel.css('.nclicks(mai.text1)').extract()
return upso_lists
from pprint import pprint
pprint(upso_list_from_listpage('http://mokorea.com/ajax/makeBusinessList.php?_method=get&grp=&major=4&cat=&keyword=&hchar=&recom=&page=1&dist=500&gLat=59.8767&gLong=30.4016'))
我想阅读多行。谁能帮助我将XPath更改为变量?我的xpath增加如(list_0,list_1,list_2,list_3 ...)
您的代码将是:
for i in range ( 1, 31 ):
upso_list = sel.xpath ( '//*[@id="List_' + str(i) + '"]/div[4]/span/a/text()').extract()