|
发表于 2019-10-7 10:41:19
|
显示全部楼层
- import urllib.request
- from lxml import html
def spider(sn, timeout=10):
    """Search Taobao for *sn* and print the title of every result found.

    Args:
        sn: Search keyword (the script's entry point passes an ISBN string).
            It is converted to ``str`` and percent-encoded before being
            placed in the query string.
        timeout: Seconds to wait on the network before ``urlopen`` gives up.

    Raises:
        urllib.error.URLError: If the request fails or times out.
        UnicodeDecodeError: If the response body is not valid UTF-8.
    """
    # Imported locally so the block does not depend on a file-level import.
    from urllib.parse import quote

    url_template = (
        'https://re.taobao.com/search_ou'
        '?refpid=mm_26632258_3504122_32538762'
        '&clk1=0c5e32ca052fe01c4cf901fa6453d137'
        '&keyword={}&_input_charset=utf-8&page=0&isinner=0'
    )
    # safe='' also escapes '/', '&', '#', etc., so the keyword cannot break
    # out of its query parameter.
    url = url_template.format(quote(str(sn), safe=''))

    # The context manager closes the HTTP response even if read/decode fails.
    with urllib.request.urlopen(url, timeout=timeout) as response:
        html_data = response.read().decode('utf-8')

    selector = html.fromstring(html_data)
    titles = selector.xpath(
        '//div[@class="item"]/a/div[@class="info"]/span/@title'
    )

    for title in titles:
        print(title)
-
# Script entry point: run a single search for a sample ISBN.
if __name__ == "__main__":
    spider('9787115428028')
复制代码 |
|