|
发表于 2020-11-30 20:28:08
|
显示全部楼层
本帖最后由 suchocolate 于 2020-11-30 20:33 编辑
- from urllib import request
- from lxml import etree
- import csv
def main():
    """Fetch the Douban movie chart page and save selected span texts to CSV.

    Downloads https://movie.douban.com/chart, parses the HTML with lxml,
    collects the text nodes of every ``<span style="font-size:13px;">``
    element, prints the resulting list, and writes each text as its own
    single-column row in ``movies.csv`` (UTF-8) in the current directory.
    Prints ``done`` when finished.

    Raises:
        urllib.error.URLError: if the page cannot be fetched (including
            a timeout while connecting).
        OSError: if ``movies.csv`` cannot be written.
    """
    # The request sends an explicit User-Agent header instead of urllib's default.
    # NOTE(review): presumably the site rejects the default UA — confirm.
    headers = {'User-Agent': 'Firefox'}
    req = request.Request('https://movie.douban.com/chart', headers=headers)

    # Use the response as a context manager so the connection is always
    # closed, and bound the wait so a stalled server cannot hang the script.
    with request.urlopen(req, timeout=30) as r:
        page = r.read().decode('utf-8')

    html = etree.HTML(page)
    result = html.xpath('//span[@style="font-size:13px;"]/text()')
    print(result)

    # newline='' is required by the csv module; without it the writer's own
    # '\r\n' terminators get translated again and produce blank rows on
    # Windows.
    with open('movies.csv', 'w', encoding='utf-8', newline='') as csvfile:
        writer = csv.writer(csvfile)
        # One extracted text per row, in document order.
        writer.writerows([item] for item in result)
    print('done')
# Script entry point: run the scraper only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
    main()
复制代码 |
|