|
|
马上注册,结交更多好友,享用更多功能^_^
您需要 登录 才可以下载或查看,没有账号?立即注册
x
这是代码- import requests
- import re
- from lxml import etree
- import os
- def download_pics(url):
- response = requests.get(url,headers=headers)
- base_link = etree.HTML(response.text).xpath('//div[@class="main-image"]//img/@src')[0][0:-6]
- page_info = etree.HTML(response.text).xpath('//div[@class="pagenavi"]//span/text()')
- max_page = int(page_info[-2])
- for i in range(1,max_page+1):
- page = str(i).zfill(2)
- download_link = base_link+str(page)+'.jpg'
- response = requests.get(download_link)
- pic_name = download_link[-9:-4]
- print('目前第{}套妹子,共{}张 正在下载第{} 张图片......'.format (list_cnt,max_page,i))
- with open(save_path+'\\'+pic_name+'.jpg','wb') as f:
- f.write(response.content)
- def get_list(url):
- global list_cnt,save_path
- list_cnt = 1
- response = requests.get(url,headers=headers)
- p = r'<a href="(https://www.mzitu.com/\d+)" target="_blank">'
- list_pool = re.findall(p,response.text)
- for li in list_pool:
- save_path = '美女图\\EP'+str(list_cnt).zfill(3)
- if not os.path.exists(save_path):
- os.mkdir(save_path)
- download_pics(url)
- list_cnt+=1
- def main():
- if not os.path.exists('美女图'):
- os.mkdir('美女图')
- os.startfile('美女图')
- get_list(url)
- if __name__=="__main__":
- url = 'https://www.mzitu.com/'
- headers = {'user-agent': 'Mozilla/5.0'}
- main()
复制代码
出现错误 Traceback (most recent call last):
File "C:\Users\Administrator\Desktop\新建文本文档 (3).py", line 42, in <module>
main()
File "C:\Users\Administrator\Desktop\新建文本文档 (3).py", line 37, in main
get_list(url)
File "C:\Users\Administrator\Desktop\新建文本文档 (3).py", line 30, in get_list
download_pics(url)
File "C:\Users\Administrator\Desktop\新建文本文档 (3).py", line 8, in download_pics
base_link = etree.HTML(response.text).xpath('//div[@class="main-image"]//img/@src')[0][0:-6]
IndexError: list index out of range
[Finished in 1.6s] |
|