|
|
马上注册,结交更多好友,享用更多功能^_^
您需要 登录 才可以下载或查看,没有账号?立即注册
x
为什么会报错,下载不了文件,请指导,谢谢!
from bs4 import BeautifulSoup
import requests,urllib.request
import time
header ={'User-Agent':'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/63.0.3239.132 Safari/537.36',
'Cookie':'UM_distinctid=1614b695a077d-08cbdffb9f10d5-3c604504-144000-1614b695a0867a; Hm_lvt_ecf0502609cf895cbe057f7979b317bc=1517388652,1517388682; Hm_lpvt_ecf0502609cf895cbe057f7979b317bc=1517388682; CNZZDATA1256181055=1650880320-1517383831-null%7C1517389232'}
url = 'http://www.youwu.cc/guonei/list_1.html'
web_data =requests.get(url,headers=header)
soup = BeautifulSoup(web_data.text,'lxml')
imgs = soup.select('div.item_t > div > a > img')
img_list =[]
for img in imgs:
img_list.append(img.get('src'))
#print(img_list)
path = "D:/aaa/"
for pic in img_list:
urllib.request.urlretrieve(pic, path + pic[-10:])
time.sleep(2)
提示:
Traceback (most recent call last):
File "D:/test/jianda.py", line 17, in <module>
urllib.request.urlretrieve(pic, path + pic[-10:])
File "C:\Users\liujun\AppData\Local\Programs\Python\Python36\lib\urllib\request.py", line 248, in urlretrieve
with contextlib.closing(urlopen(url, data)) as fp:
File "C:\Users\liujun\AppData\Local\Programs\Python\Python36\lib\urllib\request.py", line 223, in urlopen
return opener.open(url, data, timeout)
File "C:\Users\liujun\AppData\Local\Programs\Python\Python36\lib\urllib\request.py", line 532, in open
response = meth(req, response)
File "C:\Users\liujun\AppData\Local\Programs\Python\Python36\lib\urllib\request.py", line 642, in http_response
'http', request, response, code, msg, hdrs)
File "C:\Users\liujun\AppData\Local\Programs\Python\Python36\lib\urllib\request.py", line 570, in error
return self._call_chain(*args)
File "C:\Users\liujun\AppData\Local\Programs\Python\Python36\lib\urllib\request.py", line 504, in _call_chain
result = func(*args)
File "C:\Users\liujun\AppData\Local\Programs\Python\Python36\lib\urllib\request.py", line 650, in http_error_default
raise HTTPError(req.full_url, code, msg, hdrs, fp)
urllib.error.HTTPError: HTTP Error 404: Not Found |
|