|
马上注册,结交更多好友,享用更多功能^_^
您需要 登录 才可以下载或查看,没有账号?立即注册
x
不知道怎么解决这种错误
==================================================================
import urllib.request
import os
def open_html(url):
    """Fetch ``url`` and return the raw response body.

    The request carries a desktop-browser ``User-Agent`` header. The
    response object is closed before returning, so no connection is left
    open when the function is called repeatedly.

    Args:
        url: Address to request.

    Returns:
        The undecoded response body as ``bytes``.

    Raises:
        urllib.error.URLError: Propagated from ``urlopen`` when the request
            fails.
    """
    request = urllib.request.Request(url)
    request.add_header(
        'User-Agent',
        'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36',
    )
    # The context manager closes the response even if read() raises.
    with urllib.request.urlopen(request) as response:
        return response.read()
def get_num(url):
    """Return the number that follows the first ``index-`` on a page.

    The page at ``url`` is downloaded, decoded as UTF-8, and the text
    between the first ``index-`` and the next ``.`` is returned (for
    example ``'37'`` for ``index-37.html``).

    Args:
        url: Address of the page to inspect.

    Returns:
        The extracted text as ``str``; the caller converts it to ``int``.

    Raises:
        ValueError: If the page contains no ``index-`` marker, or no ``.``
            after it.
        UnicodeDecodeError: If the page is not valid UTF-8.
    """
    request = urllib.request.Request(url)
    request.add_header(
        'User-Agent',
        'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36',
    )
    with urllib.request.urlopen(request) as response:
        # NOTE(review): assumes the page is served as UTF-8 -- confirm the
        # site's actual charset if decoding fails.
        html = response.read().decode('utf-8')

    marker = 'index-'
    marker_pos = html.find(marker)
    if marker_pos == -1:
        raise ValueError("no 'index-' marker found in page: " + url)

    start = marker_pos + len(marker)
    # str.find() takes a plain substring, not a regex: the previous '\.'
    # looked for a literal backslash followed by a dot and so never matched.
    end = html.find('.', start)
    if end == -1:
        raise ValueError("no '.' after the 'index-' marker in page: " + url)
    return html[start:end]
def find_adds(url):
    """Collect the ``.jpg`` image addresses referenced by a page.

    The page at ``url`` is downloaded and decoded as UTF-8. Every
    ``img src=`` occurrence is inspected; when the text between the opening
    quote and the end of that tag contains ``.jpg``, the address up to and
    including ``.jpg`` is recorded.

    Args:
        url: Address of the page to scan.

    Returns:
        A list of address strings in page order (empty if none are found).
        Addresses are returned exactly as written in the page; they are not
        resolved against ``url``.

    Raises:
        UnicodeDecodeError: If the page is not valid UTF-8.
    """
    request = urllib.request.Request(url)
    request.add_header(
        'User-Agent',
        'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36',
    )
    with urllib.request.urlopen(request) as response:
        # NOTE(review): assumes the page is served as UTF-8 -- confirm the
        # site's actual charset if decoding fails.
        html = response.read().decode('utf-8')

    marker = 'img src='
    suffix = '.jpg'
    img_adds = []

    # A single loop handles every occurrence; the earlier version also
    # processed the first match before the loop and so recorded it twice.
    tag_pos = html.find(marker)
    while tag_pos != -1:
        # +1 skips the quote character that opens the attribute value.
        value_start = tag_pos + len(marker) + 1

        # Only look for '.jpg' inside this tag. Without the bound, a
        # non-jpg image would capture everything up to a later '.jpg'.
        tag_end = html.find('>', value_start)
        if tag_end == -1:
            tag_end = len(html)

        suffix_pos = html.find(suffix, value_start, tag_end)
        if suffix_pos != -1:
            value_end = suffix_pos + len(suffix)
            img_adds.append(html[value_start:value_end])
            resume_from = value_end
        else:
            resume_from = value_start
        tag_pos = html.find(marker, resume_from)

    return img_adds
def save_img(mm, img_adds):
    """Download each image address and write it into the current directory.

    Each file is named after the last ``/``-separated segment of its
    address and is written in binary mode.

    Args:
        mm: Unused here; kept so existing callers keep working.
        img_adds: Iterable of image address strings.
    """
    for adds in img_adds:
        img_name = adds.split('/')[-1]
        # Fetch first: if the download raises, no empty file is left behind.
        img = open_html(adds)
        with open(img_name, 'wb') as f:
            f.write(img)
def mmmm(mm='tutu', pages=5):
    """Download the images from the newest ``pages`` listing pages.

    Creates the directory ``mm`` if needed, makes it the current working
    directory, reads the newest page number with ``get_num``, then walks
    ``pages`` consecutive pages downwards from that number, saving every
    image address that ``find_adds`` returns.

    Args:
        mm: Directory to store the images in.
        pages: How many consecutive pages to process.

    Note:
        The process working directory stays changed to ``mm`` after the
        call; ``save_img`` relies on it when writing files.
    """
    # exist_ok lets the script be re-run without FileExistsError.
    os.makedirs(mm, exist_ok=True)
    os.chdir(mm)
    url = 'https://www.4493.com/star/meizi/'
    num = int(get_num(url))
    for i in range(pages):
        # Compute each page from the fixed starting number. The previous
        # `num -= i` accumulated (offsets 0, 1, 3, 6, ...) and skipped pages.
        page = num - i
        get_url = url + 'a/more_' + str(page) + '.html'
        img_adds = find_adds(get_url)
        save_img(mm, img_adds)
if __name__ == '__main__':
    mmmm()
    # NOTE(review): the paste ended with the stray statement
    #     html = respones.read().decode('gb2312')
    # `respones` is not defined at this scope, so running it raises
    # NameError. It is presumably the poster's attempted change to the
    # decoding used in get_num/find_adds -- confirm the site's charset
    # before applying it there.
|
|