|
|

楼主 |
发表于 2019-5-24 18:23:54
|
显示全部楼层
#!/usr/bin/env python3
import urllib.request
import re
import os
import time
def open_url(url, timeout=30):
    """Fetch *url* and return the response body decoded as text.

    The request carries a desktop-browser ``User-Agent`` header instead of
    urllib's default one.

    Args:
        url: Address of the page to download.
        timeout: Seconds to wait on a blocking network operation before
            giving up; ``None`` waits indefinitely.

    Returns:
        The response body as ``str``, decoded with the charset declared in
        the response headers, or UTF-8 when none is declared.

    Raises:
        urllib.error.URLError: If the request cannot be completed.
        UnicodeDecodeError: If the body is not valid in the chosen charset.
    """
    req = urllib.request.Request(url)
    req.add_header(
        'User-Agent',
        'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/74.0.3729.157 Safari/537.36',
    )
    # The context manager closes the connection even when read() or
    # decode() raises, so the socket is never leaked.
    with urllib.request.urlopen(req, timeout=timeout) as page:
        charset = page.headers.get_content_charset() or 'utf-8'
        return page.read().decode(charset)
def get_img(html, delay=5):
    """Download every matching JPEG referenced in *html* to the current directory.

    Only ``<img class="alignnone" src="....jpg"`` tags are matched. Each
    image is saved under the last path segment of its URL, so two URLs with
    the same basename overwrite one another.

    Args:
        html: Page markup to scan for image tags.
        delay: Seconds to pause between consecutive downloads; ``0``
            disables the pause.

    Raises:
        urllib.error.URLError: If an image cannot be downloaded.
        OSError: If an image cannot be written to disk.
    """
    pic = r'<img class="alignnone" src="([^"]+\.jpg)"'
    # dict.fromkeys drops repeated URLs while keeping first-seen order, so an
    # image embedded twice in the page is fetched only once.
    img_list = list(dict.fromkeys(re.findall(pic, html)))
    for index, each in enumerate(img_list):
        # Pause only *between* downloads: nothing to wait for before the
        # first image or after the last one.
        if index and delay:
            time.sleep(delay)
        print(each)
        filename = each.split("/")[-1]
        urllib.request.urlretrieve(each, filename, None)
def plmm(folder='周二珂', url="http://zhainanba.net/21049.html"):
    """Download the images of one gallery page into *folder*.

    The folder is created if needed and becomes the process's working
    directory (it stays that way after the call), because ``get_img`` saves
    files relative to the current directory.

    Args:
        folder: Directory that receives the images.
        url: Address of the gallery page to scrape.
    """
    # exist_ok=True lets the script be re-run; a plain mkdir raises
    # FileExistsError once the folder is already there.
    os.makedirs(folder, exist_ok=True)
    os.chdir(folder)
    get_img(open_url(url))
# Start the download only when this file is executed as a script, so that
# importing it has no side effects.
if __name__ == "__main__":
    plmm()
|
|