|
发表于 2020-9-4 18:07:00
|
显示全部楼层
import bs4,requests
def getIP(page, timeout=10):
    """Fetch one page of the kuaidaili free proxy list and print each entry.

    Args:
        page: Page number interpolated into the listing URL.
        timeout: Seconds to wait for the HTTP response before giving up.

    Returns:
        A list of ``{'ip': ..., 'port': ...}`` dicts, one per table row that
        has at least two cells, in page order. Empty when the response
        contains no ``<tbody>`` element.

    Raises:
        requests.RequestException: On connection failure, timeout, or a
            4xx/5xx HTTP status.
    """
    url = f'https://www.kuaidaili.com/free/inha/{page}/'
    # Without a timeout, requests can block forever on a stalled connection.
    res = requests.get(url, timeout=timeout)
    res.raise_for_status()

    tbody = bs4.BeautifulSoup(res.text, 'html.parser').find('tbody')
    if tbody is None:
        # No table body in the response; nothing to report.
        return []

    proxies = []
    for row in tbody.find_all('tr'):
        # Index the cells directly instead of hopping over next_sibling
        # twice: sibling navigation depends on whitespace text nodes between
        # the <td> tags and picks the wrong cell when the markup is compact.
        cells = row.find_all('td')
        if len(cells) < 2:
            continue
        d = {
            'ip': cells[0].get_text(strip=True),
            'port': cells[1].get_text(strip=True),
        }
        print(d)
        proxies.append(d)
    return proxies
# Example run: request page 1 of the listing; getIP prints one dict per row.
getIP(1)
{'ip': '175.42.68.49', 'port': '9999'}
{'ip': '122.234.91.192', 'port': '9000'}
{'ip': '182.34.103.5', 'port': '9999'}
{'ip': '121.232.148.205', 'port': '9000'}
{'ip': '114.231.45.60', 'port': '9999'}
{'ip': '123.149.137.17', 'port': '9999'}
{'ip': '171.11.179.18', 'port': '9999'}
{'ip': '119.254.94.93', 'port': '44665'}
{'ip': '123.163.27.179', 'port': '9999'}
{'ip': '220.249.149.229', 'port': '9999'}
{'ip': '125.108.100.114', 'port': '9000'}
{'ip': '36.248.132.117', 'port': '9999'}
{'ip': '125.108.73.169', 'port': '9000'}
{'ip': '123.57.77.187', 'port': '8118'}
{'ip': '183.195.106.118', 'port': '8118'} |
|