|

楼主 |
发表于 2020-6-21 02:32:08
|
显示全部楼层
# Original question: saving the data only kept the last entry; at least the
# first three entries should be saved.
import bs4
import openpyxl
import requests
# Listing page that is scraped for announcements.
url = 'http://graduatedstudies.ju.edu.jo/ar/arabic/Lists/AcademicNews/School_AllNews.aspx'
# Prefix prepended to every href found on the listing page.
SITE_ROOT = "http://graduatedstudies.ju.edu.jo/"
# Text file that receives one line per announcement.
OUTPUT_FILE = '约旦大学最新公告.txt'


def format_entry(href, title):
    """Return one output line for an announcement.

    The line is the site root joined with *href*, a tab, the title with
    all runs of whitespace collapsed to single spaces, and a newline.
    Collapsing whitespace keeps every announcement on exactly one line.
    """
    clean_title = " ".join(title.split())
    return SITE_ROOT + href + "\t" + clean_title + "\n"


def collect_entries(soup, limit=None):
    """Build the output lines for the announcement headings in *soup*.

    Args:
        soup: parsed page; only its ``find_all`` method is used.
        limit: maximum number of entries to return, or ``None`` for all.

    Returns:
        A list of strings as produced by ``format_entry``, in page order.
    """
    entries = []
    for heading in soup.find_all('h4', {'class': 'blog-post-title'}):
        if limit is not None and len(entries) >= limit:
            break
        anchor = heading.a
        # Skip headings without a usable link instead of crashing on them.
        if anchor is None or not anchor.get('href'):
            continue
        entries.append(format_entry(anchor['href'], anchor.text))
    return entries


def main():
    """Download the listing page, print every entry and save them all."""
    # A timeout keeps the script from hanging forever on a dead connection.
    res = requests.get(url, timeout=30)
    # Fail loudly on HTTP errors rather than parsing an error page.
    res.raise_for_status()
    soup = bs4.BeautifulSoup(res.text, 'html.parser')

    entries = collect_entries(soup)
    for entry in entries:
        print(entry, end='')

    # Write every collected line in one go. The earlier version wrote only
    # the variable left over from the final loop iteration, so the file
    # ended up holding a single announcement.
    with open(OUTPUT_FILE, 'w', encoding='utf-16') as file:
        file.writelines(entries)


if __name__ == "__main__":
    main()
|
|