|
|
发表于 2016-4-11 22:57:55
|
显示全部楼层
- import urllib.request
- import re
def open_url(url):
    """Fetch *url* and print the decoded page body to standard output.

    The request is sent with a desktop-browser ``User-Agent`` header and the
    response body is decoded as UTF-8. The text is printed one character at
    a time so that a character the output stream cannot encode is skipped
    instead of aborting the whole dump.

    Args:
        url: Address of the page to download.

    Raises:
        urllib.error.URLError: If the request cannot be completed.
        UnicodeDecodeError: If the response body is not valid UTF-8.
    """
    req = urllib.request.Request(url)
    req.add_header(
        'User-Agent',
        'Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.110 Safari/537.36',
    )

    # Use the response as a context manager so the underlying connection is
    # closed even when reading or decoding raises.
    with urllib.request.urlopen(req) as page:
        html = page.read().decode('utf-8')

    # Print character by character; if one character cannot be printed,
    # skip it and carry on with the next one.
    for each in html:
        try:
            print(each, end='')
        except UnicodeEncodeError:
            # The output encoding (e.g. a legacy console code page) cannot
            # represent this character. Only this error is swallowed, so
            # unrelated failures still surface.
            continue
-
-
if __name__ == '__main__':
    # Page that is downloaded and printed when the file is run as a script.
    # Alternative target, left disabled:
    # url = 'http://www.fishc.com'
    url = 'http://tieba.baidu.com/f?kw=%E5%A5%B3%E7%A5%9E&ie=utf-8'
    open_url(url)
-
复制代码 |
|