zoukankan html css js c++ java

Python 获取网页信息的三种方法

import urllib.request
import http.cookiejar

# Target page fetched by the examples in this script.
url = 'http://www.baidu.com/'

# Method 1: build a Request object so a custom User-Agent header can be sent.
print('方法一')
req_one = urllib.request.Request(url)
req_one.add_header('User-Agent', 'Mozilla/6.0')
# The with-block closes the response even if reading or decoding raises.
with urllib.request.urlopen(req_one) as res_one:
    code_one = res_one.getcode()
    # Assumes the body is UTF-8; decode() raises UnicodeDecodeError otherwise.
    html_one = res_one.read().decode('utf-8')
print('方法一网页状态码：%s' % (code_one))
print('方法一网页内容：'+html_one)


# Method 2: pass the URL string straight to urlopen; no custom headers are set.
print('方法二')
# The with-block closes the response once the body has been read.
with urllib.request.urlopen(url) as res_two:
    code_two = res_two.getcode()
    # Assumes the body is UTF-8; decode() raises UnicodeDecodeError otherwise.
    html_two = res_two.read().decode('utf-8')
print('方法二网页状态码：%s' % (code_two))
print('方法二网页内容：'+html_two)


# Method 3: fetch through an opener that stores cookies in a cookie jar.
print('方法三')
cj = http.cookiejar.LWPCookieJar()
opener = urllib.request.build_opener(urllib.request.HTTPCookieProcessor(cj))
# install_opener makes this opener the default used by later urlopen calls.
urllib.request.install_opener(opener)
# The with-block closes the response even if reading or decoding raises.
with urllib.request.urlopen(url) as res_three:
    # Print the cookie jar after the request has been made.
    print(cj)
    code_three = res_three.getcode()
    # Assumes the body is UTF-8; decode() raises UnicodeDecodeError otherwise.
    html_three = res_three.read().decode('utf-8')
print('方法三网页状态码：%s' % (code_three))
print('方法三的网页内容：'+html_three)

查看全文

相关阅读:
文件的操作
 encode,decode,str,bytes
字符串操作
 suse12安装mysql8.16
VMware配置共享磁盘安装RAC
Linux过滤文本并显示过滤文字的上下文
 Linux服务器卸载mysql指南
 oracle 各版本各日志存放位置
 impdp按用户导入
 数据泵expdp定时备份

原文地址：https://www.cnblogs.com/2016-10-07/p/7988368.html