zoukankan html css js c++ java

1.4.1 Python 下载网页（每天一更）

# -*- coding: utf-8 -*-

'''
Created on 2019年4月27日

@author: lenovo
'''

# import urllib3
# def download(url):
#     return urllib3.connection_from_url(url)
# 
# print(download('http://now.qq.com'))





# In Python 3, urllib2 was replaced by urllib.request

# import urllib.request
# def download(url):
#     return urllib.request.urlopen(url).read()
# 
# print(download('https://baijiahao.baidu.com/s?id=1632775818269407606&wfr=spider&for=pc'))


# import urllib.request
# def download(url):
#     print("Downloading:" + url)
#     try:
#         html = urllib.request.urlopen(url).read()
#     except urllib.request.URLError as e:
#         print("Download error:" , e.reason)
#         html = None
#     return html
# 
# print(download("htp://www.baidu.co"))


# import urllib.request
# def download(url, num_retries=2):
#     try:
#         html = urllib.request.urlopen(url).read()
#     except urllib.request.URLError as e:
#         print("Download error:" , e.reason)
#         html = None
#         if num_retries > 0 :
#             if hasattr(e, "code") and 500 <= e.code < 600 :
#                 return download(url, num_retries-1)
#     return html
#     
# # print(download("http://httpstat.us/500"))
# print(download("http://www.meetup.com/"))

import urllib.request
def download(url, user_agent="wswp", num_retries=2):
    """Download the resource at *url* and return its raw body.

    Args:
        url: Address to fetch; sent with a ``User-agent`` header.
        user_agent: Value used for the ``User-agent`` request header.
        num_retries: How many additional attempts to make after a failure
            that carries a 5xx HTTP status code. Errors without a status
            code, and non-5xx codes, are never retried.

    Returns:
        The response body as ``bytes``, or ``None`` when the download fails
        and no retries remain (or the failure is not retryable).
    """
    print("Downloading: " , url)
    headers = {'User-agent': user_agent}
    request = urllib.request.Request(url, headers=headers)
    try:
        # The context manager closes the response once it has been read.
        with urllib.request.urlopen(request) as response:
            return response.read()
    except urllib.request.URLError as e:
        print('Download error:' , e.reason)
        # Only HTTP errors expose ``code``; plain URLError (DNS failure,
        # unknown scheme, ...) does not, and is not worth retrying.
        is_server_error = hasattr(e, 'code') and 500 <= e.code < 600
        # ``> 0`` so that num_retries=N really allows N further attempts.
        if num_retries > 0 and is_server_error:
            return download(url, user_agent, num_retries - 1)
        return None

# Demo run: fetch the Meetup home page and print whatever download() returns.
print(download(url="http://www.meetup.com/"))

查看全文

相关阅读:
Linux查看进程和已知端口是否启动
 plsql安装
 windows中用批处理文件删除n天前的文件
 阿里云服务器25邮件端口问题
 通过rpm安装crontab
[RHEL7.1]关闭防火墙及SElinux
有了 itchat， python 调用微信个人号从未如此简单（新增 py3 支持）
Linux中tty、pty、pts的概念区别
 不用写代码就能实现深度学习？手把手教你用英伟达 DIGITS 解决图像分类问题
 Hadoop 2.7.3 安装配置及测试

原文地址：https://www.cnblogs.com/xww115/p/10822196.html