  • Download the ElementUI component library (Python)

    Code:

    # encoding:utf-8
    from bs4 import BeautifulSoup
    import requests, re, os, socket
    from urllib import request
    
    # Version of element-ui to download
    element_ui_version = "2.13.0"
    # Local directory where the files will be saved
    element_ui_dir = "D:/tmp"
    
    save_ui_dir = os.path.join(element_ui_dir, "element-ui")
    
    if not os.path.isdir(save_ui_dir):
        os.makedirs(save_ui_dir)
    
    # The unpkg "browse" pages list a package's directory tree as an HTML table
    element_ui_url = "https://unpkg.com/browse/element-ui@" + element_ui_version + "/"
    headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:73.0) Gecko/20100101 Firefox/73.0"
    }
    
    
    def get_page(url, save_dir):
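        """Mirror one unpkg "browse" page: download the files it lists, then recurse into its sub-directories."""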
        print("Current Page:    ", url)
        response = requests.get(url, headers=headers)
        # Parse the listing page and collect every href in the table body
        soup = BeautifulSoup(response.text, "lxml")
        tbody = soup.find("tbody")
        rule_name = r'href="(.+?)"'
        td_href = re.findall(rule_name, str(tbody))
        dir_list = []
        for href in td_href:
            href_path = os.path.join(save_dir, href)
            if href == "../":
                # Skip the parent-directory link
                continue
            elif "/" in href:
                # A trailing slash marks a sub-directory: create it locally and recurse into it later
                os.makedirs(href_path, exist_ok=True)
                print("Makedir:    ", href_path.replace(save_ui_dir, ""))
                dir_list.append(href)
            else:
                # Anything else is a file: download it into the mirrored tree
                file_url = url + href
                abs_name = file_url.replace(element_ui_url, "")
                print("Download:    ", abs_name)
                get_file(file_url, href_path)
    
        # Recurse into each sub-directory after the files at this level are done
        for sub_dir in dir_list:
            sub_url = url + sub_dir
            sub_dir = os.path.join(save_dir, sub_dir)
            get_page(sub_url, sub_dir)
    
    
    def get_file(url, filename):
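        """Download one file with a browser User-Agent, retrying up to 5 times on errors."""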
        opener = request.build_opener()
        opener.addheaders = [('User-agent',
                              'Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:73.0) Gecko/20100101 Firefox/73.0')]
        request.install_opener(opener)
        socket.setdefaulttimeout(30)
        # Drop "browse/" so the URL points at the raw file instead of the listing page
        url = url.replace("browse/", "")
        count = 1
        while count <= 5:
            try:
                request.urlretrieve(url, filename)
                break
            except socket.timeout:
                print('<Timeout>   Retry %d of 5' % count)
                count += 1
            except Exception as e:
                print('<%s>   Retry %d of 5' % (e, count))
                count += 1
        if count > 5:
            print("<Error>  download job failed!")


    get_page(element_ui_url, save_ui_dir)
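
    If you only need the compiled bundle rather than the whole package tree, a much smaller script can fetch the few dist files directly from unpkg. This is a minimal sketch, not part of the original script: the save path and the file list below are assumptions based on the usual element-ui layout (lib/index.js, lib/theme-chalk/index.css and the icon font).

    # encoding:utf-8
    # Minimal sketch: download only the compiled ElementUI bundle from unpkg.
    # The file paths are assumptions based on the usual element-ui package layout.
    import os
    import requests

    version = "2.13.0"
    save_dir = "D:/tmp/element-ui-dist"
    files = [
        "lib/index.js",
        "lib/theme-chalk/index.css",
        "lib/theme-chalk/fonts/element-icons.woff",
    ]

    for path in files:
        # unpkg serves the raw file when the "browse/" segment is omitted
        url = "https://unpkg.com/element-ui@%s/%s" % (version, path)
        target = os.path.join(save_dir, *path.split("/"))
        os.makedirs(os.path.dirname(target), exist_ok=True)
        resp = requests.get(url, timeout=30)
        resp.raise_for_status()
        with open(target, "wb") as f:
            f.write(resp.content)
        print("Saved:", target)

    Mirroring the whole browse tree, as the full script above does, remains the safer choice when you are not sure which assets a given version references.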
  • Original post: https://www.cnblogs.com/LoganChen/p/13039934.html