zoukankan      html  css  js  c++  java
  • 2、Python requests、BeautifulSoup(download mm_pic)

    import requests
    from bs4 import BeautifulSoup
    import os
    class DownLoadImg(object):
        """Download the images found on the newest pages of ``self.url``.

        The downloader reads the current page number from the landing page,
        then walks backwards through ``page-<n>`` URLs and saves every
        ``<img>`` it finds into the ``download_mm`` directory.
        """

        def __init__(self):
            # Landing page; individual pages live at ``<url>page-<n>``.
            self.url = 'http://jandan.net/ooxx/'
            # Browser-like User-Agent sent with every request.
            self.header = {
                'User-Agent':'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/49.0.2623.108 Safari/537.36'}

        def get_Page(self):
            """Return the current page number of the landing page as a string.

            The value is taken from the first node inside the first
            ``span.current-comment-page`` element, with its first and last
            characters removed (presumably the surrounding ``[`` and ``]``).

            Raises:
                IndexError: if the page contains no such ``<span>``.
            """
            response = self.open_url(self.url)
            # Name the parser explicitly so the result does not depend on
            # which optional parsers happen to be installed.
            soup = BeautifulSoup(response.text, 'html.parser')
            page_c = soup.select('span.current-comment-page')
            return page_c[0].next_element[1:-1]

        def open_url(self,url):
            """Issue a GET request for *url* and return the response object.

            The header dict is passed as ``headers=``; passed positionally it
            would be interpreted as query-string ``params`` and the
            User-Agent would never reach the server as a header.
            """
            return requests.get(url, headers=self.header, timeout=30)

        @staticmethod
        def _resolve_src(base, src):
            """Turn an ``<img src>`` value into an absolute URL relative to *base*."""
            from urllib.parse import urljoin

            # urljoin handles protocol-relative ("//host/x"), relative and
            # already-absolute sources uniformly.
            return urljoin(base, src)

        @staticmethod
        def _file_name(url):
            """Return the last path segment of *url* (no query), or '' if none."""
            from urllib.parse import urlparse

            return urlparse(url).path.rsplit('/', 1)[-1]

        def get_and_save_Img(self):
            """Prompt for a page count and download the images of those pages.

            Starts at the page reported by ``get_Page`` and moves to lower
            page numbers, saving every image into ``download_mm`` (created if
            missing). Images without a usable ``src``/file name and requests
            that do not return a success status are skipped.

            Raises:
                ValueError: if the entered page count or the scraped page
                    number is not an integer.
            """
            out_dir = 'download_mm'
            # Write through an explicit path instead of os.chdir so the
            # process working directory is left untouched and repeated calls
            # do not nest download_mm/download_mm.
            os.makedirs(out_dir, exist_ok=True)

            times = int(input('Please enter the number of pages to download:'))
            num = int(self.get_Page())
            for _ in range(times):
                if num < 1:
                    # Ran out of pages before reaching the requested count.
                    break
                url = self.url + 'page-' +str(num)
                print(url)
                response = self.open_url(url)

                bs = BeautifulSoup(response.text, 'html.parser')
                for img in bs.select('img'):
                    raw_src = img.attrs.get('src')
                    if not raw_src:
                        continue
                    src = self._resolve_src(self.url, raw_src)
                    img_name = self._file_name(src)
                    if not img_name:
                        continue
                    get_img = self.open_url(src)
                    if not get_img.ok:
                        # Do not store an HTTP error body as an image file.
                        continue

                    with open(os.path.join(out_dir, img_name),'wb') as dl:
                        dl.write(get_img.content)

                num -= 1
    
    # Script entry point: build a downloader and run the interactive download.
    if __name__ == "__main__":
        downloader = DownLoadImg()
        downloader.get_and_save_Img()
    

      

  • 相关阅读:
    JS框架设计读书笔记之-选择器引擎02
    JS框架设计读书笔记之-选择器引擎01
    JS框架设计读书笔记之-小知识
    JS框架设计读书笔记之-函数
    JS框架设计读书笔记之-核心模块
    7.19 NOIP模拟6
    一 网络基础之网络协议篇
    Socket 网络编程
    Python 常用模块
    类的特殊成员
  • 原文地址:https://www.cnblogs.com/royfans/p/7417928.html
Copyright © 2011-2022 走看看