zoukankan      html  css  js  c++  java
  • python3_mechanicalsoup

    python3_mechanicalsoup

    #!/usr/bin/python3.4
    # -*- coding: utf-8 -*-
    
    import mechanicalsoup
    
    # 事实证明,这个库非常的不友好
    # 非常!!
    # 和mechanize没法比
    # https://github.com/hickford/MechanicalSoup
    
    def openbrowser(url):
        """Fetch *url*, submit its search form with the query "TTyb", and return the result HTML.

        The page at *url* is expected to contain a form with id ``form`` holding
        an input with id ``kw`` (the layout of the Baidu home page).

        Args:
            url: Address of the page that carries the search form.

        Returns:
            The body of the response to the form submission, decoded as UTF-8
            with undecodable bytes dropped.

        Raises:
            IndexError: If the page has no ``#form`` element, or the form has
                no ``#kw`` input.
        """
        browser = mechanicalsoup.Browser()

        # Default request headers live on the underlying requests session.
        # Assigning ``browser.addheaders`` (the mechanize API) only creates an
        # unused attribute, so the headers were never actually sent.
        # No explicit Host header: it is derived from the request URL, and a
        # hard-coded value would be wrong for any url other than Baidu.
        browser.session.headers.update({
            'User-Agent': ('Mozilla/5.0 (iPad; U; CPU OS 4_3_3 like Mac OS X; en-us) '
                           'AppleWebKit/533.17.9 (KHTML, like Gecko) '
                           'Version/5.0.2 Mobile/8J2 Safari/6533.18.5'),
            'Referer': 'http://www.baidu.com',
        })

        # Open the start page.
        result = browser.get(url)

        # Locate the search form; fail with a readable message if it is absent.
        forms = result.soup.select("#form")
        if not forms:
            raise IndexError("no element with id 'form' found at %s" % url)
        search = forms[0]
        print(search)

        # Fill the search box with the query.
        inputs = search.select("#kw")
        if not inputs:
            raise IndexError("search form at %s has no input with id 'kw'" % url)
        inputs[0]['value'] = "TTyb"

        # Submit the form (the equivalent of clicking the search button).
        page2 = browser.submit(search, result.url)

        # Decode leniently: invalid byte sequences are dropped, not raised on.
        return page2.content.decode("UTF-8", "ignore")
    
    
    if __name__ == '__main__':
        # Script entry point: run the search flow against the Baidu home page
        # and print the HTML that comes back.
        print(openbrowser("http://www.baidu.com"))
    
    
  • 相关阅读:
    ORACLE同义词
    eclipse如何检出项目的jar包
    2020-04-03
    十大经典排序算法
    2020-03-30
    world文档设置表格自定义序列
    2020面试记录
    java如何用一个循环实现两个有序数组合并成一个有序数组
    2020-1-8
    好物推荐之抽纸
  • 原文地址:https://www.cnblogs.com/TTyb/p/6039411.html
Copyright © 2011-2022 走看看