zoukankan      html  css  js  c++  java
  • python3_mechanicalsoup

    python3_mechanicalsoup

    #!/usr/bin/python3.4
    # -*- coding: utf-8 -*-
    
    import mechanicalsoup
    
    # As it turns out, this library is quite unfriendly to use.
    # Very much so!!
    # It does not compare to mechanize.
    # https://github.com/hickford/MechanicalSoup
    
    def openbrowser(url):
        """Open *url*, submit its search form with the query "TTyb", return the HTML.

        The page at *url* must contain a form element with id ``form`` holding
        an input with id ``kw`` (the caller in this file passes the Baidu home
        page). The form is printed to stdout before it is submitted.

        Args:
            url: Address of the page that hosts the search form.

        Returns:
            The body of the response to the form submission, decoded as UTF-8
            with undecodable bytes dropped.

        Raises:
            IndexError: If the page has no ``#form`` element, or the form has
                no ``#kw`` input.
        """
        browser = mechanicalsoup.Browser()

        # MechanicalSoup has no mechanize-style ``addheaders`` attribute, so
        # assigning to it is silently ignored. Headers must be set on the
        # underlying requests session to actually be sent.
        # No explicit Host header: requests derives it from the target URL,
        # and a hard-coded value would be wrong for any other *url*.
        browser.session.headers.update({
            'User-Agent': 'Mozilla/5.0 (iPad; U; CPU OS 4_3_3 like Mac OS X; en-us) '
                          'AppleWebKit/533.17.9 (KHTML, like Gecko) '
                          'Version/5.0.2 Mobile/8J2 Safari/6533.18.5',
            'Referer': 'http://www.baidu.com',
        })

        # Fetch the page that hosts the search form.
        result = browser.get(url)

        # Locate the search form; fail with a descriptive message when absent.
        forms = result.soup.select("#form")
        if not forms:
            raise IndexError("no element with id 'form' found at %s" % result.url)
        search = forms[0]
        print(search)

        # Fill the query box with the search term.
        query_inputs = search.select("#kw")
        if not query_inputs:
            raise IndexError("search form has no input with id 'kw'")
        query_inputs[0]['value'] = "TTyb"

        # Submit the form, resolving its action relative to the fetched page.
        page2 = browser.submit(search, result.url)

        # Other decodings tried here previously: 'unicode_escape', ('gbk', 'ignore').
        html = page2.content.decode("UTF-8", "ignore")

        return html
    
    
    if __name__ == '__main__':
        # Run the canned search against the Baidu home page and dump the HTML.
        print(openbrowser("http://www.baidu.com"))
    
    
  • 相关阅读:
    所有时间测试函数
    时间函数应用 time
    50个c/c++源代码网站
    ASN.1详解
    SNMP协议
    SNMP协议详解
    大数据需要建立规则和标准
    常用的三层架构设计
    构建大型网站架构十步骤
    iOS 应用程序内部国际化,不跟随系统语言
  • 原文地址:https://www.cnblogs.com/TTyb/p/6039411.html
Copyright © 2011-2022 走看看