zoukankan      html  css  js  c++  java
  • 爬取拉勾网 python3.7

    import requests
    import time
    import json
    def main():
        """Print job postings for the keyword '运维' in 成都 (Chengdu) from lagou.com.

        Result pages 1 through 4 are requested one at a time. For every page a
        fresh session first loads the search landing page so the site sets its
        cookies, then posts the query to the JSON endpoint with those cookies.
        For each posting the company name, position name, salary, company
        size, skill labels, creation time, district and station name are
        printed, one value per line.

        Raises:
            requests.RequestException: on a timeout, connection failure or
                non-success HTTP status.
            KeyError: if the JSON reply lacks the expected
                content/positionResult/result path or one of the printed fields.
        """
        url_start = "https://www.lagou.com/jobs/list_运维?city=%E6%88%90%E9%83%BD&cl=false&fromSearch=true&labelWords=&suginput="
        url_parse = "https://www.lagou.com/jobs/positionAjax.json?city=成都&needAddtionalResult=false"
        headers = {
            'Accept': 'application/json, text/javascript, */*; q=0.01',
            'Referer': 'https://www.lagou.com/jobs/list_%E8%BF%90%E7%BB%B4?city=%E6%88%90%E9%83%BD&cl=false&fromSearch=true&labelWords=&suginput=',
            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/72.0.3626.121 Safari/537.36'
        }
        # Fields printed for every posting, in output order.
        fields = (
            "companyFullName",
            "positionName",
            "salary",
            "companySize",
            "skillLables",
            "createTime",
            "district",
            "stationname",
        )
        for x in range(1, 5):
            # NOTE(review): 'first' is sent as 'true' for every page, not only
            # page 1 -- confirm this is what the endpoint expects.
            data = {
                'first': 'true',
                'pn': str(x),
                'kd': '运维'
            }
            # A new session per page so each query uses freshly issued cookies;
            # the context manager closes the session's connections afterwards.
            with requests.Session() as s:
                # Request the landing page first to obtain cookies.
                s.get(url_start, headers=headers, timeout=3)
                # The session sends its own cookie jar automatically.
                response = s.post(url_parse, data=data, headers=headers, timeout=3)
            # Fail loudly on an HTTP error instead of on a later parse error.
            response.raise_for_status()
            # Pause between pages to avoid hammering the site.
            time.sleep(5)
            response.encoding = response.apparent_encoding
            text = json.loads(response.text)
            info = text["content"]["positionResult"]["result"]
            for i in info:
                for field in fields:
                    print(i[field])

    # Run the scraper only when executed as a script, not when imported.
    if '__main__' == __name__:
        main()
  • 相关阅读:
    Bootstrap Div 居中的方法
    JQuery 实现 锚点跳转
    JQuery 获取页面某一元素的位置
    BootStrap 实现导航栏nav透明,nav子元素文字不透明
    bootstrap3中container与container_fluid容器的区别
    常见向量范数和矩阵范数
    leetcode 202. Happy Number
    leetcode 172. Factorial Trailing Zeroes
    leetcode 168. Excel Sheet Column Title 171 Excel Sheet Column Number
    leetcode Two Sum II
  • 原文地址:https://www.cnblogs.com/weixin272958297/p/11630241.html
Copyright © 2011-2022 走看看