zoukankan      html  css  js  c++  java
  • 美团数据采集

    import json
    import requests
    
    # HTTP headers sent with every request to the search API below.
    # Host matches the API host used in ``urltem``; Origin/Referer point at the
    # sh.meituan.com listing page.
    # NOTE(review): the cookie embeds what look like live login tokens
    # (``token``, ``mt_c_token``, ``userTicket``) — these should presumably be
    # loaded from the environment or a config file rather than hard-coded, and
    # they will stop working once the session expires.
    headers = {
        "User-Agent": "Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36",
        "Host": "apimobile.meituan.com",
        "Origin": "https://sh.meituan.com",
        "Referer": "https://sh.meituan.com/jiankangliren/c76/pn3/",
        "cookie": "uuid=7d2aafa238ee4612aa1b.1628841683.1.0.0; _lxsdk_cuid=17b3e87ac8bc8-0439c46fc4e8e-45410429-232800-17b3e87ac8cc8; mtcdn=K; userTicket=vRpNBghrqYEgwbQAMdqZJjlaRSJfFTTuHqVIZFEG; u=1782900880; n=%E6%9F%B3%E5%8D%BF.; lt=os1Vk9j5ZezoRGVSqGzTKVziBFMAAAAATQ4AAGB5A1KVP_53WXEv3MUbSNPmAfNXPPcdU8mhZoosjqwcOMvQngLdTj-i0zs_nszTjA; mt_c_token=os1Vk9j5ZezoRGVSqGzTKVziBFMAAAAATQ4AAGB5A1KVP_53WXEv3MUbSNPmAfNXPPcdU8mhZoosjqwcOMvQngLdTj-i0zs_nszTjA; token=os1Vk9j5ZezoRGVSqGzTKVziBFMAAAAATQ4AAGB5A1KVP_53WXEv3MUbSNPmAfNXPPcdU8mhZoosjqwcOMvQngLdTj-i0zs_nszTjA; lsu=; token2=os1Vk9j5ZezoRGVSqGzTKVziBFMAAAAATQ4AAGB5A1KVP_53WXEv3MUbSNPmAfNXPPcdU8mhZoosjqwcOMvQngLdTj-i0zs_nszTjA; ci=10; rvct=10; firstTime=1628842456220; unc=%E6%9F%B3%E5%8D%BF."
    }
    # URL template for the search endpoint. The single ``%s`` placeholder is the
    # ``offset`` query parameter and is filled in with ``%`` formatting by the
    # request loop; ``limit=32`` fixes the number of results requested per page.
    # The ``uuid``, ``userid`` and ``token`` values repeat those in the cookie.
    urltem = "https://apimobile.meituan.com/group/v4/poi/pcsearch/10?uuid=7d2aafa238ee4612aa1b.1628841683.1.0.0&userid=1782900880&limit=32&offset=%s&cateId=21004&token=os1Vk9j5ZezoRGVSqGzTKVziBFMAAAAATQ4AAGB5A1KVP_53WXEv3MUbSNPmAfNXPPcdU8mhZoosjqwcOMvQngLdTj-i0zs_nszTjA&areaId=-1"
    # Collect one flat list of shop records across up to 30 result pages.
    # Each page holds 32 entries (the ``limit=32`` in ``urltem``), so the
    # offset for page ``i`` is ``i * 32``.
    ret = []
    for i in range(30):
        res = requests.get(
            url=urltem % (i * 32),
            headers=headers,
            # Without a timeout requests waits indefinitely on a stalled server.
            timeout=10,
        )
        # Fail with a clear HTTPError on 4xx/5xx instead of an opaque JSON or
        # KeyError failure further down.
        res.raise_for_status()
        # Echo the raw response body to stdout.
        print(res.text)
        data = json.loads(res.text)
        searchResult = data["data"]["searchResult"]
        # An empty (or missing/null) result list means we are past the last page.
        if not searchResult:
            break
        # Keep only the fields of interest from each result object.
        for obj in searchResult:
            ret.append({
                "title": obj["title"],
                "avgscore": obj["avgscore"],
                "comments": obj["comments"],
                "address": obj["address"],
                "phone": obj["phone"],
            })
    # Append this run's results to the log file as UTF-8 JSON.
    # The path is a raw string: in a normal literal ``\r`` is a carriage-return
    # escape, which would make the file name ``e:<CR>et.log`` instead of
    # ``e:\ret.log``.
    with open(r"e:\ret.log", "a", encoding="utf-8") as f:
        json.dump(ret, f, ensure_ascii=False)
        # The file is opened in append mode, so terminate each run's JSON array
        # with a newline; otherwise successive runs produce ``[...][...]``,
        # which cannot be split back into separate documents.
        f.write("\n")

    有追求，才有动力！

    向每一位软件工程师致敬！

    by wujf

    mail:921252375@qq.com

  • 相关阅读:
    2017.5.11下午学习内容
    windows消息和消息队列
    探索Win32系统之窗口类(转载)
    WinMain函数详解(转载)
    Ajax爬取实战头条街拍美图
    Ajax实战微博
    Ajax请求分析实战
    ubuntu 安装rails
    ubuntu Thunderbird 接收邮件显示乱码的问题排除
    ubuntu 开机挂载windows分区
  • 原文地址:https://www.cnblogs.com/wujf/p/15247386.html
Copyright © 2011-2022 走看看