Python爬虫入门指南:从新手到高手,附爬虫辅助神器在线网址推荐

Python – 爬虫小白入门大佬勿喷 – 爬虫辅助神器在线网址推荐

  • 爬虫在线辅助神器
  • 实战意义
  • 实战指南
  • 打开任意网站
  • 按F12 打开控制台
  • 打开爬虫工具库
  • 自动生成代码(可直接运行)
  • 结束语
  • 工欲善其事,必先利其器

    爬虫在线辅助神器

    网址:https://spidertools.cn/#/curl2Request


    该网站提供了一个便捷的在线工具,允许用户将 cURL 命令转换为 Python 的 requests 库代码。这对于网络开发者、爬虫工程师以及进行网页数据抓取的人员来说极为实用,因为它简化了从命令行到编程语言的过渡过程。

    实战意义

    该网站功能非常强大
    可以直接将 cURL 命令转换为 requests 代码,生成的代码可以直接运行
    该网站还提供很多在线加解密和第三方在线工具
    可以说开源的作者非常优秀

    实战指南

    打开任意网站

    例子: https://blog.csdn.net/qq_41133533/article/details/145658393?spm=1001.2014.3001.5501

    按F12 打开控制台

    切换到 Network(网络)面板并刷新页面,右键点击目标请求,选择 Copy → Copy as cURL (bash),复制该请求的 cURL 命令。

    打开爬虫工具库

    打开 https://spidertools.cn/#/curl2Request ,将上一步复制的 cURL 命令粘贴到输入框中。

    自动生成代码(可直接运行)

    
    # Fetch a CSDN article page by replaying the headers and cookies of a
    # browser request (code generated from a "Copy as cURL" command).
    import requests


    # Request headers copied from the browser so the request resembles a
    # normal Chrome page navigation.
    headers = {
        "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7",
        "Accept-Language": "zh-CN,zh;q=0.9",
        "Cache-Control": "no-cache",
        "Connection": "keep-alive",
        "Pragma": "no-cache",
        "Referer": "https://blog.csdn.net/qq_41133533?spm=1008.2028.3001.5343",
        "Sec-Fetch-Dest": "document",
        "Sec-Fetch-Mode": "navigate",
        "Sec-Fetch-Site": "same-origin",
        "Sec-Fetch-User": "?1",
        "Upgrade-Insecure-Requests": "1",
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/132.0.0.0 Safari/537.36",
        "sec-ch-ua": "\"Not A(Brand\";v=\"8\", \"Chromium\";v=\"132\", \"Google Chrome\";v=\"132\"",
        "sec-ch-ua-mobile": "?0",
        "sec-ch-ua-platform": "\"Windows\""
    }
    # Cookies captured from the browser session.
    # NOTE(review): entries such as SESSION, UserToken and x_inscode_token look
    # like login credentials -- replace them with values from your own session
    # and avoid publishing real ones.
    cookies = {
        "uuid_tt_dd": "10_20293302920-1729957029796-505028",
        "fid": "20_43520340897-1729957036667-654213",
        "UN": "qq_41133533",
        "p_uid": "U010000",
        "_ga": "GA1.2.1748067707.1730382260",
        "FCNEC": "%5B%5B%22AKsRol-WOmqfuhiNRpWrDE_W6wj53DYAonTZ24A3ES2eSD--40wsc928PmXhfmx1dkw3q_7TLaksTeks4oNIEncg0khT7ZFtXiUIthrg9_I1H2Y2EFqcm3iyfAYijR5tOQZIZfVvBVc_TdW4-vATdsRi8Fn6x8Ehkg%3D%3D%22%5D%5D",
        "_ga_7W1N0GEY1P": "GS1.1.1736684120.4.1.1736684602.60.0.0",
        "c_segment": "4",
        "Hm_lvt_6bcd52f51e9b3dce32bec4a3997715ac": "1739624281",
        "HMACCOUNT": "1FFCAB5935065DD2",
        "dc_sid": "a7f478eb2e6accf6638847d79e59fc1b",
        "SESSION": "40a2621e-ca82-49e7-96ef-f792f42405ad",
        "hide_login": "1",
        "c_ins_prid": "-",
        "c_ins_rid": "1739627194611_565537",
        "c_ins_fref": "https://blog.csdn.net/qq_41133533",
        "c_ins_fpage": "/index.html",
        "c_ins_um": "-",
        "ins_first_time": "1739627197627",
        "loginbox_strategy": "%7B%22taskId%22%3A317%2C%22abCheckTime%22%3A1739627197753%2C%22version%22%3A%22ExpA%22%2C%22nickName%22%3A%22%E6%9E%9C%E6%A0%B8%20JAVA%22%7D",
        "creative_btn_mp": "3",
        "UserName": "qq_41133533",
        "UserInfo": "a4719413fa2949c490f03ebf899b4a24",
        "UserToken": "a4719413fa2949c490f03ebf899b4a24",
        "UserNick": "%E6%9E%9C%E6%A0%B8+JAVA",
        "AU": "1FA",
        "BT": "1739627224827",
        "csdn_newcert_qq_41133533": "1",
        "https_waf_cookie": "09732fd8-9e17-4d8c888a889d12a22f93c6ee272b1e03dd64",
        "x_inscode_token": "eyJ0eXAiOiJKV1QiLCJhbGciOiJIUzI1NiJ9.eyJjcmVkZW50aWFsIjoiIiwiY3NkblVzZXJuYW1lIjoicXFfNDExMzM1MzMiLCJ1c2VySWQiOiI2NDFkM2I3YWJkMGE5YjUxNTFjNzA4MWQiLCJ1c2VybmFtZSI6InFxXzQxMTMzNTMzIn0.JlkwESyLEVShHfsB4-4MTpN6c1Ckl6mfgi1hyxZP8ZU",
        "Hm_lvt_ec8a58cd84a81850bcbd95ef89524721": "1739633100",
        "Hm_lpvt_ec8a58cd84a81850bcbd95ef89524721": "1739633100",
        "c_utm_source": "bbs_include",
        "c_first_ref": "default",
        "c_first_page": "https%3A//www.csdn.net/",
        "dc_session_id": "10_1739683542934.338792",
        "c_dsid": "11_1739683544027.158594",
        "_clck": "4j4vuq%7C2%7Cfth%7C0%7C1760",
        "toolbar_remind_num": "3",
        "__gads": "ID=915681db86891bd5:T=1729957047:RT=1739683651:S=ALNI_MYU2vXasjnZUfdBbYu1vopQejrdzA",
        "__gpi": "UID=00000f562804eaed:T=1729957047:RT=1739683651:S=ALNI_Mbyl5UMzW8GboTk9bheUhCHW54rGw",
        "__eoi": "ID=ed829d3eedbbd8fa:T=1729957047:RT=1739683651:S=AA-AfjaJgDkjdHHkPh2qUkoI0Q_t",
        "_clsk": "khovxm%7C1739683652812%7C2%7C0%7Cn.clarity.ms%2Fcollect",
        "c_page_id": "default",
        "c_pref": "https%3A//blog.csdn.net/qq_41133533%3Fspm%3D1008.2028.3001.5343",
        "c_ref": "https%3A//mp.csdn.net/mp_blog/creation/editor%3Fspm%3D1001.2014.3001.4503",
        "log_Id_pv": "12",
        "Hm_lpvt_6bcd52f51e9b3dce32bec4a3997715ac": "1739683780",
        "log_Id_view": "440",
        "log_Id_click": "35",
        "dc_tos": "srrhw0",
        "waf_captcha_marker": "c47a30cc91f55932690e6ce83660b3462e95ebc150d80dd823aad62fbc2408b6"
    }
    # Target article; the query string is passed separately through `params`.
    url = "https://blog.csdn.net/qq_41133533/article/details/145658393"
    params = {
        "spm": "1001.2014.3001.5501"
    }
    # Always pass a timeout: without one, requests waits indefinitely if the
    # server never responds and the script appears to hang.
    response = requests.get(
        url,
        headers=headers,
        cookies=cookies,
        params=params,
        timeout=10,
    )

    # Page HTML, followed by the Response object itself (shows the status code).
    print(response.text)
    print(response)
    
    
    

    选择合适的工具 事半功倍 加油💪💪

    结束语

    欢迎一起交流学习
    有帮助请留下足迹 一键三连
    爬虫大佬勿喷,欢迎指正问题
    后面会做一系列的爬虫文章,请持续关注作者❣❣❣。

    作者:果核 JAVA

    物联沃分享整理
    物联沃-IOTWORD物联网 » Python爬虫入门指南:从新手到高手,附爬虫辅助神器在线网址推荐

    发表回复