闲鱼数据的获取与下载
25-04-08 02:22
982
0
今天给大家分享闲鱼的数据获取和逆向,只需要在终端输入想搜索的物品名,再输入想下载内容的页码,
对应数据的 CSV 文件便会自动命名并保存在相应的文件夹内,方便大家查看和按需使用。
需要注意的是,cookies 过一段时间就会失效(签名用到的 `_m_h5_tk` 也在其中),失效后需要手动把代码里 cookies 一栏替换成自己浏览器中的最新值,操作并不难。
"""Search Xianyu (goofish.com) listings and append the results to a CSV file.

The script prompts for a search keyword and a page number, calls the
``mtop.taobao.idlemtopsearch.pc.search`` endpoint with a signed request and
appends one CSV row per listing to ``<cwd>/闲鱼/<keyword>.csv``.

NOTE: the values in ``COOKIES`` are session cookies; once they expire they
have to be replaced by hand with the ones from your own browser.
"""
import csv
import json
import time
from hashlib import md5
from pathlib import Path

# Directory (under the current working directory) that receives the CSV files.
OUTPUT_DIR = Path.cwd() / '闲鱼'

APP_KEY = "34839810"
API_NAME = "mtop.taobao.idlemtopsearch.pc.search"
SEARCH_URL = f"https://h5api.m.goofish.com/h5/{API_NAME}/1.0/"

# CSV columns, in output order.
FIELDNAMES = ["用户名", "地区", "售价", "标题", "详情页"]
# Placeholder written when a field is missing from a listing.
UNKNOWN = "未知"

# Session cookies; the part of `_m_h5_tk` before the underscore is the token
# that goes into the request signature. Replace with your own when they expire.
COOKIES = {
    'cna': 'o2VyIG74FTMCASShMKcIxy+k',
    'cookie2': '124e5ba3daf492b75775ddeb501c4470',
    '_samesite_flag_': 'true',
    't': 'af37bded5c848ba4245c9527b710787f',
    '_tb_token_': 'e33ff5759af39',
    'mtop_partitioned_detect': '1',
    '_m_h5_tk': '43a8d19ad104ac584f86e23e273c6aa8_1743764419015',
    '_m_h5_tk_enc': '37d8a137028ac2a98bb85db99720098f',
    'xlly_s': '1',
}

HEADERS = {
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/134.0.0.0 Safari/537.36 Edg/134.0.0.0',
}


def build_search_data(keyword, page):
    """Return the JSON string sent as the ``data`` form field.

    The string is serialized with ``json.dumps`` so that quotes or
    backslashes in *keyword* cannot break the payload. The same string must
    be used for both the request body and the signature.
    """
    payload = {
        "pageNumber": str(page),
        "keyword": keyword,
        "fromFilter": False,
        "rowsPerPage": 30,
        "sortValue": "",
        "sortField": "",
        "customDistance": "",
        "gps": "",
        "propValueStr": {},
        "customGps": "",
        "searchReqFromPage": "pcSearch",
        # These two are JSON *strings* containing "{}", not nested objects.
        "extraFilterValue": "{}",
        "userPositionJson": "{}",
    }
    return json.dumps(payload, ensure_ascii=False, separators=(",", ":"))


def sign_request(token, timestamp, app_key, data):
    """Return the hex MD5 of ``token&timestamp&app_key&data``."""
    return md5(f"{token}&{timestamp}&{app_key}&{data}".encode()).hexdigest()


def fetch_results(keyword, page):
    """POST one search request and return the ``data.resultList`` value.

    Raises:
        requests.HTTPError: on a non-2xx HTTP status.
        RuntimeError: when the JSON body has no ``data.resultList``
            (possibly because the cookies have expired).
    """
    # Imported here so the pure helpers in this file stay importable on a
    # machine that does not have the third-party `requests` package.
    import requests

    data = build_search_data(keyword, page)
    timestamp = str(round(time.time() * 1000))  # milliseconds since epoch
    token = COOKIES['_m_h5_tk'].split('_')[0]
    params = {
        'jsv': '2.7.2',
        'appKey': APP_KEY,
        't': timestamp,
        'sign': sign_request(token, timestamp, APP_KEY, data),
        'v': '1.0',
        'type': 'originaljson',
        'accountSite': 'xianyu',
        'dataType': 'json',
        'timeout': '20000',
        'api': API_NAME,
        'sessionOption': 'AutoLoginOnly',
        'spm_cnt': 'a21ybx.search.0.0',
        'spm_pre': 'a21ybx.search.searchInput.0',
    }
    response = requests.post(
        SEARCH_URL,
        params=params,
        cookies=COOKIES,
        headers=HEADERS,
        data={'data': data},
        timeout=20,
    )
    response.raise_for_status()
    result = response.json()

    body = result.get('data') if isinstance(result, dict) else None
    if not isinstance(body, dict) or 'resultList' not in body:
        raise RuntimeError(
            f"Unexpected response (cookies may have expired): {result!r}"
        )
    return body['resultList']


def dig(obj, *keys, default=UNKNOWN):
    """Follow *keys* through nested containers; return *default* on a miss."""
    for key in keys:
        try:
            obj = obj[key]
        except (KeyError, IndexError, TypeError):
            return default
    return obj


def parse_item(entry):
    """Turn one ``resultList`` entry into a CSV row dict.

    Missing fields become ``UNKNOWN`` instead of aborting the whole run.
    """
    content = dig(entry, 'data', 'item', 'main', 'exContent', default={})
    item_id = dig(content, 'detailParams', 'itemId', default=None)
    # The link is built from the listing's own itemId so that each row
    # points at its own detail page.
    if item_id is None:
        link = UNKNOWN
    else:
        link = f'https://www.goofish.com/item?id={item_id}'
    return {
        "用户名": dig(content, 'userNickName'),
        "地区": dig(content, 'area'),
        "售价": dig(content, 'detailParams', 'soldPrice'),
        "标题": dig(content, 'detailParams', 'title'),
        "详情页": link,
    }


def save_rows(rows, file_path):
    """Append *rows* to the CSV at *file_path*.

    The header is written only when the file is new or empty, so repeated
    runs for the same keyword keep a single header line.
    """
    file_path = Path(file_path)
    file_path.parent.mkdir(parents=True, exist_ok=True)
    needs_header = not file_path.exists() or file_path.stat().st_size == 0
    with open(file_path, mode="a", newline="", encoding="utf-8") as file:
        writer = csv.DictWriter(file, fieldnames=FIELDNAMES)
        if needs_header:
            writer.writeheader()
        writer.writerows(rows)


def main():
    """Prompt for keyword and page, fetch the listings and save them."""
    print(OUTPUT_DIR)
    OUTPUT_DIR.mkdir(parents=True, exist_ok=True)

    keyword = input("请输入搜索物品:").strip()
    page = input("请输入搜索页码:").strip()

    rows = [parse_item(entry) for entry in fetch_results(keyword, page)]
    for row in rows:
        print(row)
    save_rows(rows, OUTPUT_DIR / f"{keyword}.csv")


if __name__ == "__main__":
    main()
-
网上兼职副业赚钱网站合集
最近看到网友整理发布副业和网赚平台,合并了一下,现在想在网上兼职赚钱也是要有一技之长的,什么都不会的话还是考虑摆地摊吧。那些无要求... 758 0 25-03-10 -
新浪读书小程序
新浪读书小程序提供了一个在线阅读平台,无需下载安装即可在微信、支付宝等平台使用,节省存储空间并提供即时阅读。该应用集成了丰富的电子... 847 0 24-09-16 -
手撸call apply bind
如果自己去实现call apply bind,看上去挺复杂,写起来其实就几行代码 因为call和apply一样,只是传参不一样,所以我就只写一个call实现... 615 0 25-04-07 -
B站UP主相册图片下载神器
B站UP主图片下载工具是网友开发的一款图片下载软件,支持下载UP主动态里面的所有图片,默认全部下载,下载越多执行越慢!布景复线程 下载... 1456 0 24-05-30 -
深入理解Android——卷II
笔者“深入理解Android”系列的第二本,这一本将关注重点放在了Android Framework的Java层。在众多可供分析的知识点中,笔者另辟蹊径,选... 874 0 24-05-24 -
如何消化你每天获得的信息
我们身处信息时代,这是我们得天独厚的优势。我们一个小时获取的信息量可能需要古人花一年的时间去搜集整理,《西游记》便是一个很好的例子... 734 0 25-03-03 -
蚂蚁庄园自动喂鸡驱赶脚本
蚂蚁庄园自动喂鸡驱赶脚本脚本简介基于AutoJS实现的自动喂养脚本运行config.js 修改配置,设置密码等支持使用加速卡支持捡屎支持OCR识别倒... 939 0 25-02-04 -
211款经典必收藏中文字体,高级PS设计师必备
482 0 21-06-18
发表我的评论
共0条评论
- 这篇文章还没有收到评论,赶紧来抢沙发吧~