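'''
1. Define the requirement:
   decide what data to scrape -- here, the names of universities.
2. Locate the data source:
   find which request actually returns the data, e.g.
   https://api.zjzw.cn/web/api/?keyword=&page=1&province_id=&ranktype=&request_type=1&size=20&top_school_id=[3703,2461,659,3117,597,1724]&type=&uri=apidata/api/gkv3/school/lists&signsafe=b6a400d702222a65bbc2fbd7d848933e
3. Copy the request as cURL (bash) and paste it into https://curlconverter.com/
   to obtain the crawler code.
4. Parse the required data out of the response.
5. Store the data.
'''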
import requests
import json
# HTTP request headers sent with the POST request, copied from a browser
# session on www.gaokao.cn.
# NOTE(review): every value here is lowercase (e.g. "mozilla/5.0", "zh-cn");
# browsers normally send mixed case -- confirm the server does not care.
headers = {
    # Content negotiation.
    "accept": "application/json, text/plain, */*",
    "accept-language": "zh-cn,zh;q=0.9",
    "content-type": "application/json",
    # Where the request claims to come from.
    "origin": "https://www.gaokao.cn",
    "priority": "u=1, i",
    "referer": "https://www.gaokao.cn/",
    # Client hints; single-quoted so the embedded double quotes need no escaping.
    "sec-ch-ua": '"not/a)brand";v="8", "chromium";v="126", "google chrome";v="126"',
    "sec-ch-ua-mobile": "?0",
    "sec-ch-ua-platform": '"windows"',
    # Fetch metadata.
    "sec-fetch-dest": "empty",
    "sec-fetch-mode": "cors",
    "sec-fetch-site": "cross-site",
    "user-agent": (
        "mozilla/5.0 (windows nt 10.0; win64; x64) applewebkit/537.36 "
        "(khtml, like gecko) chrome/126.0.0.0 safari/537.36"
    ),
}
# Endpoint the request is sent to; the parameters below form its query string.
url = "https://api.zjzw.cn/web/api/"

# Query-string parameters, mirroring the URL captured from the browser.
params = {
    "keyword": "",
    "page": "1",
    "province_id": "",
    "ranktype": "",
    "request_type": "1",
    "size": "20",
    # Plain brackets, as in the captured URL. The backslashes produced by the
    # curl conversion were shell escapes; left in place they would be
    # percent-encoded and sent to the server as part of the value.
    "top_school_id": "[3703,2461,659,3117,597,1724]",
    "type": "",
    "uri": "apidata/api/gkv3/school/lists",
    "signsafe": "b6a400d702222a65bbc2fbd7d848933e",
}
# JSON body of the POST request. It repeats the query-string fields, but the
# paging values (page, request_type, size) are integers here rather than strings.
data = {
    "keyword": "",
    "page": 1,
    "province_id": "",
    "ranktype": "",
    "request_type": 1,
    "signsafe": "b6a400d702222a65bbc2fbd7d848933e",
    "size": 20,
    # Sent as a string that looks like a list, not as a real JSON array.
    "top_school_id": "[3703,2461,659,3117,597,1724]",
    "type": "",
    "uri": "apidata/api/gkv3/school/lists",
}
def fetch_school_list():
    """Send the prepared POST request and return the response body as text.

    Uses the module-level ``url``, ``headers``, ``params`` and ``data``.

    Raises:
        requests.RequestException: on connection failure, timeout, or an
            HTTP error status (via ``raise_for_status``).
    """
    # Compact JSON body; kept in its own name so the ``data`` dict is not
    # rebound to a string.
    body = json.dumps(data, separators=(',', ':'))
    response = requests.post(
        url, headers=headers, params=params, data=body, timeout=10
    )
    # Fail loudly on 4xx/5xx instead of trying to parse an error page.
    response.raise_for_status()
    return response.text


def parse_school_names(text):
    """Return the list of school names found in the JSON response *text*.

    The response is decoded with ``json.loads`` rather than ``eval``: ``eval``
    would execute whatever the server sends and also fails on the JSON
    literals ``true``, ``false`` and ``null``.

    Raises:
        json.JSONDecodeError: if *text* is not valid JSON.
        KeyError: if the ``data`` / ``item`` / ``name`` keys are missing.
    """
    payload = json.loads(text)
    return [school['name'] for school in payload['data']['item']]


def save_names(names, path='存储的文件名称.txt'):
    """Write *names* to *path*, one per line, replacing any existing file."""
    # Explicit UTF-8 so the names are written the same way on every platform
    # instead of depending on the locale's default encoding.
    with open(path, 'w', encoding='utf-8') as f:
        f.writelines(name + '\n' for name in names)


def main():
    """Fetch the school list, extract the names, and store them on disk."""
    names = parse_school_names(fetch_school_list())
    save_names(names)
    print('程序运行结束')


if __name__ == '__main__':
    main()
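# Companion video:
# https://www.bilibili.com/video/bv1vx4y1s73e/?share_source=copy_web&vd_source=9a94d4db7fa8a361a15f7c2717f048fd
# Copyright notice: the content of this article was contributed by an internet user, and the views expressed represent only the author. This site only provides information storage services, holds no ownership, and assumes no related legal responsibility.
# If you find content on this site suspected of plagiarism, infringement, or violation of laws or regulations, please email 2386932994@qq.com to report it; once verified, it will be removed immediately.
# Post a comment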