2024年1月27日发(作者:)
# Flatten the per-province records held in ``all_data`` into one table and
# export it as CSV.
#
# NOTE(review): this script was recovered from a web page whose extractor
# stripped most dotted names.  ``i.keys()``, ``i.values()``, ``lists.append``,
# ``pd.DataFrame`` and ``test.to_csv`` below are reconstructed from the
# surviving fragments -- confirm against the original script.
# ``province`` and ``all_data`` are defined before this excerpt.
import pandas as pd

lists = []   # one row (list of values) per record
flag = 0     # becomes 1 once the column names have been captured
name = None  # column names; stays None when no record is found at all
for pro in province:
    records = all_data[pro]
    if records is None:
        # Same guard the per-city loop of this script applies: an entry
        # without data contributes no rows instead of raising TypeError.
        continue
    for i in records:
        if flag == 0:
            # Column names come from the first record only.
            name = list(i.keys())
            flag += 1
        # presumably every record carries the same keys in the same order,
        # since rows are matched to ``name`` by position -- verify.
        lists.append(list(i.values()))

test = pd.DataFrame(columns=name, data=lists)
print(test)
# NOTE(review): the file name appears truncated by the same extraction damage
# (it ends in "province_history_"); it is left untouched -- restore the
# original name/extension if known.
test.to_csv('./数据可视化/课设/data/province_history_', encoding='utf-8')
#
# Crawl the daily history of every city of ONE province (province[1]) and
# assemble the records into a DataFrame sorted by city / year / date.
#
# NOTE(review): this script was recovered from a web page whose extractor
# stripped most dotted names.  ``requests.get``, ``response.json()``,
# ``i.keys()``, ``i.values()``, ``lists.append``, ``pd.DataFrame``,
# ``test.sort_values`` and ``test.to_csv`` are reconstructed from the
# surviving fragments -- confirm against the original script.
# ``province``, ``children``, ``pd`` and (presumably) ``requests`` are
# defined/imported outside this block.
#
# SECURITY(review): the Cookie below looks like a personal session cookie
# (uin/skey/lskey).  It should not live in source control; load it from the
# environment or drop it if the endpoint does not need it.
header = {
    'Cookie': 'RK=KzwZgVEeXg; ptcz=157737b47be19a589c1f11e7d5ea356f466d6f619b5db6525e3e4e9ea568b156; pgv_pvid=8404792176; o_cookie=1332806659; pac_uid=1_1332806659; luin=o1332806659; lskey=00010000f347903107135dfbd497aa640c9344fe129f3f881877cca68a1e46b4821572bebdf89eb35565f4e6; _qpsvr_localtk=0.24584627136079518; uin=o1332806659; skey=@twSZvHSZD; qzone_check=1332806659_1624245080',
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.106 Safari/537.36',
}

all_data = {}  # city name -> list of daily records (or None)
every_province = province[1]
for i in children[1]:
    # NOTE(review): the scheme and host were stripped from the source, which
    # left a bare path that cannot be requested.  The host below is the
    # assumed original -- confirm.  "pubished" is spelled as in the source.
    url = (
        'https://api.inews.qq.com/newsqa/v1/query/pubished/daily/list'
        '?province={0}&city={1}'
    ).format(every_province, i)
    # print(url)
    # A timeout keeps one stalled connection from hanging the whole crawl.
    response = requests.get(url, headers=header, timeout=10)
    data = response.json()['data']
    all_data[i] = data

lists = []   # one row (list of values) per daily record
flag = 0     # becomes 1 once the column names have been captured
name = None  # column names; stays None when no record is found at all
for child in children[1]:
    if all_data[child] is None:
        # Same guard the all-province loop of this script applies: a city
        # with no data contributes no rows instead of raising TypeError.
        continue
    for i in all_data[child]:
        if flag == 0:
            # Column names come from the first record only.
            name = list(i.keys())
            flag += 1
        # presumably every record carries the same keys in the same order,
        # since rows are matched to ``name`` by position -- verify.
        lists.append(list(i.values()))

test = pd.DataFrame(columns=name, data=lists)
print(test)
# test.to_csv('./数据可视化/课设/data/' + every_province + 'province_history_',encoding='utf-8')
if not test.empty:
    # Sorting needs the 'city', 'y' and 'date' columns, which exist only
    # when at least one record was collected.
    test = test.sort_values(['city', 'y', 'date']).reset_index(drop=True)
print(test)
# test.to_csv('D:/学习资料/数据可视化/课设/data/' + every_province + 'province_history_',encoding='utf-8')
# Crawl the daily history of every city of EVERY province and write one CSV
# per province, sorted by city / year / date.
#
# NOTE(review): this script was recovered from a web page whose extractor
# stripped most dotted names.  ``requests.get``, ``response.json()``,
# ``i.keys()``, ``i.values()``, ``lists.append``, ``pd.DataFrame``,
# ``test.sort_values``, ``test.reset_index`` and ``test.to_csv`` are
# reconstructed from the surviving fragments -- confirm against the original
# script.  ``province``, ``children``, ``pd`` and (presumably) ``requests``
# are defined/imported outside this block.
#
# SECURITY(review): the Cookie below looks like a personal session cookie
# (uin/skey/lskey).  It should not live in source control; load it from the
# environment or drop it if the endpoint does not need it.
header = {
    'Cookie': 'RK=KzwZgVEeXg; ptcz=157737b47be19a589c1f11e7d5ea356f466d6f619b5db6525e3e4e9ea568b156; pgv_pvid=8404792176; o_cookie=1332806659; pac_uid=1_1332806659; luin=o1332806659; lskey=00010000f347903107135dfbd497aa640c9344fe129f3f881877cca68a1e46b4821572bebdf89eb35565f4e6; _qpsvr_localtk=0.24584627136079518; uin=o1332806659; skey=@twSZvHSZD; qzone_check=1332806659_1624245080',
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.106 Safari/537.36',
}

index = 0  # position in ``children`` of the city list for the current province
for every_province in province:
    cities = children[index]
    # Advance right away so that skipping a province further down cannot
    # leave ``index`` out of step with the loop.
    index += 1

    all_data = {}  # city name -> list of daily records (or None)
    for i in cities:
        # NOTE(review): the scheme and host were stripped from the source,
        # which left a bare path that cannot be requested.  The host below
        # is the assumed original -- confirm.  "pubished" is spelled as in
        # the source.
        url = (
            'https://api.inews.qq.com/newsqa/v1/query/pubished/daily/list'
            '?province={0}&city={1}'
        ).format(every_province, i)
        print(url)
        # A timeout keeps one stalled connection from hanging the crawl.
        response = requests.get(url, headers=header, timeout=10)
        data = response.json()['data']
        all_data[i] = data

    lists = []   # one row (list of values) per daily record
    flag = 0     # becomes 1 once the column names have been captured
    name = None  # reset per province so stale columns never leak across
    for child in cities:
        if child == '地区待确认':
            # Placeholder entry ("region to be confirmed"); not exported.
            continue
        print(child)
        if all_data[child] is None:
            continue
        for i in all_data[child]:
            if flag == 0:
                # Column names come from the first record only.
                name = list(i.keys())
                flag += 1
            # presumably every record carries the same keys in the same
            # order, since rows are matched to ``name`` by position.
            lists.append(list(i.values()))

    if not lists:
        # Without rows there are no 'city'/'y'/'date' columns to sort by;
        # skip the export instead of failing part-way through the crawl.
        print(every_province, 'no data, skipped')
        continue

    test = pd.DataFrame(columns=name, data=lists)
    # NOTE(review): the expression printed here was lost in extraction
    # (only ``print(())`` survived); ``head()`` is a stand-in preview.
    print(test.head())
    test = test.sort_values(['city', 'y', 'date'])
    test = test.reset_index(drop=True)
    print(test)
    # NOTE(review): the file name appears truncated by the same extraction
    # damage (it ends in "province_history_"); left untouched -- restore the
    # original name/extension if known.
    test.to_csv('./数据可视化/课设/data/' + every_province + 'province_history_', encoding='utf-8')
本文发布于:2024-01-27 20:38:52,感谢您对本站的认可!
本文链接:https://www.4u4v.net/it/17063591322504.html
版权声明:本站内容均来自互联网,仅供演示用,请勿用于商业和其他非法用途。如果侵犯了您的权益请与我们联系,我们将在24小时内删除。
留言与评论(共有 0 条评论)