import requests
from bs4 import BeautifulSoup
import pandas as pd

# Query string of the first comment page (offset 0). It is not referenced by
# any other code visible in this file.
# NOTE(review): the scheme/host/path in front of "=0" appears to have been
# lost when this snippet was extracted -- restore the full URL before use.
u1 = "=0&limit=20&sort=new_score&status=P"
def urls():
    """Build the list of paginated comment-page URLs.

    Returns:
        A list of 19 strings, one per page, with offsets 20, 40, ..., 380
        substituted into the query-string template.
    """
    # Even x in 1..39, times 10 -> offsets 20, 40, ..., 380.
    offsets = [x * 10 for x in range(1, 40) if x % 2 == 0]
    # NOTE(review): the URL prefix in front of "=%d" appears to have been
    # stripped from this snippet; as written these are not fetchable URLs.
    return ["=%d&limit=20&sort=new_score&status=P" % offset for offset in offsets]


urllist = urls()


def data():
    """Download every page in ``urllist`` and collect the short comments.

    Each page is parsed with the ``lxml`` parser and the text of every
    ``<span class="short">`` element is gathered.

    Returns:
        A pandas DataFrame with a single column ``'影评'`` holding one
        comment text per row.
    """
    spanlist = []  # accumulates across all pages, so it lives outside the loop
    for url in urllist:
        # A timeout keeps one stalled connection from hanging the whole run.
        response = requests.get(url, timeout=10)
        soup = BeautifulSoup(response.text, 'lxml')
        for span in soup.find_all('span', class_='short'):
            spanlist.append(span.text)
    return pd.DataFrame({'影评': spanlist})


df = data()
# Flatten the scraped comments into one string so names can be counted with
# plain substring search.
# NOTE(review): str() of a large NumPy array is abbreviated with "..." once it
# exceeds NumPy's print threshold -- confirm the comment count stays below it.
txt = str(df.values)

# Character names whose mentions are counted in the comments.
name = ['黑寡妇', '灭霸', '美队', '钢铁侠', '雷神', '奇异博士', '星爵', '浩克', '黑豹', '蜘蛛侠', '惊奇队长']

# Map each name to its number of non-overlapping occurrences in the text.
dic = {hero: txt.count(hero) for hero in name}
print(dic)  # e.g. {'黑寡妇': 7, '灭霸': 19, '美队': 15,}

# One row per name (used as the index) with its count as the only column.
df = pd.DataFrame(list(dic.values()), index=list(dic.keys()))
# df.to_excel('./10.xls')  # export to Excel
可视化效果图:
本文发布于:2024-01-28 03:06:50,感谢您对本站的认可!
本文链接:https://www.4u4v.net/it/17063824144333.html
版权声明:本站内容均来自互联网,仅供演示用,请勿用于商业和其他非法用途。如果侵犯了您的权益请与我们联系,我们将在24小时内删除。
留言与评论(共有 0 条评论)