#encoding:utf-8
import urllib
from snownlp import SnowNLP
# Scrape product-review pages for one goods number, score every comment with
# SnowNLP and write "<index> <comment> <sentiment>" records to a text file.
#
# NOTE(review): this script targets Python 2 (raw_input, urllib.urlopen,
# byte-string .decode); the statements below are written so that they also
# parse under Python 3, but they are not expected to run there.

# NOTE(review): both literals look truncated by whatever tool extracted this
# file (an empty output path and a URL without scheme/host). They are kept
# exactly as found -- fill in the real values before running.
OUTPUT_PATH = ''
PAGE_URL_TEMPLATE = '/%s-3-%d-0.html'

# Pages are numbered from 1; the last page requested is 63.
FIRST_PAGE = 1
LAST_PAGE = 63

# A line containing this marker announces that a comment body follows.
COMMENT_MARKER = 'comment-content'
# The comment body is the first following line that contains this tag.
COMMENT_END_TAG = '</dd>'


def _fetch_page(url):
    """Return the raw body of *url*, closing the connection afterwards."""
    response = urllib.urlopen(url)
    try:
        return response.read()
    finally:
        response.close()


def _strip_comment_markup(line):
    """Remove tabs, spaces and the <dd>/</dd> tags from a comment line."""
    for token in ('\t', ' ', '<dd>', '</dd>'):
        line = line.replace(token, '')
    return line


sno = raw_input('please input goods number:\n')
comment_count = 0
# True once COMMENT_MARKER has been seen and the comment body is still pending.
awaiting_body = False

out_file = open(OUTPUT_PATH, 'w')
try:
    for page_no in range(FIRST_PAGE, LAST_PAGE + 1):
        page = _fetch_page(PAGE_URL_TEMPLATE % (sno, page_no))
        # splitlines() also drops a trailing '\r', so CRLF pages do not leave
        # carriage returns inside the stored comments.
        for line in page.splitlines():
            if awaiting_body and COMMENT_END_TAG in line:
                line = _strip_comment_markup(line)
                comment_count += 1
                print(line)
                # Pages are decoded as GBK before analysis. The score is
                # computed before writing so a failure cannot leave a
                # half-written record in the output file.
                sentiment = SnowNLP(line.decode('gbk')).sentiments
                out_file.write('%d %s %s\n' % (comment_count, line, sentiment))
                awaiting_body = False
            if COMMENT_MARKER in line:
                awaiting_body = True
except Exception as exc:
    # Best effort, as in the original: any failure (e.g. a page that cannot
    # be fetched) ends the crawl, but it is now reported instead of being
    # swallowed silently.
    print('Stopped early after %d comments: %s' % (comment_count, exc))
finally:
    out_file.close()
print('All Finish!')
# 里面的 snownlp 模块是用来进行情感分析的:先将评论解码成 unicode 格式,然后调用 SnowNLP 对象的 sentiments 属性,就可以得到一个情感值。0.5 为中性,越接近 1 越是喜欢,越接近 0 越是厌恶。
# 本文发布于:2024-02-01 07:40:16,感谢您对本站的认可!
# 本文链接:https://www.4u4v.net/it/170674441634951.html
# 版权声明:本站内容均来自互联网,仅供演示用,请勿用于商业和其他非法用途。如果侵犯了您的权益,请与我们联系,我们将在 24 小时内删除。
# 留言与评论(共有 0 条评论)