代码如下
# Count how often each multi-character word occurs in the scraped text and
# save the ten most frequent words to a CSV table.
#
# Both file names are relative paths, so they are resolved against the current
# working directory; open() raises FileNotFoundError when "抓取数据.csv" is not
# present there.
with open("抓取数据.csv", 'rt', encoding='utf-8') as source:
    txt = source.read()  # entire input file as one string

words = jieba.lcut(txt)  # segment the text into a list of words

# Map each word to its number of occurrences. Tokens of length <= 1 are
# skipped by the guard below.
counts = {}
for word in words:
    if len(word) <= 1:
        continue
    counts[word] = counts.get(word, 0) + 1

# (word, count) pairs ordered by count, highest first. sorted() is stable, so
# words with equal counts keep their first-seen order.
item = sorted(counts.items(), key=lambda x: x[1], reverse=True)

# newline='' lets the csv module control line endings itself. The `with`
# block guarantees the table is flushed and closed even if a write fails.
# NOTE(review): no encoding is given, so the platform default is used for the
# output file - confirm that this is what the consumer of the table expects.
with open("工作簿1.csv", 'w', newline='') as Excel:
    writ = csv.writer(Excel)
    writ.writerow(['名称', '出现次数'])  # header row
    # Slicing instead of indexing 0..9 avoids an IndexError when the text
    # contains fewer than ten distinct words.
    writ.writerows(item[:10])
Traceback (most recent call last):
File "C:\Users\刘玉淇\PycharmProjects\pythonProject1\统计词频.py", line 4, in <module>
txt = open("抓取数据.csv", 'rt', encoding='utf-8').read() # 读取所需要分析的文件内容
FileNotFoundError: [Errno 2] No such file or directory: '抓取数据.csv'
Process finished with exit code 1