如果读取文件时使用 encoding="utf-8"，报错如下：
将读取文件时的 encoding 改成 "GBK"：
split 的时候报错：
# Stop-word filtering script.
#
# Reads a stop-word list and a CSV file (both decoded as GBK), splits every
# CSV line on whitespace, drops the tokens that appear in the stop-word list,
# prints the surviving tokens and writes them to an output file.

stop = []        # stop words, one per line of file_stop (whitespace-stripped)
text = []        # raw lines read from file_text
after_text = []  # tokens from file_text that are not stop words
file_stop = r"D:\stopword(停用词).txt"
file_text = r"D:/简历表.csv"

with open(file_stop, "r", encoding="GBK") as f:
    # Iterate the file object directly; no need to materialize readlines().
    for line in f:
        stop.append(line.strip())

# Build the lookup set once so each membership test is O(1) instead of
# scanning the whole list for every token.
stop_lookup = set(stop)

with open(file_text, "r", encoding="GBK") as f:
    # Read the file exactly once. The original called f.readlines() twice
    # (once inside print, once in the loop); the first call consumed the file,
    # so the second returned an empty list and nothing was ever filtered.
    text.extend(f.readlines())
print(text)

for line in text:
    # NOTE(review): str.split() splits on whitespace, not on commas, even
    # though the input is a .csv file — confirm this is the intended
    # tokenization.
    for token in line.split():
        if token not in stop_lookup:
            after_text.append(token)
print(after_text)

# NOTE(review): no encoding is given here, so the platform default is used,
# and tokens are written back-to-back with no separator — confirm both are
# intended before changing them.
with open(r"D:\新桌面\前端\训练数据\训练数据\stop.txt", "w+") as f:
    for token in after_text:
        f.write(token)