第一单元
application software应用软件
basic application基本应用软件
communication device通信设备
compact disc (CD)光盘
computer competency计算机能力
请问怎么把每一行中的英文和对应的中文分别提取出来？
if __name__ == '__main__':
    # Split every glossary line of know.txt into its English words and its
    # Chinese (hanzi) runs, collect the pairs, and hand them to write_excel.
    #
    # NOTE(review): `re`, `knowledge` and `write_excel` are not defined in
    # this block; they are assumed to be provided earlier in the file.
    # This is Python 2 code: lines are byte strings decoded by hand.
    print("中文")

    # Compile once, outside the loop. The hanzi pattern matches CJK Unified
    # Ideographs only, so spaces, brackets and the trailing newline no longer
    # end up in the hanzi list (the old `[^a-zA-Z]+` captured all of those).
    letter_pattern = re.compile(u'[a-zA-Z]+')
    hanzi_pattern = re.compile(u'[\u4e00-\u9fff]+')

    # `with` guarantees the file is closed, even if a line fails to decode.
    with open("know.txt") as info:
        for line in info:
            # Decode once and match on unicode text, so a multi-byte
            # character is never split in the middle.
            text = line.decode('GB2312')
            print(text.encode('utf-8'))

            # Encode the matches back to UTF-8 byte strings: that is the
            # type the original code stored in `knowledge`.
            letter_str = [word.encode('utf-8')
                          for word in letter_pattern.findall(text)]
            hanzi_str = [run.encode('utf-8')
                         for run in hanzi_pattern.findall(text)]
            print(hanzi_str)

            # Same [english_words, hanzi_runs] pair shape as before; the
            # builtin `str` is no longer shadowed by a local name.
            knowledge.append([letter_str, hanzi_str])

    write_excel(knowledge)