下面这段 Python 代码用来处理上图的数据,把它们分隔成语汇、拼音、释义三部分,但是我用 Python 无法运行,哪位大佬能帮我看看?
import re
# Split the flat token list `a` into three parallel lists: one entry word, its
# romanisation tokens, and its definition (empty string when there is none).
# NOTE(review): `a` is not defined in this snippet; it is assumed to be a list
# of strings built earlier in the file -- confirm against the real data source.
ptn = r'^[\x00-\x7f]+$'    # matches a token made only of ASCII characters (not used below)
ptn2 = r'^[^\x00-\x7f]+$'  # matches a token made only of non-ASCII characters
cantonese = []  # entry words, one per record
mandarin = []   # definition per record, "" when the record has none
pinyin = []     # list of romanisation tokens per record
n = 0
while n < len(a):
    cantonese.append(a[n])

    # Collect at most one romanisation token per character of the entry word.
    # Stop early at the first all-non-ASCII token, or when the data runs out
    # (the bounds check prevents an IndexError on a truncated last record).
    py = []
    m = n + 1
    for _ in range(len(a[n])):
        if m >= len(a) or re.search(ptn2, a[m]) is not None:
            break
        py.append(a[m])
        m += 1
    pinyin.append(py)

    if m >= len(a):
        # The data ended right after the romanisation: no definition.
        mandarin.append("")
        n = m
    elif m + 1 == len(a) or re.search(ptn2, a[m + 1]) is not None:
        # a[m] is the last token, or it is followed by another all-non-ASCII
        # token: treat a[m] as this record's definition and skip past it.
        mandarin.append(a[m])
        n = m + 1
    else:
        # a[m] is followed by a romanisation-like token, so a[m] starts the
        # next record and the current record has no definition.
        mandarin.append("")
        n = m