# Segment a Chinese text file with jieba: every input line is written to the
# output file as its tokens joined by '/ ', one output line per input line.
import jieba as jb

# Source text and destination for the segmented result.
INPUT_PATH = '/Users/momo/Desktop/小論文/模擬/紅樓夢/紅樓夢.txt'
OUTPUT_PATH = '/Users/momo/Desktop/小論文/模擬/紅樓夢/output.txt'

# Quick demo of jieba's full mode (cut_all=True) on a short sentence.
seg_list = jb.cut('你是誰', cut_all=True)
print("Full Mode:", "/ ".join(seg_list))  # full mode
# Output recorded from an earlier run:
# Full Mode: 你/ 是/ 誰

# The encoding is spelled out so the script does not depend on the platform's
# locale default. NOTE(review): assumes the source file is UTF-8 -- adjust the
# input encoding if it was saved in another one (e.g. Big5).
# The `with` block closes both files even if segmentation raises midway.
with open(INPUT_PATH, encoding='utf-8') as data, \
        open(OUTPUT_PATH, 'w', encoding='utf-8') as fout:
    for eachLine in data:
        # Strip surrounding whitespace (including the line terminator) before
        # segmenting: jieba yields whitespace as tokens of their own, which
        # would otherwise put a stray newline and a dangling '/' in the output.
        wordList = jb.cut(eachLine.strip())
        # Segment this line and write its tokens, '/ '-separated, as one line.
        fout.write('/ '.join(wordList) + '\n')
# TODO: 待學習:分詞流程處理,分詞字典應用 (to study: the word-segmentation pipeline and applying segmentation dictionaries)