基於 Python 結巴分詞（調用自定義詞庫，已去除停用詞）

# -*- coding: utf-8 -*- import time import jieba import jieba.posseg as pseg#用於詞性標註 #分詞 #停用詞過濾 def stop_word(fid1,fid2,fid3): stopword=[] for j in fid2.readlines(): stopword.append(j.s
相關文章
相關標籤/搜索