You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
jieba/test/test_userdict.py

27 lines
551 B
Python

#encoding=utf-8
import sys
sys.path.append("../")
import jieba
jieba.load_userdict("userdict.txt")
import jieba.posseg as pseg
test_sent = "李小福是创新办主任也是云计算方面的专家"
words = jieba.cut(test_sent)
for w in words:
print w
result = pseg.cut(test_sent)
for w in result:
print w.word, "/", w.flag, ", ",
print "\n========"
terms = jieba.cut('easy_install is great')
for t in terms:
print t
print '-------------------------'
terms = jieba.cut('python 的正则表达式是好用的')
for t in terms:
print t