From a36b98b1fb465e43f67bf330e77d4c5d61e6deb2 Mon Sep 17 00:00:00 2001
From: Sun Junyi
Date: Sat, 29 Sep 2012 16:09:25 +0800
Subject: [PATCH] doc

---
 README.md | 29 +++++++++++++++++++++++++++++
 1 file changed, 29 insertions(+)
 create mode 100644 README.md

diff --git a/README.md b/README.md
new file mode 100644
index 0000000..2df4162
--- /dev/null
+++ b/README.md
@@ -0,0 +1,29 @@
+jieba
+========
+结巴中文分词:像结巴说话一样把所有词都分出来
+
+Usage
+========
+* 将jieba目录放置于当前目录或者site-packages目录
+
+
+
+代码示例
+
+    #encoding=utf-8
+    import jieba
+
+    seg_list = jieba.cut("我爱北京天安门")
+    print "/ ".join(seg_list)
+
+Output:
+    * 我/ 爱/ 北/ 北京/ 天/ 天安/ 天安门/ 门
+
+Performance
+=========
+* 1.5 MB / Second
+* Test Env: Intel(R) Core(TM) i7-2600 CPU @ 3.4GHz;《围城》.txt
+
+Example
+=========
+* 在线分词效果展示 https://jiebademo.appspot.com/ (需要翻墙)