mirror of https://github.com/fxsjy/jieba.git
You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
43 lines
1.1 KiB
Python
43 lines
1.1 KiB
Python
#!/usr/bin/env python
|
|
# -*- coding: utf-8 -*-
|
|
|
|
import jieba
|
|
import threading
|
|
|
|
def inittokenizer(tokenizer, group):
|
|
print('===> Thread %s:%s started' % (group, threading.current_thread().ident))
|
|
tokenizer.initialize()
|
|
print('<=== Thread %s:%s finished' % (group, threading.current_thread().ident))
|
|
|
|
tokrs1 = [jieba.Tokenizer() for n in range(5)]
|
|
tokrs2 = [jieba.Tokenizer('../extra_dict/dict.txt.small') for n in range(5)]
|
|
|
|
thr1 = [threading.Thread(target=inittokenizer, args=(tokr, 1)) for tokr in tokrs1]
|
|
thr2 = [threading.Thread(target=inittokenizer, args=(tokr, 2)) for tokr in tokrs2]
|
|
for thr in thr1:
|
|
thr.start()
|
|
for thr in thr2:
|
|
thr.start()
|
|
for thr in thr1:
|
|
thr.join()
|
|
for thr in thr2:
|
|
thr.join()
|
|
|
|
del tokrs1, tokrs2
|
|
|
|
print('='*40)
|
|
|
|
tokr1 = jieba.Tokenizer()
|
|
tokr2 = jieba.Tokenizer('../extra_dict/dict.txt.small')
|
|
|
|
thr1 = [threading.Thread(target=inittokenizer, args=(tokr1, 1)) for n in range(5)]
|
|
thr2 = [threading.Thread(target=inittokenizer, args=(tokr2, 2)) for n in range(5)]
|
|
for thr in thr1:
|
|
thr.start()
|
|
for thr in thr2:
|
|
thr.start()
|
|
for thr in thr1:
|
|
thr.join()
|
|
for thr in thr2:
|
|
thr.join()
|