diff --git a/jieba/__init__.py b/jieba/__init__.py
index 0e894c6..6b066d0 100644
--- a/jieba/__init__.py
+++ b/jieba/__init__.py
@@ -297,7 +297,7 @@ def __lcut_for_search(sentence):
 
 
 @require_initialized
-def enable_parallel(processnum):
+def enable_parallel(processnum=None):
     global pool,cut,cut_for_search
     if os.name=='nt':
         raise Exception("jieba: parallel mode only supports posix system")
diff --git a/test/parallel/test_file.py b/test/parallel/test_file.py
index e10d1a2..01ce380 100644
--- a/test/parallel/test_file.py
+++ b/test/parallel/test_file.py
@@ -9,14 +9,13 @@ jieba.enable_parallel()
 url = sys.argv[1]
 content = open(url,"rb").read()
 t1 = time.time()
-words = list(jieba.cut(content))
+words = "/ ".join(jieba.cut(content))
 
 t2 = time.time()
 tm_cost = t2-t1
 
 log_f = open("1.log","wb")
-for w in words:
-    print >> log_f, w.encode("utf-8"), "/" ,
+log_f.write(words.encode('utf-8'))
 
 print 'speed' , len(content)/tm_cost, " bytes/second"
 
diff --git a/test/test_file.py b/test/test_file.py
index 288c2cc..6234e2a 100644
--- a/test/test_file.py
+++ b/test/test_file.py
@@ -8,14 +8,14 @@ jieba.initialize()
 url = sys.argv[1]
 content = open(url,"rb").read()
 t1 = time.time()
-words = list(jieba.cut(content))
+words = "/ ".join(jieba.cut(content))
 
 t2 = time.time()
 tm_cost = t2-t1
 
 log_f = open("1.log","wb")
-for w in words:
-    print >> log_f, w.encode("utf-8"), "/" ,
+log_f.write(words.encode('utf-8'))
+
 print 'cost',tm_cost
 print 'speed' , len(content)/tm_cost, " bytes/second"
 