version update

This commit is contained in:
fxsjy 2014-11-13 10:43:43 +08:00
parent 40c0edfd99
commit 315a411e52
3 changed files with 9 additions and 2 deletions

View File

@ -1,3 +1,10 @@
2014-11-13: version 0.35
1) 改进词典cache的dump和加载机制; by @gumblex
2) 提升关键词提取的性能; by @gumblex
3) 关键词提取新增基于textrank算法的子模块; by @singlee
4) 修复自定义stopwords功能的bug; by @walkskyer
2014-10-20: version 0.34
1. 提升性能，词典结构由Trie改为Prefix Set，内存占用减少2/3, 详见：https://github.com/fxsjy/jieba/pull/187 ; by @gumblex
2. 修复关键词提取功能的性能问题

View File

@ -54,7 +54,7 @@ def set_stop_words(stop_words_path):
if not os.path.exists(abs_path):
raise Exception("jieba: path does not exist: " + abs_path)
content = open(abs_path,'rb').read().decode('utf-8')
lines = content.split('\n')
lines = content.replace("\r","").split('\n')
for line in lines:
STOP_WORDS.add(line)

View File

@ -1,6 +1,6 @@
from distutils.core import setup
setup(name='jieba3k',
version='0.34',
version='0.35',
description='Chinese Words Segementation Utilities',
author='Sun, Junyi',
author_email='ccnusjy@gmail.com',