Merge branch 'dev'

2025-07-18 00:00:12 +08:00 · 2013-11-04 07:04:38 -08:00 · 2013-11-04 07:04:38 -08:00 · 1f65862c82
commit 1f65862c82
parent c701ddd14c 910a368afb
60 changed files with 720 additions and 1388 deletions
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@ -0,0 +1,2 @@
 # Top-level build script: declares the project and hands every target over to src/CMakeLists.txt.
 PROJECT(CPPJIEBA)
 ADD_SUBDIRECTORY(src)
--- a/README.md
+++ b/README.md
@ -7,41 +7,63 @@
 - `master`分支支持`utf8`编码   
 - `gbk`分支支持`gbk`编码
 ## 安装与使用
-## 模块详解
+### 下载和安装
-### Trie树
+```sh
-Trie.cpp/Trie.h 负责载入词典的trie树，主要供Segment模块使用。
+wget https://github.com/aszxqw/cppjieba/archive/master.zip -O cppjieba-master.zip
 unzip cppjieba-master.zip
 cd cppjieba-master
 mkdir build
 cd build
 cmake -DCMAKE_INSTALL_PREFIX=/usr ..
 make
 sudo make install
 ```
-### Segment模块
+### 卸载
 ```sh
 cd build/
 cat install_manifest.txt | sudo xargs rm -rf
 ```
-MPSegment.cpp/MPSegment.h 
+### 验证
 (Maximum Probability)最大概率法:负责根据Trie树构建有向无环图和进行动态规划算法，是分词算法的核心。
-HMMSegment.cpp/HMMSegment.h
+```sh
-是根据HMM模型来进行分词，主要算法思路是根据(B,E,M,S)四个状态来代表每个字的隐藏状态。
+cd test/
-HMM模型由dicts/下面的`hmm_model.utf8`提供。
+g++ -o segment.demo segment.cpp -L/usr/lib/CppJieba/ -lcppjieba
-分词算法即viterbi算法。
+./segment.demo # you will see the demo.
 ```
 运行一下 `./server` 或 `./segment` 都会有对应的帮助文档显示。
-### TransCode模块
+同时，如果想知道开发时如何使用`libcppjieba.a` 请看`test/segment.cpp`源代码即可。
-TransCode.cpp/TransCode.h 负责转换编码类型，将utf8和gbk转换成`uint16_t`类型，也负责逆转换。
+如果想知道如何搭建一个`cppjieba`中文分词的http服务请见 `test/server.cpp`源代码即可。
 若还有其他问题，欢迎`send mail`或者`open issue`。  :)
 ### 搭建服务
-## Demo
+```
 cd ./test
 g++ -o server server.cpp -L/usr/lib/CppJieba/ -L/usr/lib/CppJieba/Husky -lcppjieba -lhusky -lpthread
 ./server -n 4 -p 11258 -k start >> run.log 2>&1 #启动服务，监听11258这个端口。
 ./server -n 4 -p 11258 -k stop  #停止服务
 ```
 #### 验证服务
 然后用chrome浏览器打开`http://127.0.0.1:11258/?key=我来自北京邮电大学`
 (用chrome的原因是chrome的默认编码就是utf-8)
 或者用命令 `curl "http://127.0.0.1:11258/?key=我来自北京邮电大学"` (ubuntu中的curl安装命令`sudo apt-get install curl`)
 ## 分词效果
 ### MPSegment's demo
 __这部分的功能经过线上考验，一直稳定运行，暂时没有发现什么bug。__
 ```
 cd ./demo;
 make;
 ./segment_demo testlines.utf8
 ```
 Output:
 ```
 我来到北京清华大学
@ -59,12 +81,6 @@ Output:
 ### HMMSegment's demo
 ```
 cd ./demo;
 make;
 ./segment_demo testlines.utf8 --modelpath ../dicts/hmm_model.utf8 --algorithm cutHMM
 ```
 Output:
 ```
 我来到北京清华大学
@ -78,11 +94,6 @@ Output:
 ```
 ### MixSegment's demo
 ```
 cd ./demo;
 make;
 ./segment_demo testlines.utf8 --algorithm cutMix
 ```
 Output:
 ```
@ -98,62 +109,51 @@ Output:
 我/来自/北京邮电大学/。。。/学号/091111xx/。。。
 ```
 ### Server's demo
 引入了husky这个文件夹，husky是一个简单的http服务框架。    
 ```
 cd ./demo;
 make;
 ./start.sh #启动一个服务，监听11258这个端口(在start.sh里面指定)。
 ```
 关闭和重启分别是`stop.sh`和`restart.sh`
 然后用chrome浏览器打开`http://127.0.0.1:11258/?key=我来自北京邮电大学`
 (用chrome的原因是chrome的默认编码就是utf-8)
 或者用命令 `curl "http://127.0.0.1:11258/?key=我来自北京邮电大学"`
 ### 效果分析
 以上依次是MP,HMM,Mix三种方法的效果。  
 可以看出效果最好的是Mix，也就是融合MP和HMM的切词算法。既可以准确切出词典已有的词，又可以切出像"杭研"这样的未登录词。
-## Help
+
 ## 模块详解
 本项目主要是如下目录组成：
-### Limonp 
+### src
 核心目录，包含主要源代码。
 #### Trie树
 Trie.cpp/Trie.h 负责载入词典的trie树，主要供Segment模块使用。
 #### Segment模块
 MPSegment.cpp/MPSegment.h 
 (Maximum Probability)最大概率法:负责根据Trie树构建有向无环图和进行动态规划算法，是分词算法的核心。
 HMMSegment.cpp/HMMSegment.h
 是根据HMM模型来进行分词，主要算法思路是根据(B,E,M,S)四个状态来代表每个字的隐藏状态。
 HMM模型由dicts/下面的`hmm_model.utf8`提供。
 分词算法即viterbi算法。
 #### TransCode模块
 TransCode.cpp/TransCode.h 负责转换编码类型，将utf8和gbk转换成`uint16_t`类型，也负责逆转换。
 ### src/Husky
 提供服务的框架代码，
 详见：  https://github.com/aszxqw/husky
 ### src/Limonp 
 主要是一些工具函数，例如字符串操作等。    
 直接include就可以使用。
-### cppjieba
+详见：  https://github.com/aszxqw/limonp
 核心目录，包含主要源代码。
 make 之后产生libcppjieba.a
 使用方法参考如上cppcommon
 ### run `./segment_demo` to get help.
 如下:
 ```
 usage:
        ./segment_demo[options] <filename>
 options:
        --algorithm     Supported methods are [cutDAG, cutHMM, cutMix] for now.
                        If not specified, the default is cutDAG
        --dictpath      If not specified, the default is ../dicts/jieba.dict.utf8
        --modelpath     If not specified, the default is ../dicts/hmm_model.utf8
                        If not specified, the default is utf8.
 example:
        ./segment_demo testlines.utf8 --dictpath ../dicts/jieba.dict.utf8
        ./segment_demo testlines.utf8 --modelpath ../dicts/hmm_model.utf8 --algorithm cutHMM
        ./segment_demo testlines.utf8 --modelpath ../dicts/hmm_model.utf8 --algorithm cutMix
 ```
 ## 分词速度
@ -163,11 +163,11 @@ example:
 测试环境: `Intel(R) Xeon(R) CPU  E5506  @ 2.13GHz`
-## Contact
+## 联系方式
 如果有运行问题或者任何疑问，欢迎联系 : wuyanyi09@gmail.com
-## Thanks
+## 鸣谢
 "结巴中文"分词作者: SunJunyi  
 https://github.com/fxsjy/jieba
--- a/cppjieba/KeyWordExt.cpp
+++ b/cppjieba/KeyWordExt.cpp
@ -1,360 +0,0 @@
 /************************************
 * file enc : ASCII
 * author   : wuyanyi09@gmail.com
 ************************************/
 #include "KeyWordExt.h"
 namespace CppJieba
 {
    // Constructor: intentionally empty; the segmentation dictionary is loaded later by init().
    KeyWordExt::KeyWordExt()
    {
    }
    // Destructor: intentionally empty; _segment.dispose() is only invoked from dispose().
    KeyWordExt::~KeyWordExt()
    {
    }
    /**
     * Initialise the extractor by initialising its internal segmenter.
     *
     * @param segDictFile dictionary path forwarded unchanged to _segment.init().
     * @return true when the segmenter initialised, false (after logging) otherwise.
     */
    bool KeyWordExt::init(const char* const segDictFile)
    {
        LogInfo("KeyWordExt init start ...");
        const bool segmentReady = _segment.init(segDictFile);
        if(segmentReady)
        {
            return true;
        }
        LogError("_segment.init failed.");
        return false;
    }
    /**
     * Load the stop-word list from a text file, one word per line.
     *
     * Each line is decoded with TransCode::decode and inserted into _stopWords.
     *
     * @param filePath path of the stop-word file.
     * @return false if stop words were already loaded, the file is missing or
     *         cannot be opened, or any line fails to decode; true otherwise.
     */
    bool KeyWordExt::loadStopWords(const char * const filePath)
    {
        LogInfo("_loadStopWords(%s) start", filePath);
        if(!_stopWords.empty())
        {
            LogError("_stopWords has been loaded before! ");
            return false;
        }
        if(!checkFileExist(filePath))
        {
            LogError("cann't find file[%s].",filePath);
            return false;
        }
        ifstream ifile(filePath);
        // A file can exist and still be unreadable, so check the stream itself
        // instead of silently loading zero stop words.
        if(!ifile)
        {
            LogError("open file[%s] failed.", filePath);
            return false;
        }
        string line;
        Unicode word;
        while(getline(ifile, line))
        {
            if(!TransCode::decode(line, word))
            {
                LogError("decode failed .");
                return false;
            }
            _stopWords.insert(word);
        }
        // size() yields size_t; convert explicitly so the argument matches %d
        // (the logging macros are used printf-style throughout this file).
        LogInfo("load stopwords[%d] finished.", int(_stopWords.size()));
        return true;
    }
    // Tear down the extractor by forwarding to _segment.dispose().
    // The result of _segment.dispose() is not inspected; this function always returns true.
    bool KeyWordExt::dispose()
    {
        _segment.dispose();
        return true;
    }
    // Ordering predicate handed to sort(): a precedes b when a carries the larger weight,
    // which yields a descending-by-weight order.
    bool KeyWordExt::_wordInfoCompare(const KeyWordInfo& a, const KeyWordInfo& b)
    {
        return b.weight < a.weight;
    }
    /**
     * Score every entry and sort the list by descending weight.
     *
     * For each entry: idf = -logFreq and weight = log(word length + 1) * idf.
     *
     * @param wordInfos entries to score and reorder in place.
     * @return always true.
     */
    bool KeyWordExt::_sortWLIDF(vector<KeyWordInfo>& wordInfos)
    {
        for(vector<KeyWordInfo>::iterator it = wordInfos.begin(); it != wordInfos.end(); ++it)
        {
            it->idf = - it->logFreq;
            // Longer words get a larger multiplier.
            it->weight = log(double(it->word.size() + 1)) * it->idf;
        }
        sort(wordInfos.begin(), wordInfos.end(), _wordInfoCompare);
        return true;
    }
    /**
     * Keep only the first topN entries of wordInfos.
     *
     * The previous version stored the unsigned difference size() - topN in an
     * int (a narrowing conversion that only works while the sizes are small)
     * and then chose between a pop_back loop and a copy-and-swap. A single
     * range erase expresses the same result without any signed arithmetic.
     *
     * @param wordInfos list to truncate in place; left untouched when it
     *                  already holds topN entries or fewer.
     * @param topN      maximum number of entries to keep.
     * @return always true.
     */
    bool KeyWordExt::_extTopN(vector<KeyWordInfo>& wordInfos, uint topN)
    {
        if(wordInfos.size() > topN)
        {
            wordInfos.erase(wordInfos.begin() + topN, wordInfos.end());
        }
        return true;
    }
    bool KeyWordExt::extract(const vector<string>& words, vector<KeyWordInfo>& keyWordInfos, uint topN)
    {
        if(words.empty())
        {
            return false;
        }
        keyWordInfos.clear();
        for(uint i = 0; i < words.size(); i++)
        {
            Unicode uniWord;
            if(!TransCode::decode(words[i], uniWord))
            {
                LogError("decode failed");
                return false;
            }
            keyWordInfos.push_back(uniWord);
        }
        return _extract(keyWordInfos, topN);
    }
    bool KeyWordExt::extract(const string& title, vector<KeyWordInfo>& keyWordInfos, uint topN)
    {
        if(title.empty())
        {
            return false;
        }
        vector<TrieNodeInfo> trieNodeInfos; 
        Unicode unico;
        if(!TransCode::decode(title, unico))
        {
            return false;
        }
        _segment.cut(unico.begin(), unico.end(), trieNodeInfos);
        keyWordInfos.clear();
        for(uint i = 0; i < trieNodeInfos.size(); i++)
        {
            keyWordInfos.push_back(trieNodeInfos[i]);
        }
        return _extract(keyWordInfos, topN);
    }
    /**
     * Shared extraction pipeline: filter, score and sort, then truncate to topN.
     *
     * The stages run in that order and the first one that fails is logged and
     * stops the pipeline.
     *
     * @return true only when all three stages succeed.
     */
    bool KeyWordExt::_extract(vector<KeyWordInfo>& keyWordInfos, uint topN)
    {
        bool succeeded = false;
        if(!_filter(keyWordInfos))
        {
            LogError("_filter failed.");
        }
        else if(!_sortWLIDF(keyWordInfos))
        {
            LogError("_sortWLIDF failed.");
        }
        else if(!_extTopN(keyWordInfos, topN))
        {
            LogError("_extTopN failed.");
        }
        else
        {
            succeeded = true;
        }
        return succeeded;
    }
    /**
     * Run every candidate filter in a fixed order: duplicates, single-character
     * words, stop words, then words contained in another candidate.
     *
     * The first filter that fails is logged and stops the chain.
     *
     * @return true only when all four filters succeed.
     */
    bool KeyWordExt::_filter(vector<KeyWordInfo>& wordInfos)
    {
        bool succeeded = false;
        if(!_filterDuplicate(wordInfos))
        {
            LogError("_filterDuplicate failed.");
        }
        else if(!_filterSingleWord(wordInfos))
        {
            LogError("_filterSingleWord failed.");
        }
        else if(!_filterStopWords(wordInfos))
        {
            LogError("_filterStopWords failed.");
        }
        else if(!_filterSubstr(wordInfos))
        {
            LogError("_filterSubstr failed.");
        }
        else
        {
            succeeded = true;
        }
        return succeeded;
    }
    /**
     * Remove every entry whose word appears in the loaded stop-word set.
     * Does nothing when no stop words have been loaded.
     *
     * @return always true.
     */
    bool KeyWordExt::_filterStopWords(vector<KeyWordInfo>& wordInfos)
    {
        if(!_stopWords.empty())
        {
            vector<KeyWordInfo>::iterator cur = wordInfos.begin();
            while(cur != wordInfos.end())
            {
                if(_stopWords.count(cur->word) > 0)
                {
                    // erase() returns the iterator to the element that follows.
                    cur = wordInfos.erase(cur);
                }
                else
                {
                    ++cur;
                }
            }
        }
        return true;
    }
    /**
     * Drop repeated words, keeping the first occurrence of each and preserving
     * the relative order of the survivors.
     *
     * The previous version looked every word up twice (find, then insert) and
     * erased from the middle of the vector inside the loop, which is quadratic.
     * Here insert().second answers "was it new?" in one lookup, survivors are
     * compacted towards the front, and the tail is erased once.
     *
     * @return always true.
     */
    bool KeyWordExt::_filterDuplicate(vector<KeyWordInfo>& wordInfos)
    {
        set<Unicode> seen;
        size_t kept = 0;
        for(size_t i = 0; i < wordInfos.size(); i++)
        {
            if(seen.insert(wordInfos[i].word).second)
            {
                if(kept != i)
                {
                    wordInfos[kept] = wordInfos[i];
                }
                kept++;
            }
        }
        wordInfos.erase(wordInfos.begin() + kept, wordInfos.end());
        return true;
    }
    /**
     * Remove every entry whose word consists of exactly one Unicode element.
     *
     * @return always true.
     */
    bool KeyWordExt::_filterSingleWord(vector<KeyWordInfo>& wordInfos)
    {
        vector<KeyWordInfo>::iterator cur = wordInfos.begin();
        while(cur != wordInfos.end())
        {
            if(cur->word.size() != 1)
            {
                ++cur;
                continue;
            }
            cur = wordInfos.erase(cur);
        }
        return true;
    }
    /**
     * Remove every entry whose word occurs inside a different candidate word.
     *
     * The comparison list is a snapshot taken before anything is erased, so the
     * outcome does not depend on the order in which entries are removed.
     *
     * @return always true.
     */
    bool KeyWordExt::_filterSubstr(vector<KeyWordInfo>& wordInfos)
    {
        vector<Unicode> snapshot;
        for(vector<KeyWordInfo>::const_iterator it = wordInfos.begin(); it != wordInfos.end(); ++it)
        {
            snapshot.push_back(it->word);
        }
        vector<KeyWordInfo>::iterator cur = wordInfos.begin();
        while(cur != wordInfos.end())
        {
            if(!_isSubIn(snapshot, cur->word))
            {
                ++cur;
                continue;
            }
            cur = wordInfos.erase(cur);
        }
        return true;
    }
    //bool KeyWordExt::_isContainSubWords(const string& word)
    //{
    //    for(uint i = 0; i < _priorSubWords.size(); i++)
    //    {
    //        if(string::npos != word.find(_priorSubWords[i]))
    //        {
    //            return true;
    //        }
    //    }
    //    return false;
    //}
    //bool KeyWordExt::_prioritizeSubWords(vector<KeyWordInfo>& wordInfos)
    //{
    //    if(2 > wordInfos.size())
    //    {
    //        return true;
    //    }
    //    KeyWordInfo prior;
    //    bool flag = false;
    //    for(vector<KeyWordInfo>::iterator it = wordInfos.begin(); it != wordInfos.end(); )
    //    {
    //        if(_isContainSubWords(it->word))
    //        {
    //            prior = *it;
    //            it = wordInfos.erase(it);
    //            flag = true;
    //            break;
    //        }
    //        else
    //        {
    //            it ++;
    //        }
    //    }
    //    if(flag)
    //    {
    //        wordInfos.insert(wordInfos.begin(), prior);
    //    }
    //    return true;
    //}
 }
 #ifdef KEYWORDEXT_UT
 using namespace CppJieba;
 int main()
 {
    KeyWordExt ext;
    ext.init();
    if(!ext.loadSegDict("../dicts/segdict.gbk.v2.1"))
    {
        return 1;
    }
    ext._loadStopWords("../dicts/stopwords.gbk.v1.0");
    ifstream ifile("testtitle.gbk");
    vector<string> res;
    string line;
    while(getline(ifile, line))
    {
        cout<<line<<endl;
        res.clear();
        ext.extract(line, res, 20);
        PRINT_VECTOR(res);
    }
    ext.dispose();
    return 0;
 }
 #endif
--- a/cppjieba/KeyWordExt.h
+++ b/cppjieba/KeyWordExt.h
@ -1,68 +0,0 @@
 /************************************
 * file enc : ASCII
 * author   : wuyanyi09@gmail.com
 ************************************/
 #ifndef CPPJIEBA_KEYWORDEXT_H
 #define CPPJIEBA_KEYWORDEXT_H
 #include <logger.hpp>
 #include "MPSegment.h"
 #include "structs.h"
 namespace CppJieba
 {
    class KeyWordExt
    {
        private:
            MPSegment _segment;
            //vector<string> _priorSubWords;
            set<Unicode> _stopWords;
        public:
            KeyWordExt();
            ~KeyWordExt();
            bool init(const char* const segDictFile);
            bool dispose();
            bool loadStopWords(const char * const filePath);
        private:
            //bool _loadPriorSubWords(const char * const filePath);
        public:
            bool extract(const string& title, vector<KeyWordInfo>& keyWordInfos, uint topN);
            bool extract(const vector<string>& words, vector<KeyWordInfo>& keyWordInfos, uint topN);
        private:
            static bool _wordInfoCompare(const KeyWordInfo& a, const KeyWordInfo& b);
        private:
            bool _extract(vector<KeyWordInfo>& keyWordInfos, uint topN);
            bool _extTopN(vector<KeyWordInfo>& wordInfos, uint topN);
        private:
            //sort by word len - idf
            bool _sortWLIDF(vector<KeyWordInfo>& wordInfos);
        private:
            bool _filter(vector<KeyWordInfo>& );
            bool _filterDuplicate(vector<KeyWordInfo>& );
            bool _filterSingleWord(vector<KeyWordInfo>& );
            bool _filterSubstr(vector<KeyWordInfo>& );
            bool _filterStopWords(vector<KeyWordInfo>& );
        private:
            inline bool _isSubIn(const vector<Unicode>& words, const Unicode& word)const
            {
                for(uint j = 0; j < words.size(); j++)
                {
                    if(word != words[j] && words[j].end() != search(words[j].begin(), words[j].end(), word.begin(), word.end()))
                    {
                        return true;
                    }
                }
                return false;
            }
            //bool _prioritizeSubWords(vector<KeyWordInfo>& wordInfos);
            //bool _isContainSubWords(const string& word);
    };
 }
 #endif
--- a/cppjieba/Makefile
+++ b/cppjieba/Makefile
@ -1,66 +0,0 @@
 # Builds the static library libcppjieba.a from every .cpp in this directory,
 # plus optional per-module unit-test binaries (*.ut).
 # Debug flags are the default; pass RELEASE=YES for the optimised flag set.
 CXX    := g++
 LD     := g++
 AR     := ar rc
 DEBUG_CXXFLAGS     := -g -Wall -DDEBUG 
 RELEASE_CXXFLAGS   := -Wall -O3
 # NOTE(review): RELEASE_LDFLAGS / DEBUG_LDFLAGS are not defined in this file.
 ifeq (YES, ${RELEASE})
   CXXFLAGS     := ${RELEASE_CXXFLAGS}
   LDFLAGS      := ${RELEASE_LDFLAGS}
 else
   CXXFLAGS       := ${DEBUG_CXXFLAGS}
   LDFLAGS      := ${DEBUG_LDFLAGS}
 endif
 SOURCES := $(wildcard *.cpp)
 OBJS := $(patsubst %.cpp,%.o,$(SOURCES))
 INC := -I../limonp
 LIBA := libcppjieba.a
 # Intended to remove the objects after compilation; no targets are listed here.
 .INTERMEDIATE: 
 #.PHONY: clean $(CMLIB) 
 .PHONY: clean 
 all: $(LIBA)
 # Pattern rule: compile each .cpp into the matching .o.
 #.c.o: 
 %.o: %.cpp
 	$(CXX) -c $(CXXFLAGS) $< $(INC)
 # Archive all objects into the static library.
 ${LIBA}: $(OBJS)
 	$(AR) $@ $(OBJS) 
 # Unit tests: each target rebuilds the needed sources with that module's *_UT macro defined.
 # NOTE(review): $(CMLIB) is not defined in this file (its only other mention is commented out).
 Trie.ut: Trie.cpp Trie.h globals.h  TransCode.cpp TransCode.hpp $(CMLIB)
 	$(CXX) -o $@ $(CXXFLAGS) Trie.cpp TransCode.cpp  -DTRIE_UT $(CMLIB)
 MPSegment.ut: MPSegment.cpp Trie.cpp MPSegment.h Trie.h globals.h $(CMLIB)
 	$(CXX) -o $@ $(CXXFLAGS) MPSegment.cpp Trie.cpp TransCode.cpp -DSEGMENT_UT $(CMLIB) 
 KeyWordExt.ut: KeyWordExt.cpp KeyWordExt.h MPSegment.h Trie.h globals.h TransCode.cpp TransCode.hpp  $(CMLIB)
 	$(CXX) -o $@ $(CXXFLAGS) KeyWordExt.cpp MPSegment.cpp Trie.cpp TransCode.cpp -DKEYWORDEXT_UT $(CMLIB)
 TransCode.ut: TransCode.cpp TransCode.hpp globals.h $(CMLIB)
 	$(CXX) -o $@ $(CXXFLAGS) TransCode.cpp -DCPPJIEBA_TRANSCODE_UT $(CMLIB) 
 HMMSegment.ut: HMMSegment.cpp TransCode.cpp TransCode.hpp HMMSegment.h $(CMLIB)
 	$(CXX) -o $@ $(CXXFLAGS) TransCode.cpp HMMSegment.cpp -DHMMSEGMENT_UT $(CMLIB) 
 MixSegment.ut: MixSegment.cpp MixSegment.h HMMSegment.cpp MPSegment.cpp Trie.cpp MPSegment.h Trie.h globals.h $(CMLIB)
 	$(CXX) -o $@ $(CXXFLAGS) MixSegment.cpp HMMSegment.cpp MPSegment.cpp Trie.cpp TransCode.cpp -DMIXSEGMENT_UT $(CMLIB) 
 ChineseFilter.ut: ChineseFilter.cpp ChineseFilter.hpp
 	$(CXX) -o $@ $(CXXFLAGS) ChineseFilter.cpp -DUT
 clean:
 	rm -f *.o *.d *.d.* *.ut $(LIBA) 
 # Auto-generated header dependencies: one .d file per source, produced with $(CXX) -MM.
 sinclude $(SOURCES:.cpp=.d)
 %.d:%.cpp
 	@set -e; rm -f $@; \
 	$(CXX) -MM $< > $@.$$$$; \
 	sed 's,\($*\).o[ :]*,\1.o $@ : ,g' < $@.$$$$ > $@; \
 	rm -f $@.$$$$
--- a/demo/Makefile
+++ b/demo/Makefile
@ -1,53 +0,0 @@
 # Builds one <name>.demo executable per .cpp in this directory, linking each
 # against libcppjieba.a and libhusky.a (both built on demand in their own directories).
 # Unlike the library Makefiles, release flags are the default here; pass DEBUG=YES for debug flags.
 CXX    := g++
 LD     := g++
 AR     := ar rc
 DEBUG_CXXFLAGS     := -g -Wall -DDEBUG 
 RELEASE_CXXFLAGS   := -Wall -O3
 ifeq (YES, ${DEBUG})
   CXXFLAGS       := ${DEBUG_CXXFLAGS}
   LDFLAGS      := ${DEBUG_LDFLAGS}
 else
   CXXFLAGS     := ${RELEASE_CXXFLAGS}
   LDFLAGS      := ${RELEASE_LDFLAGS}
 endif
 INCS := -I../limonp
 LINK := -lpthread
 SOURCES := $(wildcard *.cpp)
 OBJS := $(patsubst %.cpp,%.o,$(SOURCES))
 DEMOS := $(patsubst %.cpp,%.demo,$(SOURCES))
 CPPJIEBADIR := ../cppjieba
 LIBCPPJIEBA := $(CPPJIEBADIR)/libcppjieba.a
 HUSKYDIR := ../husky
 LIBHUSKYA := $(HUSKYDIR)/libhusky.a
 # The cppjieba archive is declared phony, so its sub-make runs on every build.
 .PHONY: clean $(LIBCPPJIEBA) 
 all: $(DEMOS)
 # $^ expands to the demo source plus both static libraries.
 %.demo: %.cpp $(LIBCPPJIEBA) $(LIBHUSKYA)
 	$(CXX) -o $@ $(CXXFLAGS) $^ $(INCS) $(LINK)
 $(LIBCPPJIEBA): 
 	cd $(CPPJIEBADIR) && $(MAKE)
 $(LIBHUSKYA): 
 	cd $(HUSKYDIR) && $(MAKE)
 # Cleans this directory and both library directories.
 clean:
 	rm -f *.o *.ut *.d *.d.* $(DEMOS)
 	cd $(CPPJIEBADIR) && make clean
 	cd $(HUSKYDIR) && make clean
 # Auto-generated header dependencies: one .d file per source, produced with $(CXX) -MM.
 sinclude $(SOURCES:.cpp=.d)
 %.d:%.cpp
 	@set -e; rm -f $@; \
 	$(CXX) -MM $< > $@.$$$$; \
 	sed 's,\($*\).o[ :]*,\1.o $@ : ,g' < $@.$$$$ > $@; \
 	rm -f $@.$$$$
--- a/demo/example.sh
+++ b/demo/example.sh
@ -1,3 +0,0 @@
 # Runs segment.demo on testlines.utf8 three times: default algorithm with an
 # explicit dictionary, then cutHMM with an explicit model, then cutMix.
 ./segment.demo testlines.utf8 --dictpath ../dicts/jieba.dict.utf8 
 ./segment.demo testlines.utf8 --modelpath ../dicts/hmm_model.utf8 --algorithm cutHMM 
 ./segment.demo testlines.utf8 --algorithm cutMix
--- a/demo/keywordext.cpp
+++ b/demo/keywordext.cpp
@ -1,56 +0,0 @@
 #include <iostream>
 #include <fstream>
 #include <ArgvContext.hpp>
 #include "../cppjieba/KeyWordExt.h"
 using namespace CppJieba;
 /**
  * Run keyword extraction on every non-empty line of a file and print each
  * line followed by its joined keyword list.
  *
  * @param dictPath dictionary passed to KeyWordExt::init(); nothing is
  *                 processed when initialisation fails.
  * @param filePath text file read line by line.
  */
 void testKeyWordExt(const char * dictPath, const char * filePath)
 {
    KeyWordExt ext;
    if(ext.init(dictPath))
    {
        ifstream ifile(filePath);
        vector<KeyWordInfo> res;
        for(string line; getline(ifile, line); )
        {
            res.clear();
            if(line.empty())
            {
                continue;
            }
            // At most 20 keywords are requested per line.
            ext.extract(line, res, 20);
            cout<<line<<'\n'<<joinWordInfos(res)<<endl;
        }
        ext.dispose();
    }
 }
 const char * const DEFAULT_DICTPATH = "../dicts/jieba.dict.utf8";
 /**
  * Command-line entry point of the keyword extraction demo.
  *
  * Usage: <program> [options] <filename>
  *   --dictpath  dictionary file; DEFAULT_DICTPATH is used when omitted.
  *
  * @return -1 after printing usage when no argument is given, 0 otherwise.
  */
 int main(int argc, char ** argv)
 {
    if(2 > argc)
    {
        // The example used to advertise an --encoding option that is not
        // among the listed options; it now shows only --dictpath.
        cout<<"usage: \n\t"<<argv[0]<<" [options] <filename>\n"
            <<"options:\n"
            <<"\t--dictpath\tIf not specified, the default is "<<DEFAULT_DICTPATH<<"\n"
            <<"examples:\n"
            <<"\t"<<argv[0]<<" testlines.utf8 --dictpath ../dicts/jieba.dict.utf8\n"
            <<endl;
        return -1;
    }
    ArgvContext arg(argc, argv);
    string dictPath = arg["--dictpath"];
    if(dictPath.empty())
    {
        dictPath = DEFAULT_DICTPATH;
    }
    // arg[1] is passed as the input file path.
    testKeyWordExt(dictPath.c_str(), arg[1].c_str());
    return 0;
 }
--- a/demo/segment.cpp
+++ b/demo/segment.cpp
@ -1,124 +0,0 @@
 #include <iostream>
 #include <fstream>
 #include <ArgvContext.hpp>
 #include "../cppjieba/MPSegment.h"
 #include "../cppjieba/HMMSegment.h"
 #include "../cppjieba/MixSegment.h"
 using namespace CppJieba;
 MPSegment seg;
 HMMSegment hmmseg;
 MixSegment mixseg;
 /**
  * Initialise the three global segmenters in order: seg, hmmseg, mixseg.
  *
  * Stops at the first failure and prints which one failed.
  *
  * @param dictPath  dictionary file for seg and mixseg.
  * @param modelPath HMM model file for hmmseg and mixseg.
  * @return true only when all three initialised.
  */
 bool init(const char * const dictPath, const char * const modelPath)
 {
    bool ready = false;
    if(!seg.init(dictPath))
    {
        cout<<"seg init failed."<<endl;
    }
    else if(!hmmseg.init(modelPath))
    {
        cout<<"hmmseg init failed."<<endl;
    }
    else if(!mixseg.init(dictPath, modelPath))
    {
        cout<<"mixseg init failed."<<endl;
    }
    else
    {
        ready = true;
    }
    return ready;
 }
 /**
  * Segment every non-empty line of a file and print the line followed by its
  * words joined with "/".
  *
  * @param seg      segmenter to use (this parameter shadows the global seg).
  * @param filePath text file read line by line.
  */
 void cut(const ISegment * seg, const char * const filePath)
 {
    ifstream ifile(filePath);
    vector<string> res;
    for(string line; getline(ifile, line); )
    {
        if(line.empty())
        {
            continue;
        }
        res.clear();
        seg->cut(line, res);
        cout<<line<<"\n"<<joinStr(res,"/")<<endl;
    }
 }
 /**
  * Dispose of the three global segmenters in order: seg, hmmseg, mixseg.
  *
  * Stops at the first failure. The messages now name the segmenter that
  * actually failed; all three used to print "seg dispose failed.".
  *
  * @return true only when all three were disposed.
  */
 bool dispose()
 {
    if(!seg.dispose())
    {
        cout<<"seg dispose failed."<<endl;
        return false;
    }
    if(!hmmseg.dispose())
    {
        cout<<"hmmseg dispose failed."<<endl;
        return false;
    }
    if(!mixseg.dispose())
    {
        cout<<"mixseg dispose failed."<<endl;
        return false;
    }
    return true;
 }
 const char * const DEFAULT_DICTPATH = "../dicts/jieba.dict.utf8";
 const char * const DEFAULT_MODELPATH = "../dicts/hmm_model.utf8";
 /**
  * Command-line entry point of the segmentation demo.
  *
  * Usage: <program> [options] <filename>
  *   --algorithm  cutDAG (default), cutHMM or cutMix.
  *   --dictpath   dictionary file; DEFAULT_DICTPATH when omitted.
  *   --modelpath  HMM model file; DEFAULT_MODELPATH when omitted.
  *
  * @return -1 when no argument is given or initialisation fails, 0 otherwise.
  */
 int main(int argc, char ** argv)
 {
    if(argc < 2)
    {
        // A space now separates the program name from "[options]"; the two
        // used to be printed glued together.
        cout<<"usage: \n\t"<<argv[0]<<" [options] <filename>\n"
            <<"options:\n"
            <<"\t--algorithm\tSupported methods are [cutDAG, cutHMM, cutMix] for now. \n\t\t\tIf not specified, the default is cutDAG\n"
            <<"\t--dictpath\tIf not specified, the default is "<<DEFAULT_DICTPATH<<'\n'
            <<"\t--modelpath\tIf not specified, the default is "<<DEFAULT_MODELPATH<<'\n'
            <<"example:\n"
            <<"\t"<<argv[0]<<" testlines.utf8 --dictpath ../dicts/jieba.dict.utf8\n"
            <<"\t"<<argv[0]<<" testlines.utf8 --modelpath ../dicts/hmm_model.utf8 --algorithm cutHMM\n"
            <<"\t"<<argv[0]<<" testlines.utf8 --modelpath ../dicts/hmm_model.utf8 --algorithm cutMix\n"
            <<endl;
        return -1;
    }
    ArgvContext arg(argc, argv);
    string dictPath = arg["--dictpath"];
    string modelPath = arg["--modelpath"];
    string algorithm = arg["--algorithm"];
    if(dictPath.empty())
    {
        dictPath = DEFAULT_DICTPATH;
    }
    if(modelPath.empty())
    {
        modelPath = DEFAULT_MODELPATH;
    }
    if(!init(dictPath.c_str(), modelPath.c_str()))
    {
        LogError("init failed.");
        return -1;
    }
    // Any algorithm name other than cutHMM / cutMix falls back to the MP segmenter.
    if("cutHMM" == algorithm)
    {
        cut(&hmmseg, arg[1].c_str());
    }
    else if("cutMix" == algorithm)
    {
        cut(&mixseg, arg[1].c_str());
    }
    else
    {
        cut(&seg, arg[1].c_str());
    }
    dispose();
    return 0;
 }
--- a/husky/Makefile
+++ b/husky/Makefile
@ -1,42 +0,0 @@
 # Builds the static library libhusky.a from every .cpp in this directory.
 # Debug flags are the default; pass RELEASE=YES for the optimised flag set.
 CXX    := g++
 LD     := g++
 AR     := ar rc
 DEBUG_CXXFLAGS     := -g -Wall -DDEBUG 
 RELEASE_CXXFLAGS   := -Wall -O3
 ifeq (YES, ${RELEASE})
   CXXFLAGS     := ${RELEASE_CXXFLAGS}
   LDFLAGS      := ${RELEASE_LDFLAGS}
 else
   CXXFLAGS       := ${DEBUG_CXXFLAGS}
   LDFLAGS      := ${DEBUG_LDFLAGS}
 endif
 # NOTE(review): DOLINK is defined with := (immediate expansion) and is not used by any rule in this file.
 DOLINK := $(LD) $(LDFLAGS) -o $@ $^
 DOPACK := $(AR)  
 SOURCES = $(wildcard *.cpp)
 OBJS := $(patsubst %.cpp,%.o,$(SOURCES))
 INC := -I../limonp
 LIBA := libhusky.a
 .PHONY: clean 
 all: $(LIBA)
 # Pattern rule: compile each .cpp into the matching .o.
 %.o: %.cpp
 	$(CXX) -c $(CXXFLAGS) $< $(INC)
 # Archive all objects into the static library.
 ${LIBA}: $(OBJS) 
 	$(DOPACK) $@ $(OBJS) 
 clean:
 	rm -f *.o *.d *.d.* $(LIBA) 
 # Auto-generated header dependencies: one .d file per source, produced with $(CXX) -MM.
 sinclude $(SOURCES:.cpp=.d)
 %.d:%.cpp
 	@set -e; rm -f $@; \
 	$(CXX) -MM $< > $@.$$$$; \
 	sed 's,\($*\).o[ :]*,\1.o $@ : ,g' < $@.$$$$ > $@; \
 	rm -f $@.$$$$
--- a/limonp/map_functs.hpp
+++ b/limonp/map_functs.hpp
@ -1,123 +0,0 @@
 /************************************
 * file enc : ascii
 * author   : wuyanyi09@gmail.com
 ************************************/
 #ifndef LIMONP_MAP_FUNCTS_H
 #define LIMONP_MAP_FUNCTS_H
 #include <map>
 #include <set>
 #include <iostream>
 #include <sstream>
 #include "typedefs.h"
 namespace Limonp
 {
    using namespace std;
    // Render a set as "{a, b, c}" in iteration order; an empty set yields "{}".
    template <typename T>
        string setToString(const set<T>& st)
        {
            stringstream ss;
            ss<<'{';
            bool needSeparator = false;
            for(typename set<T>::const_iterator it = st.begin(); it != st.end(); ++it)
            {
                if(needSeparator)
                {
                    ss<<", ";
                }
                ss<<*it;
                needSeparator = true;
            }
            ss<<'}';
            return ss.str();
        }
    // Render a map as "{k1: v1, k2: v2}" in key order; an empty map yields "{}".
    template<typename T1, typename T2>
        string mapToString(const map<T1, T2>& mp)
        {
            stringstream ss;
            ss<<'{';
            bool needSeparator = false;
            for(typename map<T1, T2>::const_iterator it = mp.begin(); it != mp.end(); ++it)
            {
                if(needSeparator)
                {
                    ss<<", ";
                }
                ss<<it->first<<": "<<it->second;
                needSeparator = true;
            }
            ss<<'}';
            return ss.str();
        }
    template<typename T1, typename T2>
        string HashMapToString(const HashMap<T1, T2>& mp)
        {
            if(mp.empty())
            {
                return "{}";
            }
            stringstream ss;
            ss<<'{';
            typename HashMap<T1, T2>::const_iterator it = mp.begin();
            ss<<it->first<<": "<<it->second;
            it++;
            while(it != mp.end())
            {
                ss<<", "<<it->first<<": "<<it->second;
                it++;
            }
            ss<<'}';
            return ss.str();
        }
    // Render a pair as "first:second" (no spaces around the colon).
    template<typename T1, typename T2>
        string pairToString(const pair<T1, T2>& p)
        {
            stringstream out;
            out<<p.first;
            out<<":";
            out<<p.second;
            return out.str();
        }
    // Print every entry to cout as "key value", one entry per line, in key order.
    template<class kT, class vT>
        void printMap(const map<kT, vT>& mp)
        {
            typename map<kT, vT>::const_iterator cur = mp.begin();
            while(cur != mp.end())
            {
                cout<<cur->first<<' '<<cur->second<<endl;
                cur++;
            }
        }
    // Look key up in mp; return a copy of the mapped value, or defaultVal when the key is absent.
    template<class kT, class vT>
        vT getMap(const map<kT, vT>& mp, const kT & key, const vT & defaultVal)
        {
            const typename map<kT, vT>::const_iterator found = mp.find(key);
            if(found != mp.end())
            {
                return found->second;
            }
            return defaultVal;
        }
    // Append every (key, value) entry of mp to res in key order; existing contents of res are kept.
    template<class kT, class vT>
        void map2Vec(const map<kT, vT>& mp, vector<pair<kT, vT> > & res)
        {
            res.insert(res.end(), mp.begin(), mp.end());
        }
 }
 #endif
--- a/limonp/typedefs.h
+++ b/limonp/typedefs.h
@ -1,21 +0,0 @@
 /************************************
 * file enc : utf8
 * author   : wuyanyi09@gmail.com
 ************************************/
 #ifndef LIMONP_TYPEDEFS_H
 #define LIMONP_TYPEDEFS_H
 #include <stdint.h>
 #include <vector>
 #include <sys/types.h>
 #include <tr1/unordered_map>
 #define HashMap std::tr1::unordered_map
 namespace Limonp
 {
    // Unicode: text held as a sequence of uint16_t values, one element per unit.
    typedef std::vector<uint16_t> Unicode;
    // Read-only iterator over a Unicode sequence.
    typedef std::vector<uint16_t>::const_iterator UnicodeConstIterator;
 }
 #endif
--- a/limonp/vec_functs.hpp
+++ b/limonp/vec_functs.hpp
@ -1,142 +0,0 @@
 /************************************
 * file enc : ascii
 * author   : wuyanyi09@gmail.com
 ************************************/
 #ifndef LIMONP_VEC_FUNCTS_H
 #define LIMONP_VEC_FUNCTS_H
 #include <iostream>
 #include <vector>
 #include <algorithm>
 #include <queue>
 #include <string>
 #include <iostream>
 #include <string>
 #include <vector>
 #include <utility>
 #include <algorithm>
 #include <sstream>
 #define FOR_VECTOR(vec, i) for(size_t i = 0; i < vec.size(); i++)
 #define PRINT_VECTOR(vec) FOR_VECTOR(vec, i)\
 {\
    cout<<vec[i]<<endl;\
 }
 #define PRINT_MATRIX(mat) FOR_VECTOR(mat, i) \
 {\
    FOR_VECTOR(mat[i], j)\
    {\
        cout<<"["<<i<<","<<j<<"]:"<<mat[i][j]<<endl;\
    }\
 }
 namespace Limonp
 {
    using namespace std;
    /**
     * Render a vector as ["a", "b", "c"] into res.
     *
     * The loop index is now size_t: the previous `uint` is a non-standard
     * typedef that none of this header's own includes declares.
     *
     * @param vec elements to render; each is streamed with operator<<.
     * @param res receives the text; set to "[]" for an empty vector.
     * @return false when vec is empty, true otherwise.
     */
    template <typename T>
        bool vecToString(const vector<T>& vec, string& res)
        {
            if(vec.empty())
            {
                res = "[]";
                return false;
            }
            stringstream ss;
            ss<<"[\""<<vec[0];
            for(size_t i = 1; i < vec.size(); i++)
            {
                ss<<"\", \""<<vec[i];
            }
            ss<<"\"]";
            res = ss.str();
            return true;
        }
    /**
     * Convenience overload returning the rendered text directly
     * ("[]" for an empty vector).
     */
    template <typename T>
        string vecToString(const vector<T>& vec)
        {
            string res;
            vecToString(vec, res);
            return res;
        }
 	// Linear membership test: true when some element of vec compares equal to item.
 	template<typename T>
 		bool isInVec(const vector<T>& vec, const T& item)
 		{
 			for(typename vector<T>::const_iterator cur = vec.begin(); cur != vec.end(); ++cur)
 			{
 				if(*cur == item)
 				{
 					return true;
 				}
 			}
 			return false;
 		}
 	/**
 	 * Split vecSrc at every element that equals one of patterns, remembering
 	 * which pattern preceded each piece.
 	 *
 	 * Each non-empty run of non-pattern elements is appended to outVec as
 	 * (pattern, run), where pattern is the most recent delimiter seen before
 	 * the run. A run that comes before any delimiter is paired with a
 	 * value-initialised T.
 	 *
 	 * Two fixes over the previous version:
 	 *  - pattern is value-initialised; for built-in T it used to be read
 	 *    uninitialised when the input did not start with a delimiter.
 	 *  - the pair is constructed directly; make_pair with explicit template
 	 *    arguments does not accept lvalues since C++11.
 	 */
 	template<typename T>
 		void splitVec(const vector<T>& vecSrc, vector< pair<T, vector<T> > >& outVec, const vector<T>& patterns)
 		{
 			vector<T> tmp;
 			T pattern = T();
 			size_t patternSize = patterns.size();
 			for(size_t i = 0; i < vecSrc.size(); i++)
 			{
 				// patternSize doubles as the "no match" marker.
 				size_t patternPos = patternSize;
 				for(size_t j = 0; j < patternSize; j++)
 				{
 					if(patterns[j] == vecSrc[i])
 					{
 						patternPos = j;
 						break;
 					}
 				}
 				if(patternPos != patternSize)
 				{
 					if(!tmp.empty())
 					{
 						outVec.push_back(pair<T, vector<T> >(pattern, tmp));
 						tmp.clear();
 					}
 					pattern = patterns[patternPos];
 				}
 				else
 				{
 					tmp.push_back(vecSrc[i]);
 				}
 			}
 			if(!tmp.empty())
 			{
 				outVec.push_back(pair<T, vector<T> >(pattern, tmp));
 			}
 		}
 	/**
 	 * Split vecSrc at every element that equals one of patternVec.
 	 *
 	 * Each non-empty run of non-delimiter elements is appended to outVec;
 	 * the delimiters themselves are dropped and empty runs are skipped.
 	 */
 	template<typename T>
 		void splitVec(const vector<T>& vecSrc, vector< vector<T> >& outVec, const vector<T>& patternVec)
 		{
 			vector<T> current;
 			for(typename vector<T>::const_iterator it = vecSrc.begin(); it != vecSrc.end(); ++it)
 			{
 				if(find(patternVec.begin(), patternVec.end(), *it) == patternVec.end())
 				{
 					current.push_back(*it);
 					continue;
 				}
 				// Delimiter reached: flush the run collected so far.
 				if(!current.empty())
 				{
 					outVec.push_back(current);
 					current.clear();
 				}
 			}
 			if(!current.empty())
 			{
 				outVec.push_back(current);
 			}
 		}
 }
 #endif
--- a/scripts/add_header.sh
+++ b/scripts/add_header.sh
@ -1 +0,0 @@
 # Inserts the file-encoding/author banner comment before line 1 of every .h, .cpp and .tcc file in ../src (edits the files in place).
 sed -i '1i/************************************\n * file enc : utf8\n * author   : wuyanyi09@gmail.com\n************************************/' ../src/*.h ../src/*.cpp ../src/*.tcc 
--- a/scripts/check_dict.py
+++ b/scripts/check_dict.py
@ -1,29 +0,0 @@
 #!/usr/bin/python
 # Validate dictionary files given on the command line.
 #
 # Every line must be "word count tag" separated by single spaces, the word
 # must not have appeared earlier (across all files), and the count must be a
 # positive integer. The first offending line is reported and the script exits
 # with status 1; "OK" is printed when every line passes.
 import sys
 def fail(fname, i, line):
    # Report the offending line (i is the 0-based line index) and stop.
    print("error file[%s] line[%s] : %s" % (fname, i, line))
    sys.exit(1)
 if len(sys.argv) == 1:
    # The script name is now interpolated; "%s" used to be printed literally.
    print("usage : %s dict_file1 dict_file2 ..." % sys.argv[0])
    sys.exit(1)
 seen = set()
 for fname in sys.argv[1:]:
    with open(fname, "r") as fin:
        for i, line in enumerate(fin):
            try:
                word, cnt, tag = line.strip().split(" ")
                valid = word not in seen and int(cnt) > 0
            except Exception:
                # Wrong field count or a non-numeric count.
                valid = False
            if not valid:
                fail(fname, i, line)
            seen.add(word)
 print("OK")
--- a/scripts/filter_dict.py
+++ b/scripts/filter_dict.py
@ -1,23 +0,0 @@
 #!/usr/bin/python
 import sys
 if len(sys.argv) == 1:
    print "usage : %s dict_file_path"
    exit(1)
 d = {}
 with open(sys.argv[1], "r") as fin:
    for i, line in enumerate(fin):
        word, cnt, tag = line.strip().split(" ")
        if word in d:
            #print "error file[%s] line[%s] : %s" %(fname, i, line)
            #exit(1)
            continue
        else:
            d[word] = True
        if 0 >= int(cnt) :
            continue
        print line.strip()
--- a/scripts/iconv_dict.py
+++ b/scripts/iconv_dict.py
@ -1,15 +0,0 @@
 #!/usr/bin/python
 import sys
 if len(sys.argv) != 4:
    print "usage : %s from_enc to_enc dict_file_path \nexample: %s gbk utf-8 fname" %(__file__, __file__)
    exit(1)
 with open(sys.argv[3], "r") as fin:
    for i, line in enumerate(fin):
        try:
            print line.strip().decode(sys.argv[1]).encode(sys.argv[2])
        except Exception as err:
            print >> sys.stderr, err
--- a/scripts/restart.sh
+++ b/scripts/restart.sh
--- a/scripts/start.sh
+++ b/scripts/start.sh
--- a/scripts/stop.sh
+++ b/scripts/stop.sh
--- a/src/CMakeLists.txt
+++ b/src/CMakeLists.txt
@ -0,0 +1,23 @@
 # Build outputs are collected under the binary dir: executables in bin/, libraries in lib/.
 SET(EXECUTABLE_OUTPUT_PATH ${PROJECT_BINARY_DIR}/bin)
 SET(LIBRARY_OUTPUT_PATH ${PROJECT_BINARY_DIR}/lib)
 # Sources compiled into the cppjieba static library.
 SET(LIBCPPJIEBA_SRC HMMSegment.cpp MixSegment.cpp  MPSegment.cpp  Trie.cpp)
 ADD_LIBRARY(cppjieba STATIC ${LIBCPPJIEBA_SRC})
 # Two executables, each built from a single source file.
 ADD_EXECUTABLE(segment segment.cpp)
 ADD_EXECUTABLE(server server.cpp)
 # NOTE(review): per the CMake documentation LINK_DIRECTORIES only applies to
 # targets created after it is called, and segment/server are created above.
 # Confirm whether this line has any effect.
 LINK_DIRECTORIES(husky)
 TARGET_LINK_LIBRARIES(segment cppjieba)
 # server additionally links the husky library and pthread.
 TARGET_LINK_LIBRARIES(server cppjieba husky pthread)
 SET_TARGET_PROPERTIES(cppjieba PROPERTIES VERSION 1.2 SOVERSION 1)
 # Install layout relative to CMAKE_INSTALL_PREFIX: lib/CppJieba, bin/CppJieba, include/CppJieba.
 INSTALL(TARGETS cppjieba ARCHIVE DESTINATION lib/CppJieba)
 INSTALL(TARGETS segment RUNTIME DESTINATION bin/CppJieba)
 INSTALL(TARGETS server RUNTIME DESTINATION bin/CppJieba)
 INSTALL(FILES ChineseFilter.hpp HMMSegment.h MPSegment.h structs.h Trie.h globals.h ISegment.hpp  MixSegment.h  SegmentBase.hpp  TransCode.hpp  DESTINATION include/CppJieba)
 # Sub-projects with their own CMakeLists.txt.
 ADD_SUBDIRECTORY(Husky)
 ADD_SUBDIRECTORY(Limonp)
--- a/cppjieba/ChineseFilter.hpp
+++ b/cppjieba/ChineseFilter.hpp
--- a/cppjieba/HMMSegment.cpp
+++ b/cppjieba/HMMSegment.cpp
--- a/cppjieba/HMMSegment.h
+++ b/cppjieba/HMMSegment.h
@ -4,8 +4,8 @@
 #include <iostream>
 #include <fstream>
 #include <memory.h>
-#include <str_functs.hpp>
+#include "Limonp/str_functs.hpp"
-#include <logger.hpp>
+#include "Limonp/logger.hpp"
 #include "globals.h"
 #include "TransCode.hpp"
 #include "ISegment.hpp"
--- a/src/Husky/CMakeLists.txt
+++ b/src/Husky/CMakeLists.txt
@ -0,0 +1,8 @@
 # Build outputs are collected under the binary dir: executables in bin/, libraries in lib/.
 SET(EXECUTABLE_OUTPUT_PATH ${PROJECT_BINARY_DIR}/bin)
 SET(LIBRARY_OUTPUT_PATH ${PROJECT_BINARY_DIR}/lib)
 # Sources compiled into the husky static library.
 SET(LIBHUSKY_SRC Daemon.cpp  ServerFrame.cpp)
 ADD_LIBRARY(husky STATIC ${LIBHUSKY_SRC})
 # Install the archive and the headers under the CppJieba/Husky sub-directories.
 INSTALL(TARGETS husky ARCHIVE DESTINATION lib/CppJieba/Husky)
 INSTALL(FILES Daemon.h globals.h HttpReqInfo.hpp ServerFrame.h ThreadManager.hpp DESTINATION include/CppJieba/Husky)
--- a/src/Husky/Daemon.cpp
+++ b/src/Husky/Daemon.cpp
--- a/src/Husky/Daemon.h
+++ b/src/Husky/Daemon.h
@ -8,7 +8,7 @@
 #include <sys/wait.h>
 #include <sys/stat.h>
 #include <signal.h>
-#include <logger.hpp>
+#include "../Limonp/logger.hpp"
 #include "ServerFrame.h"
 namespace Husky
--- a/src/Husky/HttpReqInfo.hpp
+++ b/src/Husky/HttpReqInfo.hpp
@ -3,14 +3,14 @@
 #include <iostream>
 #include <string>
 #include "../Limonp/logger.hpp"
 #include "../Limonp/str_functs.hpp"
 #include "globals.h"
 #include <str_functs.hpp>
 #include <logger.hpp>
 #include <map_functs.hpp>
 namespace Husky
 {
    using namespace Limonp;
    using namespace std;
    static const char* const KEY_METHOD = "METHOD";
    static const char* const KEY_PATH = "PATH";
@ -130,7 +130,8 @@ namespace Husky
                        LogFatal("headerStr illegal.");
                        return false;
                    }
-                    _headerMap[upperStr(k)] = v;
+                    upper(k);
                    _headerMap[k] = v;
                    lpos = rpos + 1;
                }
                //message header end
@ -160,6 +161,8 @@ namespace Husky
            HashMap<string, string> _headerMap;
            HashMap<string, string> _methodGetMap;
            HashMap<string, string> _methodPostMap;
            //public:
            friend ostream& operator<<(ostream& os, const HttpReqInfo& obj);
        private:
            bool _find(const HashMap<string, string>& mp, const string& key, string& res)const
            {
@ -171,19 +174,6 @@ namespace Husky
                res = it->second;
                return true;
            }
        public:
            //string toString() const;// function for debug because of heavy time consuming
            string toString() const
            {
                string res("{");
                res += HashMapToString(_headerMap);
                res += ",";
                res += HashMapToString(_methodGetMap);
                res += ",";
                res += HashMapToString(_methodPostMap);
                res += "}";
                return res;
            }
        private:
            bool _parseUrl(const string& url, HashMap<string, string>& mp)
            {
@ -226,6 +216,11 @@ namespace Husky
            }
    };
    inline std::ostream& operator << (std::ostream& os, const Husky::HttpReqInfo& obj)
    {
        return os << obj._headerMap << obj._methodGetMap << obj._methodPostMap;
    }
 }
 #endif
--- a/src/Husky/ServerFrame.cpp
+++ b/src/Husky/ServerFrame.cpp
@ -134,13 +134,13 @@ namespace Husky
            nRetCode = recv(hClientSock, chRecvBuf, RECV_BUFFER, 0);	
            strRec = chRecvBuf;
-#ifdef DEBUG
+#ifdef HUKSY_DEBUG
-            LogDebug("response[%s]", strRec.c_str());
+            LogDebug("request[%s]", strRec.c_str());
 #endif
            if(SOCKET_ERROR==nRetCode)
            {
-                LogError("error [%s]", strerror(errno));
+                LogDebug("error [%s]", strerror(errno));
                closesocket(hClientSock);
                continue;
            }
@ -160,15 +160,15 @@ namespace Husky
            strHttpResp=chHttpHeader;
            strHttpResp+=strSnd;
 #ifdef HUKSY_DEBUG
            LogDebug("response'body [%s]", strSnd.c_str());
 #endif
            if (SOCKET_ERROR==send(hClientSock,strHttpResp.c_str(),strHttpResp.length(),0))
            {
                LogError("error [%s]", strerror(errno));
            }
 #ifdef DEBUG
            LogDebug("send response [%s] ", strHttpResp.c_str());
 #endif
            closesocket(hClientSock);
        }
--- a/src/Husky/ServerFrame.h
+++ b/src/Husky/ServerFrame.h
--- a/src/Husky/ThreadManager.hpp
+++ b/src/Husky/ThreadManager.hpp
--- a/src/Husky/globals.h
+++ b/src/Husky/globals.h
--- a/cppjieba/ISegment.hpp
+++ b/cppjieba/ISegment.hpp
--- a/src/Limonp/ArgvContext.hpp
+++ b/src/Limonp/ArgvContext.hpp
@ -10,7 +10,6 @@
 #include <sstream>
 #include "str_functs.hpp"
 #include "map_functs.hpp"
 #include "vec_functs.hpp"
 namespace Limonp
 {
@ -43,12 +42,7 @@ namespace Limonp
            }
            ~ArgvContext(){};
        public:
-            string toString()
+            friend ostream& operator << (ostream& os, const ArgvContext& args); 
            {
                stringstream ss;
                ss<<vecToString<string>(_args)<<mapToString<string, string>(_mpss)<<setToString<string>(_sset);
                return ss.str();
            }
            string operator [](uint i)
            {
                if(i < _args.size())
@ -81,6 +75,16 @@ namespace Limonp
            set<string> _sset; 
    };
    inline ostream& operator << (ostream& os, const ArgvContext& args)
    {
        return os<<args._args<<args._mpss<<args._sset;
    }
            //string toString()
            //{
            //    stringstream ss;
            //    return ss.str();
            //}
 }
 #endif
--- a/src/Limonp/CMakeLists.txt
+++ b/src/Limonp/CMakeLists.txt
@ -0,0 +1,2 @@
 # Nothing is compiled here: collect every .hpp in this directory and
 # install the set under include/CppJieba/Limonp.
 FILE(GLOB HEAD_HPP_LIST "*.hpp")
 INSTALL(FILES ${HEAD_HPP_LIST} DESTINATION include/CppJieba/Limonp)
--- a/src/Limonp/MysqlClient.hpp
+++ b/src/Limonp/MysqlClient.hpp
@ -6,7 +6,6 @@
 #include <vector>
 #include <string>
 #include "logger.hpp"
 #include "vec_functs.hpp"
 namespace Limonp
 {
@ -21,8 +20,9 @@ namespace Limonp
            const char * const USER;
            const char * const PASSWD;
            const char * const DB;
            const char * const CHARSET;
        public:
-            MysqlClient(const char* host, uint port, const char* user, const char* passwd, const char* db): HOST(host), PORT(port), USER(user), PASSWD(passwd), DB(db){ _conn = NULL;};
+            MysqlClient(const char* host, uint port, const char* user, const char* passwd, const char* db, const char* charset = "utf8"): HOST(host), PORT(port), USER(user), PASSWD(passwd), DB(db), CHARSET(charset){ _conn = NULL;};
            ~MysqlClient(){dispose();};
        public:
            bool init()
@ -42,10 +42,17 @@ namespace Limonp
                    return false;
                }  
                if(mysql_set_character_set(_conn, CHARSET))
                {
                    LogError("mysql_set_character_set [%s] failed.", CHARSET);
                    return false;
                }
                //set reconenct
                char value = 1;
                mysql_options(_conn, MYSQL_OPT_RECONNECT, &value);
                LogInfo("MysqlClient {host: %s, port:%d, database:%s, charset:%s}", HOST, PORT, DB, CHARSET);
                return true;
            }
            bool dispose()
@ -71,6 +78,18 @@ namespace Limonp
                }
                return true;
            }
            uint insert(const char* tb_name, const char* keys, const vector<string>& vals)
            {
                uint retn = 0;
                string sql;
                for(uint i = 0; i < vals.size(); i ++)
                {
                    sql.clear();
                    string_format(sql, "insert into %s (%s) values %s", tb_name, keys, vals[i].c_str());
                    retn += executeSql(sql.c_str());
                }
                return retn;
            }
            bool select(const char* sql, RowsType& rows)
            {
                if(!executeSql(sql))
--- a/src/Limonp/cast_functs.hpp
+++ b/src/Limonp/cast_functs.hpp
--- a/src/Limonp/config.hpp
+++ b/src/Limonp/config.hpp
--- a/src/Limonp/io_functs.hpp
+++ b/src/Limonp/io_functs.hpp
--- a/src/Limonp/logger.hpp
+++ b/src/Limonp/logger.hpp
@ -13,13 +13,14 @@
 #include <stdarg.h>
 #include "io_functs.hpp"
 #include "str_functs.hpp"
 #include "typedefs.h"
-#define LogDebug(fmt, ...) Logger::LoggingF(LL_DEBUG, __FILE__, __LINE__, fmt, ## __VA_ARGS__)
+#define FILE_BASENAME strrchr(__FILE__, '/') ? strrchr(__FILE__, '/') + 1 : __FILE__
-#define LogInfo(fmt, ...) Logger::LoggingF(LL_INFO, __FILE__, __LINE__, fmt, ## __VA_ARGS__)
+
-#define LogWarn(fmt, ...) Logger::LoggingF(LL_WARN, __FILE__, __LINE__, fmt, ## __VA_ARGS__)
+#define LogDebug(fmt, ...) Logger::LoggingF(LL_DEBUG, FILE_BASENAME, __LINE__, fmt, ## __VA_ARGS__)
-#define LogError(fmt, ...) Logger::LoggingF(LL_ERROR, __FILE__, __LINE__, fmt, ## __VA_ARGS__)
+#define LogInfo(fmt, ...) Logger::LoggingF(LL_INFO, FILE_BASENAME, __LINE__, fmt, ## __VA_ARGS__)
-#define LogFatal(fmt, ...) Logger::LoggingF(LL_FATAL, __FILE__, __LINE__, fmt, ## __VA_ARGS__)
+#define LogWarn(fmt, ...) Logger::LoggingF(LL_WARN, FILE_BASENAME, __LINE__, fmt, ## __VA_ARGS__)
 #define LogError(fmt, ...) Logger::LoggingF(LL_ERROR, FILE_BASENAME, __LINE__, fmt, ## __VA_ARGS__)
 #define LogFatal(fmt, ...) Logger::LoggingF(LL_FATAL, FILE_BASENAME, __LINE__, fmt, ## __VA_ARGS__)
 namespace Limonp
--- a/src/Limonp/macro_def.hpp
+++ b/src/Limonp/macro_def.hpp
--- a/src/Limonp/map_functs.hpp
+++ b/src/Limonp/map_functs.hpp
@ -0,0 +1,116 @@
 /************************************
 * file enc : ascii
 * author   : wuyanyi09@gmail.com
 ************************************/
 #ifndef LIMONP_MAP_FUNCTS_H
 #define LIMONP_MAP_FUNCTS_H
 #include <map>
 #include <set>
 #include <iostream>
 #include <sstream>
 #include <tr1/unordered_map>
 #define HashMap std::tr1::unordered_map
 namespace Limonp
 {
    using namespace std;
    //template <typename T>
    //    string setToString(const set<T>& st)
    //    {
    //        if(st.empty())
    //        {
    //            return "{}";
    //        }
    //        stringstream ss;
    //        ss<<'{';
    //        typename set<T>::const_iterator it = st.begin();
    //        ss<<*it;
    //        it++;
    //        while(it != st.end())
    //        {
    //            ss<<", "<<*it;
    //            it++;
    //        }
    //        ss<<'}';
    //        return ss.str();
    //    }
    //template<typename T1, typename T2>
    //    string mapToString(const map<T1, T2>& mp)
    //    {
    //        if(mp.empty())
    //        {
    //            return "{}";
    //        }
    //        stringstream ss;
    //        ss<<'{';
    //        typename map<T1, T2>::const_iterator it = mp.begin();
    //        ss<<it->first<<": "<<it->second;
    //        it++;
    //        while(it != mp.end())
    //        {
    //            ss<<", "<<it->first<<": "<<it->second;
    //            it++;
    //        }
    //        ss<<'}';
    //        return ss.str();
    //    }
    //template<typename T1, typename T2>
    //    string HashMapToString(const HashMap<T1, T2>& mp)
    //    {
    //        if(mp.empty())
    //        {
    //            return "{}";
    //        }
    //        stringstream ss;
    //        ss<<'{';
    //        typename HashMap<T1, T2>::const_iterator it = mp.begin();
    //        ss<<it->first<<": "<<it->second;
    //        it++;
    //        while(it != mp.end())
    //        {
    //            ss<<", "<<it->first<<": "<<it->second;
    //            it++;
    //        }
    //        ss<<'}';
    //        return ss.str();
    //    }
    //template<typename T1, typename T2>
    //    string pairToString(const pair<T1, T2>& p)
    //    {
    //        stringstream ss;
    //        ss<<p.first<<":"<<p.second;
    //        return ss.str();
    //    }
    // Look up key in mp. Returns a copy of the mapped value when the key
    // is present and a copy of defaultVal otherwise; mp is never modified.
    template<class kT, class vT>
        vT getMap(const map<kT, vT>& mp, const kT & key, const vT & defaultVal)
        {
            typename map<kT, vT>::const_iterator found = mp.find(key);
            return (found != mp.end()) ? found->second : defaultVal;
        }
    // Append every (key, value) entry of mp to res, in the map's
    // iteration order. Existing elements of res are kept.
    template<class kT, class vT>
        void map2Vec(const map<kT, vT>& mp, vector<pair<kT, vT> > & res)
        {
            typedef typename map<kT, vT>::const_iterator Iter;
            for(Iter cur = mp.begin(); cur != mp.end(); ++cur)
            {
                res.push_back(pair<kT, vT>(cur->first, cur->second));
            }
        }
 }
 #endif
--- a/src/Limonp/std_outbound.hpp
+++ b/src/Limonp/std_outbound.hpp
@ -0,0 +1,101 @@
 #ifndef LIMONP_STD_OUTBOUND_H
 #define LIMONP_STD_OUTBOUND_H
 #include <tr1/unordered_map>
 #include <map>
 #include <set>
 namespace std
 {
    // Stream a vector as ["e0", "e1", ...]: every element is wrapped in
    // double quotes (no escaping is applied) and elements are separated
    // by ", ". An empty vector is written as [].
    template<typename T>
        ostream& operator << (ostream& os, const vector<T>& vec)
        {
            if(vec.empty())
            {
                return os << "[]";
            }
            os<<"[\""<<vec[0];
            // size_t matches the type returned by vector::size(); the
            // previous `uint` index was a narrower, non-standard typedef.
            for(size_t i = 1; i < vec.size(); i++)
            {
                os<<"\", \""<<vec[i];
            }
            os<<"\"]";
            return os;
        }
    // Stream a pair as first:second.
    template<class T1, class T2>
        ostream& operator << (ostream& os, const pair<T1, T2>& pr)
        {
            return os << pr.first << ":" << pr.second;
        }
    // Format obj through a stringstream and assign the text to str.
    // The previous content of str is replaced, not appended to.
    // Returns str.
    template<class T>
        string& operator << (string& str, const T& obj)
        {
            stringstream buffer;
            buffer << obj; // dispatches to the ostream overload for T
            str = buffer.str();
            return str;
        }
    // Stream a map as {k1:v1, k2:v2, ...} in the map's iteration order.
    // Each entry is written through the pair overload of operator<<.
    // An empty map is written as {}.
    template<class T1, class T2>
        ostream& operator << (ostream& os, const map<T1, T2>& mp)
        {
            if(mp.empty())
            {
                return os << "{}";
            }
            typename map<T1, T2>::const_iterator cur = mp.begin();
            os << '{';
            os << *cur;
            for(++cur; cur != mp.end(); ++cur)
            {
                os << ", " << *cur;
            }
            return os << '}';
        }
    // Stream a tr1::unordered_map as {k1:v1, k2:v2, ...}. Entries appear
    // in the container's iteration order and are written through the
    // pair overload of operator<<. An empty map is written as {}.
    template<class T1, class T2>
        ostream& operator << (ostream& os, const std::tr1::unordered_map<T1, T2>& mp)
        {
            if(mp.empty())
            {
                os << "{}";
                return os;
            }
            typedef typename std::tr1::unordered_map<T1, T2>::const_iterator Iter;
            Iter cur = mp.begin();
            os << '{';
            os << *cur;
            for(++cur; cur != mp.end(); ++cur)
            {
                os << ", " << *cur;
            }
            os << '}';
            return os;
        }
    // Stream a set as {e1, e2, ...} in the set's iteration order.
    // An empty set is written as {}.
    template<class T>
        ostream& operator << (ostream& os, const set<T>& st)
        {
            if(st.empty())
            {
                return os << "{}";
            }
            typename set<T>::const_iterator cur = st.begin();
            os << '{';
            os << *cur;
            for(++cur; cur != st.end(); ++cur)
            {
                os << ", " << *cur;
            }
            return os << '}';
        }
 }
 #endif
--- a/src/Limonp/str_functs.hpp
+++ b/src/Limonp/str_functs.hpp
@ -15,9 +15,17 @@
 #include <stdio.h>
 #include <stdarg.h>
 #include <memory.h>
 #include "typedefs.h"
 #include <functional> 
 #include <locale>
 #include <sstream>
 #include <sys/types.h>
 #include <iterator>
 #include <algorithm>
 #include "std_outbound.hpp"
 #include "map_functs.hpp"
 #define print(x) cout<<(x)<<endl
 namespace Limonp
 {
    using namespace std;
@ -42,11 +50,12 @@ namespace Limonp
        }
        return str;
    }
-    
+
    inline void string_format(string& res, const char* fmt, ...)
    {
        int size = 256;
        va_list ap;
        res.clear();
        while (1) {
            res.resize(size);
            va_start(ap, fmt);
@ -63,27 +72,55 @@ namespace Limonp
        }
    }
-    inline bool joinStr(const vector<string>& src, string& dest, const string& connectorStr)
+    //inline bool joinStr(const vector<string>& src, string& dest, const string& connectorStr)
-    {
+    //{
-        if(src.empty())
+    //    if(src.empty())
-        {
+    //    {
-            return false;
+    //        return false;
-        }
+    //    }
-        for(uint i = 0; i < src.size() - 1; i++)
+    //    for(uint i = 0; i < src.size() - 1; i++)
-        {
+    //    {
-            dest += src[i];
+    //        dest += src[i];
-            dest += connectorStr;
+    //        dest += connectorStr;
-        }
+    //    }
-        dest += src[src.size() - 1];
+    //    dest += src[src.size() - 1];
-        return true;
+    //    return true;
-    }
+    //}
-    inline string joinStr(const vector<string>& source, const string& connector)
+    //inline string joinStr(const vector<string>& source, const string& connector)
-    {
+    //{
-        string res;
+    //    string res;
-        joinStr(source, res, connector);
+    //    joinStr(source, res, connector);
-        return res;
+    //    return res;
-    }
+    //}
    // Concatenate the streamed form of every element in [begin, end),
    // placing connector between consecutive elements, and assign the
    // result to res. For an empty range res is left untouched.
    template<class T>
        void join(T begin, T end, string& res, const string& connector)
        {
            if(begin == end)
            {
                return;
            }
            stringstream buffer;
            for(bool first = true; begin != end; begin++)
            {
                if(!first)
                {
                    buffer << connector;
                }
                buffer << *begin;
                first = false;
            }
            res = buffer.str();
        }
    // Convenience overload: returns the joined text, or an empty string
    // for an empty range.
    template<class T>
        string join(T begin, T end, const string& connector)
        {
            string joined;
            join(begin, end, joined, connector);
            return joined;
        }
    inline bool splitStr(const string& src, vector<string>& res, const string& pattern)
    {
@ -104,26 +141,24 @@ namespace Limonp
                return true;
            }
            res.push_back(src.substr(start, end - start));
-			if(end == src.size() - 1)
+            if(end == src.size() - 1)
-			{
+            {
-				res.push_back("");
+                res.push_back("");
-				break;
+                break;
-			}
+            }
            start = end + 1;
        }
        return true;
    }
-    inline string upperStr(const string& strIn)
+    inline string& upper(string& str)
    {
        string str = strIn;
        transform(str.begin(), str.end(), str.begin(), (int (*)(int))toupper);
        return str;
    }
-    inline string lowerStr(const string& strIn)
+    inline string& lower(string& str)
    {
        string str = strIn;
        transform(str.begin(), str.end(), str.begin(), (int (*)(int))tolower);
        return str;
    }
@ -183,40 +218,40 @@ namespace Limonp
        return str.find(ch) != string::npos;
    }
-    inline void extractWords(const string& sentence, vector<string>& words)
+    //inline void extractWords(const string& sentence, vector<string>& words)
-    {
+    //{
-        bool flag = false;
+    //    bool flag = false;
-        uint lhs = 0, len = 0;
+    //    uint lhs = 0, len = 0;
-        for(uint i = 0; i < sentence.size(); i++)
+    //    for(uint i = 0; i < sentence.size(); i++)
-        {
+    //    {
-            char x = sentence[i];
+    //        char x = sentence[i];
-            if((0x0030 <= x && x<= 0x0039) || (0x0041 <= x && x <= 0x005a ) || (0x0061 <= x && x <= 0x007a))
+    //        if((0x0030 <= x && x<= 0x0039) || (0x0041 <= x && x <= 0x005a ) || (0x0061 <= x && x <= 0x007a))
-            {
+    //        {
-                if(flag)
+    //            if(flag)
-                {
+    //            {
-                    len ++;
+    //                len ++;
-                }
+    //            }
-                else
+    //            else
-                {
+    //            {
-                    lhs = i;
+    //                lhs = i;
-                    len = 1;
+    //                len = 1;
-                }
+    //            }
-                flag = true;
+    //            flag = true;
-            }
+    //        }
-            else
+    //        else
-            {
+    //        {
-                if(flag)
+    //            if(flag)
-                {
+    //            {
-                    words.push_back(string(sentence, lhs, len));
+    //                words.push_back(string(sentence, lhs, len));
-                }
+    //            }
-                flag = false;
+    //            flag = false;
-            }
+    //        }
-        }
+    //    }
-        if(flag)
+    //    if(flag)
-        {
+    //    {
-            words.push_back(string(sentence, lhs, len));
+    //        words.push_back(string(sentence, lhs, len));
-        }
+    //    }
-    }
+    //}
 }
--- a/cppjieba/MPSegment.cpp
+++ b/cppjieba/MPSegment.cpp
--- a/cppjieba/MPSegment.h
+++ b/cppjieba/MPSegment.h
@ -7,7 +7,7 @@
 #include <algorithm>
 #include <set>
-#include <logger.hpp>
+#include "Limonp/logger.hpp"
 #include "Trie.h"
 #include "globals.h"
 #include "ISegment.hpp"
--- a/cppjieba/MixSegment.cpp
+++ b/cppjieba/MixSegment.cpp
--- a/cppjieba/MixSegment.h
+++ b/cppjieba/MixSegment.h
@ -3,7 +3,7 @@
 #include "MPSegment.h"
 #include "HMMSegment.h"
-#include <str_functs.hpp>
+#include "Limonp/str_functs.hpp"
 namespace CppJieba
 {
--- a/cppjieba/SegmentBase.hpp
+++ b/cppjieba/SegmentBase.hpp
@ -4,8 +4,8 @@
 #include "globals.h"
 #include "ISegment.hpp"
 #include "ChineseFilter.hpp"
-#include <str_functs.hpp>
+#include "Limonp/str_functs.hpp"
-#include <logger.hpp>
+#include "Limonp/logger.hpp"
 namespace CppJieba
 {
--- a/cppjieba/TransCode.hpp
+++ b/cppjieba/TransCode.hpp
@ -7,8 +7,7 @@
 #include "globals.h"
-#include <str_functs.hpp>
+#include "Limonp/str_functs.hpp"
 #include <vec_functs.hpp>
 namespace CppJieba
 {
--- a/cppjieba/Trie.cpp
+++ b/cppjieba/Trie.cpp
--- a/cppjieba/Trie.h
+++ b/cppjieba/Trie.h
@ -12,8 +12,8 @@
 #include <stdint.h>
 #include <cmath>
 #include <limits>
-#include <str_functs.hpp>
+#include "Limonp/str_functs.hpp"
-#include <logger.hpp>
+#include "Limonp/logger.hpp"
 #include "TransCode.hpp"
 #include "globals.h"
 #include "structs.h"
--- a/cppjieba/globals.h
+++ b/cppjieba/globals.h
--- a/src/segment.cpp
+++ b/src/segment.cpp
@ -0,0 +1,82 @@
 #include <iostream>
 #include <fstream>
 #include "Limonp/ArgvContext.hpp"
 #include "MPSegment.h"
 #include "HMMSegment.h"
 #include "MixSegment.h"
 using namespace CppJieba;
 // Read filePath line by line, run seg->cut() on every non-empty line
 // and print the resulting words to stdout joined by "/".
 void cut(const ISegment * seg, const char * const filePath)
 {
    ifstream input(filePath);
    vector<string> words;
    string text;
    while(getline(input, text))
    {
        if(text.empty())
        {
            continue;
        }
        words.clear();
        seg->cut(text, words);
        cout<<join(words.begin(), words.end(),"/")<<endl;
    }
 }
 // Command-line entry point. Prints usage and fails when no argument is
 // given. Otherwise the segmenter named by --algorithm is initialised
 // (cutHMM -> HMMSegment from --modelpath, cutMix -> MixSegment from
 // --dictpath and --modelpath, anything else -> MPSegment from
 // --dictpath) and applied to the file named by arg[1].
 // Returns EXIT_SUCCESS, or EXIT_FAILURE when usage is printed or the
 // segmenter fails to initialise.
 int main(int argc, char ** argv)
 {
    if(argc < 2)
    {
        cout<<"usage: \n\t"<<argv[0]<<" [options] <filename>\n"
            <<"options:\n"
            <<"\t--algorithm\tSupported methods are [cutDAG, cutHMM, cutMix] for now. \n\t\t\tIf not specified, the default is cutDAG\n"
            <<"\t--dictpath\tsee example\n"
            <<"\t--modelpath\tsee example\n"
            <<"example:\n"
            <<"\t"<<argv[0]<<" testlines.utf8 --dictpath dicts/jieba.dict.utf8\n"
            <<"\t"<<argv[0]<<" testlines.utf8 --modelpath dicts/hmm_model.utf8 --algorithm cutHMM\n"
            <<"\t"<<argv[0]<<" testlines.utf8 --dictpath dicts/jieba.dict.utf8 --modelpath dicts/hmm_model.utf8 --algorithm cutMix\n"
            <<endl;
        return EXIT_FAILURE;
    }
    ArgvContext arg(argc, argv);
    string dictPath = arg["--dictpath"];
    string modelPath = arg["--modelpath"];
    string algorithm = arg["--algorithm"];
    if("cutHMM" == algorithm)
    {
        HMMSegment seg;
        if(!seg.init(modelPath.c_str()))
        {
            cout<<"seg init failed."<<endl;
            return EXIT_FAILURE;
        }
        cut(&seg, arg[1].c_str());
        seg.dispose();
    }
    else if("cutMix" == algorithm)
    {
        MixSegment seg;
        if(!seg.init(dictPath.c_str(), modelPath.c_str()))
        {
            cout<<"seg init failed."<<endl;
            return EXIT_FAILURE;
        }
        cut(&seg, arg[1].c_str());
        seg.dispose();
    }
    else
    {
        // default algorithm (cutDAG)
        MPSegment seg;
        if(!seg.init(dictPath.c_str()))
        {
            cout<<"seg init failed."<<endl;
            // `return false` here would exit with status 0, i.e. success
            return EXIT_FAILURE;
        }
        cut(&seg, arg[1].c_str());
        seg.dispose();
    }
    return EXIT_SUCCESS;
 }
--- a/demo/server.cpp
+++ b/demo/server.cpp
@ -3,12 +3,12 @@
 #include <string>
 #include <ctype.h>
 #include <string.h>
-#include <ArgvContext.hpp>
+#include "Limonp/ArgvContext.hpp"
-#include "../husky/Daemon.h"
+#include "Husky/Daemon.h"
-#include "../husky/ServerFrame.h"
+#include "Husky/ServerFrame.h"
-#include "../cppjieba/MPSegment.h"
+#include "MPSegment.h"
-#include "../cppjieba/HMMSegment.h"
+#include "HMMSegment.h"
-#include "../cppjieba/MixSegment.h"
+#include "MixSegment.h"
 using namespace Husky;
 using namespace CppJieba;
@ -31,7 +31,7 @@ class ServerDemo: public IRequestHandler
            httpReq.GET("key", tmp); 
            URLDecode(tmp, sentence);
            _segment.cut(sentence, words);
-            vecToString(words, strSnd);
+            strSnd << words;
            return true;
        }
    private:
--- a/cppjieba/structs.h
+++ b/cppjieba/structs.h
@ -74,7 +74,7 @@ namespace CppJieba
        KeyWordInfo(const TrieNodeInfo& trieNodeInfo):TrieNodeInfo(trieNodeInfo)
        {
        }
-        inline string toString() const
+        string toString() const
        {
            string tmp;
            TransCode::encode(word, tmp);
@ -89,16 +89,23 @@ namespace CppJieba
            return *this;
        }
    };
-
+    
-    inline string joinWordInfos(const vector<KeyWordInfo>& vec)
+    inline ostream& operator << (ostream& os, const KeyWordInfo& info)
    {
-        vector<string> tmp;
+        string tmp;
-        for(uint i = 0; i < vec.size(); i++)
+        TransCode::encode(info.word, tmp);
-        {
+        return os << "{words:" << tmp << ", weight:" << info.weight << ", idf:" << info.idf << "}";
            tmp.push_back(vec[i].toString());
        }
        return joinStr(tmp, ",");
    }
    //inline string joinWordInfos(const vector<KeyWordInfo>& vec)
    //{
    //    vector<string> tmp;
    //    for(uint i = 0; i < vec.size(); i++)
    //    {
    //        tmp.push_back(vec[i].toString());
    //    }
    //    return joinStr(tmp, ",");
    //}
 }
 #endif
--- a/test/Makefile
+++ b/test/Makefile
@ -1,54 +0,0 @@
 CXX    := g++
 LD     := g++
 AR     := ar rc
 INCS := -I../cppjieba/
 DEBUG_CXXFLAGS     := -g -Wall -DDEBUG -DUT $(INCS)
 CXXFLAGS       := ${DEBUG_CXXFLAGS}
 LDFLAGS      := ${DEBUG_LDFLAGS}
 DOLINK := $(LD) $(LDFLAGS) 
 DOPACK := $(AR)  
 SOURCES := $(wildcard *.cpp)
 OBJS := $(patsubst %.cpp,%.o,$(SOURCES))
 UTS := $(patsubst %.cpp,%.ut,$(SOURCES))
 CPPJIEBADIR = ../cppjieba
 LIBCPPJIEBA = $(CPPJIEBADIR)/libcppjieba.a
 CPPCOMMONDIR = ../cppcommon
 LIBCPPCM = $(CPPCOMMONDIR)/libcm.a
 LIBA := $(LIBCPPJIEBA) $(LIBCPPCM)
 # remove the objs after compilation
 .PHONY: clean $(LIBA)
 # Main Targets
 all: $(UTS)
 # This is a suffix rule 
 #.c.o: 
 %.o: %.cpp
 	$(CXX) -c $(CXXFLAGS) $<
 %.ut: %.o $(LIBA)
 	$(CXX) $(CXXFLAGS) -o $@ $^
 $(LIBCPPJIEBA): 
 	cd $(CPPJIEBADIR) && $(MAKE)
 $(LIBCPPCM): 
 	cd $(CPPCOMMONDIR) && $(MAKE)
 clean:
 	rm -f *.o *.ut *.d *.d.*
 #	cd $(CPPJIEBADIR) && make clean
 #	cd $(CPPCOMMONDIR) && make clean
 sinclude $(SOURCES:.cpp=.d)
 %.d:%.cpp
 	@set -e; rm -f $@; \
 	$(CXX) -MM $< > $@.$$$$; \
 	sed 's,\($*\).o[ :]*,\1.o $@ : ,g' < $@.$$$$ > $@; \
 	rm -f $@.$$$$
--- a/test/segment.cpp
+++ b/test/segment.cpp
@ -0,0 +1,60 @@
 #include <iostream>
 #include <fstream>
 #include <CppJieba/Limonp/ArgvContext.hpp>
 #include <CppJieba/MPSegment.h>
 #include <CppJieba/HMMSegment.h>
 #include <CppJieba/MixSegment.h>
 using namespace CppJieba;
 // Read filePath line by line, run seg->cut() on every non-empty line
 // and print the resulting words to stdout joined by "/".
 void cut(const ISegment * seg, const char * const filePath)
 {
    ifstream input(filePath);
    vector<string> words;
    for(string text; getline(input, text); )
    {
        if(text.empty())
        {
            continue;
        }
        words.clear();
        seg->cut(text, words);
        cout<<join(words.begin(), words.end(),"/")<<endl;
    }
 }
 // Demo entry point: runs HMMSegment, MixSegment and MPSegment in turn
 // over "testlines.utf8", loading the model and dictionary from ../dicts/.
 // Returns EXIT_SUCCESS, or EXIT_FAILURE as soon as one segmenter fails
 // to initialise.
 int main(int argc, char ** argv)
 {
    //demo
    {
        HMMSegment seg;
        if(!seg.init("../dicts/hmm_model.utf8"))
        {
            cout<<"seg init failed."<<endl;
            return EXIT_FAILURE;
        }
        cut(&seg, "testlines.utf8");
        seg.dispose();
    }
    {
        MixSegment seg;
        if(!seg.init("../dicts/jieba.dict.utf8", "../dicts/hmm_model.utf8"))
        {
            cout<<"seg init failed."<<endl;
            return EXIT_FAILURE;
        }
        cut(&seg, "testlines.utf8");
        seg.dispose();
    }
    {
        MPSegment seg;
        if(!seg.init("../dicts/jieba.dict.utf8"))
        {
            cout<<"seg init failed."<<endl;
            // `return false` here would exit with status 0, i.e. success
            return EXIT_FAILURE;
        }
        cut(&seg, "testlines.utf8");
        seg.dispose();
    }
    return EXIT_SUCCESS;
 }
--- a/test/server.cpp
+++ b/test/server.cpp
@ -0,0 +1,58 @@
 #include <CppJieba/Husky/ServerFrame.h>
 #include <CppJieba/Husky/Daemon.h>
 #include <CppJieba/Limonp/ArgvContext.hpp>
 #include <CppJieba/MPSegment.h>
 #include <CppJieba/HMMSegment.h>
 #include <CppJieba/MixSegment.h>
 using namespace Husky;
 using namespace CppJieba;
 const char * const DEFAULT_DICTPATH = "../dicts/jieba.dict.utf8";
 const char * const DEFAULT_MODELPATH = "../dicts/hmm_model.utf8";
 // Request handler that segments the "key" GET parameter with a
 // MixSegment and sends back the resulting word list.
 class ServerDemo: public IRequestHandler
 {
    public:
        ServerDemo()
        {
        }
        virtual ~ServerDemo()
        {
        }
        // Initialise the segmenter from DEFAULT_DICTPATH and DEFAULT_MODELPATH.
        virtual bool init()
        {
            return _segment.init(DEFAULT_DICTPATH, DEFAULT_MODELPATH);
        }
        virtual bool dispose()
        {
            return _segment.dispose();
        }
    public:
        // URL-decode the "key" parameter, cut it into words and write the
        // streamed word vector into strSnd. Always returns true; the
        // result of httpReq.GET() is not checked.
        virtual bool do_GET(const HttpReqInfo& httpReq, string& strSnd)
        {
            string encoded;
            string decoded;
            vector<string> tokens;
            httpReq.GET("key", encoded);
            URLDecode(encoded, decoded);
            _segment.cut(decoded, tokens);
            strSnd << tokens;
            return true;
        }
    private:
        MixSegment _segment;
 };
 // Server entry point. Expects exactly six arguments
 // (-n THREAD_NUMBER -p LISTEN_PORT -k start|stop); prints usage and
 // returns -1 otherwise. "-k start" starts the daemon, any other -k
 // value stops it. The return value is the negated result of
 // Start()/Stop().
 int main(int argc,char* argv[])
 {
    if(7 != argc)
    {
        printf("usage: %s -n THREAD_NUMBER -p LISTEN_PORT -k start|stop\n",argv[0]);
        return -1;
    }
    ArgvContext arg(argc, argv);
    unsigned int port = atoi(arg["-p"].c_str());
    unsigned int threadNum = atoi(arg["-n"].c_str());
    ServerDemo handler;
    Daemon daemon(&handler);
    if(!(arg["-k"] == "start"))
    {
        return !daemon.Stop();
    }
    return !daemon.Start(port, threadNum);
 }
--- a/test/testlines.utf8
+++ b/test/testlines.utf8
		`@ -1 +0,0 @@`
			`sed -i '1i/***********************************\n file enc : utf8\n * author : wuyanyi09@gmail.com\n***********************************/' ../src/.h ../src/.cpp ../src/.tcc`
		`@ -0,0 +1,2 @@`
							`FILE(GLOB HEAD_HPP_LIST "*.hpp")`
							`INSTALL(FILES ${HEAD_HPP_LIST} DESTINATION include/CppJieba/Limonp)`