mirror of
https://github.com/yanyiwu/cppjieba.git
synced 2025-07-18 00:00:12 +08:00
add TMixSegment.cpp for testing
This commit is contained in:
parent
2e2036bb73
commit
9f35b82dd1
@ -26,14 +26,14 @@ namespace CppJieba
|
||||
virtual bool cut(Unicode::const_iterator begin, Unicode::const_iterator end, vector<string>& res)const = 0;
|
||||
virtual bool cut(const string& str, vector<string>& res)const
|
||||
{
|
||||
if(!_getInitFlag())
|
||||
{
|
||||
LogError("not inited.");
|
||||
return false;
|
||||
}
|
||||
assert(_getInitFlag());
|
||||
//if(!_getInitFlag())
|
||||
//{
|
||||
// LogError("not inited.");
|
||||
// return false;
|
||||
//}
|
||||
Unicode unico;
|
||||
#ifdef NO_FILTER
|
||||
unico.clear();
|
||||
if(!TransCode::decode(str, unico))
|
||||
{
|
||||
LogFatal("str[%s] decode failed.", str.c_str());
|
||||
|
@ -6,10 +6,16 @@ using namespace CppJieba;
|
||||
TEST(MixSegmentTest, Test1)
|
||||
{
|
||||
MixSegment segment("../dicts/jieba.dict.utf8", "../dicts/hmm_model.utf8");;
|
||||
const char* str = "我来自北京邮电大学。。。学号 123456";
|
||||
const char* res[] = {"我", "来自", "北京邮电大学", "。","。","。","。","学号", " 123456"};
|
||||
string s;
|
||||
vector<string> buf(res, res + sizeof(res)/sizeof(res[0]));
|
||||
const char* str = "我来自北京邮电大学。。。 学号 123456";
|
||||
const char* res[] = {"我", "来自", "北京邮电大学", "。","。","。"," ","学号", " 123456"};
|
||||
//string s;
|
||||
//vector<string> buf(res, res + sizeof(res)/sizeof(res[0]));
|
||||
vector<string> words;
|
||||
ASSERT_EQ(segment.init(), true);
|
||||
ASSERT_EQ(segment.cut(str, words), true);
|
||||
EXPECT_EQ(words, vector<string>(res, res + sizeof(res)/sizeof(res[0])));
|
||||
//print(words);
|
||||
|
||||
//for(uint i = 0; i < sizeof(res)/sizeof(res[0]); i++)
|
||||
//{
|
||||
// buf.push_back()
|
||||
|
Loading…
x
Reference in New Issue
Block a user