Searched refs:CJKVTokenizer (Results 1 – 13 of 13) sorted by relevance
/dports/deskutils/pinot/pinot-1.20/IndexSearch/cjkv/ |
H A D | CJKVTokenizer.cc | 159 CJKVTokenizer::TokensHandler(), in VectorTokensHandler() 179 CJKVTokenizer::CJKVTokenizer() : in CJKVTokenizer() function in CJKVTokenizer 186 CJKVTokenizer::~CJKVTokenizer() in ~CJKVTokenizer() 190 string CJKVTokenizer::normalize(const string &str, in normalize() 208 string CJKVTokenizer::strip_marks(const string &str) in strip_marks() 258 void CJKVTokenizer::set_ngram_size(unsigned int ngram_size) in set_ngram_size() 263 unsigned int CJKVTokenizer::get_ngram_size(void) const in get_ngram_size() 283 unsigned int CJKVTokenizer::get_max_text_size(void) const in get_max_text_size() 399 void CJKVTokenizer::split(const string &str, in split() 442 bool CJKVTokenizer::has_cjkv(const string &str) in has_cjkv() [all …]
|
H A D | CJKVTokenizer.h | 37 class DIJON_CJKV_EXPORT CJKVTokenizer 40 CJKVTokenizer(); 41 ~CJKVTokenizer();
|
/dports/deskutils/pinot/pinot-1.20/IndexSearch/ |
H A D | QueryProperties.cpp | 30 class FilterRemover : public Dijon::CJKVTokenizer::TokensHandler 34 Dijon::CJKVTokenizer::TokensHandler(), in FilterRemover() 84 class SetTokensHandler : public Dijon::CJKVTokenizer::TokensHandler 88 Dijon::CJKVTokenizer::TokensHandler(), in SetTokensHandler() 214 Dijon::CJKVTokenizer tokenizer; in removeFilters() 354 Dijon::CJKVTokenizer tokenizer; in getTerms()
|
H A D | WebEngine.cpp | 41 class TermHighlighter : public Dijon::CJKVTokenizer::TokensHandler 46 Dijon::CJKVTokenizer::TokensHandler(), in TermHighlighter() 275 Dijon::CJKVTokenizer tokenizer; in processResult()
|
H A D | Makefile.am | 22 cjkv/CJKVTokenizer.h
|
/dports/deskutils/pinot/pinot-1.20/ |
H A D | ChangeLog-dijon | 66 M /trunk/cjkv/CJKVTokenizer.cc 67 M /trunk/cjkv/CJKVTokenizer.h 139 M /trunk/cjkv/CJKVTokenizer.cc 140 M /trunk/cjkv/CJKVTokenizer.h 320 M /trunk/cjkv/CJKVTokenizer.cc 335 M /trunk/cjkv/CJKVTokenizer.cc 342 M /trunk/cjkv/CJKVTokenizer.cc 449 M /trunk/cjkv/CJKVTokenizer.h 526 M /trunk/cjkv/CJKVTokenizer.h 585 M /trunk/cjkv/CJKVTokenizer.h [all …]
|
H A D | TODO | 25 - HtmlParser should use CJKVTokenizer's Unicode conversion function
|
H A D | ChangeLog-svn | 401 Install cjkv/CJKVTokenizer.h. 491 M /trunk/IndexSearch/cjkv/CJKVTokenizer.cc 553 M /trunk/IndexSearch/cjkv/CJKVTokenizer.cc 554 M /trunk/IndexSearch/cjkv/CJKVTokenizer.h 611 M /trunk/IndexSearch/cjkv/CJKVTokenizer.cc 839 M /trunk/IndexSearch/cjkv/CJKVTokenizer.cc 840 M /trunk/IndexSearch/cjkv/CJKVTokenizer.h 1444 A /trunk/IndexSearch/cjkv/CJKVTokenizer.cc 1445 A /trunk/IndexSearch/cjkv/CJKVTokenizer.h 2533 CJKVTokenizer, this should preserve dots, eg dots in acronyms and version [all …]
|
/dports/deskutils/pinot/pinot-1.20/IndexSearch/Xapian/ |
H A D | XapianEngine.cpp | 201 CJKVTokenizer tokenizer; in operator ()() 366 class QueryModifier : public Dijon::CJKVTokenizer::TokensHandler 448 string unaccentedTok(Dijon::CJKVTokenizer::strip_marks(tok)); in handle_token() 613 CJKVTokenizer tokenizer; in parseQuery()
|
H A D | XapianIndex.h | 153 void addPostingsToDocument(Dijon::CJKVTokenizer &tokenizer, Xapian::Stem *pStemmer,
|
H A D | XapianIndex.cpp | 63 class TokensIndexer : public Dijon::CJKVTokenizer::TokensHandler 70 Dijon::CJKVTokenizer::TokensHandler(), in TokensIndexer() 155 string unaccentedTerm(Dijon::CJKVTokenizer::strip_marks(term)); in handle_token() 382 Dijon::CJKVTokenizer tokenizer; in addPostingsToDocument() 447 void XapianIndex::addPostingsToDocument(Dijon::CJKVTokenizer &tokenizer, Xapian::Stem *pStemmer, in addPostingsToDocument() 1687 Dijon::CJKVTokenizer tokenizer; in getCloseTerms()
|
H A D | AbstractGenerator.cpp | 71 CJKVTokenizer tokenizer; in generateAbstract()
|
/dports/deskutils/pinot/pinot-1.20/Tokenize/ |
H A D | Makefile.am | 111 $(top_srcdir)/IndexSearch/cjkv/CJKVTokenizer.cc
|