33 void CNGramTokenizer::init()
35 SG_ADD(&
n,
"n",
"Size of n-grams",
49 return "NGramTokenizer";
The class CNGramTokenizer is used to tokenize an SGVector into n-grams.
virtual const char * get_name() const
virtual void set_text(SGVector< char > txt)
The class CTokenizer acts as a base class in order to implement tokenizers. Sub-classes must implemen...
virtual void set_text(SGVector< char > txt)
All classes and functions are contained in the shogun namespace.
virtual index_t next_token_idx(index_t &start)
CNGramTokenizer(int32_t ns=3)
virtual CNGramTokenizer * get_copy()