35 void CDelimiterTokenizer::init()
52 return "DelimiterTokenizer";
static void fill_vector(T *vec, int32_t len, T value)
virtual void set_text(SGVector< char > txt)
bool get_skip_delimiters() const
virtual index_t next_token_idx(index_t &start)
void set_skip_delimiters(bool skip_delimiters)
CDelimiterTokenizer * get_copy()
virtual const char * get_name() const
CDelimiterTokenizer(bool skip_delimiters=false)
All classes and functions are contained in the shogun namespace.
The class CDelimiterTokenizer is used to tokenize an SGVector into tokens using custom chars as ...
SGVector< bool > delimiters
void init_for_whitespace()
virtual void set_text(SGVector< char > txt)
bool skip_consecutive_delimiters