10 #ifndef _STREAMING_HASHEDDOCDOTFEATURES__H__
11 #define _STREAMING_HASHEDDOCDOTFEATURES__H__
24 class CStreamingDotFeatures;
26 class CHashedDocConverter;
107 int32_t vec2_len,
bool abs_val=
false);
123 virtual const char*
get_name()
const;
239 int32_t bits,
bool normalize, int32_t n_grams, int32_t skips);
263 #endif // _STREAMING_HASHEDDOCDOTFEATURES__H__
virtual int32_t get_num_vectors() const
This class implements streaming features for a document collection. Like in the standard Bag-of-Words...
virtual void release_example()
virtual int32_t get_dim_feature_space() const
virtual const char * get_name() const
virtual float64_t get_label()
virtual CFeatures * duplicate() const
virtual bool get_next_example()
EFeatureClass
shogun feature class
A Streaming File access class.
virtual EFeatureType get_feature_type() const
virtual void add_to_dense_vec(float32_t alpha, float32_t *vec2, int32_t vec2_len, bool abs_val=false)
This class can be used to convert a document collection contained in a CStringFeatures object w...
virtual EFeatureClass get_feature_class() const
virtual void set_vector_reader()
SGSparseVector< float64_t > get_vector()
virtual float32_t dense_dot(const float32_t *vec2, int32_t vec2_len)
virtual void set_vector_and_label_reader()
The class CTokenizer acts as a base class in order to implement tokenizers. Sub-classes must implemen...
SGSparseVector< float64_t > current_vector
virtual void start_parser()
virtual int32_t get_num_features()
CHashedDocConverter * converter
Streaming features that support dot products among other operations.
EFeatureType
shogun feature type
virtual ~CStreamingHashedDocDotFeatures()
All classes and functions are contained in the shogun namespace.
The class Features is the base class of all feature objects.
void set_normalization(bool normalize)
CStreamingHashedDocDotFeatures()
void set_k_skip_n_grams(int32_t k, int32_t n)
CInputParser< char > parser
virtual void end_parser()
virtual float32_t dot(CStreamingDotFeatures *df)