SHOGUN
4.1.0
|
This class implements streaming features with sparse feature vectors. The vector is represented as an SGSparseVector<T>. Each entry is of type SGSparseVectorEntry<T> with members `feat_index' and `entry'.
This class expects the input from the StreamingFile object to be zero-based, i.e., a feature entered as 1:6.5 would have feat_index=0 and entry=6.5.
The current example is stored as a combination of current_vector and current_label. current_num_features stores the highest dimensionality of examples encountered up to the point of the function call. For example, if the first example is '1:6.5 7:10.0', then current_num_features would be 7 after the first function call.
Since the dimensionality of the feature space is not known initially, current_num_features may increase as more examples are processed and larger dimensions are seen. For this purpose, `expand_if_required()' is provided, which, when called with a dynamically allocated float or double array and its length, reallocates that array to the new dimensionality (if necessary), setting the newer dimensions to zero, and updates the length parameter to equal the new length of the array.
Definition at line 48 of file StreamingSparseFeatures.h.
Public Member Functions | |
CStreamingSparseFeatures () | |
CStreamingSparseFeatures (CStreamingFile *file, bool is_labelled, int32_t size) | |
virtual | ~CStreamingSparseFeatures () |
virtual void | set_vector_reader () |
virtual void | set_vector_and_label_reader () |
virtual void | start_parser () |
virtual void | end_parser () |
virtual bool | get_next_example () |
T | get_feature (int32_t index) |
SGSparseVector< T > | get_vector () |
virtual float64_t | get_label () |
virtual void | release_example () |
virtual void | reset_stream () |
int32_t | set_num_features (int32_t num) |
virtual int32_t | get_dim_feature_space () const |
virtual float32_t | dot (CStreamingDotFeatures *df) |
T | dense_dot (T alpha, T *vec, int32_t dim, T b) |
virtual float64_t | dense_dot (const float64_t *vec2, int32_t vec2_len) |
virtual float32_t | dense_dot (const float32_t *vec2, int32_t vec2_len) |
virtual void | add_to_dense_vec (float64_t alpha, float64_t *vec2, int32_t vec2_len, bool abs_val=false) |
virtual void | add_to_dense_vec (float32_t alpha, float32_t *vec2, int32_t vec2_len, bool abs_val=false) |
int64_t | get_num_nonzero_entries () |
float32_t | compute_squared () |
void | sort_features () |
virtual int32_t | get_num_features () |
virtual int32_t | get_nnz_features_for_vector () |
virtual EFeatureType | get_feature_type () const |
virtual EFeatureClass | get_feature_class () const |
virtual CFeatures * | duplicate () const |
virtual const char * | get_name () const |
virtual int32_t | get_num_vectors () const |
virtual void | dense_dot_range (float32_t *output, float32_t *alphas, float32_t *vec, int32_t dim, float32_t b, int32_t num_vec=0) |
virtual void | expand_if_required (float32_t *&vec, int32_t &len) |
virtual void | expand_if_required (float64_t *&vec, int32_t &len) |
virtual void * | get_feature_iterator () |
virtual bool | get_next_feature (int32_t &index, float32_t &value, void *iterator) |
virtual void | free_feature_iterator (void *iterator) |
void | set_read_functions () |
virtual bool | get_has_labels () |
virtual bool | is_seekable () |
virtual CFeatures * | get_streamed_features (index_t num_elements) |
virtual void | add_preprocessor (CPreprocessor *p) |
virtual void | del_preprocessor (int32_t num) |
CPreprocessor * | get_preprocessor (int32_t num) const |
void | set_preprocessed (int32_t num) |
bool | is_preprocessed (int32_t num) const |
int32_t | get_num_preprocessed () const |
int32_t | get_num_preprocessors () const |
void | clean_preprocessors () |
void | list_preprocessors () |
int32_t | get_cache_size () const |
virtual bool | reshape (int32_t num_features, int32_t num_vectors) |
void | list_feature_obj () const |
virtual void | load (CFile *loader) |
virtual void | save (CFile *writer) |
bool | check_feature_compatibility (CFeatures *f) const |
bool | has_property (EFeatureProperty p) const |
void | set_property (EFeatureProperty p) |
void | unset_property (EFeatureProperty p) |
virtual CFeatures * | create_merged_copy (CList *others) |
virtual CFeatures * | create_merged_copy (CFeatures *other) |
virtual void | add_subset (SGVector< index_t > subset) |
virtual void | add_subset_in_place (SGVector< index_t > subset) |
virtual void | remove_subset () |
virtual void | remove_all_subsets () |
virtual CSubsetStack * | get_subset_stack () |
virtual void | subset_changed_post () |
virtual CFeatures * | copy_subset (SGVector< index_t > indices) |
virtual CFeatures * | copy_dimension_subset (SGVector< index_t > dims) |
virtual bool | support_compatible_class () const |
virtual bool | get_feature_class_compatibility (EFeatureClass rhs) const |
virtual CSGObject * | shallow_copy () const |
virtual CSGObject * | deep_copy () const |
virtual bool | is_generic (EPrimitiveType *generic) const |
template<class T > | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
template<> | |
void | set_generic () |
void | unset_generic () |
virtual void | print_serializable (const char *prefix="") |
virtual bool | save_serializable (CSerializableFile *file, const char *prefix="") |
virtual bool | load_serializable (CSerializableFile *file, const char *prefix="") |
void | set_global_io (SGIO *io) |
SGIO * | get_global_io () |
void | set_global_parallel (Parallel *parallel) |
Parallel * | get_global_parallel () |
void | set_global_version (Version *version) |
Version * | get_global_version () |
SGStringList< char > | get_modelsel_names () |
void | print_modsel_params () |
char * | get_modsel_param_descr (const char *param_name) |
index_t | get_modsel_param_index (const char *param_name) |
void | build_gradient_parameter_dictionary (CMap< TParameter *, CSGObject * > *dict) |
virtual void | update_parameter_hash () |
virtual bool | parameter_hash_changed () |
virtual bool | equals (CSGObject *other, float64_t accuracy=0.0, bool tolerant=false) |
virtual CSGObject * | clone () |
Static Public Member Functions | |
static T | sparse_dot (T alpha, SGSparseVectorEntry< T > *avec, int32_t alen, SGSparseVectorEntry< T > *bvec, int32_t blen) |
Public Attributes | |
SGIO * | io |
Parallel * | parallel |
Version * | version |
Parameter * | m_parameters |
Parameter * | m_model_selection_parameters |
Parameter * | m_gradient_parameters |
uint32_t | m_hash |
Protected Member Functions | |
virtual void | load_serializable_pre () throw (ShogunException) |
virtual void | load_serializable_post () throw (ShogunException) |
virtual void | save_serializable_pre () throw (ShogunException) |
virtual void | save_serializable_post () throw (ShogunException) |
Protected Attributes | |
CInputParser < SGSparseVectorEntry< T > > | parser |
The parser object, which reads from input and returns parsed example objects. More... | |
SGSparseVector< T > | current_sgvector |
The current example's feature vector as an SGSparseVector<T> More... | |
index_t | current_vec_index |
The current vector index. More... | |
float64_t | current_label |
The current example's label. More... | |
int32_t | current_num_features |
Number of features in current vector (as seen so far up to the current vector) More... | |
bool | has_labels |
Whether examples are labelled or not. More... | |
CStreamingFile * | working_file |
The StreamingFile object to read from. More... | |
bool | seekable |
Whether the stream is seekable. More... | |
CSubsetStack * | m_subset_stack |
Default constructor.
Sets the reading functions to be CStreamingFile::get_*_vector and get_*_vector_and_label depending on the type T.
Definition at line 19 of file StreamingSparseFeatures.cpp.
CStreamingSparseFeatures | ( | CStreamingFile * | file, |
bool | is_labelled, | ||
int32_t | size | ||
) |
Constructor taking args. Initializes the parser with the given args.
file | StreamingFile object, input file. |
is_labelled | Whether examples are labelled or not. |
size | Number of example objects to be stored in the parser at a time. |
Definition at line 26 of file StreamingSparseFeatures.cpp.
|
virtual |
Destructor.
Ends the parsing thread. (Waits for pthread_join to complete)
Definition at line 36 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
Adds a subset of indices on top of the current subsets (possibly subset of subset). Every call causes a new active index vector to be stored. Added subsets can be removed one-by-one. If this is not needed, add_subset_in_place() should be used (does not store intermediate index vectors)
Calls subset_changed_post() afterwards
subset | subset of indices to add |
Reimplemented in CCombinedFeatures.
Definition at line 310 of file Features.cpp.
Sets/changes latest added subset. This allows to add multiple subsets with in-place memory requirements. They cannot be removed one-by-one afterwards, only the latest active can. If this is needed, use add_subset(). If no subset is active, this just adds.
Calls subset_changed_post() afterwards
subset | subset of indices to replace the latest one with. |
Definition at line 316 of file Features.cpp.
|
virtual |
Add alpha*current_vector to another float64_t type dense vector. Takes the absolute value of current_vector if specified.
alpha | alpha |
vec2 | vector to add to, float64_t* |
vec2_len | length of vector |
abs_val | true if abs of current_vector should be taken |
Definition at line 133 of file StreamingSparseFeatures.cpp.
|
virtual |
Add alpha*current_vector to another dense vector. Takes the absolute value of current_vector if specified.
alpha | alpha |
vec2 | vector to add to |
vec2_len | length of vector |
abs_val | true if abs of current_vector should be taken |
Implements CStreamingDotFeatures.
Definition at line 161 of file StreamingSparseFeatures.cpp.
|
inherited |
Builds a dictionary of all parameters in SGObject as well as those of SGObjects that are parameters of this object. Dictionary maps parameters to the objects that own them.
dict | dictionary of parameters to be built. |
Definition at line 597 of file SGObject.cpp.
|
inherited |
check feature compatibility
f | features to check for compatibility |
Definition at line 283 of file Features.cpp.
|
inherited |
clears all preprocs
Definition at line 116 of file Features.cpp.
|
virtualinherited |
Creates a clone of the current object. This is done via recursively traversing all parameters, which corresponds to a deep copy. Calling equals on the cloned object always returns true although none of the memory of both objects overlaps.
Definition at line 714 of file SGObject.cpp.
float32_t compute_squared | ( | ) |
Compute sum of squares of features on current vector.
Definition at line 195 of file StreamingSparseFeatures.cpp.
Creates a new CFeatures instance containing only the dimensions of the feature vector which are specified by the provided indices.
This method is needed for feature selection tasks. NOT IMPLEMENTED!
dims | indices of feature dimensions to copy |
Reimplemented in CDenseFeatures< ST >, CDenseFeatures< uint32_t >, CDenseFeatures< float64_t >, CDenseFeatures< T >, and CDenseFeatures< uint16_t >.
Definition at line 348 of file Features.cpp.
Creates a new CFeatures instance containing copies of the elements which are specified by the provided indices.
This method is needed for a KernelMachine to store its model data. NOT IMPLEMENTED!
indices | indices of feature elements to copy |
Reimplemented in CStringFeatures< ST >, CStringFeatures< T >, CStringFeatures< uint8_t >, CStringFeatures< char >, CStringFeatures< uint16_t >, CSparseFeatures< ST >, CSparseFeatures< float64_t >, CSparseFeatures< T >, CDenseFeatures< ST >, CDenseFeatures< uint32_t >, CDenseFeatures< float64_t >, CDenseFeatures< T >, CDenseFeatures< uint16_t >, and CCombinedFeatures.
Definition at line 340 of file Features.cpp.
Takes a list of feature instances and returns a new instance being a concatenation of a copy of this instance's data and the given instances' data. Note that the feature types have to be equal.
NOT IMPLEMENTED!
others | list of feature objects to append |
Reimplemented in CDenseFeatures< ST >, CDenseFeatures< uint32_t >, CDenseFeatures< float64_t >, CDenseFeatures< T >, and CDenseFeatures< uint16_t >.
Definition at line 235 of file Features.h.
Convenience method for method with same name and list as parameter.
NOT IMPLEMENTED!
other | feature object to append |
Reimplemented in CDenseFeatures< ST >, CDenseFeatures< uint32_t >, CDenseFeatures< float64_t >, CDenseFeatures< T >, CDenseFeatures< uint16_t >, and CCombinedFeatures.
Definition at line 249 of file Features.h.
|
virtualinherited |
A deep copy. All the instance variables will also be copied.
Definition at line 198 of file SGObject.cpp.
|
virtualinherited |
delete preprocessor from list
num | index of preprocessor in list |
Definition at line 122 of file Features.cpp.
T dense_dot | ( | T | alpha, |
T * | vec, | ||
int32_t | dim, | ||
T | b | ||
) |
Compute the dot product between dense weights and a sparse feature vector: alpha * sparse^T * w + b
alpha | scalar to multiply with |
vec | dense vector to compute dot product with |
dim | length of the dense vector |
b | bias |
Definition at line 82 of file StreamingSparseFeatures.cpp.
Dot product with another float64_t type dense vector.
vec2 | The dense vector with which to take the dot product. |
vec2_len | length of vector |
Definition at line 91 of file StreamingSparseFeatures.cpp.
Dot product with another dense vector.
vec2 | The dense vector with which to take the dot product. |
vec2_len | length of vector |
Implements CStreamingDotFeatures.
Definition at line 112 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
Compute the dot product for all vectors. This function makes use of dense_dot: alphas[i] * sparse[i]^T * w + b
output | result for the given vector range |
alphas | scalars to multiply with, may be NULL |
vec | dense vector to compute dot product with |
dim | length of the dense vector |
b | bias |
num_vec | number of vectors to operate on (indices 0 to num_vec-1) |
If num_vec == 0 or left to its default value, the function attempts to return dot product for all vectors. However, the given output vector must be preallocated!
note that the result will be written to output[0...(num_vec-1)] except when num_vec = 0
Definition at line 30 of file StreamingDotFeatures.cpp.
|
virtual |
Dot product taken with another StreamingDotFeatures object.
Currently only works if it is a CStreamingSparseFeatures object. It takes the dot product of the current_vectors of both objects.
df | CStreamingDotFeatures object. |
Implements CStreamingDotFeatures.
Definition at line 357 of file StreamingSparseFeatures.cpp.
|
virtual |
Duplicate the object.
Implements CFeatures.
Definition at line 223 of file StreamingSparseFeatures.cpp.
|
virtual |
Ends the parsing thread.
Waits for the thread to join.
Implements CStreamingFeatures.
Definition at line 300 of file StreamingSparseFeatures.cpp.
Recursively compares the current SGObject to another one. Compares all registered numerical parameters, recursion upon complex (SGObject) parameters. Does not compare pointers!
May be overwritten but please do with care! Should not be necessary in most cases.
other | object to compare with |
accuracy | accuracy to use for comparison (optional) |
tolerant | allows lenient check on float equality (within accuracy) |
Definition at line 618 of file SGObject.cpp.
|
virtualinherited |
Expand the vector passed so that its length is equal to the dimensionality of the features. The previous values are kept intact through realloc, and the new ones are set to zero.
vec | float32_t* vector |
len | length of the vector |
Reimplemented in CStreamingVwFeatures.
Definition at line 53 of file StreamingDotFeatures.cpp.
|
virtualinherited |
Expand the vector passed so that its length is equal to the dimensionality of the features. The previous values are kept intact through realloc, and the new ones are set to zero.
vec | float64_t* vector |
len | length of the vector |
Reimplemented in CStreamingVwFeatures.
Definition at line 64 of file StreamingDotFeatures.cpp.
|
virtualinherited |
Clean up the iterator. Call this function with the iterator returned by get_feature_iterator.
iterator | as returned by get_feature_iterator |
Definition at line 93 of file StreamingDotFeatures.cpp.
|
inherited |
|
virtual |
obtain the dimensionality of the feature space
(do not mix this up with the dimensionality of the input space, usually obtained via get_num_features())
Implements CStreamingDotFeatures.
Definition at line 351 of file StreamingSparseFeatures.cpp.
T get_feature | ( | int32_t | index | ) |
get a single feature
index | index of feature in this vector |
Definition at line 43 of file StreamingSparseFeatures.cpp.
|
virtual |
Return the feature class
Implements CFeatures.
Definition at line 376 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
Given a class in right hand side, does this class support compatible computation?
for example, is this->dot(rhs_prt) valid, where rhs_prt is the class in right hand side
rhs | the class in right hand side |
Reimplemented in CDenseSubSamplesFeatures< ST >.
Definition at line 355 of file Features.cpp.
|
virtualinherited |
iterate over the non-zero features
call get_feature_iterator first, followed by get_next_feature and free_feature_iterator to cleanup
Definition at line 75 of file StreamingDotFeatures.cpp.
|
virtual |
|
inherited |
|
inherited |
|
inherited |
|
virtualinherited |
Return whether the examples are labelled or not.
Definition at line 35 of file StreamingFeatures.cpp.
|
virtual |
Return the label of the current example as a float.
Examples must be labelled, otherwise an error occurs.
Implements CStreamingFeatures.
Definition at line 337 of file StreamingSparseFeatures.cpp.
|
inherited |
Definition at line 498 of file SGObject.cpp.
|
inherited |
Returns description of a given parameter string, if it exists. SG_ERROR otherwise
param_name | name of the parameter |
Definition at line 522 of file SGObject.cpp.
|
inherited |
Returns index of model selection parameter with provided name
param_name | name of model selection parameter |
Definition at line 535 of file SGObject.cpp.
|
virtual |
Return the name.
Implements CSGObject.
Definition at line 324 of file StreamingSparseFeatures.h.
|
virtual |
Instructs the parser to return the next example.
This example is stored as the current_example in this object.
Implements CStreamingFeatures.
Definition at line 306 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
iterate over the non-zero features
Call this function with the iterator returned by get_feature_iterator, and call free_feature_iterator to clean up.
index | is returned by reference (-1 when not available) |
value | is returned by reference |
iterator | as returned by get_feature_iterator |
Definition at line 87 of file StreamingDotFeatures.cpp.
|
virtual |
Return the number of non-zero features in vector
Reimplemented from CStreamingDotFeatures.
Definition at line 370 of file StreamingSparseFeatures.cpp.
|
virtual |
Return the number of features in the current example.
Implements CStreamingFeatures.
Definition at line 364 of file StreamingSparseFeatures.cpp.
int64_t get_num_nonzero_entries | ( | ) |
Get number of non-zero entries in current sparse vector
Definition at line 189 of file StreamingSparseFeatures.cpp.
|
inherited |
get the number of applied preprocs
Definition at line 103 of file Features.cpp.
|
inherited |
get number of preprocessors
Definition at line 155 of file Features.cpp.
|
virtual |
Return the number of vectors stored in this object.
Implements CFeatures.
Definition at line 229 of file StreamingSparseFeatures.cpp.
|
inherited |
get specified preprocessor
num | index of preprocessor in list |
Definition at line 93 of file Features.cpp.
Returns a new CFeatures instance which contains num_elements elements from the underlying stream. Not SG_REF'ed
num_elements | num elements to save from stream |
NOT IMPLEMENTED!
Reimplemented in CStreamingDenseFeatures< T >, CStreamingDenseFeatures< float64_t >, and CStreamingDenseFeatures< float32_t >.
Definition at line 191 of file StreamingFeatures.h.
|
virtualinherited |
SGSparseVector< T > get_vector | ( | ) |
Return the current feature vector as an SGSparseVector<T>.
Definition at line 331 of file StreamingSparseFeatures.cpp.
|
inherited |
check if features have given property
p | feature property |
Definition at line 295 of file Features.cpp.
|
virtualinherited |
If the SGSerializable is a class template then TRUE will be returned and GENERIC is set to the type of the generic.
generic | set to the type of the generic if returning TRUE |
Definition at line 296 of file SGObject.cpp.
|
inherited |
get whether specified preprocessor was already applied
num | index of preprocessor in list |
Definition at line 149 of file Features.cpp.
|
virtualinherited |
Whether the stream is seekable (to check if multiple epochs are possible), i.e., whether we can process examples in a batch fashion.
A stream is usually seekable when it comes from a file or when it comes from another conventional CFeatures object.
Definition at line 40 of file StreamingFeatures.cpp.
|
inherited |
list feature object
Definition at line 171 of file Features.cpp.
|
inherited |
print preprocessors
Definition at line 131 of file Features.cpp.
|
virtualinherited |
load features from file
loader | File object via which data shall be loaded |
Reimplemented in CDenseFeatures< ST >, CDenseFeatures< uint32_t >, CDenseFeatures< float64_t >, CDenseFeatures< T >, CDenseFeatures< uint16_t >, CSparseFeatures< ST >, CSparseFeatures< float64_t >, CSparseFeatures< T >, CStringFeatures< ST >, CStringFeatures< T >, CStringFeatures< uint8_t >, CStringFeatures< char >, and CStringFeatures< uint16_t >.
Definition at line 269 of file Features.cpp.
|
virtualinherited |
Load this object from file. If it fails (returning FALSE), then this object will contain inconsistent data and should not be used!
file | where to load from |
prefix | prefix for members |
Definition at line 369 of file SGObject.cpp.
|
protectedvirtualinherited |
Can (optionally) be overridden to post-initialize some member variables which are not PARAMETER::ADD'ed. Make sure that at first the overridden method BASE_CLASS::LOAD_SERIALIZABLE_POST is called.
ShogunException | will be thrown if an error occurs. |
Reimplemented in CKernel, CWeightedDegreePositionStringKernel, CList, CAlphabet, CLinearHMM, CGaussianKernel, CInverseMultiQuadricKernel, CCircularKernel, and CExponentialKernel.
Definition at line 426 of file SGObject.cpp.
|
protectedvirtualinherited |
Can (optionally) be overridden to pre-initialize some member variables which are not PARAMETER::ADD'ed. Make sure that at first the overridden method BASE_CLASS::LOAD_SERIALIZABLE_PRE is called.
ShogunException | will be thrown if an error occurs. |
Reimplemented in CDynamicArray< T >, CDynamicArray< float64_t >, CDynamicArray< float32_t >, CDynamicArray< int32_t >, CDynamicArray< char >, CDynamicArray< bool >, and CDynamicObjectArray.
Definition at line 421 of file SGObject.cpp.
|
virtualinherited |
Definition at line 262 of file SGObject.cpp.
|
inherited |
prints all parameter registered for model selection and their type
Definition at line 474 of file SGObject.cpp.
|
virtualinherited |
prints registered parameters out
prefix | prefix for members |
Definition at line 308 of file SGObject.cpp.
|
virtual |
Release the current example, indicating to the parser that it has been processed by the learning algorithm.
The parser is then free to throw away that example.
Implements CStreamingFeatures.
Definition at line 345 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
Removes all subsets. Calls subset_changed_post() afterwards.
Reimplemented in CCombinedFeatures.
Definition at line 328 of file Features.cpp.
|
virtualinherited |
Removes the last added subset from the subset stack, if existing. Calls subset_changed_post() afterwards.
Reimplemented in CCombinedFeatures.
Definition at line 322 of file Features.cpp.
|
virtual |
Reset the file back to the first example if possible.
Reimplemented from CStreamingFeatures.
Definition at line 50 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
in case there is a feature matrix allow for reshaping
NOT IMPLEMENTED!
num_features | new number of features |
num_vectors | new number of vectors |
Reimplemented in CDenseFeatures< ST >, CDenseFeatures< uint32_t >, CDenseFeatures< float64_t >, CDenseFeatures< T >, and CDenseFeatures< uint16_t >.
Definition at line 165 of file Features.cpp.
|
virtualinherited |
save features to file
writer | File object via which data shall be saved |
Reimplemented in CStringFeatures< ST >, CStringFeatures< T >, CStringFeatures< uint8_t >, CStringFeatures< char >, CStringFeatures< uint16_t >, CDenseFeatures< ST >, CDenseFeatures< uint32_t >, CDenseFeatures< float64_t >, CDenseFeatures< T >, CDenseFeatures< uint16_t >, CSparseFeatures< ST >, CSparseFeatures< float64_t >, and CSparseFeatures< T >.
Definition at line 276 of file Features.cpp.
|
virtualinherited |
Save this object to file.
file | where to save the object; will be closed during returning if PREFIX is an empty string. |
prefix | prefix for members |
Definition at line 314 of file SGObject.cpp.
|
protectedvirtualinherited |
Can (optionally) be overridden to post-initialize some member variables which are not PARAMETER::ADD'ed. Make sure that at first the overridden method BASE_CLASS::SAVE_SERIALIZABLE_POST is called.
ShogunException | will be thrown if an error occurs. |
Reimplemented in CKernel.
Definition at line 436 of file SGObject.cpp.
|
protectedvirtualinherited |
Can (optionally) be overridden to pre-initialize some member variables which are not PARAMETER::ADD'ed. Make sure that at first the overridden method BASE_CLASS::SAVE_SERIALIZABLE_PRE is called.
ShogunException | will be thrown if an error occurs. |
Reimplemented in CKernel, CDynamicArray< T >, CDynamicArray< float64_t >, CDynamicArray< float32_t >, CDynamicArray< int32_t >, CDynamicArray< char >, CDynamicArray< bool >, and CDynamicObjectArray.
Definition at line 431 of file SGObject.cpp.
|
inherited |
Definition at line 41 of file SGObject.cpp.
|
inherited |
Definition at line 46 of file SGObject.cpp.
|
inherited |
Definition at line 51 of file SGObject.cpp.
|
inherited |
Definition at line 56 of file SGObject.cpp.
|
inherited |
Definition at line 61 of file SGObject.cpp.
|
inherited |
Definition at line 66 of file SGObject.cpp.
|
inherited |
Definition at line 71 of file SGObject.cpp.
|
inherited |
Definition at line 76 of file SGObject.cpp.
|
inherited |
Definition at line 81 of file SGObject.cpp.
|
inherited |
Definition at line 86 of file SGObject.cpp.
|
inherited |
Definition at line 91 of file SGObject.cpp.
|
inherited |
Definition at line 96 of file SGObject.cpp.
|
inherited |
Definition at line 101 of file SGObject.cpp.
|
inherited |
Definition at line 106 of file SGObject.cpp.
|
inherited |
Definition at line 111 of file SGObject.cpp.
|
inherited |
set generic type to T
|
inherited |
|
inherited |
set the parallel object
parallel | parallel object to use |
Definition at line 241 of file SGObject.cpp.
|
inherited |
set the version object
version | version object to use |
Definition at line 283 of file SGObject.cpp.
int32_t set_num_features | ( | int32_t | num | ) |
set number of features
Sometimes when loading sparse features not all possible dimensions are used. This may pose a problem to classifiers when being applied to higher dimensional test-data. This function allows the feature space to be artificially expanded.
num | the number of features, must be larger than the current number of features |
Definition at line 56 of file StreamingSparseFeatures.cpp.
|
inherited |
set applied flag for preprocessor
num | index of preprocessor in list |
Definition at line 143 of file Features.cpp.
|
inherited |
|
inherited |
Set the vector reading functions.
The functions are implemented specific to the type in the derived class.
Definition at line 29 of file StreamingFeatures.cpp.
|
virtual |
Sets the read function (in case the examples are labelled) to get_*_vector_and_label from CStreamingFile.
The exact function depends on type T.
The parser uses the function set by this while reading labelled examples.
Implements CStreamingFeatures.
Definition at line 241 of file StreamingSparseFeatures.cpp.
|
virtual |
Sets the read function (in case the examples are unlabelled) to get_*_vector() from CStreamingFile.
The exact function depends on type T.
The parser uses the function set by this while reading unlabelled examples.
Implements CStreamingFeatures.
Definition at line 236 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
A shallow copy. All the SGObject instance variables will be simply assigned and SG_REF-ed.
Reimplemented in CGaussianKernel.
Definition at line 192 of file SGObject.cpp.
void sort_features | ( | ) |
Ensure features of the current vector are in ascending order. It modifies the current_sgvector in-place and does not change the reference in current_sgvector.features.
Definition at line 211 of file StreamingSparseFeatures.cpp.
|
static |
Compute the dot product between two sparse feature vectors: alpha * avec^T * bvec
alpha | scalar to multiply with |
avec | first sparse feature vector |
alen | avec's length |
bvec | second sparse feature vector |
blen | bvec's length |
Definition at line 65 of file StreamingSparseFeatures.cpp.
|
virtual |
Starts the parsing thread.
To be called before trying to use any feature vectors from this object.
Implements CStreamingFeatures.
Definition at line 293 of file StreamingSparseFeatures.cpp.
|
virtualinherited |
method may be overwritten to update things that depend on subset
Reimplemented in CStringFeatures< ST >, CStringFeatures< T >, CStringFeatures< uint8_t >, CStringFeatures< char >, and CStringFeatures< uint16_t >.
Definition at line 293 of file Features.h.
|
virtualinherited |
Does this class support compatible computation between different classes? For example, in this->dot(rhs_prt), can rhs_prt be an instance of a different class?
Reimplemented in CDenseSubSamplesFeatures< ST >.
Definition at line 323 of file Features.h.
|
inherited |
unset generic type
this has to be called in classes specializing a template class
Definition at line 303 of file SGObject.cpp.
|
inherited |
|
virtualinherited |
Updates the hash of current parameter combination
Definition at line 248 of file SGObject.cpp.
|
protected |
The current example's label.
Definition at line 360 of file StreamingSparseFeatures.h.
|
protected |
Number of features in current vector (as seen so far up to the current vector)
Definition at line 363 of file StreamingSparseFeatures.h.
|
protected |
The current example's feature vector as an SGSparseVector<T>
Definition at line 354 of file StreamingSparseFeatures.h.
|
protected |
The current vector index.
Definition at line 357 of file StreamingSparseFeatures.h.
|
protectedinherited |
Whether examples are labelled or not.
Definition at line 201 of file StreamingFeatures.h.
|
inherited |
io
Definition at line 369 of file SGObject.h.
|
inherited |
parameters wrt which we can compute gradients
Definition at line 384 of file SGObject.h.
|
inherited |
Hash of parameter values
Definition at line 387 of file SGObject.h.
|
inherited |
model selection parameters
Definition at line 381 of file SGObject.h.
|
inherited |
parameters
Definition at line 378 of file SGObject.h.
|
protectedinherited |
subset used for index transformations
Definition at line 352 of file Features.h.
|
inherited |
parallel
Definition at line 372 of file SGObject.h.
|
protected |
The parser object, which reads from input and returns parsed example objects.
Definition at line 351 of file StreamingSparseFeatures.h.
|
protectedinherited |
Whether the stream is seekable.
Definition at line 207 of file StreamingFeatures.h.
|
inherited |
version
Definition at line 375 of file SGObject.h.
|
protectedinherited |
The StreamingFile object to read from.
Definition at line 204 of file StreamingFeatures.h.