/usr/include/shogun/lib/SGSparseVector.h is in libshogun-dev 3.1.1-1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 | /*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 3 of the License, or
* (at your option) any later version.
*
* Written (W) 2013 Thoralf Klein
* Written (W) 2012 Fernando José Iglesias García
* Written (W) 2010,2012 Soeren Sonnenburg
* Copyright (C) 2010 Berlin Institute of Technology
* Copyright (C) 2012 Soeren Sonnenburg
*/
#ifndef __SGSPARSEVECTOR_H__
#define __SGSPARSEVECTOR_H__
#include <shogun/lib/config.h>
#include <shogun/lib/DataType.h>
#include <shogun/lib/SGReferencedData.h>
namespace shogun
{
class CFile;
/** @brief template class SGSparseVectorEntry */
template <class T> struct SGSparseVectorEntry
{
/** feature index */
index_t feat_index;
/** entry ... */
T entry;
};
/** @brief template class SGSparseVector
* The assumtion is that the stored SGSparseVectorEntry<T>* vector is ordered
* by SGSparseVectorEntry.feat_index in non-decreasing order.
* This has to be assured by the user of the class.
*/
template <class T> class SGSparseVector : public SGReferencedData
{
public:
/** default constructor */
SGSparseVector();
/** constructor for setting params
*
* @param feats vector of SGSparseVectorEntry ordered by SGSparseVectorEntry.feat_index in non-decreasing order
* @param num_entries number of elements in feats vector
* @param ref_counting use reference counting
*/
SGSparseVector(SGSparseVectorEntry<T>* feats, index_t num_entries,
bool ref_counting=true);
/** constructor to create new vector in memory */
SGSparseVector(index_t num_entries, bool ref_counting=true);
/** copy constructor */
SGSparseVector(const SGSparseVector& orig);
virtual ~SGSparseVector();
/** compute the dot product between dense weights and a sparse feature vector
* alpha * sparse^T * w + b
*
* possible with subset
*
* @param alpha scalar to multiply with
* @param vec dense vector to compute dot product with
* @param dim length of the dense vector
* @param b bias
* @return dot product between dense weights and a sparse feature vector
*/
T dense_dot(T alpha, T* vec, int32_t dim, T b);
/** compute the dot product between dense weights and a sparse feature vector
* sparse^T * w
*
* @param vec dense vector to compute dot product with
* @return dot product between dense weights and a sparse feature vector
*/
template<typename ST> T dense_dot(SGVector<ST> vec);
/** compute the dot product between current sparse vector and a given
* sparse vector.
* sparse_a^T * sparse_b
*
* @param v sparse vector
* @return dot product between the current sparse vector and v sparse vector
*/
T sparse_dot(const SGSparseVector<T>& v);
/** compute the dot product between two sparse vectors.
* sparse_a^T * sparse_b
*
* @param a sparse vector
* @param b sparse vector
* @return dot product between a and b
*/
static T sparse_dot(const SGSparseVector<T>& a, const SGSparseVector<T>& b);
/**
* get the sparse vector (no copying is done here)
*
* @return the refcount increased vector
*/
inline SGSparseVector<T> get()
{
return *this;
}
/**
* get number of dimensions
*
* @return largest feature index
*/
int32_t get_num_dimensions();
/**
* sort features by indices (Setting stable_pointer=true to
* guarantee that pointer features does not change. On the
* other hand, stable_pointer=false can shrink the vector if
* possible.)
*
* @param stable_pointer (default false) enforce stable pointer
*/
void sort_features(bool stable_pointer = false);
/**
* get feature value for index
*
* @param index
* @return value
*/
T get_feature(int32_t index);
/**
* get dense representation of given size
*
* @param dimension of requested dense vector
* @return SGVector<T>
*/
SGVector<T> get_dense(int32_t dimension);
/**
* get shortet dense representation for sparse vector
*
* @return SGVector<T>
*/
SGVector<T> get_dense();
/** clone vector */
SGSparseVector<T> clone() const;
/** load vector from file
*
* @param loader File object via which to load data
*/
void load(CFile* loader);
/** save vector to file
*
* @param saver File object via which to save data
*/
void save(CFile* saver);
/** display vector
*
* @param name vector name in output
* @param prefix prepend on every entry
*/
void display_vector(const char* name="vector",
const char* prefix="");
protected:
virtual void copy_data(const SGReferencedData& orig);
virtual void init_data();
virtual void free_data();
/** helper function to compute dot product
*
* determines whether symmetric (similar number of non-zero elements in
* both sparse vectors) or asymetric (logarithmically more elements in one vector)
* dot product computation routine shall be taken
*
* @param alen length of vector a
* @param blen length of vector b
*
* @return -1,0,1 if asymetric(b,a), symmetric(a,b) respectively
* asymmetric(a,b) shall be called
*/
static int32_t cmp_dot_prod_symmetry_fast(index_t alen, index_t blen);
/** compute dot product between vectors a and b
*
* particularly fast if len(a) << len(b)
*
* @param a vector a
* @param b vector b
*
* @return dot product
*/
static T dot_prod_asymmetric(const SGSparseVector<T>& a, const SGSparseVector<T>& b);
/** compute dot product between vectors a and b
*
* particularly fast if len(a) ~= len(b)
*
* @param a vector a
* @param b vector b
*
* @return dot product
*/
static T dot_prod_symmetric(const SGSparseVector<T>& a, const SGSparseVector<T>& b);
public:
/** number of feature entries */
index_t num_feat_entries;
/** features */
SGSparseVectorEntry<T>* features;
};
}
#endif // __SGSPARSEVECTOR_H__
|