/usr/include/shogun/features/StringFileFeatures.h is in libshogun-dev 3.1.1-1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 | /*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 3 of the License, or
* (at your option) any later version.
*
* Written (W) 2009 Soeren Sonnenburg
* Copyright (C) 2009 Berlin Institute of Technology
*/
#ifndef _CSTRINGFILEFEATURES__H__
#define _CSTRINGFILEFEATURES__H__
#include <shogun/features/StringFeatures.h>
#include <shogun/features/Alphabet.h>
#include <shogun/io/MemoryMappedFile.h>
#include <shogun/mathematics/Math.h>
#include <shogun/io/SGIO.h>
namespace shogun
{
class CAlphabet;
template <class T> class CMemoryMappedFile;
/** @brief File based string features.
*
* StringFeatures that are file based. Underneath memory mapped files are used.
* Derived from CStringFeatures thus transparently enabling all of the
* StringFeature functionality.
*
* Supported file format contains one string per line, lines of variable length
* are supported and must be separated by '\n'.
*/
template <class ST> class CStringFileFeatures : public CStringFeatures<ST>
{
public:
/** default constructor
*
*/
CStringFileFeatures();
/** constructor
*
* @param fname filename of the file containing line based features
* @param alpha alphabet (type) to use for string features
*/
CStringFileFeatures(const char* fname, EAlphabet alpha);
/** default destructor
*
*/
virtual ~CStringFileFeatures();
/** Returns the name of the SGSerializable instance.
*
* @return name of the SGSerializable
*/
virtual const char* get_name() const { return "StringFileFeatures"; }
protected:
/** get next line from file
*
* The returned line may be modfied in case the file was opened
* read/write. It is otherwise read-only.
*
* @param len length of line (returned via reference)
* @param offs offset to be passed for reading next line, should be 0
* initially (returned via reference)
* @param line_nr used to indicate errors (returned as reference should be 0
* initially)
* @param file_length total length of the file (for error checking)
*
* @return line (NOT ZERO TERMINATED)
*/
ST* get_line(uint64_t& len, uint64_t& offs, int32_t& line_nr, uint64_t file_length);
/** cleanup string features */
virtual void cleanup();
/** cleanup a single feature vector */
virtual void cleanup_feature_vector(int32_t num);
/** obtain meta information from file
*
* i.e., determine number of strings and their lengths
*/
void fetch_meta_info_from_file(int32_t granularity=1048576);
protected:
/** memory mapped file*/
CMemoryMappedFile<ST>* file;
};
}
#endif // _CSTRINGFILEFEATURES__H__
|