/** Forward declaration of the tokenizer class. */
20 class CDelimiterTokenizer;
/** Forward declaration of the SGString class template (one type parameter, ST). */
23 template <
class ST>
class SGString;
/** Forward declaration of the SGSparseVector class template (one type parameter, T). */
24 template <
class T>
class SGSparseVector;
/** Constructor taking a C stdio stream.
 *
 * @param f FILE pointer
 * @param name optional name, defaults to NULL
 */
40 CCSVFile(FILE* f,
const char* name=NULL);
/** Constructor taking an integer file descriptor.
 *
 * @param fd file descriptor
 * @param mode mode string (NOTE(review): presumably an fdopen-style
 *        mode such as "r" or "w" -- confirm against the implementation)
 * @param name optional name, defaults to NULL
 */
48 CCSVFile(
int fd,
const char* mode,
const char* name=NULL);
/** Constructor taking a file name.
 *
 * @param fname name of the file
 * @param rw single-character access selector, defaults to 'r'
 *        (NOTE(review): presumably 'r' = read, 'w' = write -- confirm)
 * @param name optional name, defaults to NULL
 */
56 CCSVFile(
const char* fname,
char rw=
'r',
const char* name=NULL);
/** get_vector overloads for char and the 8/16/32/64-bit signed and
 * unsigned integer element types.
 *
 * Both arguments are passed by non-const reference.
 * NOTE(review): presumably the call allocates the buffer and reports its
 * length through these references -- confirm ownership of the returned
 * buffer against the implementation.
 *
 * @param vector reference to the element pointer
 * @param len reference to the number of elements
 */
94 virtual void get_vector(int8_t*& vector, int32_t& len);
95 virtual void get_vector(uint8_t*& vector, int32_t& len);
96 virtual void get_vector(
char*& vector, int32_t& len);
97 virtual void get_vector(int32_t*& vector, int32_t& len);
98 virtual void get_vector(uint32_t*& vector, int32_t& len);
102 virtual void get_vector(int16_t*& vector, int32_t& len);
103 virtual void get_vector(uint16_t*& vector, int32_t& len);
104 virtual void get_vector(int64_t*& vector, int32_t& len);
105 virtual void get_vector(uint64_t*& vector, int32_t& len);
117 uint8_t*& matrix, int32_t& num_feat, int32_t& num_vec);
119 int8_t*& matrix, int32_t& num_feat, int32_t& num_vec);
121 char*& matrix, int32_t& num_feat, int32_t& num_vec);
123 int32_t*& matrix, int32_t& num_feat, int32_t& num_vec);
125 uint32_t*& matrix, int32_t& num_feat, int32_t& num_vec);
127 int64_t*& matrix, int32_t& num_feat, int32_t& num_vec);
129 uint64_t*& matrix, int32_t& num_feat, int32_t& num_vec);
131 float32_t*& matrix, int32_t& num_feat, int32_t& num_vec);
133 float64_t*& matrix, int32_t& num_feat, int32_t& num_vec);
135 floatmax_t*& matrix, int32_t& num_feat, int32_t& num_vec);
137 int16_t*& matrix, int32_t& num_feat, int32_t& num_vec);
139 uint16_t*& matrix, int32_t& num_feat, int32_t& num_vec);
151 uint8_t*& array, int32_t*& dims, int32_t& num_dims);
153 char*& array, int32_t*& dims, int32_t& num_dims);
155 int32_t*& array, int32_t*& dims, int32_t& num_dims);
157 float32_t*& array, int32_t*& dims, int32_t& num_dims);
159 float64_t*& array, int32_t*& dims, int32_t& num_dims);
161 int16_t*& array, int32_t*& dims, int32_t& num_dims);
163 uint16_t*& array, int32_t*& dims, int32_t& num_dims);
212 int32_t& max_string_len);
215 int32_t& max_string_len);
218 int32_t& max_string_len);
221 int32_t& max_string_len);
224 int32_t& max_string_len);
227 int32_t& max_string_len);
230 int32_t& max_string_len);
233 int32_t& max_string_len);
236 int32_t& max_string_len);
239 int32_t& max_string_len);
242 int32_t& max_string_len);
245 int32_t& max_string_len);
/** set_vector overloads for char and the 8/16/32/64-bit signed and
 * unsigned integer element types.
 *
 * The elements are taken through a pointer to const, so the caller's
 * buffer cannot be modified through this pointer.
 * NOTE(review): presumably writes the len elements to the underlying
 * file -- confirm against the implementation.
 *
 * @param vector pointer to the elements
 * @param len number of elements
 */
258 virtual void set_vector(
const int8_t* vector, int32_t len);
259 virtual void set_vector(
const uint8_t* vector, int32_t len);
260 virtual void set_vector(
const char* vector, int32_t len);
261 virtual void set_vector(
const int32_t* vector, int32_t len);
262 virtual void set_vector(
const uint32_t* vector, int32_t len);
266 virtual void set_vector(
const int16_t* vector, int32_t len);
267 virtual void set_vector(
const uint16_t* vector, int32_t len);
268 virtual void set_vector(
const int64_t* vector, int32_t len);
269 virtual void set_vector(
const uint64_t* vector, int32_t len);
280 const uint8_t* matrix, int32_t num_feat, int32_t num_vec);
282 const int8_t* matrix, int32_t num_feat, int32_t num_vec);
284 const char* matrix, int32_t num_feat, int32_t num_vec);
286 const int32_t* matrix, int32_t num_feat, int32_t num_vec);
288 const uint32_t* matrix, int32_t num_feat, int32_t num_vec);
290 const int64_t* matrix, int32_t num_feat, int32_t num_vec);
292 const uint64_t* matrix, int32_t num_feat, int32_t num_vec);
294 const float32_t* matrix, int32_t num_feat, int32_t num_vec);
296 const float64_t* matrix, int32_t num_feat, int32_t num_vec);
298 const floatmax_t* matrix, int32_t num_feat, int32_t num_vec);
300 const int16_t* matrix, int32_t num_feat, int32_t num_vec);
302 const uint16_t* matrix, int32_t num_feat, int32_t num_vec);
373 #endif // #ifndef SWIG
/** Returns the name of this class.
 *
 * @return the string literal "CSVFile"
 */
375 virtual const char*
get_name()
const {
return "CSVFile"; }
/** Helper taking no arguments.
 * NOTE(review): presumably resets the members to their default values --
 * confirm against the implementation.
 */
382 void init_with_defaults();
/** Helper that skips lines.
 * NOTE(review): presumably advances past num_lines lines of the input --
 * confirm against the implementation.
 *
 * @param num_lines number of lines
 */
385 void skip_lines(int32_t num_lines);
/** Transposition flag.
 * NOTE(review): presumably the value stored by set_transpose(bool) -- confirm.
 */
401 bool is_data_transposed;
/** Number of items to skip.
 * NOTE(review): presumably the line count stored by
 * set_lines_to_skip(int32_t) -- confirm.
 */
407 int32_t m_num_to_skip;
void set_delimiter(char delimiter)
virtual void get_matrix(uint8_t *&matrix, int32_t &num_feat, int32_t &num_vec)
void set_transpose(bool value)
virtual void set_vector(const int8_t *vector, int32_t len)
virtual void set_matrix(const uint8_t *matrix, int32_t num_feat, int32_t num_vec)
virtual void set_string_list(const SGString< uint8_t > *strings, int32_t num_str)
Class for buffered reading from an ASCII file.
void set_lines_to_skip(int32_t num_lines)
int32_t get_stats(int32_t &num_tokens)
Class CSVFile used to read data from comma-separated values (CSV) files. See http://en.wikipedia.org/wiki/Comma-separated_values.
Class for reading from a string.
virtual void get_vector(int8_t *&vector, int32_t &len)
A File access base class.
virtual void get_sparse_matrix(SGSparseVector< bool > *&matrix, int32_t &num_feat, int32_t &num_vec)
All classes and functions are contained in the shogun namespace.
The class CDelimiterTokenizer is used to tokenize a SGVector into tokens using custom chars as ...
virtual void set_sparse_matrix(const SGSparseVector< bool > *matrix, int32_t num_feat, int32_t num_vec)
template class SGSparseVector. The assumption is that the stored SGSparseVectorEntry* vector is orde...
virtual const char * get_name() const
virtual void get_string_list(SGString< uint8_t > *&strings, int32_t &num_str, int32_t &max_string_len)
virtual void get_ndarray(uint8_t *&array, int32_t *&dims, int32_t &num_dims)