|
|
| LibFMParser (InputSplit *source, int nthread) |
| |
|
| LibFMParser (InputSplit *source, const std::map< std::string, std::string > &args, int nthread) |
| |
|
| TextParserBase (InputSplit *source, int nthread) |
| |
| virtual void | BeforeFirst (void) |
| | reset the iterator to the position before the first item
|
| |
| virtual size_t | BytesRead (void) const |
| |
| virtual bool | ParseNext (std::vector< RowBlockContainer< IndexType, DType > > *data) |
| | read in the next several blocks of data
|
| |
| virtual bool | Next (void) |
| | implementation of Next
|
| |
| virtual const RowBlock< IndexType, DType > & | Value (void) const |
| | get current data
|
| |
|
Parser< uint32_t, real_t > * | Create (const char *uri_, unsigned part_index, unsigned num_parts, const char *type) |
| |
|
Parser< uint64_t, real_t > * | Create (const char *uri_, unsigned part_index, unsigned num_parts, const char *type) |
| |
|
Parser< uint32_t, int32_t > * | Create (const char *uri_, unsigned part_index, unsigned num_parts, const char *type) |
| |
|
Parser< uint64_t, int32_t > * | Create (const char *uri_, unsigned part_index, unsigned num_parts, const char *type) |
| |
|
Parser< uint32_t, int64_t > * | Create (const char *uri_, unsigned part_index, unsigned num_parts, const char *type) |
| |
|
Parser< uint64_t, int64_t > * | Create (const char *uri_, unsigned part_index, unsigned num_parts, const char *type) |
| |
|
virtual | ~DataIter (void) DMLC_THROW_EXCEPTION |
| | destructor
|
| |
|
|
typedef Parser< IndexType, DType > *(* | Factory) (const std::string &path, const std::map< std::string, std::string > &args, unsigned part_index, unsigned num_parts) |
| | Factory type of the parser.
|
| |
| static Parser< IndexType, DType > * | Create (const char *uri_, unsigned part_index, unsigned num_parts, const char *type) |
| | create a new instance of parser based on the "type"
|
| |
| static const char * | BackFindEndLine (const char *bptr, const char *begin) |
| | start from bptr, go backward and find the first end of line
|
| |
| static void | IgnoreUTF8BOM (const char **begin, const char **end) |
| | Ignore UTF-8 BOM if present.
|
| |
|
IndexType | data_ptr_ |
| | pointer to begin and end of data
|
| |
|
IndexType | data_end_ |
| |
|
std::vector< RowBlockContainer< IndexType, DType > > | data_ |
| | internal data
|
| |
|
RowBlock< IndexType, DType > | block_ |
| | internal row block
|
| |
template<typename IndexType, typename DType = real_t>
class dmlc::data::LibFMParser< IndexType, DType >
Text parser that parses the input lines and returns rows in input data.