/// Declaration of what appears to be the DatasetLoader constructor (no return
/// type; the enclosing class header is not visible in this excerpt).
/// @param io_config   Configuration object, taken by const reference.
/// @param predict_fun Prediction callback, taken by const reference.
///                    NOTE(review): the class also holds a `const PredictFunction&`
///                    member (`predict_fun_`); if that member is bound to this
///                    argument, the caller must keep the callable alive for the
///                    lifetime of the loader -- confirm in the definition.
/// @param num_class   Integer class count; how it is used is not visible here.
/// @param filename    C-string file name; presumably the data file -- TODO confirm.
10 LIGHTGBM_EXPORT
DatasetLoader(
const Config& io_config,
const PredictFunction& predict_fun,
int num_class,
const char* filename);
/// Declares the four-argument LoadFromFile, which returns a `Dataset*`.
/// @param filename       C-string name of the file to load.
/// @param initscore_file C-string name of an initial-score file; whether it may
///                       be null/empty is not visible here.
/// @param rank           Presumably this worker's index in a distributed run --
///                       TODO confirm. The two-argument overload passes 0.
/// @param num_machines   Presumably the total worker count -- TODO confirm.
///                       The two-argument overload passes 1.
/// @return Pointer to a Dataset. NOTE(review): ownership of the returned raw
///         pointer is not established by this declaration -- verify at call sites.
14 LIGHTGBM_EXPORT
Dataset* LoadFromFile(
const char* filename,
const char* initscore_file,
int rank,
int num_machines);
/// Convenience overload: forwards to the four-argument LoadFromFile with
/// rank = 0 and num_machines = 1, and returns its result unchanged.
/// NOTE(review): the closing brace of this inline body does not appear in this
/// excerpt -- verify against the original header.
16 LIGHTGBM_EXPORT
Dataset* LoadFromFile(
const char* filename,
const char* initscore_file) {
17 return LoadFromFile(filename, initscore_file, 0, 1);
/// Declares a loader that takes an existing Dataset in addition to the file names
/// and returns a `Dataset*`.
/// @param filename       C-string name of the file to load.
/// @param initscore_file C-string name of an initial-score file.
/// @param train_data     Existing dataset, read-only (pointer to const).
///                       Presumably the new dataset reuses its feature/bin layout
///                       so the two stay aligned -- TODO confirm in the definition.
/// @return Pointer to a Dataset; ownership is not established by this declaration.
20 LIGHTGBM_EXPORT
Dataset* LoadFromFileAlignWithOtherDataset(
const char* filename,
const char* initscore_file,
const Dataset* train_data);
/// Declares a function returning a `Dataset*` built from sampled column data.
/// NOTE(review): the parameter list is cut off in this excerpt (no closing
/// parenthesis is visible), so the full signature cannot be documented here.
/// NOTE(review): the identifier is spelled `Costruct...` (sic); it is part of the
/// exported interface, so renaming it would break existing callers.
/// Visible parameters:
///   sample_values  - pointer-to-pointer of double; presumably one array per column -- TODO confirm.
///   sample_indices - pointer-to-pointer of int; presumably row indices matching sample_values -- TODO confirm.
///   num_col        - integer column count.
///   num_per_col    - read-only int array; presumably the number of samples in each column -- TODO confirm.
22 LIGHTGBM_EXPORT
Dataset* CostructFromSampleData(
double** sample_values,
23 int** sample_indices,
int num_col,
const int* num_per_col,
/// Declares LoadFromBinFile, which returns a `Dataset*`.
/// @param data_filename     C-string name of the data file.
/// @param bin_filename      C-string name of the binary file.
/// @param rank              Presumably this worker's index -- TODO confirm.
/// @param num_machines      Presumably the total worker count -- TODO confirm.
/// @param num_global_data   Non-const int pointer; presumably an output receiving
///                          the global row count -- TODO confirm.
/// @param used_data_indices Non-const pointer to a vector of data_size_t;
///                          presumably filled with the row indices kept by this
///                          worker -- TODO confirm.
/// @return Pointer to a Dataset; ownership is not established by this declaration.
32 Dataset* LoadFromBinFile(
const char* data_filename,
const char* bin_filename,
int rank,
int num_machines,
int* num_global_data, std::vector<data_size_t>* used_data_indices);
/// Declares SetHeader, which takes a file name and returns nothing.
/// NOTE(review): presumably reads the file's header to configure loader state
/// (e.g. feature names) -- the definition is not visible here; confirm.
34 void SetHeader(
const char* filename);
/// Declares CheckDataset, which inspects a Dataset through a pointer-to-const
/// and returns nothing.
/// NOTE(review): how a failed check is reported (log, fatal error, exception)
/// is not visible from this declaration -- confirm in the definition.
36 void CheckDataset(
const Dataset* dataset);
/// Declares LoadTextDataToMemory, which returns a vector of strings by value
/// (presumably one entry per text line -- TODO confirm).
/// @param filename          C-string name of the text file.
/// @param metadata          Metadata object, read-only.
/// @param rank              Presumably this worker's index -- TODO confirm.
/// @param num_machines      Presumably the total worker count -- TODO confirm.
/// @param num_global_data   Non-const int pointer; presumably an output -- TODO confirm.
/// @param used_data_indices Non-const pointer to a vector of data_size_t;
///                          presumably an output -- TODO confirm.
38 std::vector<std::string> LoadTextDataToMemory(
const char* filename,
const Metadata& metadata,
int rank,
int num_machines,
int* num_global_data, std::vector<data_size_t>* used_data_indices);
/// Declares SampleTextDataFromMemory: takes a read-only vector of strings and
/// returns a new vector of strings by value.
/// NOTE(review): presumably returns a sampled subset of `data`; the sampling
/// policy and size are not visible from this declaration -- confirm.
40 std::vector<std::string> SampleTextDataFromMemory(
const std::vector<std::string>& data);
/// Declares SampleTextDataFromFile, which returns a vector of strings by value.
/// Its parameter list is identical to that of LoadTextDataToMemory.
/// NOTE(review): presumably samples lines directly from the file instead of
/// loading all of them -- confirm in the definition.
/// @param filename          C-string name of the text file.
/// @param metadata          Metadata object, read-only.
/// @param rank              Presumably this worker's index -- TODO confirm.
/// @param num_machines      Presumably the total worker count -- TODO confirm.
/// @param num_global_data   Non-const int pointer; presumably an output -- TODO confirm.
/// @param used_data_indices Non-const pointer to a vector of data_size_t;
///                          presumably an output -- TODO confirm.
42 std::vector<std::string> SampleTextDataFromFile(
const char* filename,
const Metadata& metadata,
int rank,
int num_machines,
int* num_global_data, std::vector<data_size_t>* used_data_indices);
/// Declares ConstructBinMappersFromTextData, which returns nothing.
/// @param rank         Presumably this worker's index -- TODO confirm.
/// @param num_machines Presumably the total worker count -- TODO confirm.
/// @param sample_data  Read-only vector of strings (presumably sampled text lines).
/// @param parser       Parser accessed through a pointer-to-const.
/// @param dataset      Non-const Dataset pointer; presumably the object that
///                     receives the constructed bin mappers -- TODO confirm.
44 void ConstructBinMappersFromTextData(
int rank,
int num_machines,
const std::vector<std::string>& sample_data,
const Parser* parser,
Dataset* dataset);
/// Declares ExtractFeaturesFromMemory, which returns nothing.
/// @param text_data Vector of strings taken by NON-const reference, so the callee
///                  is allowed to modify it. NOTE(review): whether it is cleared
///                  or otherwise consumed is not visible here -- confirm before
///                  reusing the vector after the call.
/// @param parser    Parser accessed through a pointer-to-const.
/// @param dataset   Non-const Dataset pointer; presumably receives the extracted
///                  features -- TODO confirm.
47 void ExtractFeaturesFromMemory(std::vector<std::string>& text_data,
const Parser* parser,
Dataset* dataset);
/// Declares ExtractFeaturesFromFile, which returns nothing.
/// @param filename          C-string name of the file to read.
/// @param parser            Parser accessed through a pointer-to-const.
/// @param used_data_indices Read-only vector of data_size_t; presumably the row
///                          indices to keep -- TODO confirm (including what an
///                          empty vector means).
/// @param dataset           Non-const Dataset pointer; presumably receives the
///                          extracted features -- TODO confirm.
50 void ExtractFeaturesFromFile(
const char* filename,
const Parser* parser,
const std::vector<data_size_t>& used_data_indices,
Dataset* dataset);
/// Declares CheckCanLoadFromBin, which takes a file name and returns a
/// std::string by value.
/// NOTE(review): presumably the returned string names a usable binary file and
/// is empty when none is available -- the definition is not visible; confirm.
53 std::string CheckCanLoadFromBin(
const char* filename);
// Non-owning reference to a PredictFunction. Because this is a reference member,
// the referenced object must outlive this loader, and the class is not
// copy-assignable by default.
59 const PredictFunction& predict_fun_;
// Set of integers; presumably indices of feature columns to skip -- TODO confirm.
69 std::unordered_set<int> ignore_features_;
// Feature names stored as strings (presumably one per column, in column order -- TODO confirm).
71 std::vector<std::string> feature_names_;
// Set of integers; presumably indices of columns treated as categorical -- TODO confirm.
73 std::unordered_set<int> categorical_features_;