The parsed fields from init command.
if (it->first == "signal")
else if (it->first == "val_channel")
else if (it->first == "time_channel")
else if (it->first == "win_from")
else if (it->first == "win_to")
win_to = med_stoi(it->second);
else if (it->first == "time_unit_win")
else if (it->first == "regex_filter")
else if (it->first == "remove_regex_filter")
else if (it->first == "min_age")
else if (it->first == "max_age")
else if (it->first == "age_bin")
else if (it->first == "min_code_cnt")
else if (it->first == "fdr")
fdr = med_stof(it->second);
else if (it->first == "take_top")
else if (it->first == "filter_hierarchy")
filter_hierarchy = med_stoi(it->second) > 0;
else if (it->first == "lift_below")
else if (it->first == "lift_above")
else if (it->first == "filter_child_count_ratio")
else if (it->first == "filter_child_lift_ratio")
else if (it->first == "filter_child_pval_diff")
else if (it->first == "filter_child_removed_ratio")
else if (it->first == "chi_square_at_least")
else if (it->first == "sort_by_chi")
else if (it->first == "minimal_chi_cnt")
else if (it->first == "use_fixed_lift")
else if (it->first == "verbose")
verbose = med_stoi(it->second) > 0;
else if (it->first == "verbose_full")
else if (it->first == "verbose_full_file")
else if (it->first == "feature_prefix")
else if (it->first == "stat_metric") {
if (conv_map_stats.find(it->second) != conv_map_stats.end())
stat_metric = category_stat_test(conv_map_stats.at(it->second));
else
MTHROW_AND_ERR("Unknown stat_test \"%s\". options are: %s\n",
it->second.c_str(), medial::io::get_list(conv_map_stats).c_str());
}
else if (it->first == "max_depth")
else if (it->first == "max_parents")
else if (it->first == "generate_with_counts")
else if (it->first == "regression_cntrl_lower") {
}
else if (it->first == "regression_cntrl_upper") {
}
else if (it->first == "regression_case_lower") {
}
else if (it->first == "regression_case_upper") {
}
else if (it->first == "male_regression_cntrl_lower")
else if (it->first == "male_regression_cntrl_upper")
else if (it->first == "male_regression_case_lower")
else if (it->first == "male_regression_case_upper")
else if (it->first == "female_regression_cntrl_lower")
else if (it->first == "female_regression_cntrl_upper")
else if (it->first == "female_regression_case_lower")
else if (it->first == "female_regression_case_upper")
else if (boost::starts_with(it->first, prefix_str)) {
int val_channel_f = med_stoi(it->first.substr(prefix_str.length()));
boost::split(f_v_sets, it->second, boost::is_any_of(","));
}
else if (boost::starts_with(it->first, prefix_str_names)) {
int val_channel_f = med_stoi(it->first.substr(prefix_str_names.length()));
}
else if (it->first == "fg_type") {}
else if (it->first ==
"tags") { boost::split(
tags, it->second, boost::is_any_of(
",")); }
else
MTHROW_AND_ERR("Unknown parameter \'%s\' for CategoryDependencyGenerator\n", it->first.c_str())
bool generate_with_counts
If true will generate feature with counts not just as set.
Definition FeatureGenerator.h:945
float filter_child_lift_ratio
below this threshold of lift change to remove child category
Definition FeatureGenerator.h:930
int max_depth
maximal depth to go in hierarchy
Definition FeatureGenerator.h:937
float male_regression_cntrl_lower
lower limit mask on outcome for controls - important in regression
Definition FeatureGenerator.h:949
string regex_filter
regex filter for filtering categories in learn
Definition FeatureGenerator.h:922
bool use_fixed_lift
If true, will also sort by lifts below 1.
Definition FeatureGenerator.h:939
string verbose_full_file
output file for verbose_full debug in learn
Definition FeatureGenerator.h:943
vector< string > filter_set_by_val_channel_names
naming for each set matched filter_set_by_val_channel variable
Definition FeatureGenerator.h:947
category_stat_test stat_metric
statistical test
Definition FeatureGenerator.h:933
float male_regression_cntrl_upper
upper limit mask on outcome for controls - important in regression
Definition FeatureGenerator.h:950
int min_code_cnt
minimal number of occurrences to consider signal
Definition FeatureGenerator.h:924
int age_bin
age bin for testing statistical dependency
Definition FeatureGenerator.h:921
float filter_child_pval_diff
below this threshold of pvalue diff change to remove child category (with AND condition on average li...
Definition FeatureGenerator.h:929
string remove_regex_filter
remove regex filter for filtering categories in learn
Definition FeatureGenerator.h:923
string signalName
the signal name
Definition FeatureGenerator.h:912
float female_regression_case_lower
lower limit mask on outcome for cases - important in regression
Definition FeatureGenerator.h:955
float male_regression_case_lower
lower limit mask on outcome for cases - important in regression
Definition FeatureGenerator.h:951
float lift_below
filter lift to keep below it
Definition FeatureGenerator.h:927
string feature_prefix
additional prefix to add to name to describe the feature
Definition FeatureGenerator.h:944
int time_channel
n >= 0 : use time channel n , default: 0.
Definition FeatureGenerator.h:914
int win_to
time window for feature: win_to is the maximal time before the prediction time
Definition FeatureGenerator.h:917
float female_regression_cntrl_lower
lower limit mask on outcome for controls - important in regression
Definition FeatureGenerator.h:953
int minimal_chi_cnt
chi_square arg to keep at least count to use row in calc
Definition FeatureGenerator.h:935
vector< vector< string > > filter_set_by_val_channel
filter set by value channels. can be initialized by "filter_set_by_val_channel_X":"string_set_for_val...
Definition FeatureGenerator.h:946
int max_parents
controls maximum parents count
Definition FeatureGenerator.h:938
float filter_child_removed_ratio
If child removed ratio is beyond this and has other child taken - remove parent.
Definition FeatureGenerator.h:932
float female_regression_case_upper
upper limit mask on outcome for cases - important in regression
Definition FeatureGenerator.h:956
int win_from
time window for feature: win_from is the minimal time before the prediction time
Definition FeatureGenerator.h:916
int max_age
maximal age for testing statistical dependency
Definition FeatureGenerator.h:920
float male_regression_case_upper
upper limit mask on outcome for cases - important in regression
Definition FeatureGenerator.h:952
int take_top
maximal number of features to create
Definition FeatureGenerator.h:926
float fdr
the FDR value
Definition FeatureGenerator.h:925
bool verbose_full
If true will print a lot - table of all stats for each code.
Definition FeatureGenerator.h:942
bool verbose
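Apply hierarchy filtering. (NOTE(review): this description appears misattached - it presumably documents filter_hierarchy, not the verbose flag; confirm against FeatureGenerator.h.)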
Definition FeatureGenerator.h:941
int min_age
minimal age for testing statistical dependency
Definition FeatureGenerator.h:919
float female_regression_cntrl_upper
upper limit mask on outcome for controls - important in regression
Definition FeatureGenerator.h:954
float lift_above
filter lift to keep above it
Definition FeatureGenerator.h:928
int val_channel
n >= 0 : use val channel n , default : 0.
Definition FeatureGenerator.h:915
float filter_child_count_ratio
If child ratio count is too similar, small change from parent code - keep only parent code.
Definition FeatureGenerator.h:931
int time_unit_win
the time unit in which the windows are given. Default: Undefined
Definition FeatureGenerator.h:918
float chi_square_at_least
chi_square arg to test for at least that change in lift to measure bigger difference
Definition FeatureGenerator.h:934
int sort_by_chi
sort results by chi-square
Definition FeatureGenerator.h:936
vector< string > tags
Tags - for defining labels or groups. may be used later for filtering for example.
Definition FeatureGenerator.h:69
int string_to_type(const string &str)
Convert string to type.
Definition MedTime.cpp:358