Medial Code Documentation
binary_objective.hpp
#ifndef LIGHTGBM_OBJECTIVE_BINARY_OBJECTIVE_HPP_
#define LIGHTGBM_OBJECTIVE_BINARY_OBJECTIVE_HPP_

#include <LightGBM/objective_function.h>

#include <algorithm>
#include <cmath>
#include <cstring>
#include <functional>
#include <sstream>
#include <string>
#include <vector>

namespace LightGBM {
/*!
* \brief Objective function for binary classification.
*/
class BinaryLogloss: public ObjectiveFunction {
 public:
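  /*!
  * \brief Construct from the training config. The optional is_pos predicate
  *        decides which labels count as positive (default: label > 0).
  */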
  explicit BinaryLogloss(const Config& config, std::function<bool(label_t)> is_pos = nullptr) {
    sigmoid_ = static_cast<double>(config.sigmoid);
    if (sigmoid_ <= 0.0) {
      Log::Fatal("Sigmoid parameter %f should be greater than zero", sigmoid_);
    }
    is_unbalance_ = config.is_unbalance;
    scale_pos_weight_ = static_cast<double>(config.scale_pos_weight);
    if (is_unbalance_ && std::fabs(scale_pos_weight_ - 1.0f) > 1e-6) {
      Log::Fatal("Cannot set is_unbalance and scale_pos_weight at the same time");
    }
    is_pos_ = is_pos;
    if (is_pos_ == nullptr) {
      is_pos_ = [](label_t label) { return label > 0; };
    }
  }

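  /*!
  * \brief Construct from a serialized model string, parsing the
  *        "sigmoid:<value>" token that ToString() below writes out.
  */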
  explicit BinaryLogloss(const std::vector<std::string>& strs) {
    sigmoid_ = -1;
    for (const auto& str : strs) {
      auto tokens = Common::Split(str.c_str(), ':');
      if (tokens.size() == 2) {
        if (tokens[0] == std::string("sigmoid")) {
          Common::Atof(tokens[1].c_str(), &sigmoid_);
        }
      }
    }
    if (sigmoid_ <= 0.0) {
      Log::Fatal("Sigmoid parameter %f should be greater than zero", sigmoid_);
    }
  }

  ~BinaryLogloss() {}

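  /*!
  * \brief Initialize from the training metadata: cache the label and weight
  *        pointers, count the two classes, and derive per-class label weights.
  */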
  void Init(const Metadata& metadata, data_size_t num_data) override {
    num_data_ = num_data;
    label_ = metadata.label();
    weights_ = metadata.weights();
    data_size_t cnt_positive = 0;
    data_size_t cnt_negative = 0;
    // REMOVEME: remove the warning after the 2.4 version release
    Log::Warning("Starting from the 2.1.2 version, default value for "
                 "the \"boost_from_average\" parameter in \"binary\" objective is true.\n"
                 "This may cause significantly different results comparing to the previous versions of LightGBM.\n"
                 "Try to set boost_from_average=false, if your old models produce bad results");
    // count the positive and negative samples
    #pragma omp parallel for schedule(static) reduction(+:cnt_positive, cnt_negative)
    for (data_size_t i = 0; i < num_data_; ++i) {
      if (is_pos_(label_[i])) {
        ++cnt_positive;
      } else {
        ++cnt_negative;
      }
    }
    need_train_ = true;
    if (cnt_negative == 0 || cnt_positive == 0) {
      Log::Warning("Contains only one class");
      // no need to boost
      need_train_ = false;
    }
    Log::Info("Number of positive: %d, number of negative: %d", cnt_positive, cnt_negative);
    // use -1 for the negative class and 1 for the positive class
    label_val_[0] = -1;
    label_val_[1] = 1;
    // weight for each label
    label_weights_[0] = 1.0f;
    label_weights_[1] = 1.0f;
    // if the unbalance mode is enabled, reweight the rarer class
    if (is_unbalance_ && cnt_positive > 0 && cnt_negative > 0) {
      if (cnt_positive > cnt_negative) {
        label_weights_[1] = 1.0f;
        label_weights_[0] = static_cast<double>(cnt_positive) / cnt_negative;
      } else {
        label_weights_[1] = static_cast<double>(cnt_negative) / cnt_positive;
        label_weights_[0] = 1.0f;
      }
    }
    label_weights_[1] *= scale_pos_weight_;
  }

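  /*!
  * \brief Compute the first- and second-order derivatives of the logloss.
  *        With y in {-1, +1} and raw score s, the loss is
  *        log(1 + exp(-y * sigmoid_ * s)), so
  *        gradient = -y * sigmoid_ / (1 + exp(y * sigmoid_ * s)) and
  *        hessian = |gradient| * (sigmoid_ - |gradient|).
  */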
  void GetGradients(const double* score, score_t* gradients, score_t* hessians) const override {
    if (!need_train_) {
      return;
    }
    if (weights_ == nullptr) {
      #pragma omp parallel for schedule(static)
      for (data_size_t i = 0; i < num_data_; ++i) {
        // get the label and label weight
        const int is_pos = is_pos_(label_[i]);
        const int label = label_val_[is_pos];
        const double label_weight = label_weights_[is_pos];
        // calculate the gradient and hessian
        const double response = -label * sigmoid_ / (1.0f + std::exp(label * sigmoid_ * score[i]));
        const double abs_response = std::fabs(response);
        gradients[i] = static_cast<score_t>(response * label_weight);
        hessians[i] = static_cast<score_t>(abs_response * (sigmoid_ - abs_response) * label_weight);
      }
    } else {
      #pragma omp parallel for schedule(static)
      for (data_size_t i = 0; i < num_data_; ++i) {
        // get the label and label weight
        const int is_pos = is_pos_(label_[i]);
        const int label = label_val_[is_pos];
        const double label_weight = label_weights_[is_pos];
        // calculate the gradient and hessian, scaled by the sample weight
        const double response = -label * sigmoid_ / (1.0f + std::exp(label * sigmoid_ * score[i]));
        const double abs_response = std::fabs(response);
        gradients[i] = static_cast<score_t>(response * label_weight * weights_[i]);
        hessians[i] = static_cast<score_t>(abs_response * (sigmoid_ - abs_response) * label_weight * weights_[i]);
      }
    }
  }

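  // The initial score s0 below is chosen so that the converted output matches
  // the (weighted) positive rate pavg:
  //   1 / (1 + exp(-sigmoid_ * s0)) = pavg  =>  s0 = log(pavg / (1 - pavg)) / sigmoid_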
  // implement a custom average to boost from (if enabled among the options)
  double BoostFromScore(int) const override {
    double suml = 0.0f;
    double sumw = 0.0f;
    if (weights_ != nullptr) {
      #pragma omp parallel for schedule(static) reduction(+:suml, sumw)
      for (data_size_t i = 0; i < num_data_; ++i) {
        suml += is_pos_(label_[i]) * weights_[i];
        sumw += weights_[i];
      }
    } else {
      sumw = static_cast<double>(num_data_);
      #pragma omp parallel for schedule(static) reduction(+:suml)
      for (data_size_t i = 0; i < num_data_; ++i) {
        suml += is_pos_(label_[i]);
      }
    }
    double pavg = suml / sumw;
    pavg = std::min(pavg, 1.0 - kEpsilon);
    pavg = std::max<double>(pavg, kEpsilon);
    double initscore = std::log(pavg / (1.0f - pavg)) / sigmoid_;
    Log::Info("[%s:%s]: pavg=%f -> initscore=%f", GetName(), __func__, pavg, initscore);
    return initscore;
  }

  bool ClassNeedTrain(int /*class_id*/) const override {
    return need_train_;
  }

  const char* GetName() const override {
    return "binary";
  }

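  /*!
  * \brief Convert a raw score into the probability P(y = 1) with the scaled
  *        sigmoid; this is the inverse of the transform used in BoostFromScore().
  */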
  void ConvertOutput(const double* input, double* output) const override {
    output[0] = 1.0f / (1.0f + std::exp(-sigmoid_ * input[0]));
  }

  std::string ToString() const override {
    std::stringstream str_buf;
    str_buf << GetName() << " ";
    str_buf << "sigmoid:" << sigmoid_;
    return str_buf.str();
  }

  bool SkipEmptyClass() const override { return true; }

  bool NeedAccuratePrediction() const override { return false; }

 private:
  /*! \brief Number of data points */
  data_size_t num_data_;
  /*! \brief Pointer to the labels */
  const label_t* label_;
  /*! \brief True if unbalanced training is enabled */
  bool is_unbalance_;
  /*! \brief Sigmoid parameter */
  double sigmoid_;
  /*! \brief Label values for the negative (index 0) and positive (index 1) classes */
  int label_val_[2];
  /*! \brief Label weights for the negative (index 0) and positive (index 1) classes */
  double label_weights_[2];
  /*! \brief Pointer to the per-sample weights (nullptr if none) */
  const label_t* weights_;
  /*! \brief Extra weight multiplier for the positive class */
  double scale_pos_weight_;
  /*! \brief Predicate that decides whether a label counts as positive */
  std::function<bool(label_t)> is_pos_;
  /*! \brief False if the data contains only one class, in which case there is nothing to train */
  bool need_train_;
};

}  // namespace LightGBM
#endif  // LIGHTGBM_OBJECTIVE_BINARY_OBJECTIVE_HPP_
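
As a quick sanity check on the derivative formulas above, here is a minimal, self-contained C++ sketch (not part of LightGBM; all names in it are illustrative) that reproduces the gradient and hessian computed in GetGradients() for a single unweighted sample and compares the gradient against a central finite difference of the logloss:

#include <cmath>
#include <cstdio>

int main() {
  const double sigmoid = 1.0;  // plays the role of sigmoid_
  const double score = 0.3;    // current raw model score for one sample
  const int label = 1;         // +1 for the positive class, -1 for the negative

  // Same formulas as BinaryLogloss::GetGradients (unit label weight).
  const double response = -label * sigmoid / (1.0 + std::exp(label * sigmoid * score));
  const double abs_response = std::fabs(response);
  const double hessian = abs_response * (sigmoid - abs_response);

  // Central finite difference of loss(s) = log(1 + exp(-label * sigmoid * s)).
  const double eps = 1e-6;
  auto loss = [&](double s) { return std::log(1.0 + std::exp(-label * sigmoid * s)); };
  const double fd_gradient = (loss(score + eps) - loss(score - eps)) / (2.0 * eps);

  // The analytic and finite-difference gradients should agree closely.
  std::printf("gradient=%.9f finite_diff=%.9f hessian=%.9f\n",
              response, fd_gradient, hessian);
  return 0;
}

Compiled with any C++11 compiler, the two gradient values should agree to many decimal places, which confirms that the response expression is the exact derivative of the loss whose hessian is written as |gradient| * (sigmoid - |gradient|).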
Referenced symbols

LightGBM::BinaryLogloss: objective function for binary classification (binary_objective.hpp:13).
void GetGradients(const double *score, score_t *gradients, score_t *hessians) const override: calculates the first- and second-order derivatives of the loss function (binary_objective.hpp:94).
bool NeedAccuratePrediction() const override: whether predictions must be accurate; returning true disables early stopping during prediction (binary_objective.hpp:173).
void Init(const Metadata &metadata, data_size_t num_data) override: initializes the objective from the training metadata (binary_objective.hpp:48).
LightGBM::Metadata: stores meta (non-feature) data for the training set, e.g. labels and weights (dataset.h:36).
const label_t *label() const: returns a pointer to the labels (dataset.h:113).
const label_t *weights() const: returns the weights, or nullptr if there are none (dataset.h:146).
LightGBM::ObjectiveFunction: the interface of objective functions (objective_function.h:13).
LightGBM (namespace): desc and descl2 fields must be written in reStructuredText format (application.h:10).
score_t: type of scores and gradients, defined as float (meta.h:26).
label_t: type of metadata, including weights and labels, defined as float (meta.h:33).
data_size_t: type of data sizes, defined as int32_t; a signed type is preferred (meta.h:14).
LightGBM::Config (config.h:27).