ranking_utils.h
/**
 * Copyright 2023 by XGBoost Contributors
 */
#ifndef XGBOOST_COMMON_RANKING_UTILS_H_
#define XGBOOST_COMMON_RANKING_UTILS_H_
#include <algorithm>  // for min
#include <cmath>      // for log2, fabs, floor
#include <cstddef>    // for size_t
#include <cstdint>    // for uint32_t, uint8_t, int32_t
#include <limits>     // for numeric_limits
#include <string>     // for char_traits, string
#include <vector>     // for vector

#include "dmlc/parameter.h"              // for FieldEntry, DMLC_DECLARE_FIELD
#include "error_msg.h"                   // for GroupWeight, GroupSize, InvalidCUDAOrdinal
#include "xgboost/base.h"                // for XGBOOST_DEVICE, bst_group_t
#include "xgboost/context.h"             // for Context
#include "xgboost/data.h"                // for MetaInfo
#include "xgboost/host_device_vector.h"  // for HostDeviceVector
#include "xgboost/linalg.h"              // for Vector, VectorView, Tensor
#include "xgboost/logging.h"             // for CHECK_EQ, CHECK
#include "xgboost/parameter.h"           // for XGBoostParameter
#include "xgboost/span.h"                // for Span
#include "xgboost/string_view.h"         // for StringView
namespace xgboost::ltr {
/**
 * \brief Relevance degree.
 */
using rel_degree_t = std::uint32_t;  // NOLINT
/**
 * \brief Top-k position.
 */
using position_t = std::uint32_t;  // NOLINT

/**
 * \brief Maximum relevance degree for NDCG. The exponential gain is computed as
 *        2^rel - 1, which must fit into rel_degree_t, hence 31 for a 32-bit type.
 */
constexpr std::size_t MaxRel() { return sizeof(rel_degree_t) * 8 - 1; }
static_assert(MaxRel() == 31);

XGBOOST_DEVICE inline double CalcDCGGain(rel_degree_t label) {
  return static_cast<double>((1u << label) - 1);
}

XGBOOST_DEVICE inline double CalcDCGDiscount(std::size_t idx) {
  return 1.0 / std::log2(static_cast<double>(idx) + 2.0);
}

XGBOOST_DEVICE inline double CalcInvIDCG(double idcg) {
  auto inv_idcg = (idcg == 0.0 ? 0.0 : (1.0 / idcg));  // handle irrelevant document
  return inv_idcg;
}
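
// A worked example of how these helpers combine (illustrative numbers, not from the
// source): for a ranked list with relevance labels {3, 2, 0} and the exponential gain,
//
//   DCG = CalcDCGGain(3) * CalcDCGDiscount(0)   // 7 / log2(2) = 7.0
//       + CalcDCGGain(2) * CalcDCGDiscount(1)   // 3 / log2(3) ~ 1.893
//       + CalcDCGGain(0) * CalcDCGDiscount(2)   // 0 / log2(4) = 0.0
//                                               // ~ 8.893 in total
//
// and NDCG is obtained by multiplying with CalcInvIDCG of the label-sorted list's DCG.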

enum class PairMethod : std::int32_t {
  kTopK = 0,
  kMean = 1,
};
}  // namespace xgboost::ltr

DECLARE_FIELD_ENUM_CLASS(xgboost::ltr::PairMethod);

namespace xgboost::ltr {
struct LambdaRankParam : public XGBoostParameter<LambdaRankParam> {
 private:
  static constexpr position_t DefaultK() { return 32; }
  static constexpr position_t DefaultSamplePairs() { return 1; }

 protected:
  // pairs
  // should be accessed by getter for auto configuration.
  // nolint so that we can keep the string name.
  PairMethod lambdarank_pair_method{PairMethod::kTopK};  // NOLINT
  std::size_t lambdarank_num_pair_per_sample{NotSet()};  // NOLINT

 public:
  static constexpr position_t NotSet() { return std::numeric_limits<position_t>::max(); }

  // unbiased
  bool lambdarank_unbiased{false};
  double lambdarank_bias_norm{1.0};
  // ndcg
  bool ndcg_exp_gain{true};

  bool operator==(LambdaRankParam const& that) const {
    return lambdarank_pair_method == that.lambdarank_pair_method &&
           lambdarank_num_pair_per_sample == that.lambdarank_num_pair_per_sample &&
           lambdarank_unbiased == that.lambdarank_unbiased &&
           lambdarank_bias_norm == that.lambdarank_bias_norm && ndcg_exp_gain == that.ndcg_exp_gain;
  }
  bool operator!=(LambdaRankParam const& that) const { return !(*this == that); }

  [[nodiscard]] double Regularizer() const { return 1.0 / (1.0 + this->lambdarank_bias_norm); }

  /**
   * \brief Get number of pairs for each sample.
   */
  [[nodiscard]] position_t NumPair() const {
    if (lambdarank_num_pair_per_sample == NotSet()) {
      switch (lambdarank_pair_method) {
        case PairMethod::kMean:
          return DefaultSamplePairs();
        case PairMethod::kTopK:
          return DefaultK();
      }
    } else {
      return lambdarank_num_pair_per_sample;
    }
    LOG(FATAL) << "Unreachable.";
    return 0;
  }
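
  // Illustrative behavior (not part of the source):
  //
  //   LambdaRankParam p;  // lambdarank_pair_method defaults to kTopK
  //   p.NumPair();        // DefaultK() == 32
  //   // with lambdarank_pair_method == kMean it would be DefaultSamplePairs() == 1;
  //   // an explicitly set lambdarank_num_pair_per_sample always takes precedence.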

  [[nodiscard]] bool HasTruncation() const { return lambdarank_pair_method == PairMethod::kTopK; }

  // Used for evaluation metric and cache initialization, iterate through top-k or the whole list
  [[nodiscard]] auto TopK() const {
    if (HasTruncation()) {
      return NumPair();
    } else {
      return NotSet();
    }
  }

  DMLC_DECLARE_PARAMETER(LambdaRankParam) {
    DMLC_DECLARE_FIELD(lambdarank_pair_method)
        .set_default(PairMethod::kTopK)
        .add_enum("mean", PairMethod::kMean)
        .add_enum("topk", PairMethod::kTopK)
        .describe("Method for constructing pairs.");
    DMLC_DECLARE_FIELD(lambdarank_num_pair_per_sample)
        .set_default(NotSet())
        .set_lower_bound(1)
        .describe("Number of pairs for each sample in the list.");
    DMLC_DECLARE_FIELD(lambdarank_unbiased)
        .set_default(false)
        .describe("Unbiased lambda mart. Use extended IPW to debias click position.");
    DMLC_DECLARE_FIELD(lambdarank_bias_norm)
        .set_default(1.0)
        .set_lower_bound(0.0)
        .describe("Lp regularization for unbiased lambdarank.");
    DMLC_DECLARE_FIELD(ndcg_exp_gain)
        .set_default(true)
        .describe("When set to true, the label gain is 2^rel - 1, otherwise it's rel.");
  }
};
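
// A minimal configuration sketch (assuming the usual dmlc parameter flow; `Args` is the
// vector of string pairs that XGBoostParameter accepts):
//
//   LambdaRankParam param;
//   param.UpdateAllowUnknown(Args{{"lambdarank_pair_method", "mean"},
//                                 {"lambdarank_num_pair_per_sample", "4"}});
//   CHECK_EQ(param.NumPair(), 4);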

/**
 * \brief Common cached items for ranking tasks.
 */
class RankingCache {
 private:
  void InitOnCPU(Context const* ctx, MetaInfo const& info);
  void InitOnCUDA(Context const* ctx, MetaInfo const& info);
  // Cached parameter
  LambdaRankParam param_;
  // offset to data groups.
  HostDeviceVector<bst_group_t> group_ptr_;
  // store the sorted index of prediction.
  HostDeviceVector<std::size_t> sorted_idx_cache_;
  // Maximum size of group
  std::size_t max_group_size_{0};
  // Normalization for weight
  double weight_norm_{1.0};
  /**
   * CUDA cache
   */
  // offset to threads assigned to each group for gradient calculation
  HostDeviceVector<std::size_t> threads_group_ptr_;
  // Sorted index of label for finding buckets.
  HostDeviceVector<std::size_t> y_sorted_idx_cache_;
  // Cached labels sorted by the model
  HostDeviceVector<float> y_ranked_by_model_;
  // store rounding factor for objective for each group
  linalg::Vector<GradientPair> roundings_;
  // rounding factor for cost
  HostDeviceVector<double> cost_rounding_;
  // temporary storage for creating rounding factors. Stored as bytes to avoid having
  // CUDA data structures in here.
  HostDeviceVector<std::uint8_t> max_lambdas_;
  // total number of CUDA threads used for gradient calculation
  std::size_t n_cuda_threads_{0};

  // Create model rank list on GPU.
  common::Span<std::size_t const> MakeRankOnCUDA(Context const* ctx,
                                                 common::Span<float const> predt);
  // Create model rank list on CPU.
  common::Span<std::size_t const> MakeRankOnCPU(Context const* ctx,
                                                common::Span<float const> predt);

 protected:
  [[nodiscard]] std::size_t MaxGroupSize() const { return max_group_size_; }

 public:
  RankingCache(Context const* ctx, MetaInfo const& info, LambdaRankParam const& p) : param_{p} {
    CHECK(param_.GetInitialised());
    if (!info.group_ptr_.empty()) {
      CHECK_EQ(info.group_ptr_.back(), info.labels.Size())
          << error::GroupSize() << "the size of label.";
    }
    if (ctx->IsCPU()) {
      this->InitOnCPU(ctx, info);
    } else {
      this->InitOnCUDA(ctx, info);
    }
    if (!info.weights_.Empty()) {
      CHECK_EQ(Groups(), info.weights_.Size()) << error::GroupWeight();
    }
  }
  [[nodiscard]] std::size_t MaxPositionSize() const {
    // Use truncation level as the bound.
    if (param_.HasTruncation()) {
      return param_.NumPair();
    }
    // Hardcoded maximum number of positions to track; we don't need too many of them as
    // the bias decreases exponentially.
    return std::min(max_group_size_, static_cast<std::size_t>(32));
  }
  // Constructed as [1, n_samples] if group ptr is not supplied by the user.
  common::Span<bst_group_t const> DataGroupPtr(Context const* ctx) const {
    group_ptr_.SetDevice(ctx->gpu_id);
    return ctx->IsCPU() ? group_ptr_.ConstHostSpan() : group_ptr_.ConstDeviceSpan();
  }

  [[nodiscard]] auto const& Param() const { return param_; }
  [[nodiscard]] std::size_t Groups() const { return group_ptr_.Size() - 1; }
  [[nodiscard]] double WeightNorm() const { return weight_norm_; }

  // Create a rank list by model prediction.
  common::Span<std::size_t const> SortedIdx(Context const* ctx, common::Span<float const> predt) {
    if (sorted_idx_cache_.Empty()) {
      sorted_idx_cache_.SetDevice(ctx->gpu_id);
      sorted_idx_cache_.Resize(predt.size());
    }
    if (ctx->IsCPU()) {
      return this->MakeRankOnCPU(ctx, predt);
    } else {
      return this->MakeRankOnCUDA(ctx, predt);
    }
  }
  // The function simply returns an uninitialized buffer, as this is only used by the
  // objective for creating pairs.
  common::Span<std::size_t> SortedIdxY(Context const* ctx, std::size_t n_samples) {
    CHECK(ctx->IsCUDA()) << error::InvalidCUDAOrdinal();
    if (y_sorted_idx_cache_.Empty()) {
      y_sorted_idx_cache_.SetDevice(ctx->gpu_id);
      y_sorted_idx_cache_.Resize(n_samples);
    }
    return y_sorted_idx_cache_.DeviceSpan();
  }
  common::Span<float> RankedY(Context const* ctx, std::size_t n_samples) {
    CHECK(ctx->IsCUDA()) << error::InvalidCUDAOrdinal();
    if (y_ranked_by_model_.Empty()) {
      y_ranked_by_model_.SetDevice(ctx->gpu_id);
      y_ranked_by_model_.Resize(n_samples);
    }
    return y_ranked_by_model_.DeviceSpan();
  }

  // CUDA cache getters. The cache is shared between metric and objective; some of these
  // fields are lazily initialized to avoid unnecessary allocation.
  [[nodiscard]] common::Span<std::size_t const> CUDAThreadsGroupPtr() const {
    CHECK(!threads_group_ptr_.Empty());
    return threads_group_ptr_.ConstDeviceSpan();
  }
  [[nodiscard]] std::size_t CUDAThreads() const { return n_cuda_threads_; }

  linalg::VectorView<GradientPair> CUDARounding(Context const* ctx) {
    if (roundings_.Size() == 0) {
      roundings_.SetDevice(ctx->gpu_id);
      roundings_.Reshape(Groups());
    }
    return roundings_.View(ctx->gpu_id);
  }
  common::Span<double> CUDACostRounding(Context const* ctx) {
    if (cost_rounding_.Size() == 0) {
      cost_rounding_.SetDevice(ctx->gpu_id);
      cost_rounding_.Resize(1);
    }
    return cost_rounding_.DeviceSpan();
  }
  template <typename Type>
  common::Span<Type> MaxLambdas(Context const* ctx, std::size_t n) {
    max_lambdas_.SetDevice(ctx->gpu_id);
    std::size_t bytes = n * sizeof(Type);
    if (bytes != max_lambdas_.Size()) {
      max_lambdas_.Resize(bytes);
    }
    return common::Span<Type>{reinterpret_cast<Type*>(max_lambdas_.DevicePointer()), n};
  }
};
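
// A rough usage sketch (illustrative only; `ctx`, `info`, and `predt` are assumed to be
// a valid Context, a MetaInfo with ranking labels, and a span of model predictions):
//
//   ltr::LambdaRankParam param;
//   param.UpdateAllowUnknown(Args{});
//   ltr::RankingCache cache{ctx, info, param};
//   auto ranks = cache.SortedIdx(ctx, predt);  // per-group argsort of predictions
//   auto groups = cache.DataGroupPtr(ctx);     // CSR-style group boundaries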

class NDCGCache : public RankingCache {
  // NDCG discount
  HostDeviceVector<double> discounts_;
  // 1.0 / IDCG
  linalg::Vector<double> inv_idcg_;
  /**
   * CUDA cache
   */
  // store the intermediate DCG calculation result for metric
  linalg::Vector<double> dcg_;

 public:
  void InitOnCPU(Context const* ctx, MetaInfo const& info);
  void InitOnCUDA(Context const* ctx, MetaInfo const& info);

  NDCGCache(Context const* ctx, MetaInfo const& info, LambdaRankParam const& p)
      : RankingCache{ctx, info, p} {
    if (ctx->IsCPU()) {
      this->InitOnCPU(ctx, info);
    } else {
      this->InitOnCUDA(ctx, info);
    }
  }

  linalg::VectorView<double const> InvIDCG(Context const* ctx) const {
    return inv_idcg_.View(ctx->gpu_id);
  }
  common::Span<double const> Discount(Context const* ctx) const {
    return ctx->IsCPU() ? discounts_.ConstHostSpan() : discounts_.ConstDeviceSpan();
  }
  linalg::VectorView<double> Dcg(Context const* ctx) {
    if (dcg_.Size() == 0) {
      dcg_.SetDevice(ctx->gpu_id);
      dcg_.Reshape(this->Groups());
    }
    return dcg_.View(ctx->gpu_id);
  }
};
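
// For reference, the cached quantities combine as the standard NDCG definition:
//
//   DCG@k  = sum_{i=0}^{k-1} CalcDCGGain(rel_i) * CalcDCGDiscount(i)
//   NDCG@k = DCG@k * CalcInvIDCG(IDCG@k)
//
// where IDCG@k is the DCG of the list sorted by label, so NDCG is 1 for a perfect
// ranking and 0 when the group contains no relevant document.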

/**
 * \brief Validate label for NDCG.
 *
 * \tparam NoneOf An implementation of std::none_of, passed in as a parameter so the same
 *                check can run on both CPU and GPU.
 */
template <typename NoneOf>
void CheckNDCGLabels(ltr::LambdaRankParam const& p, linalg::VectorView<float const> labels,
                     NoneOf none_of) {
  auto d_labels = labels.Values();
  if (p.ndcg_exp_gain) {
    auto label_is_integer =
        none_of(d_labels.data(), d_labels.data() + d_labels.size(), [] XGBOOST_DEVICE(float v) {
          auto l = std::floor(v);
          return std::fabs(l - v) > kRtEps || v < 0.0f;
        });
    CHECK(label_is_integer)
        << "When using relevance degree as target, the label must be a non-negative integer.";
    auto label_is_valid = none_of(d_labels.data(), d_labels.data() + d_labels.size(),
                                  [] XGBOOST_DEVICE(ltr::rel_degree_t v) { return v > MaxRel(); });
    CHECK(label_is_valid) << "Relevance degree must be less than or equal to " << MaxRel()
                          << " when the exponential NDCG gain function is used. "
                          << "Set `ndcg_exp_gain` to false to use a custom DCG gain.";
  }
}
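
// A minimal CPU-side invocation sketch (illustrative; `param` and a host view of the
// labels are assumed to be in scope). The callable forwards to std::none_of, while a
// GPU caller would pass a thrust-based equivalent:
//
//   CheckNDCGLabels(param, labels_host_view, [](auto first, auto last, auto op) {
//     return std::none_of(first, last, op);
//   });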

template <typename AllOf>
bool IsBinaryRel(linalg::VectorView<float const> label, AllOf all_of) {
  auto s_label = label.Values();
  return all_of(s_label.data(), s_label.data() + s_label.size(), [] XGBOOST_DEVICE(float y) {
    return std::abs(y - 1.0f) < kRtEps || std::abs(y - 0.0f) < kRtEps;
  });
}

/**
 * \brief Validate label for precision-based metric.
 *
 * \tparam AllOf An implementation of std::all_of, passed in as a parameter so the same
 *               check can run on both CPU and GPU.
 */
template <typename AllOf>
void CheckPreLabels(StringView name, linalg::VectorView<float const> label, AllOf all_of) {
  auto is_binary = IsBinaryRel(label, all_of);
  CHECK(is_binary) << name << " can only be used with binary labels.";
}

class PreCache : public RankingCache {
  HostDeviceVector<double> pre_;

  void InitOnCPU(Context const* ctx, MetaInfo const& info);
  void InitOnCUDA(Context const* ctx, MetaInfo const& info);

 public:
  PreCache(Context const* ctx, MetaInfo const& info, LambdaRankParam const& p)
      : RankingCache{ctx, info, p} {
    if (ctx->IsCPU()) {
      this->InitOnCPU(ctx, info);
    } else {
      this->InitOnCUDA(ctx, info);
    }
  }

  common::Span<double> Pre(Context const* ctx) {
    if (pre_.Empty()) {
      pre_.SetDevice(ctx->gpu_id);
      pre_.Resize(this->Groups());
    }
    return ctx->IsCPU() ? pre_.HostSpan() : pre_.DeviceSpan();
  }
};

class MAPCache : public RankingCache {
  // Total number of relevant documents for each group
  HostDeviceVector<double> n_rel_;
  // \sum l_k/k
  HostDeviceVector<double> acc_;
  HostDeviceVector<double> map_;
  // Number of samples in this dataset.
  std::size_t n_samples_{0};

  void InitOnCPU(Context const* ctx, MetaInfo const& info);
  void InitOnCUDA(Context const* ctx, MetaInfo const& info);

 public:
  MAPCache(Context const* ctx, MetaInfo const& info, LambdaRankParam const& p)
      : RankingCache{ctx, info, p}, n_samples_{static_cast<std::size_t>(info.num_row_)} {
    if (ctx->IsCPU()) {
      this->InitOnCPU(ctx, info);
    } else {
      this->InitOnCUDA(ctx, info);
    }
  }

  common::Span<double> NumRelevant(Context const* ctx) {
    if (n_rel_.Empty()) {
      n_rel_.SetDevice(ctx->gpu_id);
      n_rel_.Resize(n_samples_);
    }
    return ctx->IsCPU() ? n_rel_.HostSpan() : n_rel_.DeviceSpan();
  }
  common::Span<double> Acc(Context const* ctx) {
    if (acc_.Empty()) {
      acc_.SetDevice(ctx->gpu_id);
      acc_.Resize(n_samples_);
    }
    return ctx->IsCPU() ? acc_.HostSpan() : acc_.DeviceSpan();
  }
  common::Span<double> Map(Context const* ctx) {
    if (map_.Empty()) {
      map_.SetDevice(ctx->gpu_id);
      map_.Resize(this->Groups());
    }
    return ctx->IsCPU() ? map_.HostSpan() : map_.DeviceSpan();
  }
};
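
// For reference, with binary labels l_k at (1-based) rank k within a group, the cached
// terms combine as the usual average precision:
//
//   AP = (1 / n_rel) * sum_k l_k * (sum_{j<=k} l_j) / k
//
// and MAP is the mean of AP over query groups. This note is editorial; the actual
// computation lives in the objective and metric implementations.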

/**
 * \brief Parse name for ranking metric given parameters.
 *
 * \param [in]  name  The metric name, e.g. `ndcg`.
 * \param [in]  param The parameter string, e.g. the `3-` in `ndcg@3-`.
 * \param [out] topn  Top-n documents parsed from `param`; unchanged if not specified.
 * \param [out] minus Whether the metric should be negated; unchanged if not specified.
 *
 * \return The full name of the metric.
 */
std::string ParseMetricName(StringView name, StringView param, position_t* topn, bool* minus);

/**
 * \brief Make a metric name from the components accepted by `ParseMetricName`.
 */
std::string MakeMetricName(StringView name, position_t topn, bool minus);
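
// A hedged usage sketch: for the metric string `ndcg@3-`, the expected split is
// name = "ndcg" and param = "3-", yielding topn == 3 and minus == true; the returned
// name should round-trip through MakeMetricName:
//
//   ltr::position_t topn{0};
//   bool minus{false};
//   auto full = ltr::ParseMetricName("ndcg", "3-", &topn, &minus);
//   // topn == 3, minus == true, full == MakeMetricName("ndcg", topn, minus)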
}  // namespace xgboost::ltr
#endif  // XGBOOST_COMMON_RANKING_UTILS_H_
Get number of pairs for each sample.
Definition ranking_utils.h:98