Medial Code Documentation
linalg_op.h
/**
 * Copyright 2021-2023 by XGBoost Contributors.
 */
#ifndef XGBOOST_COMMON_LINALG_OP_H_
#define XGBOOST_COMMON_LINALG_OP_H_
#include <cstdint>  // std::int32_t
#include <type_traits>

#include "common.h"
#include "threading_utils.h"
#include "transform_iterator.h"  // MakeIndexTransformIter
#include "xgboost/context.h"     // Context
#include "xgboost/linalg.h"

namespace xgboost {
namespace linalg {
// Applies fn(i, v) to every element of the view on the host and writes the result back.
// Contiguous views take the direct pointer path; strided views are addressed through
// UnravelIndex.
template <typename T, int32_t D, typename Fn>
void ElementWiseTransformHost(linalg::TensorView<T, D> t, int32_t n_threads, Fn&& fn) {
  if (t.Contiguous()) {
    auto ptr = t.Values().data();
    common::ParallelFor(t.Size(), n_threads, [&](size_t i) { ptr[i] = fn(i, ptr[i]); });
  } else {
    common::ParallelFor(t.Size(), n_threads, [&](size_t i) {
      auto& v = detail::Apply(t, linalg::UnravelIndex(i, t.Shape()));
      v = fn(i, v);
    });
  }
}

// Invokes fn(i, v) for its side effects only; the functor must return void.
template <typename T, int32_t D, typename Fn>
void ElementWiseKernelHost(linalg::TensorView<T, D> t, int32_t n_threads, Fn&& fn) {
  static_assert(std::is_void<std::result_of_t<Fn(size_t, T&)>>::value,
                "For function with return, use transform instead.");
  if (t.Contiguous()) {
    auto ptr = t.Values().data();
    common::ParallelFor(t.Size(), n_threads, [&](size_t i) { fn(i, ptr[i]); });
  } else {
    common::ParallelFor(t.Size(), n_threads, [&](size_t i) {
      auto& v = detail::Apply(t, linalg::UnravelIndex(i, t.Shape()));
      fn(i, v);
    });
  }
}

#if !defined(XGBOOST_USE_CUDA)
// In CPU-only builds the device variants are stubs that report missing GPU support.
template <typename T, int32_t D, typename Fn>
void ElementWiseKernelDevice(linalg::TensorView<T, D>, Fn&&, void* = nullptr) {
  common::AssertGPUSupport();
}

template <typename T, int32_t D, typename Fn>
void ElementWiseTransformDevice(linalg::TensorView<T, D>, Fn&&, void* = nullptr) {
  common::AssertGPUSupport();
}

template <typename T, int32_t D, typename Fn>
void ElementWiseKernel(Context const* ctx, linalg::TensorView<T, D> t, Fn&& fn) {
  if (!ctx->IsCPU()) {
    common::AssertGPUSupport();
  }
  ElementWiseKernelHost(t, ctx->Threads(), fn);
}
#endif  // !defined(XGBOOST_USE_CUDA)

// Index-transform iterators that expose a TensorView to standard algorithms,
// including views that are not contiguous in memory.
template <typename T, std::int32_t kDim>
auto cbegin(TensorView<T, kDim> const& v) {  // NOLINT
  auto it = common::MakeIndexTransformIter([&](size_t i) -> std::remove_cv_t<T> const& {
    return linalg::detail::Apply(v, linalg::UnravelIndex(i, v.Shape()));
  });
  return it;
}

template <typename T, std::int32_t kDim>
auto cend(TensorView<T, kDim> const& v) {  // NOLINT
  return cbegin(v) + v.Size();
}

template <typename T, std::int32_t kDim>
auto begin(TensorView<T, kDim>& v) {  // NOLINT
  auto it = common::MakeIndexTransformIter(
      [&](size_t i) -> T& { return linalg::detail::Apply(v, linalg::UnravelIndex(i, v.Shape())); });
  return it;
}

template <typename T, std::int32_t kDim>
auto end(TensorView<T, kDim>& v) {  // NOLINT
  return begin(v) + v.Size();
}
}  // namespace linalg
}  // namespace xgboost
#endif  // XGBOOST_COMMON_LINALG_OP_H_
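
A minimal usage sketch of the host helpers and iterator adapters defined above (not part of the header). It assumes the caller already holds a writable host TensorView<float, 2>, for instance one obtained from a linalg::Tensor, and that the include paths match XGBoost's source layout; FillScaleSum is a hypothetical helper written only for illustration.

#include <cstddef>  // std::size_t
#include <numeric>  // std::accumulate

#include "common/linalg_op.h"  // this header (path assumed relative to src/)
#include "xgboost/context.h"   // xgboost::Context
#include "xgboost/linalg.h"    // xgboost::linalg::TensorView

namespace xgboost {
// Fill `view` with ones, scale each element by its linear index, then sum it.
float FillScaleSum(Context const& ctx, linalg::TensorView<float, 2> view) {
  // The functor returns void, so ElementWiseKernelHost is the right helper.
  linalg::ElementWiseKernelHost(view, ctx.Threads(),
                                [](std::size_t, float& v) { v = 1.0f; });
  // The functor returns a value, so ElementWiseTransformHost writes it back.
  linalg::ElementWiseTransformHost(view, ctx.Threads(), [](std::size_t i, float v) {
    return v * static_cast<float>(i);
  });
  // cbegin/cend let standard algorithms walk the view, contiguous or not.
  return std::accumulate(linalg::cbegin(view), linalg::cend(view), 0.0f);
}
}  // namespace xgboost

The split mirrors the static_assert in the header: a void-returning functor goes to ElementWiseKernelHost, while a value-returning functor goes to ElementWiseTransformHost.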
Referenced symbols:
UnravelIndex: LINALG_HD auto UnravelIndex(size_t idx, common::Span<size_t const, D> shape). Turns a linear index into a multi-dimensional index. Definition: linalg.h, line 613.
xgboost: namespace of xgboost. Definition: base.h, line 90.
Context::Threads: std::int32_t Threads() const. Returns the automatically chosen number of threads based on the nthread parameter and the system setting. Definition: context.cc, line 203.
Context::IsCPU: bool IsCPU() const. Is XGBoost running on CPU? Definition: context.h, line 133.
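
For intuition about the UnravelIndex call that the strided branches rely on, here is a standalone sketch of row-major unraveling. It is written for illustration only (UnravelRowMajor is not an XGBoost function) and assumes the row-major layout that TensorView uses by default.

#include <array>
#include <cstddef>

// Convert a linear index into per-dimension coordinates for a row-major shape,
// mirroring what linalg::UnravelIndex provides (this is not the library implementation).
template <std::size_t D>
std::array<std::size_t, D> UnravelRowMajor(std::size_t idx, std::array<std::size_t, D> shape) {
  std::array<std::size_t, D> out{};
  for (std::size_t d = D; d-- > 0;) {
    out[d] = idx % shape[d];  // coordinate along dimension d
    idx /= shape[d];
  }
  return out;
}
// Example: UnravelRowMajor<2>(5, {2, 3}) yields {1, 2}, since 5 == 1 * 3 + 2.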