MR_LIBS/strtonum_8h_source.html

#ifndef DMLC_STRTONUM_H_

#define DMLC_STRTONUM_H_


#if DMLC_USE_CXX11

#include <type_traits>

#endif


#include <cerrno>
#include <cstddef>
#include <cstdint>
#include <limits>
#include <stdexcept>
#include <string>

#include "./base.h"

#include "./logging.h"


namespace dmlc {


/*!
 * \brief Inline implementation of isspace(). Tests whether the given character
 *        is one of the whitespace characters recognised by this header.
 * \param c character to test
 * \return true for ' ', '\t', '\r', '\n' and '\f'; false for anything else
 */
inline bool isspace(char c) {
  switch (c) {
    case ' ':
    case '\t':
    case '\r':
    case '\n':
    case '\f':
      return true;
    default:
      return false;
  }
}


/*!
 * \brief Inline implementation of isblank(). Tests whether the given character
 *        is a space or tab character.
 * \param c character to test
 * \return true if c is ' ' or '\t'
 */
inline bool isblank(char c) {
  const bool is_tab = (c == '\t');
  const bool is_space = (c == ' ');
  return is_space || is_tab;
}


/*!
 * \brief Inline implementation of isdigit(). Tests whether the given character
 *        is a decimal digit.
 * \param c character to test
 * \return true if c lies in the range '0'..'9'
 */
inline bool isdigit(char c) {
  // Reject everything outside the closed interval ['0', '9'].
  return !(c < '0' || c > '9');
}


/*!
 * \brief Inline implementation of isalpha(). Tests whether the given character
 *        is an alphabet letter.
 * \param c character to test
 * \return true if c is in 'a'..'z' or 'A'..'Z'
 */
inline bool isalpha(char c) {
  // The range comparisons below rely on letters being contiguous, as in ASCII.
  static_assert(
    static_cast<int>('A') == 65 && static_cast<int>('Z' - 'A') == 25,
    "Only system with ASCII character set is supported");
  const bool is_upper = !(c < 'A' || c > 'Z');
  const bool is_lower = !(c < 'a' || c > 'z');
  return is_lower || is_upper;
}


/*!
 * \brief Tests whether the given character can appear in the textual
 *        representation of a number: a decimal digit, a sign, a decimal point
 *        or an exponent marker.
 * \param c character to test
 * \return true for '0'..'9', '+', '-', '.', 'e' and 'E'
 */
inline bool isdigitchars(char c) {
  if (c >= '0' && c <= '9') {
    return true;
  }
  switch (c) {
    case '+':
    case '-':
    case '.':
    case 'e':
    case 'E':
      return true;
    default:
      return false;
  }
}


/*!
 * \brief Maximum number of digits after the decimal point that ParseFloat()
 *        accumulates; further fractional digits are consumed but ignored.
 */
const int kStrtofMaxDigits = 19;


/*!
 * \brief Common implementation for dmlc::strtof() and dmlc::strtod().
 *
 * Accepted input, in order: optional leading whitespace, an optional '+'/'-'
 * sign, then either a case-insensitive INF / INFINITY / NAN / NAN(char_sequence)
 * literal, or decimal digits with an optional fraction, an optional exponent
 * and an optional 'f'/'F' suffix. Hexadecimal floating-point literals are not
 * handled. The parser does not verify that at least one digit was consumed.
 *
 * \tparam FloatType float or double
 * \tparam CheckRange if true, an exponent outside the representable range sets
 *         errno to ERANGE and returns positive infinity (regardless of the sign
 *         of the input or of the exponent); if false, the exponent and
 *         significand are clipped instead
 * \param nptr pointer to the text to parse; parsing stops at the first
 *        character that cannot be part of the number
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \return the parsed value
 */
template <typename FloatType, bool CheckRange = false>
inline FloatType ParseFloat(const char* nptr, char** endptr) {
#if DMLC_USE_CXX11
  static_assert(std::is_same<FloatType, double>::value
                || std::is_same<FloatType, float>::value,
               "ParseFloat is defined only for 'float' and 'double' types");
  // Largest decimal exponent accepted for FloatType.
  constexpr unsigned kMaxExponent
    = (std::is_same<FloatType, double>::value ? 308U : 38U);
  // Significand limit applied when the exponent is exactly +kMaxExponent.
  constexpr FloatType kMaxSignificandForMaxExponent
    = static_cast<FloatType>(std::is_same<FloatType, double>::value
                             ? 1.79769313486231570 : 3.402823466);
  // Significand limit applied when the exponent is exactly -kMaxExponent.
  constexpr FloatType kMaxSignificandForNegMaxExponent
    = static_cast<FloatType>(std::is_same<FloatType, double>::value
                             ? 2.22507385850720139 : 1.175494351);
#else
  const unsigned kMaxExponent
    = (sizeof(FloatType) == sizeof(double) ? 308U : 38U);
  const FloatType kMaxSignificandForMaxExponent
    = static_cast<FloatType>(sizeof(FloatType) == sizeof(double)
                             ? 1.79769313486231570 : 3.402823466);
  const FloatType kMaxSignificandForNegMaxExponent
    = static_cast<FloatType>(sizeof(FloatType) == sizeof(double)
                             ? 2.22507385850720139 : 1.175494351);
#endif

  const char *p = nptr;
  // Skip leading white space, if any.
  while (isspace(*p)) ++p;

  // Get sign, if any. `sign == true` means non-negative.
  bool sign = true;
  if (*p == '-') {
    sign = false;
    ++p;
  } else if (*p == '+') {
    ++p;
  }

  // Handle INF and NAN
  {
    int i = 0;
    // Case-insensitive match for INF and INFINITY: OR-ing with 32 maps an
    // upper-case ASCII letter onto its lower-case counterpart.
    while (i < 8 && static_cast<char>((*p) | 32) == "infinity"[i]) {
      ++i;
      ++p;
    }
    if (i == 3 || i == 8) {
      if (endptr) *endptr = const_cast<char*>(p);
      return sign ?  std::numeric_limits<FloatType>::infinity()
                  : -std::numeric_limits<FloatType>::infinity();
    } else {
      p -= i;  // partial match only: rewind
    }

    // Case-insensitive match for NAN
    i = 0;
    while (i < 3 && static_cast<char>((*p) | 32) == "nan"[i]) {
      ++i;
      ++p;
    }
    if (i == 3) {
      // Got NAN; check if the value is of form NAN(char_sequence)
      if (*p == '(') {
        ++p;
        while (isdigit(*p) || isalpha(*p) || *p == '_') ++p;
        CHECK_EQ(*p, ')') << "Invalid NAN literal";
        ++p;
      }
      static_assert(std::numeric_limits<FloatType>::has_quiet_NaN,
        "Only system with quiet NaN is supported");
      if (endptr) *endptr = const_cast<char*>(p);
      return std::numeric_limits<FloatType>::quiet_NaN();
    } else {
      p -= i;  // partial match only: rewind
    }
  }

  // Get digits before decimal point or exponent, if any.
  // The digits are accumulated exactly in a 64-bit integer for as long as they
  // fit. Once the next digit would overflow the integer, accumulation
  // continues in floating point so that very long integer parts no longer
  // wrap around to an unrelated value.
  const uint64_t kUint64Max = ~static_cast<uint64_t>(0);
  uint64_t predec = 0;  // digits before the decimal point
  FloatType value = static_cast<FloatType>(0);
  bool predec_overflow = false;
  for (; isdigit(*p); ++p) {
    const uint64_t digit = static_cast<uint64_t>(*p - '0');
    if (!predec_overflow) {
      if (predec > (kUint64Max - digit) / 10ULL) {
        // predec * 10 + digit would not fit: switch to floating point.
        predec_overflow = true;
        value = static_cast<FloatType>(predec);
      } else {
        predec = predec * 10ULL + digit;
        continue;
      }
    }
    value = value * static_cast<FloatType>(10) + static_cast<FloatType>(digit);
  }
  if (!predec_overflow) {
    value = static_cast<FloatType>(predec);
  }

  // Get digits after decimal point, if any.
  if (*p == '.') {
    uint64_t pow10 = 1;
    uint64_t val2 = 0;
    int digit_cnt = 0;
    ++p;
    while (isdigit(*p)) {
      if (digit_cnt < kStrtofMaxDigits) {
        val2 = val2 * 10ULL + static_cast<uint64_t>(*p - '0');
        pow10 *= 10ULL;
      }  // once kStrtofMaxDigits digits are read, ignore the following digits
      ++p;
      ++digit_cnt;
    }
    value += static_cast<FloatType>(
        static_cast<double>(val2) / static_cast<double>(pow10));
  }

  // Handle exponent, if any.
  if ((*p == 'e') || (*p == 'E')) {
    ++p;
    bool frac = false;  // true when the exponent is negative
    FloatType scale = static_cast<FloatType>(1.0f);
    unsigned expon;
    // Get sign of exponent, if any.
    if (*p == '-') {
      frac = true;
      ++p;
    } else if (*p == '+') {
      ++p;
    }
    // Get digits of exponent, if any. Accumulation stops as soon as the value
    // exceeds kMaxExponent (every such value is handled identically below), so
    // an arbitrarily long exponent cannot wrap around `unsigned`.
    for (expon = 0; isdigit(*p); ++p) {
      if (expon <= kMaxExponent) {
        expon = expon * 10U + static_cast<unsigned>(*p - '0');
      }
    }
    if (expon > kMaxExponent) {  // out of range, clip or raise error
      if (CheckRange) {
        errno = ERANGE;
        if (endptr) *endptr = const_cast<char*>(p);
        return std::numeric_limits<FloatType>::infinity();
      } else {
        expon = kMaxExponent;
      }
    }
    // handle edge case where exponent is exactly kMaxExponent
    if (expon == kMaxExponent
        && ((!frac && value > kMaxSignificandForMaxExponent)
           || (frac && value < kMaxSignificandForNegMaxExponent))) {
      if (CheckRange) {
        errno = ERANGE;
        if (endptr) *endptr = const_cast<char*>(p);
        return std::numeric_limits<FloatType>::infinity();
      } else {
        value = (frac ? kMaxSignificandForNegMaxExponent
                 : kMaxSignificandForMaxExponent);
      }
    }
    // Calculate scaling factor.
    while (expon >= 8U) { scale *= static_cast<FloatType>(1E8f);  expon -= 8U; }
    while (expon >  0U) { scale *= static_cast<FloatType>(10.0f); expon -= 1U; }
    // Apply the scaling factor.
    value = frac ? (value / scale) : (value * scale);
  }
  // Consume 'f' suffix, if any
  if (*p == 'f' || *p == 'F') {
    ++p;
  }

  if (endptr) *endptr = const_cast<char*>(p);
  return sign ? value : - value;
}


/*!
 * \brief A faster implementation of strtof(). Forwards to ParseFloat<float>
 *        with range checking disabled.
 * \param nptr pointer to the text to parse
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \return the parsed single-precision value
 */
inline float strtof(const char* nptr, char** endptr) {
  const float parsed = ParseFloat<float, false>(nptr, endptr);
  return parsed;
}


/*!
 * \brief A faster implementation of strtof() with range checking. Forwards to
 *        ParseFloat<float, true>, which sets errno to ERANGE and returns
 *        infinity when the exponent is out of range.
 * \param nptr pointer to the text to parse
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \return the parsed single-precision value
 */
inline float strtof_check_range(const char* nptr, char** endptr) {
  const float parsed = ParseFloat<float, true>(nptr, endptr);
  return parsed;
}


/*!
 * \brief A faster implementation of strtod(). Forwards to ParseFloat<double>
 *        with range checking disabled.
 * \param nptr pointer to the text to parse
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \return the parsed double-precision value
 */
inline double strtod(const char* nptr, char** endptr) {
  const double parsed = ParseFloat<double, false>(nptr, endptr);
  return parsed;
}


/*!
 * \brief A faster implementation of strtod() with range checking. Forwards to
 *        ParseFloat<double, true>, which sets errno to ERANGE and returns
 *        infinity when the exponent is out of range.
 * \param nptr pointer to the text to parse
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \return the parsed double-precision value
 */
inline double strtod_check_range(const char* nptr, char** endptr) {
  const double parsed = ParseFloat<double, true>(nptr, endptr);
  return parsed;
}


/*!
 * \brief A fast string-to-integer converter, for signed integers.
 *
 * Skips leading whitespace, reads an optional '+'/'-' sign and then consumes
 * digits that are valid in the requested base. Parsing stops at the first
 * character that is not a digit of that base (for example '9' in base 8).
 *
 * The magnitude is accumulated in unsigned 64-bit arithmetic, so the most
 * negative value of SignedIntType parses correctly and out-of-range input
 * wraps around instead of triggering signed-overflow undefined behaviour.
 * SignedIntType is assumed to be at most 64 bits wide.
 *
 * \tparam SignedIntType signed integral type of the result
 * \param nptr pointer to the text to parse
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \param base numeric base; must be in the range [2, 10] (enforced by CHECK)
 * \return the parsed value
 */
template <typename SignedIntType>
inline SignedIntType ParseSignedInt(const char* nptr, char** endptr, int base) {
// Use the same guard form as the one around #include <type_traits>.
#if DMLC_USE_CXX11
  static_assert(std::is_signed<SignedIntType>::value
                && std::is_integral<SignedIntType>::value,
                "ParseSignedInt is defined for signed integers only");
#endif
  CHECK(base <= 10 && base >= 2);
  const char* p = nptr;
  // Skip leading white space, if any.
  while (isspace(*p)) ++p;

  // Get sign if any. `sign == true` means non-negative.
  bool sign = true;
  if (*p == '-') {
    sign = false;
    ++p;
  } else if (*p == '+') {
    ++p;
  }

  const uint64_t base_val = static_cast<uint64_t>(base);
  uint64_t magnitude = 0;
  for (; isdigit(*p); ++p) {
    const uint64_t digit = static_cast<uint64_t>(*p - '0');
    if (digit >= base_val) break;  // not a digit of this base
    magnitude = magnitude * base_val + digit;
  }

  if (endptr) *endptr = const_cast<char*>(p);
  // Negate in unsigned arithmetic (well defined), then narrow to the result type.
  const uint64_t signed_bits
    = sign ? magnitude : (static_cast<uint64_t>(0) - magnitude);
  return static_cast<SignedIntType>(signed_bits);
}


/*!
 * \brief A fast string-to-integer converter, for unsigned integers.
 *
 * Skips leading whitespace, reads an optional '+' sign and then consumes
 * digits that are valid in the requested base. Parsing stops at the first
 * character that is not a digit of that base (for example '9' in base 8).
 * A leading '-' is rejected by CHECK_EQ. Values too large for UnsignedIntType
 * wrap around.
 *
 * \tparam UnsignedIntType unsigned integral type of the result
 * \param nptr pointer to the text to parse
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \param base numeric base; must be in the range [2, 10] (enforced by CHECK)
 * \return the parsed value
 */
template <typename UnsignedIntType>
inline UnsignedIntType ParseUnsignedInt(const char* nptr, char** endptr, int base) {
// Use the same guard form as the one around #include <type_traits>.
#if DMLC_USE_CXX11
  static_assert(std::is_unsigned<UnsignedIntType>::value
                && std::is_integral<UnsignedIntType>::value,
                "ParseUnsignedInt is defined for unsigned integers only");
#endif
  CHECK(base <= 10 && base >= 2);
  const char *p = nptr;
  // Skip leading white space, if any.
  while (isspace(*p)) ++p;

  // Get sign if any
  bool sign = true;
  if (*p == '-') {
    sign = false;
    ++p;
  } else if (*p == '+') {
    ++p;
  }

  // we are parsing unsigned, so no minus sign should be found
  CHECK_EQ(sign, true);

  UnsignedIntType value;
  const UnsignedIntType base_val = static_cast<UnsignedIntType>(base);
  for (value = 0; isdigit(*p); ++p) {
    const int digit = *p - '0';
    if (digit >= base) break;  // not a digit of this base
    value = value * base_val + static_cast<UnsignedIntType>(digit);
  }

  if (endptr) *endptr = const_cast<char*>(p);
  return value;
}


/*!
 * \brief A faster implementation of strtoull(). Forwards to
 *        ParseUnsignedInt<uint64_t>.
 * \param nptr pointer to the text to parse
 * \param endptr if non-null, receives a pointer to the first unparsed character
 * \param base numeric base passed through to ParseUnsignedInt
 * \return the parsed unsigned 64-bit value
 */
inline uint64_t strtoull(const char* nptr, char **endptr, int base) {
  const uint64_t parsed = ParseUnsignedInt<uint64_t>(nptr, endptr, base);
  return parsed;
}


/*!
 * \brief A faster implementation of atol(). Parses a base-10 signed integer
 *        via ParseSignedInt<long>; the end position is not reported.
 * \param p pointer to the text to parse
 * \return the parsed value
 */
inline long atol(const char* p) {  // NOLINT(*)
  char** const no_endptr = nullptr;
  return ParseSignedInt<long>(p, no_endptr, 10);  // NOLINT(*)
}


/*!
 * \brief A faster implementation of atof(). Unlike std::atof(), this function
 *        returns float. Forwards to strtof() without requesting the end position.
 * \param nptr pointer to the text to parse
 * \return the parsed single-precision value
 */
inline float atof(const char* nptr) {
  char** const no_endptr = nullptr;
  return strtof(nptr, no_endptr);
}


/*!
 * \brief A faster implementation of stof(). See documentation of std::stof()
 *        for more information.
 * \param value string to parse
 * \param pos if non-null, receives the number of characters consumed
 * \return the parsed single-precision value
 * \throws std::out_of_range if the parser reports ERANGE and returns infinity
 * \throws std::invalid_argument if the parser did not advance past the start
 *         of the string
 */
inline float stof(const std::string& value, size_t* pos = nullptr) {
  const char* str_source = value.c_str();
  char* endptr = nullptr;
  // Clear errno before parsing so that an ERANGE left behind by an unrelated
  // earlier call cannot turn a legitimate "inf" input into an out_of_range
  // error. The previous value is restored if the parser reports nothing.
  const int saved_errno = errno;
  errno = 0;
  const float parsed_value = dmlc::strtof_check_range(str_source, &endptr);
  if (errno == ERANGE && parsed_value == std::numeric_limits<float>::infinity()) {
    throw std::out_of_range("Out of range value");
  }
  if (errno == 0) {
    errno = saved_errno;
  }
  if (const_cast<const char*>(endptr) == str_source) {
    throw std::invalid_argument("No conversion could be performed");
  }
  if (pos) {
    *pos = static_cast<size_t>(const_cast<const char*>(endptr) - str_source);
  }
  return parsed_value;
}


/*!
 * \brief A faster implementation of stod(). See documentation of std::stod()
 *        for more information.
 * \param value string to parse
 * \param pos if non-null, receives the number of characters consumed
 * \return the parsed double-precision value
 * \throws std::out_of_range if the parser reports ERANGE and returns infinity
 * \throws std::invalid_argument if the parser did not advance past the start
 *         of the string
 */
inline double stod(const std::string& value, size_t* pos = nullptr) {
  const char* str_source = value.c_str();
  char* endptr = nullptr;
  // Clear errno before parsing so that an ERANGE left behind by an unrelated
  // earlier call cannot turn a legitimate "inf" input into an out_of_range
  // error. The previous value is restored if the parser reports nothing.
  const int saved_errno = errno;
  errno = 0;
  const double parsed_value = dmlc::strtod_check_range(str_source, &endptr);
  if (errno == ERANGE && parsed_value == std::numeric_limits<double>::infinity()) {
    throw std::out_of_range("Out of range value");
  }
  if (errno == 0) {
    errno = saved_errno;
  }
  if (const_cast<const char*>(endptr) == str_source) {
    throw std::invalid_argument("No conversion could be performed");
  }
  if (pos) {
    *pos = static_cast<size_t>(const_cast<const char*>(endptr) - str_source);
  }
  return parsed_value;
}


/*!
 * \brief Interface class that defines a single method get() to convert a
 *        string into type T. In this header the generic get() is only
 *        declared; definitions are supplied by the explicit specializations.
 * \tparam T target type of the conversion
 */
template<typename T>


class Str2T {

 public:

  /*!
   * \brief Convert a string into type T
   * \param begin pointer to the beginning of the text to convert
   * \return the converted value
   */
  static inline T get(const char * begin);

};


template<typename T>


inline T Str2Type(const char * begin) {

  return Str2T<T>::get(begin);

}


/*!
 * \brief Template specialization of Str2T<> interface for signed 32-bit integer
 */
template<>
class Str2T<int32_t> {
 public:
  /*!
   * \brief Convert a string into signed 32-bit integer
   * \param begin pointer to the beginning of the text to convert
   * \return value parsed in base 10 by ParseSignedInt
   */
  static inline int32_t get(const char * begin) {
    char** const no_endptr = nullptr;
    return ParseSignedInt<int32_t>(begin, no_endptr, 10);
  }
};


/*!
 * \brief Template specialization of Str2T<> interface for unsigned 32-bit integer
 */
template<>
class Str2T<uint32_t> {
 public:
  /*!
   * \brief Convert a string into unsigned 32-bit integer
   * \param begin pointer to the beginning of the text to convert
   * \return value parsed in base 10 by ParseUnsignedInt
   */
  static inline uint32_t get(const char* begin) {
    char** const no_endptr = nullptr;
    return ParseUnsignedInt<uint32_t>(begin, no_endptr, 10);
  }
};


/*!
 * \brief Template specialization of Str2T<> interface for signed 64-bit integer
 */
template<>
class Str2T<int64_t> {
 public:
  /*!
   * \brief Convert a string into signed 64-bit integer
   * \param begin pointer to the beginning of the text to convert
   * \return value parsed in base 10 by ParseSignedInt
   */
  static inline int64_t get(const char * begin) {
    char** const no_endptr = nullptr;
    return ParseSignedInt<int64_t>(begin, no_endptr, 10);
  }
};


/*!
 * \brief Template specialization of Str2T<> interface for unsigned 64-bit integer
 */
template<>
class Str2T<uint64_t> {
 public:
  /*!
   * \brief Convert a string into unsigned 64-bit integer
   * \param begin pointer to the beginning of the text to convert
   * \return value parsed in base 10 by ParseUnsignedInt
   */
  static inline uint64_t get(const char * begin) {
    char** const no_endptr = nullptr;
    return ParseUnsignedInt<uint64_t>(begin, no_endptr, 10);
  }
};


/*!
 * \brief Template specialization of Str2T<> interface for float type
 */
template<>
class Str2T<float> {
 public:
  /*!
   * \brief Convert a string into float
   * \param begin pointer to the beginning of the text to convert
   * \return value returned by atof() for that text
   */
  static inline float get(const char * begin) {
    const float parsed = atof(begin);
    return parsed;
  }
};


/*!
 * \brief Template specialization of Str2T<> interface for double type
 */
template<>
class Str2T<double> {
 public:
  /*!
   * \brief Convert a string into double
   * \param begin pointer to the beginning of the text to convert
   * \return value returned by strtod() for that text
   */
  static inline double get(const char * begin) {
    char** const no_endptr = nullptr;
    return strtod(begin, no_endptr);
  }
};


/*!
 * \brief Parse colon separated pair v1[:v2]
 *
 * Scans [begin, end) for the first run of numeric characters (see
 * isdigitchars()) and converts it into v1. If, after optional blanks, a ':'
 * follows, the next run of numeric characters is converted into v2.
 * The conversions themselves start at the located position and are performed
 * by Str2Type(), which is not given the `end` bound.
 *
 * \param begin pointer to the beginning of the range to parse
 * \param end pointer to one past the end of the range to parse
 * \param endptr receives the position where scanning stopped
 * \param v1 receives the first value, when one is found
 * \param v2 receives the second value, when a ':' follows the first value
 * \tparam T1 type of v1
 * \tparam T2 type of v2
 * \return number of values stored: 0, 1 or 2
 */
template<typename T1, typename T2>
inline int ParsePair(const char * begin, const char * end,
                     const char ** endptr, T1 &v1, T2 &v2) { // NOLINT(*)
  // Locate the first character that can belong to a number.
  const char * cursor = begin;
  for (; cursor != end; ++cursor) {
    if (isdigitchars(*cursor)) break;
  }
  if (cursor == end) {
    *endptr = end;
    return 0;
  }

  // Find the end of the first numeric token, then convert it.
  const char * token_end = cursor;
  for (; token_end != end; ++token_end) {
    if (!isdigitchars(*token_end)) break;
  }
  v1 = Str2Type<T1>(cursor);

  // Skip blanks between the first token and a possible ':' separator.
  for (cursor = token_end; cursor != end && isblank(*cursor); ++cursor) {}
  const bool has_separator = (cursor != end) && (*cursor == ':');
  if (!has_separator) {
    // only v1
    *endptr = cursor;
    return 1;
  }

  // Step over ':' and locate the second numeric token.
  ++cursor;
  for (; cursor != end; ++cursor) {
    if (isdigitchars(*cursor)) break;
  }
  for (token_end = cursor; token_end != end; ++token_end) {
    if (!isdigitchars(*token_end)) break;
  }
  *endptr = token_end;
  v2 = Str2Type<T2>(cursor);
  return 2;
}


/*!
 * \brief Parse colon separated triple v1:v2[:v3]
 *
 * Scans [begin, end) for the first run of numeric characters (see
 * isdigitchars()) and converts it into v1. Each time a ':' follows (after
 * optional blanks), the next run of numeric characters is converted into the
 * next output, up to three values in total.
 * The conversions themselves start at the located position and are performed
 * by Str2Type(), which is not given the `end` bound.
 *
 * \param begin pointer to the beginning of the range to parse
 * \param end pointer to one past the end of the range to parse
 * \param endptr receives the position where scanning stopped
 * \param v1 receives the first value, when one is found
 * \param v2 receives the second value, when a ':' follows the first value
 * \param v3 receives the third value, when a ':' follows the second value
 * \tparam T1 type of v1
 * \tparam T2 type of v2
 * \tparam T3 type of v3
 * \return number of values stored: 0, 1, 2 or 3
 */
template<typename T1, typename T2, typename T3>
inline int ParseTriple(const char * begin, const char * end,
                       const char ** endptr, T1 &v1, T2 &v2, T3 &v3) { // NOLINT(*)
  // Locate the first character that can belong to a number.
  const char * cursor = begin;
  for (; cursor != end; ++cursor) {
    if (isdigitchars(*cursor)) break;
  }
  if (cursor == end) {
    *endptr = end;
    return 0;
  }

  // First numeric token.
  const char * token_end = cursor;
  for (; token_end != end; ++token_end) {
    if (!isdigitchars(*token_end)) break;
  }
  v1 = Str2Type<T1>(cursor);

  // Skip blanks and look for the first ':' separator.
  for (cursor = token_end; cursor != end && isblank(*cursor); ++cursor) {}
  if (cursor == end || *cursor != ':') {
    // only v1
    *endptr = cursor;
    return 1;
  }

  // Second numeric token.
  ++cursor;
  for (; cursor != end; ++cursor) {
    if (isdigitchars(*cursor)) break;
  }
  for (token_end = cursor; token_end != end; ++token_end) {
    if (!isdigitchars(*token_end)) break;
  }
  v2 = Str2Type<T2>(cursor);

  // Skip blanks and look for the second ':' separator.
  for (cursor = token_end; cursor != end && isblank(*cursor); ++cursor) {}
  if (cursor == end || *cursor != ':') {
    // only v1:v2
    *endptr = cursor;
    return 2;
  }

  // Third numeric token.
  ++cursor;
  for (; cursor != end; ++cursor) {
    if (isdigitchars(*cursor)) break;
  }
  for (token_end = cursor; token_end != end; ++token_end) {
    if (!isdigitchars(*token_end)) break;
  }
  *endptr = token_end;
  v3 = Str2Type<T3>(cursor);
  return 3;
}


}  // namespace dmlc


#endif  // DMLC_STRTONUM_H_

dmlc::Str2T< double >::get
static double get(const char *begin)
Convert a string into double.
Definition strtonum.h:631

dmlc::Str2T< float >::get
static float get(const char *begin)
Convert a string into float.
Definition strtonum.h:615

dmlc::Str2T< int32_t >::get
static int32_t get(const char *begin)
Convert a string into signed 32-bit integer.
Definition strtonum.h:551

dmlc::Str2T< int64_t >::get
static int64_t get(const char *begin)
Convert a string into signed 64-bit integer.
Definition strtonum.h:583

dmlc::Str2T< uint32_t >::get
static uint32_t get(const char *begin)
Convert a string into unsigned 32-bit integer.
Definition strtonum.h:567

dmlc::Str2T< uint64_t >::get
static uint64_t get(const char *begin)
Convert a string into unsigned 64-bit integer.
Definition strtonum.h:599

dmlc::Str2T
Interface class that defines a single method get() to convert a string into type T....
Definition strtonum.h:519

dmlc::Str2T::get
static T get(const char *begin)
Convert a string into type T.

logging.h
defines console logging options for xgboost. Use to enforce unified print behavior.

dmlc
namespace for dmlc
Definition array_view.h:12

dmlc::strtod
double strtod(const char *nptr, char **endptr)
A faster implementation of strtod(). See documentation of std::strtod() for more information....
Definition strtonum.h:303

dmlc::strtof_check_range
float strtof_check_range(const char *nptr, char **endptr)
A faster implementation of strtof(). See documentation of std::strtof() for more information....
Definition strtonum.h:286

dmlc::isblank
bool isblank(char c)
Inline implementation of isblank(). Tests whether the given character is a space or tab character.
Definition strtonum.h:36

dmlc::stof
float stof(const std::string &value, size_t *pos=nullptr)
A faster implementation of stof(). See documentation of std::stof() for more information....
Definition strtonum.h:467

dmlc::atol
long atol(const char *p)
A faster implementation of atol(). See documentation of std::atol() for more information....
Definition strtonum.h:434

dmlc::atof
float atof(const char *nptr)
A faster implementation of atof(). Unlike std::atof(), this function returns float type....
Definition strtonum.h:448

dmlc::isspace
bool isspace(char c)
Inline implementation of isspace(). Tests whether the given character is a whitespace character.
Definition strtonum.h:26

dmlc::isdigit
bool isdigit(char c)
Inline implementation of isdigit(). Tests whether the given character is a decimal digit.
Definition strtonum.h:46

dmlc::stod
double stod(const std::string &value, size_t *pos=nullptr)
A faster implementation of stod(). See documentation of std::stod() for more information....
Definition strtonum.h:497

dmlc::kStrtofMaxDigits
const int kStrtofMaxDigits
Maximum number of decimal digits dmlc::strtof() / dmlc::strtod() will process. Trailing digits will b...
Definition strtonum.h:81

dmlc::isalpha
bool isalpha(char c)
Inline implementation of isalpha(). Tests whether the given character is an alphabet letter.
Definition strtonum.h:56

dmlc::strtof
float strtof(const char *nptr, char **endptr)
A faster implementation of strtof(). See documentation of std::strtof() for more information....
Definition strtonum.h:268

dmlc::Str2Type
T Str2Type(const char *begin)
Convenience function for converting string into type T.
Definition strtonum.h:536

dmlc::isdigitchars
bool isdigitchars(char c)
Tests whether the given character is a valid letter in the string representation of a floating-point ...
Definition strtonum.h:70

dmlc::strtod_check_range
double strtod_check_range(const char *nptr, char **endptr)
A faster implementation of strtod(). See documentation of std::strtod() for more information....
Definition strtonum.h:321

dmlc::ParseSignedInt
SignedIntType ParseSignedInt(const char *nptr, char **endptr, int base)
A fast string-to-integer converter, for signed integers. TODO: the current version supports only base ...
Definition strtonum.h:337

dmlc::ParsePair
int ParsePair(const char *begin, const char *end, const char **endptr, T1 &v1, T2 &v2)
Parse colon-separated pair v1[:v2].
Definition strtonum.h:648

dmlc::strtoull
uint64_t strtoull(const char *nptr, char **endptr, int base)
A faster implementation of strtoull(). See documentation of std::strtoull() for more information....
Definition strtonum.h:422

dmlc::ParseTriple
int ParseTriple(const char *begin, const char *end, const char **endptr, T1 &v1, T2 &v2, T3 &v3)
Parse colon-separated triple v1:v2[:v3].
Definition strtonum.h:689

dmlc::ParseFloat
FloatType ParseFloat(const char *nptr, char **endptr)
Common implementation for dmlc::strtof() and dmlc::strtod(). TODO: the current version does not suppor...
Definition strtonum.h:99

dmlc::ParseUnsignedInt
UnsignedIntType ParseUnsignedInt(const char *nptr, char **endptr, int base)
A fast string-to-integer converter, for unsigned integers. TODO: the current version supports only bas...
Definition strtonum.h:378

base.h
Macros common to all headers.