2018-08-01 10:38:30 +08:00
|
|
|
// -*- C++ -*-
|
|
|
|
//===------------------------------ charconv ------------------------------===//
|
|
|
|
//
|
2019-01-19 18:56:40 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2018-08-01 10:38:30 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#ifndef _LIBCPP_CHARCONV
|
|
|
|
#define _LIBCPP_CHARCONV
|
|
|
|
|
|
|
|
/*
|
|
|
|
charconv synopsis
|
|
|
|
|
|
|
|
namespace std {
|
|
|
|
|
|
|
|
// floating-point format for primitive numerical conversion
|
|
|
|
enum class chars_format {
|
|
|
|
scientific = unspecified,
|
|
|
|
fixed = unspecified,
|
|
|
|
hex = unspecified,
|
|
|
|
general = fixed | scientific
|
|
|
|
};
|
|
|
|
|
|
|
|
// 23.20.2, primitive numerical output conversion
|
|
|
|
struct to_chars_result {
|
|
|
|
char* ptr;
|
|
|
|
errc ec;
|
|
|
|
};
|
|
|
|
|
|
|
|
to_chars_result to_chars(char* first, char* last, see below value,
|
|
|
|
int base = 10);
|
|
|
|
|
|
|
|
to_chars_result to_chars(char* first, char* last, float value);
|
|
|
|
to_chars_result to_chars(char* first, char* last, double value);
|
|
|
|
to_chars_result to_chars(char* first, char* last, long double value);
|
|
|
|
|
|
|
|
to_chars_result to_chars(char* first, char* last, float value,
|
|
|
|
chars_format fmt);
|
|
|
|
to_chars_result to_chars(char* first, char* last, double value,
|
|
|
|
chars_format fmt);
|
|
|
|
to_chars_result to_chars(char* first, char* last, long double value,
|
|
|
|
chars_format fmt);
|
|
|
|
|
|
|
|
to_chars_result to_chars(char* first, char* last, float value,
|
|
|
|
chars_format fmt, int precision);
|
|
|
|
to_chars_result to_chars(char* first, char* last, double value,
|
|
|
|
chars_format fmt, int precision);
|
|
|
|
to_chars_result to_chars(char* first, char* last, long double value,
|
|
|
|
chars_format fmt, int precision);
|
|
|
|
|
|
|
|
// 23.20.3, primitive numerical input conversion
|
|
|
|
struct from_chars_result {
|
|
|
|
const char* ptr;
|
|
|
|
errc ec;
|
|
|
|
};
|
|
|
|
|
|
|
|
from_chars_result from_chars(const char* first, const char* last,
|
|
|
|
see below& value, int base = 10);
|
|
|
|
|
|
|
|
from_chars_result from_chars(const char* first, const char* last,
|
|
|
|
float& value,
|
|
|
|
chars_format fmt = chars_format::general);
|
|
|
|
from_chars_result from_chars(const char* first, const char* last,
|
|
|
|
double& value,
|
|
|
|
chars_format fmt = chars_format::general);
|
|
|
|
from_chars_result from_chars(const char* first, const char* last,
|
|
|
|
long double& value,
|
|
|
|
chars_format fmt = chars_format::general);
|
|
|
|
|
|
|
|
} // namespace std
|
|
|
|
|
|
|
|
*/
|
|
|
|
|
2020-11-05 04:01:25 +08:00
|
|
|
#include <__availability>
|
2021-08-08 17:02:07 +08:00
|
|
|
#include <__bits>
|
2021-05-19 23:57:04 +08:00
|
|
|
#include <__config>
|
2018-08-01 10:38:30 +08:00
|
|
|
#include <__errc>
|
2021-04-24 23:28:35 +08:00
|
|
|
#include <__utility/to_underlying.h>
|
2020-12-08 10:45:29 +08:00
|
|
|
#include <cmath> // for log2f
|
|
|
|
#include <cstdint>
|
// Change note (2021-02-27 23:52:39 +08:00):
// [libc++] Fixes std::to_chars for bases != 10.
//
// While working on D70631, Microsoft's unit tests discovered an issue.
// Our `std::to_chars` implementation for bases != 10 used the range
// `[first,last)` as a temporary buffer. This violates the contract for
// to_chars:
//
//   [charconv.to.chars]/1 http://eel.is/c++draft/charconv#to.chars-1
//   `to_chars_result to_chars(char* first, char* last, see below value, int base = 10);`
//   "If the member ec of the return value is such that the value is equal to
//   the value of a value-initialized errc, the conversion was successful and
//   the member ptr is the one-past-the-end pointer of the characters
//   written."
//
// Our implementation modified the range `[member ptr, last)`, which caused
// Microsoft's test to fail. Their test verifies that the buffer
// `[member ptr, last)` is unchanged. (The test is only done when the
// conversion is successful.)
//
// While looking at the code I noticed the performance for bases != 10 is
// also suboptimal. This is tracked in D97705.
//
// This patch fixes the issue and adds a benchmark. This benchmark will be
// used as the baseline for D97705.
//
// Reviewed By: #libc, Quuxplusone, zoecarver
// Differential Revision: https://reviews.llvm.org/D100722
|
|
|
#include <cstdlib> // for _LIBCPP_UNREACHABLE
|
2020-12-08 10:45:29 +08:00
|
|
|
#include <cstring>
|
2018-08-01 10:38:30 +08:00
|
|
|
#include <limits>
|
2020-12-08 10:45:29 +08:00
|
|
|
#include <type_traits>
|
2018-08-01 10:38:30 +08:00
|
|
|
|
|
|
|
#include <__debug>
|
|
|
|
|
|
|
|
#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)
|
|
|
|
#pragma GCC system_header
|
|
|
|
#endif
|
|
|
|
|
2018-10-26 09:00:56 +08:00
|
|
|
_LIBCPP_PUSH_MACROS
|
|
|
|
#include <__undef_macros>
|
|
|
|
|
2018-08-01 10:38:30 +08:00
|
|
|
_LIBCPP_BEGIN_NAMESPACE_STD
|
|
|
|
|
2018-10-25 20:13:43 +08:00
|
|
|
namespace __itoa {
|
2020-05-21 22:25:15 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS _LIBCPP_FUNC_VIS char* __u64toa(uint64_t __value, char* __buffer) _NOEXCEPT;
|
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS _LIBCPP_FUNC_VIS char* __u32toa(uint32_t __value, char* __buffer) _NOEXCEPT;
|
2018-10-25 20:13:43 +08:00
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
#ifndef _LIBCPP_CXX03_LANG
|
2018-08-01 10:38:30 +08:00
|
|
|
|
|
|
|
enum class _LIBCPP_ENUM_VIS chars_format
|
|
|
|
{
|
|
|
|
scientific = 0x1,
|
|
|
|
fixed = 0x2,
|
|
|
|
hex = 0x4,
|
|
|
|
general = fixed | scientific
|
|
|
|
};
|
|
|
|
|
2021-02-20 18:00:00 +08:00
|
|
|
// Bitwise complement of a chars_format, computed on its underlying integer
// value and converted back to the enumeration.
inline _LIBCPP_INLINE_VISIBILITY constexpr chars_format
operator~(chars_format __x) {
    return static_cast<chars_format>(~_VSTD::__to_underlying(__x));
}
|
|
|
|
|
|
|
|
// Bitwise AND of two chars_format values, computed on their underlying
// integer values.
inline _LIBCPP_INLINE_VISIBILITY constexpr chars_format
operator&(chars_format __x, chars_format __y) {
    return static_cast<chars_format>(
        _VSTD::__to_underlying(__x) & _VSTD::__to_underlying(__y));
}
|
|
|
|
|
|
|
|
// Bitwise OR of two chars_format values, computed on their underlying
// integer values.
inline _LIBCPP_INLINE_VISIBILITY constexpr chars_format
operator|(chars_format __x, chars_format __y) {
    return static_cast<chars_format>(
        _VSTD::__to_underlying(__x) | _VSTD::__to_underlying(__y));
}
|
|
|
|
|
|
|
|
// Bitwise XOR of two chars_format values, computed on their underlying
// integer values.
inline _LIBCPP_INLINE_VISIBILITY constexpr chars_format
operator^(chars_format __x, chars_format __y) {
    return static_cast<chars_format>(
        _VSTD::__to_underlying(__x) ^ _VSTD::__to_underlying(__y));
}
|
|
|
|
|
|
|
|
// Compound AND: stores (__x & __y) into __x and returns a reference to __x.
inline _LIBCPP_INLINE_VISIBILITY _LIBCPP_CONSTEXPR_AFTER_CXX11 chars_format&
operator&=(chars_format& __x, chars_format __y) {
    return __x = __x & __y;
}
|
|
|
|
|
|
|
|
// Compound OR: stores (__x | __y) into __x and returns a reference to __x.
inline _LIBCPP_INLINE_VISIBILITY _LIBCPP_CONSTEXPR_AFTER_CXX11 chars_format&
operator|=(chars_format& __x, chars_format __y) {
    return __x = __x | __y;
}
|
|
|
|
|
|
|
|
// Compound XOR: stores (__x ^ __y) into __x and returns a reference to __x.
inline _LIBCPP_INLINE_VISIBILITY _LIBCPP_CONSTEXPR_AFTER_CXX11 chars_format&
operator^=(chars_format& __x, chars_format __y) {
    return __x = __x ^ __y;
}
|
|
|
|
|
2018-08-01 10:38:30 +08:00
|
|
|
struct _LIBCPP_TYPE_VIS to_chars_result
|
|
|
|
{
|
|
|
|
char* ptr;
|
|
|
|
errc ec;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct _LIBCPP_TYPE_VIS from_chars_result
|
|
|
|
{
|
|
|
|
const char* ptr;
|
|
|
|
errc ec;
|
|
|
|
};
|
|
|
|
|
|
|
|
// Conversions to and from bool are rejected: these non-template overloads are
// deleted, so a call with a bool argument that selects one of them is
// ill-formed (presumably instead of reaching the integral templates below).
void to_chars(char*, char*, bool, int = 10) = delete;
void from_chars(const char*, const char*, bool, int = 10) = delete;
|
|
|
|
|
|
|
|
namespace __itoa
|
|
|
|
{
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
// Powers of ten for 64-bit conversions: entry k holds 10^k for k in [1, 19].
// Entry 0 holds 0 rather than 1; __traits_base::__width compares the value
// against the entry selected by its digit-count estimate.
static _LIBCPP_CONSTEXPR uint64_t __pow10_64[] = {
    UINT64_C(0),                    // [0]
    UINT64_C(10),                   // 10^1
    UINT64_C(100),                  // 10^2
    UINT64_C(1000),                 // 10^3
    UINT64_C(10000),                // 10^4
    UINT64_C(100000),               // 10^5
    UINT64_C(1000000),              // 10^6
    UINT64_C(10000000),             // 10^7
    UINT64_C(100000000),            // 10^8
    UINT64_C(1000000000),           // 10^9
    UINT64_C(10000000000),          // 10^10
    UINT64_C(100000000000),         // 10^11
    UINT64_C(1000000000000),        // 10^12
    UINT64_C(10000000000000),       // 10^13
    UINT64_C(100000000000000),      // 10^14
    UINT64_C(1000000000000000),     // 10^15
    UINT64_C(10000000000000000),    // 10^16
    UINT64_C(100000000000000000),   // 10^17
    UINT64_C(1000000000000000000),  // 10^18
    UINT64_C(10000000000000000000), // 10^19
};
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
// Powers of ten for 32-bit conversions: entry k holds 10^k for k in [1, 9].
// Entry 0 holds 0 rather than 1; __traits_base::__width compares the value
// against the entry selected by its digit-count estimate.
static _LIBCPP_CONSTEXPR uint32_t __pow10_32[] = {
    UINT32_C(0),          // [0]
    UINT32_C(10),         // 10^1
    UINT32_C(100),        // 10^2
    UINT32_C(1000),       // 10^3
    UINT32_C(10000),      // 10^4
    UINT32_C(100000),     // 10^5
    UINT32_C(1000000),    // 10^6
    UINT32_C(10000000),   // 10^7
    UINT32_C(100000000),  // 10^8
    UINT32_C(1000000000), // 10^9
};
|
|
|
|
|
|
|
|
template <typename _Tp, typename = void>
|
|
|
|
struct _LIBCPP_HIDDEN __traits_base
|
|
|
|
{
|
|
|
|
using type = uint64_t;
|
|
|
|
|
|
|
|
static _LIBCPP_INLINE_VISIBILITY int __width(_Tp __v)
|
|
|
|
{
|
2021-08-08 17:02:07 +08:00
|
|
|
auto __t = (64 - _VSTD::__libcpp_clz(static_cast<type>(__v | 1))) * 1233 >> 12;
|
2018-08-01 10:38:30 +08:00
|
|
|
return __t - (__v < __pow10_64[__t]) + 1;
|
|
|
|
}
|
|
|
|
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
static _LIBCPP_INLINE_VISIBILITY char* __convert(_Tp __v, char* __p)
|
|
|
|
{
|
|
|
|
return __u64toa(__v, __p);
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
static _LIBCPP_INLINE_VISIBILITY decltype(__pow10_64)& __pow() { return __pow10_64; }
|
2018-08-01 10:38:30 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
struct _LIBCPP_HIDDEN
|
|
|
|
__traits_base<_Tp, decltype(void(uint32_t{declval<_Tp>()}))>
|
|
|
|
{
|
|
|
|
using type = uint32_t;
|
|
|
|
|
|
|
|
static _LIBCPP_INLINE_VISIBILITY int __width(_Tp __v)
|
|
|
|
{
|
2021-08-08 17:02:07 +08:00
|
|
|
auto __t = (32 - _VSTD::__libcpp_clz(static_cast<type>(__v | 1))) * 1233 >> 12;
|
2018-08-01 10:38:30 +08:00
|
|
|
return __t - (__v < __pow10_32[__t]) + 1;
|
|
|
|
}
|
|
|
|
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
static _LIBCPP_INLINE_VISIBILITY char* __convert(_Tp __v, char* __p)
|
|
|
|
{
|
|
|
|
return __u32toa(__v, __p);
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
static _LIBCPP_INLINE_VISIBILITY decltype(__pow10_32)& __pow() { return __pow10_32; }
|
2018-08-01 10:38:30 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY bool
|
|
|
|
__mul_overflowed(unsigned char __a, _Tp __b, unsigned char& __r)
|
|
|
|
{
|
|
|
|
auto __c = __a * __b;
|
|
|
|
__r = __c;
|
2020-11-28 03:13:05 +08:00
|
|
|
return __c > numeric_limits<unsigned char>::max();
|
2018-08-01 10:38:30 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY bool
|
|
|
|
__mul_overflowed(unsigned short __a, _Tp __b, unsigned short& __r)
|
|
|
|
{
|
|
|
|
auto __c = __a * __b;
|
|
|
|
__r = __c;
|
2020-11-28 03:13:05 +08:00
|
|
|
return __c > numeric_limits<unsigned short>::max();
|
2018-08-01 10:38:30 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY bool
|
|
|
|
__mul_overflowed(_Tp __a, _Tp __b, _Tp& __r)
|
|
|
|
{
|
|
|
|
static_assert(is_unsigned<_Tp>::value, "");
|
|
|
|
#if !defined(_LIBCPP_COMPILER_MSVC)
|
|
|
|
return __builtin_mul_overflow(__a, __b, &__r);
|
|
|
|
#else
|
2020-11-28 03:13:05 +08:00
|
|
|
bool __did = __b && (numeric_limits<_Tp>::max() / __b) < __a;
|
2018-08-01 10:38:30 +08:00
|
|
|
__r = __a * __b;
|
|
|
|
return __did;
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp, typename _Up>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY bool
|
|
|
|
__mul_overflowed(_Tp __a, _Up __b, _Tp& __r)
|
|
|
|
{
|
|
|
|
return __mul_overflowed(__a, static_cast<_Tp>(__b), __r);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
struct _LIBCPP_HIDDEN __traits : __traits_base<_Tp>
|
|
|
|
{
|
2019-03-21 02:13:23 +08:00
|
|
|
static _LIBCPP_CONSTEXPR int digits = numeric_limits<_Tp>::digits10 + 1;
|
2018-08-01 10:38:30 +08:00
|
|
|
using __traits_base<_Tp>::__pow;
|
|
|
|
using typename __traits_base<_Tp>::type;
|
|
|
|
|
|
|
|
// precondition: at least one non-zero character available
|
|
|
|
static _LIBCPP_INLINE_VISIBILITY char const*
|
|
|
|
__read(char const* __p, char const* __ep, type& __a, type& __b)
|
|
|
|
{
|
|
|
|
type __cprod[digits];
|
|
|
|
int __j = digits - 1;
|
|
|
|
int __i = digits;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
if (!('0' <= *__p && *__p <= '9'))
|
|
|
|
break;
|
|
|
|
__cprod[--__i] = *__p++ - '0';
|
|
|
|
} while (__p != __ep && __i != 0);
|
|
|
|
|
|
|
|
__a = __inner_product(__cprod + __i + 1, __cprod + __j, __pow() + 1,
|
|
|
|
__cprod[__i]);
|
|
|
|
if (__mul_overflowed(__cprod[__j], __pow()[__j - __i], __b))
|
|
|
|
--__p;
|
|
|
|
return __p;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _It1, typename _It2, class _Up>
|
|
|
|
static _LIBCPP_INLINE_VISIBILITY _Up
|
|
|
|
__inner_product(_It1 __first1, _It1 __last1, _It2 __first2, _Up __init)
|
|
|
|
{
|
|
|
|
for (; __first1 < __last1; ++__first1, ++__first2)
|
|
|
|
__init = __init + *__first1 * *__first2;
|
|
|
|
return __init;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
} // namespace __itoa
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY _Tp
|
|
|
|
__complement(_Tp __x)
|
|
|
|
{
|
|
|
|
static_assert(is_unsigned<_Tp>::value, "cast to unsigned first");
|
|
|
|
return _Tp(~__x + 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp>
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY to_chars_result
|
|
|
|
__to_chars_itoa(char* __first, char* __last, _Tp __value, true_type)
|
|
|
|
{
|
2021-05-12 23:46:24 +08:00
|
|
|
auto __x = __to_unsigned_like(__value);
|
2018-08-01 10:38:30 +08:00
|
|
|
if (__value < 0 && __first != __last)
|
|
|
|
{
|
|
|
|
*__first++ = '-';
|
|
|
|
__x = __complement(__x);
|
|
|
|
}
|
|
|
|
|
|
|
|
return __to_chars_itoa(__first, __last, __x, false_type());
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp>
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY to_chars_result
|
|
|
|
__to_chars_itoa(char* __first, char* __last, _Tp __value, false_type)
|
|
|
|
{
|
|
|
|
using __tx = __itoa::__traits<_Tp>;
|
|
|
|
auto __diff = __last - __first;
|
|
|
|
|
|
|
|
if (__tx::digits <= __diff || __tx::__width(__value) <= __diff)
|
2019-06-14 06:27:24 +08:00
|
|
|
return {__tx::__convert(__value, __first), errc(0)};
|
2018-08-01 10:38:30 +08:00
|
|
|
else
|
|
|
|
return {__last, errc::value_too_large};
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp>
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY to_chars_result
|
|
|
|
__to_chars_integral(char* __first, char* __last, _Tp __value, int __base,
|
|
|
|
true_type)
|
|
|
|
{
|
2021-05-12 23:46:24 +08:00
|
|
|
auto __x = __to_unsigned_like(__value);
|
2018-08-01 10:38:30 +08:00
|
|
|
if (__value < 0 && __first != __last)
|
|
|
|
{
|
|
|
|
*__first++ = '-';
|
|
|
|
__x = __complement(__x);
|
|
|
|
}
|
|
|
|
|
|
|
|
return __to_chars_integral(__first, __last, __x, __base, false_type());
|
|
|
|
}
|
|
|
|
|
// Change note (2021-02-27 23:52:39 +08:00):
// [libc++] Fixes std::to_chars for bases != 10.
//
// While working on D70631, Microsoft's unit tests discovered an issue.
// Our `std::to_chars` implementation for bases != 10 used the range
// `[first,last)` as a temporary buffer. This violates the contract for
// to_chars:
//
//   [charconv.to.chars]/1 http://eel.is/c++draft/charconv#to.chars-1
//   `to_chars_result to_chars(char* first, char* last, see below value, int base = 10);`
//   "If the member ec of the return value is such that the value is equal to
//   the value of a value-initialized errc, the conversion was successful and
//   the member ptr is the one-past-the-end pointer of the characters
//   written."
//
// Our implementation modified the range `[member ptr, last)`, which caused
// Microsoft's test to fail. Their test verifies that the buffer
// `[member ptr, last)` is unchanged. (The test is only done when the
// conversion is successful.)
//
// While looking at the code I noticed the performance for bases != 10 is
// also suboptimal. This is tracked in D97705.
//
// This patch fixes the issue and adds a benchmark. This benchmark will be
// used as the baseline for D97705.
//
// Reviewed By: #libc, Quuxplusone, zoecarver
// Differential Revision: https://reviews.llvm.org/D100722
|
|
|
template <typename _Tp>
|
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS _LIBCPP_INLINE_VISIBILITY int __to_chars_integral_width(_Tp __value, unsigned __base) {
|
|
|
|
_LIBCPP_ASSERT(__value >= 0, "The function requires a non-negative value.");
|
|
|
|
|
|
|
|
unsigned __base_2 = __base * __base;
|
|
|
|
unsigned __base_3 = __base_2 * __base;
|
|
|
|
unsigned __base_4 = __base_2 * __base_2;
|
|
|
|
|
|
|
|
int __r = 0;
|
|
|
|
while (true) {
|
|
|
|
if (__value < __base)
|
|
|
|
return __r + 1;
|
|
|
|
if (__value < __base_2)
|
|
|
|
return __r + 2;
|
|
|
|
if (__value < __base_3)
|
|
|
|
return __r + 3;
|
|
|
|
if (__value < __base_4)
|
|
|
|
return __r + 4;
|
|
|
|
|
|
|
|
__value /= __base_4;
|
|
|
|
__r += 4;
|
|
|
|
}
|
|
|
|
|
|
|
|
_LIBCPP_UNREACHABLE();
|
|
|
|
}
|
|
|
|
|
2018-08-01 10:38:30 +08:00
|
|
|
template <typename _Tp>
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY to_chars_result
|
|
|
|
__to_chars_integral(char* __first, char* __last, _Tp __value, int __base,
|
|
|
|
false_type)
|
|
|
|
{
|
[libc++] Fixes std::to_chars for bases != 10.
While working on D70631, Microsoft's unit tests discovered an issue.
Our `std::to_chars` implementation for bases != 10 uses the range
`[first,last)` as temporary buffer. This violates the contract for
to_chars:
[charconv.to.chars]/1 http://eel.is/c++draft/charconv#to.chars-1
`to_chars_result to_chars(char* first, char* last, see below value, int base = 10);`
"If the member ec of the return value is such that the value is equal to
the value of a value-initialized errc, the conversion was successful and
the member ptr is the one-past-the-end pointer of the characters
written."
Our implementation modifies the range `[member ptr, last)`, which causes
Microsoft's test to fail. Their test verifies the buffer
`[member ptr, last)` is unchanged. (The test is only done when the
conversion is successful.)
While looking at the code I noticed the performance for bases != 10 also
is suboptimal. This is tracked in D97705.
This patch fixes the issue and adds a benchmark. This benchmark will be
used as baseline for D97705.
Reviewed By: #libc, Quuxplusone, zoecarver
Differential Revision: https://reviews.llvm.org/D100722
2021-02-27 23:52:39 +08:00
|
|
|
if (__base == 10)
|
|
|
|
return __to_chars_itoa(__first, __last, __value, false_type());
|
|
|
|
|
|
|
|
ptrdiff_t __cap = __last - __first;
|
|
|
|
int __n = __to_chars_integral_width(__value, __base);
|
|
|
|
if (__n > __cap)
|
|
|
|
return {__last, errc::value_too_large};
|
|
|
|
|
|
|
|
__last = __first + __n;
|
|
|
|
char* __p = __last;
|
|
|
|
do {
|
|
|
|
unsigned __c = __value % __base;
|
|
|
|
__value /= __base;
|
|
|
|
*--__p = "0123456789abcdefghijklmnopqrstuvwxyz"[__c];
|
|
|
|
} while (__value != 0);
|
|
|
|
return {__last, errc(0)};
|
2018-08-01 10:38:30 +08:00
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_integral<_Tp>::value, int>::type = 0>
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY to_chars_result
|
|
|
|
to_chars(char* __first, char* __last, _Tp __value)
|
|
|
|
{
|
|
|
|
return __to_chars_itoa(__first, __last, __value, is_signed<_Tp>());
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_integral<_Tp>::value, int>::type = 0>
|
2020-02-14 22:19:47 +08:00
|
|
|
_LIBCPP_AVAILABILITY_TO_CHARS
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY to_chars_result
|
|
|
|
to_chars(char* __first, char* __last, _Tp __value, int __base)
|
|
|
|
{
|
|
|
|
_LIBCPP_ASSERT(2 <= __base && __base <= 36, "base not in [2, 36]");
|
|
|
|
return __to_chars_integral(__first, __last, __value, __base,
|
|
|
|
is_signed<_Tp>());
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _It, typename _Tp, typename _Fn, typename... _Ts>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
__sign_combinator(_It __first, _It __last, _Tp& __value, _Fn __f, _Ts... __args)
|
|
|
|
{
|
|
|
|
using __tl = numeric_limits<_Tp>;
|
2021-05-12 23:46:24 +08:00
|
|
|
decltype(__to_unsigned_like(__value)) __x;
|
2018-08-01 10:38:30 +08:00
|
|
|
|
|
|
|
bool __neg = (__first != __last && *__first == '-');
|
|
|
|
auto __r = __f(__neg ? __first + 1 : __first, __last, __x, __args...);
|
|
|
|
switch (__r.ec)
|
|
|
|
{
|
|
|
|
case errc::invalid_argument:
|
|
|
|
return {__first, __r.ec};
|
|
|
|
case errc::result_out_of_range:
|
|
|
|
return __r;
|
|
|
|
default:
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (__neg)
|
|
|
|
{
|
2021-05-12 23:46:24 +08:00
|
|
|
if (__x <= __complement(__to_unsigned_like(__tl::min())))
|
2018-08-01 10:38:30 +08:00
|
|
|
{
|
|
|
|
__x = __complement(__x);
|
2020-12-08 10:45:29 +08:00
|
|
|
_VSTD::memcpy(&__value, &__x, sizeof(__x));
|
2018-08-01 10:38:30 +08:00
|
|
|
return __r;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2020-11-28 03:13:05 +08:00
|
|
|
if (__x <= __tl::max())
|
2018-08-01 10:38:30 +08:00
|
|
|
{
|
|
|
|
__value = __x;
|
|
|
|
return __r;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return {__r.ptr, errc::result_out_of_range};
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY bool
|
|
|
|
__in_pattern(_Tp __c)
|
|
|
|
{
|
|
|
|
return '0' <= __c && __c <= '9';
|
|
|
|
}
|
|
|
|
|
|
|
|
struct _LIBCPP_HIDDEN __in_pattern_result
|
|
|
|
{
|
|
|
|
bool __ok;
|
|
|
|
int __val;
|
|
|
|
|
|
|
|
explicit _LIBCPP_INLINE_VISIBILITY operator bool() const { return __ok; }
|
|
|
|
};
|
|
|
|
|
|
|
|
template <typename _Tp>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY __in_pattern_result
|
|
|
|
__in_pattern(_Tp __c, int __base)
|
|
|
|
{
|
|
|
|
if (__base <= 10)
|
|
|
|
return {'0' <= __c && __c < '0' + __base, __c - '0'};
|
|
|
|
else if (__in_pattern(__c))
|
|
|
|
return {true, __c - '0'};
|
|
|
|
else if ('a' <= __c && __c < 'a' + __base - 10)
|
|
|
|
return {true, __c - 'a' + 10};
|
|
|
|
else
|
|
|
|
return {'A' <= __c && __c < 'A' + __base - 10, __c - 'A' + 10};
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename _It, typename _Tp, typename _Fn, typename... _Ts>
|
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
__subject_seq_combinator(_It __first, _It __last, _Tp& __value, _Fn __f,
|
|
|
|
_Ts... __args)
|
|
|
|
{
|
|
|
|
auto __find_non_zero = [](_It __first, _It __last) {
|
|
|
|
for (; __first != __last; ++__first)
|
|
|
|
if (*__first != '0')
|
|
|
|
break;
|
|
|
|
return __first;
|
|
|
|
};
|
|
|
|
|
|
|
|
auto __p = __find_non_zero(__first, __last);
|
|
|
|
if (__p == __last || !__in_pattern(*__p, __args...))
|
|
|
|
{
|
|
|
|
if (__p == __first)
|
|
|
|
return {__first, errc::invalid_argument};
|
|
|
|
else
|
|
|
|
{
|
|
|
|
__value = 0;
|
|
|
|
return {__p, {}};
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
auto __r = __f(__p, __last, __value, __args...);
|
|
|
|
if (__r.ec == errc::result_out_of_range)
|
|
|
|
{
|
|
|
|
for (; __r.ptr != __last; ++__r.ptr)
|
|
|
|
{
|
|
|
|
if (!__in_pattern(*__r.ptr, __args...))
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return __r;
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_unsigned<_Tp>::value, int>::type = 0>
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
__from_chars_atoi(const char* __first, const char* __last, _Tp& __value)
|
|
|
|
{
|
|
|
|
using __tx = __itoa::__traits<_Tp>;
|
|
|
|
using __output_type = typename __tx::type;
|
|
|
|
|
|
|
|
return __subject_seq_combinator(
|
|
|
|
__first, __last, __value,
|
|
|
|
[](const char* __first, const char* __last,
|
|
|
|
_Tp& __value) -> from_chars_result {
|
|
|
|
__output_type __a, __b;
|
|
|
|
auto __p = __tx::__read(__first, __last, __a, __b);
|
|
|
|
if (__p == __last || !__in_pattern(*__p))
|
|
|
|
{
|
2020-11-28 03:13:05 +08:00
|
|
|
__output_type __m = numeric_limits<_Tp>::max();
|
2018-08-01 10:38:30 +08:00
|
|
|
if (__m >= __a && __m - __a >= __b)
|
|
|
|
{
|
|
|
|
__value = __a + __b;
|
|
|
|
return {__p, {}};
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return {__p, errc::result_out_of_range};
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_signed<_Tp>::value, int>::type = 0>
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
__from_chars_atoi(const char* __first, const char* __last, _Tp& __value)
|
|
|
|
{
|
2021-05-12 23:46:24 +08:00
|
|
|
using __t = decltype(__to_unsigned_like(__value));
|
2018-08-01 10:38:30 +08:00
|
|
|
return __sign_combinator(__first, __last, __value, __from_chars_atoi<__t>);
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_unsigned<_Tp>::value, int>::type = 0>
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
__from_chars_integral(const char* __first, const char* __last, _Tp& __value,
|
|
|
|
int __base)
|
|
|
|
{
|
|
|
|
if (__base == 10)
|
|
|
|
return __from_chars_atoi(__first, __last, __value);
|
|
|
|
|
|
|
|
return __subject_seq_combinator(
|
|
|
|
__first, __last, __value,
|
2021-07-28 05:30:47 +08:00
|
|
|
[](const char* __p, const char* __lastx, _Tp& __value,
|
2018-08-01 10:38:30 +08:00
|
|
|
int __base) -> from_chars_result {
|
|
|
|
using __tl = numeric_limits<_Tp>;
|
|
|
|
auto __digits = __tl::digits / log2f(float(__base));
|
|
|
|
_Tp __a = __in_pattern(*__p++, __base).__val, __b = 0;
|
|
|
|
|
2021-07-28 05:30:47 +08:00
|
|
|
for (int __i = 1; __p != __lastx; ++__i, ++__p)
|
2018-08-01 10:38:30 +08:00
|
|
|
{
|
|
|
|
if (auto __c = __in_pattern(*__p, __base))
|
|
|
|
{
|
|
|
|
if (__i < __digits - 1)
|
|
|
|
__a = __a * __base + __c.__val;
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (!__itoa::__mul_overflowed(__a, __base, __a))
|
|
|
|
++__p;
|
|
|
|
__b = __c.__val;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2021-07-28 05:30:47 +08:00
|
|
|
if (__p == __lastx || !__in_pattern(*__p, __base))
|
2018-08-01 10:38:30 +08:00
|
|
|
{
|
2020-11-28 03:13:05 +08:00
|
|
|
if (__tl::max() - __a >= __b)
|
2018-08-01 10:38:30 +08:00
|
|
|
{
|
|
|
|
__value = __a + __b;
|
|
|
|
return {__p, {}};
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return {__p, errc::result_out_of_range};
|
|
|
|
},
|
|
|
|
__base);
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_signed<_Tp>::value, int>::type = 0>
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
__from_chars_integral(const char* __first, const char* __last, _Tp& __value,
|
|
|
|
int __base)
|
|
|
|
{
|
2021-05-12 23:46:24 +08:00
|
|
|
using __t = decltype(__to_unsigned_like(__value));
|
2018-08-01 10:38:30 +08:00
|
|
|
return __sign_combinator(__first, __last, __value,
|
|
|
|
__from_chars_integral<__t>, __base);
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_integral<_Tp>::value, int>::type = 0>
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
from_chars(const char* __first, const char* __last, _Tp& __value)
|
|
|
|
{
|
|
|
|
return __from_chars_atoi(__first, __last, __value);
|
|
|
|
}
|
|
|
|
|
2019-03-21 02:13:23 +08:00
|
|
|
template <typename _Tp, typename enable_if<is_integral<_Tp>::value, int>::type = 0>
|
2018-08-01 10:38:30 +08:00
|
|
|
inline _LIBCPP_INLINE_VISIBILITY from_chars_result
|
|
|
|
from_chars(const char* __first, const char* __last, _Tp& __value, int __base)
|
|
|
|
{
|
|
|
|
_LIBCPP_ASSERT(2 <= __base && __base <= 36, "base not in [2, 36]");
|
|
|
|
return __from_chars_integral(__first, __last, __value, __base);
|
|
|
|
}
|
|
|
|
|
2021-04-21 00:03:32 +08:00
|
|
|
#endif // _LIBCPP_CXX03_LANG
|
2018-08-01 10:38:30 +08:00
|
|
|
|
|
|
|
_LIBCPP_END_NAMESPACE_STD
|
|
|
|
|
2018-10-26 09:00:56 +08:00
|
|
|
_LIBCPP_POP_MACROS
|
|
|
|
|
2021-04-21 00:03:32 +08:00
|
|
|
#endif // _LIBCPP_CHARCONV
|