
The main change is to allow a UCS scalar value as fill character. Especially for char based formatting this increase the number of valid characters. Originally this was to be expected ABI breaking, however the current change does not seem to break the ABI. Implements - P2572 std::format() fill character allowances Depends on D144499 Reviewed By: ldionne, tahonermann, #libc Differential Revision: https://reviews.llvm.org/D144742
369 lines
13 KiB
C++
369 lines
13 KiB
C++
// -*- C++ -*-
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef _LIBCPP___FORMAT_FORMATTER_INTEGRAL_H
|
|
#define _LIBCPP___FORMAT_FORMATTER_INTEGRAL_H
|
|
|
|
#include <__charconv/to_chars_integral.h>
|
|
#include <__charconv/to_chars_result.h>
|
|
#include <__charconv/traits.h>
|
|
#include <__concepts/arithmetic.h>
|
|
#include <__concepts/same_as.h>
|
|
#include <__config>
|
|
#include <__format/concepts.h>
|
|
#include <__format/format_error.h>
|
|
#include <__format/formatter_output.h>
|
|
#include <__format/parser_std_format_spec.h>
|
|
#include <__system_error/errc.h>
|
|
#include <__type_traits/make_unsigned.h>
|
|
#include <__utility/unreachable.h>
|
|
#include <array>
|
|
#include <limits>
|
|
#include <string>
|
|
#include <string_view>
|
|
|
|
#ifndef _LIBCPP_HAS_NO_LOCALIZATION
|
|
# include <locale>
|
|
#endif
|
|
|
|
#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)
|
|
# pragma GCC system_header
|
|
#endif
|
|
|
|
_LIBCPP_PUSH_MACROS
|
|
#include <__undef_macros>
|
|
|
|
_LIBCPP_BEGIN_NAMESPACE_STD
|
|
|
|
#if _LIBCPP_STD_VER >= 20
|
|
|
|
namespace __formatter {
|
|
|
|
//
|
|
// Generic
|
|
//
|
|
|
|
_LIBCPP_HIDE_FROM_ABI inline char* __insert_sign(char* __buf, bool __negative, __format_spec::__sign __sign) {
|
|
if (__negative)
|
|
*__buf++ = '-';
|
|
else
|
|
switch (__sign) {
|
|
case __format_spec::__sign::__default:
|
|
case __format_spec::__sign::__minus:
|
|
// No sign added.
|
|
break;
|
|
case __format_spec::__sign::__plus:
|
|
*__buf++ = '+';
|
|
break;
|
|
case __format_spec::__sign::__space:
|
|
*__buf++ = ' ';
|
|
break;
|
|
}
|
|
|
|
return __buf;
|
|
}
|
|
|
|
/**
|
|
* Determines the required grouping based on the size of the input.
|
|
*
|
|
* The grouping's last element will be repeated. For simplicity this repeating
|
|
* is unwrapped based on the length of the input. (When the input is short some
|
|
* groups are not processed.)
|
|
*
|
|
* @returns The size of the groups to write. This means the number of
|
|
* separator characters written is size() - 1.
|
|
*
|
|
* @note Since zero-sized groups cause issues they are silently ignored.
|
|
*
|
|
* @note The grouping field of the locale is always a @c std::string,
|
|
* regardless whether the @c std::numpunct's type is @c char or @c wchar_t.
|
|
*/
|
|
_LIBCPP_HIDE_FROM_ABI inline string __determine_grouping(ptrdiff_t __size, const string& __grouping) {
|
|
_LIBCPP_ASSERT(!__grouping.empty() && __size > __grouping[0],
|
|
"The slow grouping formatting is used while there will be no "
|
|
"separators written");
|
|
string __r;
|
|
auto __end = __grouping.end() - 1;
|
|
auto __ptr = __grouping.begin();
|
|
|
|
while (true) {
|
|
__size -= *__ptr;
|
|
if (__size > 0)
|
|
__r.push_back(*__ptr);
|
|
else {
|
|
// __size <= 0 so the value pushed will be <= *__ptr.
|
|
__r.push_back(*__ptr + __size);
|
|
return __r;
|
|
}
|
|
|
|
// Proceed to the next group.
|
|
if (__ptr != __end) {
|
|
do {
|
|
++__ptr;
|
|
// Skip grouping with a width of 0.
|
|
} while (*__ptr == 0 && __ptr != __end);
|
|
}
|
|
}
|
|
|
|
__libcpp_unreachable();
|
|
}
|
|
|
|
//
|
|
// Char
|
|
//
|
|
|
|
template <__fmt_char_type _CharT>
|
|
_LIBCPP_HIDE_FROM_ABI auto __format_char(
|
|
integral auto __value,
|
|
output_iterator<const _CharT&> auto __out_it,
|
|
__format_spec::__parsed_specifications<_CharT> __specs) -> decltype(__out_it) {
|
|
using _Tp = decltype(__value);
|
|
if constexpr (!same_as<_CharT, _Tp>) {
|
|
// cmp_less and cmp_greater can't be used for character types.
|
|
if constexpr (signed_integral<_CharT> == signed_integral<_Tp>) {
|
|
if (__value < numeric_limits<_CharT>::min() || __value > numeric_limits<_CharT>::max())
|
|
std::__throw_format_error("Integral value outside the range of the char type");
|
|
} else if constexpr (signed_integral<_CharT>) {
|
|
// _CharT is signed _Tp is unsigned
|
|
if (__value > static_cast<make_unsigned_t<_CharT>>(numeric_limits<_CharT>::max()))
|
|
std::__throw_format_error("Integral value outside the range of the char type");
|
|
} else {
|
|
// _CharT is unsigned _Tp is signed
|
|
if (__value < 0 || static_cast<make_unsigned_t<_Tp>>(__value) > numeric_limits<_CharT>::max())
|
|
std::__throw_format_error("Integral value outside the range of the char type");
|
|
}
|
|
}
|
|
|
|
const auto __c = static_cast<_CharT>(__value);
|
|
return __formatter::__write(_VSTD::addressof(__c), _VSTD::addressof(__c) + 1, _VSTD::move(__out_it), __specs);
|
|
}
|
|
|
|
//
|
|
// Integer
|
|
//
|
|
|
|
/** Wrapper around @ref to_chars, returning the output pointer. */
|
|
template <integral _Tp>
|
|
_LIBCPP_HIDE_FROM_ABI char* __to_buffer(char* __first, char* __last, _Tp __value, int __base) {
|
|
// TODO FMT Evaluate code overhead due to not calling the internal function
|
|
// directly. (Should be zero overhead.)
|
|
to_chars_result __r = _VSTD::to_chars(__first, __last, __value, __base);
|
|
_LIBCPP_ASSERT(__r.ec == errc(0), "Internal buffer too small");
|
|
return __r.ptr;
|
|
}
|
|
|
|
/**
|
|
* Helper to determine the buffer size to output a integer in Base @em x.
|
|
*
|
|
* There are several overloads for the supported bases. The function uses the
|
|
* base as template argument so it can be used in a constant expression.
|
|
*/
|
|
template <unsigned_integral _Tp, size_t _Base>
|
|
consteval size_t __buffer_size() noexcept
|
|
requires(_Base == 2)
|
|
{
|
|
return numeric_limits<_Tp>::digits // The number of binary digits.
|
|
+ 2 // Reserve space for the '0[Bb]' prefix.
|
|
+ 1; // Reserve space for the sign.
|
|
}
|
|
|
|
template <unsigned_integral _Tp, size_t _Base>
|
|
consteval size_t __buffer_size() noexcept
|
|
requires(_Base == 8)
|
|
{
|
|
return numeric_limits<_Tp>::digits // The number of binary digits.
|
|
/ 3 // Adjust to octal.
|
|
+ 1 // Turn floor to ceil.
|
|
+ 1 // Reserve space for the '0' prefix.
|
|
+ 1; // Reserve space for the sign.
|
|
}
|
|
|
|
template <unsigned_integral _Tp, size_t _Base>
|
|
consteval size_t __buffer_size() noexcept
|
|
requires(_Base == 10)
|
|
{
|
|
return numeric_limits<_Tp>::digits10 // The floored value.
|
|
+ 1 // Turn floor to ceil.
|
|
+ 1; // Reserve space for the sign.
|
|
}
|
|
|
|
template <unsigned_integral _Tp, size_t _Base>
|
|
consteval size_t __buffer_size() noexcept
|
|
requires(_Base == 16)
|
|
{
|
|
return numeric_limits<_Tp>::digits // The number of binary digits.
|
|
/ 4 // Adjust to hexadecimal.
|
|
+ 2 // Reserve space for the '0[Xx]' prefix.
|
|
+ 1; // Reserve space for the sign.
|
|
}
|
|
|
|
template <unsigned_integral _Tp, class _CharT, class _FormatContext>
|
|
_LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator __format_integer(
|
|
_Tp __value,
|
|
_FormatContext& __ctx,
|
|
__format_spec::__parsed_specifications<_CharT> __specs,
|
|
bool __negative,
|
|
char* __begin,
|
|
char* __end,
|
|
const char* __prefix,
|
|
int __base) {
|
|
char* __first = __formatter::__insert_sign(__begin, __negative, __specs.__std_.__sign_);
|
|
if (__specs.__std_.__alternate_form_ && __prefix)
|
|
while (*__prefix)
|
|
*__first++ = *__prefix++;
|
|
|
|
char* __last = __formatter::__to_buffer(__first, __end, __value, __base);
|
|
|
|
# ifndef _LIBCPP_HAS_NO_LOCALIZATION
|
|
if (__specs.__std_.__locale_specific_form_) {
|
|
const auto& __np = std::use_facet<numpunct<_CharT>>(__ctx.locale());
|
|
string __grouping = __np.grouping();
|
|
ptrdiff_t __size = __last - __first;
|
|
// Writing the grouped form has more overhead than the normal output
|
|
// routines. If there will be no separators written the locale-specific
|
|
// form is identical to the normal routine. Test whether to grouped form
|
|
// is required.
|
|
if (!__grouping.empty() && __size > __grouping[0])
|
|
return __formatter::__write_using_decimal_separators(
|
|
__ctx.out(),
|
|
__begin,
|
|
__first,
|
|
__last,
|
|
__formatter::__determine_grouping(__size, __grouping),
|
|
__np.thousands_sep(),
|
|
__specs);
|
|
}
|
|
# endif
|
|
auto __out_it = __ctx.out();
|
|
if (__specs.__alignment_ != __format_spec::__alignment::__zero_padding)
|
|
__first = __begin;
|
|
else {
|
|
// __buf contains [sign][prefix]data
|
|
// ^ location of __first
|
|
// The zero padding is done like:
|
|
// - Write [sign][prefix]
|
|
// - Write data right aligned with '0' as fill character.
|
|
__out_it = __formatter::__copy(__begin, __first, _VSTD::move(__out_it));
|
|
__specs.__alignment_ = __format_spec::__alignment::__right;
|
|
__specs.__fill_.__data[0] = _CharT('0');
|
|
int32_t __size = __first - __begin;
|
|
|
|
__specs.__width_ -= _VSTD::min(__size, __specs.__width_);
|
|
}
|
|
|
|
if (__specs.__std_.__type_ != __format_spec::__type::__hexadecimal_upper_case) [[likely]]
|
|
return __formatter::__write(__first, __last, __ctx.out(), __specs);
|
|
|
|
return __formatter::__write_transformed(__first, __last, __ctx.out(), __specs, __formatter::__hex_to_upper);
|
|
}
|
|
|
|
template <unsigned_integral _Tp, class _CharT, class _FormatContext>
|
|
_LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator
|
|
__format_integer(_Tp __value,
|
|
_FormatContext& __ctx,
|
|
__format_spec::__parsed_specifications<_CharT> __specs,
|
|
bool __negative = false) {
|
|
switch (__specs.__std_.__type_) {
|
|
case __format_spec::__type::__binary_lower_case: {
|
|
array<char, __formatter::__buffer_size<decltype(__value), 2>()> __array;
|
|
return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0b", 2);
|
|
}
|
|
case __format_spec::__type::__binary_upper_case: {
|
|
array<char, __formatter::__buffer_size<decltype(__value), 2>()> __array;
|
|
return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0B", 2);
|
|
}
|
|
case __format_spec::__type::__octal: {
|
|
// Octal is special; if __value == 0 there's no prefix.
|
|
array<char, __formatter::__buffer_size<decltype(__value), 8>()> __array;
|
|
return __formatter::__format_integer(
|
|
__value, __ctx, __specs, __negative, __array.begin(), __array.end(), __value != 0 ? "0" : nullptr, 8);
|
|
}
|
|
case __format_spec::__type::__default:
|
|
case __format_spec::__type::__decimal: {
|
|
array<char, __formatter::__buffer_size<decltype(__value), 10>()> __array;
|
|
return __formatter::__format_integer(
|
|
__value, __ctx, __specs, __negative, __array.begin(), __array.end(), nullptr, 10);
|
|
}
|
|
case __format_spec::__type::__hexadecimal_lower_case: {
|
|
array<char, __formatter::__buffer_size<decltype(__value), 16>()> __array;
|
|
return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0x", 16);
|
|
}
|
|
case __format_spec::__type::__hexadecimal_upper_case: {
|
|
array<char, __formatter::__buffer_size<decltype(__value), 16>()> __array;
|
|
return __formatter::__format_integer(__value, __ctx, __specs, __negative, __array.begin(), __array.end(), "0X", 16);
|
|
}
|
|
default:
|
|
_LIBCPP_ASSERT(false, "The parse function should have validated the type");
|
|
__libcpp_unreachable();
|
|
}
|
|
}
|
|
|
|
template <signed_integral _Tp, class _CharT, class _FormatContext>
|
|
_LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator
|
|
__format_integer(_Tp __value, _FormatContext& __ctx, __format_spec::__parsed_specifications<_CharT> __specs) {
|
|
// Depending on the std-format-spec string the sign and the value
|
|
// might not be outputted together:
|
|
// - alternate form may insert a prefix string.
|
|
// - zero-padding may insert additional '0' characters.
|
|
// Therefore the value is processed as a positive unsigned value.
|
|
// The function @ref __insert_sign will a '-' when the value was negative.
|
|
auto __r = std::__to_unsigned_like(__value);
|
|
bool __negative = __value < 0;
|
|
if (__negative)
|
|
__r = std::__complement(__r);
|
|
|
|
return __formatter::__format_integer(__r, __ctx, __specs, __negative);
|
|
}
|
|
|
|
//
|
|
// Formatter arithmetic (bool)
|
|
//
|
|
|
|
template <class _CharT>
|
|
struct _LIBCPP_TEMPLATE_VIS __bool_strings;
|
|
|
|
template <>
|
|
struct _LIBCPP_TEMPLATE_VIS __bool_strings<char> {
|
|
static constexpr string_view __true{"true"};
|
|
static constexpr string_view __false{"false"};
|
|
};
|
|
|
|
# ifndef _LIBCPP_HAS_NO_WIDE_CHARACTERS
|
|
template <>
|
|
struct _LIBCPP_TEMPLATE_VIS __bool_strings<wchar_t> {
|
|
static constexpr wstring_view __true{L"true"};
|
|
static constexpr wstring_view __false{L"false"};
|
|
};
|
|
# endif
|
|
|
|
template <class _CharT, class _FormatContext>
|
|
_LIBCPP_HIDE_FROM_ABI typename _FormatContext::iterator
|
|
__format_bool(bool __value, _FormatContext& __ctx, __format_spec::__parsed_specifications<_CharT> __specs) {
|
|
# ifndef _LIBCPP_HAS_NO_LOCALIZATION
|
|
if (__specs.__std_.__locale_specific_form_) {
|
|
const auto& __np = std::use_facet<numpunct<_CharT>>(__ctx.locale());
|
|
basic_string<_CharT> __str = __value ? __np.truename() : __np.falsename();
|
|
return __formatter::__write_string_no_precision(basic_string_view<_CharT>{__str}, __ctx.out(), __specs);
|
|
}
|
|
# endif
|
|
basic_string_view<_CharT> __str =
|
|
__value ? __formatter::__bool_strings<_CharT>::__true : __formatter::__bool_strings<_CharT>::__false;
|
|
return __formatter::__write(__str.begin(), __str.end(), __ctx.out(), __specs);
|
|
}
|
|
|
|
} // namespace __formatter
|
|
|
|
#endif //_LIBCPP_STD_VER >= 20
|
|
|
|
_LIBCPP_END_NAMESPACE_STD
|
|
|
|
_LIBCPP_POP_MACROS
|
|
|
|
#endif // _LIBCPP___FORMAT_FORMATTER_INTEGRAL_H
|