From 4e34d4d3eebd5756933ed1ed5b7026cebd6f43f8 Mon Sep 17 00:00:00 2001 From: Vladislav Shchapov Date: Fri, 26 Nov 2021 21:03:14 +0500 Subject: [PATCH 1/3] Move fmt::detail::formatbuf to format.h --- include/fmt/format.h | 32 ++++++++++++++++++++++++++++++++ include/fmt/ostream.h | 32 +------------------------------- 2 files changed, 33 insertions(+), 31 deletions(-) diff --git a/include/fmt/format.h b/include/fmt/format.h index 3cf123ee4e10..52b16779ce8d 100644 --- a/include/fmt/format.h +++ b/include/fmt/format.h @@ -265,6 +265,38 @@ FMT_END_NAMESPACE FMT_BEGIN_NAMESPACE namespace detail { + +template class formatbuf : public Streambuf { + private: + using char_type = typename Streambuf::char_type; + using streamsize = decltype(std::declval().sputn(nullptr, 0)); + using int_type = typename Streambuf::int_type; + using traits_type = typename Streambuf::traits_type; + + buffer& buffer_; + + public: + explicit formatbuf(buffer& buf) : buffer_(buf) {} + + protected: + // The put area is always empty. This makes the implementation simpler and has + // the advantage that the streambuf and the buffer are always in sync and + // sputc never writes into uninitialized memory. A disadvantage is that each + // call to sputc always results in a (virtual) call to overflow. There is no + // disadvantage here for sputn since this always results in a call to xsputn. + + auto overflow(int_type ch) -> int_type override { + if (!traits_type::eq_int_type(ch, traits_type::eof())) + buffer_.push_back(static_cast(ch)); + return ch; + } + + auto xsputn(const char_type* s, streamsize count) -> streamsize override { + buffer_.append(s, s + count); + return count; + } +}; + // An equivalent of `*reinterpret_cast(&source)` that doesn't have // undefined behavior (e.g. due to type aliasing). // Example: uint64_t d = bit_cast(2.718); diff --git a/include/fmt/ostream.h b/include/fmt/ostream.h index dd005fa144f5..0ebdd60f14bf 100644 --- a/include/fmt/ostream.h +++ b/include/fmt/ostream.h @@ -18,36 +18,6 @@ template class basic_printf_context; namespace detail { -template class formatbuf : public std::basic_streambuf { - private: - using int_type = typename std::basic_streambuf::int_type; - using traits_type = typename std::basic_streambuf::traits_type; - - buffer& buffer_; - - public: - explicit formatbuf(buffer& buf) : buffer_(buf) {} - - protected: - // The put area is always empty. This makes the implementation simpler and has - // the advantage that the streambuf and the buffer are always in sync and - // sputc never writes into uninitialized memory. A disadvantage is that each - // call to sputc always results in a (virtual) call to overflow. There is no - // disadvantage here for sputn since this always results in a call to xsputn. - - auto overflow(int_type ch = traits_type::eof()) -> int_type override { - if (!traits_type::eq_int_type(ch, traits_type::eof())) - buffer_.push_back(static_cast(ch)); - return ch; - } - - auto xsputn(const Char* s, std::streamsize count) - -> std::streamsize override { - buffer_.append(s, s + count); - return count; - } -}; - // Checks if T has a user-defined operator<<. template class is_streamable { @@ -97,7 +67,7 @@ void write_buffer(std::basic_ostream& os, buffer& buf) { template void format_value(buffer& buf, const T& value, locale_ref loc = locale_ref()) { - auto&& format_buf = formatbuf(buf); + auto&& format_buf = formatbuf>(buf); auto&& output = std::basic_ostream(&format_buf); #if !defined(FMT_STATIC_THOUSANDS_SEPARATOR) if (loc) output.imbue(loc.get()); From e10e6854443899b568d7585ca2420c72cf12ddc5 Mon Sep 17 00:00:00 2001 From: Vladislav Shchapov Date: Thu, 25 Nov 2021 23:33:01 +0500 Subject: [PATCH 2/3] Replace std::basic_ostringstream to std::basic_ostream with custom formatbuf --- include/fmt/chrono.h | 47 +++++++++++++++++++++++--------------------- 1 file changed, 25 insertions(+), 22 deletions(-) diff --git a/include/fmt/chrono.h b/include/fmt/chrono.h index d54c8ae79ec0..76b2330b4b45 100644 --- a/include/fmt/chrono.h +++ b/include/fmt/chrono.h @@ -11,8 +11,9 @@ #include #include #include +#include #include -#include +#include #include #include "format.h" @@ -291,23 +292,24 @@ inline null<> gmtime_r(...) { return null<>(); } inline null<> gmtime_s(...) { return null<>(); } template -inline auto do_write(const std::tm& time, const std::locale& loc, char format, - char modifier) -> std::basic_string { - auto&& os = std::basic_ostringstream(); +inline void do_write(buffer& buf, const std::tm& time, + const std::locale& loc, char format, char modifier) { + auto&& format_buf = formatbuf>(buf); + auto&& os = std::basic_ostream(&format_buf); os.imbue(loc); using iterator = std::ostreambuf_iterator; const auto& facet = std::use_facet>(loc); auto end = facet.put(os, os, Char(' '), &time, format, modifier); if (end.failed()) FMT_THROW(format_error("failed to format time")); - return std::move(os).str(); } template ::value)> auto write(OutputIt out, const std::tm& time, const std::locale& loc, char format, char modifier = 0) -> OutputIt { - auto str = do_write(time, loc, format, modifier); - return std::copy(str.begin(), str.end(), out); + auto&& buffer = get_buffer(out); + do_write(buffer, time, loc, format, modifier); + return buffer.out(); } inline const std::locale& get_classic_locale() { @@ -319,7 +321,8 @@ template ::value)> auto write(OutputIt out, const std::tm& time, const std::locale& loc, char format, char modifier = 0) -> OutputIt { - auto str = do_write(time, loc, format, modifier); + auto&& buffer = basic_memory_buffer(); + do_write(buffer, time, loc, format, modifier); if (detail::is_utf8() && loc != get_classic_locale()) { // char16_t and char32_t codecvts are broken in MSVC (linkage errors) and // gcc-4. @@ -347,11 +350,11 @@ auto write(OutputIt out, const std::tm& time, const std::locale& loc, code_unit* to_next = nullptr; constexpr size_t buf_size = 32; code_unit buf[buf_size] = {}; - auto result = f.in(mb, str.data(), str.data() + str.size(), from_next, buf, - buf + buf_size, to_next); + auto result = f.in(mb, buffer.data(), buffer.data() + buffer.size(), + from_next, buf, buf + buf_size, to_next); if (result != std::codecvt_base::ok) FMT_THROW(format_error("failed to format time")); - str.clear(); + buffer.clear(); for (code_unit* p = buf; p != to_next; ++p) { uint32_t c = static_cast(*p); if (sizeof(code_unit) == 2 && c >= 0xd800 && c <= 0xdfff) { @@ -363,25 +366,25 @@ auto write(OutputIt out, const std::tm& time, const std::locale& loc, c = (c << 10) + static_cast(*p) - 0x35fdc00; } if (c < 0x80) { - str.push_back(static_cast(c)); + buffer.push_back(static_cast(c)); } else if (c < 0x800) { - str.push_back(static_cast(0xc0 | (c >> 6))); - str.push_back(static_cast(0x80 | (c & 0x3f))); + buffer.push_back(static_cast(0xc0 | (c >> 6))); + buffer.push_back(static_cast(0x80 | (c & 0x3f))); } else if ((c >= 0x800 && c <= 0xd7ff) || (c >= 0xe000 && c <= 0xffff)) { - str.push_back(static_cast(0xe0 | (c >> 12))); - str.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); - str.push_back(static_cast(0x80 | (c & 0x3f))); + buffer.push_back(static_cast(0xe0 | (c >> 12))); + buffer.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); + buffer.push_back(static_cast(0x80 | (c & 0x3f))); } else if (c >= 0x10000 && c <= 0x10ffff) { - str.push_back(static_cast(0xf0 | (c >> 18))); - str.push_back(static_cast(0x80 | ((c & 0x3ffff) >> 12))); - str.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); - str.push_back(static_cast(0x80 | (c & 0x3f))); + buffer.push_back(static_cast(0xf0 | (c >> 18))); + buffer.push_back(static_cast(0x80 | ((c & 0x3ffff) >> 12))); + buffer.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); + buffer.push_back(static_cast(0x80 | (c & 0x3f))); } else { FMT_THROW(format_error("failed to format time")); } } } - return std::copy(str.begin(), str.end(), out); + return copy_str(buffer.data(), buffer.data() + buffer.size(), out); } } // namespace detail From 608a9a3441c374c41db9c5571c570e8faa3db0a1 Mon Sep 17 00:00:00 2001 From: Vladislav Shchapov Date: Sat, 27 Nov 2021 14:25:48 +0500 Subject: [PATCH 3/3] Use tm.tm_zone --- include/fmt/chrono.h | 173 ++++++++++++++++++++++++++++--------------- 1 file changed, 112 insertions(+), 61 deletions(-) diff --git a/include/fmt/chrono.h b/include/fmt/chrono.h index 76b2330b4b45..5825a810081d 100644 --- a/include/fmt/chrono.h +++ b/include/fmt/chrono.h @@ -291,38 +291,42 @@ inline null<> localtime_s(...) { return null<>(); } inline null<> gmtime_r(...) { return null<>(); } inline null<> gmtime_s(...) { return null<>(); } -template -inline void do_write(buffer& buf, const std::tm& time, - const std::locale& loc, char format, char modifier) { - auto&& format_buf = formatbuf>(buf); - auto&& os = std::basic_ostream(&format_buf); - os.imbue(loc); - using iterator = std::ostreambuf_iterator; - const auto& facet = std::use_facet>(loc); - auto end = facet.put(os, os, Char(' '), &time, format, modifier); - if (end.failed()) FMT_THROW(format_error("failed to format time")); -} - -template ::value)> -auto write(OutputIt out, const std::tm& time, const std::locale& loc, - char format, char modifier = 0) -> OutputIt { - auto&& buffer = get_buffer(out); - do_write(buffer, time, loc, format, modifier); - return buffer.out(); -} - inline const std::locale& get_classic_locale() { static const auto& locale = std::locale::classic(); return locale; } -template ::value)> -auto write(OutputIt out, const std::tm& time, const std::locale& loc, - char format, char modifier = 0) -> OutputIt { - auto&& buffer = basic_memory_buffer(); - do_write(buffer, time, loc, format, modifier); +template struct codecvt_result { + static constexpr const size_t max_size = 32; + CodeUnit buf[max_size]; + CodeUnit* end; +}; +template +constexpr const size_t codecvt_result::max_size; + +template +void write_codecvt(codecvt_result& out, string_view in_buf, + const std::locale& loc) { + using codecvt = std::codecvt; +#if FMT_CLANG_VERSION +# pragma clang diagnostic push +# pragma clang diagnostic ignored "-Wdeprecated" + auto& f = std::use_facet(loc); +# pragma clang diagnostic pop +#else + auto& f = std::use_facet(loc); +#endif + auto mb = std::mbstate_t(); + const char* from_next = nullptr; + auto result = f.in(mb, in_buf.begin(), in_buf.end(), from_next, + std::begin(out.buf), std::end(out.buf), out.end); + if (result != std::codecvt_base::ok) + FMT_THROW(format_error("failed to format time")); +} + +template +auto write_encoded_tm_str(OutputIt out, string_view in, const std::locale& loc) + -> OutputIt { if (detail::is_utf8() && loc != get_classic_locale()) { // char16_t and char32_t codecvts are broken in MSVC (linkage errors) and // gcc-4. @@ -335,56 +339,89 @@ auto write(OutputIt out, const std::tm& time, const std::locale& loc, using code_unit = char32_t; #endif - using codecvt = std::codecvt; -#if FMT_CLANG_VERSION -# pragma clang diagnostic push -# pragma clang diagnostic ignored "-Wdeprecated" - auto& f = std::use_facet(loc); -# pragma clang diagnostic pop -#else - auto& f = std::use_facet(loc); -#endif - - auto mb = std::mbstate_t(); - const char* from_next = nullptr; - code_unit* to_next = nullptr; - constexpr size_t buf_size = 32; - code_unit buf[buf_size] = {}; - auto result = f.in(mb, buffer.data(), buffer.data() + buffer.size(), - from_next, buf, buf + buf_size, to_next); - if (result != std::codecvt_base::ok) - FMT_THROW(format_error("failed to format time")); - buffer.clear(); - for (code_unit* p = buf; p != to_next; ++p) { + using unit_t = codecvt_result; + unit_t unit; + write_codecvt(unit, in, loc); + // In UTF-8 is used one to four one-byte code units. + auto&& buf = basic_memory_buffer(); + for (code_unit* p = unit.buf; p != unit.end; ++p) { uint32_t c = static_cast(*p); if (sizeof(code_unit) == 2 && c >= 0xd800 && c <= 0xdfff) { // surrogate pair ++p; - if (p == to_next || (c & 0xfc00) != 0xd800 || (*p & 0xfc00) != 0xdc00) { + if (p == unit.end || (c & 0xfc00) != 0xd800 || + (*p & 0xfc00) != 0xdc00) { FMT_THROW(format_error("failed to format time")); } c = (c << 10) + static_cast(*p) - 0x35fdc00; } if (c < 0x80) { - buffer.push_back(static_cast(c)); + buf.push_back(static_cast(c)); } else if (c < 0x800) { - buffer.push_back(static_cast(0xc0 | (c >> 6))); - buffer.push_back(static_cast(0x80 | (c & 0x3f))); + buf.push_back(static_cast(0xc0 | (c >> 6))); + buf.push_back(static_cast(0x80 | (c & 0x3f))); } else if ((c >= 0x800 && c <= 0xd7ff) || (c >= 0xe000 && c <= 0xffff)) { - buffer.push_back(static_cast(0xe0 | (c >> 12))); - buffer.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); - buffer.push_back(static_cast(0x80 | (c & 0x3f))); + buf.push_back(static_cast(0xe0 | (c >> 12))); + buf.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); + buf.push_back(static_cast(0x80 | (c & 0x3f))); } else if (c >= 0x10000 && c <= 0x10ffff) { - buffer.push_back(static_cast(0xf0 | (c >> 18))); - buffer.push_back(static_cast(0x80 | ((c & 0x3ffff) >> 12))); - buffer.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); - buffer.push_back(static_cast(0x80 | (c & 0x3f))); + buf.push_back(static_cast(0xf0 | (c >> 18))); + buf.push_back(static_cast(0x80 | ((c & 0x3ffff) >> 12))); + buf.push_back(static_cast(0x80 | ((c & 0xfff) >> 6))); + buf.push_back(static_cast(0x80 | (c & 0x3f))); } else { FMT_THROW(format_error("failed to format time")); } } + return copy_str(buf.data(), buf.data() + buf.size(), out); } - return copy_str(buffer.data(), buffer.data() + buffer.size(), out); + return copy_str(in.data(), in.data() + in.size(), out); +} + +template ::value)> +auto write_tm_str(OutputIt out, string_view sv, const std::locale& loc) + -> OutputIt { + codecvt_result unit; + write_codecvt(unit, sv, loc); + return copy_str(unit.buf, unit.end, out); +} + +template ::value)> +auto write_tm_str(OutputIt out, string_view sv, const std::locale& loc) + -> OutputIt { + return write_encoded_tm_str(out, sv, loc); +} + +template +inline void do_write(buffer& buf, const std::tm& time, + const std::locale& loc, char format, char modifier) { + auto&& format_buf = formatbuf>(buf); + auto&& os = std::basic_ostream(&format_buf); + os.imbue(loc); + using iterator = std::ostreambuf_iterator; + const auto& facet = std::use_facet>(loc); + auto end = facet.put(os, os, Char(' '), &time, format, modifier); + if (end.failed()) FMT_THROW(format_error("failed to format time")); +} + +template ::value)> +auto write(OutputIt out, const std::tm& time, const std::locale& loc, + char format, char modifier = 0) -> OutputIt { + auto&& buf = get_buffer(out); + do_write(buf, time, loc, format, modifier); + return buf.out(); +} + +template ::value)> +auto write(OutputIt out, const std::tm& time, const std::locale& loc, + char format, char modifier = 0) -> OutputIt { + auto&& buf = basic_memory_buffer(); + do_write(buf, time, loc, format, modifier); + return write_encoded_tm_str(out, string_view(buf.data(), buf.size()), loc); } } // namespace detail @@ -881,6 +918,12 @@ template struct has_member_data_tm_gmtoff> : std::true_type {}; +template +struct has_member_data_tm_zone : std::false_type {}; +template +struct has_member_data_tm_zone> + : std::true_type {}; + #if defined(_WIN32) inline void tzset_once() { static bool init = []() -> bool { @@ -1038,6 +1081,14 @@ template class tm_writer { #endif } + void format_tz_name_impl(std::true_type) { + if (is_classic_) + out_ = write_tm_str(out_, tm_.tm_zone, loc_); + else + format_localized('Z'); + } + void format_tz_name_impl(std::false_type) { format_localized('Z'); } + void format_localized(char format, char modifier = 0) { out_ = write(out_, tm_, loc_, format, modifier); } @@ -1147,7 +1198,7 @@ template class tm_writer { void on_utc_offset() { format_utc_offset_impl(has_member_data_tm_gmtoff{}); } - void on_tz_name() { format_localized('Z'); } + void on_tz_name() { format_tz_name_impl(has_member_data_tm_zone{}); } void on_year(numeric_system ns) { if (is_classic_ || ns == numeric_system::standard)