From a265e25b7924d7edec77c28ee76182e69bfcc3fe Mon Sep 17 00:00:00 2001
From: Victor Zverovich
Date: Tue, 19 May 2020 12:56:06 -0700
Subject: [PATCH] Optimize small string parsing

---
 include/fmt/format.h | 71 +++++++++++++++++++++++++++++---------------
 1 file changed, 47 insertions(+), 24 deletions(-)

diff --git a/include/fmt/format.h b/include/fmt/format.h
index 30de8ec4..928227bd 100644
--- a/include/fmt/format.h
+++ b/include/fmt/format.h
@@ -288,7 +288,6 @@ template <> constexpr int num_bits<fallback_uintptr>() {
                           std::numeric_limits<unsigned char>::digits);
 }
 
-
 // A workaround for gcc 4.8 to make void_t work in a SFINAE context.
 template <typename... Ts> struct void_t_impl { using type = void; };
 
@@ -2508,9 +2507,55 @@ template <typename Handler, typename Char> struct id_adapter {
   Handler& handler;
 };
 
+template <typename Char, typename Handler>
+FMT_CONSTEXPR FMT_INLINE const Char* parse_replacement_field(
+    const Char* begin, const Char* end, Handler&& handler) {
+  ++begin;
+  if (begin == end) return handler.on_error("invalid format string"), end;
+  if (static_cast<char>(*begin) == '}') {
+    handler.on_arg_id();
+    handler.on_replacement_field(begin);
+  } else if (*begin == '{') {
+    handler.on_text(begin, begin + 1);
+  } else {
+    begin = parse_arg_id(begin, end, id_adapter<Handler, Char>{handler});
+    Char c = begin != end ? *begin : Char();
+    if (c == '}') {
+      handler.on_replacement_field(begin);
+    } else if (c == ':') {
+      begin = handler.on_format_specs(begin + 1, end);
+      if (begin == end || *begin != '}')
+        return handler.on_error("unknown format specifier"), end;
+    } else {
+      return handler.on_error("missing '}' in format string"), end;
+    }
+  }
+  return begin + 1;
+}
+
 template <bool IS_CONSTEXPR, typename Char, typename Handler>
 FMT_CONSTEXPR void parse_format_string(basic_string_view<Char> format_str,
                                        Handler&& handler) {
+  auto begin = format_str.data();
+  auto end = begin + format_str.size();
+  if (end - begin < 32) {
+    // Use a simple loop instead of memchr for small strings.
+    const Char* p = begin;
+    while (p != end) {
+      auto c = *p++;
+      if (c == '{') {
+        handler.on_text(begin, p - 1);
+        begin = p = parse_replacement_field(p - 1, end, handler);
+      } else if (c == '}') {
+        if (p == end || *p != '}')
+          return handler.on_error("unmatched '}' in format string");
+        handler.on_text(begin, p);
+        begin = ++p;
+      }
+    }
+    handler.on_text(begin, end);
+    return;
+  }
   struct writer {
     FMT_CONSTEXPR void operator()(const Char* begin, const Char* end) {
       if (begin + 1 >= end) {
@@ -2532,8 +2577,6 @@ FMT_CONSTEXPR void parse_format_string(basic_string_view<Char> format_str,
     }
     Handler& handler_;
   } write{handler};
-  auto begin = format_str.data();
-  auto end = begin + format_str.size();
   while (begin != end) {
     // Doing two passes with memchr (one for '{' and another for '}') is up to
     // 2.5x faster than the naive one-pass implementation on big format strings.
@@ -2541,27 +2584,7 @@ FMT_CONSTEXPR void parse_format_string(basic_string_view<Char> format_str,
     if (*begin != '{' && !find<IS_CONSTEXPR>(begin + 1, end, '{', p))
       return write(begin, end);
     write(begin, p);
-    ++p;
-    if (p == end) return handler.on_error("invalid format string");
-    if (static_cast<char>(*p) == '}') {
-      handler.on_arg_id();
-      handler.on_replacement_field(p);
-    } else if (*p == '{') {
-      handler.on_text(p, p + 1);
-    } else {
-      p = parse_arg_id(p, end, id_adapter<Handler, Char>{handler});
-      Char c = p != end ? *p : Char();
-      if (c == '}') {
-        handler.on_replacement_field(p);
-      } else if (c == ':') {
-        p = handler.on_format_specs(p + 1, end);
-        if (p == end || *p != '}')
-          return handler.on_error("unknown format specifier");
-      } else {
-        return handler.on_error("missing '}' in format string");
-      }
-    }
-    begin = p + 1;
+    begin = parse_replacement_field(p, end, handler);
   }
 }
 