-- 70f43a482d7d4ae4a255f17ca02b0106653dd600 by Shaindel Schwartz <shaindel@google.com>: Internal change PiperOrigin-RevId: 201571193 -- 93e6e9c2e683158be49d9dd1f5cb1a91d0c0f556 by Abseil Team <absl-team@google.com>: Internal change. PiperOrigin-RevId: 201567108 -- fbd8ee94fbe9f2448e5adf5e88706f9c8216048f by Juemin Yang <jueminyang@google.com>: str_format release PiperOrigin-RevId: 201565129 -- 387faa301555a8a888c4429df52734aa806dca46 by Abseil Team <absl-team@google.com>: Adds a defaulted allocator parameter to the size_type constructor of InlinedVector PiperOrigin-RevId: 201558711 -- 39b15ea2c68d7129d70cbde7e71af900032595ec by Matt Calabrese <calabrese@google.com>: Update the variant implementation to eliminate unnecessary checking on alternative access when the index is known or required to be correct. PiperOrigin-RevId: 201529535 -- adab77f1f7bb363aa534297f22aae2b0f08889ea by Abseil Team <absl-team@google.com>: Import of CCTZ from GitHub. PiperOrigin-RevId: 201458388 -- a701dc0ba62e3cadf0de14203415b91df4ee8151 by Greg Falcon <gfalcon@google.com>: Internal cleanup PiperOrigin-RevId: 201394836 -- 8a7191410b8f440fdfa27f722ff05e451502ab61 by Abseil Team <absl-team@google.com>: Import of CCTZ from GitHub. PiperOrigin-RevId: 201369269 GitOrigin-RevId: 70f43a482d7d4ae4a255f17ca02b0106653dd600 Change-Id: I8ab073b30b4e27405a3b6da2c826bb4f3f0b9af6
		
			
				
	
	
		
			291 lines
		
	
	
	
		
			10 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			291 lines
		
	
	
	
		
			10 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| #ifndef ABSL_STRINGS_INTERNAL_STR_FORMAT_PARSER_H_
 | |
| #define ABSL_STRINGS_INTERNAL_STR_FORMAT_PARSER_H_
 | |
| 
 | |
| #include <limits.h>
 | |
| #include <stddef.h>
 | |
| #include <stdlib.h>
 | |
| 
 | |
| #include <cassert>
 | |
| #include <initializer_list>
 | |
| #include <iosfwd>
 | |
| #include <iterator>
 | |
| #include <memory>
 | |
| #include <vector>
 | |
| 
 | |
| #include "absl/strings/internal/str_format/checker.h"
 | |
| #include "absl/strings/internal/str_format/extension.h"
 | |
| 
 | |
| namespace absl {
 | |
| namespace str_format_internal {
 | |
| 
 | |
| // The analyzed properties of a single specified conversion.
 | |
| struct UnboundConversion {
 | |
|   UnboundConversion()
 | |
|       : flags() /* This is required to zero all the fields of flags. */ {
 | |
|     flags.basic = true;
 | |
|   }
 | |
| 
 | |
|   class InputValue {
 | |
|    public:
 | |
|     void set_value(int value) {
 | |
|       assert(value >= 0);
 | |
|       value_ = value;
 | |
|     }
 | |
|     int value() const { return value_; }
 | |
| 
 | |
|     // Marks the value as "from arg". aka the '*' format.
 | |
|     // Requires `value >= 1`.
 | |
|     // When set, is_from_arg() return true and get_from_arg() returns the
 | |
|     // original value.
 | |
|     // `value()`'s return value is unspecfied in this state.
 | |
|     void set_from_arg(int value) {
 | |
|       assert(value > 0);
 | |
|       value_ = -value - 1;
 | |
|     }
 | |
|     bool is_from_arg() const { return value_ < -1; }
 | |
|     int get_from_arg() const {
 | |
|       assert(is_from_arg());
 | |
|       return -value_ - 1;
 | |
|     }
 | |
| 
 | |
|    private:
 | |
|     int value_ = -1;
 | |
|   };
 | |
| 
 | |
|   // No need to initialize. It will always be set in the parser.
 | |
|   int arg_position;
 | |
| 
 | |
|   InputValue width;
 | |
|   InputValue precision;
 | |
| 
 | |
|   Flags flags;
 | |
|   LengthMod length_mod;
 | |
|   ConversionChar conv;
 | |
| };
 | |
| 
 | |
| // Consume conversion spec prefix (not including '%') of '*src' if valid.
 | |
| // Examples of valid specs would be e.g.: "s", "d", "-12.6f".
 | |
| // If valid, the front of src is advanced such that src becomes the
 | |
| // part following the conversion spec, and the spec part is broken down and
 | |
| // returned in 'conv'.
 | |
| // If invalid, returns false and leaves 'src' unmodified.
 | |
| // For example:
 | |
| //   Given "d9", returns "d", and leaves src="9",
 | |
| //   Given "!", returns "" and leaves src="!".
 | |
| bool ConsumeUnboundConversion(string_view* src, UnboundConversion* conv,
 | |
|                               int* next_arg);
 | |
| 
 | |
| // Parse the format std::string provided in 'src' and pass the identified items into
 | |
| // 'consumer'.
 | |
| // Text runs will be passed by calling
 | |
| //   Consumer::Append(string_view);
 | |
| // ConversionItems will be passed by calling
 | |
| //   Consumer::ConvertOne(UnboundConversion, string_view);
 | |
| // In the case of ConvertOne, the string_view that is passed is the
 | |
| // portion of the format std::string corresponding to the conversion, not including
 | |
| // the leading %. On success, it returns true. On failure, it stops and returns
 | |
| // false.
 | |
| template <typename Consumer>
 | |
| bool ParseFormatString(string_view src, Consumer consumer) {
 | |
|   int next_arg = 0;
 | |
|   while (!src.empty()) {
 | |
|     const char* percent =
 | |
|         static_cast<const char*>(memchr(src.begin(), '%', src.size()));
 | |
|     if (!percent) {
 | |
|       // We found the last substring.
 | |
|       return consumer.Append(src);
 | |
|     }
 | |
|     // We found a percent, so push the text run then process the percent.
 | |
|     size_t percent_loc = percent - src.data();
 | |
|     if (!consumer.Append(string_view(src.data(), percent_loc))) return false;
 | |
|     if (percent + 1 >= src.end()) return false;
 | |
| 
 | |
|     UnboundConversion conv;
 | |
| 
 | |
|     switch (percent[1]) {
 | |
|       case '%':
 | |
|         if (!consumer.Append("%")) return false;
 | |
|         src.remove_prefix(percent_loc + 2);
 | |
|         continue;
 | |
| 
 | |
| #define PARSER_CASE(ch)                                     \
 | |
|   case #ch[0]:                                              \
 | |
|     src.remove_prefix(percent_loc + 2);                     \
 | |
|     conv.conv = ConversionChar::FromId(ConversionChar::ch); \
 | |
|     conv.arg_position = ++next_arg;                         \
 | |
|     break;
 | |
|         ABSL_CONVERSION_CHARS_EXPAND_(PARSER_CASE, );
 | |
| #undef PARSER_CASE
 | |
| 
 | |
|       default:
 | |
|         src.remove_prefix(percent_loc + 1);
 | |
|         if (!ConsumeUnboundConversion(&src, &conv, &next_arg)) return false;
 | |
|         break;
 | |
|     }
 | |
|     if (next_arg == 0) {
 | |
|       // This indicates an error in the format std::string.
 | |
|       // The only way to get next_arg == 0 is to have a positional argument
 | |
|       // first which sets next_arg to -1 and then a non-positional argument
 | |
|       // which does ++next_arg.
 | |
|       // Checking here seems to be the cheapeast place to do it.
 | |
|       return false;
 | |
|     }
 | |
|     if (!consumer.ConvertOne(
 | |
|             conv, string_view(percent + 1, src.data() - (percent + 1)))) {
 | |
|       return false;
 | |
|     }
 | |
|   }
 | |
|   return true;
 | |
| }
 | |
| 
 | |
| // Always returns true, or fails to compile in a constexpr context if s does not
 | |
| // point to a constexpr char array.
 | |
| constexpr bool EnsureConstexpr(string_view s) {
 | |
|   return s.empty() || s[0] == s[0];
 | |
| }
 | |
| 
 | |
| class ParsedFormatBase {
 | |
|  public:
 | |
|   explicit ParsedFormatBase(string_view format, bool allow_ignored,
 | |
|                             std::initializer_list<Conv> convs);
 | |
| 
 | |
|   ParsedFormatBase(const ParsedFormatBase& other) { *this = other; }
 | |
| 
 | |
|   ParsedFormatBase(ParsedFormatBase&& other) { *this = std::move(other); }
 | |
| 
 | |
|   ParsedFormatBase& operator=(const ParsedFormatBase& other) {
 | |
|     if (this == &other) return *this;
 | |
|     has_error_ = other.has_error_;
 | |
|     items_ = other.items_;
 | |
|     size_t text_size = items_.empty() ? 0 : items_.back().text_end;
 | |
|     data_.reset(new char[text_size]);
 | |
|     memcpy(data_.get(), other.data_.get(), text_size);
 | |
|     return *this;
 | |
|   }
 | |
| 
 | |
|   ParsedFormatBase& operator=(ParsedFormatBase&& other) {
 | |
|     if (this == &other) return *this;
 | |
|     has_error_ = other.has_error_;
 | |
|     data_ = std::move(other.data_);
 | |
|     items_ = std::move(other.items_);
 | |
|     // Reset the vector to make sure the invariants hold.
 | |
|     other.items_.clear();
 | |
|     return *this;
 | |
|   }
 | |
| 
 | |
|   template <typename Consumer>
 | |
|   bool ProcessFormat(Consumer consumer) const {
 | |
|     const char* const base = data_.get();
 | |
|     string_view text(base, 0);
 | |
|     for (const auto& item : items_) {
 | |
|       text = string_view(text.end(), (base + item.text_end) - text.end());
 | |
|       if (item.is_conversion) {
 | |
|         if (!consumer.ConvertOne(item.conv, text)) return false;
 | |
|       } else {
 | |
|         if (!consumer.Append(text)) return false;
 | |
|       }
 | |
|     }
 | |
|     return !has_error_;
 | |
|   }
 | |
| 
 | |
|   bool has_error() const { return has_error_; }
 | |
| 
 | |
|  private:
 | |
|   // Returns whether the conversions match and if !allow_ignored it verifies
 | |
|   // that all conversions are used by the format.
 | |
|   bool MatchesConversions(bool allow_ignored,
 | |
|                           std::initializer_list<Conv> convs) const;
 | |
| 
 | |
|   struct ParsedFormatConsumer;
 | |
| 
 | |
|   struct ConversionItem {
 | |
|     bool is_conversion;
 | |
|     // Points to the past-the-end location of this element in the data_ array.
 | |
|     size_t text_end;
 | |
|     UnboundConversion conv;
 | |
|   };
 | |
| 
 | |
|   bool has_error_;
 | |
|   std::unique_ptr<char[]> data_;
 | |
|   std::vector<ConversionItem> items_;
 | |
| };
 | |
| 
 | |
| 
 | |
| // A value type representing a preparsed format.  These can be created, copied
 | |
| // around, and reused to speed up formatting loops.
 | |
| // The user must specify through the template arguments the conversion
 | |
| // characters used in the format. This will be checked at compile time.
 | |
| //
 | |
| // This class uses Conv enum values to specify each argument.
 | |
| // This allows for more flexibility as you can specify multiple possible
 | |
| // conversion characters for each argument.
 | |
| // ParsedFormat<char...> is a simplified alias for when the user only
 | |
| // needs to specify a single conversion character for each argument.
 | |
| //
 | |
| // Example:
 | |
| //   // Extended format supports multiple characters per argument:
 | |
| //   using MyFormat = ExtendedParsedFormat<Conv::d | Conv::x>;
 | |
| //   MyFormat GetFormat(bool use_hex) {
 | |
| //     if (use_hex) return MyFormat("foo %x bar");
 | |
| //     return MyFormat("foo %d bar");
 | |
| //   }
 | |
| //   // 'format' can be used with any value that supports 'd' and 'x',
 | |
| //   // like `int`.
 | |
| //   auto format = GetFormat(use_hex);
 | |
| //   value = StringF(format, i);
 | |
| //
 | |
| // This class also supports runtime format checking with the ::New() and
 | |
| // ::NewAllowIgnored() factory functions.
 | |
| // This is the only API that allows the user to pass a runtime specified format
 | |
| // std::string. These factory functions will return NULL if the format does not match
 | |
| // the conversions requested by the user.
 | |
| template <str_format_internal::Conv... C>
 | |
| class ExtendedParsedFormat : public str_format_internal::ParsedFormatBase {
 | |
|  public:
 | |
|   explicit ExtendedParsedFormat(string_view format)
 | |
| #if ABSL_INTERNAL_ENABLE_FORMAT_CHECKER
 | |
|       __attribute__((
 | |
|           enable_if(str_format_internal::EnsureConstexpr(format),
 | |
|                     "Format std::string is not constexpr."),
 | |
|           enable_if(str_format_internal::ValidFormatImpl<C...>(format),
 | |
|                     "Format specified does not match the template arguments.")))
 | |
| #endif  // ABSL_INTERNAL_ENABLE_FORMAT_CHECKER
 | |
|       : ExtendedParsedFormat(format, false) {
 | |
|   }
 | |
| 
 | |
|   // ExtendedParsedFormat factory function.
 | |
|   // The user still has to specify the conversion characters, but they will not
 | |
|   // be checked at compile time. Instead, it will be checked at runtime.
 | |
|   // This delays the checking to runtime, but allows the user to pass
 | |
|   // dynamically sourced formats.
 | |
|   // It returns NULL if the format does not match the conversion characters.
 | |
|   // The user is responsible for checking the return value before using it.
 | |
|   //
 | |
|   // The 'New' variant will check that all the specified arguments are being
 | |
|   // consumed by the format and return NULL if any argument is being ignored.
 | |
|   // The 'NewAllowIgnored' variant will not verify this and will allow formats
 | |
|   // that ignore arguments.
 | |
|   static std::unique_ptr<ExtendedParsedFormat> New(string_view format) {
 | |
|     return New(format, false);
 | |
|   }
 | |
|   static std::unique_ptr<ExtendedParsedFormat> NewAllowIgnored(
 | |
|       string_view format) {
 | |
|     return New(format, true);
 | |
|   }
 | |
| 
 | |
|  private:
 | |
|   static std::unique_ptr<ExtendedParsedFormat> New(string_view format,
 | |
|                                                    bool allow_ignored) {
 | |
|     std::unique_ptr<ExtendedParsedFormat> conv(
 | |
|         new ExtendedParsedFormat(format, allow_ignored));
 | |
|     if (conv->has_error()) return nullptr;
 | |
|     return conv;
 | |
|   }
 | |
| 
 | |
|   ExtendedParsedFormat(string_view s, bool allow_ignored)
 | |
|       : ParsedFormatBase(s, allow_ignored, {C...}) {}
 | |
| };
 | |
| }  // namespace str_format_internal
 | |
| }  // namespace absl
 | |
| 
 | |
| #endif  // ABSL_STRINGS_INTERNAL_STR_FORMAT_PARSER_H_
 |