123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188 |
- // Copyright (c) 2012 The Chromium Authors. All rights reserved.
- // Use of this source code is governed by a BSD-style license that can be
- // found in the LICENSE file.
- // A JSON parser, converting from a base::StringPiece to a base::Value.
- //
- // The JSON spec is:
- // https://tools.ietf.org/rfc/rfc8259.txt
- // which obsoletes the earlier RFCs 4627, 7158 and 7159.
- //
- // This RFC should be equivalent to the informal spec:
- // https://www.json.org/json-en.html
- //
- // Implementation choices permitted by the RFC:
- // - Nesting is limited (to a configurable depth, 200 by default).
- // - Numbers are limited to those representable by a finite double. The
- // conversion from a JSON number (in the base::StringPiece input) to a
- // double-flavored base::Value may also be lossy.
- // - The input (which must be UTF-8) may begin with a BOM (Byte Order Mark).
- // - Duplicate object keys (strings) are silently allowed. Last key-value pair
- // wins. Previous pairs are discarded.
- //
- // Configurable (see the JSONParserOptions type) deviations from the RFC:
- // - Allow trailing commas: "[1,2,]".
- // - Replace invalid Unicode with U+FFFD REPLACEMENT CHARACTER.
- //
- // Non-configurable deviations from the RFC:
- // - Allow "// etc\n" and "/* etc */" C-style comments.
- // - Allow ASCII control characters, including literal (not escaped) NUL bytes
- // and new lines, within a JSON string.
- // - Allow "\\v" escapes within a JSON string, producing a vertical tab.
- // - Allow "\\x23" escapes within a JSON string. Subtly, the 2-digit hex value
- // is a Unicode code point, not a UTF-8 byte. For example, "\\xFF" in the
- // JSON source decodes to a base::Value whose string contains "\xC3\xBF", the
- // UTF-8 encoding of U+00FF LATIN SMALL LETTER Y WITH DIAERESIS. Converting
- // from UTF-8 to UTF-16, e.g. via UTF8ToWide, will recover a 16-bit 0x00FF.
- #ifndef BASE_JSON_JSON_READER_H_
- #define BASE_JSON_JSON_READER_H_
- #include <memory>
- #include <string>
- #include "base/base_export.h"
- #include "base/json/json_common.h"
- #include "base/optional.h"
- #include "base/strings/string_piece.h"
- #include "base/values.h"
- namespace base {
namespace internal {

// Only a forward declaration is needed in this header: JSONReader refers to
// the parser through a std::unique_ptr member and never uses it by value.
class JSONParser;

}  // namespace internal
// Parser behaviour switches. Each non-zero enumerator occupies its own bit, and
// the reader APIs in this header accept the options as a plain int.
enum JSONParserOptions {
  // Strict RFC 8259 parsing, apart from the deviations listed in the
  // file-level comment.
  JSON_PARSE_RFC = 0x0,

  // Permits a comma after the final element of a structure.
  JSON_ALLOW_TRAILING_COMMAS = 0x1,

  // When set, invalid code points (i.e. lone surrogates) are replaced with the
  // Unicode replacement character (U+FFFD). When not set, an invalid code
  // point is a hard error and parsing fails.
  JSON_REPLACE_INVALID_CHARACTERS = 0x2,
};
- class BASE_EXPORT JSONReader {
- public:
- // Error codes during parsing.
- //
- // TODO(crbug.com/1069271, crbug.com/1070409): move this enum from JSONReader
- // (a higher level API, which can be backed by multiple implementations) to
- // JSONParser (a lower level API, a single implementation). Such a move would
- // also remove the ValueWithError.error_code field and move the
- // kInvalidEscape, kSyntaxError, etc. strings defined in this .h file.
- enum JsonParseError {
- JSON_NO_ERROR = 0,
- JSON_INVALID_ESCAPE,
- JSON_SYNTAX_ERROR,
- JSON_UNEXPECTED_TOKEN,
- JSON_TRAILING_COMMA,
- JSON_TOO_MUCH_NESTING,
- JSON_UNEXPECTED_DATA_AFTER_ROOT,
- JSON_UNSUPPORTED_ENCODING,
- JSON_UNQUOTED_DICTIONARY_KEY,
- JSON_TOO_LARGE,
- JSON_UNREPRESENTABLE_NUMBER,
- JSON_PARSE_ERROR_COUNT
- };
- struct BASE_EXPORT ValueWithError {
- ValueWithError();
- ValueWithError(ValueWithError&& other);
- ValueWithError& operator=(ValueWithError&& other);
- ~ValueWithError();
- Optional<Value> value;
- // Contains default values if |value| exists, or the error status if |value|
- // is base::nullopt.
- JsonParseError error_code = JSON_NO_ERROR;
- std::string error_message;
- int error_line = 0;
- int error_column = 0;
- DISALLOW_COPY_AND_ASSIGN(ValueWithError);
- };
- // String versions of parse error codes.
- static const char kInvalidEscape[];
- static const char kSyntaxError[];
- static const char kUnexpectedToken[];
- static const char kTrailingComma[];
- static const char kTooMuchNesting[];
- static const char kUnexpectedDataAfterRoot[];
- static const char kUnsupportedEncoding[];
- static const char kUnquotedDictionaryKey[];
- static const char kInputTooLarge[];
- static const char kUnrepresentableNumber[];
- // Constructs a reader.
- JSONReader(int options = JSON_PARSE_RFC,
- size_t max_depth = internal::kAbsoluteMaxDepth);
- ~JSONReader();
- // Reads and parses |json|, returning a Value.
- // If |json| is not a properly formed JSON string, returns base::nullopt.
- static Optional<Value> Read(StringPiece json,
- int options = JSON_PARSE_RFC,
- size_t max_depth = internal::kAbsoluteMaxDepth);
- // Deprecated. Use the Read() method above.
- // Reads and parses |json|, returning a Value.
- // If |json| is not a properly formed JSON string, returns nullptr.
- // Wrap this in base::FooValue::From() to check the Value is of type Foo and
- // convert to a FooValue at the same time.
- static std::unique_ptr<Value> ReadDeprecated(
- StringPiece json,
- int options = JSON_PARSE_RFC,
- size_t max_depth = internal::kAbsoluteMaxDepth);
- // Reads and parses |json| like Read(). Returns a ValueWithError, which on
- // error, will be populated with a formatted error message, an error code, and
- // the error location if appropriate.
- static ValueWithError ReadAndReturnValueWithError(
- StringPiece json,
- int options = JSON_PARSE_RFC);
- // Deprecated. Use the ReadAndReturnValueWithError() method above.
- // Reads and parses |json| like Read(). |error_code_out| and |error_msg_out|
- // are optional. If specified and nullptr is returned, they will be populated
- // an error code and a formatted error message (including error location if
- // appropriate). Otherwise, they will be unmodified.
- static std::unique_ptr<Value> ReadAndReturnErrorDeprecated(
- StringPiece json,
- int options, // JSONParserOptions
- int* error_code_out,
- std::string* error_msg_out,
- int* error_line_out = nullptr,
- int* error_column_out = nullptr);
- // Converts a JSON parse error code into a human readable message.
- // Returns an empty string if error_code is JSON_NO_ERROR.
- static std::string ErrorCodeToString(JsonParseError error_code);
- // Non-static version of Read() above.
- Optional<Value> ReadToValue(StringPiece json);
- // Deprecated. Use the ReadToValue() method above.
- // Non-static version of Read() above.
- std::unique_ptr<Value> ReadToValueDeprecated(StringPiece json);
- // Converts error_code_ to a human-readable string, including line and column
- // numbers if appropriate.
- std::string GetErrorMessage() const;
- private:
- std::unique_ptr<internal::JSONParser> parser_;
- };
- } // namespace base
- #endif // BASE_JSON_JSON_READER_H_
|