用于EagleEye3.0 规则集漏报和误报测试的示例项目,项目收集于github和gitee
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

220 lines
8.8 KiB

5 months ago
/* Copyright (c) 2018, 2019, Oracle and/or its affiliates. All rights reserved.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License, version 2.0,
as published by the Free Software Foundation.
This program is also distributed with certain software (including
but not limited to OpenSSL) that is licensed under separate terms,
as designated in a particular file or component or in included license
documentation. The authors of MySQL hereby grant you an additional
permission to link the program and your derivative works with the
separately licensed software that they have included with MySQL.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License, version 2.0, for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
#include "sql/json_schema.h"
#include "my_rapidjson_size_t.h" // IWYU pragma: keep
#include <rapidjson/document.h>
#include <rapidjson/error/error.h>
#include <rapidjson/memorystream.h>
#include <rapidjson/reader.h>
#include <rapidjson/schema.h>
#include <rapidjson/stringbuffer.h>
#include <string>
#include <utility>
#include "my_alloc.h"
#include "my_dbug.h"
#include "my_inttypes.h"
#include "my_sys.h"
#include "mysqld_error.h"
#include "sql/json_syntax_check.h"
#include "sql/sql_exception_handler.h"
/**
parse_json_schema will parse a JSON input into a JSON Schema. If the input
isn't a valid JSON, or if the JSON is too deeply nested, an error will be
returned to the user.
@param json_schema_str A pointer to the JSON Schema input
@param json_schema_length The length of the JSON Schema input
@param function_name The function name of the caller (to be used in error
reporting)
@param[out] schema_document An object where the JSON Schema will be put. This
variable MUST be initialized.
@retval true on error (my_error has been called)
@retval false on success. The JSON Schema can be found in the output
parameter schema_document.
*/
static bool parse_json_schema(const char *json_schema_str,
size_t json_schema_length,
const char *function_name,
rapidjson::Document *schema_document) {
DBUG_ASSERT(schema_document != nullptr);
// Check if the JSON schema is valid. Invalid JSON would be caught by
// rapidjson::Document::Parse, but it will not catch documents that are too
// deeply nested.
size_t error_offset;
std::string error_message;
if (!is_valid_json_syntax(json_schema_str, json_schema_length, &error_offset,
&error_message)) {
my_error(ER_INVALID_JSON_TEXT_IN_PARAM, MYF(0), 1, function_name,
error_message.c_str(), error_offset, "");
return true;
}
if (schema_document->Parse(json_schema_str, json_schema_length)
.HasParseError()) {
// The document should already be valid, since is_valid_json_syntax
// succeeded.
DBUG_ASSERT(false);
return true;
}
// We require the JSON Schema to be an object
if (!schema_document->IsObject()) {
my_error(ER_INVALID_JSON_TYPE, MYF(0), 1, function_name, "object");
return true;
}
return false;
}
bool is_valid_json_schema(const char *document_str, size_t document_length,
const char *json_schema_str,
size_t json_schema_length, const char *function_name,
bool *is_valid,
Json_schema_validation_report *validation_report) {
rapidjson::Document schema_document;
if (parse_json_schema(json_schema_str, json_schema_length, function_name,
&schema_document)) {
return true;
}
return Json_schema_validator(schema_document)
.is_valid_json_schema(document_str, document_length, function_name,
is_valid, validation_report);
}
Json_schema_validator::Json_schema_validator(
const rapidjson::Document &schema_document)
: m_cached_schema(schema_document, &m_remote_document_provider) {}
unique_ptr_destroy_only<const Json_schema_validator>
create_json_schema_validator(MEM_ROOT *mem_root, const char *json_schema_str,
size_t json_schema_length,
const char *function_name) {
rapidjson::Document schema_document;
if (parse_json_schema(json_schema_str, json_schema_length, function_name,
&schema_document)) {
return nullptr;
}
return make_unique_destroy_only<const Json_schema_validator>(mem_root,
schema_document);
}
bool Json_schema_validator::is_valid_json_schema(
const char *document_str, size_t document_length, const char *function_name,
bool *is_valid, Json_schema_validation_report *validation_report) const {
// Set up the JSON Schema validator using Syntax_check_handler that will catch
// JSON documents that are too deeply nested.
Syntax_check_handler syntaxCheckHandler;
rapidjson::GenericSchemaValidator<rapidjson::SchemaDocument,
Syntax_check_handler>
validator(m_cached_schema, syntaxCheckHandler);
rapidjson::Reader reader;
rapidjson::MemoryStream stream(document_str, document_length);
// Wrap this in a try-catch since rapidjson calls std::regex_search
// (which isn't noexcept).
try {
rapidjson::ParseResult parse_success = reader.Parse(stream, validator);
// We may end up in a few different error scenarios here:
// 1) The document is valid JSON, but invalid according to schema.
// - parse_success will indicate error, and validator.IsValid() is false.
// 2) The JSON document is invalid (parsing failed), but not too deep.
// - parse_success will indicate error, and validator.IsValid() is true.
// 3) The JSON document is too deep.
// - parse_success will indicate error, and validator.IsValid() is false.
// The only way do distinguish this from case 1, is to see if the
// syntax check handler has raised an error.
if (syntaxCheckHandler.too_deep_error_raised()) {
// The JSON document was too deep, and an error is already reported by the
// Syntax_check_handler.
return true;
}
if (!parse_success && validator.IsValid()) {
// Couldn't parse the JSON document.
std::pair<std::string, size_t> error = get_error_from_reader(reader);
my_error(ER_INVALID_JSON_TEXT_IN_PARAM, MYF(0), 2, function_name,
error.first.c_str(), error.second, "");
return true;
}
// Otherwise, we have a syntactically correct JSON document, so we can
// safely check the result from the validator.
} catch (...) {
handle_std_exception(function_name);
return true;
}
// If we encountered a remote reference in the JSON schema, report an error
// back to the user that this isn't supported.
if (m_remote_document_provider.used()) {
my_error(ER_NOT_SUPPORTED_YET, MYF(0), "references in JSON Schema");
return true;
}
*is_valid = validator.IsValid();
if (!validator.IsValid() && validation_report != nullptr) {
// Populate the validation report. Since the validator is local to this
// function, all strings provided by the validator must be allocated so
// that they survive beyond this function.
rapidjson::StringBuffer string_buffer;
// Where in the JSON Schema the validation failed.
validator.GetInvalidSchemaPointer().StringifyUriFragment(string_buffer);
std::string schema_location(string_buffer.GetString(),
string_buffer.GetSize());
// Where in the JSON document the validation failed.
string_buffer.Clear();
validator.GetInvalidDocumentPointer().StringifyUriFragment(string_buffer);
std::string document_location(string_buffer.GetString(),
string_buffer.GetSize());
validation_report->set_error_report(std::move(schema_location),
validator.GetInvalidSchemaKeyword(),
std::move(document_location));
}
return false;
}
std::string Json_schema_validation_report::human_readable_reason() const {
std::string reason;
reason.append("The JSON document location '");
reason.append(document_location());
reason.append("' failed requirement '");
reason.append(schema_failed_keyword());
reason.append("' at JSON Schema location '");
reason.append(schema_location());
reason.append("'");
return reason;
}