用于EagleEye3.0 规则集漏报和误报测试的示例项目,项目收集于github和gitee
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

235 lines
10 KiB

5 months ago
#ifndef SQL_PLANNER_INCLUDED
#define SQL_PLANNER_INCLUDED
/* Copyright (c) 2000, 2018, Oracle and/or its affiliates. All rights reserved.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License, version 2.0,
as published by the Free Software Foundation.
This program is also distributed with certain software (including
but not limited to OpenSSL) that is licensed under separate terms,
as designated in a particular file or component or in included license
documentation. The authors of MySQL hereby grant you an additional
permission to link the program and your derivative works with the
separately licensed software that they have included with MySQL.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License, version 2.0, for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
/**
@file sql/sql_planner.h
Join planner classes.
*/
#include <sys/types.h>
#include "my_inttypes.h"
#include "my_table_map.h"
class Cost_model_server;
class JOIN;
class JOIN_TAB;
class Key_use;
class Opt_trace_object;
class THD;
struct TABLE_LIST;
struct POSITION;
typedef ulonglong nested_join_map;
/**
This class determines the optimal join order for tables within
a basic query block, ie a query specification clause, possibly extended
with semi-joined tables from embedded subqueries.
This class takes as prerequisite a join class where all dependencies among
tables have been sorted out, all possible access paths have been
sorted out, and all statistics information has been filled in.
The class has a sole public function that will calculate the most
optimal plan based on the inputs and the environment, such as prune level
and greedy optimizer search depth. For more information, see the
function headers for the private functions greedy_search(),
best_extension_by_limited_search() and eq_ref_extension_by_limited_search().
*/
class Optimize_table_order {
public:
Optimize_table_order(THD *thd_arg, JOIN *join_arg, TABLE_LIST *sjm_nest_arg);
~Optimize_table_order() {}
/**
Entry point to table join order optimization.
For further description, see class header and private function headers.
@return false if successful, true if error
*/
bool choose_table_order();
private:
THD *const thd; // Pointer to current THD
JOIN *const join; // Pointer to the current plan being developed
const uint search_depth; // Maximum search depth to apply in greedy search
const uint prune_level; // pruning heuristics to be applied
// (0 = EXHAUSTIVE, 1 = PRUNE_BY_TIME_OR_ROWS)
/**
Bitmap of all join nests embedding the last table appended to the current
partial join.
*/
nested_join_map cur_embedding_map;
/**
If non-NULL, we are optimizing a materialized semi-join nest.
If NULL, we are optimizing a complete join plan.
*/
const TABLE_LIST *const emb_sjm_nest;
/**
When calculating a plan for a materialized semi-join nest,
best_access_path() needs to know not only the remaining tables within the
semi-join nest, but also all tables outside of this nest, because there may
be key references between the semi-join nest and the outside tables
that should not be considered when materializing the semi-join nest.
@c excluded_tables tracks these tables.
*/
const table_map excluded_tables;
/*
No need to call advance_sj_state() when
1) there are no semijoin nests or
2) we are optimizing a materialized semijoin nest.
*/
const bool has_sj;
/**
If true, find_best_ref() must go through all keys, no shortcutting
allowed.
*/
bool test_all_ref_keys;
/// True if we found a complete plan using only allowed semijoin strategies.
bool found_plan_with_allowed_sj;
/**
False/true at start/end of choose_table_order().
Helps member functions know if current plan is in join->positions or
join->best_positions.
*/
bool got_final_plan;
inline Key_use *find_best_ref(const JOIN_TAB *tab,
const table_map remaining_tables,
const uint idx, const double prefix_rowcount,
bool *found_condition,
table_map *ref_depends_map,
uint *used_key_parts);
double calculate_scan_cost(const JOIN_TAB *tab, const uint idx,
const Key_use *best_ref,
const double prefix_rowcount,
const bool found_condition,
const bool disable_jbuf,
double *rows_after_filtering,
Opt_trace_object *trace_access_scan);
void best_access_path(JOIN_TAB *tab, const table_map remaining_tables,
const uint idx, bool disable_jbuf,
const double prefix_rowcount, POSITION *pos);
bool semijoin_loosescan_fill_driving_table_position(
const JOIN_TAB *s, table_map remaining_tables, uint idx,
double prefix_rowcount, POSITION *loose_scan_pos);
bool check_interleaving_with_nj(JOIN_TAB *next_tab);
void advance_sj_state(table_map remaining_tables, const JOIN_TAB *tab,
uint idx);
void backout_nj_state(const table_map remaining_tables, const JOIN_TAB *tab);
void optimize_straight_join(table_map join_tables);
bool greedy_search(table_map remaining_tables);
bool best_extension_by_limited_search(table_map remaining_tables, uint idx,
uint current_search_depth);
table_map eq_ref_extension_by_limited_search(table_map remaining_tables,
uint idx,
uint current_search_depth);
bool consider_plan(uint idx, Opt_trace_object *trace_obj);
bool fix_semijoin_strategies();
bool semijoin_firstmatch_loosescan_access_paths(uint first_tab, uint last_tab,
table_map remaining_tables,
bool loosescan,
double *newcount,
double *newcost);
void semijoin_mat_scan_access_paths(uint last_inner_tab, uint last_outer_tab,
table_map remaining_tables,
TABLE_LIST *sjm_nest, double *newcount,
double *newcost);
void semijoin_mat_lookup_access_paths(uint last_inner, TABLE_LIST *sjm_nest,
double *newcount, double *newcost);
void semijoin_dupsweedout_access_paths(uint first_tab, uint last_tab,
double *newcount, double *newcost);
double lateral_derived_cost(const JOIN_TAB *tab, const uint idx,
const double prefix_rowcount,
const Cost_model_server *cost_model);
static uint determine_search_depth(uint search_depth, uint table_count);
};
void get_partial_join_cost(JOIN *join, uint n_tables, double *cost_arg,
double *rowcount_arg);
/**
Calculate 'Post read filtering' effect of JOIN::conds for table
'tab'. Only conditions that are not directly involved in the chosen
access method shall be included in the calculation of this 'Post
read filtering' effect.
The function first identifies fields that are directly used by the
access method. This includes columns used by range and ref access types,
and predicates on the identified columns (if any) will not be taken into
account when the filtering effect is calculated.
The function will then calculate the filtering effect of any predicate
that applies to 'tab' and is not depending on the columns used by the
access method. The source of information with highest accuracy is
always preferred and is as follows:
1) Row estimates from the range optimizer
2) Row estimates from index statistics (records per key)
3) Guesstimates
Thus, after identifying columns that are used by the access method,
the function will look for rows estimates made by the range optimizer.
If found, the estimates from the range optimizer are calculated into
the filtering effect.
The function then goes through JOIN::conds to get estimates from any
remaining predicate that applies to 'tab' and does not depend on any
tables that come later in the join sequence. Predicates that depend on
columns that are either used by the access method or used in the row
estimate from the range optimizer will not be considered in this phase.
@param tab The table condition filtering effect is calculated
for
@param keyuse Describes the 'ref' access method (if any) that is
chosen
@param used_tables Tables earlier in the join sequence than 'tab'
@param fanout The number of rows read by the chosen access
method for each row combination of previous tables
@param is_join_buffering Whether or not condition filtering is about
to be calculated for an access method using join
buffering.
@param write_to_trace Wheter we should print the filtering effect calculated
by histogram statistics and the final aggregated filtering
effect to optimizer trace.
@param parent_trace The parent trace object where the final aggregated
filtering effect will be printed if "write_to_trace" is
set to true.
@return the 'post read filtering' effect (between 0 and 1) of
JOIN::conds
*/
float calculate_condition_filter(const JOIN_TAB *const tab,
const Key_use *const keyuse,
table_map used_tables, double fanout,
bool is_join_buffering, bool write_to_trace,
Opt_trace_object &parent_trace);
#endif /* SQL_PLANNER_INCLUDED */