12
12
You should have received a copy of the GNU General Public License
13
13
along with this program; if not, write to the Free Software
14
Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA */
14
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */
20
select_query and join optimization
20
mysql_select and join optimization
22
23
@defgroup Query_Optimizer Query Optimizer
32
#include "drizzled/sql_select.h" /* include join.h */
34
#include "drizzled/error.h"
35
#include "drizzled/gettext.h"
36
#include "drizzled/util/test.h"
37
#include "drizzled/name_resolution_context_state.h"
38
#include "drizzled/nested_join.h"
39
#include "drizzled/probes.h"
40
#include "drizzled/show.h"
41
#include "drizzled/item/cache.h"
42
#include "drizzled/item/cmpfunc.h"
43
#include "drizzled/item/copy_string.h"
44
#include "drizzled/item/uint.h"
45
#include "drizzled/cached_item.h"
46
#include "drizzled/sql_base.h"
47
#include "drizzled/field/blob.h"
48
#include "drizzled/check_stack_overrun.h"
49
#include "drizzled/lock.h"
50
#include "drizzled/item/outer_ref.h"
51
#include "drizzled/index_hint.h"
52
#include "drizzled/records.h"
53
#include "drizzled/internal/iocache.h"
54
#include "drizzled/drizzled.h"
55
#include "drizzled/plugin/storage_engine.h"
57
#include "drizzled/sql_union.h"
58
#include "drizzled/optimizer/key_field.h"
59
#include "drizzled/optimizer/position.h"
60
#include "drizzled/optimizer/sargable_param.h"
61
#include "drizzled/optimizer/key_use.h"
62
#include "drizzled/optimizer/range.h"
63
#include "drizzled/optimizer/quick_range_select.h"
64
#include "drizzled/optimizer/quick_ror_intersect_select.h"
66
#include "drizzled/filesort.h"
73
static int sort_keyuse(optimizer::KeyUse *a, optimizer::KeyUse *b);
74
static COND *build_equal_items(Session *session, COND *cond,
26
#include <drizzled/server_includes.h>
27
#include <drizzled/sql_select.h>
28
#include "sj_tmp_table.h"
30
#include <mysys/my_bit.h>
31
#include <drizzled/drizzled_error_messages.h>
32
#include <libdrizzle/gettext.h>
34
const char *join_type_str[]={ "UNKNOWN","system","const","eq_ref","ref",
35
"MAYBE_REF","ALL","range","index",
36
"ref_or_null","unique_subquery","index_subquery",
40
struct st_sargable_param;
42
static void optimize_keyuse(JOIN *join, DYNAMIC_ARRAY *keyuse_array);
43
static bool make_join_statistics(JOIN *join, TableList *leaves, COND *conds,
44
DYNAMIC_ARRAY *keyuse);
45
static bool update_ref_and_keys(THD *thd, DYNAMIC_ARRAY *keyuse,
47
uint tables, COND *conds,
48
COND_EQUAL *cond_equal,
49
table_map table_map, SELECT_LEX *select_lex,
50
st_sargable_param **sargables);
51
static int sort_keyuse(KEYUSE *a,KEYUSE *b);
52
static void set_position(JOIN *join,uint index,JOIN_TAB *table,KEYUSE *key);
53
static bool create_ref_for_key(JOIN *join, JOIN_TAB *j, KEYUSE *org_keyuse,
54
table_map used_tables);
55
static bool choose_plan(JOIN *join,table_map join_tables);
57
static void best_access_path(JOIN *join, JOIN_TAB *s, THD *thd,
58
table_map remaining_tables, uint idx,
59
double record_count, double read_time);
60
static void optimize_straight_join(JOIN *join, table_map join_tables);
61
static bool greedy_search(JOIN *join, table_map remaining_tables,
62
uint depth, uint prune_level);
63
static bool best_extension_by_limited_search(JOIN *join,
64
table_map remaining_tables,
65
uint idx, double record_count,
66
double read_time, uint depth,
68
static uint determine_search_depth(JOIN* join);
69
static int join_tab_cmp(const void* ptr1, const void* ptr2);
70
static int join_tab_cmp_straight(const void* ptr1, const void* ptr2);
72
TODO: 'find_best' is here only temporarily until 'greedy_search' is
75
static bool find_best(JOIN *join,table_map rest_tables,uint index,
76
double record_count,double read_time);
77
static uint cache_record_length(JOIN *join,uint index);
78
static double prev_record_reads(JOIN *join, uint idx, table_map found_ref);
79
static bool get_best_combination(JOIN *join);
80
static store_key *get_store_key(THD *thd,
81
KEYUSE *keyuse, table_map used_tables,
82
KEY_PART_INFO *key_part, uchar *key_buff,
84
static bool make_simple_join(JOIN *join,Table *tmp_table);
85
static void make_outerjoin_info(JOIN *join);
86
static bool make_join_select(JOIN *join,SQL_SELECT *select,COND *item);
87
static bool make_join_readinfo(JOIN *join, uint64_t options, uint no_jbuf_after);
88
static bool only_eq_ref_tables(JOIN *join, order_st *order, table_map tables);
89
static void update_depend_map(JOIN *join);
90
static void update_depend_map(JOIN *join, order_st *order);
91
static order_st *remove_const(JOIN *join,order_st *first_order,COND *cond,
92
bool change_list, bool *simple_order);
93
static int return_zero_rows(JOIN *join, select_result *res,TableList *tables,
94
List<Item> &fields, bool send_row,
95
uint64_t select_options, const char *info,
97
static COND *build_equal_items(THD *thd, COND *cond,
75
98
COND_EQUAL *inherited,
76
99
List<TableList> *join_list,
77
100
COND_EQUAL **cond_equal_ref);
101
static COND* substitute_for_best_equal_field(COND *cond,
102
COND_EQUAL *cond_equal,
103
void *table_join_idx);
104
static COND *simplify_joins(JOIN *join, List<TableList> *join_list,
105
COND *conds, bool top, bool in_sj);
106
static bool check_interleaving_with_nj(JOIN_TAB *last, JOIN_TAB *next);
107
static void restore_prev_nj_state(JOIN_TAB *last);
108
static void reset_nj_counters(List<TableList> *join_list);
109
static uint build_bitmap_for_nested_joins(List<TableList> *join_list,
113
void advance_sj_state(const table_map remaining_tables, const JOIN_TAB *tab);
114
static void restore_prev_sj_state(const table_map remaining_tables,
115
const JOIN_TAB *tab);
117
static COND *optimize_cond(JOIN *join, COND *conds,
118
List<TableList> *join_list,
119
Item::cond_result *cond_value);
120
static bool const_expression_in_where(COND *conds,Item *item, Item **comp_item);
121
static int do_select(JOIN *join,List<Item> *fields,Table *tmp_table);
123
static enum_nested_loop_state
124
evaluate_join_record(JOIN *join, JOIN_TAB *join_tab,
126
static enum_nested_loop_state
127
evaluate_null_complemented_join_record(JOIN *join, JOIN_TAB *join_tab);
128
static enum_nested_loop_state
129
flush_cached_records(JOIN *join, JOIN_TAB *join_tab, bool skip_last);
130
static enum_nested_loop_state
131
end_send(JOIN *join, JOIN_TAB *join_tab, bool end_of_records);
132
static enum_nested_loop_state
133
end_write(JOIN *join, JOIN_TAB *join_tab, bool end_of_records);
134
static enum_nested_loop_state
135
end_update(JOIN *join, JOIN_TAB *join_tab, bool end_of_records);
136
static enum_nested_loop_state
137
end_unique_update(JOIN *join, JOIN_TAB *join_tab, bool end_of_records);
139
static int join_read_const_table(JOIN_TAB *tab, POSITION *pos);
140
static int join_read_system(JOIN_TAB *tab);
141
static int join_read_const(JOIN_TAB *tab);
142
static int join_read_key(JOIN_TAB *tab);
143
static int join_read_always_key(JOIN_TAB *tab);
144
static int join_read_last_key(JOIN_TAB *tab);
145
static int join_no_more_records(READ_RECORD *info);
146
static int join_read_next(READ_RECORD *info);
147
static int join_read_next_different(READ_RECORD *info);
148
static int join_init_quick_read_record(JOIN_TAB *tab);
149
static int test_if_quick_select(JOIN_TAB *tab);
150
static int join_init_read_record(JOIN_TAB *tab);
151
static int join_read_first(JOIN_TAB *tab);
152
static int join_read_next_same(READ_RECORD *info);
153
static int join_read_next_same_diff(READ_RECORD *info);
154
static int join_read_last(JOIN_TAB *tab);
155
static int join_read_prev_same(READ_RECORD *info);
156
static int join_read_prev(READ_RECORD *info);
157
int join_read_always_key_or_null(JOIN_TAB *tab);
158
int join_read_next_same_or_null(READ_RECORD *info);
159
static COND *make_cond_for_table(COND *cond,table_map table,
160
table_map used_table,
161
bool exclude_expensive_cond);
79
162
static Item* part_of_refkey(Table *form,Field *field);
80
static bool cmp_buffer_with_ref(JoinTable *tab);
81
static void change_cond_ref_to_const(Session *session,
82
list<COND_CMP>& save_list,
87
static bool copy_blobs(Field **ptr);
163
static bool test_if_skip_sort_order(JOIN_TAB *tab,order_st *order,
164
ha_rows select_limit, bool no_changes,
166
static bool list_contains_unique_index(Table *table,
167
bool (*find_func) (Field *, void *), void *data);
168
static bool find_field_in_item_list (Field *field, void *data);
169
static bool find_field_in_order_list (Field *field, void *data);
170
static int create_sort_index(THD *thd, JOIN *join, order_st *order,
171
ha_rows filesort_limit, ha_rows select_limit,
173
static int remove_duplicates(JOIN *join,Table *entry,List<Item> &fields,
175
static int remove_dup_with_compare(THD *thd, Table *entry, Field **field,
176
ulong offset,Item *having);
177
static int remove_dup_with_hash_index(THD *thd,Table *table,
178
uint field_count, Field **first_field,
89
static bool eval_const_cond(COND *cond)
91
return ((Item_func*) cond)->val_int() ? true : false;
180
ulong key_length,Item *having);
181
static int join_init_cache(THD *thd,JOIN_TAB *tables,uint table_count);
182
static ulong used_blob_length(CACHE_FIELD **ptr);
183
static bool store_record_in_cache(JOIN_CACHE *cache);
184
static void reset_cache_read(JOIN_CACHE *cache);
185
static void reset_cache_write(JOIN_CACHE *cache);
186
static void read_cached_record(JOIN_TAB *tab);
187
static bool cmp_buffer_with_ref(JOIN_TAB *tab);
188
static order_st *create_distinct_group(THD *thd, Item **ref_pointer_array,
189
order_st *order, List<Item> &fields,
190
List<Item> &all_fields,
191
bool *all_order_by_fields_used);
192
static bool test_if_subpart(order_st *a,order_st *b);
193
static Table *get_sort_by_table(order_st *a,order_st *b,TableList *tables);
194
static void calc_group_buffer(JOIN *join,order_st *group);
195
static bool make_group_fields(JOIN *main_join, JOIN *curr_join);
196
static bool alloc_group_fields(JOIN *join,order_st *group);
197
// Create list for using with tempory table
198
static bool change_to_use_tmp_fields(THD *thd, Item **ref_pointer_array,
199
List<Item> &new_list1,
200
List<Item> &new_list2,
201
uint elements, List<Item> &items);
202
// Create list for using with tempory table
203
static bool change_refs_to_tmp_fields(THD *thd, Item **ref_pointer_array,
204
List<Item> &new_list1,
205
List<Item> &new_list2,
206
uint elements, List<Item> &items);
207
static void init_tmptable_sum_functions(Item_sum **func);
208
static void update_tmptable_sum_func(Item_sum **func,Table *tmp_table);
209
static void copy_sum_funcs(Item_sum **func_ptr, Item_sum **end);
210
static bool add_ref_to_table_cond(THD *thd, JOIN_TAB *join_tab);
211
static bool setup_sum_funcs(THD *thd, Item_sum **func_ptr);
212
static bool init_sum_functions(Item_sum **func, Item_sum **end);
213
static bool update_sum_func(Item_sum **func);
214
void select_describe(JOIN *join, bool need_tmp_table,bool need_order,
215
bool distinct, const char *message=NullS);
216
static Item *remove_additional_cond(Item* conds);
217
static void add_group_and_distinct_keys(JOIN *join, JOIN_TAB *join_tab);
218
static bool test_if_ref(Item_field *left_item,Item *right_item);
219
static bool replace_where_subcondition(JOIN *join, Item *old_cond,
220
Item *new_cond, bool fix_fields);
95
223
This is used to mark equalities that were made from i-th IN-equality.
262
382
ref->outer_ref= new_ref;
263
383
ref->ref= &ref->outer_ref;
265
if (!ref->fixed && ref->fix_fields(session, 0))
385
if (!ref->fixed && ref->fix_fields(thd, 0))
267
session->used_tables|= item->used_tables();
387
thd->used_tables|= item->used_tables();
392
#define MAGIC_IN_WHERE_TOP_LEVEL 10
394
Function to setup clauses without sum functions.
396
inline int setup_without_group(THD *thd, Item **ref_pointer_array,
400
List<Item> &all_fields,
403
order_st *group, bool *hidden_group_fields)
406
nesting_map save_allow_sum_func=thd->lex->allow_sum_func ;
408
thd->lex->allow_sum_func&= ~(1 << thd->lex->current_select->nest_level);
409
res= setup_conds(thd, tables, leaves, conds);
411
thd->lex->allow_sum_func|= 1 << thd->lex->current_select->nest_level;
412
res= res || setup_order(thd, ref_pointer_array, tables, fields, all_fields,
414
thd->lex->allow_sum_func&= ~(1 << thd->lex->current_select->nest_level);
415
res= res || setup_group(thd, ref_pointer_array, tables, fields, all_fields,
416
group, hidden_group_fields);
417
thd->lex->allow_sum_func= save_allow_sum_func;
272
421
/*****************************************************************************
273
422
Check fields, find best join, do the select and output fields.
274
select_query assumes that all tables are already opened
423
mysql_select assumes that all tables are already opened
275
424
*****************************************************************************/
427
Prepare of whole select (including sub queries in future).
430
Add check of calculation of GROUP functions and fields:
431
SELECT COUNT(*)+table.col1 from table1;
439
JOIN::prepare(Item ***rref_pointer_array,
440
TableList *tables_init,
441
uint wild_num, COND *conds_init, uint og_num,
442
order_st *order_init, order_st *group_init,
444
order_st *proc_param_init, SELECT_LEX *select_lex_arg,
445
SELECT_LEX_UNIT *unit_arg)
447
// to prevent double initialization on EXPLAIN
453
group_list= group_init;
455
proc_param= proc_param_init;
456
tables_list= tables_init;
457
select_lex= select_lex_arg;
458
select_lex->join= this;
459
join_list= &select_lex->top_join_list;
460
union_part= unit_arg->is_union();
462
thd->lex->current_select->is_item_list_lookup= 1;
464
If we have already executed SELECT, then it have not sense to prevent
465
its table from update (see unique_table())
467
if (thd->derived_tables_processing)
468
select_lex->exclude_from_table_unique_test= true;
470
/* Check that all tables, fields, conds and order are ok */
472
if (!(select_options & OPTION_SETUP_TABLES_DONE) &&
473
setup_tables_and_check_access(thd, &select_lex->context, join_list,
474
tables_list, &select_lex->leaf_tables,
478
TableList *table_ptr;
479
for (table_ptr= select_lex->leaf_tables;
481
table_ptr= table_ptr->next_leaf)
484
if (setup_wild(thd, tables_list, fields_list, &all_fields, wild_num) ||
485
select_lex->setup_ref_array(thd, og_num) ||
486
setup_fields(thd, (*rref_pointer_array), fields_list, MARK_COLUMNS_READ,
488
setup_without_group(thd, (*rref_pointer_array), tables_list,
489
select_lex->leaf_tables, fields_list,
490
all_fields, &conds, order, group_list,
491
&hidden_group_fields))
492
return(-1); /* purecov: inspected */
494
ref_pointer_array= *rref_pointer_array;
498
nesting_map save_allow_sum_func= thd->lex->allow_sum_func;
499
thd->where="having clause";
500
thd->lex->allow_sum_func|= 1 << select_lex_arg->nest_level;
501
select_lex->having_fix_field= 1;
502
bool having_fix_rc= (!having->fixed &&
503
(having->fix_fields(thd, &having) ||
504
having->check_cols(1)));
505
select_lex->having_fix_field= 0;
506
if (having_fix_rc || thd->is_error())
507
return(-1); /* purecov: inspected */
508
thd->lex->allow_sum_func= save_allow_sum_func;
512
Item_subselect *subselect;
513
Item_in_subselect *in_subs= NULL;
515
Are we in a subquery predicate?
516
TODO: the block below will be executed for every PS execution without need.
518
if ((subselect= select_lex->master_unit()->item))
520
bool do_semijoin= !test(thd->variables.optimizer_switch &
521
OPTIMIZER_SWITCH_NO_SEMIJOIN);
522
if (subselect->substype() == Item_subselect::IN_SUBS)
523
in_subs= (Item_in_subselect*)subselect;
526
Check if we're in subquery that is a candidate for flattening into a
527
semi-join (which is done done in flatten_subqueries()). The
529
1. Subquery predicate is an IN/=ANY subq predicate
530
2. Subquery is a single SELECT (not a UNION)
531
3. Subquery does not have GROUP BY or order_st BY
532
4. Subquery does not use aggregate functions or HAVING
533
5. Subquery predicate is at the AND-top-level of ON/WHERE clause
534
6. No execution method was already chosen (by a prepared statement).
536
(*). We are not in a subquery of a single table UPDATE/DELETE that
537
doesn't have a JOIN (TODO: We should handle this at some
538
point by switching to multi-table UPDATE/DELETE)
540
(**). We're not in a confluent table-less subquery, like
544
!select_lex->master_unit()->first_select()->next_select() && // 2
545
!select_lex->group_list.elements && !order && // 3
546
!having && !select_lex->with_sum_func && // 4
547
thd->thd_marker && // 5
548
select_lex->outer_select()->join && // (*)
549
select_lex->master_unit()->first_select()->leaf_tables && // (**)
551
in_subs->exec_method == Item_in_subselect::NOT_TRANSFORMED) // 6
554
if (!in_subs->left_expr->fixed &&
555
in_subs->left_expr->fix_fields(thd, &in_subs->left_expr))
560
Check that the right part of the subselect contains no more than one
561
column. E.g. in SELECT 1 IN (SELECT * ..) the right part is (SELECT * ...)
563
if (subselect->substype() == Item_subselect::IN_SUBS &&
564
(select_lex->item_list.elements !=
565
((Item_in_subselect*)subselect)->left_expr->cols()))
567
my_error(ER_OPERAND_COLUMNS, MYF(0), ((Item_in_subselect*)subselect)->left_expr->cols());
572
/* Register the subquery for further processing */
573
select_lex->outer_select()->join->sj_subselects.append(thd->mem_root, in_subs);
574
in_subs->expr_join_nest= (TableList*)thd->thd_marker;
578
bool do_materialize= !test(thd->variables.optimizer_switch &
579
OPTIMIZER_SWITCH_NO_MATERIALIZATION);
581
Check if the subquery predicate can be executed via materialization.
582
The required conditions are:
583
1. Subquery predicate is an IN/=ANY subq predicate
584
2. Subquery is a single SELECT (not a UNION)
585
3. Subquery is not a table-less query. In this case there is no
586
point in materializing.
587
4. Subquery predicate is a top-level predicate
588
(this implies it is not negated)
589
TODO: this is a limitation that should be lifeted once we
590
implement correct NULL semantics (WL#3830)
591
5. Subquery is non-correlated
593
This is an overly restrictive condition. It can be extended to:
594
(Subquery is non-correlated ||
595
Subquery is correlated to any query outer to IN predicate ||
596
(Subquery is correlated to the immediate outer query &&
597
Subquery !contains {GROUP BY, order_st BY [LIMIT],
598
aggregate functions) && subquery predicate is not under "NOT IN"))
599
6. No execution method was already chosen (by a prepared statement).
601
(*) The subquery must be part of a SELECT statement. The current
602
condition also excludes multi-table update statements.
604
We have to determine whether we will perform subquery materialization
605
before calling the IN=>EXISTS transformation, so that we know whether to
606
perform the whole transformation or only that part of it which wraps
607
Item_in_subselect in an Item_in_optimizer.
609
if (do_materialize &&
611
!select_lex->master_unit()->first_select()->next_select() && // 2
612
select_lex->master_unit()->first_select()->leaf_tables && // 3
613
thd->lex->sql_command == SQLCOM_SELECT) // *
615
if (in_subs->is_top_level_item() && // 4
616
!in_subs->is_correlated && // 5
617
in_subs->exec_method == Item_in_subselect::NOT_TRANSFORMED) // 6
618
in_subs->exec_method= Item_in_subselect::MATERIALIZATION;
621
Item_subselect::trans_res trans_res;
622
if ((trans_res= subselect->select_transformer(this)) !=
623
Item_subselect::RES_OK)
625
return((trans_res == Item_subselect::RES_ERROR));
634
for (ord= order; ord; ord= ord->next)
636
Item *item= *ord->item;
637
if (item->with_sum_func && item->type() != Item::SUM_FUNC_ITEM)
638
item->split_sum_func(thd, ref_pointer_array, all_fields);
642
if (having && having->with_sum_func)
643
having->split_sum_func2(thd, ref_pointer_array, all_fields,
645
if (select_lex->inner_sum_func_list)
647
Item_sum *end=select_lex->inner_sum_func_list;
648
Item_sum *item_sum= end;
651
item_sum= item_sum->next;
652
item_sum->split_sum_func2(thd, ref_pointer_array,
653
all_fields, item_sum->ref_by, false);
654
} while (item_sum != end);
657
if (select_lex->inner_refs_list.elements &&
658
fix_inner_refs(thd, all_fields, select_lex, ref_pointer_array))
662
Check if there are references to un-aggregated columns when computing
663
aggregate functions with implicit grouping (there is no GROUP BY).
665
MODE_ONLY_FULL_GROUP_BY is enabled here by default
667
if (!group_list && select_lex->full_group_by_flag == (NON_AGG_FIELD_USED | SUM_FUNC_USED))
669
my_message(ER_MIX_OF_GROUP_FUNC_AND_FIELDS,
670
ER(ER_MIX_OF_GROUP_FUNC_AND_FIELDS), MYF(0));
674
/* Caclulate the number of groups */
676
for (order_st *group_tmp= group_list ; group_tmp ; group_tmp= group_tmp->next)
681
goto err; /* purecov: inspected */
683
if (result && result->prepare(fields_list, unit_arg))
684
goto err; /* purecov: inspected */
686
/* Init join struct */
687
count_field_types(select_lex, &tmp_table_param, all_fields, 0);
688
ref_pointer_array_size= all_fields.elements*sizeof(Item*);
689
this->group= group_list != 0;
692
#ifdef RESTRICTED_GROUP
693
if (sum_func_count && !group_list && (func_count || field_count))
695
my_message(ER_WRONG_SUM_SELECT,ER(ER_WRONG_SUM_SELECT),MYF(0));
699
if (select_lex->olap == ROLLUP_TYPE && rollup_init())
701
if (alloc_func_list())
707
return(-1); /* purecov: inspected */
712
Remove the predicates pushed down into the subquery
715
JOIN::remove_subq_pushed_predicates()
716
where IN Must be NULL
717
OUT The remaining WHERE condition, or NULL
720
Given that this join will be executed using (unique|index)_subquery,
721
without "checking NULL", remove the predicates that were pushed down
724
If the subquery compares scalar values, we can remove the condition that
725
was wrapped into trig_cond (it will be checked when needed by the subquery
728
If the subquery compares row values, we need to keep the wrapped
729
equalities in the WHERE clause: when the left (outer) tuple has both NULL
730
and non-NULL values, we'll do a full table scan and will rely on the
731
equalities corresponding to non-NULL parts of left tuple to filter out
732
non-matching records.
734
TODO: We can remove the equalities that will be guaranteed to be true by the
735
fact that subquery engine will be using index lookup. This must be done only
736
for cases where there are no conversion errors of significance, e.g. 257
737
that is searched in a byte. But this requires homogenization of the return
738
codes of all Field*::store() methods.
741
void JOIN::remove_subq_pushed_predicates(Item **where)
743
if (conds->type() == Item::FUNC_ITEM &&
744
((Item_func *)this->conds)->functype() == Item_func::EQ_FUNC &&
745
((Item_func *)conds)->arguments()[0]->type() == Item::REF_ITEM &&
746
((Item_func *)conds)->arguments()[1]->type() == Item::FIELD_ITEM &&
747
test_if_ref ((Item_field *)((Item_func *)conds)->arguments()[1],
748
((Item_func *)conds)->arguments()[0]))
278
757
Index lookup-based subquery: save some flags for EXPLAIN output
796
Check if the table's rowid is included in the temptable
799
sj_table_is_included()
801
join_tab The table to be checked
804
SemiJoinDuplicateElimination: check the table's rowid should be included
805
in the temptable. This is so if
807
1. The table is not embedded within some semi-join nest
808
2. The has been pulled out of a semi-join nest, or
810
3. The table is functionally dependent on some previous table
812
[4. This is also true for constant tables that can't be
813
NULL-complemented but this function is not called for such tables]
816
true - Include table's rowid
820
static bool sj_table_is_included(JOIN *join, JOIN_TAB *join_tab)
822
if (join_tab->emb_sj_nest)
825
/* Check if this table is functionally dependent on the tables that
826
are within the same outer join nest
828
TableList *embedding= join_tab->table->pos_in_table_list->embedding;
829
if (join_tab->type == JT_EQ_REF)
831
Table_map_iterator it(join_tab->ref.depend_map & ~PSEUDO_TABLE_BITS);
833
while ((idx= it.next_bit())!=Table_map_iterator::BITMAP_END)
835
JOIN_TAB *ref_tab= join->join_tab + idx;
836
if (embedding == ref_tab->table->pos_in_table_list->embedding)
839
/* Ok, functionally dependent */
842
/* Not functionally dependent => need to include*/
848
Setup the strategies to eliminate semi-join duplicates.
851
setup_semijoin_dups_elimination()
853
options Join options (needed to see if join buffering will be
855
no_jbuf_after Another bit of information re where join buffering will
859
Setup the strategies to eliminate semi-join duplicates. ATM there are 3
862
1. DuplicateWeedout (use of temptable to remove duplicates based on rowids
864
2. FirstMatch (pick only the 1st matching row combination of inner tables)
865
3. InsideOut (scanning the sj-inner table in a way that groups duplicates
866
together and picking the 1st one)
868
The join order has "duplicate-generating ranges", and every range is
869
served by one strategy or a combination of FirstMatch with with some
872
"Duplicate-generating range" is defined as a range within the join order
873
that contains all of the inner tables of a semi-join. All ranges must be
874
disjoint, if tables of several semi-joins are interleaved, then the ranges
875
are joined together, which is equivalent to converting
876
SELECT ... WHERE oe1 IN (SELECT ie1 ...) AND oe2 IN (SELECT ie2 )
878
SELECT ... WHERE (oe1, oe2) IN (SELECT ie1, ie2 ... ...)
881
Applicability conditions are as follows:
883
DuplicateWeedout strategy
884
~~~~~~~~~~~~~~~~~~~~~~~~~
886
(ot|nt)* [ it ((it|ot|nt)* (it|ot))] (nt)*
887
+------+ +=========================+ +---+
890
(1) - Prefix of OuterTables (those that participate in
891
IN-equality and/or are correlated with subquery) and outer
892
Noncorrelated Tables.
893
(2) - The handled range. The range starts with the first sj-inner
894
table, and covers all sj-inner and outer tables
895
Within the range, Inner, Outer, outer Noncorrelated tables
896
may follow in any order.
897
(3) - The suffix of outer Noncorrelated tables.
902
(ot|nt)* [ it ((it|nt)* it) ] (nt)*
903
+------+ +==================+ +---+
906
(1) - Prefix of outer and non-correlated tables
907
(2) - The handled range, which may contain only inner and
908
non-correlated tables.
909
(3) - The suffix of outer Noncorrelated tables.
914
(ot|ct|nt) [ insideout_tbl (ot|nt|it)* it ] (ot|nt)*
915
+--------+ +===========+ +=============+ +------+
918
(1) - Prefix that may contain any outer tables. The prefix must contain
919
all the non-trivially correlated outer tables. (non-trivially means
920
that the correlation is not just through the IN-equality).
922
(2) - Inner table for which the InsideOut scan is performed.
924
(3) - The remainder of the duplicate-generating range. It is served by
925
application of FirstMatch strategy, with the exception that
926
outer IN-correlated tables are considered to be non-correlated.
928
(4) - THe suffix of outer and outer non-correlated tables.
930
If several strategies are applicable, their relative priorities are:
935
This function walks over the join order and sets up the strategies by
936
setting appropriate members in join_tab structures.
940
true Out of memory error
944
int setup_semijoin_dups_elimination(JOIN *join, uint64_t options, uint no_jbuf_after)
946
table_map cur_map= join->const_table_map | PSEUDO_TABLE_BITS;
949
0 - invalid (EOF marker),
951
2 - Temptable (maybe confluent),
952
3 - Temptable with join buffering
955
uint start_idx; /* Left range bound */
956
uint end_idx; /* Right range bound */
958
For Temptable strategy: Bitmap of all outer and correlated tables from
959
all involved join nests.
961
table_map outer_tables;
962
} dups_ranges [MAX_TABLES];
964
TableList *emb_insideout_nest= NULL;
965
table_map emb_sj_map= 0; /* A bitmap of sj-nests (that is, their sj-inner
966
tables) whose ranges we're in */
967
table_map emb_outer_tables= 0; /* sj-outer tables for those sj-nests */
968
table_map range_start_map= 0; /* table_map at current range start */
969
bool dealing_with_jbuf= false; /* true <=> table within cur range uses join buf */
974
First pass: locate the duplicate-generating ranges and pick the strategies.
976
for (i=join->const_tables ; i < join->tables ; i++)
978
JOIN_TAB *tab=join->join_tab+i;
979
Table *table=tab->table;
980
cur_map |= table->map;
982
if (tab->emb_sj_nest) // Encountered an sj-inner table
986
dups_ranges[cur_range].start_idx= i;
987
range_start_map= cur_map & ~table->map;
989
Remember if this is a possible start of range that is covered by
990
the InsideOut strategy (the reason that it is not covered could
991
be that it overlaps with anther semi-join's range. we don't
992
support InsideOut for joined ranges)
994
if (join->best_positions[i].use_insideout_scan)
995
emb_insideout_nest= tab->emb_sj_nest;
998
emb_sj_map |= tab->emb_sj_nest->sj_inner_tables;
999
emb_outer_tables |= tab->emb_sj_nest->nested_join->sj_depends_on;
1001
if (tab->emb_sj_nest != emb_insideout_nest)
1004
Two different semi-joins interleave. This cannot be handled by
1007
emb_insideout_nest= NULL;
1011
if (emb_sj_map) /* We're in duplicate-generating range */
1013
if (i != join->const_tables && !(options & SELECT_NO_JOIN_CACHE) &&
1014
tab->type == JT_ALL && tab->use_quick != 2 && !tab->first_inner &&
1015
i <= no_jbuf_after && !dealing_with_jbuf)
1018
This table uses join buffering, which makes use of FirstMatch or
1019
InsideOut strategies impossible for the current and (we assume)
1020
preceding duplicate-producing ranges.
1021
That is, for the join order:
1023
x x [ x x] x [x x x] x [x x X* x] x
1025
+-----+ +-----+ | join buffering use
1028
we'll have to remove r1 and r2 and use duplicate-elimination
1029
strategy that spans all the tables, starting from the very 1st
1032
dealing_with_jbuf= true;
1033
emb_insideout_nest= false;
1036
Absorb all preceding duplicate-eliminating ranges. Their strategies
1039
for (int prev_range= 0; prev_range < cur_range; prev_range++)
1041
dups_ranges[cur_range].outer_tables |=
1042
dups_ranges[prev_range].outer_tables;
1044
dups_ranges[0].start_idx= 0; /* Will need to start from the 1st table */
1045
dups_ranges[0].outer_tables= dups_ranges[cur_range].outer_tables;
1050
Check if we are at the end of duplicate-producing range. We are if
1052
1. It's an InsideOut range (which presumes all correlated tables are
1053
in the prefix), and all inner tables are in the join order prefix,
1055
2. It's a DuplicateElimination range (possibly covering several
1056
SJ-nests), and all inner, outer, and correlated tables of all
1057
sj-nests are in the join order prefix.
1059
bool end_of_range= false;
1060
if (emb_insideout_nest &&
1061
bitmap_covers(cur_map, emb_insideout_nest->sj_inner_tables))
1063
/* Save that this range is handled with InsideOut: */
1064
dups_ranges[cur_range].strategy= 1;
1067
else if (bitmap_covers(cur_map, emb_outer_tables | emb_sj_map))
1070
This is a complete range to be handled with either DuplicateWeedout
1073
dups_ranges[cur_range].strategy= dealing_with_jbuf? 3 : 2;
1075
This will hold tables from within the range that need to be put
1076
into the join buffer before we can use the FirstMatch on its tail.
1078
dups_ranges[cur_range].outer_tables= emb_outer_tables &
1085
dups_ranges[cur_range].end_idx= i+1;
1086
emb_sj_map= emb_outer_tables= 0;
1087
emb_insideout_nest= NULL;
1088
dealing_with_jbuf= false;
1089
dups_ranges[++cur_range].strategy= 0;
1094
THD *thd= join->thd;
1095
SJ_TMP_TABLE **next_sjtbl_ptr= &join->sj_tmp_tables;
1097
Second pass: setup the chosen strategies
1099
for (int j= 0; j < cur_range; j++)
1101
JOIN_TAB *tab=join->join_tab + dups_ranges[j].start_idx;
1103
if (dups_ranges[j].strategy == 1) // InsideOut strategy
1105
tab->insideout_match_tab= join->join_tab + dups_ranges[j].end_idx - 1;
1108
else // DuplicateWeedout strategy
1110
SJ_TMP_TABLE::TAB sjtabs[MAX_TABLES];
1111
table_map cur_map= join->const_table_map | PSEUDO_TABLE_BITS;
1112
uint jt_rowid_offset= 0; // # tuple bytes are already occupied (w/o NULL bytes)
1113
uint jt_null_bits= 0; // # null bits in tuple bytes
1114
SJ_TMP_TABLE::TAB *last_tab= sjtabs;
1115
uint rowid_keep_flags= JOIN_TAB::CALL_POSITION | JOIN_TAB::KEEP_ROWID;
1116
JOIN_TAB *last_outer_tab= tab - 1;
1118
Walk through the range and remember
1119
- tables that need their rowids to be put into temptable
1120
- the last outer table
1122
for (; tab < join->join_tab + dups_ranges[j].end_idx; tab++)
1124
if (sj_table_is_included(join, tab))
1126
last_tab->join_tab= tab;
1127
last_tab->rowid_offset= jt_rowid_offset;
1128
jt_rowid_offset += tab->table->file->ref_length;
1129
if (tab->table->maybe_null)
1131
last_tab->null_byte= jt_null_bits / 8;
1132
last_tab->null_bit= jt_null_bits++;
1135
tab->table->prepare_for_position();
1136
tab->rowid_keep_flags= rowid_keep_flags;
1138
cur_map |= tab->table->map;
1139
if (!tab->emb_sj_nest && bitmap_covers(cur_map,
1140
dups_ranges[j].outer_tables))
1141
last_outer_tab= tab;
1144
if (jt_rowid_offset) /* Temptable has at least one rowid */
1146
SJ_TMP_TABLE *sjtbl;
1147
uint tabs_size= (last_tab - sjtabs) * sizeof(SJ_TMP_TABLE::TAB);
1148
if (!(sjtbl= (SJ_TMP_TABLE*)thd->alloc(sizeof(SJ_TMP_TABLE))) ||
1149
!(sjtbl->tabs= (SJ_TMP_TABLE::TAB*) thd->alloc(tabs_size)))
1151
memcpy(sjtbl->tabs, sjtabs, tabs_size);
1152
sjtbl->tabs_end= sjtbl->tabs + (last_tab - sjtabs);
1153
sjtbl->rowid_len= jt_rowid_offset;
1154
sjtbl->null_bits= jt_null_bits;
1155
sjtbl->null_bytes= (jt_null_bits + 7)/8;
1157
*next_sjtbl_ptr= sjtbl;
1158
next_sjtbl_ptr= &(sjtbl->next);
1162
create_duplicate_weedout_tmp_table(thd,
1167
join->join_tab[dups_ranges[j].start_idx].flush_weedout_table= sjtbl;
1168
join->join_tab[dups_ranges[j].end_idx - 1].check_weed_out_table= sjtbl;
1170
tab= last_outer_tab + 1;
1171
jump_to= last_outer_tab;
1174
/* Create the FirstMatch tail */
1175
for (; tab < join->join_tab + dups_ranges[j].end_idx; tab++)
1177
if (tab->emb_sj_nest)
1178
tab->do_firstmatch= jump_to;
1187
static void cleanup_sj_tmp_tables(JOIN *join)
1189
for (SJ_TMP_TABLE *sj_tbl= join->sj_tmp_tables; sj_tbl;
1190
sj_tbl= sj_tbl->next)
1192
if (sj_tbl->tmp_table)
1194
sj_tbl->tmp_table->free_tmp_table(join->thd);
1197
join->sj_tmp_tables= NULL;
1200
uint make_join_orderinfo(JOIN *join);
1203
global select optimisation.
1206
error code saved in field 'error'
1217
// to prevent double initialization on EXPLAIN
1222
thd_proc_info(thd, "optimizing");
1223
row_limit= ((select_distinct || order || group_list) ? HA_POS_ERROR :
1224
unit->select_limit_cnt);
1225
/* select_limit is used to decide if we are likely to scan the whole table */
1226
select_limit= unit->select_limit_cnt;
1227
if (having || (select_options & OPTION_FOUND_ROWS))
1228
select_limit= HA_POS_ERROR;
1229
do_send_rows = (unit->select_limit_cnt) ? 1 : 0;
1230
// Ignore errors of execution if option IGNORE present
1231
if (thd->lex->ignore)
1232
thd->lex->current_select->no_error= 1;
1234
#ifdef HAVE_REF_TO_FIELDS // Not done yet
1235
/* Add HAVING to WHERE if possible */
1236
if (having && !group_list && !sum_func_count)
1243
else if ((conds=new Item_cond_and(conds,having)))
1246
Item_cond_and can't be fixed after creation, so we do not check
1249
conds->fix_fields(thd, &conds);
1250
conds->change_ref_to_fields(thd, tables_list);
1251
conds->top_level_item();
1256
SELECT_LEX *sel= thd->lex->current_select;
1257
if (sel->first_cond_optimization)
1260
The following code will allocate the new items in a permanent
1261
MEMROOT for prepared statements and stored procedures.
1263
sel->first_cond_optimization= 0;
1265
/* Convert all outer joins to inner joins if possible */
1266
conds= simplify_joins(this, join_list, conds, true, false);
1267
build_bitmap_for_nested_joins(join_list, 0);
1270
conds= optimize_cond(this, conds, join_list, &cond_value);
1271
if (thd->is_error())
1278
having= optimize_cond(this, having, join_list, &having_value);
1279
if (thd->is_error())
1284
if (select_lex->where)
1285
select_lex->cond_value= cond_value;
1286
if (select_lex->having)
1287
select_lex->having_value= having_value;
1289
if (cond_value == Item::COND_FALSE || having_value == Item::COND_FALSE ||
1290
(!unit->select_limit_cnt && !(select_options & OPTION_FOUND_ROWS)))
1291
{ /* Impossible cond */
1292
zero_result_cause= having_value == Item::COND_FALSE ?
1293
"Impossible HAVING" : "Impossible WHERE";
1299
/* Optimize count(*), min() and max() */
1300
if (tables_list && tmp_table_param.sum_func_count && ! group_list)
1304
opt_sum_query() returns HA_ERR_KEY_NOT_FOUND if no rows match
1305
to the WHERE conditions,
1306
or 1 if all items were resolved,
1307
or 0, or an error number HA_ERR_...
1309
if ((res=opt_sum_query(select_lex->leaf_tables, all_fields, conds)))
1311
if (res == HA_ERR_KEY_NOT_FOUND)
1313
zero_result_cause= "No matching min/max row";
1324
zero_result_cause= "No matching min/max row";
1328
zero_result_cause= "Select tables optimized away";
1329
tables_list= 0; // All tables resolved
1331
Extract all table-independent conditions and replace the WHERE
1332
clause with them. All other conditions were computed by opt_sum_query
1333
and the MIN/MAX/COUNT function(s) have been replaced by constants,
1334
so there is no need to compute the whole WHERE clause again.
1335
Notice that make_cond_for_table() will always succeed to remove all
1336
computed conditions, because opt_sum_query() is applicable only to
1338
Preserve conditions for EXPLAIN.
1340
if (conds && !(thd->lex->describe & DESCRIBE_EXTENDED))
1342
COND *table_independent_conds=
1343
make_cond_for_table(conds, PSEUDO_TABLE_BITS, 0, 0);
1344
conds= table_independent_conds;
1353
error= -1; // Error is sent to client
1354
sort_by_table= get_sort_by_table(order, group_list, select_lex->leaf_tables);
1356
/* Calculate how to do the join */
1357
thd_proc_info(thd, "statistics");
1358
if (make_join_statistics(this, select_lex->leaf_tables, conds, &keyuse) ||
1359
thd->is_fatal_error)
1364
/* Remove distinct if only const tables */
1365
select_distinct= select_distinct && (const_tables != tables);
1366
thd_proc_info(thd, "preparing");
1367
if (result->initialize_tables(this))
1369
return(1); // error == -1
1371
if (const_table_map != found_const_table_map &&
1372
!(select_options & SELECT_DESCRIBE) &&
1374
!(conds->used_tables() & RAND_TABLE_BIT) ||
1375
select_lex->master_unit() == &thd->lex->unit)) // upper level SELECT
1377
zero_result_cause= "no matching row in const table";
1381
if (!(thd->options & OPTION_BIG_SELECTS) &&
1382
best_read > (double) thd->variables.max_join_size &&
1383
!(select_options & SELECT_DESCRIBE))
1384
{ /* purecov: inspected */
1385
my_message(ER_TOO_BIG_SELECT, ER(ER_TOO_BIG_SELECT), MYF(0));
1389
if (const_tables && !thd->locked_tables &&
1390
!(select_options & SELECT_NO_UNLOCK))
1391
mysql_unlock_some_tables(thd, table, const_tables);
1392
if (!conds && outer_join)
1394
/* Handle the case where we have an OUTER JOIN without a WHERE */
1395
conds=new Item_int((int64_t) 1,1); // Always true
1397
select= make_select(*table, const_table_map,
1398
const_table_map, conds, 1, &error);
1400
{ /* purecov: inspected */
1401
error= -1; /* purecov: inspected */
1405
reset_nj_counters(join_list);
1406
make_outerjoin_info(this);
1409
Among the equal fields belonging to the same multiple equality
1410
choose the one that is to be retrieved first and substitute
1411
all references to these in where condition for a reference for
1416
conds= substitute_for_best_equal_field(conds, cond_equal, map2table);
1417
conds->update_used_tables();
1421
Permorm the the optimization on fields evaluation mentioned above
1422
for all on expressions.
1424
for (JOIN_TAB *tab= join_tab + const_tables; tab < join_tab + tables ; tab++)
1426
if (*tab->on_expr_ref)
1428
*tab->on_expr_ref= substitute_for_best_equal_field(*tab->on_expr_ref,
1431
(*tab->on_expr_ref)->update_used_tables();
1435
if (conds &&!outer_join && const_table_map != found_const_table_map &&
1436
(select_options & SELECT_DESCRIBE) &&
1437
select_lex->master_unit() == &thd->lex->unit) // upper level SELECT
1439
conds=new Item_int((int64_t) 0,1); // Always false
1441
if (make_join_select(this, select, conds))
1444
"Impossible WHERE noticed after reading const tables";
1445
return(0); // error == 0
1448
error= -1; /* if goto err */
1450
/* Optimize distinct away if possible */
1452
order_st *org_order= order;
1453
order=remove_const(this, order,conds,1, &simple_order);
1454
if (thd->is_error())
1461
If we are using order_st BY NULL or order_st BY const_expression,
1462
return result in any order (even if we are using a GROUP BY)
1464
if (!order && org_order)
1468
Check if we can optimize away GROUP BY/DISTINCT.
1469
We can do that if there are no aggregate functions, the
1470
fields in DISTINCT clause (if present) and/or columns in GROUP BY
1471
(if present) contain direct references to all key parts of
1472
an unique index (in whatever order) and if the key parts of the
1473
unique index cannot contain NULLs.
1474
Note that the unique keys for DISTINCT and GROUP BY should not
1475
be the same (as long as they are unique).
1477
The FROM clause must contain a single non-constant table.
1479
if (tables - const_tables == 1 && (group_list || select_distinct) &&
1480
!tmp_table_param.sum_func_count &&
1481
(!join_tab[const_tables].select ||
1482
!join_tab[const_tables].select->quick ||
1483
join_tab[const_tables].select->quick->get_type() !=
1484
QUICK_SELECT_I::QS_TYPE_GROUP_MIN_MAX))
1487
list_contains_unique_index(join_tab[const_tables].table,
1488
find_field_in_order_list,
1489
(void *) group_list))
1492
We have found that grouping can be removed since groups correspond to
1493
only one row anyway, but we still have to guarantee correct result
1494
order. The line below effectively rewrites the query from GROUP BY
1495
<fields> to order_st BY <fields>. There are two exceptions:
1496
- if skip_sort_order is set (see above), then we can simply skip
1498
- we can only rewrite order_st BY if the order_st BY fields are 'compatible'
1499
with the GROUP BY ones, i.e. either one is a prefix of another.
1500
We only check if the order_st BY is a prefix of GROUP BY. In this case
1501
test_if_subpart() copies the ASC/DESC attributes from the original
1503
If GROUP BY is a prefix of order_st BY, then it is safe to leave
1506
if (!order || test_if_subpart(group_list, order))
1507
order= skip_sort_order ? 0 : group_list;
1509
If we have an IGNORE INDEX FOR GROUP BY(fields) clause, this must be
1510
rewritten to IGNORE INDEX FOR order_st BY(fields).
1512
join_tab->table->keys_in_use_for_order_by=
1513
join_tab->table->keys_in_use_for_group_by;
1517
if (select_distinct &&
1518
list_contains_unique_index(join_tab[const_tables].table,
1519
find_field_in_item_list,
1520
(void *) &fields_list))
1525
if (group_list || tmp_table_param.sum_func_count)
1527
if (! hidden_group_fields && rollup.state == ROLLUP::STATE_NONE)
1530
else if (select_distinct && tables - const_tables == 1)
1533
We are only using one table. In this case we change DISTINCT to a
1535
- The GROUP BY can be done through indexes (no sort) and the order_st
1536
BY only uses selected fields.
1537
(In this case we can later optimize away GROUP BY and order_st BY)
1538
- We are scanning the whole table without LIMIT
1540
- We are using CALC_FOUND_ROWS
1541
- We are using an order_st BY that can't be optimized away.
1543
We don't want to use this optimization when we are using LIMIT
1544
because in this case we can just create a temporary table that
1545
holds LIMIT rows and stop when this table is full.
1547
JOIN_TAB *tab= &join_tab[const_tables];
1548
bool all_order_fields_used;
1550
skip_sort_order= test_if_skip_sort_order(tab, order, select_limit, 1,
1551
&tab->table->keys_in_use_for_order_by);
1552
if ((group_list=create_distinct_group(thd, select_lex->ref_pointer_array,
1553
order, fields_list, all_fields,
1554
&all_order_fields_used)))
1556
bool skip_group= (skip_sort_order &&
1557
test_if_skip_sort_order(tab, group_list, select_limit, 1,
1558
&tab->table->keys_in_use_for_group_by) != 0);
1559
count_field_types(select_lex, &tmp_table_param, all_fields, 0);
1560
if ((skip_group && all_order_fields_used) ||
1561
select_limit == HA_POS_ERROR ||
1562
(order && !skip_sort_order))
1564
/* Change DISTINCT to GROUP BY */
1567
if (all_order_fields_used)
1569
if (order && skip_sort_order)
1572
Force MySQL to read the table in sorted order to get result in
1575
tmp_table_param.quick_group=0;
1579
group=1; // For end_write_group
1584
else if (thd->is_fatal_error) // End of memory
1589
order_st *old_group_list;
1590
group_list= remove_const(this, (old_group_list= group_list), conds,
1591
rollup.state == ROLLUP::STATE_NONE,
1593
if (thd->is_error())
1598
if (old_group_list && !group_list)
1601
if (!group_list && group)
1603
order=0; // The output has only one row
1605
select_distinct= 0; // No need in distinct for 1 row
1606
group_optimized_away= 1;
1609
calc_group_buffer(this, group_list);
1610
send_group_parts= tmp_table_param.group_parts; /* Save org parts */
1612
if (test_if_subpart(group_list, order) ||
1613
(!group_list && tmp_table_param.sum_func_count))
1616
// Can't use sort on head table if using row cache
1626
Check if we need to create a temporary table.
1627
This has to be done if all tables are not already read (const tables)
1628
and one of the following conditions holds:
1629
- We are using DISTINCT (simple distinct's are already optimized away)
1630
- We are using an order_st BY or GROUP BY on fields not in the first table
1631
- We are using different order_st BY and GROUP BY orders
1632
- The user wants us to buffer the result.
1634
need_tmp= (const_tables != tables &&
1635
((select_distinct || !simple_order || !simple_group) ||
1636
(group_list && order) ||
1637
test(select_options & OPTION_BUFFER_RESULT)));
1639
uint no_jbuf_after= make_join_orderinfo(this);
1640
uint64_t select_opts_for_readinfo=
1641
(select_options & (SELECT_DESCRIBE | SELECT_NO_JOIN_CACHE)) | (0);
1643
sj_tmp_tables= NULL;
1644
if (!select_lex->sj_nests.is_empty())
1645
setup_semijoin_dups_elimination(this, select_opts_for_readinfo,
1648
// No cache for MATCH == 'Don't use join buffering when we use MATCH'.
1649
if (make_join_readinfo(this, select_opts_for_readinfo, no_jbuf_after))
1652
/* Create all structures needed for materialized subquery execution. */
1653
if (setup_subquery_materialization())
1657
is this simple IN subquery?
1659
if (!group_list && !order &&
1660
unit->item && unit->item->substype() == Item_subselect::IN_SUBS &&
1661
tables == 1 && conds &&
1667
if (join_tab[0].type == JT_EQ_REF &&
1668
join_tab[0].ref.items[0]->name == in_left_expr_name)
1670
remove_subq_pushed_predicates(&where);
1671
save_index_subquery_explain_info(join_tab, where);
1672
join_tab[0].type= JT_UNIQUE_SUBQUERY;
1676
subselect_uniquesubquery_engine(thd,
1681
else if (join_tab[0].type == JT_REF &&
1682
join_tab[0].ref.items[0]->name == in_left_expr_name)
1684
remove_subq_pushed_predicates(&where);
1685
save_index_subquery_explain_info(join_tab, where);
1686
join_tab[0].type= JT_INDEX_SUBQUERY;
1690
subselect_indexsubquery_engine(thd,
1697
} else if (join_tab[0].type == JT_REF_OR_NULL &&
1698
join_tab[0].ref.items[0]->name == in_left_expr_name &&
1699
having->name == in_having_cond)
1701
join_tab[0].type= JT_INDEX_SUBQUERY;
1703
conds= remove_additional_cond(conds);
1704
save_index_subquery_explain_info(join_tab, conds);
1706
change_engine(new subselect_indexsubquery_engine(thd,
1716
Need to tell handlers that to play it safe, it should fetch all
1717
columns of the primary key of the tables: this is because MySQL may
1718
build row pointers for the rows, and for all columns of the primary key
1719
the read set has not necessarily been set by the server code.
1721
if (need_tmp || select_distinct || group_list || order)
1723
for (uint i = const_tables; i < tables; i++)
1724
join_tab[i].table->prepare_for_position();
1727
if (const_tables != tables)
1730
Because filesort always does a full table scan or a quick range scan
1731
we must add the removed reference to the select for the table.
1732
We only need to do this when we have a simple_order or simple_group
1733
as in other cases the join is done before the sort.
1735
if ((order || group_list) &&
1736
(join_tab[const_tables].type != JT_ALL) &&
1737
(join_tab[const_tables].type != JT_REF_OR_NULL) &&
1738
((order && simple_order) || (group_list && simple_group)))
1740
if (add_ref_to_table_cond(thd,&join_tab[const_tables])) {
1745
if (!(select_options & SELECT_BIG_RESULT) &&
1748
!test_if_skip_sort_order(&join_tab[const_tables], group_list,
1749
unit->select_limit_cnt, 0,
1750
&join_tab[const_tables].table->
1751
keys_in_use_for_group_by))) ||
1753
tmp_table_param.quick_group)
1755
need_tmp=1; simple_order=simple_group=0; // Force tmp table without sort
1760
Force using of tmp table if sorting by a SP or UDF function due to
1761
their expensive and probably non-deterministic nature.
1763
for (order_st *tmp_order= order; tmp_order ; tmp_order=tmp_order->next)
1765
Item *item= *tmp_order->item;
1766
if (item->is_expensive())
1768
/* Force tmp table without sort */
1769
need_tmp=1; simple_order=simple_group=0;
1777
if (select_options & SELECT_DESCRIBE)
1785
The loose index scan access method guarantees that all grouping or
1786
duplicate row elimination (for distinct) is already performed
1787
during data retrieval, and that all MIN/MAX functions are already
1788
computed for each group. Thus all MIN/MAX functions should be
1789
treated as regular functions, and there is no need to perform
1790
grouping in the main execution loop.
1791
Notice that currently loose index scan is applicable only for
1792
single table queries, thus it is sufficient to test only the first
1793
join_tab element of the plan for its access method.
1795
if (join_tab->is_using_loose_index_scan())
1796
tmp_table_param.precomputed_group_by= true;
1798
/* Create a tmp table if distinct or if the sort is too complicated */
1801
thd_proc_info(thd, "Creating tmp table");
1803
init_items_ref_array();
1805
tmp_table_param.hidden_field_count= (all_fields.elements -
1806
fields_list.elements);
1807
order_st *tmp_group= ((!simple_group && !(test_flags & TEST_NO_KEY_GROUP)) ? group_list :
1810
Pushing LIMIT to the temporary table creation is not applicable
1811
when there is order_st BY or GROUP BY or there is no GROUP BY, but
1812
there are aggregate functions, because in all these cases we need
1815
ha_rows tmp_rows_limit= ((order == 0 || skip_sort_order) &&
1817
!thd->lex->current_select->with_sum_func) ?
1818
select_limit : HA_POS_ERROR;
1820
if (!(exec_tmp_table1=
1821
create_tmp_table(thd, &tmp_table_param, all_fields,
1823
group_list ? 0 : select_distinct,
1824
group_list && simple_group,
1833
We don't have to store rows in temp table that doesn't match HAVING if:
1834
- we are sorting the table and writing complete group rows to the
1836
- We are using DISTINCT without resolving the distinct as a GROUP BY
1839
If having is not handled here, it will be checked before the row
1840
is sent to the client.
1843
(sort_and_group || (exec_tmp_table1->distinct && !group_list)))
1846
/* if group or order on first table, sort first */
1847
if (group_list && simple_group)
1849
thd_proc_info(thd, "Sorting for group");
1850
if (create_sort_index(thd, this, group_list,
1851
HA_POS_ERROR, HA_POS_ERROR, false) ||
1852
alloc_group_fields(this, group_list) ||
1853
make_sum_func_list(all_fields, fields_list, 1) ||
1854
setup_sum_funcs(thd, sum_funcs))
1862
if (make_sum_func_list(all_fields, fields_list, 0) ||
1863
setup_sum_funcs(thd, sum_funcs))
1868
if (!group_list && ! exec_tmp_table1->distinct && order && simple_order)
1870
thd_proc_info(thd, "Sorting for order");
1871
if (create_sort_index(thd, this, order,
1872
HA_POS_ERROR, HA_POS_ERROR, true))
1881
Optimize distinct when used on some of the tables
1882
SELECT DISTINCT t1.a FROM t1,t2 WHERE t1.b=t2.b
1883
In this case we can stop scanning t2 when we have found one t1.a
1886
if (exec_tmp_table1->distinct)
1888
table_map used_tables= thd->used_tables;
1889
JOIN_TAB *last_join_tab= join_tab+tables-1;
1892
if (used_tables & last_join_tab->table->map)
1894
last_join_tab->not_used_in_distinct=1;
1895
} while (last_join_tab-- != join_tab);
1896
/* Optimize "select distinct b from t1 order by key_part_1 limit #" */
1897
if (order && skip_sort_order)
1899
/* Should always succeed */
1900
if (test_if_skip_sort_order(&join_tab[const_tables],
1901
order, unit->select_limit_cnt, 0,
1902
&join_tab[const_tables].table->
1903
keys_in_use_for_order_by))
1909
If this join belongs to an uncacheable subquery save
1912
if (select_lex->uncacheable && !is_top_level_join() &&
1913
init_save_join_tab())
1914
return(-1); /* purecov: inspected */
1923
Restore values in temporary join.
1925
void JOIN::restore_tmp()
1927
memcpy(tmp_join, this, (size_t) sizeof(JOIN));
1934
unit->offset_limit_cnt= (ha_rows)(select_lex->offset_limit ?
1935
select_lex->offset_limit->val_uint() :
1940
if (exec_tmp_table1)
1942
exec_tmp_table1->file->extra(HA_EXTRA_RESET_STATE);
1943
exec_tmp_table1->file->ha_delete_all_rows();
1944
free_io_cache(exec_tmp_table1);
1945
filesort_free_buffers(exec_tmp_table1,0);
1947
if (exec_tmp_table2)
1949
exec_tmp_table2->file->extra(HA_EXTRA_RESET_STATE);
1950
exec_tmp_table2->file->ha_delete_all_rows();
1951
free_io_cache(exec_tmp_table2);
1952
filesort_free_buffers(exec_tmp_table2,0);
1955
set_items_ref_array(items0);
1958
memcpy(join_tab, join_tab_save, sizeof(JOIN_TAB) * tables);
1963
/* Reset of sum functions */
1966
Item_sum *func, **func_ptr= sum_funcs;
1967
while ((func= *(func_ptr++)))
1975
@brief Save the original join layout
1977
@details Saves the original join layout so it can be reused in
1978
re-execution and for EXPLAIN.
1980
@return Operation status
1982
@retval 1 error occurred.
1986
JOIN::init_save_join_tab()
1988
if (!(tmp_join= (JOIN*)thd->alloc(sizeof(JOIN))))
1989
return 1; /* purecov: inspected */
1990
error= 0; // Ensure that tmp_join.error= 0
1997
JOIN::save_join_tab()
1999
if (!join_tab_save && select_lex->master_unit()->uncacheable)
2001
if (!(join_tab_save= (JOIN_TAB*)thd->memdup((uchar*) join_tab,
2002
sizeof(JOIN_TAB) * tables)))
2013
Note, that create_sort_index calls test_if_skip_sort_order and may
2014
finally replace sorting with index scan if there is a LIMIT clause in
2015
the query. It's never shown in EXPLAIN!
2018
When can we have here thd->net.report_error not zero?
2023
List<Item> *columns_list= &fields_list;
2026
thd_proc_info(thd, "executing");
2028
(void) result->prepare2(); // Currently, this cannot fail.
2030
if (!tables_list && (tables || !select_lex->with_sum_func))
2031
{ // Only test of functions
2032
if (select_options & SELECT_DESCRIBE)
2033
select_describe(this, false, false, false,
2034
(zero_result_cause?zero_result_cause:"No tables used"));
2037
result->send_fields(*columns_list,
2038
Protocol::SEND_NUM_ROWS | Protocol::SEND_EOF);
2040
We have to test for 'conds' here as the WHERE may not be constant
2041
even if we don't have any tables for prepared statements or if
2042
conds uses something like 'rand()'.
2044
if (cond_value != Item::COND_FALSE &&
2045
(!conds || conds->val_int()) &&
2046
(!having || having->val_int()))
2048
if (do_send_rows && result->send_data(fields_list))
2052
error= (int) result->send_eof();
2053
send_records= ((select_options & OPTION_FOUND_ROWS) ? 1 :
2054
thd->sent_row_count);
2059
error=(int) result->send_eof();
2063
/* Single select (without union) always returns 0 or 1 row */
2064
thd->limit_found_rows= send_records;
2065
thd->examined_row_count= 0;
2069
Don't reset the found rows count if there're no tables as
2070
FOUND_ROWS() may be called. Never reset the examined row count here.
2071
It must be accumulated from all join iterations of all join parts.
2074
thd->limit_found_rows= 0;
2076
if (zero_result_cause)
2078
(void) return_zero_rows(this, result, select_lex->leaf_tables,
2080
send_row_on_empty_set(),
2087
if ((this->select_lex->options & OPTION_SCHEMA_TABLE) &&
2088
get_schema_tables_result(this, PROCESSED_BY_JOIN_EXEC))
2091
if (select_options & SELECT_DESCRIBE)
2094
Check if we managed to optimize order_st BY away and don't use temporary
2095
table to resolve order_st BY: in that case, we only may need to do
2096
filesort for GROUP BY.
2098
if (!order && !no_order && (!skip_sort_order || !need_tmp))
2101
Reset 'order' to 'group_list' and reinit variables describing
2105
simple_order= simple_group;
2109
(order != group_list || !(select_options & SELECT_BIG_RESULT)) &&
2110
(const_tables == tables ||
2111
((simple_order || skip_sort_order) &&
2112
test_if_skip_sort_order(&join_tab[const_tables], order,
2114
&join_tab[const_tables].table->
2115
keys_in_use_for_query))))
2118
select_describe(this, need_tmp,
2119
order != 0 && !skip_sort_order,
2121
!tables ? "No tables used" : NullS);
2125
JOIN *curr_join= this;
2126
List<Item> *curr_all_fields= &all_fields;
2127
List<Item> *curr_fields_list= &fields_list;
2128
Table *curr_tmp_table= 0;
2130
Initialize examined rows here because the values from all join parts
2131
must be accumulated in examined_row_count. Hence every join
2132
iteration must count from zero.
2134
curr_join->examined_rows= 0;
2136
/* Create a tmp table if distinct or if the sort is too complicated */
2142
We are in a non cacheable sub query. Get the saved join structure
2144
(curr_join may have been modified during last exection and we need
2147
curr_join= tmp_join;
2149
curr_tmp_table= exec_tmp_table1;
2151
/* Copy data to the temporary table */
2152
thd_proc_info(thd, "Copying to tmp table");
2153
if (!curr_join->sort_and_group &&
2154
curr_join->const_tables != curr_join->tables)
2155
curr_join->join_tab[curr_join->const_tables].sorted= 0;
2156
if ((tmp_error= do_select(curr_join, (List<Item> *) 0, curr_tmp_table)))
2161
curr_tmp_table->file->info(HA_STATUS_VARIABLE);
2163
if (curr_join->having)
2164
curr_join->having= curr_join->tmp_having= 0; // Allready done
2166
/* Change sum_fields reference to calculated fields in tmp_table */
2167
curr_join->all_fields= *curr_all_fields;
2170
items1= items0 + all_fields.elements;
2171
if (sort_and_group || curr_tmp_table->group)
2173
if (change_to_use_tmp_fields(thd, items1,
2174
tmp_fields_list1, tmp_all_fields1,
2175
fields_list.elements, all_fields))
2180
if (change_refs_to_tmp_fields(thd, items1,
2181
tmp_fields_list1, tmp_all_fields1,
2182
fields_list.elements, all_fields))
2185
curr_join->tmp_all_fields1= tmp_all_fields1;
2186
curr_join->tmp_fields_list1= tmp_fields_list1;
2187
curr_join->items1= items1;
2189
curr_all_fields= &tmp_all_fields1;
2190
curr_fields_list= &tmp_fields_list1;
2191
curr_join->set_items_ref_array(items1);
2193
if (sort_and_group || curr_tmp_table->group)
2195
curr_join->tmp_table_param.field_count+=
2196
curr_join->tmp_table_param.sum_func_count+
2197
curr_join->tmp_table_param.func_count;
2198
curr_join->tmp_table_param.sum_func_count=
2199
curr_join->tmp_table_param.func_count= 0;
2203
curr_join->tmp_table_param.field_count+=
2204
curr_join->tmp_table_param.func_count;
2205
curr_join->tmp_table_param.func_count= 0;
2208
if (curr_tmp_table->group)
2209
{ // Already grouped
2210
if (!curr_join->order && !curr_join->no_order && !skip_sort_order)
2211
curr_join->order= curr_join->group_list; /* order by group */
2212
curr_join->group_list= 0;
2216
If we have different sort & group then we must sort the data by group
2217
and copy it to another tmp table
2218
This code is also used if we are using distinct something
2219
we haven't been able to store in the temporary table yet
2220
like SEC_TO_TIME(SUM(...)).
2223
if ((curr_join->group_list && (!test_if_subpart(curr_join->group_list, curr_join->order) || curr_join->select_distinct)) || (curr_join->select_distinct && curr_join->tmp_table_param.using_indirect_summary_function))
2224
{ /* Must copy to another table */
2225
/* Free first data from old join */
2226
curr_join->join_free();
2227
if (make_simple_join(curr_join, curr_tmp_table))
2229
calc_group_buffer(curr_join, group_list);
2230
count_field_types(select_lex, &curr_join->tmp_table_param,
2231
curr_join->tmp_all_fields1,
2232
curr_join->select_distinct && !curr_join->group_list);
2233
curr_join->tmp_table_param.hidden_field_count=
2234
(curr_join->tmp_all_fields1.elements-
2235
curr_join->tmp_fields_list1.elements);
2238
if (exec_tmp_table2)
2239
curr_tmp_table= exec_tmp_table2;
2242
/* group data to new table */
2245
If the access method is loose index scan then all MIN/MAX
2246
functions are precomputed, and should be treated as regular
2247
functions. See extended comment in JOIN::exec.
2249
if (curr_join->join_tab->is_using_loose_index_scan())
2250
curr_join->tmp_table_param.precomputed_group_by= true;
2252
if (!(curr_tmp_table=
2253
exec_tmp_table2= create_tmp_table(thd,
2254
&curr_join->tmp_table_param,
2257
curr_join->select_distinct &&
2258
!curr_join->group_list,
2259
1, curr_join->select_options,
2263
curr_join->exec_tmp_table2= exec_tmp_table2;
2265
if (curr_join->group_list)
2267
thd_proc_info(thd, "Creating sort index");
2268
if (curr_join->join_tab == join_tab && save_join_tab())
2272
if (create_sort_index(thd, curr_join, curr_join->group_list,
2273
HA_POS_ERROR, HA_POS_ERROR, false) ||
2274
make_group_fields(this, curr_join))
2278
sortorder= curr_join->sortorder;
2281
thd_proc_info(thd, "Copying to group table");
2283
if (curr_join != this)
2287
curr_join->sum_funcs= sum_funcs2;
2288
curr_join->sum_funcs_end= sum_funcs_end2;
2292
curr_join->alloc_func_list();
2293
sum_funcs2= curr_join->sum_funcs;
2294
sum_funcs_end2= curr_join->sum_funcs_end;
2297
if (curr_join->make_sum_func_list(*curr_all_fields, *curr_fields_list,
2300
curr_join->group_list= 0;
2301
if (!curr_join->sort_and_group &&
2302
curr_join->const_tables != curr_join->tables)
2303
curr_join->join_tab[curr_join->const_tables].sorted= 0;
2304
if (setup_sum_funcs(curr_join->thd, curr_join->sum_funcs) ||
2305
(tmp_error= do_select(curr_join, (List<Item> *) 0, curr_tmp_table)))
2310
end_read_record(&curr_join->join_tab->read_record);
2311
curr_join->const_tables= curr_join->tables; // Mark free for cleanup()
2312
curr_join->join_tab[0].table= 0; // Table is freed
2314
// No sum funcs anymore
2317
items2= items1 + all_fields.elements;
2318
if (change_to_use_tmp_fields(thd, items2,
2319
tmp_fields_list2, tmp_all_fields2,
2320
fields_list.elements, tmp_all_fields1))
2322
curr_join->tmp_fields_list2= tmp_fields_list2;
2323
curr_join->tmp_all_fields2= tmp_all_fields2;
2325
curr_fields_list= &curr_join->tmp_fields_list2;
2326
curr_all_fields= &curr_join->tmp_all_fields2;
2327
curr_join->set_items_ref_array(items2);
2328
curr_join->tmp_table_param.field_count+=
2329
curr_join->tmp_table_param.sum_func_count;
2330
curr_join->tmp_table_param.sum_func_count= 0;
2332
if (curr_tmp_table->distinct)
2333
curr_join->select_distinct=0; /* Each row is unique */
2335
curr_join->join_free(); /* Free quick selects */
2336
if (curr_join->select_distinct && ! curr_join->group_list)
2338
thd_proc_info(thd, "Removing duplicates");
2339
if (curr_join->tmp_having)
2340
curr_join->tmp_having->update_used_tables();
2341
if (remove_duplicates(curr_join, curr_tmp_table,
2342
*curr_fields_list, curr_join->tmp_having))
2344
curr_join->tmp_having=0;
2345
curr_join->select_distinct=0;
2347
curr_tmp_table->reginfo.lock_type= TL_UNLOCK;
2348
if (make_simple_join(curr_join, curr_tmp_table))
2350
calc_group_buffer(curr_join, curr_join->group_list);
2351
count_field_types(select_lex, &curr_join->tmp_table_param,
2352
*curr_all_fields, 0);
2356
if (curr_join->group || curr_join->tmp_table_param.sum_func_count)
2358
if (make_group_fields(this, curr_join))
2365
init_items_ref_array();
2366
items3= ref_pointer_array + (all_fields.elements*4);
2367
setup_copy_fields(thd, &curr_join->tmp_table_param,
2368
items3, tmp_fields_list3, tmp_all_fields3,
2369
curr_fields_list->elements, *curr_all_fields);
2370
tmp_table_param.save_copy_funcs= curr_join->tmp_table_param.copy_funcs;
2371
tmp_table_param.save_copy_field= curr_join->tmp_table_param.copy_field;
2372
tmp_table_param.save_copy_field_end=
2373
curr_join->tmp_table_param.copy_field_end;
2374
curr_join->tmp_all_fields3= tmp_all_fields3;
2375
curr_join->tmp_fields_list3= tmp_fields_list3;
2379
curr_join->tmp_table_param.copy_funcs= tmp_table_param.save_copy_funcs;
2380
curr_join->tmp_table_param.copy_field= tmp_table_param.save_copy_field;
2381
curr_join->tmp_table_param.copy_field_end=
2382
tmp_table_param.save_copy_field_end;
2384
curr_fields_list= &tmp_fields_list3;
2385
curr_all_fields= &tmp_all_fields3;
2386
curr_join->set_items_ref_array(items3);
2388
if (curr_join->make_sum_func_list(*curr_all_fields, *curr_fields_list,
2390
setup_sum_funcs(curr_join->thd, curr_join->sum_funcs) ||
2391
thd->is_fatal_error)
2394
if (curr_join->group_list || curr_join->order)
2396
thd_proc_info(thd, "Sorting result");
2397
/* If we have already done the group, add HAVING to sorted table */
2398
if (curr_join->tmp_having && ! curr_join->group_list &&
2399
! curr_join->sort_and_group)
2401
// Some tables may have been const
2402
curr_join->tmp_having->update_used_tables();
2403
JOIN_TAB *curr_table= &curr_join->join_tab[curr_join->const_tables];
2404
table_map used_tables= (curr_join->const_table_map |
2405
curr_table->table->map);
2407
Item* sort_table_cond= make_cond_for_table(curr_join->tmp_having,
2410
if (sort_table_cond)
2412
if (!curr_table->select)
2413
if (!(curr_table->select= new SQL_SELECT))
2415
if (!curr_table->select->cond)
2416
curr_table->select->cond= sort_table_cond;
2417
else // This should never happen
2419
if (!(curr_table->select->cond=
2420
new Item_cond_and(curr_table->select->cond,
2424
Item_cond_and do not need fix_fields for execution, its parameters
2425
are fixed or do not need fix_fields, too
2427
curr_table->select->cond->quick_fix_field();
2429
curr_table->select_cond= curr_table->select->cond;
2430
curr_table->select_cond->top_level_item();
2431
curr_join->tmp_having= make_cond_for_table(curr_join->tmp_having,
2438
curr_join->select_limit= HA_POS_ERROR;
2442
We can abort sorting after thd->select_limit rows if we there is no
2443
WHERE clause for any tables after the sorted one.
2445
JOIN_TAB *curr_table= &curr_join->join_tab[curr_join->const_tables+1];
2446
JOIN_TAB *end_table= &curr_join->join_tab[curr_join->tables];
2447
for (; curr_table < end_table ; curr_table++)
2450
table->keyuse is set in the case there was an original WHERE clause
2451
on the table that was optimized away.
2453
if (curr_table->select_cond ||
2454
(curr_table->keyuse && !curr_table->first_inner))
2456
/* We have to sort all rows */
2457
curr_join->select_limit= HA_POS_ERROR;
2462
if (curr_join->join_tab == join_tab && save_join_tab())
2467
Here we sort rows for order_st BY/GROUP BY clause, if the optimiser
2468
chose FILESORT to be faster than INDEX SCAN or there is no
2469
suitable index present.
2470
Note, that create_sort_index calls test_if_skip_sort_order and may
2471
finally replace sorting with index scan if there is a LIMIT clause in
2472
the query. XXX: it's never shown in EXPLAIN!
2473
OPTION_FOUND_ROWS supersedes LIMIT and is taken into account.
2475
if (create_sort_index(thd, curr_join,
2476
curr_join->group_list ?
2477
curr_join->group_list : curr_join->order,
2478
curr_join->select_limit,
2479
(select_options & OPTION_FOUND_ROWS ?
2480
HA_POS_ERROR : unit->select_limit_cnt),
2481
curr_join->group_list ? true : false))
2483
sortorder= curr_join->sortorder;
2484
if (curr_join->const_tables != curr_join->tables &&
2485
!curr_join->join_tab[curr_join->const_tables].table->sort.io_cache)
2488
If no IO cache exists for the first table then we are using an
2489
INDEX SCAN and no filesort. Thus we should not remove the sorted
2490
attribute on the INDEX SCAN.
2496
/* XXX: When can we have here thd->is_error() not zero? */
2497
if (thd->is_error())
2499
error= thd->is_error();
2502
curr_join->having= curr_join->tmp_having;
2503
curr_join->fields= curr_fields_list;
2506
thd_proc_info(thd, "Sending data");
2507
result->send_fields(*curr_fields_list,
2508
Protocol::SEND_NUM_ROWS | Protocol::SEND_EOF);
2509
error= do_select(curr_join, curr_fields_list, NULL);
2510
thd->limit_found_rows= curr_join->send_records;
2513
/* Accumulate the counts from all join iterations of all join parts. */
2514
thd->examined_row_count+= curr_join->examined_rows;
2517
With EXPLAIN EXTENDED we have to restore original ref_array
2518
for a derived table which is always materialized.
2519
Otherwise we would not be able to print the query correctly.
2522
(thd->lex->describe & DESCRIBE_EXTENDED) &&
2523
select_lex->linkage == DERIVED_TABLE_TYPE)
2524
set_items_ref_array(items0);
2534
Return error that hold JOIN.
2540
select_lex->join= 0;
2544
if (join_tab != tmp_join->join_tab)
2546
JOIN_TAB *tab, *end;
2547
for (tab= join_tab, end= tab+tables ; tab != end ; tab++)
2550
tmp_join->tmp_join= 0;
2551
tmp_table_param.copy_field=0;
2552
return(tmp_join->destroy());
2557
if (exec_tmp_table1)
2558
exec_tmp_table1->free_tmp_table(thd);
2559
if (exec_tmp_table2)
2560
exec_tmp_table2->free_tmp_table(thd);
2562
delete_dynamic(&keyuse);
313
2569
An entry point to single-unit select (a select without UNION).
315
@param session thread Cursor
2571
@param thd thread handler
316
2572
@param rref_pointer_array a reference to ref_pointer_array of
317
2573
the top-level select_lex for this query
318
2574
@param tables list of all tables used in this query.
319
2575
The tables have been pre-opened.
320
@param wild_num number of wildcards used in the top level
2576
@param wild_num number of wildcards used in the top level
321
2577
select of this query.
322
2578
For example statement
323
2579
SELECT *, t1.*, catalog.t2.* FROM t0, t1, t2;
444
session->set_proc_info("end");
2703
thd_proc_info(thd, "end");
445
2704
err|= select_lex->cleanup();
446
return(err || session->is_error());
2705
return(err || thd->is_error());
448
2707
return(join->error);
451
inline Item *and_items(Item* cond, Item *item)
2711
int subq_sj_candidate_cmp(Item_in_subselect* const *el1,
2712
Item_in_subselect* const *el2)
2714
return ((*el1)->sj_convert_priority < (*el2)->sj_convert_priority) ? 1 :
2715
( ((*el1)->sj_convert_priority == (*el2)->sj_convert_priority)? 0 : -1);
2719
inline Item * and_items(Item* cond, Item *item)
453
2721
return (cond? (new Item_cond_and(cond, item)) : item);
2725
static TableList *alloc_join_nest(THD *thd)
2728
if (!(tbl= (TableList*) thd->calloc(ALIGN_SIZE(sizeof(TableList))+
2729
sizeof(nested_join_st))))
2731
tbl->nested_join= (nested_join_st*) ((uchar*)tbl +
2732
ALIGN_SIZE(sizeof(TableList)));
2737
void fix_list_after_tbl_changes(SELECT_LEX *new_parent, List<TableList> *tlist)
2739
List_iterator<TableList> it(*tlist);
2741
while ((table= it++))
2744
table->on_expr->fix_after_pullout(new_parent, &table->on_expr);
2745
if (table->nested_join)
2746
fix_list_after_tbl_changes(new_parent, &table->nested_join->join_list);
2752
Convert a subquery predicate into a TableList semi-join nest
2755
convert_subq_to_sj()
2756
parent_join Parent join, the one that has subq_pred in its WHERE/ON
2758
subq_pred Subquery predicate to be converted
2761
Convert a subquery predicate into a TableList semi-join nest. All the
2762
prerequisites are already checked, so the conversion is always successfull.
2764
Prepared Statements: the transformation is permanent:
2765
- Changes in TableList structures are naturally permanent
2766
- Item tree changes are performed on statement MEM_ROOT:
2767
= we activate statement MEM_ROOT
2768
= this function is called before the first fix_prepare_information
2771
This is intended because the criteria for subquery-to-sj conversion remain
2772
constant for the lifetime of the Prepared Statement.
2776
true Out of memory error
2779
bool convert_subq_to_sj(JOIN *parent_join, Item_in_subselect *subq_pred)
2781
SELECT_LEX *parent_lex= parent_join->select_lex;
2782
TableList *emb_tbl_nest= NULL;
2783
List<TableList> *emb_join_list= &parent_lex->top_join_list;
2784
THD *thd= parent_join->thd;
2787
1. Find out where to put the predicate into.
2788
Note: for "t1 LEFT JOIN t2" this will be t2, a leaf.
2790
if ((void*)subq_pred->expr_join_nest != (void*)1)
2792
if (subq_pred->expr_join_nest->nested_join)
2797
... [LEFT] JOIN ( ... ) ON (subquery AND whatever) ...
2799
The sj-nest will be inserted into the brackets nest.
2801
emb_tbl_nest= subq_pred->expr_join_nest;
2802
emb_join_list= &emb_tbl_nest->nested_join->join_list;
2804
else if (!subq_pred->expr_join_nest->outer_join)
2809
... INNER JOIN tblX ON (subquery AND whatever) ...
2811
The sj-nest will be tblX's "sibling", i.e. another child of its
2812
parent. This is ok because tblX is joined as an inner join.
2814
emb_tbl_nest= subq_pred->expr_join_nest->embedding;
2816
emb_join_list= &emb_tbl_nest->nested_join->join_list;
2818
else if (!subq_pred->expr_join_nest->nested_join)
2820
TableList *outer_tbl= subq_pred->expr_join_nest;
2821
TableList *wrap_nest;
2825
... LEFT JOIN tbl ON (on_expr AND subq_pred) ...
2827
we'll need to convert it into:
2829
... LEFT JOIN ( tbl SJ (subq_tables) ) ON (on_expr AND subq_pred) ...
2831
|<----- wrap_nest ---->|
2833
Q: other subqueries may be pointing to this element. What to do?
2834
A1: simple solution: copy *subq_pred->expr_join_nest= *parent_nest.
2835
But we'll need to fix other pointers.
2836
A2: Another way: have TableList::next_ptr so the following
2837
subqueries know the table has been nested.
2838
A3: changes in the TableList::outer_join will make everything work
2841
if (!(wrap_nest= alloc_join_nest(parent_join->thd)))
2845
wrap_nest->embedding= outer_tbl->embedding;
2846
wrap_nest->join_list= outer_tbl->join_list;
2847
wrap_nest->alias= (char*) "(sj-wrap)";
2849
wrap_nest->nested_join->join_list.empty();
2850
wrap_nest->nested_join->join_list.push_back(outer_tbl);
2852
outer_tbl->embedding= wrap_nest;
2853
outer_tbl->join_list= &wrap_nest->nested_join->join_list;
2856
wrap_nest will take place of outer_tbl, so move the outer join flag
2859
wrap_nest->outer_join= outer_tbl->outer_join;
2860
outer_tbl->outer_join= 0;
2862
wrap_nest->on_expr= outer_tbl->on_expr;
2863
outer_tbl->on_expr= NULL;
2865
List_iterator<TableList> li(*wrap_nest->join_list);
2869
if (tbl == outer_tbl)
2871
li.replace(wrap_nest);
2876
Ok now wrap_nest 'contains' outer_tbl and we're ready to add the
2877
semi-join nest into it
2879
emb_join_list= &wrap_nest->nested_join->join_list;
2880
emb_tbl_nest= wrap_nest;
2885
nested_join_st *nested_join;
2886
if (!(sj_nest= alloc_join_nest(parent_join->thd)))
2890
nested_join= sj_nest->nested_join;
2892
sj_nest->join_list= emb_join_list;
2893
sj_nest->embedding= emb_tbl_nest;
2894
sj_nest->alias= (char*) "(sj-nest)";
2895
/* Nests do not participate in those 'chains', so: */
2896
/* sj_nest->next_leaf= sj_nest->next_local= sj_nest->next_global == NULL*/
2897
emb_join_list->push_back(sj_nest);
2900
nested_join->used_tables and nested_join->not_null_tables are
2901
initialized in simplify_joins().
2905
2. Walk through subquery's top list and set 'embedding' to point to the
2908
st_select_lex *subq_lex= subq_pred->unit->first_select();
2909
nested_join->join_list.empty();
2910
List_iterator_fast<TableList> li(subq_lex->top_join_list);
2911
TableList *tl, *last_leaf;
2914
tl->embedding= sj_nest;
2915
tl->join_list= &nested_join->join_list;
2916
nested_join->join_list.push_back(tl);
2920
Reconnect the next_leaf chain.
2921
TODO: Do we have to put subquery's tables at the end of the chain?
2922
Inserting them at the beginning would be a bit faster.
2923
NOTE: We actually insert them at the front! That's because the order is
2924
reversed in this list.
2926
for (tl= parent_lex->leaf_tables; tl->next_leaf; tl= tl->next_leaf) {};
2927
tl->next_leaf= subq_lex->leaf_tables;
2931
Same as above for next_local chain
2932
(a theory: a next_local chain always starts with ::leaf_tables
2933
because view's tables are inserted after the view)
2935
for (tl= parent_lex->leaf_tables; tl->next_local; tl= tl->next_local) {};
2936
tl->next_local= subq_lex->leaf_tables;
2938
/* A theory: no need to re-connect the next_global chain */
2940
/* 3. Remove the original subquery predicate from the WHERE/ON */
2942
// The subqueries were replaced for Item_int(1) earlier
2943
subq_pred->exec_method= Item_in_subselect::SEMI_JOIN; // for subsequent executions
2944
/*TODO: also reset the 'with_subselect' there. */
2946
/* n. Adjust the parent_join->tables counter */
2947
uint table_no= parent_join->tables;
2948
/* n. Walk through child's tables and adjust table->map */
2949
for (tl= subq_lex->leaf_tables; tl; tl= tl->next_leaf, table_no++)
2951
tl->table->tablenr= table_no;
2952
tl->table->map= ((table_map)1) << table_no;
2953
SELECT_LEX *old_sl= tl->select_lex;
2954
tl->select_lex= parent_join->select_lex;
2955
for(TableList *emb= tl->embedding; emb && emb->select_lex == old_sl; emb= emb->embedding)
2956
emb->select_lex= parent_join->select_lex;
2958
parent_join->tables += subq_lex->join->tables;
2961
Put the subquery's WHERE into semi-join's sj_on_expr
2962
Add the subquery-induced equalities too.
2964
SELECT_LEX *save_lex= thd->lex->current_select;
2965
thd->lex->current_select=subq_lex;
2966
if (!subq_pred->left_expr->fixed &&
2967
subq_pred->left_expr->fix_fields(thd, &subq_pred->left_expr))
2969
thd->lex->current_select=save_lex;
2971
sj_nest->nested_join->sj_corr_tables= subq_pred->used_tables();
2972
sj_nest->nested_join->sj_depends_on= subq_pred->used_tables() |
2973
subq_pred->left_expr->used_tables();
2974
sj_nest->sj_on_expr= subq_lex->where;
2977
Create the IN-equalities and inject them into semi-join's ON expression.
2978
Additionally, for InsideOut strategy
2979
- Record the number of IN-equalities.
2980
- Create list of pointers to (oe1, ..., ieN). We'll need the list to
2981
see which of the expressions are bound and which are not (for those
2982
we'll produce a distinct stream of (ie_i1,...ie_ik).
2984
(TODO: can we just create a list of pointers and hope the expressions
2985
will not substitute themselves on fix_fields()? or we need to wrap
2986
them into Item_direct_view_refs and store pointers to those. The
2987
pointers to Item_direct_view_refs are guaranteed to be stable as
2988
Item_direct_view_refs doesn't substitute itself with anything in
2989
Item_direct_view_ref::fix_fields.
2991
sj_nest->sj_in_exprs= subq_pred->left_expr->cols();
2992
sj_nest->nested_join->sj_outer_expr_list.empty();
2994
if (subq_pred->left_expr->cols() == 1)
2996
nested_join->sj_outer_expr_list.push_back(subq_pred->left_expr);
2998
Item *item_eq= new Item_func_eq(subq_pred->left_expr,
2999
subq_lex->ref_pointer_array[0]);
3000
item_eq->name= (char*)subq_sj_cond_name;
3001
sj_nest->sj_on_expr= and_items(sj_nest->sj_on_expr, item_eq);
3005
for (uint i= 0; i < subq_pred->left_expr->cols(); i++)
3007
nested_join->sj_outer_expr_list.push_back(subq_pred->left_expr->
3010
new Item_func_eq(subq_pred->left_expr->element_index(i),
3011
subq_lex->ref_pointer_array[i]);
3012
item_eq->name= (char*)subq_sj_cond_name + (i % 64);
3013
sj_nest->sj_on_expr= and_items(sj_nest->sj_on_expr, item_eq);
3016
/* Fix the created equality and AND */
3017
sj_nest->sj_on_expr->fix_fields(parent_join->thd, &sj_nest->sj_on_expr);
3020
Walk through sj nest's WHERE and ON expressions and call
3021
item->fix_table_changes() for all items.
3023
sj_nest->sj_on_expr->fix_after_pullout(parent_lex, &sj_nest->sj_on_expr);
3024
fix_list_after_tbl_changes(parent_lex, &sj_nest->nested_join->join_list);
3027
/* Unlink the child select_lex so it doesn't show up in EXPLAIN: */
3028
subq_lex->master_unit()->exclude_level();
3030
/* Inject sj_on_expr into the parent's WHERE or ON */
3033
emb_tbl_nest->on_expr= and_items(emb_tbl_nest->on_expr,
3034
sj_nest->sj_on_expr);
3035
emb_tbl_nest->on_expr->fix_fields(parent_join->thd, &emb_tbl_nest->on_expr);
3039
/* Inject into the WHERE */
3040
parent_join->conds= and_items(parent_join->conds, sj_nest->sj_on_expr);
3041
parent_join->conds->fix_fields(parent_join->thd, &parent_join->conds);
3042
parent_join->select_lex->where= parent_join->conds;
3050
Convert candidate subquery predicates to semi-joins
3053
JOIN::flatten_subqueries()
3056
Convert candidate subquery predicates to semi-joins.
3063
bool JOIN::flatten_subqueries()
3065
Item_in_subselect **in_subq;
3066
Item_in_subselect **in_subq_end;
3068
if (sj_subselects.elements() == 0)
3071
/* 1. Fix children subqueries */
3072
for (in_subq= sj_subselects.front(), in_subq_end= sj_subselects.back();
3073
in_subq != in_subq_end; in_subq++)
3075
JOIN *child_join= (*in_subq)->unit->first_select()->join;
3076
child_join->outer_tables = child_join->tables;
3077
if (child_join->flatten_subqueries())
3079
(*in_subq)->sj_convert_priority=
3080
(*in_subq)->is_correlated * MAX_TABLES + child_join->outer_tables;
3083
//dump_TableList_struct(select_lex, select_lex->leaf_tables);
3085
2. Pick which subqueries to convert:
3086
sort the subquery array
3087
- prefer correlated subqueries over uncorrelated;
3088
- prefer subqueries that have greater number of outer tables;
3090
sj_subselects.sort(subq_sj_candidate_cmp);
3091
// #tables-in-parent-query + #tables-in-subquery < MAX_TABLES
3092
/* Replace all subqueries to be flattened with Item_int(1) */
3093
for (in_subq= sj_subselects.front();
3094
in_subq != in_subq_end &&
3095
tables + ((*in_subq)->sj_convert_priority % MAX_TABLES) < MAX_TABLES;
3098
if (replace_where_subcondition(this, *in_subq, new Item_int(1), false))
3102
for (in_subq= sj_subselects.front();
3103
in_subq != in_subq_end &&
3104
tables + ((*in_subq)->sj_convert_priority % MAX_TABLES) < MAX_TABLES;
3107
if (convert_subq_to_sj(this, *in_subq))
3111
/* 3. Finalize those we didn't convert */
3112
for (; in_subq!= in_subq_end; in_subq++)
3114
JOIN *child_join= (*in_subq)->unit->first_select()->join;
3115
Item_subselect::trans_res res;
3116
(*in_subq)->changed= 0;
3117
(*in_subq)->fixed= 0;
3118
res= (*in_subq)->select_transformer(child_join);
3119
if (res == Item_subselect::RES_ERROR)
3122
(*in_subq)->changed= 1;
3123
(*in_subq)->fixed= 1;
3125
Item *substitute= (*in_subq)->substitution;
3126
bool do_fix_fields= !(*in_subq)->substitution->fixed;
3127
if (replace_where_subcondition(this, *in_subq, substitute, do_fix_fields))
3130
//if ((*in_subq)->fix_fields(thd, (*in_subq)->ref_ptr))
3133
sj_subselects.clear();
3139
Setup for execution all subqueries of a query, for which the optimizer
3140
chose hash semi-join.
3142
@details Iterate over all subqueries of the query, and if they are under an
3143
IN predicate, and the optimizer chose to compute it via hash semi-join:
3144
- try to initialize all data structures needed for the materialized execution
3145
of the IN predicate,
3146
- if this fails, then perform the IN=>EXISTS transformation which was
3147
previously blocked during JOIN::prepare.
3149
This method is part of the "code generation" query processing phase.
3151
This phase must be called after substitute_for_best_equal_field() because
3152
that function may replace items with other items from a multiple equality,
3153
and we need to reference the correct items in the index access method of the
3156
@return Operation status
3157
@retval false success.
3158
@retval true error occurred.
3161
bool JOIN::setup_subquery_materialization()
3163
for (SELECT_LEX_UNIT *un= select_lex->first_inner_unit(); un;
3164
un= un->next_unit())
3166
for (SELECT_LEX *sl= un->first_select(); sl; sl= sl->next_select())
3168
Item_subselect *subquery_predicate= sl->master_unit()->item;
3169
if (subquery_predicate &&
3170
subquery_predicate->substype() == Item_subselect::IN_SUBS)
3172
Item_in_subselect *in_subs= (Item_in_subselect*) subquery_predicate;
3173
if (in_subs->exec_method == Item_in_subselect::MATERIALIZATION &&
3174
in_subs->setup_engine())
3184
Check if table's KEYUSE elements have an eq_ref(outer_tables) candidate
3187
find_eq_ref_candidate()
3188
table Table to be checked
3189
sj_inner_tables Bitmap of inner tables. eq_ref(inner_table) doesn't
3193
Check if table's KEYUSE elements have an eq_ref(outer_tables) candidate
3196
Check again if it is feasible to factor common parts with constant table
3200
true - There exists an eq_ref(outer-tables) candidate
3204
bool find_eq_ref_candidate(Table *table, table_map sj_inner_tables)
3206
KEYUSE *keyuse= table->reginfo.join_tab->keyuse;
3211
while (1) /* For each key */
3214
KEY *keyinfo= table->key_info + key;
3215
key_part_map bound_parts= 0;
3216
if ((keyinfo->flags & HA_NOSAME) == HA_NOSAME)
3218
do /* For all equalities on all key parts */
3220
/* Check if this is "t.keypart = expr(outer_tables) */
3221
if (!(keyuse->used_tables & sj_inner_tables) &&
3222
!(keyuse->optimize & KEY_OPTIMIZE_REF_OR_NULL))
3224
bound_parts |= 1 << keyuse->keypart;
3227
} while (keyuse->key == key && keyuse->table == table);
3229
if (bound_parts == PREV_BITS(uint, keyinfo->key_parts))
3231
if (keyuse->table != table)
3239
if (keyuse->table != table)
3242
while (keyuse->key == key);
3251
Pull tables out of semi-join nests, if possible
3254
pull_out_semijoin_tables()
3255
join The join where to do the semi-join flattening
3258
Try to pull tables out of semi-join nests.
3261
When this function is called, the join may have several semi-join nests
3262
(possibly within different semi-join nests), but it is guaranteed that
3263
one semi-join nest does not contain another.
3266
A table can be pulled out of the semi-join nest if
3267
- It is a constant table
3271
* Pulled out tables have JOIN_TAB::emb_sj_nest == NULL (like the outer
3273
* Tables that were not pulled out have JOIN_TAB::emb_sj_nest.
3274
* Semi-join nests TableList::sj_inner_tables
3276
This operation is (and should be) performed at each PS execution since
3277
tables may become/cease to be constant across PS reexecutions.
3281
1 - Out of memory error
3284
int pull_out_semijoin_tables(JOIN *join)
3287
List_iterator<TableList> sj_list_it(join->select_lex->sj_nests);
3289
/* Try pulling out of the each of the semi-joins */
3290
while ((sj_nest= sj_list_it++))
3292
/* Action #1: Mark the constant tables to be pulled out */
3293
table_map pulled_tables= 0;
3295
List_iterator<TableList> child_li(sj_nest->nested_join->join_list);
3297
while ((tbl= child_li++))
3301
tbl->table->reginfo.join_tab->emb_sj_nest= sj_nest;
3302
if (tbl->table->map & join->const_table_map)
3304
pulled_tables |= tbl->table->map;
3310
Action #2: Find which tables we can pull out based on
3311
update_ref_and_keys() data. Note that pulling one table out can allow
3312
us to pull out some other tables too.
3314
bool pulled_a_table;
3317
pulled_a_table= false;
3319
while ((tbl= child_li++))
3321
if (tbl->table && !(pulled_tables & tbl->table->map))
3323
if (find_eq_ref_candidate(tbl->table,
3324
sj_nest->nested_join->used_tables &
3327
pulled_a_table= true;
3328
pulled_tables |= tbl->table->map;
3332
} while (pulled_a_table);
3335
if ((sj_nest)->nested_join->used_tables == pulled_tables)
3337
(sj_nest)->sj_inner_tables= 0;
3338
while ((tbl= child_li++))
3341
tbl->table->reginfo.join_tab->emb_sj_nest= NULL;
3346
/* Record the bitmap of inner tables, mark the inner tables */
3347
table_map inner_tables=(sj_nest)->nested_join->used_tables &
3349
(sj_nest)->sj_inner_tables= inner_tables;
3350
while ((tbl= child_li++))
3354
if (inner_tables & tbl->table->map)
3355
tbl->table->reginfo.join_tab->emb_sj_nest= (sj_nest);
3357
tbl->table->reginfo.join_tab->emb_sj_nest= NULL;
456
3365
/*****************************************************************************
457
Create JoinTableS, make a guess about the table types,
3366
Create JOIN_TABS, make a guess about the table types,
458
3367
Approximate how many records will be used in each table
459
3368
*****************************************************************************/
460
ha_rows get_quick_record_count(Session *session, optimizer::SqlSelect *select, Table *table, const key_map *keys,ha_rows limit)
3371
static ha_rows get_quick_record_count(THD *thd, SQL_SELECT *select,
3373
const key_map *keys,ha_rows limit)
463
if (check_stack_overrun(session, STACK_MIN_SIZE, NULL))
3376
if (check_stack_overrun(thd, STACK_MIN_SIZE, NULL))
464
3377
return(0); // Fatal error flag is set
467
3380
select->head=table;
468
3381
table->reginfo.impossible_range=0;
469
if ((error= select->test_quick_select(session, *(key_map *)keys,(table_map) 0,
3382
if ((error= select->test_quick_select(thd, *(key_map *)keys,(table_map) 0,
470
3383
limit, 0, false)) == 1)
471
3384
return(select->quick->records);
472
3385
if (error == -1)
478
3391
return(HA_POS_ERROR); /* This shouldn't happend */
3395
This structure is used to collect info on potentially sargable
3396
predicates in order to check whether they become sargable after
3397
reading const tables.
3398
We form a bitmap of indexes that can be used for sargable predicates.
3399
Only such indexes are involved in range analysis.
3401
typedef struct st_sargable_param
3403
Field *field; /* field against which to check sargability */
3404
Item **arg_value; /* values of potential keys for lookups */
3405
uint num_values; /* number of values in the above array */
3409
Calculate the best possible join and initialize the join structure.
3418
make_join_statistics(JOIN *join, TableList *tables, COND *conds,
3419
DYNAMIC_ARRAY *keyuse_array)
3423
uint i,table_count,const_count,key;
3424
table_map found_const_table_map, all_table_map, found_ref, refs;
3425
key_map const_ref, eq_part;
3426
Table **table_vector;
3427
JOIN_TAB *stat,*stat_end,*s,**stat_ref;
3428
KEYUSE *keyuse,*start_keyuse;
3429
table_map outer_join=0;
3430
SARGABLE_PARAM *sargables= 0;
3431
JOIN_TAB *stat_vector[MAX_TABLES+1];
3433
table_count=join->tables;
3434
stat=(JOIN_TAB*) join->thd->calloc(sizeof(JOIN_TAB)*table_count);
3435
stat_ref=(JOIN_TAB**) join->thd->alloc(sizeof(JOIN_TAB*)*MAX_TABLES);
3436
table_vector=(Table**) join->thd->alloc(sizeof(Table*)*(table_count*2));
3437
if (!stat || !stat_ref || !table_vector)
3438
return(1); // Eom /* purecov: inspected */
3440
join->best_ref=stat_vector;
3442
stat_end=stat+table_count;
3443
found_const_table_map= all_table_map=0;
3448
s++, tables= tables->next_leaf, i++)
3450
TableList *embedding= tables->embedding;
3453
s->const_keys.init();
3454
s->checked_keys.init();
3455
s->needed_reg.init();
3456
table_vector[i]=s->table=table=tables->table;
3457
table->pos_in_table_list= tables;
3458
error= table->file->info(HA_STATUS_VARIABLE | HA_STATUS_NO_LOCK);
3461
table->file->print_error(error, MYF(0));
3464
table->quick_keys.clear_all();
3465
table->reginfo.join_tab=s;
3466
table->reginfo.not_exists_optimize=0;
3467
memset(table->const_key_parts, 0,
3468
sizeof(key_part_map)*table->s->keys);
3469
all_table_map|= table->map;
3471
s->info=0; // For describe
3473
s->dependent= tables->dep_tables;
3474
s->key_dependent= 0;
3475
if (tables->schema_table)
3476
table->file->stats.records= 2;
3477
table->quick_condition_rows= table->file->stats.records;
3479
s->on_expr_ref= &tables->on_expr;
3480
if (*s->on_expr_ref)
3482
/* s is the only inner table of an outer join */
3483
if (!table->file->stats.records && !embedding)
3485
s->dependent= 0; // Ignore LEFT JOIN depend.
3486
set_position(join,const_count++,s,(KEYUSE*) 0);
3489
outer_join|= table->map;
3490
s->embedding_map= 0;
3491
for (;embedding; embedding= embedding->embedding)
3492
s->embedding_map|= embedding->nested_join->nj_map;
3495
if (embedding && !(embedding->sj_on_expr && ! embedding->embedding))
3497
/* s belongs to a nested join, maybe to several embedded joins */
3498
s->embedding_map= 0;
3501
nested_join_st *nested_join= embedding->nested_join;
3502
s->embedding_map|=nested_join->nj_map;
3503
s->dependent|= embedding->dep_tables;
3504
embedding= embedding->embedding;
3505
outer_join|= nested_join->used_tables;
3510
if ((table->file->stats.records <= 1) &&
3512
(table->file->ha_table_flags() & HA_STATS_RECORDS_IS_EXACT) && !join->no_const_tables)
3514
set_position(join,const_count++,s,(KEYUSE*) 0);
3518
join->outer_join=outer_join;
3520
if (join->outer_join)
3523
Build transitive closure for relation 'to be dependent on'.
3524
This will speed up the plan search for many cases with outer joins,
3525
as well as allow us to catch illegal cross references/
3526
Warshall's algorithm is used to build the transitive closure.
3527
As we use bitmaps to represent the relation the complexity
3528
of the algorithm is O((number of tables)^2).
3530
for (i= 0, s= stat ; i < table_count ; i++, s++)
3532
for (uint j= 0 ; j < table_count ; j++)
3534
table= stat[j].table;
3535
if (s->dependent & table->map)
3536
s->dependent |= table->reginfo.join_tab->dependent;
3539
s->table->maybe_null= 1;
3541
/* Catch illegal cross references for outer joins */
3542
for (i= 0, s= stat ; i < table_count ; i++, s++)
3544
if (s->dependent & s->table->map)
3546
join->tables=0; // Don't use join->table
3547
my_message(ER_WRONG_OUTER_JOIN, ER(ER_WRONG_OUTER_JOIN), MYF(0));
3550
s->key_dependent= s->dependent;
3554
if (conds || outer_join)
3555
if (update_ref_and_keys(join->thd, keyuse_array, stat, join->tables,
3556
conds, join->cond_equal,
3557
~outer_join, join->select_lex, &sargables))
3560
/* Read tables with 0 or 1 rows (system tables) */
3561
join->const_table_map= 0;
3563
for (POSITION *p_pos=join->positions, *p_end=p_pos+const_count;
3570
join->const_table_map|=s->table->map;
3571
if ((tmp=join_read_const_table(s, p_pos)))
3574
return(1); // Fatal error
3577
found_const_table_map|= s->table->map;
3580
/* loop until no more const tables are found */
3584
more_const_tables_found:
3589
We only have to loop from stat_vector + const_count as
3590
set_position() will move all const_tables first in stat_vector
3593
for (JOIN_TAB **pos=stat_vector+const_count ; (s= *pos) ; pos++)
3598
If equi-join condition by a key is null rejecting and after a
3599
substitution of a const table the key value happens to be null
3600
then we can state that there are no matches for this equi-join.
3602
if ((keyuse= s->keyuse) && *s->on_expr_ref && !s->embedding_map)
3605
When performing an outer join operation if there are no matching rows
3606
for the single row of the outer table all the inner tables are to be
3607
null complemented and thus considered as constant tables.
3608
Here we apply this consideration to the case of outer join operations
3609
with a single inner table only because the case with nested tables
3610
would require a more thorough analysis.
3611
TODO. Apply single row substitution to null complemented inner tables
3612
for nested outer join operations.
3614
while (keyuse->table == table)
3616
if (!(keyuse->val->used_tables() & ~join->const_table_map) &&
3617
keyuse->val->is_null() && keyuse->null_rejecting)
3620
mark_as_null_row(table);
3621
found_const_table_map|= table->map;
3622
join->const_table_map|= table->map;
3623
set_position(join,const_count++,s,(KEYUSE*) 0);
3624
goto more_const_tables_found;
3630
if (s->dependent) // If dependent on some table
3632
// All dep. must be constants
3633
if (s->dependent & ~(found_const_table_map))
3635
if (table->file->stats.records <= 1L &&
3636
(table->file->ha_table_flags() & HA_STATS_RECORDS_IS_EXACT) &&
3637
!table->pos_in_table_list->embedding)
3641
join->const_table_map|=table->map;
3642
set_position(join,const_count++,s,(KEYUSE*) 0);
3643
if ((tmp= join_read_const_table(s, join->positions+const_count-1)))
3646
return(1); // Fatal error
3649
found_const_table_map|= table->map;
3653
/* check if table can be read by key or table only uses const refs */
3654
if ((keyuse=s->keyuse))
3657
while (keyuse->table == table)
3659
start_keyuse=keyuse;
3661
s->keys.set_bit(key); // QQ: remove this ?
3664
const_ref.clear_all();
3665
eq_part.clear_all();
3668
if (keyuse->val->type() != Item::NULL_ITEM && !keyuse->optimize)
3670
if (!((~found_const_table_map) & keyuse->used_tables))
3671
const_ref.set_bit(keyuse->keypart);
3673
refs|=keyuse->used_tables;
3674
eq_part.set_bit(keyuse->keypart);
3677
} while (keyuse->table == table && keyuse->key == key);
3679
if (eq_part.is_prefix(table->key_info[key].key_parts) &&
3680
!table->pos_in_table_list->embedding)
3682
if ((table->key_info[key].flags & (HA_NOSAME))
3685
if (const_ref == eq_part)
3686
{ // Found everything for ref.
3690
join->const_table_map|=table->map;
3691
set_position(join,const_count++,s,start_keyuse);
3692
if (create_ref_for_key(join, s, start_keyuse,
3693
found_const_table_map))
3695
if ((tmp=join_read_const_table(s,
3696
join->positions+const_count-1)))
3699
return(1); // Fatal error
3702
found_const_table_map|= table->map;
3706
found_ref|= refs; // Table is const if all refs are const
3708
else if (const_ref == eq_part)
3709
s->const_keys.set_bit(key);
3714
} while (join->const_table_map & found_ref && ref_changed);
3717
Update info on indexes that can be used for search lookups as
3718
reading const tables may has added new sargable predicates.
3720
if (const_count && sargables)
3722
for( ; sargables->field ; sargables++)
3724
Field *field= sargables->field;
3725
JOIN_TAB *join_tab= field->table->reginfo.join_tab;
3726
key_map possible_keys= field->key_start;
3727
possible_keys.intersect(field->table->keys_in_use_for_query);
3729
for (uint j=0; j < sargables->num_values; j++)
3730
is_const&= sargables->arg_value[j]->const_item();
3732
join_tab[0].const_keys.merge(possible_keys);
3736
if (pull_out_semijoin_tables(join))
3739
/* Calc how many (possible) matched records in each table */
3741
for (s=stat ; s < stat_end ; s++)
3743
if (s->type == JT_SYSTEM || s->type == JT_CONST)
3745
/* Only one matching row */
3746
s->found_records=s->records=s->read_time=1; s->worst_seeks=1.0;
3749
/* Approximate found rows and time to read them */
3750
s->found_records=s->records=s->table->file->stats.records;
3751
s->read_time=(ha_rows) s->table->file->scan_time();
3754
Set a max range of how many seeks we can expect when using keys
3755
This is can't be to high as otherwise we are likely to use
3758
s->worst_seeks= min((double) s->found_records / 10,
3759
(double) s->read_time*3);
3760
if (s->worst_seeks < 2.0) // Fix for small tables
3764
Add to stat->const_keys those indexes for which all group fields or
3765
all select distinct fields participate in one index.
3767
add_group_and_distinct_keys(join, s);
3769
if (!s->const_keys.is_clear_all() &&
3770
!s->table->pos_in_table_list->embedding)
3774
select= make_select(s->table, found_const_table_map,
3775
found_const_table_map,
3776
*s->on_expr_ref ? *s->on_expr_ref : conds,
3780
records= get_quick_record_count(join->thd, select, s->table,
3781
&s->const_keys, join->row_limit);
3782
s->quick=select->quick;
3783
s->needed_reg=select->needed_reg;
3785
if (records == 0 && s->table->reginfo.impossible_range)
3788
Impossible WHERE or ON expression
3789
In case of ON, we mark that the we match one empty NULL row.
3790
In case of WHERE, don't set found_const_table_map to get the
3791
caller to abort with a zero row result.
3793
join->const_table_map|= s->table->map;
3794
set_position(join,const_count++,s,(KEYUSE*) 0);
3796
if (*s->on_expr_ref)
3798
/* Generate empty row */
3799
s->info= "Impossible ON condition";
3800
found_const_table_map|= s->table->map;
3802
mark_as_null_row(s->table); // All fields are NULL
3805
if (records != HA_POS_ERROR)
3807
s->found_records=records;
3808
s->read_time= (ha_rows) (s->quick ? s->quick->read_time : 0.0);
3814
join->join_tab=stat;
3815
join->map2table=stat_ref;
3816
join->table= join->all_tables=table_vector;
3817
join->const_tables=const_count;
3818
join->found_const_table_map=found_const_table_map;
3820
/* Find an optimal join order of the non-constant tables. */
3821
if (join->const_tables != join->tables)
3823
optimize_keyuse(join, keyuse_array);
3824
if (choose_plan(join, all_table_map & ~join->const_table_map))
3829
memcpy(join->best_positions, join->positions,
3830
sizeof(POSITION)*join->const_tables);
3831
join->best_read=1.0;
3833
/* Generate an execution plan from the found optimal join order. */
3834
return(join->thd->killed || get_best_combination(join));
481
3838
/*****************************************************************************
482
3839
Check with keys are used and with tables references with tables
483
3840
Updates in stat:
486
3843
keyuse Pointer to possible keys
487
3844
*****************************************************************************/
3846
/// Used when finding key fields
3847
typedef struct key_field_t {
3849
Item *val; ///< May be empty if diff constant
3851
uint optimize; // KEY_OPTIMIZE_*
3854
If true, the condition this struct represents will not be satisfied
3857
bool null_rejecting;
3858
bool *cond_guard; /* See KEYUSE::cond_guard */
3859
uint sj_pred_no; /* See KEYUSE::sj_pred_no */
3863
Merge new key definitions to old ones, remove those not used in both.
3865
This is called for OR between different levels.
3867
To be able to do 'ref_or_null' we merge a comparison of a column
3868
and 'column IS NULL' to one test. This is useful for sub select queries
3869
that are internally transformed to something like:.
3872
SELECT * FROM t1 WHERE t1.key=outer_ref_field or t1.key IS NULL
3875
KEY_FIELD::null_rejecting is processed as follows: @n
3876
result has null_rejecting=true if it is set for both ORed references.
3878
- (t2.key = t1.field OR t2.key = t1.field) -> null_rejecting=true
3879
- (t2.key = t1.field OR t2.key <=> t1.field) -> null_rejecting=false
3882
The result of this is that we're missing some 'ref' accesses.
3883
OptimizerTeam: Fix this
3887
merge_key_fields(KEY_FIELD *start,KEY_FIELD *new_fields,KEY_FIELD *end,
3890
if (start == new_fields)
3891
return start; // Impossible or
3892
if (new_fields == end)
3893
return start; // No new fields, skip all
3895
KEY_FIELD *first_free=new_fields;
3897
/* Mark all found fields in old array */
3898
for (; new_fields != end ; new_fields++)
3900
for (KEY_FIELD *old=start ; old != first_free ; old++)
3902
if (old->field == new_fields->field)
3905
NOTE: below const_item() call really works as "!used_tables()", i.e.
3906
it can return false where it is feasible to make it return true.
3908
The cause is as follows: Some of the tables are already known to be
3909
const tables (the detection code is in make_join_statistics(),
3910
above the update_ref_and_keys() call), but we didn't propagate
3911
information about this: Table::const_table is not set to true, and
3912
Item::update_used_tables() hasn't been called for each item.
3913
The result of this is that we're missing some 'ref' accesses.
3914
TODO: OptimizerTeam: Fix this
3916
if (!new_fields->val->const_item())
3919
If the value matches, we can use the key reference.
3920
If not, we keep it until we have examined all new values
3922
if (old->val->eq(new_fields->val, old->field->binary()))
3924
old->level= and_level;
3925
old->optimize= ((old->optimize & new_fields->optimize &
3926
KEY_OPTIMIZE_EXISTS) |
3927
((old->optimize | new_fields->optimize) &
3928
KEY_OPTIMIZE_REF_OR_NULL));
3929
old->null_rejecting= (old->null_rejecting &&
3930
new_fields->null_rejecting);
3933
else if (old->eq_func && new_fields->eq_func &&
3934
old->val->eq_by_collation(new_fields->val,
3935
old->field->binary(),
3936
old->field->charset()))
3939
old->level= and_level;
3940
old->optimize= ((old->optimize & new_fields->optimize &
3941
KEY_OPTIMIZE_EXISTS) |
3942
((old->optimize | new_fields->optimize) &
3943
KEY_OPTIMIZE_REF_OR_NULL));
3944
old->null_rejecting= (old->null_rejecting &&
3945
new_fields->null_rejecting);
3947
else if (old->eq_func && new_fields->eq_func &&
3948
((old->val->const_item() && old->val->is_null()) ||
3949
new_fields->val->is_null()))
3951
/* field = expression OR field IS NULL */
3952
old->level= and_level;
3953
old->optimize= KEY_OPTIMIZE_REF_OR_NULL;
3955
Remember the NOT NULL value unless the value does not depend
3958
if (!old->val->used_tables() && old->val->is_null())
3959
old->val= new_fields->val;
3960
/* The referred expression can be NULL: */
3961
old->null_rejecting= 0;
3966
We are comparing two different const. In this case we can't
3967
use a key-lookup on this so it's better to remove the value
3968
and let the range optimzier handle it
3970
if (old == --first_free) // If last item
3972
*old= *first_free; // Remove old value
3973
old--; // Retry this value
3978
/* Remove all not used items */
3979
for (KEY_FIELD *old=start ; old != first_free ;)
3981
if (old->level != and_level)
3982
{ // Not used in all levels
3983
if (old == --first_free)
3985
*old= *first_free; // Remove old value
3995
Add a possible key to array of possible keys if it's usable as a key
3997
@param key_fields Pointer to add key, if usable
3998
@param and_level And level, to be stored in KEY_FIELD
3999
@param cond Condition predicate
4000
@param field Field used in comparision
4001
@param eq_func True if we used =, <=> or IS NULL
4002
@param value Value used for comparison with field
4003
@param usable_tables Tables which can be used for key optimization
4004
@param sargables IN/OUT Array of found sargable candidates
4007
If we are doing a NOT NULL comparison on a NOT NULL field in a outer join
4008
table, we store this to be able to do not exists optimization later.
4011
*key_fields is incremented if we stored a key in the array
4015
add_key_field(KEY_FIELD **key_fields,uint and_level, Item_func *cond,
4016
Field *field, bool eq_func, Item **value, uint num_values,
4017
table_map usable_tables, SARGABLE_PARAM **sargables)
4019
uint exists_optimize= 0;
4020
if (!(field->flags & PART_KEY_FLAG))
4022
// Don't remove column IS NULL on a LEFT JOIN table
4023
if (!eq_func || (*value)->type() != Item::NULL_ITEM ||
4024
!field->table->maybe_null || field->null_ptr)
4025
return; // Not a key. Skip it
4026
exists_optimize= KEY_OPTIMIZE_EXISTS;
4027
assert(num_values == 1);
4031
table_map used_tables=0;
4033
for (uint i=0; i<num_values; i++)
4035
used_tables|=(value[i])->used_tables();
4036
if (!((value[i])->used_tables() & (field->table->map | RAND_TABLE_BIT)))
4041
if (!(usable_tables & field->table->map))
4043
if (!eq_func || (*value)->type() != Item::NULL_ITEM ||
4044
!field->table->maybe_null || field->null_ptr)
4045
return; // Can't use left join optimize
4046
exists_optimize= KEY_OPTIMIZE_EXISTS;
4050
JOIN_TAB *stat=field->table->reginfo.join_tab;
4051
key_map possible_keys=field->key_start;
4052
possible_keys.intersect(field->table->keys_in_use_for_query);
4053
stat[0].keys.merge(possible_keys); // Add possible keys
4056
Save the following cases:
4058
Field LIKE constant where constant doesn't start with a wildcard
4059
Field = field2 where field2 is in a different table
4066
stat[0].key_dependent|=used_tables;
4069
for (uint i=0; i<num_values; i++)
4071
if (!(is_const&= value[i]->const_item()))
4075
stat[0].const_keys.merge(possible_keys);
4079
Save info to be able check whether this predicate can be
4080
considered as sargable for range analisis after reading const tables.
4081
We do not save info about equalities as update_const_equal_items
4082
will take care of updating info on keys from sargable equalities.
4085
(*sargables)->field= field;
4086
(*sargables)->arg_value= value;
4087
(*sargables)->num_values= num_values;
4090
We can't always use indexes when comparing a string index to a
4091
number. cmp_type() is checked to allow compare of dates to numbers.
4092
eq_func is NEVER true when num_values > 1
4097
Additional optimization: if we're processing
4098
"t.key BETWEEN c1 AND c1" then proceed as if we were processing
4100
TODO: This is a very limited fix. A more generic fix is possible.
4101
There are 2 options:
4102
A) Make equality propagation code be able to handle BETWEEN
4103
(including cases like t1.key BETWEEN t2.key AND t3.key)
4104
B) Make range optimizer to infer additional "t.key = c" equalities
4105
and use them in equality propagation process (see details in
4108
if ((cond->functype() != Item_func::BETWEEN) ||
4109
((Item_func_between*) cond)->negated ||
4110
!value[0]->eq(value[1], field->binary()))
4115
if (field->result_type() == STRING_RESULT)
4117
if ((*value)->result_type() != STRING_RESULT)
4119
if (field->cmp_type() != (*value)->result_type())
4125
We can't use indexes if the effective collation
4126
of the operation differ from the field collation.
4128
if (field->cmp_type() == STRING_RESULT &&
4129
((Field_str*)field)->charset() != cond->compare_collation())
4136
For the moment eq_func is always true. This slot is reserved for future
4137
extensions where we want to remembers other things than just eq comparisons
4140
/* Store possible eq field */
4141
(*key_fields)->field= field;
4142
(*key_fields)->eq_func= eq_func;
4143
(*key_fields)->val= *value;
4144
(*key_fields)->level= and_level;
4145
(*key_fields)->optimize= exists_optimize;
4147
If the condition has form "tbl.keypart = othertbl.field" and
4148
othertbl.field can be NULL, there will be no matches if othertbl.field
4150
We use null_rejecting in add_not_null_conds() to add
4151
'othertbl.field IS NOT NULL' to tab->select_cond.
4153
(*key_fields)->null_rejecting= ((cond->functype() == Item_func::EQ_FUNC ||
4154
cond->functype() == Item_func::MULT_EQUAL_FUNC) &&
4155
((*value)->type() == Item::FIELD_ITEM) &&
4156
((Item_field*)*value)->field->maybe_null());
4157
(*key_fields)->cond_guard= NULL;
4158
(*key_fields)->sj_pred_no= (cond->name >= subq_sj_cond_name &&
4159
cond->name < subq_sj_cond_name + 64)?
4160
cond->name - subq_sj_cond_name: UINT_MAX;
4165
Add possible keys to array of possible keys originated from a simple
4168
@param key_fields Pointer to add key, if usable
4169
@param and_level And level, to be stored in KEY_FIELD
4170
@param cond Condition predicate
4171
@param field Field used in comparision
4172
@param eq_func True if we used =, <=> or IS NULL
4173
@param value Value used for comparison with field
4174
Is NULL for BETWEEN and IN
4175
@param usable_tables Tables which can be used for key optimization
4176
@param sargables IN/OUT Array of found sargable candidates
4179
If field items f1 and f2 belong to the same multiple equality and
4180
a key is added for f1, the the same key is added for f2.
4183
*key_fields is incremented if we stored a key in the array
4187
add_key_equal_fields(KEY_FIELD **key_fields, uint and_level,
4188
Item_func *cond, Item_field *field_item,
4189
bool eq_func, Item **val,
4190
uint num_values, table_map usable_tables,
4191
SARGABLE_PARAM **sargables)
4193
Field *field= field_item->field;
4194
add_key_field(key_fields, and_level, cond, field,
4195
eq_func, val, num_values, usable_tables, sargables);
4196
Item_equal *item_equal= field_item->item_equal;
4200
Add to the set of possible key values every substitution of
4201
the field for an equal field included into item_equal
4203
Item_equal_iterator it(*item_equal);
4205
while ((item= it++))
4207
if (!field->eq(item->field))
4209
add_key_field(key_fields, and_level, cond, item->field,
4210
eq_func, val, num_values, usable_tables,
4218
add_key_fields(JOIN *join, KEY_FIELD **key_fields, uint *and_level,
4219
COND *cond, table_map usable_tables,
4220
SARGABLE_PARAM **sargables)
4222
if (cond->type() == Item_func::COND_ITEM)
4224
List_iterator_fast<Item> li(*((Item_cond*) cond)->argument_list());
4225
KEY_FIELD *org_key_fields= *key_fields;
4227
if (((Item_cond*) cond)->functype() == Item_func::COND_AND_FUNC)
4231
add_key_fields(join, key_fields, and_level, item, usable_tables,
4233
for (; org_key_fields != *key_fields ; org_key_fields++)
4234
org_key_fields->level= *and_level;
4239
add_key_fields(join, key_fields, and_level, li++, usable_tables,
4244
KEY_FIELD *start_key_fields= *key_fields;
4246
add_key_fields(join, key_fields, and_level, item, usable_tables,
4248
*key_fields=merge_key_fields(org_key_fields,start_key_fields,
4249
*key_fields,++(*and_level));
4256
Subquery optimization: Conditions that are pushed down into subqueries
4257
are wrapped into Item_func_trig_cond. We process the wrapped condition
4258
but need to set cond_guard for KEYUSE elements generated from it.
4261
if (cond->type() == Item::FUNC_ITEM &&
4262
((Item_func*)cond)->functype() == Item_func::TRIG_COND_FUNC)
4264
Item *cond_arg= ((Item_func*)cond)->arguments()[0];
4265
if (!join->group_list && !join->order &&
4267
join->unit->item->substype() == Item_subselect::IN_SUBS &&
4268
!join->unit->is_union())
4270
KEY_FIELD *save= *key_fields;
4271
add_key_fields(join, key_fields, and_level, cond_arg, usable_tables,
4273
// Indicate that this ref access candidate is for subquery lookup:
4274
for (; save != *key_fields; save++)
4275
save->cond_guard= ((Item_func_trig_cond*)cond)->get_trig_var();
4281
/* If item is of type 'field op field/constant' add it to key_fields */
4282
if (cond->type() != Item::FUNC_ITEM)
4284
Item_func *cond_func= (Item_func*) cond;
4285
switch (cond_func->select_optimize()) {
4286
case Item_func::OPTIMIZE_NONE:
4288
case Item_func::OPTIMIZE_KEY:
4292
if (cond_func->key_item()->real_item()->type() == Item::FIELD_ITEM &&
4293
!(cond_func->used_tables() & OUTER_REF_TABLE_BIT))
4295
values= cond_func->arguments()+1;
4296
if (cond_func->functype() == Item_func::NE_FUNC &&
4297
cond_func->arguments()[1]->real_item()->type() == Item::FIELD_ITEM &&
4298
!(cond_func->arguments()[0]->used_tables() & OUTER_REF_TABLE_BIT))
4300
assert(cond_func->functype() != Item_func::IN_FUNC ||
4301
cond_func->argument_count() != 2);
4302
add_key_equal_fields(key_fields, *and_level, cond_func,
4303
(Item_field*) (cond_func->key_item()->real_item()),
4305
cond_func->argument_count()-1,
4306
usable_tables, sargables);
4308
if (cond_func->functype() == Item_func::BETWEEN)
4310
values= cond_func->arguments();
4311
for (uint i= 1 ; i < cond_func->argument_count() ; i++)
4313
Item_field *field_item;
4314
if (cond_func->arguments()[i]->real_item()->type() == Item::FIELD_ITEM
4316
!(cond_func->arguments()[i]->used_tables() & OUTER_REF_TABLE_BIT))
4318
field_item= (Item_field *) (cond_func->arguments()[i]->real_item());
4319
add_key_equal_fields(key_fields, *and_level, cond_func,
4320
field_item, 0, values, 1, usable_tables,
4327
case Item_func::OPTIMIZE_OP:
4329
bool equal_func=(cond_func->functype() == Item_func::EQ_FUNC ||
4330
cond_func->functype() == Item_func::EQUAL_FUNC);
4332
if (cond_func->arguments()[0]->real_item()->type() == Item::FIELD_ITEM &&
4333
!(cond_func->arguments()[0]->used_tables() & OUTER_REF_TABLE_BIT))
4335
add_key_equal_fields(key_fields, *and_level, cond_func,
4336
(Item_field*) (cond_func->arguments()[0])->real_item(),
4338
cond_func->arguments()+1, 1, usable_tables,
4341
if (cond_func->arguments()[1]->real_item()->type() == Item::FIELD_ITEM &&
4342
cond_func->functype() != Item_func::LIKE_FUNC &&
4343
!(cond_func->arguments()[1]->used_tables() & OUTER_REF_TABLE_BIT))
4345
add_key_equal_fields(key_fields, *and_level, cond_func,
4346
(Item_field*) (cond_func->arguments()[1])->real_item(),
4348
cond_func->arguments(),1,usable_tables,
4353
case Item_func::OPTIMIZE_NULL:
4354
/* column_name IS [NOT] NULL */
4355
if (cond_func->arguments()[0]->real_item()->type() == Item::FIELD_ITEM &&
4356
!(cond_func->used_tables() & OUTER_REF_TABLE_BIT))
4358
Item *tmp=new Item_null;
4359
if (unlikely(!tmp)) // Should never be true
4361
add_key_equal_fields(key_fields, *and_level, cond_func,
4362
(Item_field*) (cond_func->arguments()[0])->real_item(),
4363
cond_func->functype() == Item_func::ISNULL_FUNC,
4364
&tmp, 1, usable_tables, sargables);
4367
case Item_func::OPTIMIZE_EQUAL:
4368
Item_equal *item_equal= (Item_equal *) cond;
4369
Item *const_item= item_equal->get_const();
4370
Item_equal_iterator it(*item_equal);
4375
For each field field1 from item_equal consider the equality
4376
field1=const_item as a condition allowing an index access of the table
4377
with field1 by the keys value of field1.
4379
while ((item= it++))
4381
add_key_field(key_fields, *and_level, cond_func, item->field,
4382
true, &const_item, 1, usable_tables, sargables);
4388
Consider all pairs of different fields included into item_equal.
4389
For each of them (field1, field1) consider the equality
4390
field1=field2 as a condition allowing an index access of the table
4391
with field1 by the keys value of field2.
4393
Item_equal_iterator fi(*item_equal);
4394
while ((item= fi++))
4396
Field *field= item->field;
4397
while ((item= it++))
4399
if (!field->eq(item->field))
4401
add_key_field(key_fields, *and_level, cond_func, field,
4402
true, (Item **) &item, 1, usable_tables,
491
4414
Add all keys with uses 'field' for some keypart.
493
4416
If field->and_level != and_level then only mark key_part as const_part.
495
uint32_t max_part_bit(key_part_map bits)
4420
max_part_bit(key_part_map bits)
498
4423
for (found=0; bits & 1 ; found++,bits>>=1) ;
502
static int sort_keyuse(optimizer::KeyUse *a, optimizer::KeyUse *b)
4428
add_key_part(DYNAMIC_ARRAY *keyuse_array,KEY_FIELD *key_field)
4430
Field *field=key_field->field;
4431
Table *form= field->table;
4434
if (key_field->eq_func && !(key_field->optimize & KEY_OPTIMIZE_EXISTS))
4436
for (uint key= 0 ; key < form->sizeKeys() ; key++)
4438
if (!(form->keys_in_use_for_query.is_set(key)))
4441
uint key_parts= (uint) form->key_info[key].key_parts;
4442
for (uint part=0 ; part < key_parts ; part++)
4444
if (field->eq(form->key_info[key].key_part[part].field))
4446
keyuse.table= field->table;
4447
keyuse.val = key_field->val;
4449
keyuse.keypart=part;
4450
keyuse.keypart_map= (key_part_map) 1 << part;
4451
keyuse.used_tables=key_field->val->used_tables();
4452
keyuse.optimize= key_field->optimize & KEY_OPTIMIZE_REF_OR_NULL;
4453
keyuse.null_rejecting= key_field->null_rejecting;
4454
keyuse.cond_guard= key_field->cond_guard;
4455
keyuse.sj_pred_no= key_field->sj_pred_no;
4456
VOID(insert_dynamic(keyuse_array,(uchar*) &keyuse));
4464
sort_keyuse(KEYUSE *a,KEYUSE *b)
505
if (a->getTable()->tablenr != b->getTable()->tablenr)
506
return static_cast<int>((a->getTable()->tablenr - b->getTable()->tablenr));
507
if (a->getKey() != b->getKey())
508
return static_cast<int>((a->getKey() - b->getKey()));
509
if (a->getKeypart() != b->getKeypart())
510
return static_cast<int>((a->getKeypart() - b->getKeypart()));
4467
if (a->table->tablenr != b->table->tablenr)
4468
return (int) (a->table->tablenr - b->table->tablenr);
4469
if (a->key != b->key)
4470
return (int) (a->key - b->key);
4471
if (a->keypart != b->keypart)
4472
return (int) (a->keypart - b->keypart);
511
4473
// Place const values before other ones
512
if ((res= test((a->getUsedTables() & ~OUTER_REF_TABLE_BIT)) -
513
test((b->getUsedTables() & ~OUTER_REF_TABLE_BIT))))
4474
if ((res= test((a->used_tables & ~OUTER_REF_TABLE_BIT)) -
4475
test((b->used_tables & ~OUTER_REF_TABLE_BIT))))
515
4477
/* Place rows that are not 'OPTIMIZE_REF_OR_NULL' first */
516
return static_cast<int>(((a->getOptimizeFlags() & KEY_OPTIMIZE_REF_OR_NULL) -
517
(b->getOptimizeFlags() & KEY_OPTIMIZE_REF_OR_NULL)));
4478
return (int) ((a->optimize & KEY_OPTIMIZE_REF_OR_NULL) -
4479
(b->optimize & KEY_OPTIMIZE_REF_OR_NULL));
4484
Add to KEY_FIELD array all 'ref' access candidates within nested join.
4486
This function populates KEY_FIELD array with entries generated from the
4487
ON condition of the given nested join, and does the same for nested joins
4488
contained within this nested join.
4490
@param[in] nested_join_table Nested join pseudo-table to process
4491
@param[in,out] end End of the key field array
4492
@param[in,out] and_level And-level
4493
@param[in,out] sargables Array of found sargable candidates
4497
We can add accesses to the tables that are direct children of this nested
4498
join (1), and are not inner tables w.r.t their neighbours (2).
4500
Example for #1 (outer brackets pair denotes nested join this function is
4503
... LEFT JOIN (t1 LEFT JOIN (t2 ... ) ) ON cond
4507
... LEFT JOIN (t1 LEFT JOIN t2 ) ON cond
4509
In examples 1-2 for condition cond, we can add 'ref' access candidates to
4513
... LEFT JOIN (t1, t2 LEFT JOIN t3 ON inner_cond) ON cond
4515
Here we can add 'ref' access candidates for t1 and t2, but not for t3.
4518
static void add_key_fields_for_nj(JOIN *join, TableList *nested_join_table,
4519
KEY_FIELD **end, uint *and_level,
4520
SARGABLE_PARAM **sargables)
4522
List_iterator<TableList> li(nested_join_table->nested_join->join_list);
4523
List_iterator<TableList> li2(nested_join_table->nested_join->join_list);
4524
bool have_another = false;
4525
table_map tables= 0;
4527
assert(nested_join_table->nested_join);
4529
while ((table= li++) || (have_another && (li=li2, have_another=false,
4532
if (table->nested_join)
4534
if (!table->on_expr)
4536
/* It's a semi-join nest. Walk into it as if it wasn't a nest */
4539
li= List_iterator<TableList>(table->nested_join->join_list);
4542
add_key_fields_for_nj(join, table, end, and_level, sargables);
4545
if (!table->on_expr)
4546
tables |= table->table->map;
4548
if (nested_join_table->on_expr)
4549
add_key_fields(join, end, and_level, nested_join_table->on_expr, tables,
522
4555
Update keyuse array with all possible keys we can use to fetch rows.
525
@param[out] keyuse Put here ordered array of KeyUse structures
4558
@param[out] keyuse Put here ordered array of KEYUSE structures
526
4559
@param join_tab Array in tablenr_order
527
4560
@param tables Number of tables in join
528
4561
@param cond WHERE condition (note that the function analyzes
777
4814
/* Intersect the keys of all group fields. */
778
4815
cur_item= indexed_fields_it++;
779
possible_keys|= cur_item->field->part_of_key;
4816
possible_keys.merge(cur_item->field->part_of_key);
780
4817
while ((cur_item= indexed_fields_it++))
782
possible_keys&= cur_item->field->part_of_key;
785
if (possible_keys.any())
786
join_tab->const_keys|= possible_keys;
790
Compare two JoinTable objects based on the number of accessed records.
792
@param ptr1 pointer to first JoinTable object
793
@param ptr2 pointer to second JoinTable object
4819
possible_keys.intersect(cur_item->field->part_of_key);
4822
if (!possible_keys.is_clear_all())
4823
join_tab->const_keys.merge(possible_keys);
4827
/*****************************************************************************
4828
Go through all combinations of not marked tables and find the one
4829
which uses least records
4830
*****************************************************************************/
4832
/** Save const tables first as used tables. */
4835
set_position(JOIN *join,uint idx,JOIN_TAB *table,KEYUSE *key)
4837
join->positions[idx].table= table;
4838
join->positions[idx].key=key;
4839
join->positions[idx].records_read=1.0; /* This is a const table */
4840
join->positions[idx].ref_depend_map= 0;
4842
/* Move the const table as down as possible in best_ref */
4843
JOIN_TAB **pos=join->best_ref+idx+1;
4844
JOIN_TAB *next=join->best_ref[idx];
4845
for (;next != table ; pos++)
4847
JOIN_TAB *tmp=pos[0];
4851
join->best_ref[idx]=table;
4856
Given a semi-join nest, find out which of the IN-equalities are bound
4859
get_bound_sj_equalities()
4860
sj_nest Semi-join nest
4861
remaining_tables Tables that are not yet bound
4864
Given a semi-join nest, find out which of the IN-equalities have their
4865
left part expression bound (i.e. the said expression doesn't refer to
4866
any of remaining_tables and can be evaluated).
4869
Bitmap of bound IN-equalities.
4872
uint64_t get_bound_sj_equalities(TableList *sj_nest,
4873
table_map remaining_tables)
4875
List_iterator<Item> li(sj_nest->nested_join->sj_outer_expr_list);
4879
while ((item= li++))
4882
Q: should this take into account equality propagation and how?
4883
A: If e->outer_side is an Item_field, walk over the equality
4884
class and see if there is an element that is bound?
4885
(this is an optional feature)
4887
if (!(item->used_tables() & remaining_tables))
4897
Find the best access path for an extension of a partial execution
4898
plan and add this path to the plan.
4900
The function finds the best access path to table 's' from the passed
4901
partial plan where an access path is the general term for any means to
4902
access the data in 's'. An access path may use either an index or a scan,
4903
whichever is cheaper. The input partial plan is passed via the array
4904
'join->positions' of length 'idx'. The chosen access method for 's' and its
4905
cost are stored in 'join->positions[idx]'.
4907
@param join pointer to the structure providing all context info
4909
@param s the table to be joined by the function
4910
@param thd thread for the connection that submitted the query
4911
@param remaining_tables set of tables not included into the partial plan yet
4912
@param idx the length of the partial plan
4913
@param record_count estimate for the number of records returned by the
4915
@param read_time the cost of the partial plan
4922
best_access_path(JOIN *join,
4925
table_map remaining_tables,
4927
double record_count,
4928
double read_time __attribute__((unused)))
4930
KEYUSE *best_key= 0;
4931
uint best_max_key_part= 0;
4932
bool found_constraint= 0;
4933
double best= DBL_MAX;
4934
double best_time= DBL_MAX;
4935
double records= DBL_MAX;
4936
table_map best_ref_depends_map= 0;
4939
uint best_is_sj_inside_out= 0;
4942
{ /* Use key if possible */
4943
Table *table= s->table;
4944
KEYUSE *keyuse,*start_key=0;
4945
double best_records= DBL_MAX;
4946
uint32_t max_key_part=0;
4947
uint64_t bound_sj_equalities= 0;
4948
bool try_sj_inside_out= false;
4950
Discover the bound equalites. We need to do this, if
4951
1. The next table is an SJ-inner table, and
4952
2. It is the first table from that semijoin, and
4953
3. We're not within a semi-join range (i.e. all semi-joins either have
4954
all or none of their tables in join_table_map), except
4955
s->emb_sj_nest (which we've just entered).
4956
3. All correlation references from this sj-nest are bound
4958
if (s->emb_sj_nest && // (1)
4959
s->emb_sj_nest->sj_in_exprs < 64 &&
4960
((remaining_tables & s->emb_sj_nest->sj_inner_tables) == // (2)
4961
s->emb_sj_nest->sj_inner_tables) && // (2)
4962
join->cur_emb_sj_nests == s->emb_sj_nest->sj_inner_tables && // (3)
4963
!(remaining_tables & s->emb_sj_nest->nested_join->sj_corr_tables)) // (4)
4965
/* This table is an InsideOut scan candidate */
4966
bound_sj_equalities= get_bound_sj_equalities(s->emb_sj_nest,
4968
try_sj_inside_out= true;
4971
/* Test how we can use keys */
4972
rec= s->records/MATCHING_ROWS_IN_OTHER_TABLE; // Assumed records/key
4973
for (keyuse=s->keyuse ; keyuse->table == table ;)
4975
key_part_map found_part= 0;
4976
table_map found_ref= 0;
4977
uint key= keyuse->key;
4978
KEY *keyinfo= table->key_info+key;
4979
/* Bitmap of keyparts where the ref access is over 'keypart=const': */
4980
key_part_map const_part= 0;
4981
/* The or-null keypart in ref-or-null access: */
4982
key_part_map ref_or_null_part= 0;
4984
/* Calculate how many key segments of the current key we can use */
4986
uint64_t handled_sj_equalities=0;
4987
key_part_map sj_insideout_map= 0;
4989
do /* For each keypart */
4991
uint keypart= keyuse->keypart;
4992
table_map best_part_found_ref= 0;
4993
double best_prev_record_reads= DBL_MAX;
4995
do /* For each way to access the keypart */
4999
if 1. expression doesn't refer to forward tables
5000
2. we won't get two ref-or-null's
5002
if (!(remaining_tables & keyuse->used_tables) &&
5003
!(ref_or_null_part && (keyuse->optimize &
5004
KEY_OPTIMIZE_REF_OR_NULL)))
5006
found_part|= keyuse->keypart_map;
5007
if (!(keyuse->used_tables & ~join->const_table_map))
5008
const_part|= keyuse->keypart_map;
5010
double tmp2= prev_record_reads(join, idx, (found_ref |
5011
keyuse->used_tables));
5012
if (tmp2 < best_prev_record_reads)
5014
best_part_found_ref= keyuse->used_tables & ~join->const_table_map;
5015
best_prev_record_reads= tmp2;
5017
if (rec > keyuse->ref_table_rows)
5018
rec= keyuse->ref_table_rows;
5020
If there is one 'key_column IS NULL' expression, we can
5021
use this ref_or_null optimisation of this field
5023
if (keyuse->optimize & KEY_OPTIMIZE_REF_OR_NULL)
5024
ref_or_null_part |= keyuse->keypart_map;
5027
if (try_sj_inside_out && keyuse->sj_pred_no != UINT_MAX)
5029
if (!(remaining_tables & keyuse->used_tables))
5030
bound_sj_equalities |= 1ULL << keyuse->sj_pred_no;
5033
handled_sj_equalities |= 1ULL << keyuse->sj_pred_no;
5034
sj_insideout_map |= ((key_part_map)1) << keyuse->keypart;
5039
} while (keyuse->table == table && keyuse->key == key &&
5040
keyuse->keypart == keypart);
5041
found_ref|= best_part_found_ref;
5042
} while (keyuse->table == table && keyuse->key == key);
5045
Assume that that each key matches a proportional part of table.
5047
if (!found_part && !handled_sj_equalities)
5048
continue; // Nothing usable found
5050
if (rec < MATCHING_ROWS_IN_OTHER_TABLE)
5051
rec= MATCHING_ROWS_IN_OTHER_TABLE; // Fix for small tables
5053
bool sj_inside_out_scan= false;
5055
found_constraint= 1;
5057
Check if InsideOut scan is applicable:
5058
1. All IN-equalities are either "bound" or "handled"
5059
2. Index keyparts are
5062
if (try_sj_inside_out &&
5063
table->covering_keys.is_set(key) &&
5064
(handled_sj_equalities | bound_sj_equalities) == // (1)
5065
PREV_BITS(uint64_t, s->emb_sj_nest->sj_in_exprs)) // (1)
5067
uint n_fixed_parts= max_part_bit(found_part);
5068
if (n_fixed_parts != keyinfo->key_parts &&
5069
(PREV_BITS(uint, n_fixed_parts) | sj_insideout_map) ==
5070
PREV_BITS(uint, keyinfo->key_parts))
5073
Not all parts are fixed. Produce bitmap of remaining bits and
5074
check if all of them are covered.
5076
sj_inside_out_scan= true;
5080
It's a confluent ref scan.
5082
That is, all found KEYUSE elements refer to IN-equalities,
5083
and there is really no ref access because there is no
5084
t.keypart0 = {bound expression}
5086
Calculate the cost of complete loose index scan.
5088
records= (double)s->table->file->stats.records;
5090
/* The cost is entire index scan cost (divided by 2) */
5091
best_time= s->table->file->index_only_read_time(key, records);
5093
/* Now figure how many different keys we will get */
5095
if ((rpc= keyinfo->rec_per_key[keyinfo->key_parts-1]))
5096
records= records / rpc;
5103
Check if we found full key
5105
if (found_part == PREV_BITS(uint,keyinfo->key_parts) &&
5108
max_key_part= UINT32_MAX;
5109
if ((keyinfo->flags & (HA_NOSAME | HA_NULL_PART_KEY)) == HA_NOSAME)
5111
tmp = prev_record_reads(join, idx, found_ref);
5117
{ /* We found a const key */
5119
ReuseRangeEstimateForRef-1:
5120
We get here if we've found a ref(const) (c_i are constants):
5121
"(keypart1=c1) AND ... AND (keypartN=cN)" [ref_const_cond]
5123
If range optimizer was able to construct a "range"
5124
access on this index, then its condition "quick_cond" was
5125
eqivalent to ref_const_cond (*), and we can re-use E(#rows)
5126
from the range optimizer.
5128
Proof of (*): By properties of range and ref optimizers
5129
quick_cond will be equal or tighther than ref_const_cond.
5130
ref_const_cond already covers "smallest" possible interval -
5131
a singlepoint interval over all keyparts. Therefore,
5132
quick_cond is equivalent to ref_const_cond (if it was an
5133
empty interval we wouldn't have got here).
5135
if (table->quick_keys.is_set(key))
5136
records= (double) table->quick_rows[key];
5139
/* quick_range couldn't use key! */
5140
records= (double) s->records/rec;
5145
if (!(records=keyinfo->rec_per_key[keyinfo->key_parts-1]))
5146
{ /* Prefer longer keys */
5148
((double) s->records / (double) rec *
5150
((double) (table->s->max_key_length-keyinfo->key_length) /
5151
(double) table->s->max_key_length)));
5153
records=2.0; /* Can't be as good as a unique */
5156
ReuseRangeEstimateForRef-2: We get here if we could not reuse
5157
E(#rows) from range optimizer. Make another try:
5159
If range optimizer produced E(#rows) for a prefix of the ref
5160
access we're considering, and that E(#rows) is lower then our
5161
current estimate, make an adjustment. The criteria of when we
5162
can make an adjustment is a special case of the criteria used
5163
in ReuseRangeEstimateForRef-3.
5165
if (table->quick_keys.is_set(key) &&
5166
const_part & (1 << table->quick_key_parts[key]) &&
5167
table->quick_n_ranges[key] == 1 &&
5168
records > (double) table->quick_rows[key])
5170
records= (double) table->quick_rows[key];
5173
/* Limit the number of matched rows */
5175
set_if_smaller(tmp, (double) thd->variables.max_seeks_for_key);
5176
if (table->covering_keys.is_set(key))
5178
/* we can use only index tree */
5179
tmp= record_count * table->file->index_only_read_time(key, tmp);
5182
tmp= record_count*min(tmp,s->worst_seeks);
5188
Use as much key-parts as possible and a uniq key is better
5189
than a not unique key
5190
Set tmp to (previous record count) * (records / combination)
5192
if ((found_part & 1) &&
5193
(!(table->file->index_flags(key, 0, 0) & HA_ONLY_WHOLE_INDEX) ||
5194
found_part == PREV_BITS(uint,keyinfo->key_parts)))
5196
max_key_part= max_part_bit(found_part);
5198
ReuseRangeEstimateForRef-3:
5199
We're now considering a ref[or_null] access via
5200
(t.keypart1=e1 AND ... AND t.keypartK=eK) [ OR
5201
(same-as-above but with one cond replaced
5202
with "t.keypart_i IS NULL")] (**)
5204
Try re-using E(#rows) from "range" optimizer:
5205
We can do so if "range" optimizer used the same intervals as
5206
in (**). The intervals used by range optimizer may be not
5207
available at this point (as "range" access might have choosen to
5208
create quick select over another index), so we can't compare
5209
them to (**). We'll make indirect judgements instead.
5210
The sufficient conditions for re-use are:
5211
(C1) All e_i in (**) are constants, i.e. found_ref==false. (if
5212
this is not satisfied we have no way to know which ranges
5213
will be actually scanned by 'ref' until we execute the
5215
(C2) max #key parts in 'range' access == K == max_key_part (this
5216
is apparently a necessary requirement)
5218
We also have a property that "range optimizer produces equal or
5219
tighter set of scan intervals than ref(const) optimizer". Each
5220
of the intervals in (**) are "tightest possible" intervals when
5221
one limits itself to using keyparts 1..K (which we do in #2).
5222
From here it follows that range access used either one, or
5223
both of the (I1) and (I2) intervals:
5225
(t.keypart1=c1 AND ... AND t.keypartK=eK) (I1)
5226
(same-as-above but with one cond replaced
5227
with "t.keypart_i IS NULL") (I2)
5229
The remaining part is to exclude the situation where range
5230
optimizer used one interval while we're considering
5231
ref-or-null and looking for estimate for two intervals. This
5232
is done by last limitation:
5234
(C3) "range optimizer used (have ref_or_null?2:1) intervals"
5236
if (table->quick_keys.is_set(key) && !found_ref && //(C1)
5237
table->quick_key_parts[key] == max_key_part && //(C2)
5238
table->quick_n_ranges[key] == 1+test(ref_or_null_part)) //(C3)
5240
tmp= records= (double) table->quick_rows[key];
5244
/* Check if we have statistic about the distribution */
5245
if ((records= keyinfo->rec_per_key[max_key_part-1]))
5248
Fix for the case where the index statistics is too
5250
(1) We're considering ref(const) and there is quick select
5252
(2) and that quick select uses more keyparts (i.e. it will
5253
scan equal/smaller interval then this ref(const))
5254
(3) and E(#rows) for quick select is higher then our
5257
We'll use E(#rows) from quick select.
5259
Q: Why do we choose to use 'ref'? Won't quick select be
5260
cheaper in some cases ?
5261
TODO: figure this out and adjust the plan choice if needed.
5263
if (!found_ref && table->quick_keys.is_set(key) && // (1)
5264
table->quick_key_parts[key] > max_key_part && // (2)
5265
records < (double)table->quick_rows[key]) // (3)
5266
records= (double)table->quick_rows[key];
5273
Assume that the first key part matches 1% of the file
5274
and that the whole key matches 10 (duplicates) or 1
5276
Assume also that more key matches proportionally more
5278
This gives the formula:
5279
records = (x * (b-a) + a*c-b)/(c-1)
5281
b = records matched by whole key
5282
a = records matched by first key part (1% of all records?)
5283
c = number of key parts in key
5284
x = used key parts (1 <= x <= c)
5287
if (!(rec_per_key=(double)
5288
keyinfo->rec_per_key[keyinfo->key_parts-1]))
5289
rec_per_key=(double) s->records/rec+1;
5293
else if (rec_per_key/(double) s->records >= 0.01)
5297
double a=s->records*0.01;
5298
if (keyinfo->key_parts > 1)
5299
tmp= (max_key_part * (rec_per_key - a) +
5300
a*keyinfo->key_parts - rec_per_key)/
5301
(keyinfo->key_parts-1);
5304
set_if_bigger(tmp,1.0);
5306
records = (ulong) tmp;
5309
if (ref_or_null_part)
5311
/* We need to do two key searches to find key */
5317
ReuseRangeEstimateForRef-4: We get here if we could not reuse
5318
E(#rows) from range optimizer. Make another try:
5320
If range optimizer produced E(#rows) for a prefix of the ref
5321
access we're considering, and that E(#rows) is lower then our
5322
current estimate, make the adjustment.
5324
The decision whether we can re-use the estimate from the range
5325
optimizer is the same as in ReuseRangeEstimateForRef-3,
5326
applied to first table->quick_key_parts[key] key parts.
5328
if (table->quick_keys.is_set(key) &&
5329
table->quick_key_parts[key] <= max_key_part &&
5330
const_part & (1 << table->quick_key_parts[key]) &&
5331
table->quick_n_ranges[key] == 1 + test(ref_or_null_part &
5333
records > (double) table->quick_rows[key])
5335
tmp= records= (double) table->quick_rows[key];
5339
/* Limit the number of matched rows */
5340
set_if_smaller(tmp, (double) thd->variables.max_seeks_for_key);
5341
if (table->covering_keys.is_set(key))
5343
/* we can use only index tree */
5344
tmp= record_count * table->file->index_only_read_time(key, tmp);
5347
tmp= record_count * min(tmp,s->worst_seeks);
5350
tmp= best_time; // Do nothing
5353
if (sj_inside_out_scan && !start_key)
5361
if (tmp < best_time - records/(double) TIME_FOR_COMPARE)
5363
best_time= tmp + records/(double) TIME_FOR_COMPARE;
5365
best_records= records;
5366
best_key= start_key;
5367
best_max_key_part= max_key_part;
5368
best_ref_depends_map= found_ref;
5369
best_is_sj_inside_out= sj_inside_out_scan;
5372
records= best_records;
5376
Don't test table scan if it can't be better.
5377
Prefer key lookup if we would use the same key for scanning.
5379
Don't do a table scan on InnoDB tables, if we can read the used
5380
parts of the row from any of the used index.
5381
This is because table scans uses index and we would not win
5382
anything by using a table scan.
5384
A word for word translation of the below if-statement in sergefp's
5385
understanding: we check if we should use table scan if:
5386
(1) The found 'ref' access produces more records than a table scan
5387
(or index scan, or quick select), or 'ref' is more expensive than
5389
(2) This doesn't hold: the best way to perform table scan is to to perform
5390
'range' access using index IDX, and the best way to perform 'ref'
5391
access is to use the same index IDX, with the same or more key parts.
5392
(note: it is not clear how this rule is/should be extended to
5393
index_merge quick selects)
5394
(3) See above note about InnoDB.
5395
(4) NOT ("FORCE INDEX(...)" is used for table and there is 'ref' access
5396
path, but there is no quick select)
5397
If the condition in the above brackets holds, then the only possible
5398
"table scan" access method is ALL/index (there is no quick select).
5399
Since we have a 'ref' access path, and FORCE INDEX instructs us to
5400
choose it over ALL/index, there is no need to consider a full table
5403
if ((records >= s->found_records || best > s->read_time) && // (1)
5404
!(s->quick && best_key && s->quick->index == best_key->key && // (2)
5405
best_max_key_part >= s->table->quick_key_parts[best_key->key]) &&// (2)
5406
!((s->table->file->ha_table_flags() & HA_TABLE_SCAN_ON_INDEX) && // (3)
5407
! s->table->covering_keys.is_clear_all() && best_key && !s->quick) &&// (3)
5408
!(s->table->force_index && best_key && !s->quick)) // (4)
5409
{ // Check full join
5410
ha_rows rnd_records= s->found_records;
5412
If there is a filtering condition on the table (i.e. ref analyzer found
5413
at least one "table.keyXpartY= exprZ", where exprZ refers only to tables
5414
preceding this table in the join order we're now considering), then
5415
assume that 25% of the rows will be filtered out by this condition.
5417
This heuristic is supposed to force tables used in exprZ to be before
5418
this table in join order.
5420
if (found_constraint)
5421
rnd_records-= rnd_records/4;
5424
If applicable, get a more accurate estimate. Don't use the two
5427
if (s->table->quick_condition_rows != s->found_records)
5428
rnd_records= s->table->quick_condition_rows;
5431
Range optimizer never proposes a RANGE if it isn't better
5432
than FULL: so if RANGE is present, it's always preferred to FULL.
5433
Here we estimate its cost.
5439
- read record range through 'quick'
5440
- skip rows which does not satisfy WHERE constraints
5442
We take into account possible use of join cache for ALL/index
5443
access (see first else-branch below), but we don't take it into
5444
account here for range/index_merge access. Find out why this is so.
5447
(s->quick->read_time +
5448
(s->found_records - rnd_records)/(double) TIME_FOR_COMPARE);
5452
/* Estimate cost of reading table. */
5453
tmp= s->table->file->scan_time();
5454
if (s->table->map & join->outer_join) // Can't use join cache
5457
For each record we have to:
5458
- read the whole table record
5459
- skip rows which does not satisfy join condition
5463
(s->records - rnd_records)/(double) TIME_FOR_COMPARE);
5467
/* We read the table as many times as join buffer becomes full. */
5468
tmp*= (1.0 + floor((double) cache_record_length(join,idx) *
5470
(double) thd->variables.join_buff_size));
5472
We don't make full cartesian product between rows in the scanned
5473
table and existing records because we skip all rows from the
5474
scanned table, which does not satisfy join condition when
5475
we read the table (see flush_cached_records for details). Here we
5476
take into account cost to read and skip these records.
5478
tmp+= (s->records - rnd_records)/(double) TIME_FOR_COMPARE;
5483
We estimate the cost of evaluating WHERE clause for found records
5484
as record_count * rnd_records / TIME_FOR_COMPARE. This cost plus
5485
tmp give us total cost of using Table SCAN
5487
if (best == DBL_MAX ||
5488
(tmp + record_count/(double) TIME_FOR_COMPARE*rnd_records <
5489
best + record_count/(double) TIME_FOR_COMPARE*records))
5492
If the table has a range (s->quick is set) make_join_select()
5493
will ensure that this will be used
5496
records= rows2double(rnd_records);
5498
/* range/index_merge/ALL/index access method are "independent", so: */
5499
best_ref_depends_map= 0;
5500
best_is_sj_inside_out= false;
5504
/* Update the cost information for the current partial plan */
5505
join->positions[idx].records_read= records;
5506
join->positions[idx].read_time= best;
5507
join->positions[idx].key= best_key;
5508
join->positions[idx].table= s;
5509
join->positions[idx].ref_depend_map= best_ref_depends_map;
5510
join->positions[idx].use_insideout_scan= best_is_sj_inside_out;
5513
idx == join->const_tables &&
5514
s->table == join->sort_by_table &&
5515
join->unit->select_limit_cnt >= records)
5516
join->sort_by_table= (Table*) 1; // Must use temporary table
5523
Selects and invokes a search strategy for an optimal query plan.
5525
The function checks user-configurable parameters that control the search
5526
strategy for an optimal plan, selects the search method and then invokes
5527
it. Each specific optimization procedure stores the final optimal plan in
5528
the array 'join->best_positions', and the cost of the plan in
5531
@param join pointer to the structure providing all context info for
5533
@param join_tables set of the tables in the query
5536
'MAX_TABLES+2' denotes the old implementation of find_best before
5537
the greedy version. Will be removed when greedy_search is approved.
5546
choose_plan(JOIN *join, table_map join_tables)
5548
uint search_depth= join->thd->variables.optimizer_search_depth;
5549
uint prune_level= join->thd->variables.optimizer_prune_level;
5550
bool straight_join= test(join->select_options & SELECT_STRAIGHT_JOIN);
5552
join->cur_embedding_map= 0;
5553
reset_nj_counters(join->join_list);
5555
if (SELECT_STRAIGHT_JOIN option is set)
5556
reorder tables so dependent tables come after tables they depend
5557
on, otherwise keep tables in the order they were specified in the query
5559
Apply heuristic: pre-sort all access plans with respect to the number of
5562
my_qsort(join->best_ref + join->const_tables,
5563
join->tables - join->const_tables, sizeof(JOIN_TAB*),
5564
straight_join ? join_tab_cmp_straight : join_tab_cmp);
5565
join->cur_emb_sj_nests= 0;
5568
optimize_straight_join(join, join_tables);
5572
if (search_depth == MAX_TABLES+2)
5574
TODO: 'MAX_TABLES+2' denotes the old implementation of find_best before
5575
the greedy version. Will be removed when greedy_search is approved.
5577
join->best_read= DBL_MAX;
5578
if (find_best(join, join_tables, join->const_tables, 1.0, 0.0))
5583
if (search_depth == 0)
5584
/* Automatically determine a reasonable value for 'search_depth' */
5585
search_depth= determine_search_depth(join);
5586
if (greedy_search(join, join_tables, search_depth, prune_level))
5592
Store the cost of this query into a user variable
5593
Don't update last_query_cost for statements that are not "flat joins" :
5594
i.e. they have subqueries, unions or call stored procedures.
5595
TODO: calculate a correct cost for a query with subqueries and UNIONs.
5597
if (join->thd->lex->is_single_level_stmt())
5598
join->thd->status_var.last_query_cost= join->best_read;
5604
Compare two JOIN_TAB objects based on the number of accessed records.
5606
@param ptr1 pointer to first JOIN_TAB object
5607
@param ptr2 pointer to second JOIN_TAB object
796
5610
The order relation implemented by join_tab_cmp() is not transitive,
5664
Heuristic procedure to automatically guess a reasonable degree of
5665
exhaustiveness for the greedy search procedure.
5667
The procedure estimates the optimization time and selects a search depth
5668
big enough to result in a near-optimal QEP, that doesn't take too long to
5669
find. If the number of tables in the query exceeds some constant, then
5670
search_depth is set to this constant.
5672
@param join pointer to the structure providing all context info for
5676
This is an extremely simplistic implementation that serves as a stub for a
5677
more advanced analysis of the join. Ideally the search depth should be
5678
determined by learning from previous query optimizations, because it will
5679
depend on the CPU power (and other factors).
5682
this value should be determined dynamically, based on statistics:
5683
uint max_tables_for_exhaustive_opt= 7;
5686
this value could be determined by some mapping of the form:
5687
depth : table_count -> [max_tables_for_exhaustive_opt..MAX_EXHAUSTIVE]
5690
A positive integer that specifies the search depth (and thus the
5691
exhaustiveness) of the depth-first search algorithm used by
5696
determine_search_depth(JOIN *join)
5698
uint table_count= join->tables - join->const_tables;
5700
/* TODO: this value should be determined dynamically, based on statistics: */
5701
uint max_tables_for_exhaustive_opt= 7;
5703
if (table_count <= max_tables_for_exhaustive_opt)
5704
search_depth= table_count+1; // use exhaustive for small number of tables
5707
TODO: this value could be determined by some mapping of the form:
5708
depth : table_count -> [max_tables_for_exhaustive_opt..MAX_EXHAUSTIVE]
5710
search_depth= max_tables_for_exhaustive_opt; // use greedy search
5712
return search_depth;
5717
Select the best ways to access the tables in a query without reordering them.
5719
Find the best access paths for each query table and compute their costs
5720
according to their order in the array 'join->best_ref' (thus without
5721
reordering the join tables). The function calls sequentially
5722
'best_access_path' for each table in the query to select the best table
5723
access method. The final optimal plan is stored in the array
5724
'join->best_positions', and the corresponding cost in 'join->best_read'.
5726
@param join pointer to the structure providing all context info for
5728
@param join_tables set of the tables in the query
5731
This function can be applied to:
5732
- queries with STRAIGHT_JOIN
5733
- internally to compute the cost of an arbitrary QEP
5735
Thus 'optimize_straight_join' can be used at any stage of the query
5736
optimization process to finalize a QEP as it is.
5740
optimize_straight_join(JOIN *join, table_map join_tables)
5743
uint idx= join->const_tables;
5744
double record_count= 1.0;
5745
double read_time= 0.0;
5747
for (JOIN_TAB **pos= join->best_ref + idx ; (s= *pos) ; pos++)
5749
/* Find the best access method from 's' to the current partial plan */
5750
advance_sj_state(join_tables, s);
5751
best_access_path(join, s, join->thd, join_tables, idx,
5752
record_count, read_time);
5753
/* compute the cost of the new plan extended with 's' */
5754
record_count*= join->positions[idx].records_read;
5755
read_time+= join->positions[idx].read_time;
5756
join_tables&= ~(s->table->map);
5760
read_time+= record_count / (double) TIME_FOR_COMPARE;
5761
if (join->sort_by_table &&
5762
join->sort_by_table != join->positions[join->const_tables].table->table)
5763
read_time+= record_count; // We have to make a temp table
5764
memcpy(join->best_positions, join->positions, sizeof(POSITION)*idx);
5765
join->best_read= read_time;
5770
Find a good, possibly optimal, query execution plan (QEP) by a greedy search.
5772
The search procedure uses a hybrid greedy/exhaustive search with controlled
5773
exhaustiveness. The search is performed in N = card(remaining_tables)
5774
steps. Each step evaluates how promising is each of the unoptimized tables,
5775
selects the most promising table, and extends the current partial QEP with
5776
that table. Currenly the most 'promising' table is the one with least
5777
expensive extension.\
5779
There are two extreme cases:
5780
-# When (card(remaining_tables) < search_depth), the estimate finds the
5781
best complete continuation of the partial QEP. This continuation can be
5782
used directly as a result of the search.
5783
-# When (search_depth == 1) the 'best_extension_by_limited_search'
5784
consideres the extension of the current QEP with each of the remaining
5787
All other cases are in-between these two extremes. Thus the parameter
5788
'search_depth' controlls the exhaustiveness of the search. The higher the
5789
value, the longer the optimizaton time and possibly the better the
5790
resulting plan. The lower the value, the fewer alternative plans are
5791
estimated, but the more likely to get a bad QEP.
5793
All intermediate and final results of the procedure are stored in 'join':
5794
- join->positions : modified for every partial QEP that is explored
5795
- join->best_positions: modified for the current best complete QEP
5796
- join->best_read : modified for the current best complete QEP
5797
- join->best_ref : might be partially reordered
5799
The final optimal plan is stored in 'join->best_positions', and its
5800
corresponding cost in 'join->best_read'.
5803
The following pseudocode describes the algorithm of 'greedy_search':
5806
procedure greedy_search
5807
input: remaining_tables
5812
(t, a) = best_extension(pplan, remaining_tables);
5813
pplan = concat(pplan, (t, a));
5814
remaining_tables = remaining_tables - t;
5815
} while (remaining_tables != {})
5820
where 'best_extension' is a placeholder for a procedure that selects the
5821
most "promising" of all tables in 'remaining_tables'.
5822
Currently this estimate is performed by calling
5823
'best_extension_by_limited_search' to evaluate all extensions of the
5824
current QEP of size 'search_depth', thus the complexity of 'greedy_search'
5825
mainly depends on that of 'best_extension_by_limited_search'.
5828
If 'best_extension()' == 'best_extension_by_limited_search()', then the
5829
worst-case complexity of this algorithm is <=
5830
O(N*N^search_depth/search_depth). When serch_depth >= N, then the
5831
complexity of greedy_search is O(N!).
5834
In the future, 'greedy_search' might be extended to support other
5835
implementations of 'best_extension', e.g. some simpler quadratic procedure.
5837
@param join pointer to the structure providing all context info
5839
@param remaining_tables set of tables not included into the partial plan yet
5840
@param search_depth controlls the exhaustiveness of the search
5841
@param prune_level the pruning heuristics that should be applied during
5851
greedy_search(JOIN *join,
5852
table_map remaining_tables,
5856
double record_count= 1.0;
5857
double read_time= 0.0;
5858
uint idx= join->const_tables; // index into 'join->best_ref'
5860
uint size_remain; // cardinality of remaining_tables
5862
JOIN_TAB *best_table; // the next plan node to be added to the curr QEP
5864
/* number of tables that remain to be optimized */
5865
size_remain= my_count_bits(remaining_tables);
5868
/* Find the extension of the current QEP with the lowest cost */
5869
join->best_read= DBL_MAX;
5870
if (best_extension_by_limited_search(join, remaining_tables, idx, record_count,
5871
read_time, search_depth, prune_level))
5874
if (size_remain <= search_depth)
5877
'join->best_positions' contains a complete optimal extension of the
5878
current partial QEP.
5883
/* select the first table in the optimal extension as most promising */
5884
best_pos= join->best_positions[idx];
5885
best_table= best_pos.table;
5887
Each subsequent loop of 'best_extension_by_limited_search' uses
5888
'join->positions' for cost estimates, therefore we have to update its
5891
join->positions[idx]= best_pos;
5893
/* find the position of 'best_table' in 'join->best_ref' */
5895
JOIN_TAB *pos= join->best_ref[best_idx];
5896
while (pos && best_table != pos)
5897
pos= join->best_ref[++best_idx];
5898
assert((pos != NULL)); // should always find 'best_table'
5899
/* move 'best_table' at the first free position in the array of joins */
5900
swap_variables(JOIN_TAB*, join->best_ref[idx], join->best_ref[best_idx]);
5902
/* compute the cost of the new plan extended with 'best_table' */
5903
record_count*= join->positions[idx].records_read;
5904
read_time+= join->positions[idx].read_time;
5906
remaining_tables&= ~(best_table->table->map);
5914
Find a good, possibly optimal, query execution plan (QEP) by a possibly
5917
The procedure searches for the optimal ordering of the query tables in set
5918
'remaining_tables' of size N, and the corresponding optimal access paths to
5919
each table. The choice of a table order and an access path for each table
5920
constitutes a query execution plan (QEP) that fully specifies how to
5923
The maximal size of the found plan is controlled by the parameter
5924
'search_depth'. When search_depth == N, the resulting plan is complete and
5925
can be used directly as a QEP. If search_depth < N, the found plan consists
5926
of only some of the query tables. Such "partial" optimal plans are useful
5927
only as input to query optimization procedures, and cannot be used directly
5930
The algorithm begins with an empty partial plan stored in 'join->positions'
5931
and a set of N tables - 'remaining_tables'. Each step of the algorithm
5932
evaluates the cost of the partial plan extended by all access plans for
5933
each of the relations in 'remaining_tables', expands the current partial
5934
plan with the access plan that results in lowest cost of the expanded
5935
partial plan, and removes the corresponding relation from
5936
'remaining_tables'. The algorithm continues until it either constructs a
5937
complete optimal plan, or constructs an optimal plartial plan with size =
5940
The final optimal plan is stored in 'join->best_positions'. The
5941
corresponding cost of the optimal plan is in 'join->best_read'.
5944
The procedure uses a recursive depth-first search where the depth of the
5945
recursion (and thus the exhaustiveness of the search) is controlled by the
5946
parameter 'search_depth'.
5949
The pseudocode below describes the algorithm of
5950
'best_extension_by_limited_search'. The worst-case complexity of this
5951
algorithm is O(N*N^search_depth/search_depth). When serch_depth >= N, then
5952
the complexity of greedy_search is O(N!).
5955
procedure best_extension_by_limited_search(
5956
pplan in, // in, partial plan of tables-joined-so-far
5957
pplan_cost, // in, cost of pplan
5958
remaining_tables, // in, set of tables not referenced in pplan
5959
best_plan_so_far, // in/out, best plan found so far
5960
best_plan_so_far_cost,// in/out, cost of best_plan_so_far
5961
search_depth) // in, maximum size of the plans being considered
5963
for each table T from remaining_tables
5965
// Calculate the cost of using table T as above
5966
cost = complex-series-of-calculations;
5968
// Add the cost to the cost so far.
5971
if (pplan_cost >= best_plan_so_far_cost)
5972
// pplan_cost already too great, stop search
5975
pplan= expand pplan by best_access_method;
5976
remaining_tables= remaining_tables - table T;
5977
if (remaining_tables is not an empty set
5981
best_extension_by_limited_search(pplan, pplan_cost,
5984
best_plan_so_far_cost,
5989
best_plan_so_far_cost= pplan_cost;
5990
best_plan_so_far= pplan;
5997
When 'best_extension_by_limited_search' is called for the first time,
5998
'join->best_read' must be set to the largest possible value (e.g. DBL_MAX).
5999
The actual implementation provides a way to optionally use pruning
6000
heuristic (controlled by the parameter 'prune_level') to reduce the search
6001
space by skipping some partial plans.
6004
The parameter 'search_depth' provides control over the recursion
6005
depth, and thus the size of the resulting optimal plan.
6007
@param join pointer to the structure providing all context info
6009
@param remaining_tables set of tables not included into the partial plan yet
6010
@param idx length of the partial QEP in 'join->positions';
6011
since a depth-first search is used, also corresponds
6012
to the current depth of the search tree;
6013
also an index in the array 'join->best_ref';
6014
@param record_count estimate for the number of records returned by the
6016
@param read_time the cost of the best partial plan
6017
@param search_depth maximum depth of the recursion and thus size of the
6019
(0 < search_depth <= join->tables+1).
6020
@param prune_level pruning heuristics that should be applied during
6022
(values: 0 = EXHAUSTIVE, 1 = PRUNE_BY_TIME_OR_ROWS)
6031
best_extension_by_limited_search(JOIN *join,
6032
table_map remaining_tables,
6034
double record_count,
6039
THD *thd= join->thd;
6040
if (thd->killed) // Abort
6044
'join' is a partial plan with lower cost than the best plan so far,
6045
so continue expanding it further with the tables in 'remaining_tables'.
6048
double best_record_count= DBL_MAX;
6049
double best_read_time= DBL_MAX;
6051
for (JOIN_TAB **pos= join->best_ref + idx ; (s= *pos) ; pos++)
6053
table_map real_table_bit= s->table->map;
6054
if ((remaining_tables & real_table_bit) &&
6055
!(remaining_tables & s->dependent) &&
6056
(!idx || !check_interleaving_with_nj(join->positions[idx-1].table, s)))
6058
double current_record_count, current_read_time;
6059
advance_sj_state(remaining_tables, s);
6062
psergey-insideout-todo:
6063
when best_access_path() detects it could do an InsideOut scan or
6064
some other scan, have it return an insideout scan and a flag that
6065
requests to "fork" this loop iteration. (Q: how does that behave
6066
when the depth is insufficient??)
6068
/* Find the best access method from 's' to the current partial plan */
6069
best_access_path(join, s, thd, remaining_tables, idx,
6070
record_count, read_time);
6071
/* Compute the cost of extending the plan with 's' */
6072
current_record_count= record_count * join->positions[idx].records_read;
6073
current_read_time= read_time + join->positions[idx].read_time;
6075
/* Expand only partial plans with lower cost than the best QEP so far */
6076
if ((current_read_time +
6077
current_record_count / (double) TIME_FOR_COMPARE) >= join->best_read)
6079
restore_prev_nj_state(s);
6080
restore_prev_sj_state(remaining_tables, s);
6085
Prune some less promising partial plans. This heuristic may miss
6086
the optimal QEPs, thus it results in a non-exhaustive search.
6088
if (prune_level == 1)
6090
if (best_record_count > current_record_count ||
6091
best_read_time > current_read_time ||
6092
(idx == join->const_tables && s->table == join->sort_by_table)) // 's' is the first table in the QEP
6094
if (best_record_count >= current_record_count &&
6095
best_read_time >= current_read_time &&
6096
/* TODO: What is the reasoning behind this condition? */
6097
(!(s->key_dependent & remaining_tables) ||
6098
join->positions[idx].records_read < 2.0))
6100
best_record_count= current_record_count;
6101
best_read_time= current_read_time;
6106
restore_prev_nj_state(s);
6107
restore_prev_sj_state(remaining_tables, s);
6112
if ( (search_depth > 1) && (remaining_tables & ~real_table_bit) )
6113
{ /* Recursively expand the current partial plan */
6114
swap_variables(JOIN_TAB*, join->best_ref[idx], *pos);
6115
if (best_extension_by_limited_search(join,
6116
remaining_tables & ~real_table_bit,
6118
current_record_count,
6123
swap_variables(JOIN_TAB*, join->best_ref[idx], *pos);
6127
'join' is either the best partial QEP with 'search_depth' relations,
6128
or the best complete QEP so far, whichever is smaller.
6130
current_read_time+= current_record_count / (double) TIME_FOR_COMPARE;
6131
if (join->sort_by_table &&
6132
join->sort_by_table !=
6133
join->positions[join->const_tables].table->table)
6134
/* We have to make a temp table */
6135
current_read_time+= current_record_count;
6136
if ((search_depth == 1) || (current_read_time < join->best_read))
6138
memcpy(join->best_positions, join->positions,
6139
sizeof(POSITION) * (idx + 1));
6140
join->best_read= current_read_time - 0.001;
6143
restore_prev_nj_state(s);
6144
restore_prev_sj_state(remaining_tables, s);
6153
- TODO: this function is here only temporarily until 'greedy_search' is
6154
tested and accepted.
6161
find_best(JOIN *join,table_map rest_tables,uint idx,double record_count,
6164
THD *thd= join->thd;
6169
read_time+=record_count/(double) TIME_FOR_COMPARE;
6170
if (join->sort_by_table &&
6171
join->sort_by_table !=
6172
join->positions[join->const_tables].table->table)
6173
read_time+=record_count; // We have to make a temp table
6174
if (read_time < join->best_read)
6176
memcpy(join->best_positions, join->positions, sizeof(POSITION)*idx);
6177
join->best_read= read_time - 0.001;
6181
if (read_time+record_count/(double) TIME_FOR_COMPARE >= join->best_read)
6182
return(false); /* Found better before */
6185
double best_record_count=DBL_MAX,best_read_time=DBL_MAX;
6186
for (JOIN_TAB **pos=join->best_ref+idx ; (s=*pos) ; pos++)
6188
table_map real_table_bit=s->table->map;
6189
if ((rest_tables & real_table_bit) && !(rest_tables & s->dependent) &&
6190
(!idx|| !check_interleaving_with_nj(join->positions[idx-1].table, s)))
6192
double records, best;
6193
advance_sj_state(rest_tables, s);
6194
best_access_path(join, s, thd, rest_tables, idx, record_count,
6196
records= join->positions[idx].records_read;
6197
best= join->positions[idx].read_time;
6199
Go to the next level only if there hasn't been a better key on
6200
this level! This will cut down the search for a lot simple cases!
6202
double current_record_count=record_count*records;
6203
double current_read_time=read_time+best;
6204
if (best_record_count > current_record_count ||
6205
best_read_time > current_read_time ||
6206
(idx == join->const_tables && s->table == join->sort_by_table))
6208
if (best_record_count >= current_record_count &&
6209
best_read_time >= current_read_time &&
6210
(!(s->key_dependent & rest_tables) || records < 2.0))
6212
best_record_count=current_record_count;
6213
best_read_time=current_read_time;
6215
swap_variables(JOIN_TAB*, join->best_ref[idx], *pos);
6216
if (find_best(join,rest_tables & ~real_table_bit,idx+1,
6217
current_record_count,current_read_time))
6219
swap_variables(JOIN_TAB*, join->best_ref[idx], *pos);
6221
restore_prev_nj_state(s);
6222
restore_prev_sj_state(rest_tables, s);
6223
if (join->select_options & SELECT_STRAIGHT_JOIN)
6224
break; // Don't test all combinations
845
6232
Find how much space the prevous read not const tables takes in cache.
847
void calc_used_field_length(Session *, JoinTable *join_tab)
6235
static void calc_used_field_length(THD *thd __attribute__((unused)),
849
uint32_t null_fields,blobs,fields,rec_length;
6238
uint null_fields,blobs,fields,rec_length;
850
6239
Field **f_ptr,*field;
6240
MY_BITMAP *read_set= join_tab->table->read_set;;
852
6242
null_fields= blobs= fields= rec_length=0;
853
for (f_ptr=join_tab->table->getFields() ; (field= *f_ptr) ; f_ptr++)
6243
for (f_ptr=join_tab->table->field ; (field= *f_ptr) ; f_ptr++)
855
if (field->isReadSet())
6245
if (bitmap_is_set(read_set, field->field_index))
857
uint32_t flags=field->flags;
6247
uint flags=field->flags;
859
6249
rec_length+=field->pack_length();
860
6250
if (flags & BLOB_FLAG)
862
6252
if (!(flags & NOT_NULL_FLAG))
866
6256
if (null_fields)
6836
Fill in outer join related info for the execution plan structure.
6838
For each outer join operation left after simplification of the
6839
original query the function set up the following pointers in the linear
6840
structure join->join_tab representing the selected execution plan.
6841
The first inner table t0 for the operation is set to refer to the last
6842
inner table tk through the field t0->last_inner.
6843
Any inner table ti for the operation are set to refer to the first
6844
inner table ti->first_inner.
6845
The first inner table t0 for the operation is set to refer to the
6846
first inner table of the embedding outer join operation, if there is any,
6847
through the field t0->first_upper.
6848
The on expression for the outer join operation is attached to the
6849
corresponding first inner table through the field t0->on_expr_ref.
6850
Here ti are structures of the JOIN_TAB type.
6852
EXAMPLE. For the query:
6856
(t2, t3 LEFT JOIN t4 ON t3.a=t4.a)
6857
ON (t1.a=t2.a AND t1.b=t3.b)
6861
given the execution plan with the table order t1,t2,t3,t4
6862
is selected, the following references will be set;
6863
t4->last_inner=[t4], t4->first_inner=[t4], t4->first_upper=[t2]
6864
t2->last_inner=[t4], t2->first_inner=t3->first_inner=[t2],
6865
on expression (t1.a=t2.a AND t1.b=t3.b) will be attached to
6866
*t2->on_expr_ref, while t3.a=t4.a will be attached to *t4->on_expr_ref.
6868
@param join reference to the info fully describing the query
6871
The function assumes that the simplification procedure has been
6872
already applied to the join query (see simplify_joins).
6873
This function can be called only after the execution plan
6878
make_outerjoin_info(JOIN *join)
6880
for (uint i=join->const_tables ; i < join->tables ; i++)
6882
JOIN_TAB *tab=join->join_tab+i;
6883
Table *table=tab->table;
6884
TableList *tbl= table->pos_in_table_list;
6885
TableList *embedding= tbl->embedding;
6887
if (tbl->outer_join)
6890
Table tab is the only one inner table for outer join.
6891
(Like table t4 for the table reference t3 LEFT JOIN t4 ON t3.a=t4.a
6892
is in the query above.)
6894
tab->last_inner= tab->first_inner= tab;
6895
tab->on_expr_ref= &tbl->on_expr;
6896
tab->cond_equal= tbl->cond_equal;
6898
tab->first_upper= embedding->nested_join->first_nested;
6900
for ( ; embedding ; embedding= embedding->embedding)
6902
/* Ignore sj-nests: */
6903
if (!embedding->on_expr)
6905
nested_join_st *nested_join= embedding->nested_join;
6906
if (!nested_join->counter_)
6909
Table tab is the first inner table for nested_join.
6910
Save reference to it in the nested join structure.
6912
nested_join->first_nested= tab;
6913
tab->on_expr_ref= &embedding->on_expr;
6914
tab->cond_equal= tbl->cond_equal;
6915
if (embedding->embedding)
6916
tab->first_upper= embedding->embedding->nested_join->first_nested;
6918
if (!tab->first_inner)
6919
tab->first_inner= nested_join->first_nested;
6920
if (++nested_join->counter_ < nested_join->join_list.elements)
6922
/* Table tab is the last inner table for nested join. */
6923
nested_join->first_nested->last_inner= tab;
6931
make_join_select(JOIN *join,SQL_SELECT *select,COND *cond)
6933
THD *thd= join->thd;
6936
add_not_null_conds(join);
6937
table_map used_tables;
6938
if (cond) /* Because of QUICK_GROUP_MIN_MAX_SELECT */
6939
{ /* there may be a select without a cond. */
6940
if (join->tables > 1)
6941
cond->update_used_tables(); // Tablenr may have changed
6942
if (join->const_tables == join->tables &&
6943
thd->lex->current_select->master_unit() ==
6944
&thd->lex->unit) // not upper level SELECT
6945
join->const_table_map|=RAND_TABLE_BIT;
6946
{ // Check const tables
6948
make_cond_for_table(cond,
6949
join->const_table_map,
6951
for (JOIN_TAB *tab= join->join_tab+join->const_tables;
6952
tab < join->join_tab+join->tables ; tab++)
6954
if (*tab->on_expr_ref)
6956
JOIN_TAB *cond_tab= tab->first_inner;
6957
COND *tmp= make_cond_for_table(*tab->on_expr_ref,
6958
join->const_table_map,
6962
tmp= new Item_func_trig_cond(tmp, &cond_tab->not_null_compl);
6965
tmp->quick_fix_field();
6966
cond_tab->select_cond= !cond_tab->select_cond ? tmp :
6967
new Item_cond_and(cond_tab->select_cond,
6969
if (!cond_tab->select_cond)
6971
cond_tab->select_cond->quick_fix_field();
6974
if (const_cond && !const_cond->val_int())
6976
return(1); // Impossible const condition
6980
used_tables=((select->const_tables=join->const_table_map) |
6981
OUTER_REF_TABLE_BIT | RAND_TABLE_BIT);
6982
for (uint i=join->const_tables ; i < join->tables ; i++)
6984
JOIN_TAB *tab=join->join_tab+i;
6986
first_inner is the X in queries like:
6987
SELECT * FROM t1 LEFT OUTER JOIN (t2 JOIN t3) ON X
6989
JOIN_TAB *first_inner_tab= tab->first_inner;
6990
table_map current_map= tab->table->map;
6991
bool use_quick_range=0;
6995
Following force including random expression in last table condition.
6996
It solve problem with select like SELECT * FROM t1 WHERE rand() > 0.5
6998
if (i == join->tables-1)
6999
current_map|= OUTER_REF_TABLE_BIT | RAND_TABLE_BIT;
7000
used_tables|=current_map;
7002
if (tab->type == JT_REF && tab->quick &&
7003
(uint) tab->ref.key == tab->quick->index &&
7004
tab->ref.key_length < tab->quick->max_used_key_length)
7006
/* Range uses longer key; Use this instead of ref on key */
7011
tab->ref.key_parts=0; // Don't use ref key.
7012
join->best_positions[i].records_read= rows2double(tab->quick->records);
7014
We will use join cache here : prevent sorting of the first
7015
table only and sort at the end.
7017
if (i != join->const_tables && join->tables > join->const_tables + 1)
7023
tmp= make_cond_for_table(cond,used_tables,current_map, 0);
7024
if (cond && !tmp && tab->quick)
7026
if (tab->type != JT_ALL)
7029
Don't use the quick method
7030
We come here in the case where we have 'key=constant' and
7031
the test is removed by make_cond_for_table()
7039
Hack to handle the case where we only refer to a table
7040
in the ON part of an OUTER JOIN. In this case we want the code
7041
below to check if we should use 'quick' instead.
7043
tmp= new Item_int((int64_t) 1,1); // Always true
7047
if (tmp || !cond || tab->type == JT_REF || tab->type == JT_REF_OR_NULL ||
7048
tab->type == JT_EQ_REF)
7050
SQL_SELECT *sel= tab->select= ((SQL_SELECT*)
7051
thd->memdup((uchar*) select,
7054
return(1); // End of memory
7056
If tab is an inner table of an outer join operation,
7057
add a match guard to the pushed down predicate.
7058
The guard will turn the predicate on only after
7059
the first match for outer tables is encountered.
7064
Because of QUICK_GROUP_MIN_MAX_SELECT there may be a select without
7065
a cond, so neutralize the hack above.
7067
if (!(tmp= add_found_match_trig_cond(first_inner_tab, tmp, 0)))
7069
tab->select_cond=sel->cond=tmp;
7070
/* Push condition to storage engine if this is enabled
7071
and the condition is not guarded */
7072
tab->table->file->pushed_cond= NULL;
7073
if (thd->variables.engine_condition_pushdown)
7076
make_cond_for_table(tmp, current_map, current_map, 0);
7079
/* Push condition to handler */
7080
if (!tab->table->file->cond_push(push_cond))
7081
tab->table->file->pushed_cond= push_cond;
7086
tab->select_cond= sel->cond= NULL;
7088
sel->head=tab->table;
7091
/* Use quick key read if it's a constant and it's not used
7093
if (tab->needed_reg.is_clear_all() && tab->type != JT_EQ_REF
7094
&& (tab->type != JT_REF || (uint) tab->ref.key == tab->quick->index))
7096
sel->quick=tab->quick; // Use value from get_quick_...
7097
sel->quick_keys.clear_all();
7098
sel->needed_reg.clear_all();
7106
uint ref_key=(uint) sel->head->reginfo.join_tab->ref.key+1;
7107
if (i == join->const_tables && ref_key)
7109
if (!tab->const_keys.is_clear_all() &&
7110
tab->table->reginfo.impossible_range)
7113
else if (tab->type == JT_ALL && ! use_quick_range)
7115
if (!tab->const_keys.is_clear_all() &&
7116
tab->table->reginfo.impossible_range)
7117
return(1); // Impossible range
7119
We plan to scan all rows.
7120
Check again if we should use an index.
7121
We could have used an column from a previous table in
7122
the index if we are using limit and this is the first table
7125
if ((cond && (!tab->keys.is_subset(tab->const_keys) && i > 0)) ||
7126
(!tab->const_keys.is_clear_all() && (i == join->const_tables) && (join->unit->select_limit_cnt < join->best_positions[i].records_read) && ((join->select_options & OPTION_FOUND_ROWS) == false)))
7128
/* Join with outer join condition */
7129
COND *orig_cond=sel->cond;
7130
sel->cond= and_conds(sel->cond, *tab->on_expr_ref);
7133
We can't call sel->cond->fix_fields,
7134
as it will break tab->on_expr if it's AND condition
7135
(fix_fields currently removes extra AND/OR levels).
7136
Yet attributes of the just built condition are not needed.
7137
Thus we call sel->cond->quick_fix_field for safety.
7139
if (sel->cond && !sel->cond->fixed)
7140
sel->cond->quick_fix_field();
7142
if (sel->test_quick_select(thd, tab->keys,
7143
used_tables & ~ current_map,
7144
(join->select_options &
7147
join->unit->select_limit_cnt), 0,
7151
Before reporting "Impossible WHERE" for the whole query
7152
we have to check isn't it only "impossible ON" instead
7154
sel->cond=orig_cond;
7155
if (!*tab->on_expr_ref ||
7156
sel->test_quick_select(thd, tab->keys,
7157
used_tables & ~ current_map,
7158
(join->select_options &
7161
join->unit->select_limit_cnt),0,
7163
return(1); // Impossible WHERE
7166
sel->cond=orig_cond;
7168
/* Fix for EXPLAIN */
7170
join->best_positions[i].records_read= (double)sel->quick->records;
7174
sel->needed_reg=tab->needed_reg;
7175
sel->quick_keys.clear_all();
7177
if (!sel->quick_keys.is_subset(tab->checked_keys) ||
7178
!sel->needed_reg.is_subset(tab->checked_keys))
7180
tab->keys=sel->quick_keys;
7181
tab->keys.merge(sel->needed_reg);
7182
tab->use_quick= (!sel->needed_reg.is_clear_all() &&
7183
(select->quick_keys.is_clear_all() ||
7185
(select->quick->records >= 100L)))) ?
7187
sel->read_tables= used_tables & ~current_map;
7189
if (i != join->const_tables && tab->use_quick != 2)
7190
{ /* Read with cache */
7192
(tmp=make_cond_for_table(cond,
7193
join->const_table_map |
7197
tab->cache.select=(SQL_SELECT*)
7198
thd->memdup((uchar*) sel, sizeof(SQL_SELECT));
7199
tab->cache.select->cond=tmp;
7200
tab->cache.select->read_tables=join->const_table_map;
7207
Push down conditions from all on expressions.
7208
Each of these conditions are guarded by a variable
7209
that turns if off just before null complemented row for
7210
outer joins is formed. Thus, the condition from an
7211
'on expression' are guaranteed not to be checked for
7212
the null complemented row.
7215
/* First push down constant conditions from on expressions */
7216
for (JOIN_TAB *join_tab= join->join_tab+join->const_tables;
7217
join_tab < join->join_tab+join->tables ; join_tab++)
7219
if (*join_tab->on_expr_ref)
7221
JOIN_TAB *cond_tab= join_tab->first_inner;
7222
COND *tmp= make_cond_for_table(*join_tab->on_expr_ref,
7223
join->const_table_map,
7227
tmp= new Item_func_trig_cond(tmp, &cond_tab->not_null_compl);
7230
tmp->quick_fix_field();
7231
cond_tab->select_cond= !cond_tab->select_cond ? tmp :
7232
new Item_cond_and(cond_tab->select_cond,tmp);
7233
if (!cond_tab->select_cond)
7235
cond_tab->select_cond->quick_fix_field();
7239
/* Push down non-constant conditions from on expressions */
7240
JOIN_TAB *last_tab= tab;
7241
while (first_inner_tab && first_inner_tab->last_inner == last_tab)
7244
Table tab is the last inner table of an outer join.
7245
An on expression is always attached to it.
7247
COND *on_expr= *first_inner_tab->on_expr_ref;
7249
table_map used_tables2= (join->const_table_map |
7250
OUTER_REF_TABLE_BIT | RAND_TABLE_BIT);
7251
for (tab= join->join_tab+join->const_tables; tab <= last_tab ; tab++)
7253
current_map= tab->table->map;
7254
used_tables2|= current_map;
7255
COND *tmp_cond= make_cond_for_table(on_expr, used_tables2,
7259
JOIN_TAB *cond_tab= tab < first_inner_tab ? first_inner_tab : tab;
7261
First add the guards for match variables of
7262
all embedding outer join operations.
7264
if (!(tmp_cond= add_found_match_trig_cond(cond_tab->first_inner,
7269
Now add the guard turning the predicate off for
7270
the null complemented row.
7272
tmp_cond= new Item_func_trig_cond(tmp_cond,
7276
tmp_cond->quick_fix_field();
7277
/* Add the predicate to other pushed down predicates */
7278
cond_tab->select_cond= !cond_tab->select_cond ? tmp_cond :
7279
new Item_cond_and(cond_tab->select_cond,
7281
if (!cond_tab->select_cond)
7283
cond_tab->select_cond->quick_fix_field();
7286
first_inner_tab= first_inner_tab->first_upper;
7295
Check if given expression uses only table fields covered by the given index
7298
uses_index_fields_only()
7299
item Expression to check
7300
tbl The table having the index
7301
keyno The index number
7302
other_tbls_ok true <=> Fields of other non-const tables are allowed
7305
Check if given expression only uses fields covered by index #keyno in the
7306
table tbl. The expression can use any fields in any other tables.
7308
The expression is guaranteed not to be AND or OR - those constructs are
7309
handled outside of this function.
7316
bool uses_index_fields_only(Item *item, Table *tbl, uint keyno,
7319
if (item->const_item())
7323
Don't push down the triggered conditions. Nested outer joins execution
7324
code may need to evaluate a condition several times (both triggered and
7325
untriggered), and there is no way to put thi
7326
TODO: Consider cloning the triggered condition and using the copies for:
7327
1. push the first copy down, to have most restrictive index condition
7329
2. Put the second copy into tab->select_cond.
7331
if (item->type() == Item::FUNC_ITEM &&
7332
((Item_func*)item)->functype() == Item_func::TRIG_COND_FUNC)
7335
if (!(item->used_tables() & tbl->map))
7336
return other_tbls_ok;
7338
Item::Type item_type= item->type();
7339
switch (item_type) {
7340
case Item::FUNC_ITEM:
7342
/* This is a function, apply condition recursively to arguments */
7343
Item_func *item_func= (Item_func*)item;
7345
Item **item_end= (item_func->arguments()) + item_func->argument_count();
7346
for (child= item_func->arguments(); child != item_end; child++)
7348
if (!uses_index_fields_only(*child, tbl, keyno, other_tbls_ok))
7353
case Item::COND_ITEM:
7355
/* This is a function, apply condition recursively to arguments */
7356
List_iterator<Item> li(*((Item_cond*)item)->argument_list());
7360
if (!uses_index_fields_only(item, tbl, keyno, other_tbls_ok))
7365
case Item::FIELD_ITEM:
7367
Item_field *item_field= (Item_field*)item;
7368
if (item_field->field->table != tbl)
7370
return item_field->field->part_of_key.is_set(keyno);
7372
case Item::REF_ITEM:
7373
return uses_index_fields_only(item->real_item(), tbl, keyno,
7376
return false; /* Play it safe, don't push unknown non-const items */
1212
7381
#define ICP_COND_USES_INDEX_ONLY 10
1218
void JoinTable::cleanup()
7384
Get a part of the condition that can be checked using only index fields
7387
make_cond_for_index()
7388
cond The source condition
7389
table The table that is partially available
7390
keyno The index in the above table. Only fields covered by the index
7392
other_tbls_ok true <=> Fields of other non-const tables are allowed
7395
Get a part of the condition that can be checked when for the given table
7396
we have values only of fields covered by some index. The condition may
7397
refer to other tables, it is assumed that we have values of all of their
7401
make_cond_for_index(
7402
"cond(t1.field) AND cond(t2.key1) AND cond(t2.non_key) AND cond(t2.key2)",
7405
"cond(t1.field) AND cond(t2.key2)"
7408
Index condition, or NULL if no condition could be inferred.
7411
Item *make_cond_for_index(Item *cond, Table *table, uint keyno,
7416
if (cond->type() == Item::COND_ITEM)
7419
if (((Item_cond*) cond)->functype() == Item_func::COND_AND_FUNC)
7421
Item_cond_and *new_cond=new Item_cond_and;
7424
List_iterator<Item> li(*((Item_cond*) cond)->argument_list());
7428
Item *fix= make_cond_for_index(item, table, keyno, other_tbls_ok);
7430
new_cond->argument_list()->push_back(fix);
7431
n_marked += test(item->marker == ICP_COND_USES_INDEX_ONLY);
7433
if (n_marked ==((Item_cond*)cond)->argument_list()->elements)
7434
cond->marker= ICP_COND_USES_INDEX_ONLY;
7435
switch (new_cond->argument_list()->elements) {
7439
return new_cond->argument_list()->head();
7441
new_cond->quick_fix_field();
7447
Item_cond_or *new_cond=new Item_cond_or;
7450
List_iterator<Item> li(*((Item_cond*) cond)->argument_list());
7454
Item *fix= make_cond_for_index(item, table, keyno, other_tbls_ok);
7457
new_cond->argument_list()->push_back(fix);
7458
n_marked += test(item->marker == ICP_COND_USES_INDEX_ONLY);
7460
if (n_marked ==((Item_cond*)cond)->argument_list()->elements)
7461
cond->marker= ICP_COND_USES_INDEX_ONLY;
7462
new_cond->quick_fix_field();
7463
new_cond->top_level_item();
7468
if (!uses_index_fields_only(cond, table, keyno, other_tbls_ok))
7470
cond->marker= ICP_COND_USES_INDEX_ONLY;
7475
Item *make_cond_remainder(Item *cond, bool exclude_index)
7477
if (exclude_index && cond->marker == ICP_COND_USES_INDEX_ONLY)
7478
return 0; /* Already checked */
7480
if (cond->type() == Item::COND_ITEM)
7482
table_map tbl_map= 0;
7483
if (((Item_cond*) cond)->functype() == Item_func::COND_AND_FUNC)
7485
/* Create new top level AND item */
7486
Item_cond_and *new_cond=new Item_cond_and;
7489
List_iterator<Item> li(*((Item_cond*) cond)->argument_list());
7493
Item *fix= make_cond_remainder(item, exclude_index);
7496
new_cond->argument_list()->push_back(fix);
7497
tbl_map |= fix->used_tables();
7500
switch (new_cond->argument_list()->elements) {
7504
return new_cond->argument_list()->head();
7506
new_cond->quick_fix_field();
7507
((Item_cond*)new_cond)->used_tables_cache= tbl_map;
7513
Item_cond_or *new_cond=new Item_cond_or;
7516
List_iterator<Item> li(*((Item_cond*) cond)->argument_list());
7520
Item *fix= make_cond_remainder(item, false);
7523
new_cond->argument_list()->push_back(fix);
7524
tbl_map |= fix->used_tables();
7526
new_cond->quick_fix_field();
7527
((Item_cond*)new_cond)->used_tables_cache= tbl_map;
7528
new_cond->top_level_item();
7537
Try to extract and push the index condition
7541
tab A join tab that has tab->table->file and its condition
7543
keyno Index for which extract and push the condition
7544
other_tbls_ok true <=> Fields of other non-const tables are allowed
7547
Try to extract and push the index condition down to table handler
7550
static void push_index_cond(JOIN_TAB *tab, uint keyno, bool other_tbls_ok)
7553
if (tab->table->file->index_flags(keyno, 0, 1) & HA_DO_INDEX_COND_PUSHDOWN &&
7554
tab->join->thd->variables.engine_condition_pushdown)
7556
idx_cond= make_cond_for_index(tab->select_cond, tab->table, keyno,
7561
tab->pre_idx_push_select_cond= tab->select_cond;
7562
Item *idx_remainder_cond=
7563
tab->table->file->idx_cond_push(keyno, idx_cond);
7566
Disable eq_ref's "lookup cache" if we've pushed down an index
7568
TODO: This check happens to work on current ICP implementations, but
7569
there may exist a compliant implementation that will not work
7570
correctly with it. Sort this out when we stabilize the condition
7573
if (idx_remainder_cond != idx_cond)
7574
tab->ref.disable_cache= true;
7576
Item *row_cond= make_cond_remainder(tab->select_cond, true);
7580
if (!idx_remainder_cond)
7581
tab->select_cond= row_cond;
7584
tab->select_cond= new Item_cond_and(row_cond, idx_remainder_cond);
7585
tab->select_cond->quick_fix_field();
7586
((Item_cond_and*)tab->select_cond)->used_tables_cache=
7587
row_cond->used_tables() | idx_remainder_cond->used_tables();
7591
tab->select_cond= idx_remainder_cond;
7594
tab->select->cond= tab->select_cond;
7604
Determine if the set is already ordered for order_st BY, so it can
7605
disable join cache because it will change the ordering of the results.
7606
Code handles sort table that is at any location (not only first after
7607
the const tables) despite the fact that it's currently prohibited.
7608
We must disable join cache if the first non-const table alone is
7609
ordered. If there is a temp table the ordering is done as a last
7610
operation and doesn't prevent join cache usage.
7612
uint make_join_orderinfo(JOIN *join)
7616
return join->tables;
7618
for (i=join->const_tables ; i < join->tables ; i++)
7620
JOIN_TAB *tab=join->join_tab+i;
7621
Table *table=tab->table;
7622
if ((table == join->sort_by_table &&
7623
(!join->order || join->skip_sort_order)) ||
7624
(join->sort_by_table == (Table *) 1 && i != join->const_tables))
7634
Plan refinement stage: do various set ups for the executioner
7637
make_join_readinfo()
7638
join Join being processed
7639
options Join's options (checking for SELECT_DESCRIBE,
7640
SELECT_NO_JOIN_CACHE)
7641
no_jbuf_after Don't use join buffering after table with this number.
7644
Plan refinement stage: do various set ups for the executioner
7645
- set up use of join buffering
7646
- push index conditions
7647
- increment counters
7652
true - Out of memory
7656
make_join_readinfo(JOIN *join, uint64_t options, uint no_jbuf_after)
7659
bool statistics= test(!(join->select_options & SELECT_DESCRIBE));
7662
for (i=join->const_tables ; i < join->tables ; i++)
7664
JOIN_TAB *tab=join->join_tab+i;
7665
Table *table=tab->table;
7666
bool using_join_cache;
7667
tab->read_record.table= table;
7668
tab->read_record.file=table->file;
7669
tab->next_select=sub_select; /* normal select */
7671
TODO: don't always instruct first table's ref/range access method to
7672
produce sorted output.
7674
tab->sorted= sorted;
7675
sorted= 0; // only first must be sorted
7676
if (tab->insideout_match_tab)
7678
if (!(tab->insideout_buf= (uchar*)join->thd->alloc(tab->table->key_info
7683
switch (tab->type) {
7684
case JT_SYSTEM: // Only happens with left join
7685
table->status=STATUS_NO_RECORD;
7686
tab->read_first_record= join_read_system;
7687
tab->read_record.read_record= join_no_more_records;
7689
case JT_CONST: // Only happens with left join
7690
table->status=STATUS_NO_RECORD;
7691
tab->read_first_record= join_read_const;
7692
tab->read_record.read_record= join_no_more_records;
7693
if (table->covering_keys.is_set(tab->ref.key) &&
7697
table->file->extra(HA_EXTRA_KEYREAD);
7701
table->status=STATUS_NO_RECORD;
7704
delete tab->select->quick;
7705
tab->select->quick=0;
7709
tab->read_first_record= join_read_key;
7710
tab->read_record.read_record= join_no_more_records;
7711
if (table->covering_keys.is_set(tab->ref.key) &&
7715
table->file->extra(HA_EXTRA_KEYREAD);
7718
push_index_cond(tab, tab->ref.key, true);
7720
case JT_REF_OR_NULL:
7722
table->status=STATUS_NO_RECORD;
7725
delete tab->select->quick;
7726
tab->select->quick=0;
7730
if (table->covering_keys.is_set(tab->ref.key) &&
7734
table->file->extra(HA_EXTRA_KEYREAD);
7737
push_index_cond(tab, tab->ref.key, true);
7738
if (tab->type == JT_REF)
7740
tab->read_first_record= join_read_always_key;
7741
tab->read_record.read_record= tab->insideout_match_tab?
7742
join_read_next_same_diff : join_read_next_same;
7746
tab->read_first_record= join_read_always_key_or_null;
7747
tab->read_record.read_record= join_read_next_same_or_null;
7752
If previous table use cache
7753
If the incoming data set is already sorted don't use cache.
7755
table->status=STATUS_NO_RECORD;
7756
using_join_cache= false;
7757
if (i != join->const_tables && !(options & SELECT_NO_JOIN_CACHE) &&
7758
tab->use_quick != 2 && !tab->first_inner && i <= no_jbuf_after &&
7759
!tab->insideout_match_tab)
7761
if ((options & SELECT_DESCRIBE) ||
7762
!join_init_cache(join->thd,join->join_tab+join->const_tables,
7763
i-join->const_tables))
7765
using_join_cache= true;
7766
tab[-1].next_select=sub_select_cache; /* Patch previous */
7769
/* These init changes read_record */
7770
if (tab->use_quick == 2)
7772
join->thd->server_status|=SERVER_QUERY_NO_GOOD_INDEX_USED;
7773
tab->read_first_record= join_init_quick_read_record;
7775
status_var_increment(join->thd->status_var.select_range_check_count);
7779
tab->read_first_record= join_init_read_record;
7780
if (i == join->const_tables)
7782
if (tab->select && tab->select->quick)
7785
status_var_increment(join->thd->status_var.select_range_count);
7789
join->thd->server_status|=SERVER_QUERY_NO_INDEX_USED;
7791
status_var_increment(join->thd->status_var.select_scan_count);
7796
if (tab->select && tab->select->quick)
7799
status_var_increment(join->thd->status_var.select_full_range_join_count);
7803
join->thd->server_status|=SERVER_QUERY_NO_INDEX_USED;
7805
status_var_increment(join->thd->status_var.select_full_join_count);
7808
if (!table->no_keyread)
7810
if (tab->select && tab->select->quick &&
7811
tab->select->quick->index != MAX_KEY && //not index_merge
7812
table->covering_keys.is_set(tab->select->quick->index))
7815
table->file->extra(HA_EXTRA_KEYREAD);
7817
else if (!table->covering_keys.is_clear_all() &&
7818
!(tab->select && tab->select->quick))
7819
{ // Only read index tree
7820
if (!tab->insideout_match_tab)
7823
See bug #26447: "Using the clustered index for a table scan
7824
is always faster than using a secondary index".
7826
if (table->s->primary_key != MAX_KEY &&
7827
table->file->primary_key_is_clustered())
7828
tab->index= table->s->primary_key;
7830
tab->index= table->find_shortest_key(&table->covering_keys);
7832
tab->read_first_record= join_read_first;
7833
tab->type=JT_NEXT; // Read with index_first / index_next
7836
if (tab->select && tab->select->quick &&
7837
tab->select->quick->index != MAX_KEY && ! tab->table->key_read)
7838
push_index_cond(tab, tab->select->quick->index, !using_join_cache);
7842
break; /* purecov: deadcode */
7845
abort(); /* purecov: deadcode */
7848
join->join_tab[join->tables-1].next_select=0; /* Set by do_select */
7854
Give error if we some tables are done with a full join.
7856
This is used by multi_table_update and multi_table_delete when running
7859
@param join Join condition
7864
1 Error (full join used)
7867
bool error_if_full_join(JOIN *join)
7869
for (JOIN_TAB *tab=join->join_tab, *end=join->join_tab+join->tables;
7873
if (tab->type == JT_ALL && (!tab->select || !tab->select->quick))
7875
my_message(ER_UPDATE_WITHOUT_KEY_IN_SAFE_MODE,
7876
ER(ER_UPDATE_WITHOUT_KEY_IN_SAFE_MODE), MYF(0));
7888
void JOIN_TAB::cleanup()
1226
size_t size= cache.end - cache.buff;
1227
global_join_buffer.sub(size);
2512
9613
if (!(left_const && right_const) &&
2513
9614
args[0]->result_type() == args[1]->result_type())
2517
resolve_const_item(session, &args[1], args[0]);
2518
func->update_used_tables();
2519
change_cond_ref_to_const(session, save_list, and_father, and_father,
2522
else if (left_const)
2524
resolve_const_item(session, &args[0], args[1]);
2525
func->update_used_tables();
2526
change_cond_ref_to_const(session, save_list, and_father, and_father,
9618
resolve_const_item(thd, &args[1], args[0]);
9619
func->update_used_tables();
9620
change_cond_ref_to_const(thd, save_list, and_father, and_father,
9623
else if (left_const)
9625
resolve_const_item(thd, &args[0], args[1]);
9626
func->update_used_tables();
9627
change_cond_ref_to_const(thd, save_list, and_father, and_father,
9637
Simplify joins replacing outer joins by inner joins whenever it's
9640
The function, during a retrieval of join_list, eliminates those
9641
outer joins that can be converted into inner join, possibly nested.
9642
It also moves the on expressions for the converted outer joins
9643
and from inner joins to conds.
9644
The function also calculates some attributes for nested joins:
9648
- on_expr_dep_tables
9649
The first two attributes are used to test whether an outer join can
9650
be substituted for an inner join. The third attribute represents the
9651
relation 'to be dependent on' for tables. If table t2 is dependent
9652
on table t1, then in any evaluated execution plan table access to
9653
table t2 must precede access to table t2. This relation is used also
9654
to check whether the query contains invalid cross-references.
9655
The forth attribute is an auxiliary one and is used to calculate
9657
As the attribute dep_tables qualifies possibles orders of tables in the
9658
execution plan, the dependencies required by the straight join
9659
modifiers are reflected in this attribute as well.
9660
The function also removes all braces that can be removed from the join
9661
expression without changing its meaning.
9664
An outer join can be replaced by an inner join if the where condition
9665
or the on expression for an embedding nested join contains a conjunctive
9666
predicate rejecting null values for some attribute of the inner tables.
9670
SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t1.a WHERE t2.b < 5
9672
the predicate t2.b < 5 rejects nulls.
9673
The query is converted first to:
9675
SELECT * FROM t1 INNER JOIN t2 ON t2.a=t1.a WHERE t2.b < 5
9677
then to the equivalent form:
9679
SELECT * FROM t1, t2 ON t2.a=t1.a WHERE t2.b < 5 AND t2.a=t1.a
9683
Similarly the following query:
9685
SELECT * from t1 LEFT JOIN (t2, t3) ON t2.a=t1.a t3.b=t1.b
9690
SELECT * FROM t1, (t2, t3) WHERE t2.c < 5 AND t2.a=t1.a t3.b=t1.b
9694
One conversion might trigger another:
9696
SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t1.a
9697
LEFT JOIN t3 ON t3.b=t2.b
9698
WHERE t3 IS NOT NULL =>
9699
SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t1.a, t3
9700
WHERE t3 IS NOT NULL AND t3.b=t2.b =>
9701
SELECT * FROM t1, t2, t3
9702
WHERE t3 IS NOT NULL AND t3.b=t2.b AND t2.a=t1.a
9705
The function removes all unnecessary braces from the expression
9706
produced by the conversions.
9709
SELECT * FROM t1, (t2, t3) WHERE t2.c < 5 AND t2.a=t1.a AND t3.b=t1.b
9711
finally is converted to:
9713
SELECT * FROM t1, t2, t3 WHERE t2.c < 5 AND t2.a=t1.a AND t3.b=t1.b
9718
It also will remove braces from the following queries:
9720
SELECT * from (t1 LEFT JOIN t2 ON t2.a=t1.a) LEFT JOIN t3 ON t3.b=t2.b
9721
SELECT * from (t1, (t2,t3)) WHERE t1.a=t2.a AND t2.b=t3.b.
9724
The benefit of this simplification procedure is that it might return
9725
a query for which the optimizer can evaluate execution plan with more
9726
join orders. With a left join operation the optimizer does not
9727
consider any plan where one of the inner tables is before some of outer
9731
The function is implemented by a recursive procedure. On the recursive
9732
ascent all attributes are calculated, all outer joins that can be
9733
converted are replaced and then all unnecessary braces are removed.
9734
As join list contains join tables in the reverse order sequential
9735
elimination of outer joins does not require extra recursive calls.
9738
Remove all semi-joins that have are within another semi-join (i.e. have
9739
an "ancestor" semi-join nest)
9742
Here is an example of a join query with invalid cross references:
9744
SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t3.a LEFT JOIN t3 ON t3.b=t1.b
9747
@param join reference to the query info
9748
@param join_list list representation of the join to be converted
9749
@param conds conditions to add on expressions for converted joins
9750
@param top true <=> conds is the where condition
9753
- The new condition, if success
9758
simplify_joins(JOIN *join, List<TableList> *join_list, COND *conds, bool top,
9762
nested_join_st *nested_join;
9763
TableList *prev_table= 0;
9764
List_iterator<TableList> li(*join_list);
9767
Try to simplify join operations from join_list.
9768
The most outer join operation is checked for conversion first.
9770
while ((table= li++))
9772
table_map used_tables;
9773
table_map not_null_tables= (table_map) 0;
9775
if ((nested_join= table->nested_join))
9778
If the element of join_list is a nested join apply
9779
the procedure to its nested join list first.
9783
Item *expr= table->on_expr;
9785
If an on expression E is attached to the table,
9786
check all null rejected predicates in this expression.
9787
If such a predicate over an attribute belonging to
9788
an inner table of an embedded outer join is found,
9789
the outer join is converted to an inner join and
9790
the corresponding on expression is added to E.
9792
expr= simplify_joins(join, &nested_join->join_list,
9793
expr, false, in_sj || table->sj_on_expr);
9795
if (!table->prep_on_expr || expr != table->on_expr)
9799
table->on_expr= expr;
9800
table->prep_on_expr= expr->copy_andor_structure(join->thd);
9803
nested_join->used_tables= (table_map) 0;
9804
nested_join->not_null_tables=(table_map) 0;
9805
conds= simplify_joins(join, &nested_join->join_list, conds, top,
9806
in_sj || table->sj_on_expr);
9807
used_tables= nested_join->used_tables;
9808
not_null_tables= nested_join->not_null_tables;
9812
if (!table->prep_on_expr)
9813
table->prep_on_expr= table->on_expr;
9814
used_tables= table->table->map;
9816
not_null_tables= conds->not_null_tables();
9819
if (table->embedding)
9821
table->embedding->nested_join->used_tables|= used_tables;
9822
table->embedding->nested_join->not_null_tables|= not_null_tables;
9825
if (!table->outer_join || (used_tables & not_null_tables))
9828
For some of the inner tables there are conjunctive predicates
9829
that reject nulls => the outer join can be replaced by an inner join.
9831
table->outer_join= 0;
9834
/* Add ON expression to the WHERE or upper-level ON condition. */
9837
conds= and_conds(conds, table->on_expr);
9838
conds->top_level_item();
9839
/* conds is always a new item as both cond and on_expr existed */
9840
assert(!conds->fixed);
9841
conds->fix_fields(join->thd, &conds);
9844
conds= table->on_expr;
9845
table->prep_on_expr= table->on_expr= 0;
9853
Only inner tables of non-convertible outer joins
9854
remain with on_expr.
9858
table->dep_tables|= table->on_expr->used_tables();
9859
if (table->embedding)
9861
table->dep_tables&= ~table->embedding->nested_join->used_tables;
9863
Embedding table depends on tables used
9864
in embedded on expressions.
9866
table->embedding->on_expr_dep_tables|= table->on_expr->used_tables();
9869
table->dep_tables&= ~table->table->map;
9874
/* The order of tables is reverse: prev_table follows table */
9875
if (prev_table->straight)
9876
prev_table->dep_tables|= used_tables;
9877
if (prev_table->on_expr)
9879
prev_table->dep_tables|= table->on_expr_dep_tables;
9880
table_map prev_used_tables= prev_table->nested_join ?
9881
prev_table->nested_join->used_tables :
9882
prev_table->table->map;
9884
If on expression contains only references to inner tables
9885
we still make the inner tables dependent on the outer tables.
9886
It would be enough to set dependency only on one outer table
9887
for them. Yet this is really a rare case.
9889
if (!(prev_table->on_expr->used_tables() & ~prev_used_tables))
9890
prev_table->dep_tables|= used_tables;
9897
Flatten nested joins that can be flattened.
9898
no ON expression and not a semi-join => can be flattened.
9901
while ((table= li++))
9903
nested_join= table->nested_join;
9904
if (table->sj_on_expr && !in_sj)
9907
If this is a semi-join that is not contained within another semi-join,
9908
leave it intact (otherwise it is flattened)
9910
join->select_lex->sj_nests.push_back(table);
9912
else if (nested_join && !table->on_expr)
9915
List_iterator<TableList> it(nested_join->join_list);
9918
tbl->embedding= table->embedding;
9919
tbl->join_list= table->join_list;
9921
li.replace(nested_join->join_list);
9929
Assign each nested join structure a bit in nested_join_map.
9931
Assign each nested join structure (except "confluent" ones - those that
9932
embed only one element) a bit in nested_join_map.
9934
@param join Join being processed
9935
@param join_list List of tables
9936
@param first_unused Number of first unused bit in nested_join_map before the
9940
This function is called after simplify_joins(), when there are no
9941
redundant nested joins, #non_confluent_nested_joins <= #tables_in_join so
9942
we will not run out of bits in nested_join_map.
9945
First unused bit in nested_join_map after the call.
9948
static uint build_bitmap_for_nested_joins(List<TableList> *join_list,
9951
List_iterator<TableList> li(*join_list);
9953
while ((table= li++))
9955
nested_join_st *nested_join;
9956
if ((nested_join= table->nested_join))
9959
It is guaranteed by simplify_joins() function that a nested join
9960
that has only one child is either
9961
- a single-table view (the child is the underlying table), or
9962
- a single-table semi-join nest
9964
We don't assign bits to such sj-nests because
9965
1. it is redundant (a "sequence" of one table cannot be interleaved
9967
2. we could run out bits in nested_join_map otherwise.
9969
if (nested_join->join_list.elements != 1)
9971
/* Don't assign bits to sj-nests */
9973
nested_join->nj_map= (nested_join_map) 1 << first_unused++;
9974
first_unused= build_bitmap_for_nested_joins(&nested_join->join_list,
9979
return(first_unused);
9984
Set nested_join_st::counter=0 in all nested joins in passed list.
9986
Recursively set nested_join_st::counter=0 for all nested joins contained in
9987
the passed join_list.
9989
@param join_list List of nested joins to process. It may also contain base
9990
tables which will be ignored.
9993
static void reset_nj_counters(List<TableList> *join_list)
9995
List_iterator<TableList> li(*join_list);
9997
while ((table= li++))
9999
nested_join_st *nested_join;
10000
if ((nested_join= table->nested_join))
10002
nested_join->counter_= 0;
10003
reset_nj_counters(&nested_join->join_list);
2535
10011
Check interleaving with an inner tables of an outer join for
2536
10012
extension table.
2538
Check if table next_tab can be added to current partial join order, and
10014
Check if table next_tab can be added to current partial join order, and
2539
10015
if yes, record that it has been added.
2541
10017
The function assumes that both current partial join order and its
2542
10018
extension with next_tab are valid wrt table dependencies.
2546
10022
LIMITATIONS ON JOIN order_st
2547
10023
The nested [outer] joins executioner algorithm imposes these limitations
2548
10024
on join order:
2549
1. "Outer tables first" - any "outer" table must be before any
10025
1. "Outer tables first" - any "outer" table must be before any
2550
10026
corresponding "inner" table.
2551
10027
2. "No interleaving" - tables inside a nested join must form a continuous
2552
sequence in join order (i.e. the sequence must not be interrupted by
10028
sequence in join order (i.e. the sequence must not be interrupted by
2553
10029
tables that are outside of this nested join).
2555
10031
#1 is checked elsewhere, this function checks #2 provided that #1 has
2556
10032
been already checked.
2558
10034
WHY NEED NON-INTERLEAVING
2559
Consider an example:
10035
Consider an example:
2561
10037
select * from t0 join t1 left join (t2 join t3) on cond1
3359
int safe_index_read(JoinTable *tab)
10917
SemiJoinDuplicateElimination: Weed out duplicate row combinations
10920
do_sj_dups_weedout()
10924
1 The row combination is a duplicate (discard it)
10925
0 The row combination is not a duplicate (continue)
10928
int do_sj_dups_weedout(THD *thd, SJ_TMP_TABLE *sjtbl)
10931
SJ_TMP_TABLE::TAB *tab= sjtbl->tabs;
10932
SJ_TMP_TABLE::TAB *tab_end= sjtbl->tabs_end;
10933
uchar *ptr= sjtbl->tmp_table->record[0] + 1;
10934
uchar *nulls_ptr= ptr;
10936
/* Put the the rowids tuple into table->record[0]: */
10938
// 1. Store the length
10939
if (((Field_varstring*)(sjtbl->tmp_table->field[0]))->length_bytes == 1)
10941
*ptr= (uchar)(sjtbl->rowid_len + sjtbl->null_bytes);
10946
int2store(ptr, sjtbl->rowid_len + sjtbl->null_bytes);
10950
// 2. Zero the null bytes
10951
if (sjtbl->null_bytes)
10953
memset(ptr, 0, sjtbl->null_bytes);
10954
ptr += sjtbl->null_bytes;
10957
// 3. Put the rowids
10958
for (uint i=0; tab != tab_end; tab++, i++)
10960
handler *h= tab->join_tab->table->file;
10961
if (tab->join_tab->table->maybe_null && tab->join_tab->table->null_row)
10963
/* It's a NULL-complemented row */
10964
*(nulls_ptr + tab->null_byte) |= tab->null_bit;
10965
memset(ptr + tab->rowid_offset, 0, h->ref_length);
10969
/* Copy the rowid value */
10970
if (tab->join_tab->rowid_keep_flags & JOIN_TAB::CALL_POSITION)
10971
h->position(tab->join_tab->table->record[0]);
10972
memcpy(ptr + tab->rowid_offset, h->ref, h->ref_length);
10976
error= sjtbl->tmp_table->file->ha_write_row(sjtbl->tmp_table->record[0]);
10979
/* create_myisam_from_heap will generate error if needed */
10980
if (sjtbl->tmp_table->file->is_fatal_error(error, HA_CHECK_DUP) &&
10981
create_myisam_from_heap(thd, sjtbl->tmp_table, sjtbl->start_recinfo,
10982
&sjtbl->recinfo, error, 1))
10984
//return (error == HA_ERR_FOUND_DUPP_KEY || error== HA_ERR_FOUND_DUPP_UNIQUE) ? 1: -1;
10992
SemiJoinDuplicateElimination: Reset the temporary table
10995
int do_sj_reset(SJ_TMP_TABLE *sj_tbl)
10997
if (sj_tbl->tmp_table)
10998
return sj_tbl->tmp_table->file->ha_delete_all_rows();
11003
Process one record of the nested loop join.
11005
This function will evaluate parts of WHERE/ON clauses that are
11006
applicable to the partial record on hand and in case of success
11007
submit this record to the next level of the nested loop.
11010
static enum_nested_loop_state
11011
evaluate_join_record(JOIN *join, JOIN_TAB *join_tab,
11014
bool not_used_in_distinct=join_tab->not_used_in_distinct;
11015
ha_rows found_records=join->found_records;
11016
COND *select_cond= join_tab->select_cond;
11018
if (error > 0 || (join->thd->is_error())) // Fatal error
11019
return NESTED_LOOP_ERROR;
11021
return NESTED_LOOP_NO_MORE_ROWS;
11022
if (join->thd->killed) // Aborted by user
11024
join->thd->send_kill_message();
11025
return NESTED_LOOP_KILLED; /* purecov: inspected */
11027
if (!select_cond || select_cond->val_int())
11030
There is no select condition or the attached pushed down
11031
condition is true => a match is found.
11034
while (join_tab->first_unmatched && found)
11037
The while condition is always false if join_tab is not
11038
the last inner join table of an outer join operation.
11040
JOIN_TAB *first_unmatched= join_tab->first_unmatched;
11042
Mark that a match for current outer table is found.
11043
This activates push down conditional predicates attached
11044
to the all inner tables of the outer join.
11046
first_unmatched->found= 1;
11047
for (JOIN_TAB *tab= first_unmatched; tab <= join_tab; tab++)
11049
if (tab->table->reginfo.not_exists_optimize)
11050
return NESTED_LOOP_NO_MORE_ROWS;
11051
/* Check all predicates that has just been activated. */
11053
Actually all predicates non-guarded by first_unmatched->found
11054
will be re-evaluated again. It could be fixed, but, probably,
11055
it's not worth doing now.
11057
if (tab->select_cond && !tab->select_cond->val_int())
11059
/* The condition attached to table tab is false */
11060
if (tab == join_tab)
11065
Set a return point if rejected predicate is attached
11066
not to the last table of the current nest level.
11068
join->return_tab= tab;
11069
return NESTED_LOOP_OK;
11074
Check whether join_tab is not the last inner table
11075
for another embedding outer join.
11077
if ((first_unmatched= first_unmatched->first_upper) &&
11078
first_unmatched->last_inner != join_tab)
11079
first_unmatched= 0;
11080
join_tab->first_unmatched= first_unmatched;
11083
JOIN_TAB *return_tab= join->return_tab;
11084
join_tab->found_match= true;
11085
if (join_tab->check_weed_out_table)
11087
int res= do_sj_dups_weedout(join->thd, join_tab->check_weed_out_table);
11089
return NESTED_LOOP_ERROR;
11091
return NESTED_LOOP_OK;
11093
else if (join_tab->do_firstmatch)
11096
We should return to the join_tab->do_firstmatch after we have
11097
enumerated all the suffixes for current prefix row combination
11099
return_tab= join_tab->do_firstmatch;
11103
It was not just a return to lower loop level when one
11104
of the newly activated predicates is evaluated as false
11105
(See above join->return_tab= tab).
11107
join->examined_rows++;
11108
join->thd->row_count++;
11112
enum enum_nested_loop_state rc;
11113
/* A match from join_tab is found for the current partial join. */
11114
rc= (*join_tab->next_select)(join, join_tab+1, 0);
11115
if (rc != NESTED_LOOP_OK && rc != NESTED_LOOP_NO_MORE_ROWS)
11117
if (return_tab < join->return_tab)
11118
join->return_tab= return_tab;
11120
if (join->return_tab < join_tab)
11121
return NESTED_LOOP_OK;
11123
Test if this was a SELECT DISTINCT query on a table that
11124
was not in the field list; In this case we can abort if
11125
we found a row, as no new rows can be added to the result.
11127
if (not_used_in_distinct && found_records != join->found_records)
11128
return NESTED_LOOP_NO_MORE_ROWS;
11131
join_tab->read_record.file->unlock_row();
11136
The condition pushed down to the table join_tab rejects all rows
11137
with the beginning coinciding with the current partial join.
11139
join->examined_rows++;
11140
join->thd->row_count++;
11141
join_tab->read_record.file->unlock_row();
11143
return NESTED_LOOP_OK;
11150
Construct a NULL complimented partial join record and feed it to the next
11151
level of the nested loop. This function is used in case we have
11152
an OUTER join and no matching record was found.
11155
static enum_nested_loop_state
11156
evaluate_null_complemented_join_record(JOIN *join, JOIN_TAB *join_tab)
11159
The table join_tab is the first inner table of a outer join operation
11160
and no matches has been found for the current outer row.
11162
JOIN_TAB *last_inner_tab= join_tab->last_inner;
11163
/* Cache variables for faster loop */
11165
for ( ; join_tab <= last_inner_tab ; join_tab++)
11167
/* Change the the values of guard predicate variables. */
11168
join_tab->found= 1;
11169
join_tab->not_null_compl= 0;
11170
/* The outer row is complemented by nulls for each inner tables */
11171
restore_record(join_tab->table,s->default_values); // Make empty record
11172
mark_as_null_row(join_tab->table); // For group by without error
11173
select_cond= join_tab->select_cond;
11174
/* Check all attached conditions for inner table rows. */
11175
if (select_cond && !select_cond->val_int())
11176
return NESTED_LOOP_OK;
11180
The row complemented by nulls might be the first row
11181
of embedding outer joins.
11182
If so, perform the same actions as in the code
11183
for the first regular outer join row above.
11187
JOIN_TAB *first_unmatched= join_tab->first_unmatched;
11188
if ((first_unmatched= first_unmatched->first_upper) &&
11189
first_unmatched->last_inner != join_tab)
11190
first_unmatched= 0;
11191
join_tab->first_unmatched= first_unmatched;
11192
if (!first_unmatched)
11194
first_unmatched->found= 1;
11195
for (JOIN_TAB *tab= first_unmatched; tab <= join_tab; tab++)
11197
if (tab->select_cond && !tab->select_cond->val_int())
11199
join->return_tab= tab;
11200
return NESTED_LOOP_OK;
11205
The row complemented by nulls satisfies all conditions
11206
attached to inner tables.
11207
Send the row complemented by nulls to be joined with the
11210
return (*join_tab->next_select)(join, join_tab+1, 0);
11214
static enum_nested_loop_state
11215
flush_cached_records(JOIN *join,JOIN_TAB *join_tab,bool skip_last)
11217
enum_nested_loop_state rc= NESTED_LOOP_OK;
11221
join_tab->table->null_row= 0;
11222
if (!join_tab->cache.records)
11223
return NESTED_LOOP_OK; /* Nothing to do */
11225
(void) store_record_in_cache(&join_tab->cache); // Must save this for later
11226
if (join_tab->use_quick == 2)
11228
if (join_tab->select->quick)
11229
{ /* Used quick select last. reset it */
11230
delete join_tab->select->quick;
11231
join_tab->select->quick=0;
11234
/* read through all records */
11235
if ((error=join_init_read_record(join_tab)))
11237
reset_cache_write(&join_tab->cache);
11238
return error < 0 ? NESTED_LOOP_NO_MORE_ROWS: NESTED_LOOP_ERROR;
11241
for (JOIN_TAB *tmp=join->join_tab; tmp != join_tab ; tmp++)
11243
tmp->status=tmp->table->status;
11244
tmp->table->status=0;
11247
info= &join_tab->read_record;
11250
if (join->thd->killed)
11252
join->thd->send_kill_message();
11253
return NESTED_LOOP_KILLED; // Aborted by user /* purecov: inspected */
11255
SQL_SELECT *select=join_tab->select;
11256
if (rc == NESTED_LOOP_OK &&
11257
(!join_tab->cache.select || !join_tab->cache.select->skip_record()))
11260
reset_cache_read(&join_tab->cache);
11261
for (i=(join_tab->cache.records- (skip_last ? 1 : 0)) ; i-- > 0 ;)
11263
read_cached_record(join_tab);
11264
if (!select || !select->skip_record())
11267
if (!join_tab->check_weed_out_table ||
11268
!(res= do_sj_dups_weedout(join->thd, join_tab->check_weed_out_table)))
11270
rc= (join_tab->next_select)(join,join_tab+1,0);
11271
if (rc != NESTED_LOOP_OK && rc != NESTED_LOOP_NO_MORE_ROWS)
11273
reset_cache_write(&join_tab->cache);
11278
return NESTED_LOOP_ERROR;
11282
} while (!(error=info->read_record(info)));
11285
read_cached_record(join_tab); // Restore current record
11286
reset_cache_write(&join_tab->cache);
11287
if (error > 0) // Fatal error
11288
return NESTED_LOOP_ERROR; /* purecov: inspected */
11289
for (JOIN_TAB *tmp2=join->join_tab; tmp2 != join_tab ; tmp2++)
11290
tmp2->table->status=tmp2->status;
11291
return NESTED_LOOP_OK;
11294
int safe_index_read(JOIN_TAB *tab)
3362
11297
Table *table= tab->table;
3363
if ((error=table->cursor->index_read_map(table->getInsertRecord(),
11298
if ((error=table->file->index_read_map(table->record[0],
3364
11299
tab->ref.key_buff,
3365
11300
make_prev_keypart_map(tab->ref.key_parts),
3366
11301
HA_READ_KEY_EXACT)))
6256
static void print_table_array(Session *session, String *str, TableList **table,
15359
/** Allocate memory needed for other rollup functions. */
15361
bool JOIN::rollup_init()
15366
tmp_table_param.quick_group= 0; // Can't create groups in tmp table
15367
rollup.state= ROLLUP::STATE_INITED;
15370
Create pointers to the different sum function groups
15371
These are updated by rollup_make_fields()
15373
tmp_table_param.group_parts= send_group_parts;
15375
if (!(rollup.null_items= (Item_null_result**) thd->alloc((sizeof(Item*) +
15377
sizeof(List<Item>) +
15378
ref_pointer_array_size)
15379
* send_group_parts )))
15382
rollup.fields= (List<Item>*) (rollup.null_items + send_group_parts);
15383
rollup.ref_pointer_arrays= (Item***) (rollup.fields + send_group_parts);
15384
ref_array= (Item**) (rollup.ref_pointer_arrays+send_group_parts);
15387
Prepare space for field list for the different levels
15388
These will be filled up in rollup_make_fields()
15390
for (i= 0 ; i < send_group_parts ; i++)
15392
rollup.null_items[i]= new (thd->mem_root) Item_null_result();
15393
List<Item> *rollup_fields= &rollup.fields[i];
15394
rollup_fields->empty();
15395
rollup.ref_pointer_arrays[i]= ref_array;
15396
ref_array+= all_fields.elements;
15398
for (i= 0 ; i < send_group_parts; i++)
15400
for (j=0 ; j < fields_list.elements ; j++)
15401
rollup.fields[i].push_back(rollup.null_items[i]);
15403
List_iterator<Item> it(all_fields);
15405
while ((item= it++))
15407
order_st *group_tmp;
15408
bool found_in_group= 0;
15410
for (group_tmp= group_list; group_tmp; group_tmp= group_tmp->next)
15412
if (*group_tmp->item == item)
15414
item->maybe_null= 1;
15416
if (item->const_item())
15419
For ROLLUP queries each constant item referenced in GROUP BY list
15420
is wrapped up into an Item_func object yielding the same value
15421
as the constant item. The objects of the wrapper class are never
15422
considered as constant items and besides they inherit all
15423
properties of the Item_result_field class.
15424
This wrapping allows us to ensure writing constant items
15425
into temporary tables whenever the result of the ROLLUP
15426
operation has to be written into a temporary table, e.g. when
15427
ROLLUP is used together with DISTINCT in the SELECT list.
15428
Usually when creating temporary tables for a intermidiate
15429
result we do not include fields for constant expressions.
15431
Item* new_item= new Item_func_rollup_const(item);
15434
new_item->fix_fields(thd, (Item **) 0);
15435
thd->change_item_tree(it.ref(), new_item);
15436
for (order_st *tmp= group_tmp; tmp; tmp= tmp->next)
15438
if (*tmp->item == item)
15439
thd->change_item_tree(tmp->item, new_item);
15444
if (item->type() == Item::FUNC_ITEM && !found_in_group)
15446
bool changed= false;
15447
if (change_group_ref(thd, (Item_func *) item, group_list, &changed))
15450
We have to prevent creation of a field in a temporary table for
15451
an expression that contains GROUP BY attributes.
15452
Marking the expression item as 'with_sum_func' will ensure this.
15455
item->with_sum_func= 1;
15463
Fill up rollup structures with pointers to fields to use.
15465
Creates copies of item_sum items for each sum level.
15467
@param fields_arg List of all fields (hidden and real ones)
15468
@param sel_fields Pointer to selected fields
15469
@param func Store here a pointer to all fields
15473
In this case func is pointing to next not used element.
15478
bool JOIN::rollup_make_fields(List<Item> &fields_arg, List<Item> &sel_fields,
15481
List_iterator_fast<Item> it(fields_arg);
15482
Item *first_field= sel_fields.head();
15486
Create field lists for the different levels
15488
The idea here is to have a separate field list for each rollup level to
15489
avoid all runtime checks of which columns should be NULL.
15491
The list is stored in reverse order to get sum function in such an order
15492
in func that it makes it easy to reset them with init_sum_functions()
15494
Assuming: SELECT a, b, c SUM(b) FROM t1 GROUP BY a,b WITH ROLLUP
15496
rollup.fields[0] will contain list where a,b,c is NULL
15497
rollup.fields[1] will contain list where b,c is NULL
15499
rollup.ref_pointer_array[#] points to fields for rollup.fields[#]
15501
sum_funcs_end[0] points to all sum functions
15502
sum_funcs_end[1] points to all sum functions, except grand totals
15506
for (level=0 ; level < send_group_parts ; level++)
15509
uint pos= send_group_parts - level -1;
15510
bool real_fields= 0;
15512
List_iterator<Item> new_it(rollup.fields[pos]);
15513
Item **ref_array_start= rollup.ref_pointer_arrays[pos];
15514
order_st *start_group;
15516
/* Point to first hidden field */
15517
Item **ref_array= ref_array_start + fields_arg.elements-1;
15519
/* Remember where the sum functions ends for the previous level */
15520
sum_funcs_end[pos+1]= *func;
15522
/* Find the start of the group for this level */
15523
for (i= 0, start_group= group_list ;
15525
start_group= start_group->next)
15529
while ((item= it++))
15531
if (item == first_field)
15533
real_fields= 1; // End of hidden fields
15534
ref_array= ref_array_start;
15537
if (item->type() == Item::SUM_FUNC_ITEM && !item->const_item() &&
15538
(!((Item_sum*) item)->depended_from() ||
15539
((Item_sum *)item)->depended_from() == select_lex))
15543
This is a top level summary function that must be replaced with
15544
a sum function that is reset for this level.
15546
NOTE: This code creates an object which is not that nice in a
15547
sub select. Fortunately it's not common to have rollup in
15550
item= item->copy_or_same(thd);
15551
((Item_sum*) item)->make_unique();
15552
*(*func)= (Item_sum*) item;
15557
/* Check if this is something that is part of this group by */
15558
order_st *group_tmp;
15559
for (group_tmp= start_group, i= pos ;
15560
group_tmp ; group_tmp= group_tmp->next, i++)
15562
if (*group_tmp->item == item)
15565
This is an element that is used by the GROUP BY and should be
15566
set to NULL in this level
15568
Item_null_result *null_item= new (thd->mem_root) Item_null_result();
15571
item->maybe_null= 1; // Value will be null sometimes
15572
null_item->result_field= item->get_tmp_table_field();
15581
(void) new_it++; // Point to next item
15582
new_it.replace(item); // Replace previous
15589
sum_funcs_end[0]= *func; // Point to last function
15594
Send all rollup levels higher than the current one to the client.
15598
SELECT a, b, c SUM(b) FROM t1 GROUP BY a,b WITH ROLLUP
15601
@param idx Level we are on:
15602
- 0 = Total sum level
15603
- 1 = First group changed (a)
15604
- 2 = Second group changed (a,b)
15609
1 If send_data_failed()
15612
int JOIN::rollup_send_data(uint idx)
15615
for (i= send_group_parts ; i-- > idx ; )
15617
/* Get reference pointers to sum functions in place */
15618
memcpy(ref_pointer_array, rollup.ref_pointer_arrays[i],
15619
ref_pointer_array_size);
15620
if ((!having || having->val_int()))
15622
if (send_records < unit->select_limit_cnt && do_send_rows &&
15623
result->send_data(rollup.fields[i]))
15628
/* Restore ref_pointer_array */
15629
set_items_ref_array(current_ref_pointer_array);
15634
Write all rollup levels higher than the current one to a temp table.
15638
SELECT a, b, SUM(c) FROM t1 GROUP BY a,b WITH ROLLUP
15641
@param idx Level we are on:
15642
- 0 = Total sum level
15643
- 1 = First group changed (a)
15644
- 2 = Second group changed (a,b)
15645
@param table reference to temp table
15650
1 if write_data_failed()
15653
int JOIN::rollup_write_data(uint idx, Table *table_arg)
15656
for (i= send_group_parts ; i-- > idx ; )
15658
/* Get reference pointers to sum functions in place */
15659
memcpy(ref_pointer_array, rollup.ref_pointer_arrays[i],
15660
ref_pointer_array_size);
15661
if ((!having || having->val_int()))
15665
List_iterator_fast<Item> it(rollup.fields[i]);
15666
while ((item= it++))
15668
if (item->type() == Item::NULL_ITEM && item->is_result_field())
15669
item->save_in_result_field(1);
15671
copy_sum_funcs(sum_funcs_end[i+1], sum_funcs_end[i]);
15672
if ((write_error= table_arg->file->ha_write_row(table_arg->record[0])))
15674
if (create_myisam_from_heap(thd, table_arg,
15675
tmp_table_param.start_recinfo,
15676
&tmp_table_param.recinfo,
15682
/* Restore ref_pointer_array */
15683
set_items_ref_array(current_ref_pointer_array);
15688
clear results if there are not rows found for group
15689
(end_send_group/end_write_group)
15694
clear_tables(this);
15695
copy_fields(&tmp_table_param);
15699
Item_sum *func, **func_ptr= sum_funcs;
15700
while ((func= *(func_ptr++)))
15708
Send a description about what how the select will be done to stdout.
15711
void select_describe(JOIN *join, bool need_tmp_table, bool need_order,
15712
bool distinct,const char *message)
15714
List<Item> field_list;
15715
List<Item> item_list;
15716
THD *thd=join->thd;
15717
select_result *result=join->result;
15718
Item *item_null= new Item_null();
15719
const CHARSET_INFO * const cs= system_charset_info;
15721
/* Don't log this into the slow query log */
15722
thd->server_status&= ~(SERVER_QUERY_NO_INDEX_USED | SERVER_QUERY_NO_GOOD_INDEX_USED);
15723
join->unit->offset_limit_cnt= 0;
15726
NOTE: the number/types of items pushed into item_list must be in sync with
15727
EXPLAIN column types as they're "defined" in THD::send_explain_fields()
15731
item_list.push_back(new Item_int((int32_t)
15732
join->select_lex->select_number));
15733
item_list.push_back(new Item_string(join->select_lex->type,
15734
strlen(join->select_lex->type), cs));
15735
for (uint i=0 ; i < 7; i++)
15736
item_list.push_back(item_null);
15737
if (join->thd->lex->describe & DESCRIBE_EXTENDED)
15738
item_list.push_back(item_null);
15740
item_list.push_back(new Item_string(message,strlen(message),cs));
15741
if (result->send_data(item_list))
15744
else if (join->select_lex == join->unit->fake_select_lex)
15747
here we assume that the query will return at least two rows, so we
15748
show "filesort" in EXPLAIN. Of course, sometimes we'll be wrong
15749
and no filesort will be actually done, but executing all selects in
15750
the UNION to provide precise EXPLAIN information will hardly be
15753
char table_name_buffer[NAME_LEN];
15756
item_list.push_back(new Item_null);
15758
item_list.push_back(new Item_string(join->select_lex->type,
15759
strlen(join->select_lex->type),
15763
SELECT_LEX *sl= join->unit->first_select();
15764
uint len= 6, lastop= 0;
15765
memcpy(table_name_buffer, STRING_WITH_LEN("<union"));
15766
for (; sl && len + lastop + 5 < NAME_LEN; sl= sl->next_select())
15769
lastop= snprintf(table_name_buffer + len, NAME_LEN - len,
15770
"%u,", sl->select_number);
15772
if (sl || len + lastop >= NAME_LEN)
15774
memcpy(table_name_buffer + len, STRING_WITH_LEN("...>") + 1);
15780
table_name_buffer[len - 1]= '>'; // change ',' to '>'
15782
item_list.push_back(new Item_string(table_name_buffer, len, cs));
15785
item_list.push_back(new Item_string(join_type_str[JT_ALL],
15786
strlen(join_type_str[JT_ALL]),
15788
/* possible_keys */
15789
item_list.push_back(item_null);
15791
item_list.push_back(item_null);
15793
item_list.push_back(item_null);
15795
item_list.push_back(item_null);
15797
if (join->thd->lex->describe & DESCRIBE_EXTENDED)
15798
item_list.push_back(item_null);
15800
item_list.push_back(item_null);
15802
if (join->unit->global_parameters->order_list.first)
15803
item_list.push_back(new Item_string("Using filesort",
15806
item_list.push_back(new Item_string("", 0, cs));
15808
if (result->send_data(item_list))
15813
table_map used_tables=0;
15814
for (uint i=0 ; i < join->tables ; i++)
15816
JOIN_TAB *tab=join->join_tab+i;
15817
Table *table=tab->table;
15818
TableList *table_list= tab->table->pos_in_table_list;
15820
char buff1[512], buff2[512], buff3[512];
15821
char keylen_str_buf[64];
15822
String extra(buff, sizeof(buff),cs);
15823
char table_name_buffer[NAME_LEN];
15824
String tmp1(buff1,sizeof(buff1),cs);
15825
String tmp2(buff2,sizeof(buff2),cs);
15826
String tmp3(buff3,sizeof(buff3),cs);
15835
item_list.push_back(new Item_uint((uint32_t)
15836
join->select_lex->select_number));
15838
item_list.push_back(new Item_string(join->select_lex->type,
15839
strlen(join->select_lex->type),
15841
if (tab->type == JT_ALL && tab->select && tab->select->quick)
15843
quick_type= tab->select->quick->get_type();
15844
if ((quick_type == QUICK_SELECT_I::QS_TYPE_INDEX_MERGE) ||
15845
(quick_type == QUICK_SELECT_I::QS_TYPE_ROR_INTERSECT) ||
15846
(quick_type == QUICK_SELECT_I::QS_TYPE_ROR_UNION))
15847
tab->type = JT_INDEX_MERGE;
15849
tab->type = JT_RANGE;
15852
if (table->derived_select_number)
15854
/* Derived table name generation */
15855
int len= snprintf(table_name_buffer, sizeof(table_name_buffer)-1,
15857
table->derived_select_number);
15858
item_list.push_back(new Item_string(table_name_buffer, len, cs));
15862
TableList *real_table= table->pos_in_table_list;
15863
item_list.push_back(new Item_string(real_table->alias,
15864
strlen(real_table->alias),
15867
/* "type" column */
15868
item_list.push_back(new Item_string(join_type_str[tab->type],
15869
strlen(join_type_str[tab->type]),
15871
/* Build "possible_keys" value and add it to item_list */
15872
if (!tab->keys.is_clear_all())
15875
for (j=0 ; j < table->s->keys ; j++)
15877
if (tab->keys.is_set(j))
15881
tmp1.append(table->key_info[j].name,
15882
strlen(table->key_info[j].name),
15883
system_charset_info);
15888
item_list.push_back(new Item_string(tmp1.ptr(),tmp1.length(),cs));
15890
item_list.push_back(item_null);
15892
/* Build "key", "key_len", and "ref" values and add them to item_list */
15893
if (tab->ref.key_parts)
15895
KEY *key_info=table->key_info+ tab->ref.key;
15896
register uint length;
15897
item_list.push_back(new Item_string(key_info->name,
15898
strlen(key_info->name),
15899
system_charset_info));
15900
length= int64_t2str(tab->ref.key_length, keylen_str_buf, 10) -
15902
item_list.push_back(new Item_string(keylen_str_buf, length,
15903
system_charset_info));
15904
for (store_key **ref=tab->ref.key_copy ; *ref ; ref++)
15908
tmp2.append((*ref)->name(), strlen((*ref)->name()),
15909
system_charset_info);
15911
item_list.push_back(new Item_string(tmp2.ptr(),tmp2.length(),cs));
15913
else if (tab->type == JT_NEXT)
15915
KEY *key_info=table->key_info+ tab->index;
15916
register uint length;
15917
item_list.push_back(new Item_string(key_info->name,
15918
strlen(key_info->name),cs));
15919
length= int64_t2str(key_info->key_length, keylen_str_buf, 10) -
15921
item_list.push_back(new Item_string(keylen_str_buf,
15923
system_charset_info));
15924
item_list.push_back(item_null);
15926
else if (tab->select && tab->select->quick)
15928
tab->select->quick->add_keys_and_lengths(&tmp2, &tmp3);
15929
item_list.push_back(new Item_string(tmp2.ptr(),tmp2.length(),cs));
15930
item_list.push_back(new Item_string(tmp3.ptr(),tmp3.length(),cs));
15931
item_list.push_back(item_null);
15935
if (table_list->schema_table && table_list->schema_table->i_s_requested_object & OPTIMIZE_I_S_TABLE)
15937
const char *tmp_buff;
15939
if (table_list->has_db_lookup_value)
15941
f_idx= table_list->schema_table->idx_field1;
15942
tmp_buff= table_list->schema_table->fields_info[f_idx].field_name;
15943
tmp2.append(tmp_buff, strlen(tmp_buff), cs);
15945
if (table_list->has_table_lookup_value)
15947
if (table_list->has_db_lookup_value)
15949
f_idx= table_list->schema_table->idx_field2;
15950
tmp_buff= table_list->schema_table->fields_info[f_idx].field_name;
15951
tmp2.append(tmp_buff, strlen(tmp_buff), cs);
15954
item_list.push_back(new Item_string(tmp2.ptr(),tmp2.length(),cs));
15956
item_list.push_back(item_null);
15959
item_list.push_back(item_null);
15960
item_list.push_back(item_null);
15961
item_list.push_back(item_null);
15964
/* Add "rows" field to item_list. */
15965
if (table_list->schema_table)
15968
if (join->thd->lex->describe & DESCRIBE_EXTENDED)
15969
item_list.push_back(item_null);
15971
item_list.push_back(item_null);
15975
double examined_rows;
15976
if (tab->select && tab->select->quick)
15977
examined_rows= rows2double(tab->select->quick->records);
15978
else if (tab->type == JT_NEXT || tab->type == JT_ALL)
15979
examined_rows= rows2double(tab->limit ? tab->limit :
15980
tab->table->file->records());
15982
examined_rows= join->best_positions[i].records_read;
15984
item_list.push_back(new Item_int((int64_t) (uint64_t) examined_rows,
15985
MY_INT64_NUM_DECIMAL_DIGITS));
15987
/* Add "filtered" field to item_list. */
15988
if (join->thd->lex->describe & DESCRIBE_EXTENDED)
15992
f= (float) (100.0 * join->best_positions[i].records_read /
15994
item_list.push_back(new Item_float(f, 2));
15998
/* Build "Extra" field and add it to item_list. */
15999
bool key_read=table->key_read;
16000
if ((tab->type == JT_NEXT || tab->type == JT_CONST) &&
16001
table->covering_keys.is_set(tab->index))
16003
if (quick_type == QUICK_SELECT_I::QS_TYPE_ROR_INTERSECT &&
16004
!((QUICK_ROR_INTERSECT_SELECT*)tab->select->quick)->need_to_fetch_row)
16008
item_list.push_back(new Item_string(tab->info,strlen(tab->info),cs));
16009
else if (tab->packed_info & TAB_INFO_HAVE_VALUE)
16011
if (tab->packed_info & TAB_INFO_USING_INDEX)
16012
extra.append(STRING_WITH_LEN("; Using index"));
16013
if (tab->packed_info & TAB_INFO_USING_WHERE)
16014
extra.append(STRING_WITH_LEN("; Using where"));
16015
if (tab->packed_info & TAB_INFO_FULL_SCAN_ON_NULL)
16016
extra.append(STRING_WITH_LEN("; Full scan on NULL key"));
16017
/* Skip initial "; "*/
16018
const char *str= extra.ptr();
16019
uint32_t len= extra.length();
16025
item_list.push_back(new Item_string(str, len, cs));
16029
uint keyno= MAX_KEY;
16030
if (tab->ref.key_parts)
16031
keyno= tab->ref.key;
16032
else if (tab->select && tab->select->quick)
16033
keyno = tab->select->quick->index;
16035
if (keyno != MAX_KEY && keyno == table->file->pushed_idx_cond_keyno &&
16036
table->file->pushed_idx_cond)
16037
extra.append(STRING_WITH_LEN("; Using index condition"));
16039
if (quick_type == QUICK_SELECT_I::QS_TYPE_ROR_UNION ||
16040
quick_type == QUICK_SELECT_I::QS_TYPE_ROR_INTERSECT ||
16041
quick_type == QUICK_SELECT_I::QS_TYPE_INDEX_MERGE)
16043
extra.append(STRING_WITH_LEN("; Using "));
16044
tab->select->quick->add_info_string(&extra);
16048
if (tab->use_quick == 2)
16050
/* 4 bits per 1 hex digit + terminating '\0' */
16051
char buf[MAX_KEY / 4 + 1];
16052
extra.append(STRING_WITH_LEN("; Range checked for each "
16053
"record (index map: 0x"));
16054
extra.append(tab->keys.print(buf));
16057
else if (tab->select->cond)
16059
const COND *pushed_cond= tab->table->file->pushed_cond;
16061
if (thd->variables.engine_condition_pushdown && pushed_cond)
16063
extra.append(STRING_WITH_LEN("; Using where with pushed "
16065
if (thd->lex->describe & DESCRIBE_EXTENDED)
16067
extra.append(STRING_WITH_LEN(": "));
16068
((COND *)pushed_cond)->print(&extra, QT_ORDINARY);
16072
extra.append(STRING_WITH_LEN("; Using where"));
16077
if (quick_type == QUICK_SELECT_I::QS_TYPE_GROUP_MIN_MAX)
16078
extra.append(STRING_WITH_LEN("; Using index for group-by"));
16080
extra.append(STRING_WITH_LEN("; Using index"));
16082
if (table->reginfo.not_exists_optimize)
16083
extra.append(STRING_WITH_LEN("; Not exists"));
16085
if (quick_type == QUICK_SELECT_I::QS_TYPE_RANGE &&
16086
!(((QUICK_RANGE_SELECT*)(tab->select->quick))->mrr_flags &
16087
HA_MRR_USE_DEFAULT_IMPL))
16089
extra.append(STRING_WITH_LEN("; Using MRR"));
16092
if (table_list->schema_table &&
16093
table_list->schema_table->i_s_requested_object & OPTIMIZE_I_S_TABLE)
16095
if (!table_list->table_open_method)
16096
extra.append(STRING_WITH_LEN("; Skip_open_table"));
16097
else if (table_list->table_open_method == OPEN_FRM_ONLY)
16098
extra.append(STRING_WITH_LEN("; Open_frm_only"));
16100
extra.append(STRING_WITH_LEN("; Open_full_table"));
16101
if (table_list->has_db_lookup_value &&
16102
table_list->has_table_lookup_value)
16103
extra.append(STRING_WITH_LEN("; Scanned 0 databases"));
16104
else if (table_list->has_db_lookup_value ||
16105
table_list->has_table_lookup_value)
16106
extra.append(STRING_WITH_LEN("; Scanned 1 database"));
16108
extra.append(STRING_WITH_LEN("; Scanned all databases"));
16110
if (need_tmp_table)
16113
extra.append(STRING_WITH_LEN("; Using temporary"));
16118
extra.append(STRING_WITH_LEN("; Using filesort"));
16120
if (distinct & test_all_bits(used_tables,thd->used_tables))
16121
extra.append(STRING_WITH_LEN("; Distinct"));
16123
if (tab->insideout_match_tab)
16125
extra.append(STRING_WITH_LEN("; LooseScan"));
16128
if (tab->flush_weedout_table)
16129
extra.append(STRING_WITH_LEN("; Start temporary"));
16130
else if (tab->check_weed_out_table)
16131
extra.append(STRING_WITH_LEN("; End temporary"));
16132
else if (tab->do_firstmatch)
16134
extra.append(STRING_WITH_LEN("; FirstMatch("));
16135
Table *prev_table=tab->do_firstmatch->table;
16136
if (prev_table->derived_select_number)
16138
char namebuf[NAME_LEN];
16139
/* Derived table name generation */
16140
int len= snprintf(namebuf, sizeof(namebuf)-1,
16142
prev_table->derived_select_number);
16143
extra.append(namebuf, len);
16146
extra.append(prev_table->pos_in_table_list->alias);
16147
extra.append(STRING_WITH_LEN(")"));
16150
for (uint part= 0; part < tab->ref.key_parts; part++)
16152
if (tab->ref.cond_guards[part])
16154
extra.append(STRING_WITH_LEN("; Full scan on NULL key"));
16159
if (i > 0 && tab[-1].next_select == sub_select_cache)
16160
extra.append(STRING_WITH_LEN("; Using join buffer"));
16162
/* Skip initial "; "*/
16163
const char *str= extra.ptr();
16164
uint32_t len= extra.length();
16170
item_list.push_back(new Item_string(str, len, cs));
16172
// For next iteration
16173
used_tables|=table->map;
16174
if (result->send_data(item_list))
16178
for (SELECT_LEX_UNIT *unit= join->select_lex->first_inner_unit();
16180
unit= unit->next_unit())
16182
if (mysql_explain_union(thd, unit, result))
16189
bool mysql_explain_union(THD *thd, SELECT_LEX_UNIT *unit, select_result *result)
16192
SELECT_LEX *first= unit->first_select();
16194
for (SELECT_LEX *sl= first;
16196
sl= sl->next_select())
16198
// drop UNCACHEABLE_EXPLAIN, because it is for internal usage only
16199
uint8_t uncacheable= (sl->uncacheable & ~UNCACHEABLE_EXPLAIN);
16200
sl->type= (((&thd->lex->select_lex)==sl)?
16201
(sl->first_inner_unit() || sl->next_select() ?
16202
"PRIMARY" : "SIMPLE"):
16204
((sl->linkage == DERIVED_TABLE_TYPE) ?
16206
((uncacheable & UNCACHEABLE_DEPENDENT) ?
16207
"DEPENDENT SUBQUERY":
16208
(uncacheable?"UNCACHEABLE SUBQUERY":
16210
((uncacheable & UNCACHEABLE_DEPENDENT) ?
16212
uncacheable?"UNCACHEABLE UNION":
16214
sl->options|= SELECT_DESCRIBE;
16216
if (unit->is_union())
16218
unit->fake_select_lex->select_number= UINT_MAX; // jost for initialization
16219
unit->fake_select_lex->type= "UNION RESULT";
16220
unit->fake_select_lex->options|= SELECT_DESCRIBE;
16221
if (!(res= unit->prepare(thd, result, SELECT_NO_UNLOCK | SELECT_DESCRIBE)))
16223
res|= unit->cleanup();
16227
thd->lex->current_select= first;
16228
unit->set_limit(unit->global_parameters);
16229
res= mysql_select(thd, &first->ref_pointer_array,
16230
(TableList*) first->table_list.first,
16231
first->with_wild, first->item_list,
16233
first->order_list.elements +
16234
first->group_list.elements,
16235
(order_st*) first->order_list.first,
16236
(order_st*) first->group_list.first,
16238
(order_st*) thd->lex->proc_list.first,
16239
first->options | thd->options | SELECT_DESCRIBE,
16240
result, unit, first);
16242
return(res || thd->is_error());
16246
static void print_table_array(THD *thd, String *str, TableList **table,
6257
16247
TableList **end)
6259
(*table)->print(session, str, QT_ORDINARY);
16249
(*table)->print(thd, str, QT_ORDINARY);
6261
16251
for (TableList **tbl= table + 1; tbl < end; tbl++)