~drizzle-trunk/drizzle/development

1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1
/* - mode: c; c-basic-offset: 2; indent-tabs-mode: nil; -*-
2
 *  vim:expandtab:shiftwidth=2:tabstop=2:smarttab:
3
 *
4
 *  Copyright (C) 2008-2009 Sun Microsystems
5
 *
6
 *  This program is free software; you can redistribute it and/or modify
7
 *  it under the terms of the GNU General Public License as published by
8
 *  the Free Software Foundation; either version 2 of the License, or
9
 *  (at your option) any later version.
10
 *
11
 *  This program is distributed in the hope that it will be useful,
12
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
13
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14
 *  GNU General Public License for more details.
15
 *
16
 *  You should have received a copy of the GNU General Public License
17
 *  along with this program; if not, write to the Free Software
18
 *  Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
19
 */
20
21
/**
22
 * @file
23
 *
1541.1.1 by Brian Aker
JOIN -> Join rename
24
 * Implementation of the Join class
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
25
 * 
26
 * @defgroup Query_Optimizer  Query Optimizer
27
 * @{
28
 */
29
1241.9.36 by Monty Taylor
ZOMG. I deleted drizzled/server_includes.h.
30
#include "config.h"
1241.9.1 by Monty Taylor
Removed global.h. Fixed all the headers.
31
32
#include <float.h>
33
#include <math.h>
34
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
35
#include "drizzled/item/cache.h"
36
#include "drizzled/item/cmpfunc.h"
37
#include "drizzled/item/copy_string.h"
38
#include "drizzled/item/uint.h"
39
#include "drizzled/cached_item.h"
40
#include "drizzled/sql_base.h"
41
#include "drizzled/sql_select.h" /* include join.h */
42
#include "drizzled/lock.h"
43
#include "drizzled/nested_join.h"
44
#include "drizzled/join.h"
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
45
#include "drizzled/join_cache.h"
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
46
#include "drizzled/show.h"
47
#include "drizzled/field/blob.h"
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
48
#include "drizzled/optimizer/position.h"
1108.6.39 by Padraig O'Sullivan
Placed the SargableParam class in the optimizer namespace and sub-directory.
49
#include "drizzled/optimizer/sargable_param.h"
1108.6.56 by Padraig O'Sullivan
Extracted KeyUse into its own header file and placed it within the
50
#include "drizzled/optimizer/key_use.h"
1237.9.2 by Padraig O'Sullivan
Moved opt_range.[cc,h] into the optimizer directory and namespace and renamed the files to
51
#include "drizzled/optimizer/range.h"
1237.9.1 by Padraig O'Sullivan
Moved the opt_sum.cc file into the optimizer directory and renamed it to sum.cc. Added a header file
52
#include "drizzled/optimizer/sum.h"
1240.7.1 by Padraig O'Sullivan
Created an ExplainPlan class in the optimizer namespace. All printing of an explain in drizzle goes
53
#include "drizzled/optimizer/explain_plan.h"
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
54
#include "drizzled/optimizer/access_method_factory.h"
55
#include "drizzled/optimizer/access_method.h"
1237.9.4 by Padraig O'Sullivan
Removed the inclusion of drizzled/field.h in the server_includes header file.
56
#include "drizzled/records.h"
1241.7.6 by Padraig O'Sullivan
Added some dtrace probes for tracing the optimizer.
57
#include "drizzled/probes.h"
1241.9.64 by Monty Taylor
Moved remaining non-public portions of mysys and mystrings to drizzled/internal.
58
#include "drizzled/internal/my_bit.h"
59
#include "drizzled/internal/my_sys.h"
60
#include "drizzled/internal/iocache.h"
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
61
1067.4.4 by Nathan Williams
The rest of the files in the drizzled directory were purged of the cmin macro and replace with std::min (except for the definition in globals.h and 1 usage in stacktrace.cc).
62
#include <algorithm>
63
64
using namespace std;
1280.1.10 by Monty Taylor
Put everything in drizzled into drizzled namespace.
65
66
namespace drizzled
67
{
68
69
extern plugin::StorageEngine *heap_engine;
1241.9.16 by Monty Taylor
Removed global bitsets.
70
extern std::bitset<12> test_flags;
71
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
72
/** Declarations of static functions used in this source file. */
1541.1.1 by Brian Aker
JOIN -> Join rename
73
static bool make_group_fields(Join *main_join, Join *curr_join);
74
static void calc_group_buffer(Join *join,order_st *group);
75
static bool alloc_group_fields(Join *join,order_st *group);
76
static uint32_t cache_record_length(Join *join, uint32_t index);
77
static double prev_record_reads(Join *join, uint32_t idx, table_map found_ref);
78
static bool get_best_combination(Join *join);
79
static void set_position(Join *join,
1108.6.56 by Padraig O'Sullivan
Extracted KeyUse into its own header file and placed it within the
80
                         uint32_t index,
81
                         JoinTable *table,
82
                         optimizer::KeyUse *key);
1541.1.1 by Brian Aker
JOIN -> Join rename
83
static bool choose_plan(Join *join,table_map join_tables);
84
static void best_access_path(Join *join, JoinTable *s,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
85
                             Session *session,
86
                             table_map remaining_tables,
87
                             uint32_t idx,
88
                             double record_count,
89
                             double read_time);
1541.1.1 by Brian Aker
JOIN -> Join rename
90
static void optimize_straight_join(Join *join, table_map join_tables);
91
static bool greedy_search(Join *join, table_map remaining_tables, uint32_t depth, uint32_t prune_level);
92
static bool best_extension_by_limited_search(Join *join,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
93
                                             table_map remaining_tables,
94
                                             uint32_t idx,
95
                                             double record_count,
96
                                             double read_time,
97
                                             uint32_t depth,
98
                                             uint32_t prune_level);
1541.1.1 by Brian Aker
JOIN -> Join rename
99
static uint32_t determine_search_depth(Join* join);
100
static bool make_simple_join(Join *join,Table *tmp_table);
101
static void make_outerjoin_info(Join *join);
102
static bool make_join_select(Join *join, optimizer::SqlSelect *select,COND *item);
103
static bool make_join_readinfo(Join *join);
104
static void update_depend_map(Join *join);
105
static void update_depend_map(Join *join, order_st *order);
106
static order_st *remove_constants(Join *join,order_st *first_order,COND *cond, bool change_list, bool *simple_order);
107
static int return_zero_rows(Join *join,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
108
                            select_result *res,
109
                            TableList *tables,
110
                            List<Item> &fields,
111
                            bool send_row,
112
                            uint64_t select_options,
113
                            const char *info,
114
                            Item *having);
1541.1.1 by Brian Aker
JOIN -> Join rename
115
static COND *simplify_joins(Join *join, List<TableList> *join_list, COND *conds, bool top);
116
static int remove_duplicates(Join *join,Table *entry,List<Item> &fields, Item *having);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
117
static int setup_without_group(Session *session, 
118
                               Item **ref_pointer_array,
119
                               TableList *tables,
120
                               TableList *,
121
                               List<Item> &fields,
122
                               List<Item> &all_fields,
123
                               COND **conds,
124
                               order_st *order,
125
                               order_st *group,
126
                               bool *hidden_group_fields);
1541.1.1 by Brian Aker
JOIN -> Join rename
127
static bool make_join_statistics(Join *join, TableList *leaves, COND *conds, DYNAMIC_ARRAY *keyuse);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
128
static uint32_t build_bitmap_for_nested_joins(List<TableList> *join_list, uint32_t first_unused);
129
static Table *get_sort_by_table(order_st *a,order_st *b,TableList *tables);
130
static void reset_nj_counters(List<TableList> *join_list);
131
static bool test_if_subpart(order_st *a,order_st *b);
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
132
static void restore_prev_nj_state(JoinTable *last);
133
static bool add_ref_to_table_cond(Session *session, JoinTable *join_tab);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
134
static void free_blobs(Field **ptr); /* Rename this method...conflicts with another in global namespace... */
135
136
/**
137
  Prepare of whole select (including sub queries in future).
138
139
  @todo
140
    Add check of calculation of GROUP functions and fields:
141
    SELECT COUNT(*)+table.col1 from table1;
142
143
  @retval
144
    -1   on error
145
  @retval
146
    0   on success
147
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
148
int Join::prepare(Item ***rref_pointer_array,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
149
                  TableList *tables_init,
150
                  uint32_t wild_num,
151
                  COND *conds_init,
152
                  uint32_t og_num,
153
                  order_st *order_init,
154
                  order_st *group_init,
155
                  Item *having_init,
156
                  Select_Lex *select_lex_arg,
157
                  Select_Lex_Unit *unit_arg)
158
{
159
  // to prevent double initialization on EXPLAIN
160
  if (optimized)
161
    return 0;
162
163
  conds= conds_init;
164
  order= order_init;
165
  group_list= group_init;
166
  having= having_init;
167
  tables_list= tables_init;
168
  select_lex= select_lex_arg;
169
  select_lex->join= this;
170
  join_list= &select_lex->top_join_list;
171
  union_part= unit_arg->is_union();
172
173
  session->lex->current_select->is_item_list_lookup= 1;
174
  /*
175
    If we have already executed SELECT, then it have not sense to prevent
176
    its table from update (see unique_table())
177
  */
178
  if (session->derived_tables_processing)
179
    select_lex->exclude_from_table_unique_test= true;
180
181
  /* Check that all tables, fields, conds and order are ok */
182
183
  if (!(select_options & OPTION_SETUP_TABLES_DONE) &&
184
      setup_tables_and_check_access(session, &select_lex->context, join_list,
185
                                    tables_list, &select_lex->leaf_tables,
186
                                    false))
1637.1.3 by Brian Aker
This fixes the parser to no longer do the bad syntax around the cross join
187
  {
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
188
      return(-1);
1637.1.3 by Brian Aker
This fixes the parser to no longer do the bad syntax around the cross join
189
  }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
190
191
  TableList *table_ptr;
192
  for (table_ptr= select_lex->leaf_tables;
193
       table_ptr;
194
       table_ptr= table_ptr->next_leaf)
195
    tables++;
196
197
  if (setup_wild(session, fields_list, &all_fields, wild_num) ||
198
      select_lex->setup_ref_array(session, og_num) ||
199
      setup_fields(session, (*rref_pointer_array), fields_list, MARK_COLUMNS_READ,
200
       &all_fields, 1) ||
201
      setup_without_group(session, (*rref_pointer_array), tables_list,
202
        select_lex->leaf_tables, fields_list,
203
        all_fields, &conds, order, group_list,
204
        &hidden_group_fields))
971.6.11 by Eric Day
Removed purecov messages.
205
    return(-1);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
206
207
  ref_pointer_array= *rref_pointer_array;
208
209
  if (having)
210
  {
211
    nesting_map save_allow_sum_func= session->lex->allow_sum_func;
212
    session->where="having clause";
213
    session->lex->allow_sum_func|= 1 << select_lex_arg->nest_level;
214
    select_lex->having_fix_field= 1;
215
    bool having_fix_rc= (!having->fixed &&
216
       (having->fix_fields(session, &having) ||
217
        having->check_cols(1)));
218
    select_lex->having_fix_field= 0;
219
    if (having_fix_rc || session->is_error())
971.6.11 by Eric Day
Removed purecov messages.
220
      return(-1);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
221
    session->lex->allow_sum_func= save_allow_sum_func;
222
  }
223
224
  {
225
    Item_subselect *subselect;
226
    Item_in_subselect *in_subs= NULL;
227
    /*
228
      Are we in a subquery predicate?
229
      TODO: the block below will be executed for every PS execution without need.
230
    */
231
    if ((subselect= select_lex->master_unit()->item))
232
    {
233
      if (subselect->substype() == Item_subselect::IN_SUBS)
234
        in_subs= (Item_in_subselect*)subselect;
235
236
      {
1280.1.3 by Brian Aker
Fixing test cases/removed dead optimizer switches.
237
        bool do_materialize= true;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
238
        /*
239
          Check if the subquery predicate can be executed via materialization.
240
          The required conditions are:
241
          1. Subquery predicate is an IN/=ANY subq predicate
242
          2. Subquery is a single SELECT (not a UNION)
243
          3. Subquery is not a table-less query. In this case there is no
244
             point in materializing.
245
          4. Subquery predicate is a top-level predicate
246
             (this implies it is not negated)
247
             TODO: this is a limitation that should be lifeted once we
248
             implement correct NULL semantics (WL#3830)
249
          5. Subquery is non-correlated
250
             TODO:
251
             This is an overly restrictive condition. It can be extended to:
252
             (Subquery is non-correlated ||
253
              Subquery is correlated to any query outer to IN predicate ||
254
              (Subquery is correlated to the immediate outer query &&
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
255
               Subquery !contains {GROUP BY, ORDER BY [LIMIT],
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
256
               aggregate functions) && subquery predicate is not under "NOT IN"))
257
          6. No execution method was already chosen (by a prepared statement).
258
259
          (*) The subquery must be part of a SELECT statement. The current
260
               condition also excludes multi-table update statements.
261
262
          We have to determine whether we will perform subquery materialization
263
          before calling the IN=>EXISTS transformation, so that we know whether to
264
          perform the whole transformation or only that part of it which wraps
265
          Item_in_subselect in an Item_in_optimizer.
266
        */
267
        if (do_materialize &&
268
            in_subs  &&                                                   // 1
269
            !select_lex->master_unit()->first_select()->next_select() &&  // 2
270
            select_lex->master_unit()->first_select()->leaf_tables &&     // 3
271
            session->lex->sql_command == SQLCOM_SELECT)                       // *
272
        {
273
          if (in_subs->is_top_level_item() &&                             // 4
274
              !in_subs->is_correlated &&                                  // 5
275
              in_subs->exec_method == Item_in_subselect::NOT_TRANSFORMED) // 6
276
            in_subs->exec_method= Item_in_subselect::MATERIALIZATION;
277
        }
278
279
        Item_subselect::trans_res trans_res;
280
        if ((trans_res= subselect->select_transformer(this)) !=
281
            Item_subselect::RES_OK)
282
        {
283
          return((trans_res == Item_subselect::RES_ERROR));
284
        }
285
      }
286
    }
287
  }
288
289
  if (order)
290
  {
291
    order_st *ord;
292
    for (ord= order; ord; ord= ord->next)
293
    {
294
      Item *item= *ord->item;
295
      if (item->with_sum_func && item->type() != Item::SUM_FUNC_ITEM)
296
        item->split_sum_func(session, ref_pointer_array, all_fields);
297
    }
298
  }
299
300
  if (having && having->with_sum_func)
301
    having->split_sum_func(session, ref_pointer_array, all_fields,
302
                           &having, true);
303
  if (select_lex->inner_sum_func_list)
304
  {
305
    Item_sum *end=select_lex->inner_sum_func_list;
306
    Item_sum *item_sum= end;
307
    do
308
    {
309
      item_sum= item_sum->next;
310
      item_sum->split_sum_func(session, ref_pointer_array,
311
                               all_fields, item_sum->ref_by, false);
312
    } while (item_sum != end);
313
  }
314
315
  if (select_lex->inner_refs_list.elements &&
316
      fix_inner_refs(session, all_fields, select_lex, ref_pointer_array))
317
    return(-1);
318
319
  /*
320
    Check if there are references to un-aggregated columns when computing
321
    aggregate functions with implicit grouping (there is no GROUP BY).
322
323
    MODE_ONLY_FULL_GROUP_BY is enabled here by default
324
  */
1089.6.3 by Padraig O'Sullivan
Replaced an instance where a uint8_t type was being used to hold a
325
  if (! group_list && 
326
      select_lex->full_group_by_flag.test(NON_AGG_FIELD_USED) &&
327
      select_lex->full_group_by_flag.test(SUM_FUNC_USED))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
328
  {
329
    my_message(ER_MIX_OF_GROUP_FUNC_AND_FIELDS,
330
               ER(ER_MIX_OF_GROUP_FUNC_AND_FIELDS), MYF(0));
331
    return(-1);
332
  }
333
  {
334
    /* Caclulate the number of groups */
335
    send_group_parts= 0;
336
    for (order_st *group_tmp= group_list ; group_tmp ; group_tmp= group_tmp->next)
337
      send_group_parts++;
338
  }
339
340
  if (error)
971.6.11 by Eric Day
Removed purecov messages.
341
    goto err;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
342
1308.2.11 by Jay Pipes
* Adds CREATE TABLE as a specific CreateTableStatement message in the
343
  /* 
344
   * The below will create the new table for
345
   * CREATE TABLE ... SELECT
346
   *
347
   * @see create_table_from_items() in drizzled/sql_insert.cc
348
   */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
349
  if (result && result->prepare(fields_list, unit_arg))
971.6.11 by Eric Day
Removed purecov messages.
350
    goto err;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
351
352
  /* Init join struct */
353
  count_field_types(select_lex, &tmp_table_param, all_fields, 0);
354
  ref_pointer_array_size= all_fields.elements*sizeof(Item*);
355
  this->group= group_list != 0;
356
  unit= unit_arg;
357
358
#ifdef RESTRICTED_GROUP
359
  if (sum_func_count && !group_list && (func_count || field_count))
360
  {
361
    my_message(ER_WRONG_SUM_SELECT,ER(ER_WRONG_SUM_SELECT),MYF(0));
362
    goto err;
363
  }
364
#endif
365
  if (select_lex->olap == ROLLUP_TYPE && rollup_init())
366
    goto err;
367
  if (alloc_func_list())
368
    goto err;
369
370
  return(0); // All OK
371
372
err:
971.6.11 by Eric Day
Removed purecov messages.
373
  return(-1);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
374
}
375
376
/*
377
  Remove the predicates pushed down into the subquery
378
379
  SYNOPSIS
1541.1.1 by Brian Aker
JOIN -> Join rename
380
    Join::remove_subq_pushed_predicates()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
381
      where   IN  Must be NULL
382
              OUT The remaining WHERE condition, or NULL
383
384
  DESCRIPTION
385
    Given that this join will be executed using (unique|index)_subquery,
386
    without "checking NULL", remove the predicates that were pushed down
387
    into the subquery.
388
389
    If the subquery compares scalar values, we can remove the condition that
390
    was wrapped into trig_cond (it will be checked when needed by the subquery
391
    engine)
392
393
    If the subquery compares row values, we need to keep the wrapped
394
    equalities in the WHERE clause: when the left (outer) tuple has both NULL
395
    and non-NULL values, we'll do a full table scan and will rely on the
396
    equalities corresponding to non-NULL parts of left tuple to filter out
397
    non-matching records.
398
399
    TODO: We can remove the equalities that will be guaranteed to be true by the
400
    fact that subquery engine will be using index lookup. This must be done only
401
    for cases where there are no conversion errors of significance, e.g. 257
402
    that is searched in a byte. But this requires homogenization of the return
403
    codes of all Field*::store() methods.
404
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
405
void Join::remove_subq_pushed_predicates(Item **where)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
406
{
407
  if (conds->type() == Item::FUNC_ITEM &&
408
      ((Item_func *)this->conds)->functype() == Item_func::EQ_FUNC &&
409
      ((Item_func *)conds)->arguments()[0]->type() == Item::REF_ITEM &&
410
      ((Item_func *)conds)->arguments()[1]->type() == Item::FIELD_ITEM &&
411
      test_if_ref ((Item_field *)((Item_func *)conds)->arguments()[1],
412
                   ((Item_func *)conds)->arguments()[0]))
413
  {
414
    *where= 0;
415
    return;
416
  }
417
}
418
419
/**
420
  global select optimisation.
421
422
  @note
423
    error code saved in field 'error'
424
425
  @retval
426
    0   success
427
  @retval
428
    1   error
429
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
430
int Join::optimize()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
431
{
432
  // to prevent double initialization on EXPLAIN
433
  if (optimized)
1108.6.58 by Padraig O'Sullivan
Small formatting changes.
434
    return 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
435
  optimized= 1;
436
437
  session->set_proc_info("optimizing");
438
  row_limit= ((select_distinct || order || group_list) ? HA_POS_ERROR :
439
        unit->select_limit_cnt);
440
  /* select_limit is used to decide if we are likely to scan the whole table */
441
  select_limit= unit->select_limit_cnt;
442
  if (having || (select_options & OPTION_FOUND_ROWS))
443
    select_limit= HA_POS_ERROR;
444
  do_send_rows = (unit->select_limit_cnt) ? 1 : 0;
445
  // Ignore errors of execution if option IGNORE present
446
  if (session->lex->ignore)
447
    session->lex->current_select->no_error= 1;
448
449
#ifdef HAVE_REF_TO_FIELDS     // Not done yet
450
  /* Add HAVING to WHERE if possible */
451
  if (having && !group_list && !sum_func_count)
452
  {
453
    if (!conds)
454
    {
455
      conds= having;
456
      having= 0;
457
    }
458
    else if ((conds=new Item_cond_and(conds,having)))
459
    {
460
      /*
461
        Item_cond_and can't be fixed after creation, so we do not check
462
        conds->fixed
463
      */
464
      conds->fix_fields(session, &conds);
465
      conds->change_ref_to_fields(session, tables_list);
466
      conds->top_level_item();
467
      having= 0;
468
    }
469
  }
470
#endif
471
472
  /* Convert all outer joins to inner joins if possible */
1100.2.3 by Brian Aker
Remove final bits on SJ
473
  conds= simplify_joins(this, join_list, conds, true);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
474
  build_bitmap_for_nested_joins(join_list, 0);
475
476
  conds= optimize_cond(this, conds, join_list, &cond_value);
477
  if (session->is_error())
478
  {
479
    error= 1;
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
480
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
481
  }
482
483
  {
484
    having= optimize_cond(this, having, join_list, &having_value);
485
    if (session->is_error())
486
    {
487
      error= 1;
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
488
      return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
489
    }
490
    if (select_lex->where)
491
      select_lex->cond_value= cond_value;
492
    if (select_lex->having)
493
      select_lex->having_value= having_value;
494
495
    if (cond_value == Item::COND_FALSE || having_value == Item::COND_FALSE ||
496
        (!unit->select_limit_cnt && !(select_options & OPTION_FOUND_ROWS)))
497
    {           /* Impossible cond */
498
      zero_result_cause=  having_value == Item::COND_FALSE ?
499
                           "Impossible HAVING" : "Impossible WHERE";
1637.5.3 by Prafulla Tekawade
Reverting the fix for 592473
500
      tables = 0;
1588.1.3 by Stewart Smith
Fix assertion failure on HAVING subquery. Drizzle bug lp:588408 (MySQL bug 46680 - http://bugs.mysql.com/bug.php?id=46680).
501
      goto setup_subq_exit;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
502
    }
503
  }
504
505
  /* Optimize count(*), cmin() and cmax() */
506
  if (tables_list && tmp_table_param.sum_func_count && ! group_list)
507
  {
508
    int res;
509
    /*
1237.9.1 by Padraig O'Sullivan
Moved the opt_sum.cc file into the optimizer directory and renamed it to sum.cc. Added a header file
510
      optimizer::sum_query() returns HA_ERR_KEY_NOT_FOUND if no rows match
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
511
      to the WHERE conditions,
512
      or 1 if all items were resolved,
513
      or 0, or an error number HA_ERR_...
514
    */
1237.9.1 by Padraig O'Sullivan
Moved the opt_sum.cc file into the optimizer directory and renamed it to sum.cc. Added a header file
515
    if ((res= optimizer::sum_query(select_lex->leaf_tables, all_fields, conds)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
516
    {
517
      if (res == HA_ERR_KEY_NOT_FOUND)
518
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
519
        zero_result_cause= "No matching min/max row";
1637.5.3 by Prafulla Tekawade
Reverting the fix for 592473
520
        tables = 0;
1588.1.3 by Stewart Smith
Fix assertion failure on HAVING subquery. Drizzle bug lp:588408 (MySQL bug 46680 - http://bugs.mysql.com/bug.php?id=46680).
521
        goto setup_subq_exit;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
522
      }
523
      if (res > 1)
524
      {
525
        error= res;
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
526
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
527
      }
528
      if (res < 0)
529
      {
530
        zero_result_cause= "No matching min/max row";
1637.5.3 by Prafulla Tekawade
Reverting the fix for 592473
531
        tables = 0;
1588.1.3 by Stewart Smith
Fix assertion failure on HAVING subquery. Drizzle bug lp:588408 (MySQL bug 46680 - http://bugs.mysql.com/bug.php?id=46680).
532
        goto setup_subq_exit;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
533
      }
534
      zero_result_cause= "Select tables optimized away";
535
      tables_list= 0;       // All tables resolved
1637.5.3 by Prafulla Tekawade
Reverting the fix for 592473
536
      const_tables= tables;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
537
      /*
538
        Extract all table-independent conditions and replace the WHERE
1237.9.1 by Padraig O'Sullivan
Moved the opt_sum.cc file into the optimizer directory and renamed it to sum.cc. Added a header file
539
        clause with them. All other conditions were computed by optimizer::sum_query
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
540
        and the MIN/MAX/COUNT function(s) have been replaced by constants,
541
        so there is no need to compute the whole WHERE clause again.
542
        Notice that make_cond_for_table() will always succeed to remove all
1237.9.1 by Padraig O'Sullivan
Moved the opt_sum.cc file into the optimizer directory and renamed it to sum.cc. Added a header file
543
        computed conditions, because optimizer::sum_query() is applicable only to
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
544
        conjunctions.
545
        Preserve conditions for EXPLAIN.
546
      */
547
      if (conds && !(session->lex->describe & DESCRIBE_EXTENDED))
548
      {
549
        COND *table_independent_conds= make_cond_for_table(conds, PSEUDO_TABLE_BITS, 0, 0);
550
        conds= table_independent_conds;
551
      }
1588.1.3 by Stewart Smith
Fix assertion failure on HAVING subquery. Drizzle bug lp:588408 (MySQL bug 46680 - http://bugs.mysql.com/bug.php?id=46680).
552
      goto setup_subq_exit;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
553
    }
554
  }
555
  if (!tables_list)
556
  {
557
    error= 0;
558
    return(0);
559
  }
560
  error= -1;          // Error is sent to client
561
  sort_by_table= get_sort_by_table(order, group_list, select_lex->leaf_tables);
562
563
  /* Calculate how to do the join */
564
  session->set_proc_info("statistics");
565
  if (make_join_statistics(this, select_lex->leaf_tables, conds, &keyuse) ||
566
      session->is_fatal_error)
567
  {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
568
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
569
  }
570
571
  /* Remove distinct if only const tables */
572
  select_distinct= select_distinct && (const_tables != tables);
573
  session->set_proc_info("preparing");
574
  if (result->initialize_tables(this))
575
  {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
576
    return 1;        // error == -1
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
577
  }
578
  if (const_table_map != found_const_table_map &&
579
      !(select_options & SELECT_DESCRIBE) &&
580
      (!conds ||
581
       !(conds->used_tables() & RAND_TABLE_BIT) ||
582
       select_lex->master_unit() == &session->lex->unit)) // upper level SELECT
583
  {
584
    zero_result_cause= "no matching row in const table";
1588.1.3 by Stewart Smith
Fix assertion failure on HAVING subquery. Drizzle bug lp:588408 (MySQL bug 46680 - http://bugs.mysql.com/bug.php?id=46680).
585
    goto setup_subq_exit;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
586
  }
587
  if (!(session->options & OPTION_BIG_SELECTS) &&
588
      best_read > (double) session->variables.max_join_size &&
589
      !(select_options & SELECT_DESCRIBE))
971.6.11 by Eric Day
Removed purecov messages.
590
  {
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
591
    my_message(ER_TOO_BIG_SELECT, ER(ER_TOO_BIG_SELECT), MYF(0));
592
    error= -1;
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
593
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
594
  }
1054.1.8 by Brian Aker
Remove lock_tables list from session.
595
  if (const_tables && !(select_options & SELECT_NO_UNLOCK))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
596
    mysql_unlock_some_tables(session, table, const_tables);
597
  if (!conds && outer_join)
598
  {
599
    /* Handle the case where we have an OUTER JOIN without a WHERE */
600
    conds=new Item_int((int64_t) 1,1);  // Always true
601
  }
1237.9.2 by Padraig O'Sullivan
Moved opt_range.[cc,h] into the optimizer directory and namespace and renamed the files to
602
  select= optimizer::make_select(*table, const_table_map,
603
                                 const_table_map, conds, 1, &error);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
604
  if (error)
971.6.11 by Eric Day
Removed purecov messages.
605
  {
606
    error= -1;
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
607
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
608
  }
609
610
  reset_nj_counters(join_list);
611
  make_outerjoin_info(this);
612
613
  /*
614
    Among the equal fields belonging to the same multiple equality
615
    choose the one that is to be retrieved first and substitute
616
    all references to these in where condition for a reference for
617
    the selected field.
618
  */
619
  if (conds)
620
  {
621
    conds= substitute_for_best_equal_field(conds, cond_equal, map2table);
622
    conds->update_used_tables();
623
  }
624
625
  /*
626
    Permorm the the optimization on fields evaluation mentioned above
627
    for all on expressions.
628
  */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
629
  for (JoinTable *tab= join_tab + const_tables; tab < join_tab + tables ; tab++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
630
  {
631
    if (*tab->on_expr_ref)
632
    {
633
      *tab->on_expr_ref= substitute_for_best_equal_field(*tab->on_expr_ref,
634
                                                         tab->cond_equal,
635
                                                         map2table);
636
      (*tab->on_expr_ref)->update_used_tables();
637
    }
638
  }
639
640
  if (conds &&!outer_join && const_table_map != found_const_table_map &&
641
      (select_options & SELECT_DESCRIBE) &&
642
      select_lex->master_unit() == &session->lex->unit) // upper level SELECT
643
  {
644
    conds=new Item_int((int64_t) 0,1);  // Always false
645
  }
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
646
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
647
  if (make_join_select(this, select, conds))
648
  {
649
    zero_result_cause=
650
      "Impossible WHERE noticed after reading const tables";
1588.1.3 by Stewart Smith
Fix assertion failure on HAVING subquery. Drizzle bug lp:588408 (MySQL bug 46680 - http://bugs.mysql.com/bug.php?id=46680).
651
    goto setup_subq_exit;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
652
  }
653
654
  error= -1;          /* if goto err */
655
656
  /* Optimize distinct away if possible */
657
  {
658
    order_st *org_order= order;
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
659
    order= remove_constants(this, order,conds,1, &simple_order);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
660
    if (session->is_error())
661
    {
662
      error= 1;
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
663
      return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
664
    }
665
666
    /*
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
667
      If we are using ORDER BY NULL or ORDER BY const_expression,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
668
      return result in any order (even if we are using a GROUP BY)
669
    */
670
    if (!order && org_order)
671
      skip_sort_order= 1;
672
  }
673
  /*
674
     Check if we can optimize away GROUP BY/DISTINCT.
675
     We can do that if there are no aggregate functions, the
676
     fields in DISTINCT clause (if present) and/or columns in GROUP BY
677
     (if present) contain direct references to all key parts of
678
     an unique index (in whatever order) and if the key parts of the
679
     unique index cannot contain NULLs.
680
     Note that the unique keys for DISTINCT and GROUP BY should not
681
     be the same (as long as they are unique).
682
683
     The FROM clause must contain a single non-constant table.
684
  */
685
  if (tables - const_tables == 1 && (group_list || select_distinct) &&
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
686
      ! tmp_table_param.sum_func_count &&
687
      (! join_tab[const_tables].select ||
688
       ! join_tab[const_tables].select->quick ||
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
689
       join_tab[const_tables].select->quick->get_type() !=
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
690
       optimizer::QuickSelectInterface::QS_TYPE_GROUP_MIN_MAX))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
691
  {
692
    if (group_list && list_contains_unique_index(join_tab[const_tables].table, find_field_in_order_list, (void *) group_list))
693
    {
694
      /*
695
        We have found that grouping can be removed since groups correspond to
696
        only one row anyway, but we still have to guarantee correct result
697
        order. The line below effectively rewrites the query from GROUP BY
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
698
        <fields> to ORDER BY <fields>. There are two exceptions:
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
699
        - if skip_sort_order is set (see above), then we can simply skip
700
          GROUP BY;
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
701
        - we can only rewrite ORDER BY if the ORDER BY fields are 'compatible'
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
702
          with the GROUP BY ones, i.e. either one is a prefix of another.
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
703
          We only check if the ORDER BY is a prefix of GROUP BY. In this case
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
704
          test_if_subpart() copies the ASC/DESC attributes from the original
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
705
          ORDER BY fields.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
706
          If GROUP BY is a prefix of order_st BY, then it is safe to leave
707
          'order' as is.
708
       */
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
709
      if (! order || test_if_subpart(group_list, order))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
710
          order= skip_sort_order ? 0 : group_list;
711
      /*
712
        If we have an IGNORE INDEX FOR GROUP BY(fields) clause, this must be
713
        rewritten to IGNORE INDEX FOR order_st BY(fields).
714
      */
715
      join_tab->table->keys_in_use_for_order_by=
716
        join_tab->table->keys_in_use_for_group_by;
717
      group_list= 0;
718
      group= 0;
719
    }
720
    if (select_distinct &&
721
       list_contains_unique_index(join_tab[const_tables].table,
722
                                 find_field_in_item_list,
723
                                 (void *) &fields_list))
724
    {
725
      select_distinct= 0;
726
    }
727
  }
728
  if (group_list || tmp_table_param.sum_func_count)
729
  {
730
    if (! hidden_group_fields && rollup.state == ROLLUP::STATE_NONE)
731
      select_distinct=0;
732
  }
733
  else if (select_distinct && tables - const_tables == 1)
734
  {
735
    /*
736
      We are only using one table. In this case we change DISTINCT to a
737
      GROUP BY query if:
738
      - The GROUP BY can be done through indexes (no sort) and the order_st
739
        BY only uses selected fields.
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
740
        (In this case we can later optimize away GROUP BY and order_st BY)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
741
      - We are scanning the whole table without LIMIT
742
        This can happen if:
743
        - We are using CALC_FOUND_ROWS
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
744
        - We are using an ORDER BY that can't be optimized away.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
745
746
      We don't want to use this optimization when we are using LIMIT
747
      because in this case we can just create a temporary table that
748
      holds LIMIT rows and stop when this table is full.
749
    */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
750
    JoinTable *tab= &join_tab[const_tables];
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
751
    bool all_order_fields_used;
752
    if (order)
753
      skip_sort_order= test_if_skip_sort_order(tab, order, select_limit, 1,
754
        &tab->table->keys_in_use_for_order_by);
755
    if ((group_list=create_distinct_group(session, select_lex->ref_pointer_array,
756
                                          order, fields_list, all_fields,
757
                  &all_order_fields_used)))
758
    {
759
      bool skip_group= (skip_sort_order &&
760
        test_if_skip_sort_order(tab, group_list, select_limit, 1,
761
                                &tab->table->keys_in_use_for_group_by) != 0);
762
      count_field_types(select_lex, &tmp_table_param, all_fields, 0);
763
      if ((skip_group && all_order_fields_used) ||
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
764
          select_limit == HA_POS_ERROR ||
765
          (order && !skip_sort_order))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
766
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
767
        /*  Change DISTINCT to GROUP BY */
768
        select_distinct= 0;
769
        no_order= !order;
770
        if (all_order_fields_used)
771
        {
772
          if (order && skip_sort_order)
773
          {
774
            /*
775
              Force MySQL to read the table in sorted order to get result in
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
776
              ORDER BY order.
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
777
            */
778
            tmp_table_param.quick_group=0;
779
          }
780
          order=0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
781
        }
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
782
        group=1;        // For end_write_group
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
783
      }
784
      else
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
785
        group_list= 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
786
    }
787
    else if (session->is_fatal_error)     // End of memory
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
788
      return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
789
  }
790
  simple_group= 0;
791
  {
792
    order_st *old_group_list;
793
    group_list= remove_constants(this, (old_group_list= group_list), conds,
794
                                 rollup.state == ROLLUP::STATE_NONE,
795
                                 &simple_group);
796
    if (session->is_error())
797
    {
798
      error= 1;
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
799
      return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
800
    }
801
    if (old_group_list && !group_list)
802
      select_distinct= 0;
803
  }
804
  if (!group_list && group)
805
  {
806
    order=0;          // The output has only one row
807
    simple_order=1;
808
    select_distinct= 0;                       // No need in distinct for 1 row
809
    group_optimized_away= 1;
810
  }
811
812
  calc_group_buffer(this, group_list);
813
  send_group_parts= tmp_table_param.group_parts; /* Save org parts */
814
815
  if (test_if_subpart(group_list, order) ||
816
      (!group_list && tmp_table_param.sum_func_count))
817
    order=0;
818
819
  // Can't use sort on head table if using row cache
820
  if (full_join)
821
  {
822
    if (group_list)
823
      simple_group=0;
824
    if (order)
825
      simple_order=0;
826
  }
827
828
  /*
829
    Check if we need to create a temporary table.
830
    This has to be done if all tables are not already read (const tables)
831
    and one of the following conditions holds:
832
    - We are using DISTINCT (simple distinct's are already optimized away)
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
833
    - We are using an ORDER BY or GROUP BY on fields not in the first table
834
    - We are using different ORDER BY and GROUP BY orders
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
835
    - The user wants us to buffer the result.
836
  */
837
  need_tmp= (const_tables != tables &&
838
       ((select_distinct || !simple_order || !simple_group) ||
839
        (group_list && order) ||
840
        test(select_options & OPTION_BUFFER_RESULT)));
841
842
  // No cache for MATCH == 'Don't use join buffering when we use MATCH'.
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
843
  if (make_join_readinfo(this))
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
844
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
845
846
  /* Create all structures needed for materialized subquery execution. */
847
  if (setup_subquery_materialization())
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
848
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
849
1240.8.10 by Dennis Schoen
move caching after subquery initialization
850
  /* Cache constant expressions in WHERE, HAVING, ON clauses. */
851
  cache_const_exprs();
852
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
853
  /*
854
    is this simple IN subquery?
855
  */
856
  if (!group_list && !order &&
857
      unit->item && unit->item->substype() == Item_subselect::IN_SUBS &&
858
      tables == 1 && conds &&
859
      !unit->is_union())
860
  {
861
    if (!having)
862
    {
863
      Item *where= conds;
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
864
      if (join_tab[0].type == AM_EQ_REF && join_tab[0].ref.items[0]->name == in_left_expr_name)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
865
      {
866
        remove_subq_pushed_predicates(&where);
867
        save_index_subquery_explain_info(join_tab, where);
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
868
        join_tab[0].type= AM_UNIQUE_SUBQUERY;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
869
        error= 0;
870
        return(unit->item->
871
                    change_engine(new
872
                                  subselect_uniquesubquery_engine(session,
873
                                                                  join_tab,
874
                                                                  unit->item,
875
                                                                  where)));
876
      }
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
877
      else if (join_tab[0].type == AM_REF &&
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
878
         join_tab[0].ref.items[0]->name == in_left_expr_name)
879
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
880
        remove_subq_pushed_predicates(&where);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
881
        save_index_subquery_explain_info(join_tab, where);
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
882
        join_tab[0].type= AM_INDEX_SUBQUERY;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
883
        error= 0;
884
        return(unit->item->
885
                    change_engine(new
886
                                  subselect_indexsubquery_engine(session,
887
                                                                 join_tab,
888
                                                                 unit->item,
889
                                                                 where,
890
                                                                 NULL,
891
                                                                 0)));
892
      }
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
893
    } 
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
894
    else if (join_tab[0].type == AM_REF_OR_NULL &&
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
895
         join_tab[0].ref.items[0]->name == in_left_expr_name &&
896
               having->name == in_having_cond)
897
    {
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
898
      join_tab[0].type= AM_INDEX_SUBQUERY;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
899
      error= 0;
900
      conds= remove_additional_cond(conds);
901
      save_index_subquery_explain_info(join_tab, conds);
902
      return(unit->item->
903
      change_engine(new subselect_indexsubquery_engine(session,
904
                   join_tab,
905
                   unit->item,
906
                   conds,
907
                                                                   having,
908
                   1)));
909
    }
910
911
  }
912
  /*
913
    Need to tell handlers that to play it safe, it should fetch all
914
    columns of the primary key of the tables: this is because MySQL may
915
    build row pointers for the rows, and for all columns of the primary key
916
    the read set has not necessarily been set by the server code.
917
  */
918
  if (need_tmp || select_distinct || group_list || order)
919
  {
920
    for (uint32_t i = const_tables; i < tables; i++)
921
      join_tab[i].table->prepare_for_position();
922
  }
923
924
  if (const_tables != tables)
925
  {
926
    /*
927
      Because filesort always does a full table scan or a quick range scan
928
      we must add the removed reference to the select for the table.
929
      We only need to do this when we have a simple_order or simple_group
930
      as in other cases the join is done before the sort.
931
    */
932
    if ((order || group_list) &&
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
933
        (join_tab[const_tables].type != AM_ALL) &&
934
        (join_tab[const_tables].type != AM_REF_OR_NULL) &&
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
935
        ((order && simple_order) || (group_list && simple_group)))
936
    {
937
      if (add_ref_to_table_cond(session,&join_tab[const_tables])) {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
938
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
939
      }
940
    }
941
942
    if (!(select_options & SELECT_BIG_RESULT) &&
943
        ((group_list &&
944
          (!simple_group ||
945
           !test_if_skip_sort_order(&join_tab[const_tables], group_list,
946
                                    unit->select_limit_cnt, 0,
947
                                    &join_tab[const_tables].table->
948
                                    keys_in_use_for_group_by))) ||
949
         select_distinct) &&
950
        tmp_table_param.quick_group)
951
    {
952
      need_tmp=1; simple_order=simple_group=0;  // Force tmp table without sort
953
    }
954
    if (order)
955
    {
956
      /*
957
        Force using of tmp table if sorting by a SP or UDF function due to
958
        their expensive and probably non-deterministic nature.
959
      */
960
      for (order_st *tmp_order= order; tmp_order ; tmp_order=tmp_order->next)
961
      {
962
        Item *item= *tmp_order->item;
963
        if (item->is_expensive())
964
        {
965
          /* Force tmp table without sort */
966
          need_tmp=1; simple_order=simple_group=0;
967
          break;
968
        }
969
      }
970
    }
971
  }
972
973
  tmp_having= having;
974
  if (select_options & SELECT_DESCRIBE)
975
  {
976
    error= 0;
977
    return(0);
978
  }
979
  having= 0;
980
981
  /*
982
    The loose index scan access method guarantees that all grouping or
983
    duplicate row elimination (for distinct) is already performed
984
    during data retrieval, and that all MIN/MAX functions are already
985
    computed for each group. Thus all MIN/MAX functions should be
986
    treated as regular functions, and there is no need to perform
987
    grouping in the main execution loop.
988
    Notice that currently loose index scan is applicable only for
989
    single table queries, thus it is sufficient to test only the first
990
    join_tab element of the plan for its access method.
991
  */
992
  if (join_tab->is_using_loose_index_scan())
993
    tmp_table_param.precomputed_group_by= true;
994
995
  /* Create a tmp table if distinct or if the sort is too complicated */
996
  if (need_tmp)
997
  {
998
    session->set_proc_info("Creating tmp table");
999
1000
    init_items_ref_array();
1001
1002
    tmp_table_param.hidden_field_count= (all_fields.elements -
1003
           fields_list.elements);
1089.6.1 by Padraig O'Sullivan
Converted the test_flags variable from a uint32_t to std::bitset.
1004
    order_st *tmp_group= ((!simple_group && 
1005
                           ! (test_flags.test(TEST_NO_KEY_GROUP))) ? group_list :
1006
                                                                     (order_st*) 0);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1007
    /*
1008
      Pushing LIMIT to the temporary table creation is not applicable
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
1009
      when there is ORDER BY or GROUP BY or there is no GROUP BY, but
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1010
      there are aggregate functions, because in all these cases we need
1011
      all result rows.
1012
    */
1013
    ha_rows tmp_rows_limit= ((order == 0 || skip_sort_order) &&
1014
                             !tmp_group &&
1015
                             !session->lex->current_select->with_sum_func) ?
1016
                            select_limit : HA_POS_ERROR;
1017
1018
    if (!(exec_tmp_table1=
1116.1.1 by Brian Aker
Fix for Stewart's patch (includes hack to solve MAX rows problem).
1019
          create_tmp_table(session, &tmp_table_param, all_fields,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1020
                           tmp_group,
1116.1.1 by Brian Aker
Fix for Stewart's patch (includes hack to solve MAX rows problem).
1021
                           group_list ? 0 : select_distinct,
1022
                           group_list && simple_group,
1023
                           select_options,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1024
                           tmp_rows_limit,
1116.1.1 by Brian Aker
Fix for Stewart's patch (includes hack to solve MAX rows problem).
1025
                           (char *) "")))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1026
    {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
1027
      return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1028
    }
1029
1030
    /*
1031
      We don't have to store rows in temp table that doesn't match HAVING if:
1032
      - we are sorting the table and writing complete group rows to the
1033
        temp table.
1034
      - We are using DISTINCT without resolving the distinct as a GROUP BY
1035
        on all columns.
1036
1037
      If having is not handled here, it will be checked before the row
1038
      is sent to the client.
1039
    */
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1040
    if (tmp_having && (sort_and_group || (exec_tmp_table1->distinct && !group_list)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1041
      having= tmp_having;
1042
1043
    /* if group or order on first table, sort first */
1044
    if (group_list && simple_group)
1045
    {
1046
      session->set_proc_info("Sorting for group");
1047
      if (create_sort_index(session, this, group_list,
1048
          HA_POS_ERROR, HA_POS_ERROR, false) ||
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1049
          alloc_group_fields(this, group_list) ||
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1050
          make_sum_func_list(all_fields, fields_list, 1) ||
1051
          setup_sum_funcs(session, sum_funcs))
1052
      {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
1053
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1054
      }
1055
      group_list=0;
1056
    }
1057
    else
1058
    {
1059
      if (make_sum_func_list(all_fields, fields_list, 0) ||
1060
          setup_sum_funcs(session, sum_funcs))
1061
      {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
1062
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1063
      }
1064
1065
      if (!group_list && ! exec_tmp_table1->distinct && order && simple_order)
1066
      {
1067
        session->set_proc_info("Sorting for order");
1068
        if (create_sort_index(session, this, order,
1069
                              HA_POS_ERROR, HA_POS_ERROR, true))
1070
        {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
1071
          return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1072
        }
1073
        order=0;
1074
      }
1075
    }
1076
1077
    /*
1078
      Optimize distinct when used on some of the tables
1079
      SELECT DISTINCT t1.a FROM t1,t2 WHERE t1.b=t2.b
1080
      In this case we can stop scanning t2 when we have found one t1.a
1081
    */
1082
1083
    if (exec_tmp_table1->distinct)
1084
    {
1085
      table_map used_tables= session->used_tables;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
1086
      JoinTable *last_join_tab= join_tab+tables-1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1087
      do
1088
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1089
        if (used_tables & last_join_tab->table->map)
1090
          break;
1091
        last_join_tab->not_used_in_distinct=1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1092
      } while (last_join_tab-- != join_tab);
1093
      /* Optimize "select distinct b from t1 order by key_part_1 limit #" */
1094
      if (order && skip_sort_order)
1095
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1096
        /* Should always succeed */
1097
        if (test_if_skip_sort_order(&join_tab[const_tables],
1098
                  order, unit->select_limit_cnt, 0,
1099
                                          &join_tab[const_tables].table->
1100
                                            keys_in_use_for_order_by))
1101
          order= 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1102
      }
1103
    }
1104
1105
    /*
1106
      If this join belongs to an uncacheable subquery save
1107
      the original join
1108
    */
1858.1.1 by Padraig O'Sullivan
Replaced a uint8_t member with a standard bitset since it was being used as a bitset....
1109
    if (select_lex->uncacheable.any() && 
1110
        ! is_top_level_join() &&
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1111
        init_save_join_tab())
1858.1.1 by Padraig O'Sullivan
Replaced a uint8_t member with a standard bitset since it was being used as a bitset....
1112
    {
1113
      return -1;
1114
    }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1115
  }
1116
1117
  error= 0;
1858.1.1 by Padraig O'Sullivan
Replaced a uint8_t member with a standard bitset since it was being used as a bitset....
1118
  return 0;
1588.1.3 by Stewart Smith
Fix assertion failure on HAVING subquery. Drizzle bug lp:588408 (MySQL bug 46680 - http://bugs.mysql.com/bug.php?id=46680).
1119
1120
setup_subq_exit:
1121
  /* Even with zero matching rows, subqueries in the HAVING clause
1122
     may need to be evaluated if there are aggregate functions in the query.
1123
  */
1124
  if (setup_subquery_materialization())
1125
    return 1;
1126
  error= 0;
1127
  return 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1128
}
1129
1130
/**
1131
  Restore values in temporary join.
1132
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1133
void Join::restore_tmp()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1134
{
1541.1.1 by Brian Aker
JOIN -> Join rename
1135
  memcpy(tmp_join, this, (size_t) sizeof(Join));
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1136
}
1137
1541.1.1 by Brian Aker
JOIN -> Join rename
1138
int Join::reinit()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1139
{
1140
  unit->offset_limit_cnt= (ha_rows)(select_lex->offset_limit ?
1141
                                    select_lex->offset_limit->val_uint() :
1142
                                    0UL);
1143
1144
  first_record= 0;
1145
1146
  if (exec_tmp_table1)
1147
  {
1208.3.2 by brian
Update for Cursor renaming.
1148
    exec_tmp_table1->cursor->extra(HA_EXTRA_RESET_STATE);
1149
    exec_tmp_table1->cursor->ha_delete_all_rows();
1109.1.4 by Brian Aker
More Table refactor
1150
    exec_tmp_table1->free_io_cache();
1151
    exec_tmp_table1->filesort_free_buffers();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1152
  }
1153
  if (exec_tmp_table2)
1154
  {
1208.3.2 by brian
Update for Cursor renaming.
1155
    exec_tmp_table2->cursor->extra(HA_EXTRA_RESET_STATE);
1156
    exec_tmp_table2->cursor->ha_delete_all_rows();
1109.1.4 by Brian Aker
More Table refactor
1157
    exec_tmp_table2->free_io_cache();
1158
    exec_tmp_table2->filesort_free_buffers();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1159
  }
1160
  if (items0)
1161
    set_items_ref_array(items0);
1162
1163
  if (join_tab_save)
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
1164
    memcpy(join_tab, join_tab_save, sizeof(JoinTable) * tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1165
1166
  if (tmp_join)
1167
    restore_tmp();
1168
1169
  /* Reset of sum functions */
1170
  if (sum_funcs)
1171
  {
1172
    Item_sum *func, **func_ptr= sum_funcs;
1173
    while ((func= *(func_ptr++)))
1174
      func->clear();
1175
  }
1176
1177
  return(0);
1178
}
1179
1180
/**
1181
   @brief Save the original join layout
1182
1183
   @details Saves the original join layout so it can be reused in
1184
   re-execution and for EXPLAIN.
1185
1186
   @return Operation status
1187
   @retval 0      success.
1188
   @retval 1      error occurred.
1189
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1190
bool Join::init_save_join_tab()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1191
{
1541.1.1 by Brian Aker
JOIN -> Join rename
1192
  if (!(tmp_join= (Join*)session->alloc(sizeof(Join))))
971.6.11 by Eric Day
Removed purecov messages.
1193
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1194
  error= 0;              // Ensure that tmp_join.error= 0
1195
  restore_tmp();
1196
  return 0;
1197
}
1198
1541.1.1 by Brian Aker
JOIN -> Join rename
1199
bool Join::save_join_tab()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1200
{
1858.1.1 by Padraig O'Sullivan
Replaced a uint8_t member with a standard bitset since it was being used as a bitset....
1201
  if (! join_tab_save && select_lex->master_unit()->uncacheable.any())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1202
  {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
1203
    if (!(join_tab_save= (JoinTable*)session->memdup((unsigned char*) join_tab,
1204
            sizeof(JoinTable) * tables)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1205
      return 1;
1206
  }
1207
  return 0;
1208
}
1209
1210
/**
1211
  Exec select.
1212
1213
  @todo
1214
    Note, that create_sort_index calls test_if_skip_sort_order and may
1215
    finally replace sorting with index scan if there is a LIMIT clause in
1216
    the query.  It's never shown in EXPLAIN!
1217
1218
  @todo
1219
    When can we have here session->net.report_error not zero?
1220
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1221
void Join::exec()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1222
{
1223
  List<Item> *columns_list= &fields_list;
1224
  int      tmp_error;
1225
1226
  session->set_proc_info("executing");
1227
  error= 0;
1228
1229
  if (!tables_list && (tables || !select_lex->with_sum_func))
1230
  {                                           
1231
    /* Only test of functions */
1232
    if (select_options & SELECT_DESCRIBE)
1240.7.1 by Padraig O'Sullivan
Created an ExplainPlan class in the optimizer namespace. All printing of an explain in drizzle goes
1233
    {
1234
      optimizer::ExplainPlan planner(this, 
1235
                                     false,
1236
                                     false,
1237
                                     false,
1238
                                     (zero_result_cause ? zero_result_cause : "No tables used"));
1239
      planner.printPlan();
1240
    }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1241
    else
1242
    {
971.3.63 by Eric Day
Removed protocol field flags.
1243
      result->send_fields(*columns_list);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1244
      /*
1245
        We have to test for 'conds' here as the WHERE may not be constant
1246
        even if we don't have any tables for prepared statements or if
1247
        conds uses something like 'rand()'.
1248
      */
1249
      if (cond_value != Item::COND_FALSE &&
1250
          (!conds || conds->val_int()) &&
1251
          (!having || having->val_int()))
1252
      {
1253
        if (do_send_rows && result->send_data(fields_list))
1254
          error= 1;
1255
        else
1256
        {
1257
          error= (int) result->send_eof();
1258
          send_records= ((select_options & OPTION_FOUND_ROWS) ? 1 : session->sent_row_count);
1259
        }
1260
      }
1261
      else
1262
      {
1263
        error= (int) result->send_eof();
1264
        send_records= 0;
1265
      }
1266
    }
1267
    /* Single select (without union) always returns 0 or 1 row */
1268
    session->limit_found_rows= send_records;
1269
    session->examined_row_count= 0;
1270
    return;
1271
  }
1272
  /*
1273
    Don't reset the found rows count if there're no tables as
1274
    FOUND_ROWS() may be called. Never reset the examined row count here.
1275
    It must be accumulated from all join iterations of all join parts.
1276
  */
1277
  if (tables)
1278
    session->limit_found_rows= 0;
1279
1280
  if (zero_result_cause)
1281
  {
1282
    (void) return_zero_rows(this, result, select_lex->leaf_tables,
1283
                            *columns_list,
1284
          send_row_on_empty_set(),
1285
          select_options,
1286
          zero_result_cause,
1287
          having);
1288
    return;
1289
  }
1290
1291
  if (select_options & SELECT_DESCRIBE)
1292
  {
1293
    /*
1273.2.11 by Stewart Smith
fix accidental mangling of comment: s/order_st BY/ORDER BY/. in drizzled/join.cc
1294
      Check if we managed to optimize ORDER BY away and don't use temporary
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1295
      table to resolve order_st BY: in that case, we only may need to do
1296
      filesort for GROUP BY.
1297
    */
1298
    if (!order && !no_order && (!skip_sort_order || !need_tmp))
1299
    {
1300
      /* Reset 'order' to 'group_list' and reinit variables describing 'order' */
1301
      order= group_list;
1302
      simple_order= simple_group;
1303
      skip_sort_order= 0;
1304
    }
1305
    if (order && (order != group_list || !(select_options & SELECT_BIG_RESULT)))
1306
    {
1307
      if (const_tables == tables 
1308
        || ((simple_order || skip_sort_order) 
1309
          && test_if_skip_sort_order(&join_tab[const_tables], order, select_limit, 0, &join_tab[const_tables].table->keys_in_use_for_query)))
1310
      order= 0;
1311
    }
1312
    having= tmp_having;
1240.7.1 by Padraig O'Sullivan
Created an ExplainPlan class in the optimizer namespace. All printing of an explain in drizzle goes
1313
    optimizer::ExplainPlan planner(this,
1314
                                   need_tmp,
1315
                                   order != 0 && ! skip_sort_order,
1316
                                   select_distinct,
1317
                                   ! tables ? "No tables used" : NULL);
1318
    planner.printPlan();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1319
    return;
1320
  }
1321
1541.1.1 by Brian Aker
JOIN -> Join rename
1322
  Join *curr_join= this;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1323
  List<Item> *curr_all_fields= &all_fields;
1324
  List<Item> *curr_fields_list= &fields_list;
1325
  Table *curr_tmp_table= 0;
1326
  /*
1327
    Initialize examined rows here because the values from all join parts
1328
    must be accumulated in examined_row_count. Hence every join
1329
    iteration must count from zero.
1330
  */
1331
  curr_join->examined_rows= 0;
1332
1333
  /* Create a tmp table if distinct or if the sort is too complicated */
1334
  if (need_tmp)
1335
  {
1336
    if (tmp_join)
1337
    {
1338
      /*
1339
        We are in a non cacheable sub query. Get the saved join structure
1340
        after optimization.
1341
        (curr_join may have been modified during last exection and we need
1342
        to reset it)
1343
      */
1344
      curr_join= tmp_join;
1345
    }
1346
    curr_tmp_table= exec_tmp_table1;
1347
1348
    /* Copy data to the temporary table */
1349
    session->set_proc_info("Copying to tmp table");
1350
    if (! curr_join->sort_and_group && curr_join->const_tables != curr_join->tables)
1351
      curr_join->join_tab[curr_join->const_tables].sorted= 0;
1352
    if ((tmp_error= do_select(curr_join, (List<Item> *) 0, curr_tmp_table)))
1353
    {
1354
      error= tmp_error;
1355
      return;
1356
    }
1208.3.2 by brian
Update for Cursor renaming.
1357
    curr_tmp_table->cursor->info(HA_STATUS_VARIABLE);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1358
1359
    if (curr_join->having)
1360
      curr_join->having= curr_join->tmp_having= 0; // Allready done
1361
1362
    /* Change sum_fields reference to calculated fields in tmp_table */
1363
    curr_join->all_fields= *curr_all_fields;
1364
    if (!items1)
1365
    {
1366
      items1= items0 + all_fields.elements;
1367
      if (sort_and_group || curr_tmp_table->group)
1368
      {
1369
        if (change_to_use_tmp_fields(session, items1,
1370
                  tmp_fields_list1, tmp_all_fields1,
1371
                  fields_list.elements, all_fields))
1372
          return;
1373
      }
1374
      else
1375
      {
1376
        if (change_refs_to_tmp_fields(session, items1,
1377
                    tmp_fields_list1, tmp_all_fields1,
1378
                    fields_list.elements, all_fields))
1379
          return;
1380
      }
1381
      curr_join->tmp_all_fields1= tmp_all_fields1;
1382
      curr_join->tmp_fields_list1= tmp_fields_list1;
1383
      curr_join->items1= items1;
1384
    }
1385
    curr_all_fields= &tmp_all_fields1;
1386
    curr_fields_list= &tmp_fields_list1;
1387
    curr_join->set_items_ref_array(items1);
1388
1389
    if (sort_and_group || curr_tmp_table->group)
1390
    {
1391
      curr_join->tmp_table_param.field_count+= curr_join->tmp_table_param.sum_func_count
1392
                                             + curr_join->tmp_table_param.func_count;
1393
      curr_join->tmp_table_param.sum_func_count= 0;
1394
      curr_join->tmp_table_param.func_count= 0;
1395
    }
1396
    else
1397
    {
1398
      curr_join->tmp_table_param.field_count+= curr_join->tmp_table_param.func_count;
1399
      curr_join->tmp_table_param.func_count= 0;
1400
    }
1401
1402
    if (curr_tmp_table->group)
1403
    {           // Already grouped
1404
      if (!curr_join->order && !curr_join->no_order && !skip_sort_order)
1405
        curr_join->order= curr_join->group_list;  /* order by group */
1406
      curr_join->group_list= 0;
1407
    }
1408
1409
    /*
1410
      If we have different sort & group then we must sort the data by group
1411
      and copy it to another tmp table
1412
      This code is also used if we are using distinct something
1413
      we haven't been able to store in the temporary table yet
1414
      like SEC_TO_TIME(SUM(...)).
1415
    */
1416
1417
    if ((curr_join->group_list && (!test_if_subpart(curr_join->group_list, curr_join->order) || curr_join->select_distinct)) 
1418
        || (curr_join->select_distinct && curr_join->tmp_table_param.using_indirect_summary_function))
1419
    {         /* Must copy to another table */
1420
      /* Free first data from old join */
1421
      curr_join->join_free();
1422
      if (make_simple_join(curr_join, curr_tmp_table))
1423
        return;
1424
      calc_group_buffer(curr_join, group_list);
1425
      count_field_types(select_lex, &curr_join->tmp_table_param,
1426
      curr_join->tmp_all_fields1,
1427
      curr_join->select_distinct && !curr_join->group_list);
1428
      curr_join->tmp_table_param.hidden_field_count= curr_join->tmp_all_fields1.elements
1429
                                                   - curr_join->tmp_fields_list1.elements;
1430
1431
      if (exec_tmp_table2)
1532.1.1 by Brian Aker
Merge of change to flip table instance to be share instance
1432
      {
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1433
        curr_tmp_table= exec_tmp_table2;
1532.1.1 by Brian Aker
Merge of change to flip table instance to be share instance
1434
      }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1435
      else
1436
      {
1437
        /* group data to new table */
1438
1439
        /*
1440
          If the access method is loose index scan then all MIN/MAX
1441
          functions are precomputed, and should be treated as regular
1541.1.1 by Brian Aker
JOIN -> Join rename
1442
          functions. See extended comment in Join::exec.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1443
        */
1444
        if (curr_join->join_tab->is_using_loose_index_scan())
1445
          curr_join->tmp_table_param.precomputed_group_by= true;
1446
1447
        if (!(curr_tmp_table=
1448
              exec_tmp_table2= create_tmp_table(session,
1449
                                                &curr_join->tmp_table_param,
1450
                                                *curr_all_fields,
1451
                                                (order_st*) 0,
1452
                                                curr_join->select_distinct &&
1453
                                                !curr_join->group_list,
1454
                                                1, curr_join->select_options,
1455
                                                HA_POS_ERROR,
1456
                                                (char *) "")))
1532.1.1 by Brian Aker
Merge of change to flip table instance to be share instance
1457
        {
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1458
          return;
1532.1.1 by Brian Aker
Merge of change to flip table instance to be share instance
1459
        }
1460
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1461
        curr_join->exec_tmp_table2= exec_tmp_table2;
1462
      }
1463
      if (curr_join->group_list)
1464
      {
1465
        session->set_proc_info("Creating sort index");
1466
        if (curr_join->join_tab == join_tab && save_join_tab())
1467
        {
1468
          return;
1469
        }
1470
        if (create_sort_index(session, curr_join, curr_join->group_list,
1471
                  HA_POS_ERROR, HA_POS_ERROR, false) ||
1472
            make_group_fields(this, curr_join))
1473
        {
1474
          return;
1475
        }
1476
        sortorder= curr_join->sortorder;
1477
      }
1478
1479
      session->set_proc_info("Copying to group table");
1480
      tmp_error= -1;
1481
      if (curr_join != this)
1482
      {
1483
        if (sum_funcs2)
1484
        {
1485
          curr_join->sum_funcs= sum_funcs2;
1486
          curr_join->sum_funcs_end= sum_funcs_end2;
1487
        }
1488
        else
1489
        {
1490
          curr_join->alloc_func_list();
1491
          sum_funcs2= curr_join->sum_funcs;
1492
          sum_funcs_end2= curr_join->sum_funcs_end;
1493
        }
1494
      }
1495
      if (curr_join->make_sum_func_list(*curr_all_fields, *curr_fields_list, 1, true))
1496
        return;
1497
      curr_join->group_list= 0;
1498
1499
      if (!curr_join->sort_and_group && (curr_join->const_tables != curr_join->tables))
1500
        curr_join->join_tab[curr_join->const_tables].sorted= 0;
1501
      
1502
      if (setup_sum_funcs(curr_join->session, curr_join->sum_funcs) 
1503
        || (tmp_error= do_select(curr_join, (List<Item> *) 0, curr_tmp_table)))
1504
      {
1505
        error= tmp_error;
1506
        return;
1507
      }
1538 by Brian Aker
Code shuffle on ReadRecord
1508
      curr_join->join_tab->read_record.end_read_record();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1509
      curr_join->const_tables= curr_join->tables; // Mark free for cleanup()
1510
      curr_join->join_tab[0].table= 0;           // Table is freed
1511
1512
      // No sum funcs anymore
1513
      if (!items2)
1514
      {
1515
        items2= items1 + all_fields.elements;
1516
        if (change_to_use_tmp_fields(session, items2,
1517
                  tmp_fields_list2, tmp_all_fields2,
1518
                  fields_list.elements, tmp_all_fields1))
1519
          return;
1520
        curr_join->tmp_fields_list2= tmp_fields_list2;
1521
        curr_join->tmp_all_fields2= tmp_all_fields2;
1522
      }
1523
      curr_fields_list= &curr_join->tmp_fields_list2;
1524
      curr_all_fields= &curr_join->tmp_all_fields2;
1525
      curr_join->set_items_ref_array(items2);
1526
      curr_join->tmp_table_param.field_count+= curr_join->tmp_table_param.sum_func_count;
1527
      curr_join->tmp_table_param.sum_func_count= 0;
1528
    }
1529
    if (curr_tmp_table->distinct)
1530
      curr_join->select_distinct=0;   /* Each row is unique */
1531
1532
    curr_join->join_free();     /* Free quick selects */
1533
    if (curr_join->select_distinct && ! curr_join->group_list)
1534
    {
1535
      session->set_proc_info("Removing duplicates");
1536
      if (curr_join->tmp_having)
1537
        curr_join->tmp_having->update_used_tables();
1538
1539
      if (remove_duplicates(curr_join, curr_tmp_table,
1540
          *curr_fields_list, curr_join->tmp_having))
1541
        return;
1542
      
1543
      curr_join->tmp_having=0;
1544
      curr_join->select_distinct=0;
1545
    }
1546
    curr_tmp_table->reginfo.lock_type= TL_UNLOCK;
1547
    if (make_simple_join(curr_join, curr_tmp_table))
1548
      return;
1549
    calc_group_buffer(curr_join, curr_join->group_list);
1550
    count_field_types(select_lex, &curr_join->tmp_table_param, *curr_all_fields, 0);
1551
1552
  }
1553
1554
  if (curr_join->group || curr_join->tmp_table_param.sum_func_count)
1555
  {
1556
    if (make_group_fields(this, curr_join))
1557
      return;
1558
1559
    if (! items3)
1560
    {
1561
      if (! items0)
1562
        init_items_ref_array();
1563
      items3= ref_pointer_array + (all_fields.elements*4);
1564
      setup_copy_fields(session, &curr_join->tmp_table_param,
1565
      items3, tmp_fields_list3, tmp_all_fields3,
1566
      curr_fields_list->elements, *curr_all_fields);
1101.1.16 by Monty Taylor
Reverted 1103
1567
      tmp_table_param.save_copy_funcs= curr_join->tmp_table_param.copy_funcs;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1568
      tmp_table_param.save_copy_field= curr_join->tmp_table_param.copy_field;
1569
      tmp_table_param.save_copy_field_end= curr_join->tmp_table_param.copy_field_end;
1570
      curr_join->tmp_all_fields3= tmp_all_fields3;
1571
      curr_join->tmp_fields_list3= tmp_fields_list3;
1572
    }
1573
    else
1574
    {
1101.1.16 by Monty Taylor
Reverted 1103
1575
      curr_join->tmp_table_param.copy_funcs= tmp_table_param.save_copy_funcs;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1576
      curr_join->tmp_table_param.copy_field= tmp_table_param.save_copy_field;
1577
      curr_join->tmp_table_param.copy_field_end= tmp_table_param.save_copy_field_end;
1578
    }
1579
    curr_fields_list= &tmp_fields_list3;
1580
    curr_all_fields= &tmp_all_fields3;
1581
    curr_join->set_items_ref_array(items3);
1582
1583
    if (curr_join->make_sum_func_list(*curr_all_fields, *curr_fields_list,
1584
              1, true) ||
1585
        setup_sum_funcs(curr_join->session, curr_join->sum_funcs) ||
1586
        session->is_fatal_error)
1587
      return;
1588
  }
1589
  if (curr_join->group_list || curr_join->order)
1590
  {
1591
    session->set_proc_info("Sorting result");
1592
    /* If we have already done the group, add HAVING to sorted table */
1593
    if (curr_join->tmp_having && ! curr_join->group_list && ! curr_join->sort_and_group)
1594
    {
1595
      // Some tables may have been const
1596
      curr_join->tmp_having->update_used_tables();
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
1597
      JoinTable *curr_table= &curr_join->join_tab[curr_join->const_tables];
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1598
      table_map used_tables= (curr_join->const_table_map |
1599
            curr_table->table->map);
1600
1601
      Item* sort_table_cond= make_cond_for_table(curr_join->tmp_having, used_tables, used_tables, 0);
1602
      if (sort_table_cond)
1603
      {
1604
        if (!curr_table->select)
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
1605
          if (!(curr_table->select= new optimizer::SqlSelect))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1606
            return;
1607
        if (!curr_table->select->cond)
1608
          curr_table->select->cond= sort_table_cond;
1609
        else          // This should never happen
1610
        {
1611
          if (!(curr_table->select->cond=
1612
          new Item_cond_and(curr_table->select->cond,
1613
                sort_table_cond)))
1614
            return;
1615
          /*
1616
            Item_cond_and do not need fix_fields for execution, its parameters
1617
            are fixed or do not need fix_fields, too
1618
          */
1619
          curr_table->select->cond->quick_fix_field();
1620
        }
1621
        curr_table->select_cond= curr_table->select->cond;
1622
        curr_table->select_cond->top_level_item();
1623
        curr_join->tmp_having= make_cond_for_table(curr_join->tmp_having,
1624
                    ~ (table_map) 0,
1625
                    ~used_tables, 0);
1626
      }
1627
    }
1628
    {
1629
      if (group)
1630
        curr_join->select_limit= HA_POS_ERROR;
1631
      else
1632
      {
1633
        /*
1634
          We can abort sorting after session->select_limit rows if we there is no
1635
          WHERE clause for any tables after the sorted one.
1636
        */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
1637
        JoinTable *curr_table= &curr_join->join_tab[curr_join->const_tables+1];
1638
        JoinTable *end_table= &curr_join->join_tab[curr_join->tables];
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1639
        for (; curr_table < end_table ; curr_table++)
1640
        {
1641
          /*
1642
            table->keyuse is set in the case there was an original WHERE clause
1643
            on the table that was optimized away.
1644
          */
1645
          if (curr_table->select_cond ||
1646
              (curr_table->keyuse && !curr_table->first_inner))
1647
          {
1648
            /* We have to sort all rows */
1649
            curr_join->select_limit= HA_POS_ERROR;
1650
            break;
1651
          }
1652
        }
1653
      }
1654
      if (curr_join->join_tab == join_tab && save_join_tab())
1655
        return;
1656
      /*
1657
        Here we sort rows for order_st BY/GROUP BY clause, if the optimiser
1658
        chose FILESORT to be faster than INDEX SCAN or there is no
1659
        suitable index present.
1660
        Note, that create_sort_index calls test_if_skip_sort_order and may
1661
        finally replace sorting with index scan if there is a LIMIT clause in
1662
        the query. XXX: it's never shown in EXPLAIN!
1663
        OPTION_FOUND_ROWS supersedes LIMIT and is taken into account.
1664
      */
1665
      if (create_sort_index(session, curr_join,
1666
          curr_join->group_list ?
1667
          curr_join->group_list : curr_join->order,
1668
          curr_join->select_limit,
1669
          (select_options & OPTION_FOUND_ROWS ?
1670
           HA_POS_ERROR : unit->select_limit_cnt),
1671
                            curr_join->group_list ? true : false))
1672
        return;
1673
1674
      sortorder= curr_join->sortorder;
1675
      if (curr_join->const_tables != curr_join->tables &&
1676
          !curr_join->join_tab[curr_join->const_tables].table->sort.io_cache)
1677
      {
1678
        /*
1679
          If no IO cache exists for the first table then we are using an
1680
          INDEX SCAN and no filesort. Thus we should not remove the sorted
1681
          attribute on the INDEX SCAN.
1682
        */
1683
        skip_sort_order= 1;
1684
      }
1685
    }
1686
  }
1687
  /* XXX: When can we have here session->is_error() not zero? */
1688
  if (session->is_error())
1689
  {
1690
    error= session->is_error();
1691
    return;
1692
  }
1693
  curr_join->having= curr_join->tmp_having;
1694
  curr_join->fields= curr_fields_list;
1695
1696
  session->set_proc_info("Sending data");
971.3.63 by Eric Day
Removed protocol field flags.
1697
  result->send_fields(*curr_fields_list);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1698
  error= do_select(curr_join, curr_fields_list, NULL);
1699
  session->limit_found_rows= curr_join->send_records;
1700
1701
  /* Accumulate the counts from all join iterations of all join parts. */
1702
  session->examined_row_count+= curr_join->examined_rows;
1703
1704
  /*
1705
    With EXPLAIN EXTENDED we have to restore original ref_array
1706
    for a derived table which is always materialized.
1707
    Otherwise we would not be able to print the query  correctly.
1708
  */
1709
  if (items0 && (session->lex->describe & DESCRIBE_EXTENDED) && select_lex->linkage == DERIVED_TABLE_TYPE)
1710
    set_items_ref_array(items0);
1711
1712
  return;
1713
}
1714
1715
/**
1716
  Clean up join.
1717
1718
  @return
1541.1.1 by Brian Aker
JOIN -> Join rename
1719
    Return error that hold Join.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1720
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1721
int Join::destroy()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1722
{
1723
  select_lex->join= 0;
1724
1725
  if (tmp_join)
1726
  {
1727
    if (join_tab != tmp_join->join_tab)
1728
    {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
1729
      JoinTable *tab, *end;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1730
      for (tab= join_tab, end= tab+tables ; tab != end ; tab++)
1731
        tab->cleanup();
1732
    }
1733
    tmp_join->tmp_join= 0;
1734
    tmp_table_param.copy_field=0;
1735
    return(tmp_join->destroy());
1736
  }
1737
  cond_equal= 0;
1738
1739
  cleanup(1);
1532.1.1 by Brian Aker
Merge of change to flip table instance to be share instance
1740
  exec_tmp_table1= NULL;
1741
  exec_tmp_table2= NULL;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1742
  delete select;
1743
  delete_dynamic(&keyuse);
1532.1.1 by Brian Aker
Merge of change to flip table instance to be share instance
1744
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1745
  return(error);
1746
}
1747
1748
/**
1749
  Setup for execution all subqueries of a query, for which the optimizer
1750
  chose hash semi-join.
1751
1752
  @details Iterate over all subqueries of the query, and if they are under an
1753
  IN predicate, and the optimizer chose to compute it via hash semi-join:
1754
  - try to initialize all data structures needed for the materialized execution
1755
    of the IN predicate,
1756
  - if this fails, then perform the IN=>EXISTS transformation which was
1541.1.1 by Brian Aker
JOIN -> Join rename
1757
    previously blocked during Join::prepare.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1758
1759
  This method is part of the "code generation" query processing phase.
1760
1761
  This phase must be called after substitute_for_best_equal_field() because
1762
  that function may replace items with other items from a multiple equality,
1763
  and we need to reference the correct items in the index access method of the
1764
  IN predicate.
1765
1766
  @return Operation status
1767
  @retval false     success.
1768
  @retval true      error occurred.
1769
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1770
bool Join::setup_subquery_materialization()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1771
{
1772
  for (Select_Lex_Unit *un= select_lex->first_inner_unit(); un;
1773
       un= un->next_unit())
1774
  {
1775
    for (Select_Lex *sl= un->first_select(); sl; sl= sl->next_select())
1776
    {
1777
      Item_subselect *subquery_predicate= sl->master_unit()->item;
1778
      if (subquery_predicate &&
1779
          subquery_predicate->substype() == Item_subselect::IN_SUBS)
1780
      {
1781
        Item_in_subselect *in_subs= (Item_in_subselect*) subquery_predicate;
1782
        if (in_subs->exec_method == Item_in_subselect::MATERIALIZATION &&
1783
            in_subs->setup_engine())
1784
          return true;
1785
      }
1786
    }
1787
  }
1788
  return false;
1789
}
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1790
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1791
/**
1541.1.1 by Brian Aker
JOIN -> Join rename
1792
  Partially cleanup Join after it has executed: close index or rnd read
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1793
  (table cursors), free quick selects.
1794
1541.1.1 by Brian Aker
JOIN -> Join rename
1795
    This function is called in the end of execution of a Join, before the used
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1796
    tables are unlocked and closed.
1797
1798
    For a join that is resolved using a temporary table, the first sweep is
1799
    performed against actual tables and an intermediate result is inserted
1800
    into the temprorary table.
1801
    The last sweep is performed against the temporary table. Therefore,
1802
    the base tables and associated buffers used to fill the temporary table
1803
    are no longer needed, and this function is called to free them.
1804
1805
    For a join that is performed without a temporary table, this function
1806
    is called after all rows are sent, but before EOF packet is sent.
1807
1808
    For a simple SELECT with no subqueries this function performs a full
1541.1.1 by Brian Aker
JOIN -> Join rename
1809
    cleanup of the Join and calls mysql_unlock_read_tables to free used base
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1810
    tables.
1811
1541.1.1 by Brian Aker
JOIN -> Join rename
1812
    If a Join is executed for a subquery or if it has a subquery, we can't
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1813
    do the full cleanup and need to do a partial cleanup only.
1541.1.1 by Brian Aker
JOIN -> Join rename
1814
    - If a Join is not the top level join, we must not unlock the tables
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1815
    because the outer select may not have been evaluated yet, and we
1816
    can't unlock only selected tables of a query.
1541.1.1 by Brian Aker
JOIN -> Join rename
1817
    - Additionally, if this Join corresponds to a correlated subquery, we
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1818
    should not free quick selects and join buffers because they will be
1819
    needed for the next execution of the correlated subquery.
1541.1.1 by Brian Aker
JOIN -> Join rename
1820
    - However, if this is a Join for a [sub]select, which is not
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1821
    a correlated subquery itself, but has subqueries, we can free it
1541.1.1 by Brian Aker
JOIN -> Join rename
1822
    fully and also free Joins of all its subqueries. The exception
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1823
    is a subquery in SELECT list, e.g: @n
1824
    SELECT a, (select cmax(b) from t1) group by c @n
1825
    This subquery will not be evaluated at first sweep and its value will
1826
    not be inserted into the temporary table. Instead, it's evaluated
1827
    when selecting from the temporary table. Therefore, it can't be freed
1828
    here even though it's not correlated.
1829
1830
  @todo
1831
    Unlock tables even if the join isn't top level select in the tree
1832
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1833
void Join::join_free()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1834
{
1835
  Select_Lex_Unit *tmp_unit;
1836
  Select_Lex *sl;
1837
  /*
1541.1.1 by Brian Aker
JOIN -> Join rename
1838
    Optimization: if not EXPLAIN and we are done with the Join,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1839
    free all tables.
1840
  */
1858.1.1 by Padraig O'Sullivan
Replaced a uint8_t member with a standard bitset since it was being used as a bitset....
1841
  bool full= (select_lex->uncacheable.none() && ! session->lex->describe);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1842
  bool can_unlock= full;
1843
1844
  cleanup(full);
1845
1846
  for (tmp_unit= select_lex->first_inner_unit();
1847
       tmp_unit;
1848
       tmp_unit= tmp_unit->next_unit())
1849
    for (sl= tmp_unit->first_select(); sl; sl= sl->next_select())
1850
    {
1851
      Item_subselect *subselect= sl->master_unit()->item;
1852
      bool full_local= full && (!subselect || subselect->is_evaluated());
1853
      /*
1854
        If this join is evaluated, we can fully clean it up and clean up all
1855
        its underlying joins even if they are correlated -- they will not be
1856
        used any more anyway.
1857
        If this join is not yet evaluated, we still must clean it up to
1858
        close its table cursors -- it may never get evaluated, as in case of
1859
        ... HAVING false OR a IN (SELECT ...))
1860
        but all table cursors must be closed before the unlock.
1861
      */
1862
      sl->cleanup_all_joins(full_local);
1541.1.1 by Brian Aker
JOIN -> Join rename
1863
      /* Can't unlock if at least one Join is still needed */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1864
      can_unlock= can_unlock && full_local;
1865
    }
1866
1867
  /*
1868
    We are not using tables anymore
1869
    Unlock all tables. We may be in an INSERT .... SELECT statement.
1870
  */
1871
  if (can_unlock && lock && session->lock &&
1872
      !(select_options & SELECT_NO_UNLOCK) &&
1873
      !select_lex->subquery_in_having &&
1874
      (select_lex == (session->lex->unit.fake_select_lex ?
1875
                      session->lex->unit.fake_select_lex : &session->lex->select_lex)))
1876
  {
1877
    /*
1878
      TODO: unlock tables even if the join isn't top level select in the
1879
      tree.
1880
    */
1881
    mysql_unlock_read_tables(session, lock);           // Don't free join->lock
1882
    lock= 0;
1883
  }
1884
1885
  return;
1886
}
1887
1888
1889
/**
1890
  Free resources of given join.
1891
1892
  @param fill   true if we should free all resources, call with full==1
1893
                should be last, before it this function can be called with
1894
                full==0
1895
1896
  @note
1897
    With subquery this function definitely will be called several times,
1898
    but even for simple query it can be called several times.
1899
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1900
void Join::cleanup(bool full)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1901
{
1902
  if (table)
1903
  {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
1904
    JoinTable *tab,*end;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1905
    /*
1906
      Only a sorted table may be cached.  This sorted table is always the
1907
      first non const table in join->table
1908
    */
1909
    if (tables > const_tables) // Test for not-const tables
1910
    {
1109.1.4 by Brian Aker
More Table refactor
1911
      table[const_tables]->free_io_cache();
1912
      table[const_tables]->filesort_free_buffers(full);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1913
    }
1914
1915
    if (full)
1916
    {
1917
      for (tab= join_tab, end= tab+tables; tab != end; tab++)
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1918
        tab->cleanup();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1919
      table= 0;
1920
    }
1921
    else
1922
    {
1923
      for (tab= join_tab, end= tab+tables; tab != end; tab++)
1924
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1925
        if (tab->table)
1208.3.2 by brian
Update for Cursor renaming.
1926
          tab->table->cursor->ha_index_or_rnd_end();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1927
      }
1928
    }
1929
  }
1930
  /*
1931
    We are not using tables anymore
1932
    Unlock all tables. We may be in an INSERT .... SELECT statement.
1933
  */
1934
  if (full)
1935
  {
1936
    if (tmp_join)
1937
      tmp_table_param.copy_field= 0;
1101.1.16 by Monty Taylor
Reverted 1103
1938
    group_fields.delete_elements();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1939
    /*
1940
      We can't call delete_elements() on copy_funcs as this will cause
1941
      problems in free_elements() as some of the elements are then deleted.
1942
    */
1101.1.16 by Monty Taylor
Reverted 1103
1943
    tmp_table_param.copy_funcs.empty();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1944
    /*
1541.1.1 by Brian Aker
JOIN -> Join rename
1945
      If we have tmp_join and 'this' Join is not tmp_join and
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1946
      tmp_table_param.copy_field's  of them are equal then we have to remove
1947
      pointer to  tmp_table_param.copy_field from tmp_join, because it qill
1948
      be removed in tmp_table_param.cleanup().
1949
    */
1950
    if (tmp_join &&
1951
        tmp_join != this &&
1952
        tmp_join->tmp_table_param.copy_field ==
1953
        tmp_table_param.copy_field)
1954
    {
1101.1.16 by Monty Taylor
Reverted 1103
1955
      tmp_join->tmp_table_param.copy_field=
1956
        tmp_join->tmp_table_param.save_copy_field= 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1957
    }
1101.1.16 by Monty Taylor
Reverted 1103
1958
    tmp_table_param.cleanup();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1959
  }
1960
  return;
1961
}
1962
1963
/*
1541.1.1 by Brian Aker
JOIN -> Join rename
1964
  used only in Join::clear
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1965
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1966
static void clear_tables(Join *join)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1967
{
1968
  /*
1969
    must clear only the non-const tables, as const tables
1970
    are not re-calculated.
1971
  */
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
1972
  for (uint32_t i= join->const_tables; i < join->tables; i++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1973
    join->table[i]->mark_as_null_row();   // All fields are NULL
1974
}
1975
1976
/**
1977
  Make an array of pointers to sum_functions to speed up
1978
  sum_func calculation.
1979
1980
  @retval
1981
    0 ok
1982
  @retval
1983
    1 Error
1984
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
1985
bool Join::alloc_func_list()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
1986
{
1987
  uint32_t func_count, group_parts;
1988
1989
  func_count= tmp_table_param.sum_func_count;
1990
  /*
1991
    If we are using rollup, we need a copy of the summary functions for
1992
    each level
1993
  */
1994
  if (rollup.state != ROLLUP::STATE_NONE)
1995
    func_count*= (send_group_parts+1);
1996
1997
  group_parts= send_group_parts;
1998
  /*
1999
    If distinct, reserve memory for possible
2000
    disctinct->group_by optimization
2001
  */
2002
  if (select_distinct)
2003
  {
2004
    group_parts+= fields_list.elements;
2005
    /*
2006
      If the order_st clause is specified then it's possible that
2007
      it also will be optimized, so reserve space for it too
2008
    */
2009
    if (order)
2010
    {
2011
      order_st *ord;
2012
      for (ord= order; ord; ord= ord->next)
2013
        group_parts++;
2014
    }
2015
  }
2016
2017
  /* This must use calloc() as rollup_make_fields depends on this */
2018
  sum_funcs= (Item_sum**) session->calloc(sizeof(Item_sum**) * (func_count+1) +
2019
              sizeof(Item_sum***) * (group_parts+1));
2020
  sum_funcs_end= (Item_sum***) (sum_funcs+func_count+1);
2021
  return(sum_funcs == 0);
2022
}
2023
2024
/**
2025
  Initialize 'sum_funcs' array with all Item_sum objects.
2026
2027
  @param field_list        All items
2028
  @param send_fields       Items in select list
2029
  @param before_group_by   Set to 1 if this is called before GROUP BY handling
2030
  @param recompute         Set to true if sum_funcs must be recomputed
2031
2032
  @retval
2033
    0  ok
2034
  @retval
2035
    1  error
2036
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2037
bool Join::make_sum_func_list(List<Item> &field_list, 
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2038
                              List<Item> &send_fields,
2039
                              bool before_group_by, 
2040
                              bool recompute)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2041
{
2042
  List_iterator_fast<Item> it(field_list);
2043
  Item_sum **func;
2044
  Item *item;
2045
2046
  if (*sum_funcs && !recompute)
2047
    return(false); /* We have already initialized sum_funcs. */
2048
2049
  func= sum_funcs;
2050
  while ((item=it++))
2051
  {
2052
    if (item->type() == Item::SUM_FUNC_ITEM && !item->const_item() &&
2053
        (!((Item_sum*) item)->depended_from() ||
2054
         ((Item_sum *)item)->depended_from() == select_lex))
2055
      *func++= (Item_sum*) item;
2056
  }
2057
  if (before_group_by && rollup.state == ROLLUP::STATE_INITED)
2058
  {
2059
    rollup.state= ROLLUP::STATE_READY;
2060
    if (rollup_make_fields(field_list, send_fields, &func))
2061
      return(true);     // Should never happen
2062
  }
2063
  else if (rollup.state == ROLLUP::STATE_NONE)
2064
  {
2065
    for (uint32_t i=0 ; i <= send_group_parts ;i++)
2066
      sum_funcs_end[i]= func;
2067
  }
2068
  else if (rollup.state == ROLLUP::STATE_READY)
2069
    return(false);                         // Don't put end marker
2070
  *func=0;          // End marker
2071
  return(false);
2072
}
2073
2074
/** Allocate memory needed for other rollup functions. */
1541.1.1 by Brian Aker
JOIN -> Join rename
2075
bool Join::rollup_init()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2076
{
2077
  uint32_t i,j;
2078
  Item **ref_array;
2079
2080
  tmp_table_param.quick_group= 0; // Can't create groups in tmp table
2081
  rollup.state= ROLLUP::STATE_INITED;
2082
2083
  /*
2084
    Create pointers to the different sum function groups
2085
    These are updated by rollup_make_fields()
2086
  */
2087
  tmp_table_param.group_parts= send_group_parts;
2088
2089
  if (!(rollup.null_items= (Item_null_result**) session->alloc((sizeof(Item*) +
2090
                                                sizeof(Item**) +
2091
                                                sizeof(List<Item>) +
2092
                        ref_pointer_array_size)
2093
                        * send_group_parts )))
2094
    return 1;
2095
2096
  rollup.fields= (List<Item>*) (rollup.null_items + send_group_parts);
2097
  rollup.ref_pointer_arrays= (Item***) (rollup.fields + send_group_parts);
2098
  ref_array= (Item**) (rollup.ref_pointer_arrays+send_group_parts);
2099
2100
  /*
2101
    Prepare space for field list for the different levels
2102
    These will be filled up in rollup_make_fields()
2103
  */
2104
  for (i= 0 ; i < send_group_parts ; i++)
2105
  {
2106
    rollup.null_items[i]= new (session->mem_root) Item_null_result();
2107
    List<Item> *rollup_fields= &rollup.fields[i];
2108
    rollup_fields->empty();
2109
    rollup.ref_pointer_arrays[i]= ref_array;
2110
    ref_array+= all_fields.elements;
2111
  }
2112
  for (i= 0 ; i < send_group_parts; i++)
2113
  {
2114
    for (j=0 ; j < fields_list.elements ; j++)
2115
      rollup.fields[i].push_back(rollup.null_items[i]);
2116
  }
2117
  List_iterator<Item> it(all_fields);
2118
  Item *item;
2119
  while ((item= it++))
2120
  {
2121
    order_st *group_tmp;
2122
    bool found_in_group= 0;
2123
2124
    for (group_tmp= group_list; group_tmp; group_tmp= group_tmp->next)
2125
    {
2126
      if (*group_tmp->item == item)
2127
      {
2128
        item->maybe_null= 1;
2129
        found_in_group= 1;
2130
        if (item->const_item())
2131
        {
2132
          /*
2133
            For ROLLUP queries each constant item referenced in GROUP BY list
2134
            is wrapped up into an Item_func object yielding the same value
2135
            as the constant item. The objects of the wrapper class are never
2136
            considered as constant items and besides they inherit all
2137
            properties of the Item_result_field class.
2138
            This wrapping allows us to ensure writing constant items
2139
            into temporary tables whenever the result of the ROLLUP
2140
            operation has to be written into a temporary table, e.g. when
2141
            ROLLUP is used together with DISTINCT in the SELECT list.
2142
            Usually when creating temporary tables for a intermidiate
2143
            result we do not include fields for constant expressions.
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2144
          */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2145
          Item* new_item= new Item_func_rollup_const(item);
2146
          if (!new_item)
2147
            return 1;
2148
          new_item->fix_fields(session, (Item **) 0);
2149
          session->change_item_tree(it.ref(), new_item);
2150
          for (order_st *tmp= group_tmp; tmp; tmp= tmp->next)
2151
          {
2152
            if (*tmp->item == item)
2153
              session->change_item_tree(tmp->item, new_item);
2154
          }
2155
        }
2156
      }
2157
    }
2158
    if (item->type() == Item::FUNC_ITEM && !found_in_group)
2159
    {
2160
      bool changed= false;
2161
      if (change_group_ref(session, (Item_func *) item, group_list, &changed))
2162
        return 1;
2163
      /*
2164
        We have to prevent creation of a field in a temporary table for
2165
        an expression that contains GROUP BY attributes.
2166
        Marking the expression item as 'with_sum_func' will ensure this.
2167
      */
2168
      if (changed)
2169
        item->with_sum_func= 1;
2170
    }
2171
  }
2172
  return 0;
2173
}
2174
2175
/**
2176
  Fill up rollup structures with pointers to fields to use.
2177
2178
  Creates copies of item_sum items for each sum level.
2179
2180
  @param fields_arg   List of all fields (hidden and real ones)
2181
  @param sel_fields   Pointer to selected fields
2182
  @param func     Store here a pointer to all fields
2183
2184
  @retval
2185
    0 if ok;
2186
    In this case func is pointing to next not used element.
2187
  @retval
2188
    1    on error
2189
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2190
bool Join::rollup_make_fields(List<Item> &fields_arg, List<Item> &sel_fields, Item_sum ***func)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2191
{
2192
  List_iterator_fast<Item> it(fields_arg);
2193
  Item *first_field= sel_fields.head();
2194
  uint32_t level;
2195
2196
  /*
2197
    Create field lists for the different levels
2198
2199
    The idea here is to have a separate field list for each rollup level to
2200
    avoid all runtime checks of which columns should be NULL.
2201
2202
    The list is stored in reverse order to get sum function in such an order
2203
    in func that it makes it easy to reset them with init_sum_functions()
2204
2205
    Assuming:  SELECT a, b, c SUM(b) FROM t1 GROUP BY a,b WITH ROLLUP
2206
2207
    rollup.fields[0] will contain list where a,b,c is NULL
2208
    rollup.fields[1] will contain list where b,c is NULL
2209
    ...
2210
    rollup.ref_pointer_array[#] points to fields for rollup.fields[#]
2211
    ...
2212
    sum_funcs_end[0] points to all sum functions
2213
    sum_funcs_end[1] points to all sum functions, except grand totals
2214
    ...
2215
  */
2216
2217
  for (level=0 ; level < send_group_parts ; level++)
2218
  {
2219
    uint32_t i;
2220
    uint32_t pos= send_group_parts - level -1;
2221
    bool real_fields= 0;
2222
    Item *item;
2223
    List_iterator<Item> new_it(rollup.fields[pos]);
2224
    Item **ref_array_start= rollup.ref_pointer_arrays[pos];
2225
    order_st *start_group;
2226
2227
    /* Point to first hidden field */
2228
    Item **ref_array= ref_array_start + fields_arg.elements-1;
2229
2230
    /* Remember where the sum functions ends for the previous level */
2231
    sum_funcs_end[pos+1]= *func;
2232
2233
    /* Find the start of the group for this level */
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2234
    for (i= 0, start_group= group_list ;i++ < pos ;start_group= start_group->next)
2235
    {}
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2236
2237
    it.rewind();
2238
    while ((item= it++))
2239
    {
2240
      if (item == first_field)
2241
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2242
        real_fields= 1;       // End of hidden fields
2243
        ref_array= ref_array_start;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2244
      }
2245
2246
      if (item->type() == Item::SUM_FUNC_ITEM && !item->const_item() &&
2247
          (!((Item_sum*) item)->depended_from() ||
2248
           ((Item_sum *)item)->depended_from() == select_lex))
2249
2250
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2251
        /*
2252
          This is a top level summary function that must be replaced with
2253
          a sum function that is reset for this level.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2254
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2255
          NOTE: This code creates an object which is not that nice in a
2256
          sub select.  Fortunately it's not common to have rollup in
2257
          sub selects.
2258
        */
2259
        item= item->copy_or_same(session);
2260
        ((Item_sum*) item)->make_unique();
2261
        *(*func)= (Item_sum*) item;
2262
        (*func)++;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2263
      }
2264
      else
2265
      {
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2266
        /* Check if this is something that is part of this group by */
2267
        order_st *group_tmp;
2268
        for (group_tmp= start_group, i= pos ;
2269
                  group_tmp ; group_tmp= group_tmp->next, i++)
2270
        {
2271
                if (*group_tmp->item == item)
2272
          {
2273
            /*
2274
              This is an element that is used by the GROUP BY and should be
2275
              set to NULL in this level
2276
            */
2277
                  Item_null_result *null_item= new (session->mem_root) Item_null_result();
2278
                  if (!null_item)
2279
                    return 1;
2280
            item->maybe_null= 1;    // Value will be null sometimes
2281
                  null_item->result_field= item->get_tmp_table_field();
2282
                  item= null_item;
2283
            break;
2284
          }
2285
        }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2286
      }
2287
      *ref_array= item;
2288
      if (real_fields)
2289
      {
2290
  (void) new_it++;      // Point to next item
2291
  new_it.replace(item);     // Replace previous
2292
  ref_array++;
2293
      }
2294
      else
2295
  ref_array--;
2296
    }
2297
  }
2298
  sum_funcs_end[0]= *func;      // Point to last function
2299
  return 0;
2300
}
2301
2302
/**
2303
  Send all rollup levels higher than the current one to the client.
2304
2305
  @b SAMPLE
2306
    @code
2307
      SELECT a, b, c SUM(b) FROM t1 GROUP BY a,b WITH ROLLUP
2308
  @endcode
2309
2310
  @param idx    Level we are on:
2311
                        - 0 = Total sum level
2312
                        - 1 = First group changed  (a)
2313
                        - 2 = Second group changed (a,b)
2314
2315
  @retval
2316
    0   ok
2317
  @retval
2318
    1   If send_data_failed()
2319
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2320
int Join::rollup_send_data(uint32_t idx)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2321
{
2322
  uint32_t i;
2323
  for (i= send_group_parts ; i-- > idx ; )
2324
  {
2325
    /* Get reference pointers to sum functions in place */
2326
    memcpy(ref_pointer_array, rollup.ref_pointer_arrays[i],
2327
     ref_pointer_array_size);
2328
    if ((!having || having->val_int()))
2329
    {
2330
      if (send_records < unit->select_limit_cnt && do_send_rows &&
2331
    result->send_data(rollup.fields[i]))
2332
  return 1;
2333
      send_records++;
2334
    }
2335
  }
2336
  /* Restore ref_pointer_array */
2337
  set_items_ref_array(current_ref_pointer_array);
2338
  return 0;
2339
}
2340
2341
/**
2342
  Write all rollup levels higher than the current one to a temp table.
2343
2344
  @b SAMPLE
2345
    @code
2346
      SELECT a, b, SUM(c) FROM t1 GROUP BY a,b WITH ROLLUP
2347
  @endcode
2348
2349
  @param idx                 Level we are on:
2350
                               - 0 = Total sum level
2351
                               - 1 = First group changed  (a)
2352
                               - 2 = Second group changed (a,b)
2353
  @param table               reference to temp table
2354
2355
  @retval
2356
    0   ok
2357
  @retval
2358
    1   if write_data_failed()
2359
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2360
int Join::rollup_write_data(uint32_t idx, Table *table_arg)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2361
{
2362
  uint32_t i;
2363
  for (i= send_group_parts ; i-- > idx ; )
2364
  {
2365
    /* Get reference pointers to sum functions in place */
2366
    memcpy(ref_pointer_array, rollup.ref_pointer_arrays[i],
1487.1.1 by Brian Aker
There is room for improvement around this. We should be using rows as well
2367
           ref_pointer_array_size);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2368
    if ((!having || having->val_int()))
2369
    {
2370
      int write_error;
2371
      Item *item;
2372
      List_iterator_fast<Item> it(rollup.fields[i]);
2373
      while ((item= it++))
2374
      {
2375
        if (item->type() == Item::NULL_ITEM && item->is_result_field())
2376
          item->save_in_result_field(1);
2377
      }
2378
      copy_sum_funcs(sum_funcs_end[i+1], sum_funcs_end[i]);
1672.3.6 by Brian Aker
First pass in encapsulating row
2379
      if ((write_error= table_arg->cursor->insertRecord(table_arg->getInsertRecord())))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2380
      {
1487.1.1 by Brian Aker
There is room for improvement around this. We should be using rows as well
2381
        my_error(ER_USE_SQL_BIG_RESULT, MYF(0));
2382
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2383
      }
2384
    }
2385
  }
2386
  /* Restore ref_pointer_array */
2387
  set_items_ref_array(current_ref_pointer_array);
2388
  return 0;
2389
}
2390
2391
/**
2392
  clear results if there are not rows found for group
2393
  (end_send_group/end_write_group)
2394
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2395
void Join::clear()
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2396
{
2397
  clear_tables(this);
2398
  copy_fields(&tmp_table_param);
2399
2400
  if (sum_funcs)
2401
  {
2402
    Item_sum *func, **func_ptr= sum_funcs;
2403
    while ((func= *(func_ptr++)))
2404
      func->clear();
2405
  }
2406
}
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2407
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2408
/**
1541.1.1 by Brian Aker
JOIN -> Join rename
2409
  change select_result object of Join.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2410
2411
  @param res    new select_result object
2412
2413
  @retval
2414
    false   OK
2415
  @retval
2416
    true    error
2417
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2418
bool Join::change_result(select_result *res)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2419
{
2420
  result= res;
2421
  if (result->prepare(fields_list, select_lex->master_unit()))
2422
  {
2423
    return(true);
2424
  }
2425
  return(false);
2426
}
2427
2428
/**
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2429
  Cache constant expressions in WHERE, HAVING, ON conditions.
2430
*/
2431
1541.1.1 by Brian Aker
JOIN -> Join rename
2432
void Join::cache_const_exprs()
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2433
{
1240.8.3 by Dennis Schoen
fix uchar and FALSE
2434
  bool cache_flag= false;
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2435
  bool *analyzer_arg= &cache_flag;
2436
2437
  /* No need in cache if all tables are constant. */
2438
  if (const_tables == tables)
2439
    return;
2440
2441
  if (conds)
1240.8.4 by Dennis Schoen
add Item functions
2442
    conds->compile(&Item::cache_const_expr_analyzer, (unsigned char **)&analyzer_arg,
2443
                  &Item::cache_const_expr_transformer, (unsigned char *)&cache_flag);
1240.8.3 by Dennis Schoen
fix uchar and FALSE
2444
  cache_flag= false;
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2445
  if (having)
1240.8.4 by Dennis Schoen
add Item functions
2446
    having->compile(&Item::cache_const_expr_analyzer, (unsigned char **)&analyzer_arg,
2447
                    &Item::cache_const_expr_transformer, (unsigned char *)&cache_flag);
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2448
1240.8.3 by Dennis Schoen
fix uchar and FALSE
2449
  for (JoinTable *tab= join_tab + const_tables; tab < join_tab + tables ; tab++)
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2450
  {
2451
    if (*tab->on_expr_ref)
2452
    {
1240.8.3 by Dennis Schoen
fix uchar and FALSE
2453
      cache_flag= false;
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2454
      (*tab->on_expr_ref)->compile(&Item::cache_const_expr_analyzer,
1240.8.4 by Dennis Schoen
add Item functions
2455
                                 (unsigned char **)&analyzer_arg,
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2456
                                 &Item::cache_const_expr_transformer,
1240.8.4 by Dennis Schoen
add Item functions
2457
                                 (unsigned char *)&cache_flag);
1240.8.2 by Dennis Schoen
add cache_const_exprs() to JOIN
2458
    }
2459
  }
2460
}
2461
2462
/**
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2463
  @brief
2464
  
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2465
  Process one record of the nested loop join.
2466
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2467
  @details 
2468
2469
  This function will evaluate parts of WHERE/ON clauses that are
2470
  applicable to the partial record on hand and in case of success
2471
  submit this record to the next level of the nested loop.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2472
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2473
enum_nested_loop_state evaluate_join_record(Join *join, JoinTable *join_tab, int error)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2474
{
1039.2.7 by Jay Pipes
Yet more style and indentation cleanups.
2475
  bool not_used_in_distinct= join_tab->not_used_in_distinct;
2476
  ha_rows found_records= join->found_records;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2477
  COND *select_cond= join_tab->select_cond;
2478
2479
  if (error > 0 || (join->session->is_error()))     // Fatal error
2480
    return NESTED_LOOP_ERROR;
2481
  if (error < 0)
2482
    return NESTED_LOOP_NO_MORE_ROWS;
2483
  if (join->session->killed)			// Aborted by user
2484
  {
2485
    join->session->send_kill_message();
971.6.11 by Eric Day
Removed purecov messages.
2486
    return NESTED_LOOP_KILLED;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2487
  }
2488
  if (!select_cond || select_cond->val_int())
2489
  {
2490
    /*
2491
      There is no select condition or the attached pushed down
2492
      condition is true => a match is found.
2493
    */
2494
    bool found= 1;
2495
    while (join_tab->first_unmatched && found)
2496
    {
2497
      /*
2498
        The while condition is always false if join_tab is not
2499
        the last inner join table of an outer join operation.
2500
      */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2501
      JoinTable *first_unmatched= join_tab->first_unmatched;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2502
      /*
2503
        Mark that a match for current outer table is found.
2504
        This activates push down conditional predicates attached
2505
        to the all inner tables of the outer join.
2506
      */
2507
      first_unmatched->found= 1;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2508
      for (JoinTable *tab= first_unmatched; tab <= join_tab; tab++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2509
      {
2510
        if (tab->table->reginfo.not_exists_optimize)
2511
          return NESTED_LOOP_NO_MORE_ROWS;
2512
        /* Check all predicates that has just been activated. */
2513
        /*
2514
          Actually all predicates non-guarded by first_unmatched->found
2515
          will be re-evaluated again. It could be fixed, but, probably,
2516
          it's not worth doing now.
2517
        */
2518
        if (tab->select_cond && !tab->select_cond->val_int())
2519
        {
2520
          /* The condition attached to table tab is false */
2521
          if (tab == join_tab)
2522
            found= 0;
2523
          else
2524
          {
2525
            /*
2526
              Set a return point if rejected predicate is attached
2527
              not to the last table of the current nest level.
2528
            */
2529
            join->return_tab= tab;
2530
            return NESTED_LOOP_OK;
2531
          }
2532
        }
2533
      }
2534
      /*
2535
        Check whether join_tab is not the last inner table
2536
        for another embedding outer join.
2537
      */
2538
      if ((first_unmatched= first_unmatched->first_upper) &&
2539
          first_unmatched->last_inner != join_tab)
2540
        first_unmatched= 0;
2541
      join_tab->first_unmatched= first_unmatched;
2542
    }
2543
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2544
    JoinTable *return_tab= join->return_tab;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2545
    join_tab->found_match= true;
2546
2547
    /*
2548
      It was not just a return to lower loop level when one
2549
      of the newly activated predicates is evaluated as false
2550
      (See above join->return_tab= tab).
2551
    */
2552
    join->examined_rows++;
2553
    join->session->row_count++;
2554
2555
    if (found)
2556
    {
2557
      enum enum_nested_loop_state rc;
2558
      /* A match from join_tab is found for the current partial join. */
2559
      rc= (*join_tab->next_select)(join, join_tab+1, 0);
2560
      if (rc != NESTED_LOOP_OK && rc != NESTED_LOOP_NO_MORE_ROWS)
2561
        return rc;
2562
      if (return_tab < join->return_tab)
2563
        join->return_tab= return_tab;
2564
2565
      if (join->return_tab < join_tab)
2566
        return NESTED_LOOP_OK;
2567
      /*
2568
        Test if this was a SELECT DISTINCT query on a table that
2569
        was not in the field list;  In this case we can abort if
2570
        we found a row, as no new rows can be added to the result.
2571
      */
2572
      if (not_used_in_distinct && found_records != join->found_records)
2573
        return NESTED_LOOP_NO_MORE_ROWS;
2574
    }
2575
    else
1208.3.2 by brian
Update for Cursor renaming.
2576
      join_tab->read_record.cursor->unlock_row();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2577
  }
2578
  else
2579
  {
2580
    /*
2581
      The condition pushed down to the table join_tab rejects all rows
2582
      with the beginning coinciding with the current partial join.
2583
    */
2584
    join->examined_rows++;
2585
    join->session->row_count++;
1208.3.2 by brian
Update for Cursor renaming.
2586
    join_tab->read_record.cursor->unlock_row();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2587
  }
2588
  return NESTED_LOOP_OK;
2589
}
2590
2591
/**
2592
  @details
2593
    Construct a NULL complimented partial join record and feed it to the next
2594
    level of the nested loop. This function is used in case we have
2595
    an OUTER join and no matching record was found.
2596
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2597
enum_nested_loop_state evaluate_null_complemented_join_record(Join *join, JoinTable *join_tab)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2598
{
2599
  /*
2600
    The table join_tab is the first inner table of a outer join operation
2601
    and no matches has been found for the current outer row.
2602
  */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2603
  JoinTable *last_inner_tab= join_tab->last_inner;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2604
  /* Cache variables for faster loop */
2605
  COND *select_cond;
2606
  for ( ; join_tab <= last_inner_tab ; join_tab++)
2607
  {
2608
    /* Change the the values of guard predicate variables. */
2609
    join_tab->found= 1;
2610
    join_tab->not_null_compl= 0;
2611
    /* The outer row is complemented by nulls for each inner tables */
2612
    join_tab->table->restoreRecordAsDefault();  // Make empty record
2613
    join_tab->table->mark_as_null_row();       // For group by without error
2614
    select_cond= join_tab->select_cond;
2615
    /* Check all attached conditions for inner table rows. */
2616
    if (select_cond && !select_cond->val_int())
2617
      return NESTED_LOOP_OK;
2618
  }
2619
  join_tab--;
2620
  /*
2621
    The row complemented by nulls might be the first row
2622
    of embedding outer joins.
2623
    If so, perform the same actions as in the code
2624
    for the first regular outer join row above.
2625
  */
2626
  for ( ; ; )
2627
  {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2628
    JoinTable *first_unmatched= join_tab->first_unmatched;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2629
    if ((first_unmatched= first_unmatched->first_upper) && first_unmatched->last_inner != join_tab)
2630
      first_unmatched= 0;
2631
    join_tab->first_unmatched= first_unmatched;
2632
    if (! first_unmatched)
2633
      break;
2634
    first_unmatched->found= 1;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2635
    for (JoinTable *tab= first_unmatched; tab <= join_tab; tab++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2636
    {
2637
      if (tab->select_cond && !tab->select_cond->val_int())
2638
      {
2639
        join->return_tab= tab;
2640
        return NESTED_LOOP_OK;
2641
      }
2642
    }
2643
  }
2644
  /*
2645
    The row complemented by nulls satisfies all conditions
2646
    attached to inner tables.
2647
    Send the row complemented by nulls to be joined with the
2648
    remaining tables.
2649
  */
2650
  return (*join_tab->next_select)(join, join_tab+1, 0);
2651
}
2652
1541.1.1 by Brian Aker
JOIN -> Join rename
2653
enum_nested_loop_state flush_cached_records(Join *join, JoinTable *join_tab, bool skip_last)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2654
{
2655
  enum_nested_loop_state rc= NESTED_LOOP_OK;
2656
  int error;
1538 by Brian Aker
Code shuffle on ReadRecord
2657
  ReadRecord *info;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2658
2659
  join_tab->table->null_row= 0;
2660
  if (!join_tab->cache.records)
1539.1.7 by Brian Aker
JoinCache rename.
2661
  {
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2662
    return NESTED_LOOP_OK;                      /* Nothing to do */
1539.1.7 by Brian Aker
JoinCache rename.
2663
  }
2664
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2665
  if (skip_last)
1539.1.7 by Brian Aker
JoinCache rename.
2666
  {
2667
    (void) join_tab->cache.store_record_in_cache(); // Must save this for later
2668
  }
2669
2670
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2671
  if (join_tab->use_quick == 2)
2672
  {
2673
    if (join_tab->select->quick)
2674
    {					/* Used quick select last. reset it */
2675
      delete join_tab->select->quick;
2676
      join_tab->select->quick=0;
2677
    }
2678
  }
2679
  /* read through all records */
2680
  if ((error=join_init_read_record(join_tab)))
2681
  {
1539.1.7 by Brian Aker
JoinCache rename.
2682
    join_tab->cache.reset_cache_write();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2683
    return error < 0 ? NESTED_LOOP_NO_MORE_ROWS: NESTED_LOOP_ERROR;
2684
  }
2685
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2686
  for (JoinTable *tmp=join->join_tab; tmp != join_tab ; tmp++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2687
  {
2688
    tmp->status=tmp->table->status;
2689
    tmp->table->status=0;
2690
  }
2691
2692
  info= &join_tab->read_record;
2693
  do
2694
  {
2695
    if (join->session->killed)
2696
    {
2697
      join->session->send_kill_message();
971.6.11 by Eric Day
Removed purecov messages.
2698
      return NESTED_LOOP_KILLED;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2699
    }
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
2700
    optimizer::SqlSelect *select= join_tab->select;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2701
    if (rc == NESTED_LOOP_OK &&
2702
        (!join_tab->cache.select || !join_tab->cache.select->skip_record()))
2703
    {
2704
      uint32_t i;
1539.1.7 by Brian Aker
JoinCache rename.
2705
      join_tab->cache.reset_cache_read();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2706
      for (i=(join_tab->cache.records- (skip_last ? 1 : 0)) ; i-- > 0 ;)
2707
      {
1089.1.13 by Brian Aker
Sorting methods into class files.
2708
	      join_tab->readCachedRecord();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2709
	      if (!select || !select->skip_record())
2710
        {
2711
          int res= 0;
1100.2.1 by Brian Aker
First pass through removing most of the semi_join code.
2712
2713
          rc= (join_tab->next_select)(join,join_tab+1,0);
2714
          if (rc != NESTED_LOOP_OK && rc != NESTED_LOOP_NO_MORE_ROWS)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2715
          {
1539.1.7 by Brian Aker
JoinCache rename.
2716
            join_tab->cache.reset_cache_write();
1100.2.1 by Brian Aker
First pass through removing most of the semi_join code.
2717
            return rc;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2718
          }
1100.2.1 by Brian Aker
First pass through removing most of the semi_join code.
2719
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2720
          if (res == -1)
2721
            return NESTED_LOOP_ERROR;
2722
        }
2723
      }
2724
    }
2725
  } while (!(error=info->read_record(info)));
2726
2727
  if (skip_last)
1089.1.13 by Brian Aker
Sorting methods into class files.
2728
    join_tab->readCachedRecord();		// Restore current record
1539.1.7 by Brian Aker
JoinCache rename.
2729
  join_tab->cache.reset_cache_write();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2730
  if (error > 0)				// Fatal error
971.6.11 by Eric Day
Removed purecov messages.
2731
    return NESTED_LOOP_ERROR;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2732
  for (JoinTable *tmp2=join->join_tab; tmp2 != join_tab ; tmp2++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2733
    tmp2->table->status=tmp2->status;
2734
  return NESTED_LOOP_OK;
2735
}
2736
2737
/*****************************************************************************
2738
  DESCRIPTION
2739
    Functions that end one nested loop iteration. Different functions
2740
    are used to support GROUP BY clause and to redirect records
2741
    to a table (e.g. in case of SELECT into a temporary table) or to the
2742
    network client.
2743
2744
  RETURN VALUES
2745
    NESTED_LOOP_OK           - the record has been successfully handled
2746
    NESTED_LOOP_ERROR        - a fatal error (like table corruption)
2747
                               was detected
2748
    NESTED_LOOP_KILLED       - thread shutdown was requested while processing
2749
                               the record
2750
    NESTED_LOOP_QUERY_LIMIT  - the record has been successfully handled;
2751
                               additionally, the nested loop produced the
2752
                               number of rows specified in the LIMIT clause
2753
                               for the query
2754
    NESTED_LOOP_CURSOR_LIMIT - the record has been successfully handled;
2755
                               additionally, there is a cursor and the nested
2756
                               loop algorithm produced the number of rows
2757
                               that is specified for current cursor fetch
2758
                               operation.
2759
   All return values except NESTED_LOOP_OK abort the nested loop.
2760
*****************************************************************************/
1541.1.1 by Brian Aker
JOIN -> Join rename
2761
enum_nested_loop_state end_send(Join *join, JoinTable *, bool end_of_records)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2762
{
2763
  if (! end_of_records)
2764
  {
2765
    int error;
2766
    if (join->having && join->having->val_int() == 0)
2767
      return NESTED_LOOP_OK;               // Didn't match having
2768
    error= 0;
2769
    if (join->do_send_rows)
2770
      error=join->result->send_data(*join->fields);
2771
    if (error)
971.6.11 by Eric Day
Removed purecov messages.
2772
      return NESTED_LOOP_ERROR;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2773
    if (++join->send_records >= join->unit->select_limit_cnt &&	join->do_send_rows)
2774
    {
2775
      if (join->select_options & OPTION_FOUND_ROWS)
2776
      {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
2777
        JoinTable *jt=join->join_tab;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2778
        if ((join->tables == 1) && !join->tmp_table && !join->sort_and_group
2779
            && !join->send_group_parts && !join->having && !jt->select_cond &&
2780
            !(jt->select && jt->select->quick) &&
1233.1.2 by Brian Aker
Move stat read define into engine flags.
2781
            (jt->table->cursor->getEngine()->check_flag(HTON_BIT_STATS_RECORDS_IS_EXACT)) &&
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2782
                  (jt->ref.key < 0))
2783
        {
2784
          /* Join over all rows in table;  Return number of found rows */
2785
          Table *table= jt->table;
2786
2787
          join->select_options^= OPTION_FOUND_ROWS;
2788
          if (table->sort.record_pointers ||
2789
              (table->sort.io_cache && my_b_inited(table->sort.io_cache)))
2790
          {
2791
            /* Using filesort */
2792
            join->send_records= table->sort.found_records;
2793
          }
2794
          else
2795
          {
1208.3.2 by brian
Update for Cursor renaming.
2796
            table->cursor->info(HA_STATUS_VARIABLE);
2797
            join->send_records= table->cursor->stats.records;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2798
          }
2799
        }
2800
        else
2801
        {
2802
          join->do_send_rows= 0;
2803
          if (join->unit->fake_select_lex)
2804
            join->unit->fake_select_lex->select_limit= 0;
2805
          return NESTED_LOOP_OK;
2806
        }
2807
      }
2808
      return NESTED_LOOP_QUERY_LIMIT;      // Abort nicely
2809
    }
2810
    else if (join->send_records >= join->fetch_limit)
2811
    {
2812
      /*
2813
        There is a server side cursor and all rows for
2814
        this fetch request are sent.
2815
      */
2816
      return NESTED_LOOP_CURSOR_LIMIT;
2817
    }
2818
  }
2819
2820
  return NESTED_LOOP_OK;
2821
}
2822
1541.1.1 by Brian Aker
JOIN -> Join rename
2823
enum_nested_loop_state end_write(Join *join, JoinTable *, bool end_of_records)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2824
{
2825
  Table *table= join->tmp_table;
2826
2827
  if (join->session->killed)			// Aborted by user
2828
  {
2829
    join->session->send_kill_message();
971.6.11 by Eric Day
Removed purecov messages.
2830
    return NESTED_LOOP_KILLED;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2831
  }
2832
  if (!end_of_records)
2833
  {
2834
    copy_fields(&join->tmp_table_param);
2835
    copy_funcs(join->tmp_table_param.items_to_copy);
2836
    if (!join->having || join->having->val_int())
2837
    {
2838
      int error;
2839
      join->found_records++;
1672.3.6 by Brian Aker
First pass in encapsulating row
2840
      if ((error=table->cursor->insertRecord(table->getInsertRecord())))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2841
      {
1208.3.2 by brian
Update for Cursor renaming.
2842
        if (!table->cursor->is_fatal_error(error, HA_CHECK_DUP))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2843
          goto end;
1487.1.1 by Brian Aker
There is room for improvement around this. We should be using rows as well
2844
2845
        my_error(ER_USE_SQL_BIG_RESULT, MYF(0));
2846
        return NESTED_LOOP_ERROR;        // Table is_full error
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2847
      }
2848
      if (++join->send_records >= join->tmp_table_param.end_write_records && join->do_send_rows)
2849
      {
2850
        if (!(join->select_options & OPTION_FOUND_ROWS))
2851
          return NESTED_LOOP_QUERY_LIMIT;
2852
        join->do_send_rows= 0;
2853
        join->unit->select_limit_cnt= HA_POS_ERROR;
2854
        return NESTED_LOOP_OK;
2855
      }
2856
    }
2857
  }
2858
end:
2859
  return NESTED_LOOP_OK;
2860
}
2861
2862
/** Group by searching after group record and updating it if possible. */
1541.1.1 by Brian Aker
JOIN -> Join rename
2863
enum_nested_loop_state end_update(Join *join, JoinTable *, bool end_of_records)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2864
{
2865
  Table *table= join->tmp_table;
2866
  order_st *group;
2867
  int	error;
2868
2869
  if (end_of_records)
2870
    return NESTED_LOOP_OK;
2871
  if (join->session->killed)			// Aborted by user
2872
  {
2873
    join->session->send_kill_message();
971.6.11 by Eric Day
Removed purecov messages.
2874
    return NESTED_LOOP_KILLED;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2875
  }
2876
2877
  join->found_records++;
2878
  copy_fields(&join->tmp_table_param);		// Groups are copied twice.
2879
  /* Make a key of group index */
2880
  for (group=table->group ; group ; group=group->next)
2881
  {
2882
    Item *item= *group->item;
2883
    item->save_org_in_field(group->field);
2884
    /* Store in the used key if the field was 0 */
2885
    if (item->maybe_null)
2886
      group->buff[-1]= (char) group->field->is_null();
2887
  }
1672.3.6 by Brian Aker
First pass in encapsulating row
2888
  if (!table->cursor->index_read_map(table->getUpdateRecord(),
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2889
                                   join->tmp_table_param.group_buff,
2890
                                   HA_WHOLE_KEY,
2891
                                   HA_READ_KEY_EXACT))
2892
  {						/* Update old record */
2893
    table->restoreRecord();
2894
    update_tmptable_sum_func(join->sum_funcs,table);
1672.3.6 by Brian Aker
First pass in encapsulating row
2895
    if ((error= table->cursor->updateRecord(table->getUpdateRecord(),
2896
                                          table->getInsertRecord())))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2897
    {
1216.1.1 by Brian Aker
Move print_error up to Engine.
2898
      table->print_error(error,MYF(0));
971.6.11 by Eric Day
Removed purecov messages.
2899
      return NESTED_LOOP_ERROR;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2900
    }
2901
    return NESTED_LOOP_OK;
2902
  }
2903
2904
  /*
2905
    Copy null bits from group key to table
2906
    We can't copy all data as the key may have different format
2907
    as the row data (for example as with VARCHAR keys)
2908
  */
1534 by Brian Aker
Remove of KeyPartInfo
2909
  KeyPartInfo *key_part;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2910
  for (group=table->group,key_part=table->key_info[0].key_part;
2911
       group ;
2912
       group=group->next,key_part++)
2913
  {
2914
    if (key_part->null_bit)
1672.3.6 by Brian Aker
First pass in encapsulating row
2915
      memcpy(table->getInsertRecord()+key_part->offset, group->buff, 1);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2916
  }
2917
  init_tmptable_sum_functions(join->sum_funcs);
2918
  copy_funcs(join->tmp_table_param.items_to_copy);
1672.3.6 by Brian Aker
First pass in encapsulating row
2919
  if ((error=table->cursor->insertRecord(table->getInsertRecord())))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2920
  {
1487.1.1 by Brian Aker
There is room for improvement around this. We should be using rows as well
2921
    my_error(ER_USE_SQL_BIG_RESULT, MYF(0));
2922
    return NESTED_LOOP_ERROR;        // Table is_full error
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2923
  }
2924
  join->send_records++;
2925
  return NESTED_LOOP_OK;
2926
}
2927
2928
/** Like end_update, but this is done with unique constraints instead of keys.  */
1541.1.1 by Brian Aker
JOIN -> Join rename
2929
enum_nested_loop_state end_unique_update(Join *join, JoinTable *, bool end_of_records)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2930
{
2931
  Table *table= join->tmp_table;
2932
  int	error;
2933
2934
  if (end_of_records)
2935
    return NESTED_LOOP_OK;
2936
  if (join->session->killed)			// Aborted by user
2937
  {
2938
    join->session->send_kill_message();
971.6.11 by Eric Day
Removed purecov messages.
2939
    return NESTED_LOOP_KILLED;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2940
  }
2941
2942
  init_tmptable_sum_functions(join->sum_funcs);
2943
  copy_fields(&join->tmp_table_param);		// Groups are copied twice.
2944
  copy_funcs(join->tmp_table_param.items_to_copy);
2945
1672.3.6 by Brian Aker
First pass in encapsulating row
2946
  if (!(error= table->cursor->insertRecord(table->getInsertRecord())))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2947
    join->send_records++;			// New group
2948
  else
2949
  {
1216.1.1 by Brian Aker
Move print_error up to Engine.
2950
    if ((int) table->get_dup_key(error) < 0)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2951
    {
1216.1.1 by Brian Aker
Move print_error up to Engine.
2952
      table->print_error(error,MYF(0));
971.6.11 by Eric Day
Removed purecov messages.
2953
      return NESTED_LOOP_ERROR;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2954
    }
1672.3.6 by Brian Aker
First pass in encapsulating row
2955
    if (table->cursor->rnd_pos(table->getUpdateRecord(),table->cursor->dup_ref))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2956
    {
1216.1.1 by Brian Aker
Move print_error up to Engine.
2957
      table->print_error(error,MYF(0));
971.6.11 by Eric Day
Removed purecov messages.
2958
      return NESTED_LOOP_ERROR;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2959
    }
2960
    table->restoreRecord();
2961
    update_tmptable_sum_func(join->sum_funcs,table);
1672.3.6 by Brian Aker
First pass in encapsulating row
2962
    if ((error= table->cursor->updateRecord(table->getUpdateRecord(),
2963
                                          table->getInsertRecord())))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2964
    {
1216.1.1 by Brian Aker
Move print_error up to Engine.
2965
      table->print_error(error,MYF(0));
971.6.11 by Eric Day
Removed purecov messages.
2966
      return NESTED_LOOP_ERROR;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2967
    }
2968
  }
2969
  return NESTED_LOOP_OK;
2970
}
2971
2972
/**
2973
  allocate group fields or take prepared (cached).
2974
2975
  @param main_join   join of current select
2976
  @param curr_join   current join (join of current select or temporary copy
2977
                     of it)
2978
2979
  @retval
2980
    0   ok
2981
  @retval
2982
    1   failed
2983
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
2984
static bool make_group_fields(Join *main_join, Join *curr_join)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2985
{
1101.1.16 by Monty Taylor
Reverted 1103
2986
  if (main_join->group_fields_cache.elements)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2987
  {
2988
    curr_join->group_fields= main_join->group_fields_cache;
2989
    curr_join->sort_and_group= 1;
2990
  }
2991
  else
2992
  {
2993
    if (alloc_group_fields(curr_join, curr_join->group_list))
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
2994
      return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
2995
    main_join->group_fields_cache= curr_join->group_fields;
2996
  }
2997
  return (0);
2998
}
2999
3000
/**
3001
  calc how big buffer we need for comparing group entries.
3002
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
3003
static void calc_group_buffer(Join *join,order_st *group)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3004
{
3005
  uint32_t key_length=0, parts=0, null_parts=0;
3006
3007
  if (group)
3008
    join->group= 1;
3009
  for (; group ; group=group->next)
3010
  {
3011
    Item *group_item= *group->item;
3012
    Field *field= group_item->get_tmp_table_field();
3013
    if (field)
3014
    {
3015
      enum_field_types type;
3016
      if ((type= field->type()) == DRIZZLE_TYPE_BLOB)
3017
        key_length+=MAX_BLOB_WIDTH;   // Can't be used as a key
3018
      else if (type == DRIZZLE_TYPE_VARCHAR)
3019
        key_length+= field->field_length + HA_KEY_BLOB_LENGTH;
3020
      else
3021
        key_length+= field->pack_length();
3022
    }
3023
    else
3024
    {
3025
      switch (group_item->result_type()) {
3026
      case REAL_RESULT:
3027
        key_length+= sizeof(double);
3028
        break;
3029
      case INT_RESULT:
3030
        key_length+= sizeof(int64_t);
3031
        break;
3032
      case DECIMAL_RESULT:
3033
        key_length+= my_decimal_get_binary_size(group_item->max_length -
3034
                                                (group_item->decimals ? 1 : 0),
3035
                                                group_item->decimals);
3036
        break;
3037
      case STRING_RESULT:
3038
      {
3039
        enum enum_field_types type= group_item->field_type();
3040
        /*
3041
          As items represented as DATE/TIME fields in the group buffer
3042
          have STRING_RESULT result type, we increase the length
3043
          by 8 as maximum pack length of such fields.
3044
        */
3045
        if (type == DRIZZLE_TYPE_DATE ||
3046
            type == DRIZZLE_TYPE_DATETIME ||
3047
            type == DRIZZLE_TYPE_TIMESTAMP)
3048
        {
3049
          key_length+= 8;
3050
        }
3051
        else
3052
        {
3053
          /*
3054
            Group strings are taken as varstrings and require an length field.
3055
            A field is not yet created by create_tmp_field()
3056
            and the sizes should match up.
3057
          */
3058
          key_length+= group_item->max_length + HA_KEY_BLOB_LENGTH;
3059
        }
3060
        break;
3061
      }
3062
      default:
3063
        /* This case should never be choosen */
3064
        assert(0);
3065
        my_error(ER_OUT_OF_RESOURCES, MYF(ME_FATALERROR));
3066
      }
3067
    }
3068
    parts++;
3069
    if (group_item->maybe_null)
3070
      null_parts++;
3071
  }
3072
  join->tmp_table_param.group_length=key_length+null_parts;
3073
  join->tmp_table_param.group_parts=parts;
3074
  join->tmp_table_param.group_null_parts=null_parts;
3075
}
3076
3077
/**
1101.1.16 by Monty Taylor
Reverted 1103
3078
  Get a list of buffers for saveing last group.
3079
3080
  Groups are saved in reverse order for easyer check loop.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3081
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
3082
static bool alloc_group_fields(Join *join,order_st *group)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3083
{
3084
  if (group)
3085
  {
3086
    for (; group ; group=group->next)
3087
    {
1221.1.1 by Jay Pipes
Fixes some valgrind warnings regarding conditionals depending on unintialized variables. Use initializer lists properly, dang it. :) Also, removed the new_Cached_item() function's use_result_field, as this was only used for views and was producing a valgrind warning unnecessarily.
3088
      Cached_item *tmp= new_Cached_item(join->session, *group->item);
1101.1.16 by Monty Taylor
Reverted 1103
3089
      if (!tmp || join->group_fields.push_front(tmp))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3090
        return true;
3091
    }
3092
  }
3093
  join->sort_and_group=1;     /* Mark for do_select */
3094
  return false;
3095
}
3096
1541.1.1 by Brian Aker
JOIN -> Join rename
3097
static uint32_t cache_record_length(Join *join,uint32_t idx)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3098
{
3099
  uint32_t length=0;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3100
  JoinTable **pos,**end;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3101
  Session *session=join->session;
3102
3103
  for (pos=join->best_ref+join->const_tables,end=join->best_ref+idx ;
3104
       pos != end ;
3105
       pos++)
3106
  {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3107
    JoinTable *join_tab= *pos;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3108
    if (!join_tab->used_fieldlength)    /* Not calced yet */
3109
      calc_used_field_length(session, join_tab);
3110
    length+=join_tab->used_fieldlength;
3111
  }
3112
  return length;
3113
}
3114
3115
/*
3116
  Get the number of different row combinations for subset of partial join
3117
3118
  SYNOPSIS
3119
    prev_record_reads()
3120
      join       The join structure
3121
      idx        Number of tables in the partial join order (i.e. the
3122
                 partial join order is in join->positions[0..idx-1])
3123
      found_ref  Bitmap of tables for which we need to find # of distinct
3124
                 row combinations.
3125
3126
  DESCRIPTION
3127
    Given a partial join order (in join->positions[0..idx-1]) and a subset of
3128
    tables within that join order (specified in found_ref), find out how many
3129
    distinct row combinations of subset tables will be in the result of the
3130
    partial join order.
3131
3132
    This is used as follows: Suppose we have a table accessed with a ref-based
3133
    method. The ref access depends on current rows of tables in found_ref.
3134
    We want to count # of different ref accesses. We assume two ref accesses
3135
    will be different if at least one of access parameters is different.
3136
    Example: consider a query
3137
3138
    SELECT * FROM t1, t2, t3 WHERE t1.key=c1 AND t2.key=c2 AND t3.key=t1.field
3139
3140
    and a join order:
3141
      t1,  ref access on t1.key=c1
3142
      t2,  ref access on t2.key=c2
3143
      t3,  ref access on t3.key=t1.field
3144
3145
    For t1: n_ref_scans = 1, n_distinct_ref_scans = 1
3146
    For t2: n_ref_scans = records_read(t1), n_distinct_ref_scans=1
3147
    For t3: n_ref_scans = records_read(t1)*records_read(t2)
3148
            n_distinct_ref_scans = #records_read(t1)
3149
3150
    The reason for having this function (at least the latest version of it)
3151
    is that we need to account for buffering in join execution.
3152
3153
    An edge-case example: if we have a non-first table in join accessed via
3154
    ref(const) or ref(param) where there is a small number of different
3155
    values of param, then the access will likely hit the disk cache and will
3156
    not require any disk seeks.
3157
3158
    The proper solution would be to assume an LRU disk cache of some size,
3159
    calculate probability of cache hits, etc. For now we just count
3160
    identical ref accesses as one.
3161
3162
  RETURN
3163
    Expected number of row combinations
3164
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
3165
static double prev_record_reads(Join *join, uint32_t idx, table_map found_ref)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3166
{
3167
  double found=1.0;
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
3168
  optimizer::Position *pos_end= join->getSpecificPosInPartialPlan(-1);
3169
  for (optimizer::Position *pos= join->getSpecificPosInPartialPlan(idx - 1); 
1108.6.10 by Padraig O'Sullivan
Changing some accessors to be more clear on whether they are accessing the
3170
       pos != pos_end; 
3171
       pos--)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3172
  {
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
3173
    if (pos->examinePosition(found_ref))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3174
    {
1108.6.28 by Padraig O'Sullivan
Made all data members of the Position class private.
3175
      found_ref|= pos->getRefDependMap();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3176
      /*
1541.1.1 by Brian Aker
JOIN -> Join rename
3177
        For the case of "t1 LEFT Join t2 ON ..." where t2 is a const table
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3178
        with no matching row we will get position[t2].records_read==0.
3179
        Actually the size of output is one null-complemented row, therefore
3180
        we will use value of 1 whenever we get records_read==0.
3181
3182
        Note
3183
        - the above case can't occur if inner part of outer join has more
3184
          than one table: table with no matches will not be marked as const.
3185
3186
        - Ideally we should add 1 to records_read for every possible null-
3187
          complemented row. We're not doing it because: 1. it will require
3188
          non-trivial code and add overhead. 2. The value of records_read
3189
          is an inprecise estimate and adding 1 (or, in the worst case,
3190
          #max_nested_outer_joins=64-1) will not make it any more precise.
3191
      */
1108.6.25 by Padraig O'Sullivan
Made the records_read member of the Position class private.
3192
      if (pos->getFanout() > DBL_EPSILON)
3193
        found*= pos->getFanout();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3194
    }
3195
  }
3196
  return found;
3197
}
3198
3199
/**
3200
  Set up join struct according to best position.
3201
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
3202
static bool get_best_combination(Join *join)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3203
{
3204
  uint32_t i,tablenr;
3205
  table_map used_tables;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3206
  JoinTable *join_tab,*j;
1108.6.56 by Padraig O'Sullivan
Extracted KeyUse into its own header file and placed it within the
3207
  optimizer::KeyUse *keyuse;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3208
  uint32_t table_count;
3209
  Session *session=join->session;
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
3210
  optimizer::Position cur_pos;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3211
3212
  table_count=join->tables;
3213
  if (!(join->join_tab=join_tab=
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3214
  (JoinTable*) session->alloc(sizeof(JoinTable)*table_count)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3215
    return(true);
3216
3217
  join->full_join=0;
3218
3219
  used_tables= OUTER_REF_TABLE_BIT;   // Outer row is already read
3220
  for (j=join_tab, tablenr=0 ; tablenr < table_count ; tablenr++,j++)
3221
  {
3222
    Table *form;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
3223
    cur_pos= join->getPosFromOptimalPlan(tablenr);
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
3224
    *j= *cur_pos.getJoinTable();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3225
    form=join->table[tablenr]=j->table;
3226
    used_tables|= form->map;
3227
    form->reginfo.join_tab=j;
3228
    if (!*j->on_expr_ref)
1541.1.1 by Brian Aker
JOIN -> Join rename
3229
      form->reginfo.not_exists_optimize=0;  // Only with LEFT Join
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
3230
    if (j->type == AM_CONST)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3231
      continue;         // Handled in make_join_stat..
3232
3233
    j->ref.key = -1;
3234
    j->ref.key_parts=0;
3235
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
3236
    if (j->type == AM_SYSTEM)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3237
      continue;
1108.6.27 by Padraig O'Sullivan
Made the key member of the Position class private.
3238
    if (j->keys.none() || ! (keyuse= cur_pos.getKeyUse()))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3239
    {
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
3240
      j->type= AM_ALL;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3241
      if (tablenr != join->const_tables)
3242
        join->full_join=1;
3243
    }
3244
    else if (create_ref_for_key(join, j, keyuse, used_tables))
3245
      return(true);                        // Something went wrong
3246
  }
3247
3248
  for (i=0 ; i < table_count ; i++)
3249
    join->map2table[join->join_tab[i].table->tablenr]=join->join_tab+i;
3250
  update_depend_map(join);
3251
  return(0);
3252
}
3253
3254
/** Save const tables first as used tables. */
1541.1.1 by Brian Aker
JOIN -> Join rename
3255
static void set_position(Join *join,
1108.6.56 by Padraig O'Sullivan
Extracted KeyUse into its own header file and placed it within the
3256
                         uint32_t idx,
3257
                         JoinTable *table,
3258
                         optimizer::KeyUse *key)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3259
{
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
3260
  optimizer::Position tmp_pos(1.0, /* This is a const table */
3261
                              0.0,
3262
                              table,
3263
                              key,
3264
                              0);
1108.6.6 by Padraig O'Sullivan
Adding accessors to the JOIN class for the positions member. The end goal is
3265
  join->setPosInPartialPlan(idx, tmp_pos);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3266
3267
  /* Move the const table as down as possible in best_ref */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3268
  JoinTable **pos=join->best_ref+idx+1;
3269
  JoinTable *next=join->best_ref[idx];
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3270
  for (;next != table ; pos++)
3271
  {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3272
    JoinTable *tmp=pos[0];
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3273
    pos[0]=next;
3274
    next=tmp;
3275
  }
3276
  join->best_ref[idx]=table;
3277
}
3278
3279
/**
3280
  Selects and invokes a search strategy for an optimal query plan.
3281
3282
  The function checks user-configurable parameters that control the search
3283
  strategy for an optimal plan, selects the search method and then invokes
3284
  it. Each specific optimization procedure stores the final optimal plan in
3285
  the array 'join->best_positions', and the cost of the plan in
3286
  'join->best_read'.
3287
3288
  @param join         pointer to the structure providing all context info for
3289
                      the query
3290
  @param join_tables  set of the tables in the query
3291
3292
  @retval
3293
    false       ok
3294
  @retval
3295
    true        Fatal error
3296
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
3297
static bool choose_plan(Join *join, table_map join_tables)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3298
{
3299
  uint32_t search_depth= join->session->variables.optimizer_search_depth;
3300
  uint32_t prune_level=  join->session->variables.optimizer_prune_level;
3301
  bool straight_join= test(join->select_options & SELECT_STRAIGHT_JOIN);
3302
1100.4.1 by Padraig O'Sullivan
Modified the nested_join_map typedef to be std::bitset instead of uint64_t.
3303
  join->cur_embedding_map.reset();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3304
  reset_nj_counters(join->join_list);
3305
  /*
3306
    if (SELECT_STRAIGHT_JOIN option is set)
3307
      reorder tables so dependent tables come after tables they depend
3308
      on, otherwise keep tables in the order they were specified in the query
3309
    else
3310
      Apply heuristic: pre-sort all access plans with respect to the number of
3311
      records accessed.
3312
  */
1280.1.10 by Monty Taylor
Put everything in drizzled into drizzled namespace.
3313
  internal::my_qsort(join->best_ref + join->const_tables,
3314
                     join->tables - join->const_tables, sizeof(JoinTable*),
3315
                     straight_join ? join_tab_cmp_straight : join_tab_cmp);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3316
  if (straight_join)
3317
  {
3318
    optimize_straight_join(join, join_tables);
3319
  }
3320
  else
3321
  {
1108.6.21 by Padraig O'Sullivan
Removed some dead code from the optimizer. find_best() was never being used
3322
    if (search_depth == 0)
3323
      /* Automatically determine a reasonable value for 'search_depth' */
3324
      search_depth= determine_search_depth(join);
3325
    if (greedy_search(join, join_tables, search_depth, prune_level))
1108.6.49 by Padraig O'Sullivan
Fixing up one style issue with a return statement.
3326
      return true;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3327
  }
3328
3329
  /*
3330
    Store the cost of this query into a user variable
3331
    Don't update last_query_cost for statements that are not "flat joins" :
3332
    i.e. they have subqueries, unions or call stored procedures.
3333
    TODO: calculate a correct cost for a query with subqueries and UNIONs.
3334
  */
3335
  if (join->session->lex->is_single_level_stmt())
3336
    join->session->status_var.last_query_cost= join->best_read;
3337
  return(false);
3338
}
3339
3340
/**
3341
  Find the best access path for an extension of a partial execution
3342
  plan and add this path to the plan.
3343
3344
  The function finds the best access path to table 's' from the passed
3345
  partial plan where an access path is the general term for any means to
3346
  access the data in 's'. An access path may use either an index or a scan,
3347
  whichever is cheaper. The input partial plan is passed via the array
3348
  'join->positions' of length 'idx'. The chosen access method for 's' and its
3349
  cost are stored in 'join->positions[idx]'.
3350
3351
  @param join             pointer to the structure providing all context info
3352
                          for the query
3353
  @param s                the table to be joined by the function
3354
  @param session              thread for the connection that submitted the query
3355
  @param remaining_tables set of tables not included into the partial plan yet
3356
  @param idx              the length of the partial plan
3357
  @param record_count     estimate for the number of records returned by the
3358
                          partial plan
3359
  @param read_time        the cost of the partial plan
3360
3361
  @return
3362
    None
3363
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
3364
static void best_access_path(Join *join,
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3365
                             JoinTable *s,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3366
                             Session *session,
3367
                             table_map remaining_tables,
3368
                             uint32_t idx,
3369
                             double record_count,
3370
                             double)
3371
{
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
3372
  optimizer::KeyUse *best_key= NULL;
1161.2.1 by Padraig O'Sullivan
Fix for bug 444827.
3373
  uint32_t best_max_key_part= 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3374
  bool found_constraint= 0;
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
3375
  double best= DBL_MAX;
3376
  double best_time= DBL_MAX;
3377
  double records= DBL_MAX;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3378
  table_map best_ref_depends_map= 0;
3379
  double tmp;
3380
  ha_rows rec;
3381
3382
  if (s->keyuse)
3383
  {                                            /* Use key if possible */
3384
    Table *table= s->table;
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
3385
    optimizer::KeyUse *keyuse= NULL;
3386
    optimizer::KeyUse *start_key= NULL;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3387
    double best_records= DBL_MAX;
3388
    uint32_t max_key_part=0;
3389
3390
    /* Test how we can use keys */
3391
    rec= s->records/MATCHING_ROWS_IN_OTHER_TABLE;  // Assumed records/key
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
3392
    for (keyuse= s->keyuse; keyuse->getTable() == table; )
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3393
    {
3394
      key_part_map found_part= 0;
3395
      table_map found_ref= 0;
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3396
      uint32_t key= keyuse->getKey();
1535 by Brian Aker
Rename of KEY to KeyInfo
3397
      KeyInfo *keyinfo= table->key_info + key;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3398
      /* Bitmap of keyparts where the ref access is over 'keypart=const': */
3399
      key_part_map const_part= 0;
3400
      /* The or-null keypart in ref-or-null access: */
3401
      key_part_map ref_or_null_part= 0;
3402
3403
      /* Calculate how many key segments of the current key we can use */
3404
      start_key= keyuse;
3405
3406
      do /* For each keypart */
3407
      {
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3408
        uint32_t keypart= keyuse->getKeypart();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3409
        table_map best_part_found_ref= 0;
3410
        double best_prev_record_reads= DBL_MAX;
3411
3412
        do /* For each way to access the keypart */
3413
        {
3414
3415
          /*
3416
            if 1. expression doesn't refer to forward tables
3417
               2. we won't get two ref-or-null's
3418
          */
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3419
          if (! (remaining_tables & keyuse->getUsedTables()) &&
3420
              ! (ref_or_null_part && (keyuse->getOptimizeFlags() &
3421
                                      KEY_OPTIMIZE_REF_OR_NULL)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3422
          {
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3423
            found_part|= keyuse->getKeypartMap();
3424
            if (! (keyuse->getUsedTables() & ~join->const_table_map))
3425
              const_part|= keyuse->getKeypartMap();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3426
3427
            double tmp2= prev_record_reads(join, idx, (found_ref |
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3428
                                                       keyuse->getUsedTables()));
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3429
            if (tmp2 < best_prev_record_reads)
3430
            {
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3431
              best_part_found_ref= keyuse->getUsedTables() & ~join->const_table_map;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3432
              best_prev_record_reads= tmp2;
3433
            }
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3434
            if (rec > keyuse->getTableRows())
3435
              rec= keyuse->getTableRows();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3436
      /*
3437
        If there is one 'key_column IS NULL' expression, we can
3438
        use this ref_or_null optimisation of this field
3439
      */
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3440
            if (keyuse->getOptimizeFlags() & KEY_OPTIMIZE_REF_OR_NULL)
3441
              ref_or_null_part|= keyuse->getKeypartMap();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3442
          }
3443
3444
          keyuse++;
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3445
        } while (keyuse->getTable() == table && keyuse->getKey() == key &&
3446
                 keyuse->getKeypart() == keypart);
3447
        found_ref|= best_part_found_ref;
3448
      } while (keyuse->getTable() == table && keyuse->getKey() == key);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3449
3450
      /*
3451
        Assume that that each key matches a proportional part of table.
3452
      */
1100.2.1 by Brian Aker
First pass through removing most of the semi_join code.
3453
      if (!found_part)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3454
        continue;                               // Nothing usable found
3455
3456
      if (rec < MATCHING_ROWS_IN_OTHER_TABLE)
3457
        rec= MATCHING_ROWS_IN_OTHER_TABLE;      // Fix for small tables
3458
3459
      {
3460
        found_constraint= 1;
3461
3462
        /*
3463
          Check if we found full key
3464
        */
3465
        if (found_part == PREV_BITS(uint,keyinfo->key_parts) &&
3466
            !ref_or_null_part)
3467
        {                                         /* use eq key */
3468
          max_key_part= UINT32_MAX;
3469
          if ((keyinfo->flags & (HA_NOSAME | HA_NULL_PART_KEY)) == HA_NOSAME)
3470
          {
3471
            tmp = prev_record_reads(join, idx, found_ref);
3472
            records=1.0;
3473
          }
3474
          else
3475
          {
3476
            if (!found_ref)
3477
            {                                     /* We found a const key */
3478
              /*
3479
                ReuseRangeEstimateForRef-1:
3480
                We get here if we've found a ref(const) (c_i are constants):
3481
                  "(keypart1=c1) AND ... AND (keypartN=cN)"   [ref_const_cond]
3482
3483
                If range optimizer was able to construct a "range"
3484
                access on this index, then its condition "quick_cond" was
3485
                eqivalent to ref_const_cond (*), and we can re-use E(#rows)
3486
                from the range optimizer.
3487
3488
                Proof of (*): By properties of range and ref optimizers
3489
                quick_cond will be equal or tighther than ref_const_cond.
3490
                ref_const_cond already covers "smallest" possible interval -
3491
                a singlepoint interval over all keyparts. Therefore,
3492
                quick_cond is equivalent to ref_const_cond (if it was an
3493
                empty interval we wouldn't have got here).
3494
              */
3495
              if (table->quick_keys.test(key))
3496
                records= (double) table->quick_rows[key];
3497
              else
3498
              {
3499
                /* quick_range couldn't use key! */
3500
                records= (double) s->records/rec;
3501
              }
3502
            }
3503
            else
3504
            {
3505
              if (!(records=keyinfo->rec_per_key[keyinfo->key_parts-1]))
3506
              {                                   /* Prefer longer keys */
3507
                records=
3508
                  ((double) s->records / (double) rec *
3509
                   (1.0 +
1532.1.15 by Brian Aker
Partial encapsulation of TableShare from Table.
3510
                    ((double) (table->getShare()->max_key_length-keyinfo->key_length) /
3511
                     (double) table->getShare()->max_key_length)));
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3512
                if (records < 2.0)
3513
                  records=2.0;               /* Can't be as good as a unique */
3514
              }
3515
              /*
3516
                ReuseRangeEstimateForRef-2:  We get here if we could not reuse
3517
                E(#rows) from range optimizer. Make another try:
3518
3519
                If range optimizer produced E(#rows) for a prefix of the ref
3520
                access we're considering, and that E(#rows) is lower then our
3521
                current estimate, make an adjustment. The criteria of when we
3522
                can make an adjustment is a special case of the criteria used
3523
                in ReuseRangeEstimateForRef-3.
3524
              */
3525
              if (table->quick_keys.test(key) &&
3526
                  const_part & (1 << table->quick_key_parts[key]) &&
3527
                  table->quick_n_ranges[key] == 1 &&
3528
                  records > (double) table->quick_rows[key])
3529
              {
3530
                records= (double) table->quick_rows[key];
3531
              }
3532
            }
3533
            /* Limit the number of matched rows */
3534
            tmp= records;
3535
            set_if_smaller(tmp, (double) session->variables.max_seeks_for_key);
3536
            if (table->covering_keys.test(key))
3537
            {
3538
              /* we can use only index tree */
1208.3.2 by brian
Update for Cursor renaming.
3539
              tmp= record_count * table->cursor->index_only_read_time(key, tmp);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3540
            }
3541
            else
1067.4.4 by Nathan Williams
The rest of the files in the drizzled directory were purged of the cmin macro and replace with std::min (except for the definition in globals.h and 1 usage in stacktrace.cc).
3542
              tmp= record_count * min(tmp,s->worst_seeks);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3543
          }
3544
        }
3545
        else
3546
        {
3547
          /*
3548
            Use as much key-parts as possible and a uniq key is better
3549
            than a not unique key
3550
            Set tmp to (previous record count) * (records / combination)
3551
          */
3552
          if ((found_part & 1) &&
1235.1.14 by Brian Aker
Final move of index flags up to Engine (new interface still needed).
3553
              (!(table->index_flags(key) & HA_ONLY_WHOLE_INDEX) ||
1235.1.12 by Brian Aker
Clean up index interface before moving to SE.
3554
               found_part == PREV_BITS(uint, keyinfo->key_parts)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3555
          {
3556
            max_key_part= max_part_bit(found_part);
3557
            /*
3558
              ReuseRangeEstimateForRef-3:
3559
              We're now considering a ref[or_null] access via
3560
              (t.keypart1=e1 AND ... AND t.keypartK=eK) [ OR
3561
              (same-as-above but with one cond replaced
3562
               with "t.keypart_i IS NULL")]  (**)
3563
3564
              Try re-using E(#rows) from "range" optimizer:
3565
              We can do so if "range" optimizer used the same intervals as
3566
              in (**). The intervals used by range optimizer may be not
3567
              available at this point (as "range" access might have choosen to
3568
              create quick select over another index), so we can't compare
3569
              them to (**). We'll make indirect judgements instead.
3570
              The sufficient conditions for re-use are:
3571
              (C1) All e_i in (**) are constants, i.e. found_ref==false. (if
3572
                   this is not satisfied we have no way to know which ranges
3573
                   will be actually scanned by 'ref' until we execute the
3574
                   join)
3575
              (C2) max #key parts in 'range' access == K == max_key_part (this
3576
                   is apparently a necessary requirement)
3577
3578
              We also have a property that "range optimizer produces equal or
3579
              tighter set of scan intervals than ref(const) optimizer". Each
3580
              of the intervals in (**) are "tightest possible" intervals when
3581
              one limits itself to using keyparts 1..K (which we do in #2).
3582
              From here it follows that range access used either one, or
3583
              both of the (I1) and (I2) intervals:
3584
3585
               (t.keypart1=c1 AND ... AND t.keypartK=eK)  (I1)
3586
               (same-as-above but with one cond replaced
3587
                with "t.keypart_i IS NULL")               (I2)
3588
3589
              The remaining part is to exclude the situation where range
3590
              optimizer used one interval while we're considering
3591
              ref-or-null and looking for estimate for two intervals. This
3592
              is done by last limitation:
3593
3594
              (C3) "range optimizer used (have ref_or_null?2:1) intervals"
3595
            */
3596
            if (table->quick_keys.test(key) && !found_ref &&          //(C1)
3597
                table->quick_key_parts[key] == max_key_part &&          //(C2)
3598
                table->quick_n_ranges[key] == 1+((ref_or_null_part)?1:0)) //(C3)
3599
            {
3600
              tmp= records= (double) table->quick_rows[key];
3601
            }
3602
            else
3603
            {
3604
              /* Check if we have statistic about the distribution */
3605
              if ((records= keyinfo->rec_per_key[max_key_part-1]))
3606
              {
3607
                /*
3608
                  Fix for the case where the index statistics is too
3609
                  optimistic: If
3610
                  (1) We're considering ref(const) and there is quick select
3611
                      on the same index,
3612
                  (2) and that quick select uses more keyparts (i.e. it will
3613
                      scan equal/smaller interval then this ref(const))
3614
                  (3) and E(#rows) for quick select is higher then our
3615
                      estimate,
3616
                  Then
3617
                    We'll use E(#rows) from quick select.
3618
3619
                  Q: Why do we choose to use 'ref'? Won't quick select be
3620
                  cheaper in some cases ?
3621
                  TODO: figure this out and adjust the plan choice if needed.
3622
                */
3623
                if (!found_ref && table->quick_keys.test(key) &&    // (1)
3624
                    table->quick_key_parts[key] > max_key_part &&     // (2)
3625
                    records < (double)table->quick_rows[key])         // (3)
3626
                  records= (double)table->quick_rows[key];
3627
3628
                tmp= records;
3629
              }
3630
              else
3631
              {
3632
                /*
1208.3.2 by brian
Update for Cursor renaming.
3633
                  Assume that the first key part matches 1% of the cursor
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3634
                  and that the whole key matches 10 (duplicates) or 1
3635
                  (unique) records.
3636
                  Assume also that more key matches proportionally more
3637
                  records
3638
                  This gives the formula:
3639
                  records = (x * (b-a) + a*c-b)/(c-1)
3640
3641
                  b = records matched by whole key
3642
                  a = records matched by first key part (1% of all records?)
3643
                  c = number of key parts in key
3644
                  x = used key parts (1 <= x <= c)
3645
                */
3646
                double rec_per_key;
3647
                if (!(rec_per_key=(double)
3648
                      keyinfo->rec_per_key[keyinfo->key_parts-1]))
3649
                  rec_per_key=(double) s->records/rec+1;
3650
3651
                if (!s->records)
3652
                  tmp = 0;
3653
                else if (rec_per_key/(double) s->records >= 0.01)
3654
                  tmp = rec_per_key;
3655
                else
3656
                {
3657
                  double a=s->records*0.01;
3658
                  if (keyinfo->key_parts > 1)
3659
                    tmp= (max_key_part * (rec_per_key - a) +
3660
                          a*keyinfo->key_parts - rec_per_key)/
3661
                         (keyinfo->key_parts-1);
3662
                  else
3663
                    tmp= a;
3664
                  set_if_bigger(tmp,1.0);
3665
                }
3666
                records = (uint32_t) tmp;
3667
              }
3668
3669
              if (ref_or_null_part)
3670
              {
3671
                /* We need to do two key searches to find key */
3672
                tmp *= 2.0;
3673
                records *= 2.0;
3674
              }
3675
3676
              /*
3677
                ReuseRangeEstimateForRef-4:  We get here if we could not reuse
3678
                E(#rows) from range optimizer. Make another try:
3679
3680
                If range optimizer produced E(#rows) for a prefix of the ref
3681
                access we're considering, and that E(#rows) is lower then our
3682
                current estimate, make the adjustment.
3683
3684
                The decision whether we can re-use the estimate from the range
3685
                optimizer is the same as in ReuseRangeEstimateForRef-3,
3686
                applied to first table->quick_key_parts[key] key parts.
3687
              */
3688
              if (table->quick_keys.test(key) &&
3689
                  table->quick_key_parts[key] <= max_key_part &&
3690
                  const_part & (1 << table->quick_key_parts[key]) &&
3691
                  table->quick_n_ranges[key] == 1 + ((ref_or_null_part &
3692
                                                     const_part) ? 1 : 0) &&
3693
                  records > (double) table->quick_rows[key])
3694
              {
3695
                tmp= records= (double) table->quick_rows[key];
3696
              }
3697
            }
3698
3699
            /* Limit the number of matched rows */
3700
            set_if_smaller(tmp, (double) session->variables.max_seeks_for_key);
3701
            if (table->covering_keys.test(key))
3702
            {
3703
              /* we can use only index tree */
1208.3.2 by brian
Update for Cursor renaming.
3704
              tmp= record_count * table->cursor->index_only_read_time(key, tmp);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3705
            }
3706
            else
1067.4.4 by Nathan Williams
The rest of the files in the drizzled directory were purged of the cmin macro and replace with std::min (except for the definition in globals.h and 1 usage in stacktrace.cc).
3707
              tmp= record_count * min(tmp,s->worst_seeks);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3708
          }
3709
          else
3710
            tmp= best_time;                    // Do nothing
3711
        }
3712
3713
      }
3714
      if (tmp < best_time - records/(double) TIME_FOR_COMPARE)
3715
      {
3716
        best_time= tmp + records/(double) TIME_FOR_COMPARE;
3717
        best= tmp;
3718
        best_records= records;
3719
        best_key= start_key;
3720
        best_max_key_part= max_key_part;
3721
        best_ref_depends_map= found_ref;
3722
      }
3723
    }
3724
    records= best_records;
3725
  }
3726
3727
  /*
3728
    Don't test table scan if it can't be better.
3729
    Prefer key lookup if we would use the same key for scanning.
3730
3731
    Don't do a table scan on InnoDB tables, if we can read the used
3732
    parts of the row from any of the used index.
3733
    This is because table scans uses index and we would not win
3734
    anything by using a table scan.
3735
3736
    A word for word translation of the below if-statement in sergefp's
3737
    understanding: we check if we should use table scan if:
3738
    (1) The found 'ref' access produces more records than a table scan
3739
        (or index scan, or quick select), or 'ref' is more expensive than
3740
        any of them.
3741
    (2) This doesn't hold: the best way to perform table scan is to to perform
3742
        'range' access using index IDX, and the best way to perform 'ref'
3743
        access is to use the same index IDX, with the same or more key parts.
3744
        (note: it is not clear how this rule is/should be extended to
3745
        index_merge quick selects)
3746
    (3) See above note about InnoDB.
3747
    (4) NOT ("FORCE INDEX(...)" is used for table and there is 'ref' access
3748
             path, but there is no quick select)
3749
        If the condition in the above brackets holds, then the only possible
3750
        "table scan" access method is ALL/index (there is no quick select).
3751
        Since we have a 'ref' access path, and FORCE INDEX instructs us to
3752
        choose it over ALL/index, there is no need to consider a full table
3753
        scan.
3754
  */
3755
  if ((records >= s->found_records || best > s->read_time) &&            // (1)
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3756
      ! (s->quick && best_key && s->quick->index == best_key->getKey() &&      // (2)
3757
        best_max_key_part >= s->table->quick_key_parts[best_key->getKey()]) &&// (2)
1233.1.4 by Brian Aker
Added:
3758
      ! ((s->table->cursor->getEngine()->check_flag(HTON_BIT_TABLE_SCAN_ON_INDEX)) &&   // (3)
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
3759
        ! s->table->covering_keys.none() && best_key && !s->quick) && // (3)
3760
      ! (s->table->force_index && best_key && !s->quick))                 // (4)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3761
  {                                             // Check full join
3762
    ha_rows rnd_records= s->found_records;
3763
    /*
3764
      If there is a filtering condition on the table (i.e. ref analyzer found
3765
      at least one "table.keyXpartY= exprZ", where exprZ refers only to tables
3766
      preceding this table in the join order we're now considering), then
3767
      assume that 25% of the rows will be filtered out by this condition.
3768
3769
      This heuristic is supposed to force tables used in exprZ to be before
3770
      this table in join order.
3771
    */
3772
    if (found_constraint)
3773
      rnd_records-= rnd_records/4;
3774
3775
    /*
3776
      If applicable, get a more accurate estimate. Don't use the two
3777
      heuristics at once.
3778
    */
3779
    if (s->table->quick_condition_rows != s->found_records)
3780
      rnd_records= s->table->quick_condition_rows;
3781
3782
    /*
3783
      Range optimizer never proposes a RANGE if it isn't better
3784
      than FULL: so if RANGE is present, it's always preferred to FULL.
3785
      Here we estimate its cost.
3786
    */
3787
    if (s->quick)
3788
    {
3789
      /*
3790
        For each record we:
3791
        - read record range through 'quick'
3792
        - skip rows which does not satisfy WHERE constraints
3793
        TODO:
3794
        We take into account possible use of join cache for ALL/index
3795
        access (see first else-branch below), but we don't take it into
3796
        account here for range/index_merge access. Find out why this is so.
3797
      */
3798
      tmp= record_count *
3799
        (s->quick->read_time +
3800
         (s->found_records - rnd_records)/(double) TIME_FOR_COMPARE);
3801
    }
3802
    else
3803
    {
3804
      /* Estimate cost of reading table. */
1208.3.2 by brian
Update for Cursor renaming.
3805
      tmp= s->table->cursor->scan_time();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3806
      if (s->table->map & join->outer_join)     // Can't use join cache
3807
      {
3808
        /*
3809
          For each record we have to:
3810
          - read the whole table record
3811
          - skip rows which does not satisfy join condition
3812
        */
3813
        tmp= record_count *
3814
          (tmp +
3815
           (s->records - rnd_records)/(double) TIME_FOR_COMPARE);
3816
      }
3817
      else
3818
      {
3819
        /* We read the table as many times as join buffer becomes full. */
3820
        tmp*= (1.0 + floor((double) cache_record_length(join,idx) *
3821
                           record_count /
3822
                           (double) session->variables.join_buff_size));
3823
        /*
3824
            We don't make full cartesian product between rows in the scanned
3825
           table and existing records because we skip all rows from the
3826
           scanned table, which does not satisfy join condition when
3827
           we read the table (see flush_cached_records for details). Here we
3828
           take into account cost to read and skip these records.
3829
        */
3830
        tmp+= (s->records - rnd_records)/(double) TIME_FOR_COMPARE;
3831
      }
3832
    }
3833
3834
    /*
3835
      We estimate the cost of evaluating WHERE clause for found records
3836
      as record_count * rnd_records / TIME_FOR_COMPARE. This cost plus
3837
      tmp give us total cost of using Table SCAN
3838
    */
3839
    if (best == DBL_MAX ||
3840
        (tmp  + record_count/(double) TIME_FOR_COMPARE*rnd_records <
3841
         best + record_count/(double) TIME_FOR_COMPARE*records))
3842
    {
3843
      /*
3844
        If the table has a range (s->quick is set) make_join_select()
3845
        will ensure that this will be used
3846
      */
3847
      best= tmp;
3848
      records= rows2double(rnd_records);
3849
      best_key= 0;
3850
      /* range/index_merge/ALL/index access method are "independent", so: */
3851
      best_ref_depends_map= 0;
3852
    }
3853
  }
3854
3855
  /* Update the cost information for the current partial plan */
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
3856
  optimizer::Position tmp_pos(records,
3857
                              best,
3858
                              s,
3859
                              best_key,
3860
                              best_ref_depends_map);
1108.6.6 by Padraig O'Sullivan
Adding accessors to the JOIN class for the positions member. The end goal is
3861
  join->setPosInPartialPlan(idx, tmp_pos);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3862
3863
  if (!best_key &&
3864
      idx == join->const_tables &&
3865
      s->table == join->sort_by_table &&
3866
      join->unit->select_limit_cnt >= records)
3867
    join->sort_by_table= (Table*) 1;  // Must use temporary table
3868
3869
  return;
3870
}
3871
3872
/**
3873
  Select the best ways to access the tables in a query without reordering them.
3874
3875
    Find the best access paths for each query table and compute their costs
3876
    according to their order in the array 'join->best_ref' (thus without
3877
    reordering the join tables). The function calls sequentially
3878
    'best_access_path' for each table in the query to select the best table
3879
    access method. The final optimal plan is stored in the array
3880
    'join->best_positions', and the corresponding cost in 'join->best_read'.
3881
3882
  @param join          pointer to the structure providing all context info for
3883
                       the query
3884
  @param join_tables   set of the tables in the query
3885
3886
  @note
3887
    This function can be applied to:
3888
    - queries with STRAIGHT_JOIN
3889
    - internally to compute the cost of an arbitrary QEP
3890
  @par
3891
    Thus 'optimize_straight_join' can be used at any stage of the query
3892
    optimization process to finalize a QEP as it is.
3893
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
3894
static void optimize_straight_join(Join *join, table_map join_tables)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3895
{
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3896
  JoinTable *s;
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
3897
  optimizer::Position partial_pos;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3898
  uint32_t idx= join->const_tables;
3899
  double    record_count= 1.0;
3900
  double    read_time=    0.0;
3901
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
3902
  for (JoinTable **pos= join->best_ref + idx ; (s= *pos) ; pos++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3903
  {
3904
    /* Find the best access method from 's' to the current partial plan */
3905
    best_access_path(join, s, join->session, join_tables, idx,
3906
                     record_count, read_time);
3907
    /* compute the cost of the new plan extended with 's' */
1108.6.7 by Padraig O'Sullivan
More work on attempts to encapsulate the positions member of JOIN. We can
3908
    partial_pos= join->getPosFromPartialPlan(idx);
1108.6.25 by Padraig O'Sullivan
Made the records_read member of the Position class private.
3909
    record_count*= partial_pos.getFanout();
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
3910
    read_time+=    partial_pos.getCost();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3911
    join_tables&= ~(s->table->map);
3912
    ++idx;
3913
  }
3914
3915
  read_time+= record_count / (double) TIME_FOR_COMPARE;
1108.6.7 by Padraig O'Sullivan
More work on attempts to encapsulate the positions member of JOIN. We can
3916
  partial_pos= join->getPosFromPartialPlan(join->const_tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3917
  if (join->sort_by_table &&
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
3918
      partial_pos.hasTableForSorting(join->sort_by_table))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3919
    read_time+= record_count;  // We have to make a temp table
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
3920
  join->copyPartialPlanIntoOptimalPlan(idx);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
3921
  join->best_read= read_time;
3922
}
3923
3924
/**
3925
  Find a good, possibly optimal, query execution plan (QEP) by a greedy search.
3926
3927
    The search procedure uses a hybrid greedy/exhaustive search with controlled
3928
    exhaustiveness. The search is performed in N = card(remaining_tables)
3929
    steps. Each step evaluates how promising is each of the unoptimized tables,
3930
    selects the most promising table, and extends the current partial QEP with
3931
    that table.  Currenly the most 'promising' table is the one with least
3932
    expensive extension.\
3933
3934
    There are two extreme cases:
3935
    -# When (card(remaining_tables) < search_depth), the estimate finds the
3936
    best complete continuation of the partial QEP. This continuation can be
3937
    used directly as a result of the search.
3938
    -# When (search_depth == 1) the 'best_extension_by_limited_search'
3939
    consideres the extension of the current QEP with each of the remaining
3940
    unoptimized tables.
3941
3942
    All other cases are in-between these two extremes. Thus the parameter
3943
    'search_depth' controlls the exhaustiveness of the search. The higher the
3944
    value, the longer the optimizaton time and possibly the better the
3945
    resulting plan. The lower the value, the fewer alternative plans are
3946
    estimated, but the more likely to get a bad QEP.
3947
3948
    All intermediate and final results of the procedure are stored in 'join':
3949
    - join->positions     : modified for every partial QEP that is explored
3950
    - join->best_positions: modified for the current best complete QEP
3951
    - join->best_read     : modified for the current best complete QEP
3952
    - join->best_ref      : might be partially reordered
3953
3954
    The final optimal plan is stored in 'join->best_positions', and its
3955
    corresponding cost in 'join->best_read'.
3956
3957
  @note
3958
    The following pseudocode describes the algorithm of 'greedy_search':
3959
3960
    @code
3961
    procedure greedy_search
3962
    input: remaining_tables
3963
    output: pplan;
3964
    {
3965
      pplan = <>;
3966
      do {
3967
        (t, a) = best_extension(pplan, remaining_tables);
3968
        pplan = concat(pplan, (t, a));
3969
        remaining_tables = remaining_tables - t;
3970
      } while (remaining_tables != {})
3971
      return pplan;
3972
    }
3973
3974
  @endcode
3975
    where 'best_extension' is a placeholder for a procedure that selects the
3976
    most "promising" of all tables in 'remaining_tables'.
3977
    Currently this estimate is performed by calling
3978
    'best_extension_by_limited_search' to evaluate all extensions of the
3979
    current QEP of size 'search_depth', thus the complexity of 'greedy_search'
3980
    mainly depends on that of 'best_extension_by_limited_search'.
3981
3982
  @par
3983
    If 'best_extension()' == 'best_extension_by_limited_search()', then the
3984
    worst-case complexity of this algorithm is <=
3985
    O(N*N^search_depth/search_depth). When serch_depth >= N, then the
3986
    complexity of greedy_search is O(N!).
3987
3988
  @par
3989
    In the future, 'greedy_search' might be extended to support other
3990
    implementations of 'best_extension', e.g. some simpler quadratic procedure.
3991
3992
  @param join             pointer to the structure providing all context info
3993
                          for the query
3994
  @param remaining_tables set of tables not included into the partial plan yet
3995
  @param search_depth     controlls the exhaustiveness of the search
3996
  @param prune_level      the pruning heuristics that should be applied during
3997
                          search
3998
3999
  @retval
4000
    false       ok
4001
  @retval
4002
    true        Fatal error
4003
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
4004
static bool greedy_search(Join      *join,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4005
              table_map remaining_tables,
4006
              uint32_t      search_depth,
4007
              uint32_t      prune_level)
4008
{
4009
  double    record_count= 1.0;
4010
  double    read_time=    0.0;
4011
  uint32_t      idx= join->const_tables; // index into 'join->best_ref'
4012
  uint32_t      best_idx;
4013
  uint32_t      size_remain;    // cardinality of remaining_tables
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
4014
  optimizer::Position best_pos;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4015
  JoinTable  *best_table; // the next plan node to be added to the curr QEP
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4016
4017
  /* number of tables that remain to be optimized */
1280.1.10 by Monty Taylor
Put everything in drizzled into drizzled namespace.
4018
  size_remain= internal::my_count_bits(remaining_tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4019
4020
  do {
4021
    /* Find the extension of the current QEP with the lowest cost */
4022
    join->best_read= DBL_MAX;
4023
    if (best_extension_by_limited_search(join, remaining_tables, idx, record_count,
4024
                                         read_time, search_depth, prune_level))
4025
      return(true);
4026
4027
    if (size_remain <= search_depth)
4028
    {
4029
      /*
4030
        'join->best_positions' contains a complete optimal extension of the
4031
        current partial QEP.
4032
      */
4033
      return(false);
4034
    }
4035
4036
    /* select the first table in the optimal extension as most promising */
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4037
    best_pos= join->getPosFromOptimalPlan(idx);
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
4038
    best_table= best_pos.getJoinTable();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4039
    /*
4040
      Each subsequent loop of 'best_extension_by_limited_search' uses
4041
      'join->positions' for cost estimates, therefore we have to update its
4042
      value.
4043
    */
1108.6.7 by Padraig O'Sullivan
More work on attempts to encapsulate the positions member of JOIN. We can
4044
    join->setPosInPartialPlan(idx, best_pos);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4045
1637.5.9 by Prafulla Tekawade
Fix for Bug 592444
4046
    /*
4047
      We need to make best_extension_by_limited_search aware of the fact
4048
      that it's not starting from top level, but from a rather specific
4049
      position in the list of nested joins.
4050
    */
4051
    check_interleaving_with_nj (best_table);
4052
    
4053
      
4054
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4055
    /* find the position of 'best_table' in 'join->best_ref' */
4056
    best_idx= idx;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4057
    JoinTable *pos= join->best_ref[best_idx];
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4058
    while (pos && best_table != pos)
4059
      pos= join->best_ref[++best_idx];
4060
    assert((pos != NULL)); // should always find 'best_table'
4061
    /* move 'best_table' at the first free position in the array of joins */
4062
    std::swap(join->best_ref[idx], join->best_ref[best_idx]);
4063
4064
    /* compute the cost of the new plan extended with 'best_table' */
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
4065
    optimizer::Position partial_pos= join->getPosFromPartialPlan(idx);
1108.6.25 by Padraig O'Sullivan
Made the records_read member of the Position class private.
4066
    record_count*= partial_pos.getFanout();
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
4067
    read_time+=    partial_pos.getCost();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4068
4069
    remaining_tables&= ~(best_table->table->map);
4070
    --size_remain;
4071
    ++idx;
4072
  } while (true);
4073
}
4074
4075
4076
/**
4077
  Find a good, possibly optimal, query execution plan (QEP) by a possibly
4078
  exhaustive search.
4079
4080
    The procedure searches for the optimal ordering of the query tables in set
4081
    'remaining_tables' of size N, and the corresponding optimal access paths to
4082
    each table. The choice of a table order and an access path for each table
4083
    constitutes a query execution plan (QEP) that fully specifies how to
4084
    execute the query.
4085
4086
    The maximal size of the found plan is controlled by the parameter
4087
    'search_depth'. When search_depth == N, the resulting plan is complete and
4088
    can be used directly as a QEP. If search_depth < N, the found plan consists
4089
    of only some of the query tables. Such "partial" optimal plans are useful
4090
    only as input to query optimization procedures, and cannot be used directly
4091
    to execute a query.
4092
4093
    The algorithm begins with an empty partial plan stored in 'join->positions'
4094
    and a set of N tables - 'remaining_tables'. Each step of the algorithm
4095
    evaluates the cost of the partial plan extended by all access plans for
4096
    each of the relations in 'remaining_tables', expands the current partial
4097
    plan with the access plan that results in lowest cost of the expanded
4098
    partial plan, and removes the corresponding relation from
4099
    'remaining_tables'. The algorithm continues until it either constructs a
4100
    complete optimal plan, or constructs an optimal plartial plan with size =
4101
    search_depth.
4102
4103
    The final optimal plan is stored in 'join->best_positions'. The
4104
    corresponding cost of the optimal plan is in 'join->best_read'.
4105
4106
  @note
4107
    The procedure uses a recursive depth-first search where the depth of the
4108
    recursion (and thus the exhaustiveness of the search) is controlled by the
4109
    parameter 'search_depth'.
4110
4111
  @note
4112
    The pseudocode below describes the algorithm of
4113
    'best_extension_by_limited_search'. The worst-case complexity of this
4114
    algorithm is O(N*N^search_depth/search_depth). When serch_depth >= N, then
4115
    the complexity of greedy_search is O(N!).
4116
4117
    @code
4118
    procedure best_extension_by_limited_search(
4119
      pplan in,             // in, partial plan of tables-joined-so-far
4120
      pplan_cost,           // in, cost of pplan
4121
      remaining_tables,     // in, set of tables not referenced in pplan
4122
      best_plan_so_far,     // in/out, best plan found so far
4123
      best_plan_so_far_cost,// in/out, cost of best_plan_so_far
4124
      search_depth)         // in, maximum size of the plans being considered
4125
    {
4126
      for each table T from remaining_tables
4127
      {
4128
        // Calculate the cost of using table T as above
4129
        cost = complex-series-of-calculations;
4130
4131
        // Add the cost to the cost so far.
4132
        pplan_cost+= cost;
4133
4134
        if (pplan_cost >= best_plan_so_far_cost)
4135
          // pplan_cost already too great, stop search
4136
          continue;
4137
4138
        pplan= expand pplan by best_access_method;
4139
        remaining_tables= remaining_tables - table T;
4140
        if (remaining_tables is not an empty set
4141
            and
4142
            search_depth > 1)
4143
        {
4144
          best_extension_by_limited_search(pplan, pplan_cost,
4145
                                           remaining_tables,
4146
                                           best_plan_so_far,
4147
                                           best_plan_so_far_cost,
4148
                                           search_depth - 1);
4149
        }
4150
        else
4151
        {
4152
          best_plan_so_far_cost= pplan_cost;
4153
          best_plan_so_far= pplan;
4154
        }
4155
      }
4156
    }
4157
    @endcode
4158
4159
  @note
4160
    When 'best_extension_by_limited_search' is called for the first time,
4161
    'join->best_read' must be set to the largest possible value (e.g. DBL_MAX).
4162
    The actual implementation provides a way to optionally use pruning
4163
    heuristic (controlled by the parameter 'prune_level') to reduce the search
4164
    space by skipping some partial plans.
4165
4166
  @note
4167
    The parameter 'search_depth' provides control over the recursion
4168
    depth, and thus the size of the resulting optimal plan.
4169
4170
  @param join             pointer to the structure providing all context info
4171
                          for the query
4172
  @param remaining_tables set of tables not included into the partial plan yet
4173
  @param idx              length of the partial QEP in 'join->positions';
4174
                          since a depth-first search is used, also corresponds
4175
                          to the current depth of the search tree;
4176
                          also an index in the array 'join->best_ref';
4177
  @param record_count     estimate for the number of records returned by the
4178
                          best partial plan
4179
  @param read_time        the cost of the best partial plan
4180
  @param search_depth     maximum depth of the recursion and thus size of the
4181
                          found optimal plan
4182
                          (0 < search_depth <= join->tables+1).
4183
  @param prune_level      pruning heuristics that should be applied during
4184
                          optimization
4185
                          (values: 0 = EXHAUSTIVE, 1 = PRUNE_BY_TIME_OR_ROWS)
4186
4187
  @retval
4188
    false       ok
4189
  @retval
4190
    true        Fatal error
4191
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
4192
static bool best_extension_by_limited_search(Join *join,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4193
                                             table_map remaining_tables,
4194
                                             uint32_t idx,
4195
                                             double record_count,
4196
                                             double read_time,
4197
                                             uint32_t search_depth,
4198
                                             uint32_t prune_level)
4199
{
4200
  Session *session= join->session;
4201
  if (session->killed)  // Abort
4202
    return(true);
4203
4204
  /*
4205
     'join' is a partial plan with lower cost than the best plan so far,
4206
     so continue expanding it further with the tables in 'remaining_tables'.
4207
  */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4208
  JoinTable *s;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4209
  double best_record_count= DBL_MAX;
4210
  double best_read_time=    DBL_MAX;
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
4211
  optimizer::Position partial_pos;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4212
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4213
  for (JoinTable **pos= join->best_ref + idx ; (s= *pos) ; pos++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4214
  {
4215
    table_map real_table_bit= s->table->map;
4216
    if ((remaining_tables & real_table_bit) &&
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
4217
        ! (remaining_tables & s->dependent) &&
1637.5.9 by Prafulla Tekawade
Fix for Bug 592444
4218
        (! idx || ! check_interleaving_with_nj(s)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4219
    {
4220
      double current_record_count, current_read_time;
4221
4222
      /*
4223
        psergey-insideout-todo:
4224
          when best_access_path() detects it could do an InsideOut scan or
4225
          some other scan, have it return an insideout scan and a flag that
4226
          requests to "fork" this loop iteration. (Q: how does that behave
4227
          when the depth is insufficient??)
4228
      */
4229
      /* Find the best access method from 's' to the current partial plan */
4230
      best_access_path(join, s, session, remaining_tables, idx,
4231
                       record_count, read_time);
4232
      /* Compute the cost of extending the plan with 's' */
1108.6.6 by Padraig O'Sullivan
Adding accessors to the JOIN class for the positions member. The end goal is
4233
      partial_pos= join->getPosFromPartialPlan(idx);
1108.6.25 by Padraig O'Sullivan
Made the records_read member of the Position class private.
4234
      current_record_count= record_count * partial_pos.getFanout();
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
4235
      current_read_time=    read_time + partial_pos.getCost();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4236
4237
      /* Expand only partial plans with lower cost than the best QEP so far */
4238
      if ((current_read_time +
4239
           current_record_count / (double) TIME_FOR_COMPARE) >= join->best_read)
4240
      {
4241
        restore_prev_nj_state(s);
4242
        continue;
4243
      }
4244
4245
      /*
4246
        Prune some less promising partial plans. This heuristic may miss
4247
        the optimal QEPs, thus it results in a non-exhaustive search.
4248
      */
4249
      if (prune_level == 1)
4250
      {
4251
        if (best_record_count > current_record_count ||
4252
            best_read_time > current_read_time ||
4253
            (idx == join->const_tables && s->table == join->sort_by_table)) // 's' is the first table in the QEP
4254
        {
4255
          if (best_record_count >= current_record_count &&
4256
              best_read_time >= current_read_time &&
4257
              /* TODO: What is the reasoning behind this condition? */
1108.6.17 by Padraig O'Sullivan
Removed the 2.0 constant in the optimizer from the parts that I have
4258
              (! (s->key_dependent & remaining_tables) ||
4259
               partial_pos.isConstTable()))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4260
          {
4261
            best_record_count= current_record_count;
4262
            best_read_time=    current_read_time;
4263
          }
4264
        }
4265
        else
4266
        {
4267
          restore_prev_nj_state(s);
4268
          continue;
4269
        }
4270
      }
4271
4272
      if ( (search_depth > 1) && (remaining_tables & ~real_table_bit) )
4273
      { /* Recursively expand the current partial plan */
4274
        std::swap(join->best_ref[idx], *pos);
4275
        if (best_extension_by_limited_search(join,
4276
                                             remaining_tables & ~real_table_bit,
4277
                                             idx + 1,
4278
                                             current_record_count,
4279
                                             current_read_time,
4280
                                             search_depth - 1,
4281
                                             prune_level))
4282
          return(true);
4283
        std::swap(join->best_ref[idx], *pos);
4284
      }
4285
      else
4286
      { /*
4287
          'join' is either the best partial QEP with 'search_depth' relations,
4288
          or the best complete QEP so far, whichever is smaller.
4289
        */
1108.6.6 by Padraig O'Sullivan
Adding accessors to the JOIN class for the positions member. The end goal is
4290
        partial_pos= join->getPosFromPartialPlan(join->const_tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4291
        current_read_time+= current_record_count / (double) TIME_FOR_COMPARE;
4292
        if (join->sort_by_table &&
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
4293
            partial_pos.hasTableForSorting(join->sort_by_table))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4294
          /* We have to make a temp table */
4295
          current_read_time+= current_record_count;
4296
        if ((search_depth == 1) || (current_read_time < join->best_read))
4297
        {
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4298
          join->copyPartialPlanIntoOptimalPlan(idx + 1);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4299
          join->best_read= current_read_time - 0.001;
4300
        }
4301
      }
4302
      restore_prev_nj_state(s);
4303
    }
4304
  }
4305
  return(false);
4306
}
4307
4308
/**
4309
  Heuristic procedure to automatically guess a reasonable degree of
4310
  exhaustiveness for the greedy search procedure.
4311
4312
  The procedure estimates the optimization time and selects a search depth
4313
  big enough to result in a near-optimal QEP, that doesn't take too long to
4314
  find. If the number of tables in the query exceeds some constant, then
4315
  search_depth is set to this constant.
4316
4317
  @param join   pointer to the structure providing all context info for
4318
                the query
4319
4320
  @note
4321
    This is an extremely simplistic implementation that serves as a stub for a
4322
    more advanced analysis of the join. Ideally the search depth should be
4323
    determined by learning from previous query optimizations, because it will
4324
    depend on the CPU power (and other factors).
4325
4326
  @todo
4327
    this value should be determined dynamically, based on statistics:
4328
    uint32_t max_tables_for_exhaustive_opt= 7;
4329
4330
  @todo
4331
    this value could be determined by some mapping of the form:
4332
    depth : table_count -> [max_tables_for_exhaustive_opt..MAX_EXHAUSTIVE]
4333
4334
  @return
4335
    A positive integer that specifies the search depth (and thus the
4336
    exhaustiveness) of the depth-first search algorithm used by
4337
    'greedy_search'.
4338
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
4339
static uint32_t determine_search_depth(Join *join)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4340
{
4341
  uint32_t table_count=  join->tables - join->const_tables;
4342
  uint32_t search_depth;
4343
  /* TODO: this value should be determined dynamically, based on statistics: */
4344
  uint32_t max_tables_for_exhaustive_opt= 7;
4345
4346
  if (table_count <= max_tables_for_exhaustive_opt)
4347
    search_depth= table_count+1; // use exhaustive for small number of tables
4348
  else
4349
    /*
4350
      TODO: this value could be determined by some mapping of the form:
4351
      depth : table_count -> [max_tables_for_exhaustive_opt..MAX_EXHAUSTIVE]
4352
    */
4353
    search_depth= max_tables_for_exhaustive_opt; // use greedy search
4354
4355
  return search_depth;
4356
}
4357
1541.1.1 by Brian Aker
JOIN -> Join rename
4358
static bool make_simple_join(Join *join,Table *tmp_table)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4359
{
4360
  Table **tableptr;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4361
  JoinTable *join_tab;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4362
4363
  /*
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4364
    Reuse Table * and JoinTable if already allocated by a previous call
1541.1.1 by Brian Aker
JOIN -> Join rename
4365
    to this function through Join::exec (may happen for sub-queries).
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4366
  */
4367
  if (!join->table_reexec)
4368
  {
4369
    if (!(join->table_reexec= (Table**) join->session->alloc(sizeof(Table*))))
971.6.11 by Eric Day
Removed purecov messages.
4370
      return(true);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4371
    if (join->tmp_join)
4372
      join->tmp_join->table_reexec= join->table_reexec;
4373
  }
4374
  if (!join->join_tab_reexec)
4375
  {
4376
    if (!(join->join_tab_reexec=
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4377
          (JoinTable*) join->session->alloc(sizeof(JoinTable))))
971.6.11 by Eric Day
Removed purecov messages.
4378
      return(true);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4379
    if (join->tmp_join)
4380
      join->tmp_join->join_tab_reexec= join->join_tab_reexec;
4381
  }
4382
  tableptr= join->table_reexec;
4383
  join_tab= join->join_tab_reexec;
4384
4385
  join->join_tab=join_tab;
4386
  join->table=tableptr; tableptr[0]=tmp_table;
4387
  join->tables=1;
4388
  join->const_tables=0;
4389
  join->const_table_map=0;
4390
  join->tmp_table_param.field_count= join->tmp_table_param.sum_func_count=
4391
    join->tmp_table_param.func_count=0;
4392
  join->tmp_table_param.copy_field=join->tmp_table_param.copy_field_end=0;
4393
  join->first_record=join->sort_and_group=0;
4394
  join->send_records=(ha_rows) 0;
4395
  join->group=0;
4396
  join->row_limit=join->unit->select_limit_cnt;
4397
  join->do_send_rows = (join->row_limit) ? 1 : 0;
4398
4399
  join_tab->cache.buff=0;			/* No caching */
4400
  join_tab->table=tmp_table;
4401
  join_tab->select=0;
4402
  join_tab->select_cond=0;
4403
  join_tab->quick=0;
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
4404
  join_tab->type= AM_ALL;			/* Map through all records */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4405
  join_tab->keys.set();                     /* test everything in quick */
4406
  join_tab->info=0;
4407
  join_tab->on_expr_ref=0;
4408
  join_tab->last_inner= 0;
4409
  join_tab->first_unmatched= 0;
4410
  join_tab->ref.key = -1;
4411
  join_tab->not_used_in_distinct=0;
4412
  join_tab->read_first_record= join_init_read_record;
4413
  join_tab->join=join;
4414
  join_tab->ref.key_parts= 0;
1711.6.5 by Brian Aker
Updating so that structures have constructor (removed memset calls).
4415
  join_tab->read_record.init();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4416
  tmp_table->status=0;
4417
  tmp_table->null_row=0;
1711.6.5 by Brian Aker
Updating so that structures have constructor (removed memset calls).
4418
4419
  return false;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4420
}
4421
4422
/**
4423
  Fill in outer join related info for the execution plan structure.
4424
4425
    For each outer join operation left after simplification of the
4426
    original query the function set up the following pointers in the linear
4427
    structure join->join_tab representing the selected execution plan.
4428
    The first inner table t0 for the operation is set to refer to the last
4429
    inner table tk through the field t0->last_inner.
4430
    Any inner table ti for the operation are set to refer to the first
4431
    inner table ti->first_inner.
4432
    The first inner table t0 for the operation is set to refer to the
4433
    first inner table of the embedding outer join operation, if there is any,
4434
    through the field t0->first_upper.
4435
    The on expression for the outer join operation is attached to the
4436
    corresponding first inner table through the field t0->on_expr_ref.
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4437
    Here ti are structures of the JoinTable type.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4438
4439
  EXAMPLE. For the query:
4440
  @code
4441
        SELECT * FROM t1
4442
                      LEFT JOIN
4443
                      (t2, t3 LEFT JOIN t4 ON t3.a=t4.a)
4444
                      ON (t1.a=t2.a AND t1.b=t3.b)
4445
          WHERE t1.c > 5,
4446
  @endcode
4447
4448
    given the execution plan with the table order t1,t2,t3,t4
4449
    is selected, the following references will be set;
4450
    t4->last_inner=[t4], t4->first_inner=[t4], t4->first_upper=[t2]
4451
    t2->last_inner=[t4], t2->first_inner=t3->first_inner=[t2],
4452
    on expression (t1.a=t2.a AND t1.b=t3.b) will be attached to
4453
    *t2->on_expr_ref, while t3.a=t4.a will be attached to *t4->on_expr_ref.
4454
4455
  @param join   reference to the info fully describing the query
4456
4457
  @note
4458
    The function assumes that the simplification procedure has been
4459
    already applied to the join query (see simplify_joins).
4460
    This function can be called only after the execution plan
4461
    has been chosen.
4462
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
4463
static void make_outerjoin_info(Join *join)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4464
{
4465
  for (uint32_t i=join->const_tables ; i < join->tables ; i++)
4466
  {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4467
    JoinTable *tab=join->join_tab+i;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4468
    Table *table=tab->table;
4469
    TableList *tbl= table->pos_in_table_list;
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
4470
    TableList *embedding= tbl->getEmbedding();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4471
4472
    if (tbl->outer_join)
4473
    {
4474
      /*
4475
        Table tab is the only one inner table for outer join.
4476
        (Like table t4 for the table reference t3 LEFT JOIN t4 ON t3.a=t4.a
4477
        is in the query above.)
4478
      */
4479
      tab->last_inner= tab->first_inner= tab;
4480
      tab->on_expr_ref= &tbl->on_expr;
4481
      tab->cond_equal= tbl->cond_equal;
4482
      if (embedding)
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
4483
        tab->first_upper= embedding->getNestedJoin()->first_nested;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4484
    }
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
4485
    for ( ; embedding ; embedding= embedding->getEmbedding())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4486
    {
4487
      /* Ignore sj-nests: */
4488
      if (!embedding->on_expr)
4489
        continue;
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
4490
      nested_join_st *nested_join= embedding->getNestedJoin();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4491
      if (!nested_join->counter_)
4492
      {
4493
        /*
4494
          Table tab is the first inner table for nested_join.
4495
          Save reference to it in the nested join structure.
4496
        */
4497
        nested_join->first_nested= tab;
4498
        tab->on_expr_ref= &embedding->on_expr;
4499
        tab->cond_equal= tbl->cond_equal;
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
4500
        if (embedding->getEmbedding())
4501
          tab->first_upper= embedding->getEmbedding()->getNestedJoin()->first_nested;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4502
      }
4503
      if (!tab->first_inner)
4504
        tab->first_inner= nested_join->first_nested;
4505
      if (++nested_join->counter_ < nested_join->join_list.elements)
4506
        break;
4507
      /* Table tab is the last inner table for nested join. */
4508
      nested_join->first_nested->last_inner= tab;
4509
    }
4510
  }
4511
  return;
4512
}
4513
1541.1.1 by Brian Aker
JOIN -> Join rename
4514
static bool make_join_select(Join *join,
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
4515
                             optimizer::SqlSelect *select,
1237.9.2 by Padraig O'Sullivan
Moved opt_range.[cc,h] into the optimizer directory and namespace and renamed the files to
4516
                             COND *cond)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4517
{
4518
  Session *session= join->session;
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
4519
  optimizer::Position cur_pos;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4520
  if (select)
4521
  {
4522
    add_not_null_conds(join);
4523
    table_map used_tables;
4524
    if (cond)                /* Because of QUICK_GROUP_MIN_MAX_SELECT */
4525
    {                        /* there may be a select without a cond. */
4526
      if (join->tables > 1)
4527
        cond->update_used_tables();		// Tablenr may have changed
4528
      if (join->const_tables == join->tables &&
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4529
          session->lex->current_select->master_unit() ==
4530
          &session->lex->unit)		// not upper level SELECT
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4531
        join->const_table_map|=RAND_TABLE_BIT;
4532
      {						// Check const tables
4533
        COND *const_cond=
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4534
          make_cond_for_table(cond,
4535
              join->const_table_map,
4536
              (table_map) 0, 1);
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4537
        for (JoinTable *tab= join->join_tab+join->const_tables;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4538
            tab < join->join_tab+join->tables ; tab++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4539
        {
4540
          if (*tab->on_expr_ref)
4541
          {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4542
            JoinTable *cond_tab= tab->first_inner;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4543
            COND *tmp= make_cond_for_table(*tab->on_expr_ref,
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4544
                join->const_table_map,
4545
                (  table_map) 0, 0);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4546
            if (!tmp)
4547
              continue;
4548
            tmp= new Item_func_trig_cond(tmp, &cond_tab->not_null_compl);
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4549
            if (! tmp)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4550
              return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4551
            tmp->quick_fix_field();
4552
            cond_tab->select_cond= !cond_tab->select_cond ? tmp :
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4553
              new Item_cond_and(cond_tab->select_cond,
4554
                  tmp);
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4555
            if (! cond_tab->select_cond)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4556
              return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4557
            cond_tab->select_cond->quick_fix_field();
4558
          }
4559
        }
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4560
        if (const_cond && ! const_cond->val_int())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4561
        {
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4562
          return 1;	 // Impossible const condition
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4563
        }
4564
      }
4565
    }
4566
    used_tables=((select->const_tables=join->const_table_map) |
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4567
        OUTER_REF_TABLE_BIT | RAND_TABLE_BIT);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4568
    for (uint32_t i=join->const_tables ; i < join->tables ; i++)
4569
    {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4570
      JoinTable *tab=join->join_tab+i;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4571
      /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4572
         first_inner is the X in queries like:
4573
         SELECT * FROM t1 LEFT OUTER JOIN (t2 JOIN t3) ON X
4574
       */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4575
      JoinTable *first_inner_tab= tab->first_inner;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4576
      table_map current_map= tab->table->map;
4577
      bool use_quick_range=0;
4578
      COND *tmp;
4579
4580
      /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4581
         Following force including random expression in last table condition.
4582
         It solve problem with select like SELECT * FROM t1 WHERE rand() > 0.5
4583
       */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4584
      if (i == join->tables-1)
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4585
        current_map|= OUTER_REF_TABLE_BIT | RAND_TABLE_BIT;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4586
      used_tables|=current_map;
4587
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
4588
      if (tab->type == AM_REF && tab->quick &&
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4589
          (uint32_t) tab->ref.key == tab->quick->index &&
4590
          tab->ref.key_length < tab->quick->max_used_key_length)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4591
      {
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4592
        /* Range uses longer key;  Use this instead of ref on key */
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
4593
        tab->type= AM_ALL;
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4594
        use_quick_range= 1;
4595
        tab->use_quick= 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4596
        tab->ref.key= -1;
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4597
        tab->ref.key_parts= 0;		// Don't use ref key.
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4598
        cur_pos= join->getPosFromOptimalPlan(i);
1108.6.25 by Padraig O'Sullivan
Made the records_read member of the Position class private.
4599
        cur_pos.setFanout(rows2double(tab->quick->records));
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4600
        /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4601
           We will use join cache here : prevent sorting of the first
4602
           table only and sort at the end.
4603
         */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4604
        if (i != join->const_tables && join->tables > join->const_tables + 1)
4605
          join->full_join= 1;
4606
      }
4607
4608
      tmp= NULL;
4609
      if (cond)
4610
        tmp= make_cond_for_table(cond,used_tables,current_map, 0);
4611
      if (cond && !tmp && tab->quick)
4612
      {						// Outer join
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
4613
        if (tab->type != AM_ALL)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4614
        {
4615
          /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4616
             Don't use the quick method
4617
             We come here in the case where we have 'key=constant' and
4618
             the test is removed by make_cond_for_table()
4619
           */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4620
          delete tab->quick;
4621
          tab->quick= 0;
4622
        }
4623
        else
4624
        {
4625
          /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4626
             Hack to handle the case where we only refer to a table
4627
             in the ON part of an OUTER JOIN. In this case we want the code
4628
             below to check if we should use 'quick' instead.
4629
           */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4630
          tmp= new Item_int((int64_t) 1,1);	// Always true
4631
        }
4632
4633
      }
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
4634
      if (tmp || !cond || tab->type == AM_REF || tab->type == AM_REF_OR_NULL ||
4635
          tab->type == AM_EQ_REF)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4636
      {
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
4637
        optimizer::SqlSelect *sel= tab->select= ((optimizer::SqlSelect*)
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4638
            session->memdup((unsigned char*) select,
4639
              sizeof(*select)));
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4640
        if (! sel)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4641
          return 1;			// End of memory
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4642
        /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4643
           If tab is an inner table of an outer join operation,
4644
           add a match guard to the pushed down predicate.
4645
           The guard will turn the predicate on only after
4646
           the first match for outer tables is encountered.
4647
         */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4648
        if (cond && tmp)
4649
        {
4650
          /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4651
             Because of QUICK_GROUP_MIN_MAX_SELECT there may be a select without
4652
             a cond, so neutralize the hack above.
4653
           */
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4654
          if (! (tmp= add_found_match_trig_cond(first_inner_tab, tmp, 0)))
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4655
            return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4656
          tab->select_cond=sel->cond=tmp;
4657
        }
4658
        else
4659
          tab->select_cond= sel->cond= NULL;
4660
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4661
        sel->head=tab->table;
4662
        if (tab->quick)
4663
        {
4664
          /* Use quick key read if it's a constant and it's not used
4665
             with key reading */
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
4666
          if (tab->needed_reg.none() && tab->type != AM_EQ_REF
4667
              && (tab->type != AM_REF || (uint32_t) tab->ref.key == tab->quick->index))
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4668
          {
4669
            sel->quick=tab->quick;		// Use value from get_quick_...
4670
            sel->quick_keys.reset();
4671
            sel->needed_reg.reset();
4672
          }
4673
          else
4674
          {
4675
            delete tab->quick;
4676
          }
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4677
          tab->quick= 0;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4678
        }
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4679
        uint32_t ref_key= static_cast<uint32_t>(sel->head->reginfo.join_tab->ref.key + 1);
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4680
        if (i == join->const_tables && ref_key)
4681
        {
4682
          if (tab->const_keys.any() &&
4683
              tab->table->reginfo.impossible_range)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4684
            return 1;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4685
        }
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
4686
        else if (tab->type == AM_ALL && ! use_quick_range)
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4687
        {
4688
          if (tab->const_keys.any() &&
4689
              tab->table->reginfo.impossible_range)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4690
            return 1;				// Impossible range
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4691
          /*
4692
             We plan to scan all rows.
4693
             Check again if we should use an index.
4694
             We could have used an column from a previous table in
4695
             the index if we are using limit and this is the first table
4696
           */
4697
4698
          cur_pos= join->getPosFromOptimalPlan(i);
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4699
          if ((cond && (! ((tab->keys & tab->const_keys) == tab->keys) && i > 0)) ||
4700
              (! tab->const_keys.none() && (i == join->const_tables) &&
1108.6.25 by Padraig O'Sullivan
Made the records_read member of the Position class private.
4701
              (join->unit->select_limit_cnt < cur_pos.getFanout()) && ((join->select_options & OPTION_FOUND_ROWS) == false)))
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4702
          {
4703
            /* Join with outer join condition */
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4704
            COND *orig_cond= sel->cond;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4705
            sel->cond= and_conds(sel->cond, *tab->on_expr_ref);
4706
4707
            /*
4708
               We can't call sel->cond->fix_fields,
4709
               as it will break tab->on_expr if it's AND condition
4710
               (fix_fields currently removes extra AND/OR levels).
4711
               Yet attributes of the just built condition are not needed.
4712
               Thus we call sel->cond->quick_fix_field for safety.
4713
             */
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4714
            if (sel->cond && ! sel->cond->fixed)
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4715
              sel->cond->quick_fix_field();
4716
4717
            if (sel->test_quick_select(session, tab->keys,
4718
                  used_tables & ~ current_map,
4719
                  (join->select_options &
4720
                   OPTION_FOUND_ROWS ?
4721
                   HA_POS_ERROR :
4722
                   join->unit->select_limit_cnt), 0,
4723
                  false) < 0)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4724
            {
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4725
              /*
4726
                 Before reporting "Impossible WHERE" for the whole query
4727
                 we have to check isn't it only "impossible ON" instead
4728
               */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4729
              sel->cond=orig_cond;
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4730
              if (! *tab->on_expr_ref ||
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4731
                  sel->test_quick_select(session, tab->keys,
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4732
                    used_tables & ~ current_map,
4733
                    (join->select_options &
4734
                     OPTION_FOUND_ROWS ?
4735
                     HA_POS_ERROR :
4736
                     join->unit->select_limit_cnt),0,
4737
                    false) < 0)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4738
                return 1;			// Impossible WHERE
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4739
            }
4740
            else
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4741
              sel->cond=orig_cond;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4742
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4743
            /* Fix for EXPLAIN */
4744
            if (sel->quick)
4745
            {
4746
              cur_pos= join->getPosFromOptimalPlan(i);
1108.6.25 by Padraig O'Sullivan
Made the records_read member of the Position class private.
4747
              cur_pos.setFanout(static_cast<double>(sel->quick->records));
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4748
            }
4749
          }
4750
          else
4751
          {
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4752
            sel->needed_reg= tab->needed_reg;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4753
            sel->quick_keys.reset();
4754
          }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4755
          if (!((tab->checked_keys & sel->quick_keys) == sel->quick_keys) ||
4756
              !((tab->checked_keys & sel->needed_reg) == sel->needed_reg))
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4757
          {
4758
            tab->keys= sel->quick_keys;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4759
            tab->keys|= sel->needed_reg;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4760
            tab->use_quick= (!sel->needed_reg.none() &&
4761
                (select->quick_keys.none() ||
4762
                 (select->quick &&
4763
                  (select->quick->records >= 100L)))) ?
4764
              2 : 1;
4765
            sel->read_tables= used_tables & ~current_map;
4766
          }
4767
          if (i != join->const_tables && tab->use_quick != 2)
4768
          {					/* Read with cache */
4769
            if (cond &&
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4770
                (tmp=make_cond_for_table(cond,
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4771
                                         join->const_table_map |
4772
                                         current_map,
4773
                                         current_map, 0)))
4774
            {
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
4775
              tab->cache.select= (optimizer::SqlSelect*)
4776
                session->memdup((unsigned char*) sel, sizeof(optimizer::SqlSelect));
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
4777
              tab->cache.select->cond= tmp;
4778
              tab->cache.select->read_tables= join->const_table_map;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4779
            }
4780
          }
4781
        }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4782
      }
4783
4784
      /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4785
         Push down conditions from all on expressions.
4786
         Each of these conditions are guarded by a variable
4787
         that turns if off just before null complemented row for
4788
         outer joins is formed. Thus, the condition from an
4789
         'on expression' are guaranteed not to be checked for
4790
         the null complemented row.
4791
       */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4792
4793
      /* First push down constant conditions from on expressions */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4794
      for (JoinTable *join_tab= join->join_tab+join->const_tables;
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4795
          join_tab < join->join_tab+join->tables ; join_tab++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4796
      {
4797
        if (*join_tab->on_expr_ref)
4798
        {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4799
          JoinTable *cond_tab= join_tab->first_inner;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4800
          tmp= make_cond_for_table(*join_tab->on_expr_ref,
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4801
              join->const_table_map,
4802
              (table_map) 0, 0);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4803
          if (!tmp)
4804
            continue;
4805
          tmp= new Item_func_trig_cond(tmp, &cond_tab->not_null_compl);
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4806
          if (! tmp)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4807
            return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4808
          tmp->quick_fix_field();
4809
          cond_tab->select_cond= !cond_tab->select_cond ? tmp :
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4810
            new Item_cond_and(cond_tab->select_cond,tmp);
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4811
          if (! cond_tab->select_cond)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4812
            return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4813
          cond_tab->select_cond->quick_fix_field();
4814
        }
4815
      }
4816
4817
      /* Push down non-constant conditions from on expressions */
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4818
      JoinTable *last_tab= tab;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4819
      while (first_inner_tab && first_inner_tab->last_inner == last_tab)
4820
      {
4821
        /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4822
           Table tab is the last inner table of an outer join.
4823
           An on expression is always attached to it.
4824
         */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4825
        COND *on_expr= *first_inner_tab->on_expr_ref;
4826
4827
        table_map used_tables2= (join->const_table_map |
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4828
            OUTER_REF_TABLE_BIT | RAND_TABLE_BIT);
4829
        for (tab= join->join_tab+join->const_tables; tab <= last_tab ; tab++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4830
        {
4831
          current_map= tab->table->map;
4832
          used_tables2|= current_map;
4833
          COND *tmp_cond= make_cond_for_table(on_expr, used_tables2,
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4834
              current_map, 0);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4835
          if (tmp_cond)
4836
          {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4837
            JoinTable *cond_tab= tab < first_inner_tab ? first_inner_tab : tab;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4838
            /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4839
               First add the guards for match variables of
4840
               all embedding outer join operations.
4841
             */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4842
            if (!(tmp_cond= add_found_match_trig_cond(cond_tab->first_inner,
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4843
                                                      tmp_cond,
4844
                                                      first_inner_tab)))
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4845
              return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4846
            /*
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4847
               Now add the guard turning the predicate off for
4848
               the null complemented row.
4849
             */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4850
            tmp_cond= new Item_func_trig_cond(tmp_cond,
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4851
                &first_inner_tab->
4852
                not_null_compl);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4853
            if (tmp_cond)
4854
              tmp_cond->quick_fix_field();
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4855
            /* Add the predicate to other pushed down predicates */
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4856
            cond_tab->select_cond= !cond_tab->select_cond ? tmp_cond :
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
4857
              new Item_cond_and(cond_tab->select_cond,
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
4858
                                tmp_cond);
4859
            if (! cond_tab->select_cond)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
4860
              return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4861
            cond_tab->select_cond->quick_fix_field();
4862
          }
4863
        }
4864
        first_inner_tab= first_inner_tab->first_upper;
4865
      }
4866
    }
4867
  }
4868
  return(0);
4869
}
4870
4871
/*
4872
  Plan refinement stage: do various set ups for the executioner
4873
4874
  SYNOPSIS
4875
    make_join_readinfo()
4876
      join           Join being processed
4877
      options        Join's options (checking for SELECT_DESCRIBE,
4878
                     SELECT_NO_JOIN_CACHE)
4879
      no_jbuf_after  Don't use join buffering after table with this number.
4880
4881
  DESCRIPTION
4882
    Plan refinement stage: do various set ups for the executioner
4883
      - set up use of join buffering
4884
      - push index conditions
4885
      - increment counters
4886
      - etc
4887
4888
  RETURN
4889
    false - OK
4890
    true  - Out of memory
4891
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
4892
static bool make_join_readinfo(Join *join)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4893
{
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4894
  bool sorted= true;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4895
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4896
  for (uint32_t i= join->const_tables ; i < join->tables ; i++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4897
  {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4898
    JoinTable *tab=join->join_tab+i;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4899
    Table *table=tab->table;
4900
    tab->read_record.table= table;
1208.3.2 by brian
Update for Cursor renaming.
4901
    tab->read_record.cursor= table->cursor;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4902
    tab->next_select=sub_select;		/* normal select */
4903
    /*
4904
      TODO: don't always instruct first table's ref/range access method to
4905
      produce sorted output.
4906
    */
4907
    tab->sorted= sorted;
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4908
    sorted= false; // only first must be sorted
4909
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4910
    if (tab->insideout_match_tab)
4911
    {
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4912
      if (! (tab->insideout_buf= (unsigned char*) join->session->alloc(tab->table->key_info
4913
                                                                       [tab->index].
4914
                                                                       key_length)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4915
        return true;
4916
    }
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4917
4918
    optimizer::AccessMethodFactory &factory= optimizer::AccessMethodFactory::singleton();
1475.1.4 by Padraig O'Sullivan
Used shared_ptr for the pointer returned from the factory method since we can use boost now...yay
4919
    boost::shared_ptr<optimizer::AccessMethod> access_method(factory.createAccessMethod(tab->type));
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4920
4921
    if (! access_method)
4922
    {
4923
      /**
4924
       * @todo
4925
       * Is abort() the correct thing to call here? I call this here because it was what was called in
4926
       * the default case for the switch statement that used to be here.
4927
       */
971.6.11 by Eric Day
Removed purecov messages.
4928
      abort();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4929
    }
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4930
4931
    access_method->getStats(table, tab);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4932
  }
1475.1.3 by Padraig O'Sullivan
Integrated the AccessMethodFactory class into the code base. We have now abstracted out the concept of an access method.
4933
4934
  join->join_tab[join->tables-1].next_select= NULL; /* Set by do_select */
4935
4936
  return false;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4937
}
4938
4939
/** Update the dependency map for the tables. */
1541.1.1 by Brian Aker
JOIN -> Join rename
4940
static void update_depend_map(Join *join)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4941
{
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4942
  JoinTable *join_tab=join->join_tab, *end=join_tab+join->tables;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4943
4944
  for (; join_tab != end ; join_tab++)
4945
  {
1089.1.14 by Brian Aker
Fix TABLE_REF structure
4946
    table_reference_st *ref= &join_tab->ref;
4947
    table_map depend_map= 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4948
    Item **item=ref->items;
4949
    uint32_t i;
4950
    for (i=0 ; i < ref->key_parts ; i++,item++)
4951
      depend_map|=(*item)->used_tables();
4952
    ref->depend_map=depend_map & ~OUTER_REF_TABLE_BIT;
4953
    depend_map&= ~OUTER_REF_TABLE_BIT;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4954
    for (JoinTable **tab=join->map2table; depend_map; tab++,depend_map>>=1 )
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4955
    {
4956
      if (depend_map & 1)
4957
        ref->depend_map|=(*tab)->ref.depend_map;
4958
    }
4959
  }
4960
}
4961
4962
/** Update the dependency map for the sort order. */
1541.1.1 by Brian Aker
JOIN -> Join rename
4963
static void update_depend_map(Join *join, order_st *order)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4964
{
4965
  for (; order ; order=order->next)
4966
  {
4967
    table_map depend_map;
4968
    order->item[0]->update_used_tables();
4969
    order->depend_map=depend_map=order->item[0]->used_tables();
4970
    // Not item_sum(), RAND() and no reference to table outside of sub select
4971
    if (!(order->depend_map & (OUTER_REF_TABLE_BIT | RAND_TABLE_BIT))
4972
        && !order->item[0]->with_sum_func)
4973
    {
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
4974
      for (JoinTable **tab=join->map2table; depend_map; tab++, depend_map>>=1)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
4975
      {
4976
        if (depend_map & 1)
4977
          order->depend_map|=(*tab)->ref.depend_map;
4978
      }
4979
    }
4980
  }
4981
}
4982
4983
/**
4984
  Remove all constants and check if order_st only contains simple
4985
  expressions.
4986
4987
  simple_order is set to 1 if sort_order only uses fields from head table
4988
  and the head table is not a LEFT JOIN table.
4989
4990
  @param join			Join handler
4991
  @param first_order		List of SORT or GROUP order
4992
  @param cond			WHERE statement
4993
  @param change_list		Set to 1 if we should remove things from list.
4994
                               If this is not set, then only simple_order is
4995
                               calculated.
4996
  @param simple_order		Set to 1 if we are only using simple expressions
4997
4998
  @return
4999
    Returns new sort order
5000
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
5001
static order_st *remove_constants(Join *join,order_st *first_order, COND *cond, bool change_list, bool *simple_order)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5002
{
5003
  if (join->tables == join->const_tables)
5004
    return change_list ? 0 : first_order;		// No need to sort
5005
5006
  order_st *order,**prev_ptr;
5007
  table_map first_table= join->join_tab[join->const_tables].table->map;
5008
  table_map not_const_tables= ~join->const_table_map;
5009
  table_map ref;
5010
5011
  prev_ptr= &first_order;
5012
  *simple_order= *join->join_tab[join->const_tables].on_expr_ref ? 0 : 1;
5013
5014
  /* NOTE: A variable of not_const_tables ^ first_table; breaks gcc 2.7 */
5015
5016
  update_depend_map(join, first_order);
5017
  for (order=first_order; order ; order=order->next)
5018
  {
5019
    table_map order_tables=order->item[0]->used_tables();
5020
    if (order->item[0]->with_sum_func)
5021
      *simple_order=0;				// Must do a temp table to sort
5022
    else if (!(order_tables & not_const_tables))
5023
    {
5024
      if (order->item[0]->with_subselect)
5025
        order->item[0]->val_str(&order->item[0]->str_value);
5026
      continue;					// skip const item
5027
    }
5028
    else
5029
    {
5030
      if (order_tables & (RAND_TABLE_BIT | OUTER_REF_TABLE_BIT))
5031
        *simple_order=0;
5032
      else
5033
      {
5034
        Item *comp_item=0;
5035
        if (cond && const_expression_in_where(cond,order->item[0], &comp_item))
5036
        {
5037
          continue;
5038
        }
5039
        if ((ref=order_tables & (not_const_tables ^ first_table)))
5040
        {
5041
          if (!(order_tables & first_table) &&
5042
                    only_eq_ref_tables(join,first_order, ref))
5043
          {
5044
            continue;
5045
          }
5046
          *simple_order=0;			// Must do a temp table to sort
5047
        }
5048
      }
5049
    }
5050
    if (change_list)
5051
      *prev_ptr= order;				// use this entry
5052
    prev_ptr= &order->next;
5053
  }
5054
  if (change_list)
5055
    *prev_ptr=0;
5056
  if (prev_ptr == &first_order)			// Nothing to sort/group
5057
    *simple_order=1;
5058
  return(first_order);
5059
}
5060
1541.1.1 by Brian Aker
JOIN -> Join rename
5061
static int return_zero_rows(Join *join,
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5062
                            select_result *result,
5063
                            TableList *tables,
5064
		                        List<Item> &fields,
5065
                            bool send_row,
5066
                            uint64_t select_options,
5067
                            const char *info,
5068
                            Item *having)
5069
{
5070
  if (select_options & SELECT_DESCRIBE)
5071
  {
1240.7.1 by Padraig O'Sullivan
Created an ExplainPlan class in the optimizer namespace. All printing of an explain in drizzle goes
5072
    optimizer::ExplainPlan planner(join,
5073
                                   false,
5074
                                   false,
5075
                                   false,
5076
                                   info);
5077
    planner.printPlan();
5078
    return 0;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5079
  }
5080
5081
  join->join_free();
5082
5083
  if (send_row)
5084
  {
5085
    for (TableList *table= tables; table; table= table->next_leaf)
5086
      table->table->mark_as_null_row();		// All fields are NULL
5087
    if (having && having->val_int() == 0)
5088
      send_row=0;
5089
  }
971.3.70 by Eric Day
Fixed style issues found by Jay.
5090
  if (! (result->send_fields(fields)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5091
  {
5092
    if (send_row)
5093
    {
5094
      List_iterator_fast<Item> it(fields);
5095
      Item *item;
5096
      while ((item= it++))
5097
        item->no_rows_in_result();
5098
      result->send_data(fields);
5099
    }
5100
    result->send_eof();				// Should be safe
5101
  }
5102
  /* Update results for FOUND_ROWS */
5103
  join->session->limit_found_rows= join->session->examined_row_count= 0;
5104
  return(0);
5105
}
5106
5107
/**
5108
  Simplify joins replacing outer joins by inner joins whenever it's
5109
  possible.
5110
5111
    The function, during a retrieval of join_list,  eliminates those
5112
    outer joins that can be converted into inner join, possibly nested.
5113
    It also moves the on expressions for the converted outer joins
5114
    and from inner joins to conds.
5115
    The function also calculates some attributes for nested joins:
5116
    - used_tables
5117
    - not_null_tables
5118
    - dep_tables.
5119
    - on_expr_dep_tables
5120
    The first two attributes are used to test whether an outer join can
5121
    be substituted for an inner join. The third attribute represents the
5122
    relation 'to be dependent on' for tables. If table t2 is dependent
5123
    on table t1, then in any evaluated execution plan table access to
5124
    table t2 must precede access to table t2. This relation is used also
5125
    to check whether the query contains  invalid cross-references.
5126
    The forth attribute is an auxiliary one and is used to calculate
5127
    dep_tables.
5128
    As the attribute dep_tables qualifies possibles orders of tables in the
5129
    execution plan, the dependencies required by the straight join
5130
    modifiers are reflected in this attribute as well.
5131
    The function also removes all braces that can be removed from the join
5132
    expression without changing its meaning.
5133
5134
  @note
5135
    An outer join can be replaced by an inner join if the where condition
5136
    or the on expression for an embedding nested join contains a conjunctive
5137
    predicate rejecting null values for some attribute of the inner tables.
5138
5139
    E.g. in the query:
5140
    @code
5141
      SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t1.a WHERE t2.b < 5
5142
    @endcode
5143
    the predicate t2.b < 5 rejects nulls.
5144
    The query is converted first to:
5145
    @code
5146
      SELECT * FROM t1 INNER JOIN t2 ON t2.a=t1.a WHERE t2.b < 5
5147
    @endcode
5148
    then to the equivalent form:
5149
    @code
5150
      SELECT * FROM t1, t2 ON t2.a=t1.a WHERE t2.b < 5 AND t2.a=t1.a
5151
    @endcode
5152
5153
5154
    Similarly the following query:
5155
    @code
5156
      SELECT * from t1 LEFT JOIN (t2, t3) ON t2.a=t1.a t3.b=t1.b
5157
        WHERE t2.c < 5
5158
    @endcode
5159
    is converted to:
5160
    @code
5161
      SELECT * FROM t1, (t2, t3) WHERE t2.c < 5 AND t2.a=t1.a t3.b=t1.b
5162
5163
    @endcode
5164
5165
    One conversion might trigger another:
5166
    @code
5167
      SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t1.a
5168
                       LEFT JOIN t3 ON t3.b=t2.b
5169
        WHERE t3 IS NOT NULL =>
5170
      SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t1.a, t3
5171
        WHERE t3 IS NOT NULL AND t3.b=t2.b =>
5172
      SELECT * FROM t1, t2, t3
5173
        WHERE t3 IS NOT NULL AND t3.b=t2.b AND t2.a=t1.a
5174
  @endcode
5175
5176
    The function removes all unnecessary braces from the expression
5177
    produced by the conversions.
5178
    E.g.
5179
    @code
5180
      SELECT * FROM t1, (t2, t3) WHERE t2.c < 5 AND t2.a=t1.a AND t3.b=t1.b
5181
    @endcode
5182
    finally is converted to:
5183
    @code
5184
      SELECT * FROM t1, t2, t3 WHERE t2.c < 5 AND t2.a=t1.a AND t3.b=t1.b
5185
5186
    @endcode
5187
5188
5189
    It also will remove braces from the following queries:
5190
    @code
5191
      SELECT * from (t1 LEFT JOIN t2 ON t2.a=t1.a) LEFT JOIN t3 ON t3.b=t2.b
5192
      SELECT * from (t1, (t2,t3)) WHERE t1.a=t2.a AND t2.b=t3.b.
5193
    @endcode
5194
5195
    The benefit of this simplification procedure is that it might return
5196
    a query for which the optimizer can evaluate execution plan with more
5197
    join orders. With a left join operation the optimizer does not
5198
    consider any plan where one of the inner tables is before some of outer
5199
    tables.
5200
5201
  IMPLEMENTATION
5202
    The function is implemented by a recursive procedure.  On the recursive
5203
    ascent all attributes are calculated, all outer joins that can be
5204
    converted are replaced and then all unnecessary braces are removed.
5205
    As join list contains join tables in the reverse order sequential
5206
    elimination of outer joins does not require extra recursive calls.
5207
5208
  SEMI-JOIN NOTES
5209
    Remove all semi-joins that have are within another semi-join (i.e. have
5210
    an "ancestor" semi-join nest)
5211
5212
  EXAMPLES
5213
    Here is an example of a join query with invalid cross references:
5214
    @code
5215
      SELECT * FROM t1 LEFT JOIN t2 ON t2.a=t3.a LEFT JOIN t3 ON t3.b=t1.b
5216
    @endcode
5217
5218
  @param join        reference to the query info
5219
  @param join_list   list representation of the join to be converted
5220
  @param conds       conditions to add on expressions for converted joins
5221
  @param top         true <=> conds is the where condition
5222
5223
  @return
5224
    - The new condition, if success
5225
    - 0, otherwise
5226
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
5227
static COND *simplify_joins(Join *join, List<TableList> *join_list, COND *conds, bool top)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5228
{
5229
  TableList *table;
5230
  nested_join_st *nested_join;
5231
  TableList *prev_table= 0;
5232
  List_iterator<TableList> li(*join_list);
5233
5234
  /*
5235
    Try to simplify join operations from join_list.
5236
    The most outer join operation is checked for conversion first.
5237
  */
5238
  while ((table= li++))
5239
  {
5240
    table_map used_tables;
5241
    table_map not_null_tables= (table_map) 0;
5242
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5243
    if ((nested_join= table->getNestedJoin()))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5244
    {
5245
      /*
5246
         If the element of join_list is a nested join apply
5247
         the procedure to its nested join list first.
5248
      */
5249
      if (table->on_expr)
5250
      {
5251
        Item *expr= table->on_expr;
5252
        /*
5253
           If an on expression E is attached to the table,
5254
           check all null rejected predicates in this expression.
5255
           If such a predicate over an attribute belonging to
5256
           an inner table of an embedded outer join is found,
5257
           the outer join is converted to an inner join and
5258
           the corresponding on expression is added to E.
5259
	      */
1100.2.3 by Brian Aker
Remove final bits on SJ
5260
        expr= simplify_joins(join, &nested_join->join_list, expr, false);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5261
5262
        if (!table->prep_on_expr || expr != table->on_expr)
5263
        {
5264
          assert(expr);
5265
5266
          table->on_expr= expr;
5267
          table->prep_on_expr= expr->copy_andor_structure(join->session);
5268
        }
5269
      }
5270
      nested_join->used_tables= (table_map) 0;
5271
      nested_join->not_null_tables=(table_map) 0;
1100.2.3 by Brian Aker
Remove final bits on SJ
5272
      conds= simplify_joins(join, &nested_join->join_list, conds, top);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5273
      used_tables= nested_join->used_tables;
5274
      not_null_tables= nested_join->not_null_tables;
5275
    }
5276
    else
5277
    {
5278
      if (!table->prep_on_expr)
5279
        table->prep_on_expr= table->on_expr;
5280
      used_tables= table->table->map;
5281
      if (conds)
5282
        not_null_tables= conds->not_null_tables();
5283
    }
5284
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5285
    if (table->getEmbedding())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5286
    {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5287
      table->getEmbedding()->getNestedJoin()->used_tables|= used_tables;
5288
      table->getEmbedding()->getNestedJoin()->not_null_tables|= not_null_tables;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5289
    }
5290
5291
    if (!table->outer_join || (used_tables & not_null_tables))
5292
    {
5293
      /*
5294
        For some of the inner tables there are conjunctive predicates
5295
        that reject nulls => the outer join can be replaced by an inner join.
5296
      */
5297
      table->outer_join= 0;
5298
      if (table->on_expr)
5299
      {
5300
        /* Add ON expression to the WHERE or upper-level ON condition. */
5301
        if (conds)
5302
        {
5303
          conds= and_conds(conds, table->on_expr);
5304
          conds->top_level_item();
5305
          /* conds is always a new item as both cond and on_expr existed */
5306
          assert(!conds->fixed);
5307
          conds->fix_fields(join->session, &conds);
5308
        }
5309
        else
5310
          conds= table->on_expr;
5311
        table->prep_on_expr= table->on_expr= 0;
5312
      }
5313
    }
5314
5315
    if (!top)
5316
      continue;
5317
5318
    /*
5319
      Only inner tables of non-convertible outer joins
5320
      remain with on_expr.
5321
    */
5322
    if (table->on_expr)
5323
    {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5324
      table->setDepTables(table->getDepTables() | table->on_expr->used_tables());
5325
      if (table->getEmbedding())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5326
      {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5327
        table->setDepTables(table->getDepTables() & ~table->getEmbedding()->getNestedJoin()->used_tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5328
        /*
5329
           Embedding table depends on tables used
5330
           in embedded on expressions.
5331
        */
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5332
        table->getEmbedding()->setOnExprDepTables(table->getEmbedding()->getOnExprDepTables() & table->on_expr->used_tables());
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5333
      }
5334
      else
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5335
        table->setDepTables(table->getDepTables() & ~table->table->map);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5336
    }
5337
5338
    if (prev_table)
5339
    {
1685.7.3 by Prafulla Tekawade
Fix for Bug 585644,585628
5340
      //If this is straight join, set prev table to be dependent on all tables
5341
      //from this nested join, so that correct join order is selected.
1685.7.4 by Prafulla Tekawade
Adding previously (accidentally) deleted code to the condition
5342
      if ((test(join->select_options & SELECT_STRAIGHT_JOIN)) ||
5343
          prev_table->straight)
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5344
        prev_table->setDepTables(prev_table->getDepTables() | used_tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5345
      if (prev_table->on_expr)
5346
      {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5347
        prev_table->setDepTables(prev_table->getDepTables() | table->getOnExprDepTables());
5348
        table_map prev_used_tables= prev_table->getNestedJoin() ?
5349
	                            prev_table->getNestedJoin()->used_tables :
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5350
	                            prev_table->table->map;
5351
        /*
5352
          If on expression contains only references to inner tables
5353
          we still make the inner tables dependent on the outer tables.
5354
          It would be enough to set dependency only on one outer table
5355
          for them. Yet this is really a rare case.
5356
	      */
5357
        if (!(prev_table->on_expr->used_tables() & ~prev_used_tables))
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5358
          prev_table->setDepTables(prev_table->getDepTables() | used_tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5359
      }
5360
    }
5361
    prev_table= table;
5362
  }
5363
5364
  /*
5365
    Flatten nested joins that can be flattened.
5366
    no ON expression and not a semi-join => can be flattened.
5367
  */
5368
  li.rewind();
5369
  while ((table= li++))
5370
  {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5371
    nested_join= table->getNestedJoin();
1100.2.3 by Brian Aker
Remove final bits on SJ
5372
    if (nested_join && !table->on_expr)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5373
    {
5374
      TableList *tbl;
5375
      List_iterator<TableList> it(nested_join->join_list);
5376
      while ((tbl= it++))
5377
      {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5378
        tbl->setEmbedding(table->getEmbedding());
1637.2.6 by Vijay Samuel
Merge encapsulate TableList-1.
5379
        tbl->setJoinList(table->getJoinList());
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5380
      }
5381
      li.replace(nested_join->join_list);
5382
    }
5383
  }
5384
  return(conds);
5385
}
5386
1541.1.1 by Brian Aker
JOIN -> Join rename
5387
static int remove_duplicates(Join *join, Table *entry,List<Item> &fields, Item *having)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5388
{
5389
  int error;
5390
  uint32_t reclength,offset;
5391
  uint32_t field_count;
5392
  Session *session= join->session;
5393
5394
  entry->reginfo.lock_type=TL_WRITE;
5395
5396
  /* Calculate how many saved fields there is in list */
5397
  field_count=0;
5398
  List_iterator<Item> it(fields);
5399
  Item *item;
5400
  while ((item=it++))
5401
  {
5402
    if (item->get_tmp_table_field() && ! item->const_item())
5403
      field_count++;
5404
  }
5405
5406
  if (!field_count && !(join->select_options & OPTION_FOUND_ROWS) && !having)
5407
  {                    // only const items with no OPTION_FOUND_ROWS
5408
    join->unit->select_limit_cnt= 1;		// Only send first row
5409
    return(0);
5410
  }
1578.2.16 by Brian Aker
Merge in change to getTable() to private the field objects.
5411
  Field **first_field=entry->getFields() + entry->getShare()->sizeFields() - field_count;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5412
  offset= (field_count ?
1672.3.6 by Brian Aker
First pass in encapsulating row
5413
           entry->getField(entry->getShare()->sizeFields() - field_count)->offset(entry->getInsertRecord()) : 0);
1578.2.8 by Brian Aker
Encapsulate record length.
5414
  reclength= entry->getShare()->getRecordLength() - offset;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5415
1109.1.4 by Brian Aker
More Table refactor
5416
  entry->free_io_cache();				// Safety
1208.3.2 by brian
Update for Cursor renaming.
5417
  entry->cursor->info(HA_STATUS_VARIABLE);
1532.1.15 by Brian Aker
Partial encapsulation of TableShare from Table.
5418
  if (entry->getShare()->db_type() == heap_engine ||
5419
      (!entry->getShare()->blob_fields &&
1208.3.2 by brian
Update for Cursor renaming.
5420
       ((ALIGN_SIZE(reclength) + HASH_OVERHEAD) * entry->cursor->stats.records <
1578.4.9 by Brian Aker
Modification to use std::vector
5421
        session->variables.sortbuff_size)))
1578.4.10 by Brian Aker
Simple code {} commit (aka style)
5422
  {
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5423
    error= remove_dup_with_hash_index(join->session, entry,
1578.4.9 by Brian Aker
Modification to use std::vector
5424
                                      field_count, first_field,
5425
                                      reclength, having);
1578.4.10 by Brian Aker
Simple code {} commit (aka style)
5426
  }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5427
  else
1578.4.10 by Brian Aker
Simple code {} commit (aka style)
5428
  {
5429
    error= remove_dup_with_compare(join->session, entry, first_field, offset, having);
5430
  }
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5431
5432
  free_blobs(first_field);
1578.4.10 by Brian Aker
Simple code {} commit (aka style)
5433
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5434
  return(error);
5435
}
5436
5437
/**
5438
  Function to setup clauses without sum functions.
5439
*/
5440
static int setup_without_group(Session *session, 
5441
                               Item **ref_pointer_array,
5442
                               TableList *tables,
5443
                               TableList *,
5444
                               List<Item> &fields,
5445
                               List<Item> &all_fields,
5446
                               COND **conds,
5447
                               order_st *order,
5448
                               order_st *group,
5449
                               bool *hidden_group_fields)
5450
{
5451
  int res;
5452
  nesting_map save_allow_sum_func=session->lex->allow_sum_func ;
5453
5454
  session->lex->allow_sum_func&= ~(1 << session->lex->current_select->nest_level);
1109.1.5 by Brian Aker
More extraction from sql_base
5455
  res= session->setup_conds(tables, conds);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5456
5457
  session->lex->allow_sum_func|= 1 << session->lex->current_select->nest_level;
5458
  res= res || setup_order(session, ref_pointer_array, tables, fields, all_fields,
5459
                          order);
5460
  session->lex->allow_sum_func&= ~(1 << session->lex->current_select->nest_level);
5461
  res= res || setup_group(session, ref_pointer_array, tables, fields, all_fields,
5462
                          group, hidden_group_fields);
5463
  session->lex->allow_sum_func= save_allow_sum_func;
5464
  return(res);
5465
}
5466
5467
/**
5468
  Calculate the best possible join and initialize the join structure.
5469
5470
  @retval
5471
    0	ok
5472
  @retval
5473
    1	Fatal error
5474
*/
1541.1.1 by Brian Aker
JOIN -> Join rename
5475
static bool make_join_statistics(Join *join, TableList *tables, COND *conds, DYNAMIC_ARRAY *keyuse_array)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5476
{
5477
  int error;
5478
  Table *table;
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5479
  uint32_t i;
5480
  uint32_t table_count;
5481
  uint32_t const_count;
5482
  uint32_t key;
5483
  table_map found_const_table_map;
5484
  table_map all_table_map;
5485
  table_map found_ref;
5486
  table_map refs;
5487
  key_map const_ref;
5488
  key_map eq_part;
5489
  Table **table_vector= NULL;
5490
  JoinTable *stat= NULL;
5491
  JoinTable *stat_end= NULL;
5492
  JoinTable *s= NULL;
5493
  JoinTable **stat_ref= NULL;
5494
  optimizer::KeyUse *keyuse= NULL;
5495
  optimizer::KeyUse *start_keyuse= NULL;
5496
  table_map outer_join= 0;
1108.6.39 by Padraig O'Sullivan
Placed the SargableParam class in the optimizer namespace and sub-directory.
5497
  vector<optimizer::SargableParam> sargables;
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
5498
  JoinTable *stat_vector[MAX_TABLES+1];
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
5499
  optimizer::Position *partial_pos;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5500
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5501
  table_count= join->tables;
5502
  stat= (JoinTable*) join->session->calloc(sizeof(JoinTable)*table_count);
5503
  stat_ref= (JoinTable**) join->session->alloc(sizeof(JoinTable*)*MAX_TABLES);
5504
  table_vector= (Table**) join->session->alloc(sizeof(Table*)*(table_count*2));
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
5505
  if (! stat || ! stat_ref || ! table_vector)
971.6.11 by Eric Day
Removed purecov messages.
5506
    return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5507
5508
  join->best_ref=stat_vector;
5509
5510
  stat_end=stat+table_count;
5511
  found_const_table_map= all_table_map=0;
5512
  const_count=0;
5513
5514
  for (s= stat, i= 0;
5515
       tables;
5516
       s++, tables= tables->next_leaf, i++)
5517
  {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5518
    TableList *embedding= tables->getEmbedding();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5519
    stat_vector[i]=s;
5520
    s->keys.reset();
5521
    s->const_keys.reset();
5522
    s->checked_keys.reset();
5523
    s->needed_reg.reset();
5524
    table_vector[i]=s->table=table=tables->table;
5525
    table->pos_in_table_list= tables;
1680.6.1 by Brian Aker
Remove call for using special new for a cursor.
5526
    assert(table->cursor);
1208.3.2 by brian
Update for Cursor renaming.
5527
    error= table->cursor->info(HA_STATUS_VARIABLE | HA_STATUS_NO_LOCK);
1108.6.15 by Padraig O'Sullivan
Fixing various style related issues pointed out by Jay during code review.
5528
    if (error)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5529
    {
1216.1.1 by Brian Aker
Move print_error up to Engine.
5530
        table->print_error(error, MYF(0));
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5531
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5532
    }
5533
    table->quick_keys.reset();
5534
    table->reginfo.join_tab=s;
5535
    table->reginfo.not_exists_optimize=0;
5536
    memset(table->const_key_parts, 0,
1578.2.10 by Brian Aker
keys and fields partial encapsulation.
5537
           sizeof(key_part_map)*table->getShare()->sizeKeys());
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5538
    all_table_map|= table->map;
5539
    s->join=join;
5540
    s->info=0;					// For describe
5541
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5542
    s->dependent= tables->getDepTables();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5543
    s->key_dependent= 0;
1208.3.2 by brian
Update for Cursor renaming.
5544
    table->quick_condition_rows= table->cursor->stats.records;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5545
5546
    s->on_expr_ref= &tables->on_expr;
5547
    if (*s->on_expr_ref)
5548
    {
5549
      /* s is the only inner table of an outer join */
1208.3.2 by brian
Update for Cursor renaming.
5550
      if (!table->cursor->stats.records && !embedding)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5551
      {						// Empty table
5552
        s->dependent= 0;                        // Ignore LEFT JOIN depend.
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5553
        set_position(join, const_count++, s, (optimizer::KeyUse*) 0);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5554
        continue;
5555
      }
5556
      outer_join|= table->map;
1100.4.1 by Padraig O'Sullivan
Modified the nested_join_map typedef to be std::bitset instead of uint64_t.
5557
      s->embedding_map.reset();
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5558
      for (;embedding; embedding= embedding->getEmbedding())
5559
        s->embedding_map|= embedding->getNestedJoin()->nj_map;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5560
      continue;
5561
    }
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5562
    if (embedding && !(false && ! embedding->getEmbedding()))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5563
    {
5564
      /* s belongs to a nested join, maybe to several embedded joins */
1100.4.1 by Padraig O'Sullivan
Modified the nested_join_map typedef to be std::bitset instead of uint64_t.
5565
      s->embedding_map.reset();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5566
      do
5567
      {
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5568
        nested_join_st *nested_join= embedding->getNestedJoin();
1100.4.1 by Padraig O'Sullivan
Modified the nested_join_map typedef to be std::bitset instead of uint64_t.
5569
        s->embedding_map|= nested_join->nj_map;
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5570
        s->dependent|= embedding->getDepTables();
5571
        embedding= embedding->getEmbedding();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5572
        outer_join|= nested_join->used_tables;
5573
      }
5574
      while (embedding);
5575
      continue;
5576
    }
1208.3.2 by brian
Update for Cursor renaming.
5577
    if ((table->cursor->stats.records <= 1) && !s->dependent &&
1233.1.2 by Brian Aker
Move stat read define into engine flags.
5578
	      (table->cursor->getEngine()->check_flag(HTON_BIT_STATS_RECORDS_IS_EXACT)) &&
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5579
        !join->no_const_tables)
5580
    {
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5581
      set_position(join, const_count++, s, (optimizer::KeyUse*) 0);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5582
    }
5583
  }
5584
  stat_vector[i]=0;
5585
  join->outer_join=outer_join;
5586
5587
  if (join->outer_join)
5588
  {
5589
    /*
5590
       Build transitive closure for relation 'to be dependent on'.
5591
       This will speed up the plan search for many cases with outer joins,
5592
       as well as allow us to catch illegal cross references/
5593
       Warshall's algorithm is used to build the transitive closure.
5594
       As we use bitmaps to represent the relation the complexity
5595
       of the algorithm is O((number of tables)^2).
5596
    */
5597
    for (i= 0, s= stat ; i < table_count ; i++, s++)
5598
    {
5599
      for (uint32_t j= 0 ; j < table_count ; j++)
5600
      {
5601
        table= stat[j].table;
5602
        if (s->dependent & table->map)
5603
          s->dependent |= table->reginfo.join_tab->dependent;
5604
      }
5605
      if (s->dependent)
5606
        s->table->maybe_null= 1;
5607
    }
5608
    /* Catch illegal cross references for outer joins */
5609
    for (i= 0, s= stat ; i < table_count ; i++, s++)
5610
    {
5611
      if (s->dependent & s->table->map)
5612
      {
5613
        join->tables=0;			// Don't use join->table
5614
        my_message(ER_WRONG_OUTER_JOIN, ER(ER_WRONG_OUTER_JOIN), MYF(0));
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5615
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5616
      }
5617
      s->key_dependent= s->dependent;
5618
    }
5619
  }
5620
5621
  if (conds || outer_join)
5622
    if (update_ref_and_keys(join->session, keyuse_array, stat, join->tables,
5623
                            conds, join->cond_equal,
1108.6.33 by Padraig O'Sullivan
Use std::vector to hold an array of SargableParam objects instead of a
5624
                            ~outer_join, join->select_lex, sargables))
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5625
      return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5626
5627
  /* Read tables with 0 or 1 rows (system tables) */
5628
  join->const_table_map= 0;
5629
1108.6.29 by Padraig O'Sullivan
Added an optimizer namespace and sub-directory within drizzled. Moved the
5630
  optimizer::Position *p_pos= join->getFirstPosInPartialPlan();
5631
  optimizer::Position *p_end= join->getSpecificPosInPartialPlan(const_count);
1108.6.8 by Padraig O'Sullivan
Made the positions member of the JOIN class private (finally got that
5632
  while (p_pos < p_end)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5633
  {
5634
    int tmp;
1108.6.26 by Padraig O'Sullivan
Made the table member of Position private and added necessary accessors
5635
    s= p_pos->getJoinTable();
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5636
    s->type= AM_SYSTEM;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5637
    join->const_table_map|=s->table->map;
1108.6.16 by Padraig O'Sullivan
Adding space after negation operators in places where I forgot that.
5638
    if ((tmp= join_read_const_table(s, p_pos)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5639
    {
5640
      if (tmp > 0)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5641
        return 1;			// Fatal error
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5642
    }
5643
    else
5644
      found_const_table_map|= s->table->map;
1108.6.8 by Padraig O'Sullivan
Made the positions member of the JOIN class private (finally got that
5645
    p_pos++;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5646
  }
5647
5648
  /* loop until no more const tables are found */
5649
  int ref_changed;
5650
  do
5651
  {
5652
  more_const_tables_found:
5653
    ref_changed = 0;
5654
    found_ref=0;
5655
5656
    /*
5657
      We only have to loop from stat_vector + const_count as
5658
      set_position() will move all const_tables first in stat_vector
5659
    */
5660
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5661
    for (JoinTable **pos= stat_vector+const_count; (s= *pos); pos++)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5662
    {
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5663
      table= s->table;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5664
5665
      /*
5666
        If equi-join condition by a key is null rejecting and after a
5667
        substitution of a const table the key value happens to be null
5668
        then we can state that there are no matches for this equi-join.
5669
      */
1100.4.1 by Padraig O'Sullivan
Modified the nested_join_map typedef to be std::bitset instead of uint64_t.
5670
      if ((keyuse= s->keyuse) && *s->on_expr_ref && s->embedding_map.none())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5671
      {
5672
        /*
5673
          When performing an outer join operation if there are no matching rows
5674
          for the single row of the outer table all the inner tables are to be
5675
          null complemented and thus considered as constant tables.
5676
          Here we apply this consideration to the case of outer join operations
5677
          with a single inner table only because the case with nested tables
5678
          would require a more thorough analysis.
5679
          TODO. Apply single row substitution to null complemented inner tables
5680
          for nested outer join operations.
5681
        */
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5682
        while (keyuse->getTable() == table)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5683
        {
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5684
          if (! (keyuse->getVal()->used_tables() & ~join->const_table_map) &&
5685
              keyuse->getVal()->is_null() && keyuse->isNullRejected())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5686
          {
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5687
            s->type= AM_CONST;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5688
            table->mark_as_null_row();
5689
            found_const_table_map|= table->map;
5690
            join->const_table_map|= table->map;
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5691
            set_position(join, const_count++, s, (optimizer::KeyUse*) 0);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5692
            goto more_const_tables_found;
5693
           }
5694
          keyuse++;
5695
        }
5696
      }
5697
5698
      if (s->dependent)				// If dependent on some table
5699
      {
5700
        // All dep. must be constants
5701
        if (s->dependent & ~(found_const_table_map))
5702
          continue;
1208.3.2 by brian
Update for Cursor renaming.
5703
        if (table->cursor->stats.records <= 1L &&
1233.1.2 by Brian Aker
Move stat read define into engine flags.
5704
            (table->cursor->getEngine()->check_flag(HTON_BIT_STATS_RECORDS_IS_EXACT)) &&
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5705
                  !table->pos_in_table_list->getEmbedding())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5706
        {					// system table
5707
          int tmp= 0;
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5708
          s->type= AM_SYSTEM;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5709
          join->const_table_map|=table->map;
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5710
          set_position(join, const_count++, s, (optimizer::KeyUse*) 0);
1108.6.10 by Padraig O'Sullivan
Changing some accessors to be more clear on whether they are accessing the
5711
          partial_pos= join->getSpecificPosInPartialPlan(const_count - 1);
1108.6.8 by Padraig O'Sullivan
Made the positions member of the JOIN class private (finally got that
5712
          if ((tmp= join_read_const_table(s, partial_pos)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5713
          {
5714
            if (tmp > 0)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5715
              return 1;			// Fatal error
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5716
          }
5717
          else
5718
            found_const_table_map|= table->map;
5719
          continue;
5720
        }
5721
      }
5722
      /* check if table can be read by key or table only uses const refs */
5723
      if ((keyuse=s->keyuse))
5724
      {
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5725
        s->type= AM_REF;
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5726
        while (keyuse->getTable() == table)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5727
        {
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5728
          start_keyuse= keyuse;
5729
          key= keyuse->getKey();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5730
          s->keys.set(key);               // QQ: remove this ?
5731
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5732
          refs= 0;
5733
          const_ref.reset();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5734
          eq_part.reset();
5735
          do
5736
          {
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5737
            if (keyuse->getVal()->type() != Item::NULL_ITEM && 
5738
                ! keyuse->getOptimizeFlags())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5739
            {
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5740
              if (! ((~found_const_table_map) & keyuse->getUsedTables()))
5741
                const_ref.set(keyuse->getKeypart());
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5742
              else
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5743
                refs|= keyuse->getUsedTables();
5744
              eq_part.set(keyuse->getKeypart());
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5745
            }
5746
            keyuse++;
1108.6.57 by Padraig O'Sullivan
Made all members of the KeyUse class private and provided appropriate
5747
          } while (keyuse->getTable() == table && keyuse->getKey() == key);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5748
5749
          if (is_keymap_prefix(eq_part, table->key_info[key].key_parts) &&
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5750
              ! table->pos_in_table_list->getEmbedding())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5751
          {
5752
            if ((table->key_info[key].flags & (HA_NOSAME)) == HA_NOSAME)
5753
            {
5754
              if (const_ref == eq_part)
5755
              {					// Found everything for ref.
5756
                int tmp;
5757
                ref_changed = 1;
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5758
                s->type= AM_CONST;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5759
                join->const_table_map|= table->map;
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5760
                set_position(join, const_count++, s, start_keyuse);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5761
                if (create_ref_for_key(join, s, start_keyuse, found_const_table_map))
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5762
                  return 1;
1108.6.10 by Padraig O'Sullivan
Changing some accessors to be more clear on whether they are accessing the
5763
                partial_pos= join->getSpecificPosInPartialPlan(const_count - 1);
1108.6.8 by Padraig O'Sullivan
Made the positions member of the JOIN class private (finally got that
5764
                if ((tmp=join_read_const_table(s, partial_pos)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5765
                {
5766
                  if (tmp > 0)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5767
                    return 1;			// Fatal error
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5768
                }
5769
                else
5770
                  found_const_table_map|= table->map;
5771
                break;
5772
              }
5773
              else
5774
                found_ref|= refs;      // Table is const if all refs are const
5775
            }
5776
            else if (const_ref == eq_part)
5777
              s->const_keys.set(key);
5778
          }
5779
        }
5780
      }
5781
    }
5782
  } while (join->const_table_map & found_ref && ref_changed);
5783
5784
  /*
5785
    Update info on indexes that can be used for search lookups as
5786
    reading const tables may has added new sargable predicates.
5787
  */
1108.6.33 by Padraig O'Sullivan
Use std::vector to hold an array of SargableParam objects instead of a
5788
  if (const_count && ! sargables.empty())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5789
  {
1108.6.39 by Padraig O'Sullivan
Placed the SargableParam class in the optimizer namespace and sub-directory.
5790
    vector<optimizer::SargableParam>::iterator iter= sargables.begin();
1108.6.33 by Padraig O'Sullivan
Use std::vector to hold an array of SargableParam objects instead of a
5791
    while (iter != sargables.end())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5792
    {
1108.6.38 by Padraig O'Sullivan
Made all data members of the SargableParam class private.
5793
      Field *field= (*iter).getField();
1660.1.3 by Brian Aker
Encapsulate Table in field
5794
      JoinTable *join_tab= field->getTable()->reginfo.join_tab;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5795
      key_map possible_keys= field->key_start;
1660.1.3 by Brian Aker
Encapsulate Table in field
5796
      possible_keys&= field->getTable()->keys_in_use_for_query;
1108.6.38 by Padraig O'Sullivan
Made all data members of the SargableParam class private.
5797
      bool is_const= true;
5798
      for (uint32_t j= 0; j < (*iter).getNumValues(); j++)
5799
        is_const&= (*iter).isConstItem(j);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5800
      if (is_const)
5801
        join_tab[0].const_keys|= possible_keys;
1108.6.33 by Padraig O'Sullivan
Use std::vector to hold an array of SargableParam objects instead of a
5802
      ++iter;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5803
    }
5804
  }
5805
5806
  /* Calc how many (possible) matched records in each table */
5807
5808
  for (s=stat ; s < stat_end ; s++)
5809
  {
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5810
    if (s->type == AM_SYSTEM || s->type == AM_CONST)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5811
    {
5812
      /* Only one matching row */
5813
      s->found_records=s->records=s->read_time=1; s->worst_seeks=1.0;
5814
      continue;
5815
    }
5816
    /* Approximate found rows and time to read them */
1208.3.2 by brian
Update for Cursor renaming.
5817
    s->found_records=s->records=s->table->cursor->stats.records;
5818
    s->read_time=(ha_rows) s->table->cursor->scan_time();
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5819
5820
    /*
5821
      Set a max range of how many seeks we can expect when using keys
5822
      This is can't be to high as otherwise we are likely to use
5823
      table scan.
5824
    */
1067.4.4 by Nathan Williams
The rest of the files in the drizzled directory were purged of the cmin macro and replace with std::min (except for the definition in globals.h and 1 usage in stacktrace.cc).
5825
    s->worst_seeks= min((double) s->found_records / 10,
5826
                        (double) s->read_time*3);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5827
    if (s->worst_seeks < 2.0)			// Fix for small tables
5828
      s->worst_seeks=2.0;
5829
5830
    /*
5831
      Add to stat->const_keys those indexes for which all group fields or
5832
      all select distinct fields participate in one index.
5833
    */
5834
    add_group_and_distinct_keys(join, s);
5835
5836
    if (s->const_keys.any() &&
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5837
        !s->table->pos_in_table_list->getEmbedding())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5838
    {
5839
      ha_rows records;
1237.13.3 by Padraig O'Sullivan
Performed numerous style cleanups in range.[cc,h].
5840
      optimizer::SqlSelect *select= NULL;
1237.9.2 by Padraig O'Sullivan
Moved opt_range.[cc,h] into the optimizer directory and namespace and renamed the files to
5841
      select= optimizer::make_select(s->table, found_const_table_map, found_const_table_map, *s->on_expr_ref ? *s->on_expr_ref : conds, 1, &error);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5842
      if (! select)
1108.6.18 by Padraig O'Sullivan
Updating some return statements to adhere to the convention laid out in the
5843
        return 1;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5844
      records= get_quick_record_count(join->session, select, s->table, &s->const_keys, join->row_limit);
5845
      s->quick=select->quick;
5846
      s->needed_reg=select->needed_reg;
5847
      select->quick=0;
5848
      if (records == 0 && s->table->reginfo.impossible_range)
5849
      {
5850
        /*
5851
          Impossible WHERE or ON expression
5852
          In case of ON, we mark that the we match one empty NULL row.
5853
          In case of WHERE, don't set found_const_table_map to get the
5854
          caller to abort with a zero row result.
5855
        */
5856
        join->const_table_map|= s->table->map;
1108.6.60 by Padraig O'Sullivan
Fixed some style related issues Jay pointed out during code review.
5857
        set_position(join, const_count++, s, (optimizer::KeyUse*) 0);
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5858
        s->type= AM_CONST;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5859
        if (*s->on_expr_ref)
5860
        {
5861
          /* Generate empty row */
5862
          s->info= "Impossible ON condition";
5863
          found_const_table_map|= s->table->map;
1108.6.20 by Padraig O'Sullivan
Renamed access_type to access_method due to conflicts on Solaris.
5864
          s->type= AM_CONST;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5865
          s->table->mark_as_null_row();		// All fields are NULL
5866
        }
5867
      }
5868
      if (records != HA_POS_ERROR)
5869
      {
5870
        s->found_records=records;
5871
        s->read_time= (ha_rows) (s->quick ? s->quick->read_time : 0.0);
5872
      }
5873
      delete select;
5874
    }
5875
  }
5876
5877
  join->join_tab=stat;
5878
  join->map2table=stat_ref;
5879
  join->table= join->all_tables=table_vector;
5880
  join->const_tables=const_count;
5881
  join->found_const_table_map=found_const_table_map;
5882
5883
  /* Find an optimal join order of the non-constant tables. */
5884
  if (join->const_tables != join->tables)
5885
  {
5886
    optimize_keyuse(join, keyuse_array);
1280.3.16 by Padraig O'Sullivan
Updated the calls to dtrace probes to use the c_str() pointer from query in Session
5887
    DRIZZLE_QUERY_OPT_CHOOSE_PLAN_START(join->session->query.c_str(), join->session->thread_id);
1241.7.6 by Padraig O'Sullivan
Added some dtrace probes for tracing the optimizer.
5888
    bool res= choose_plan(join, all_table_map & ~join->const_table_map);
5889
    DRIZZLE_QUERY_OPT_CHOOSE_PLAN_DONE(res ? 1 : 0);
5890
    if (res)
5891
      return true;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5892
  }
5893
  else
5894
  {
1108.6.4 by Padraig O'Sullivan
Made the best_positions member of the JOIN class private and added any
5895
    join->copyPartialPlanIntoOptimalPlan(join->const_tables);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5896
    join->best_read= 1.0;
5897
  }
5898
  /* Generate an execution plan from the found optimal join order. */
5899
  return (join->session->killed || get_best_combination(join));
5900
}
5901
5902
/**
1100.4.2 by Padraig O'Sullivan
Removed the typedef for nested_join_map and instead just declare these
5903
  Assign each nested join structure a bit in the nested join bitset.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5904
5905
    Assign each nested join structure (except "confluent" ones - those that
1100.4.2 by Padraig O'Sullivan
Removed the typedef for nested_join_map and instead just declare these
5906
    embed only one element) a bit in the nested join bitset.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5907
5908
  @param join          Join being processed
5909
  @param join_list     List of tables
1100.4.2 by Padraig O'Sullivan
Removed the typedef for nested_join_map and instead just declare these
5910
  @param first_unused  Number of first unused bit in the nest joing bitset before the
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5911
                       call
5912
5913
  @note
5914
    This function is called after simplify_joins(), when there are no
5915
    redundant nested joins, #non_confluent_nested_joins <= #tables_in_join so
1100.4.2 by Padraig O'Sullivan
Removed the typedef for nested_join_map and instead just declare these
5916
    we will not run out of bits in the nested join bitset.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5917
5918
  @return
1100.4.2 by Padraig O'Sullivan
Removed the typedef for nested_join_map and instead just declare these
5919
    First unused bit in the nest join bitset after the call.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5920
*/
5921
static uint32_t build_bitmap_for_nested_joins(List<TableList> *join_list, uint32_t first_unused)
5922
{
5923
  List_iterator<TableList> li(*join_list);
5924
  TableList *table;
5925
  while ((table= li++))
5926
  {
5927
    nested_join_st *nested_join;
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5928
    if ((nested_join= table->getNestedJoin()))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5929
    {
5930
      /*
5931
        It is guaranteed by simplify_joins() function that a nested join
5932
        that has only one child is either
5933
         - a single-table view (the child is the underlying table), or
5934
         - a single-table semi-join nest
5935
5936
        We don't assign bits to such sj-nests because
5937
        1. it is redundant (a "sequence" of one table cannot be interleaved
5938
            with anything)
1100.4.2 by Padraig O'Sullivan
Removed the typedef for nested_join_map and instead just declare these
5939
        2. we could run out of bits in the nested join bitset otherwise.
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5940
      */
5941
      if (nested_join->join_list.elements != 1)
5942
      {
5943
        /* Don't assign bits to sj-nests */
5944
        if (table->on_expr)
1100.4.1 by Padraig O'Sullivan
Modified the nested_join_map typedef to be std::bitset instead of uint64_t.
5945
          nested_join->nj_map.set(first_unused++);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
5946
        first_unused= build_bitmap_for_nested_joins(&nested_join->join_list,
5947
                                                    first_unused);
5948
      }
5949
    }
5950
  }
5951
  return(first_unused);
5952
}
5953
5954
5955
/**
5956
  Return table number if there is only one table in sort order
5957
  and group and order is compatible, else return 0.
5958
*/
5959
static Table *get_sort_by_table(order_st *a,order_st *b,TableList *tables)
5960
{
5961
  table_map map= (table_map) 0;
5962
5963
  if (!a)
5964
    a= b;					// Only one need to be given
5965
  else if (!b)
5966
    b= a;
5967
5968
  for (; a && b; a=a->next,b=b->next)
5969
  {
5970
    if (!(*a->item)->eq(*b->item,1))
5971
      return (Table *) NULL;
5972
    map|= a->item[0]->used_tables();
5973
  }
5974
  if (!map || (map & (RAND_TABLE_BIT | OUTER_REF_TABLE_BIT)))
5975
    return (Table *) NULL;
5976
5977
  for (; !(map & tables->table->map); tables= tables->next_leaf) {};
5978
  if (map != tables->table->map)
5979
    return (Table *) NULL;				// More than one table
5980
  return tables->table;
5981
}
5982
5983
/**
5984
  Set nested_join_st::counter=0 in all nested joins in passed list.
5985
5986
    Recursively set nested_join_st::counter=0 for all nested joins contained in
5987
    the passed join_list.
5988
5989
  @param join_list  List of nested joins to process. It may also contain base
5990
                    tables which will be ignored.
5991
*/
5992
static void reset_nj_counters(List<TableList> *join_list)
5993
{
5994
  List_iterator<TableList> li(*join_list);
5995
  TableList *table;
5996
  while ((table= li++))
5997
  {
5998
    nested_join_st *nested_join;
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
5999
    if ((nested_join= table->getNestedJoin()))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6000
    {
6001
      nested_join->counter_= 0;
6002
      reset_nj_counters(&nested_join->join_list);
6003
    }
6004
  }
6005
  return;
6006
}
6007
6008
/**
6009
  Return 1 if second is a subpart of first argument.
6010
6011
  If first parts has different direction, change it to second part
6012
  (group is sorted like order)
6013
*/
6014
static bool test_if_subpart(order_st *a,order_st *b)
6015
{
6016
  for (; a && b; a=a->next,b=b->next)
6017
  {
6018
    if ((*a->item)->eq(*b->item,1))
6019
      a->asc=b->asc;
6020
    else
6021
      return 0;
6022
  }
6023
  return test(!b);
6024
}
6025
6026
/**
6027
  Nested joins perspective: Remove the last table from the join order.
6028
1637.5.9 by Prafulla Tekawade
Fix for Bug 592444
6029
  The algorithm is the reciprocal of check_interleaving_with_nj(), hence
6030
  parent join nest nodes are updated only when the last table in its child
6031
  node is removed. The ASCII graphic below will clarify.
6032
6033
  %A table nesting such as <tt> t1 x [ ( t2 x t3 ) x ( t4 x t5 ) ] </tt>is
6034
  represented by the below join nest tree.
6035
6036
  @verbatim
6037
                     NJ1
6038
                  _/ /  \
6039
                _/  /    NJ2
6040
              _/   /     / \ 
6041
             /    /     /   \
6042
   t1 x [ (t2 x t3) x (t4 x t5) ]
6043
  @endverbatim
6044
6045
  At the point in time when check_interleaving_with_nj() adds the table t5 to
6046
  the query execution plan, QEP, it also directs the node named NJ2 to mark
6047
  the table as covered. NJ2 does so by incrementing its @c counter
6048
  member. Since all of NJ2's tables are now covered by the QEP, the algorithm
6049
  proceeds up the tree to NJ1, incrementing its counter as well. All join
6050
  nests are now completely covered by the QEP.
6051
6052
  restore_prev_nj_state() does the above in reverse. As seen above, the node
6053
  NJ1 contains the nodes t2, t3, and NJ2. Its counter being equal to 3 means
6054
  that the plan covers t2, t3, and NJ2, @e and that the sub-plan (t4 x t5)
6055
  completely covers NJ2. The removal of t5 from the partial plan will first
6056
  decrement NJ2's counter to 1. It will then detect that NJ2 went from being
6057
  completely to partially covered, and hence the algorithm must continue
6058
  upwards to NJ1 and decrement its counter to 2. %A subsequent removal of t4
6059
  will however not influence NJ1 since it did not un-cover the last table in
6060
  NJ2.
6061
6062
  SYNOPSIS
6063
    restore_prev_nj_state()
6064
      last  join table to remove, it is assumed to be the last in current 
6065
            partial join order.
6066
     
6067
  DESCRIPTION
6068
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6069
    Remove the last table from the partial join order and update the nested
1637.5.9 by Prafulla Tekawade
Fix for Bug 592444
6070
    joins counters and join->cur_embedding_map. It is ok to call this 
6071
    function for the first table in join order (for which 
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6072
    check_interleaving_with_nj has not been called)
6073
6074
  @param last  join table to remove, it is assumed to be the last in current
6075
               partial join order.
6076
*/
1637.5.9 by Prafulla Tekawade
Fix for Bug 592444
6077
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
6078
static void restore_prev_nj_state(JoinTable *last)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6079
{
1637.2.7 by Vijay Samuel
Merge encapsulate TableList-2.
6080
  TableList *last_emb= last->table->pos_in_table_list->getEmbedding();
1541.1.1 by Brian Aker
JOIN -> Join rename
6081
  Join *join= last->join;
1637.5.9 by Prafulla Tekawade
Fix for Bug 592444
6082
  for (;last_emb != NULL; last_emb= last_emb->getEmbedding())
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6083
  {
1637.5.9 by Prafulla Tekawade
Fix for Bug 592444
6084
    nested_join_st *nest= last_emb->getNestedJoin();
6085
    
6086
    bool was_fully_covered= nest->is_fully_covered();
6087
    
6088
    if (--nest->counter_ == 0)
6089
      join->cur_embedding_map&= ~nest->nj_map;
6090
    
6091
    if (!was_fully_covered)
6092
      break;
6093
    
6094
    join->cur_embedding_map|= nest->nj_map;
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6095
  }
6096
}
6097
6098
/**
6099
  Create a condition for a const reference and add this to the
6100
  currenct select for the table.
6101
*/
1089.1.1 by Brian Aker
Remove of JOIN_TAB to JoinTable
6102
static bool add_ref_to_table_cond(Session *session, JoinTable *join_tab)
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6103
{
6104
  if (!join_tab->ref.key_parts)
6105
    return(false);
6106
6107
  Item_cond_and *cond=new Item_cond_and();
6108
  Table *table=join_tab->table;
6109
  int error;
6110
  if (!cond)
6111
    return(true);
6112
6113
  for (uint32_t i=0 ; i < join_tab->ref.key_parts ; i++)
6114
  {
1578.2.16 by Brian Aker
Merge in change to getTable() to private the field objects.
6115
    Field *field=table->getField(table->key_info[join_tab->ref.key].key_part[i].fieldnr - 1);
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6116
    Item *value=join_tab->ref.items[i];
6117
    cond->add(new Item_func_equal(new Item_field(field), value));
6118
  }
6119
  if (session->is_fatal_error)
6120
    return(true);
6121
6122
  if (!cond->fixed)
6123
    cond->fix_fields(session, (Item**)&cond);
6124
  if (join_tab->select)
6125
  {
6126
    error=(int) cond->add(join_tab->select->cond);
6127
    join_tab->select_cond=join_tab->select->cond=cond;
6128
  }
1237.9.2 by Padraig O'Sullivan
Moved opt_range.[cc,h] into the optimizer directory and namespace and renamed the files to
6129
  else if ((join_tab->select= optimizer::make_select(join_tab->table, 0, 0, cond, 0,
6130
                                                     &error)))
1039.2.2 by Jay Pipes
Phase 2 of JOIN refactoring.
6131
    join_tab->select_cond=cond;
6132
6133
  return(error ? true : false);
6134
}
6135
6136
static void free_blobs(Field **ptr)
6137
{
6138
  for (; *ptr ; ptr++)
6139
  {
6140
    if ((*ptr)->flags & BLOB_FLAG)
6141
      ((Field_blob *) (*ptr))->free();
6142
  }
6143
}
6144
6145
/**
6146
  @} (end of group Query_Optimizer)
6147
*/
1280.1.10 by Monty Taylor
Put everything in drizzled into drizzled namespace.
6148
6149
} /* namespace drizzled */