sql/item_subselect.cc

/* Copyright (c) 2002, 2015, Oracle and/or its affiliates. All rights reserved. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; version 2 of the License. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, 51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA */ /** @file @brief subselect Item @todo - add function from mysql_select that use JOIN* as parameter to JOIN methods (sql_select.h/sql_select.cc) */ #include "sql_priv.h" /* It is necessary to include set_var.h instead of item.h because there are dependencies on include order for set_var.h and item.h. This will be resolved later. */ #include "sql_class.h" // set_var.h: THD #include "set_var.h" #include "sql_select.h" #include "opt_trace.h" #include "sql_parse.h" // check_stack_overrun #include "sql_derived.h" // mysql_derived_create, ... #include "debug_sync.h" #include "sql_test.h" #include "sql_join_buffer.h" // JOIN_CACHE #include "sql_optimizer.h" // JOIN #include "opt_explain_format.h" Item_subselect::Item_subselect(): Item_result_field(), value_assigned(0), traced_before(false), substitution(NULL), in_cond_of_tab(INT_MIN), engine(NULL), old_engine(NULL), used_tables_cache(0), have_to_be_excluded(0), const_item_cache(1), engine_changed(false), changed(false) { with_subselect= 1; reset(); /* Item value is NULL if select_result_interceptor didn't change this value (i.e. some rows will be found returned) */ null_value= TRUE; } void Item_subselect::init(st_select_lex *select_lex, select_result_interceptor *result) { /* Please see Item_singlerow_subselect::invalidate_and_restore_select_lex(), which depends on alterations to the parse tree implemented here. */ DBUG_ENTER("Item_subselect::init"); DBUG_PRINT("enter", ("select_lex: 0x%lx", (long) select_lex)); unit= select_lex->master_unit(); if (unit->item) { /* Item can be changed in JOIN::prepare while engine in JOIN::optimize => we do not copy old_engine here */ engine= unit->item->engine; parsing_place= unit->item->parsing_place; unit->item->engine= 0; unit->item= this; engine->change_result(this, result); } else { SELECT_LEX *outer_select= unit->outer_select(); /* do not take into account expression inside aggregate functions because they can access original table fields */ parsing_place= (outer_select->in_sum_expr ? NO_MATTER : outer_select->parsing_place); if (unit->is_union()) engine= new subselect_union_engine(unit, result, this); else engine= new subselect_single_select_engine(select_lex, result, this); } { SELECT_LEX *upper= unit->outer_select(); if (upper->parsing_place == IN_HAVING) upper->subquery_in_having= 1; } DBUG_VOID_RETURN; } void Item_subselect::cleanup() { DBUG_ENTER("Item_subselect::cleanup"); Item_result_field::cleanup(); if (old_engine) { if (engine) { engine->cleanup(); delete engine; } engine= old_engine; old_engine= 0; } if (engine) engine->cleanup(); reset(); value_assigned= 0; traced_before= false; in_cond_of_tab= INT_MIN; DBUG_VOID_RETURN; } void Item_singlerow_subselect::cleanup() { DBUG_ENTER("Item_singlerow_subselect::cleanup"); value= 0; row= 0; Item_subselect::cleanup(); DBUG_VOID_RETURN; } bool Item_in_subselect::finalize_exists_transform(SELECT_LEX *select_lex) { DBUG_ASSERT(exec_method == EXEC_EXISTS_OR_MAT || exec_method == EXEC_EXISTS); /* Change SELECT expr1, expr2 to SELECT 1,1 because EXISTS does not care about the selected expressions, only about the existence of rows. If UNION, we have to modify the SELECT list of each SELECT in the UNION, fortunately this function is indeed called for each SELECT_LEX. If this is a prepared statement, we must allow the next execution to use materialization. So, we should back up the original SELECT list. If this is a UNION, this means backing up the N original SELECT lists. To avoid this constraint, we change the SELECT list only if this is not a prepared statement. */ if (unit->thd->stmt_arena->is_conventional()) // not prepared stmt { uint cnt= select_lex->item_list.elements; select_lex->item_list.empty(); for(; cnt > 0; cnt--) select_lex->item_list.push_back(new Item_int(NAME_STRING("Not_used"), (longlong) 1, MY_INT64_NUM_DECIMAL_DIGITS)); Opt_trace_context * const trace= &unit->thd->opt_trace; OPT_TRACE_TRANSFORM(trace, oto0, oto1, select_lex->select_number, "IN (SELECT)", "EXISTS (CORRELATED SELECT)"); oto1.add("put_1_in_SELECT_list", true); } /* Note that if the subquery is "SELECT1 UNION SELECT2" then this is not working optimally (Bug#14215895). */ unit->global_parameters->select_limit= new Item_int((int32) 1); unit->set_limit(unit->global_parameters); select_lex->join->allow_outer_refs= true; // for JOIN::set_prefix_tables() exec_method= EXEC_EXISTS; return false; } /* Removes every predicate injected by IN->EXISTS. This function is different from others: - it wants to remove all traces of IN->EXISTS (for materialization) - remove_subq_pushed_predicates() and remove_additional_cond() want to remove only the conditions of IN->EXISTS which index lookup already satisfies (they are just an optimization). Code reading suggests that remove_additional_cond() is equivalent to "if in_subs->left_expr->cols()==1 then remove_in2exists_conds(where)" but that would still not fix Bug#13915291 of remove_additional_cond(). @param conds condition @returns new condition */ Item *Item_in_subselect::remove_in2exists_conds(Item* conds) { if (conds->created_by_in2exists()) return NULL; if (conds->type() != Item::COND_ITEM) return conds; Item_cond *cnd= static_cast<Item_cond *>(conds); /* If IN->EXISTS has added something to 'conds', cnd must be AND list and we must inspect each member. */ if (cnd->functype() != Item_func::COND_AND_FUNC) return conds; List_iterator<Item> li(*(cnd->argument_list())); Item *item; while ((item= li++)) { // remove() does not invalidate iterator. if (item->created_by_in2exists()) li.remove(); } switch (cnd->argument_list()->elements) { case 0: return NULL; case 1: // AND(x) is the same as x, return x return cnd->argument_list()->head(); default: // otherwise return AND return conds; } } bool Item_in_subselect::finalize_materialization_transform(JOIN *join) { DBUG_ASSERT(exec_method == EXEC_EXISTS_OR_MAT); DBUG_ASSERT(engine->engine_type() == subselect_engine::SINGLE_SELECT_ENGINE); THD * const thd= unit->thd; subselect_single_select_engine *old_engine_derived= static_cast<subselect_single_select_engine*>(engine); DBUG_ASSERT(join == old_engine_derived->join); // No UNION in materialized subquery so this holds: DBUG_ASSERT(join->select_lex == unit->first_select()); DBUG_ASSERT(join->unit == unit); DBUG_ASSERT(unit->global_parameters->select_limit == NULL); exec_method= EXEC_MATERIALIZATION; /* We need to undo several changes which IN->EXISTS had done. But we first back them up, so that the next execution of the statement is allowed to choose IN->EXISTS. */ /* Undo conditions injected by IN->EXISTS. Condition guards, which those conditions maybe used, are not needed anymore. Subquery becomes 'not dependent' again, as before IN->EXISTS. */ if (join->conds) join->conds= remove_in2exists_conds(join->conds); if (join->having) join->having= remove_in2exists_conds(join->having); DBUG_ASSERT(!originally_dependent()); join->select_lex->uncacheable&= ~UNCACHEABLE_DEPENDENT; /* IN->EXISTS uses master_unit(); however, as we cannot have a UNION here, 'unit' must be correct too. */ DBUG_ASSERT(unit == join->select_lex->master_unit()); unit->uncacheable&= ~UNCACHEABLE_DEPENDENT; OPT_TRACE_TRANSFORM(&thd->opt_trace, oto0, oto1, old_engine_derived->join->select_lex->select_number, "IN (SELECT)", "materialization"); oto1.add("chosen", true); subselect_hash_sj_engine * const new_engine= new subselect_hash_sj_engine(thd, this, old_engine_derived); if (!new_engine) return true; if (new_engine->setup(unit->get_unit_column_types())) { /* For some reason we cannot use materialization for this IN predicate. Delete all materialization-related objects, and return error. */ new_engine->cleanup(); delete new_engine; return true; } if (change_engine(new_engine)) return true; join->allow_outer_refs= false; // for JOIN::set_prefix_tables() return false; } void Item_in_subselect::cleanup() { DBUG_ENTER("Item_in_subselect::cleanup"); if (left_expr_cache) { left_expr_cache->delete_elements(); delete left_expr_cache; left_expr_cache= NULL; } left_expr_cache_filled= false; need_expr_cache= TRUE; switch(exec_method) { case EXEC_MATERIALIZATION: unit->first_select()->uncacheable|= UNCACHEABLE_DEPENDENT; unit->uncacheable|= UNCACHEABLE_DEPENDENT; // fall through case EXEC_EXISTS: /* Back to EXISTS_OR_MAT, so that next execution of this statement can choose between the two. */ unit->global_parameters->select_limit= NULL; exec_method= EXEC_EXISTS_OR_MAT; break; default: break; } Item_subselect::cleanup(); DBUG_VOID_RETURN; } Item_subselect::~Item_subselect() { delete engine; } Item_subselect::trans_res Item_subselect::select_transformer(JOIN *join) { DBUG_ENTER("Item_subselect::select_transformer"); DBUG_RETURN(RES_OK); } bool Item_subselect::fix_fields(THD *thd, Item **ref) { char const *save_where= thd->where; uint8 uncacheable; bool res; DBUG_ASSERT(fixed == 0); /* Pointers to THD must match. unit::thd may vary over the lifetime of the item (for example triggers, and thus their Item-s, are in a cache shared by all connections), but reinit_stmt_before_use() keeps it up-to-date, which we check here. subselect_union_engine functions also do sanity checks. */ DBUG_ASSERT(thd == unit->thd); #ifndef DBUG_OFF // Engine accesses THD via its 'item' pointer, check it: DBUG_ASSERT(engine->get_item() == this); #endif engine->set_thd_for_result(); if (check_stack_overrun(thd, STACK_MIN_SIZE, (uchar*)&res)) return TRUE; if (!(res= engine->prepare())) { // all transformation is done (used by prepared statements) changed= 1; /* Substitute the current item with an Item_in_optimizer that was created by Item_in_subselect::select_in_like_transformer and call fix_fields for the substituted item which in turn calls engine->prepare for the subquery predicate. */ if (substitution) { int ret= 0; // did we changed top item of WHERE condition if (unit->outer_select()->where == (*ref)) unit->outer_select()->where= substitution; // correct WHERE for PS else if (unit->outer_select()->having == (*ref)) unit->outer_select()->having= substitution; // correct HAVING for PS (*ref)= substitution; substitution->item_name= item_name; if (have_to_be_excluded) engine->exclude(); substitution= 0; thd->where= "checking transformed subquery"; if (!(*ref)->fixed) ret= (*ref)->fix_fields(thd, ref); thd->where= save_where; return ret; } // Is it one field subselect? if (engine->cols() > max_columns) { my_error(ER_OPERAND_COLUMNS, MYF(0), 1); return TRUE; } fix_length_and_dec(); } else goto err; if ((uncacheable= engine->uncacheable())) { const_item_cache= 0; if (uncacheable & UNCACHEABLE_RAND) used_tables_cache|= RAND_TABLE_BIT; } fixed= 1; err: thd->where= save_where; return res; } /** Apply walk() processor to join conditions. JOINs may be nested. Walk nested joins recursively to apply the processor. */ bool Item_subselect::walk_join_condition(List<TABLE_LIST> *tables, Item_processor processor, bool walk_subquery, uchar *argument) { TABLE_LIST *table; List_iterator<TABLE_LIST> li(*tables); while ((table= li++)) { if (table->join_cond() && table->join_cond()->walk(processor, walk_subquery, argument)) return true; if (table->nested_join != NULL && walk_join_condition(&table->nested_join->join_list, processor, walk_subquery, argument)) return true; } return false; } /** Workaround for bug in gcc 4.1. @See Item_in_subselect::walk() */ bool Item_subselect::walk_body(Item_processor processor, bool walk_subquery, uchar *argument) { if (walk_subquery) { for (SELECT_LEX *lex= unit->first_select(); lex; lex= lex->next_select()) { List_iterator<Item> li(lex->item_list); Item *item; ORDER *order; while ((item=li++)) { if (item->walk(processor, walk_subquery, argument)) return true; } if (lex->join_list != NULL && walk_join_condition(lex->join_list, processor, walk_subquery, argument)) return true; if (lex->where && (lex->where)->walk(processor, walk_subquery, argument)) return true; for (order= lex->group_list.first ; order; order= order->next) { if ((*order->item)->walk(processor, walk_subquery, argument)) return true; } if (lex->having && (lex->having)->walk(processor, walk_subquery, argument)) return true; for (order= lex->order_list.first ; order; order= order->next) { if ((*order->item)->walk(processor, walk_subquery, argument)) return true; } } } return (this->*processor)(argument); } bool Item_subselect::walk(Item_processor processor, bool walk_subquery, uchar *argument) { return walk_body(processor, walk_subquery, argument); } /** Mark a subquery unit with information provided A subquery may belong to WHERE, HAVING, ORDER BY or GROUP BY item trees. This "processor" qualifies subqueries by outer clause type. @note For the WHERE clause of the JOIN query this function also associates a related table with the unit. @param arg Explain_subquery_marker structure @retval false @note We always return "false" as far as we don't want to dive deeper because we explain inner subqueries in their joins contexts. */ bool Item_subselect::explain_subquery_checker(uchar **arg) { Explain_subquery_marker *m= *reinterpret_cast<Explain_subquery_marker **>(arg); if (m->type == CTX_WHERE) { /* A subquery in the WHERE clause may be associated with a few JOIN_TABs simultaneously. */ if (unit->explain_marker == CTX_NONE) unit->explain_marker= CTX_WHERE; else DBUG_ASSERT(unit->explain_marker == CTX_WHERE); m->destination->register_where_subquery(unit); return false; } if (m->type == CTX_HAVING && unit->explain_marker == CTX_WHERE) { /* This subquery was in SELECT list of outer subquery transformed with IN->EXISTS, so is referenced by WHERE and HAVING; see Item_in_subselect::single_value_in_to_exists_transformer() */ return false; } if (unit->explain_marker == CTX_NONE) goto overwrite; if (unit->explain_marker == m->type) return false; /* GROUP BY subqueries may be listed in different item trees simultaneously: 1) in GROUP BY items, 2) in ORDER BY items and/or 3) in SELECT list. If such a subquery in the SELECT list, we mark the subquery as if it belongs to SELECT list, otherwise we mark it as "GROUP BY" subquery. ORDER BY subqueries may be listed twice in SELECT list and ORDER BY list. In this case we mark such a subquery as "SELECT list" subquery. */ if (unit->explain_marker == CTX_GROUP_BY_SQ && m->type == CTX_ORDER_BY_SQ) return false; if (unit->explain_marker == CTX_ORDER_BY_SQ && m->type == CTX_GROUP_BY_SQ) goto overwrite; if (unit->explain_marker == CTX_SELECT_LIST && (m->type == CTX_ORDER_BY_SQ || m->type == CTX_GROUP_BY_SQ)) return false; if ((unit->explain_marker == CTX_ORDER_BY_SQ || unit->explain_marker == CTX_GROUP_BY_SQ) && m->type == CTX_SELECT_LIST) goto overwrite; DBUG_ASSERT(!"Unexpected combination of item trees!"); return false; overwrite: unit->explain_marker= m->type; return false; } bool Item_subselect::exec() { DBUG_ENTER("Item_subselect::exec"); /* Do not execute subselect in case of a fatal error or if the query has been killed. */ THD * const thd= unit->thd; if (thd->is_error() || thd->killed) DBUG_RETURN(true); DBUG_ASSERT(!thd->lex->context_analysis_only); /* Simulate a failure in sub-query execution. Used to test e.g. out of memory or query being killed conditions. */ DBUG_EXECUTE_IF("subselect_exec_fail", DBUG_RETURN(true);); /* Disable tracing of subquery execution if 1) this is not the first time the subselect is executed, and 2) REPEATED_SUBSELECT is disabled */ #ifdef OPTIMIZER_TRACE Opt_trace_context * const trace= &thd->opt_trace; const bool disable_trace= traced_before && !trace->feature_enabled(Opt_trace_context::REPEATED_SUBSELECT); Opt_trace_disable_I_S disable_trace_wrapper(trace, disable_trace); traced_before= true; Opt_trace_object trace_wrapper(trace); Opt_trace_object trace_exec(trace, "subselect_execution"); trace_exec.add_select_number(unit->first_select()->select_number); Opt_trace_array trace_steps(trace, "steps"); #endif bool res= engine->exec(); if (engine_changed) { engine_changed= 0; res= exec(); DBUG_RETURN(res); } DBUG_RETURN(res); } /** Fix used tables information for a subquery after query transformations. Common actions for all predicates involving subqueries. Most actions here involve re-resolving information for conditions and items belonging to the subquery. Notice that the usage information from underlying expressions is not propagated to the subquery predicate, as it belongs to inner layers of the query operator structure. However, when underlying expressions contain outer references into a select_lex on this level, the relevant information must be updated when these expressions are resolved. */ void Item_subselect::fix_after_pullout(st_select_lex *parent_select, st_select_lex *removed_select) { /* Clear usage information for this subquery predicate object */ used_tables_cache= 0; /* Go through all query specification objects of the subquery and re-resolve all relevant expressions belonging to them. */ for (SELECT_LEX *sel= unit->first_select(); sel; sel= sel->next_select()) { if (sel->where) sel->where->fix_after_pullout(parent_select, removed_select); if (sel->having) sel->having->fix_after_pullout(parent_select, removed_select); List_iterator<Item> li(sel->item_list); Item *item; while ((item=li++)) item->fix_after_pullout(parent_select, removed_select); /* No need to call fix_after_pullout() for outer-join conditions, as these cannot have outer references. */ /* Re-resolve ORDER BY and GROUP BY fields */ for (ORDER *order= (ORDER*) sel->order_list.first; order; order= order->next) (*order->item)->fix_after_pullout(parent_select, removed_select); for (ORDER *group= (ORDER*) sel->group_list.first; group; group= group->next) (*group->item)->fix_after_pullout(parent_select, removed_select); } } bool Item_in_subselect::walk(Item_processor processor, bool walk_subquery, uchar *argument) { if (left_expr->walk(processor, walk_subquery, argument)) return true; /* Cannot call "Item_subselect::walk(...)" because with gcc 4.1 Item_in_subselect::walk() was incorrectly called instead. Using Item_subselect::walk_body() instead is a workaround. */ return walk_body(processor, walk_subquery, argument); } /* Compute the IN predicate if the left operand's cache changed. */ bool Item_in_subselect::exec() { DBUG_ENTER("Item_in_subselect::exec"); DBUG_ASSERT(exec_method != EXEC_MATERIALIZATION || (exec_method == EXEC_MATERIALIZATION && engine->engine_type() == subselect_engine::HASH_SJ_ENGINE)); /* Initialize the cache of the left predicate operand. This has to be done as late as now, because Cached_item directly contains a resolved field (not an item, and in some cases (when temp tables are created), these fields end up pointing to the wrong field. One solution is to change Cached_item to not resolve its field upon creation, but to resolve it dynamically from a given Item_ref object. Do not init the cache if a previous execution decided that it is not needed. TODO: the cache should be applied conditionally based on: - rules - e.g. only if the left operand is known to be ordered, and/or - on a cost-based basis, that takes into account the cost of a cache lookup, the cache hit rate, and the savings per cache hit. */ if (need_expr_cache && !left_expr_cache && exec_method == EXEC_MATERIALIZATION && init_left_expr_cache()) DBUG_RETURN(TRUE); if (left_expr_cache != NULL) { const int result= test_if_item_cache_changed(*left_expr_cache); if (left_expr_cache_filled && // cache was previously filled result < 0) // new value is identical to previous cached value { /* We needn't do a full execution, can just reuse "value", "was_null", "null_value" of the previous execution. */ DBUG_RETURN(false); } left_expr_cache_filled= true; } null_value= was_null= false; const bool retval= Item_subselect::exec(); DBUG_RETURN(retval); } Item::Type Item_subselect::type() const { return SUBSELECT_ITEM; } void Item_subselect::fix_length_and_dec() { engine->fix_length_and_dec(0); } table_map Item_subselect::used_tables() const { return (table_map) (engine->uncacheable() ? used_tables_cache : 0L); } bool Item_subselect::const_item() const { if (unit->thd->lex->context_analysis_only) return false; /* Not constant until tables are locked. */ if (!unit->thd->lex->is_query_tables_locked()) return false; return const_item_cache; } Item *Item_subselect::get_tmp_table_item(THD *thd_arg) { if (!with_sum_func && !const_item()) return new Item_field(result_field); return copy_or_same(thd_arg); } void Item_subselect::update_used_tables() { if (!engine->uncacheable()) { // did all used tables become static? if (!(used_tables_cache & ~engine->upper_select_const_tables())) const_item_cache= 1; } } void Item_subselect::print(String *str, enum_query_type query_type) { if (engine) { str->append('('); engine->print(str, query_type); str->append(')'); } else str->append("(...)"); } Item_singlerow_subselect::Item_singlerow_subselect(st_select_lex *select_lex) :Item_subselect(), value(0), no_rows(false) { DBUG_ENTER("Item_singlerow_subselect::Item_singlerow_subselect"); init(select_lex, new select_singlerow_subselect(this)); maybe_null= 1; max_columns= UINT_MAX; DBUG_VOID_RETURN; } st_select_lex * Item_singlerow_subselect::invalidate_and_restore_select_lex() { DBUG_ENTER("Item_singlerow_subselect::invalidate_and_restore_select_lex"); st_select_lex *result= unit->first_select(); DBUG_ASSERT(result); /* This code restore the parse tree in it's state before the execution of Item_singlerow_subselect::Item_singlerow_subselect(), and in particular decouples this object from the SELECT_LEX, so that the SELECT_LEX can be used with a different flavor or Item_subselect instead, as part of query rewriting. */ unit->item= NULL; DBUG_RETURN(result); } Item_maxmin_subselect::Item_maxmin_subselect(THD *thd_param, Item_subselect *parent, st_select_lex *select_lex, bool max_arg, bool ignore_nulls) :Item_singlerow_subselect(), was_values(false) { DBUG_ENTER("Item_maxmin_subselect::Item_maxmin_subselect"); max= max_arg; init(select_lex, new select_max_min_finder_subselect(this, max_arg, ignore_nulls)); max_columns= 1; maybe_null= 1; max_columns= 1; /* Following information was collected during performing fix_fields() of Items belonged to subquery, which will be not repeated */ used_tables_cache= parent->get_used_tables_cache(); const_item_cache= parent->get_const_item_cache(); DBUG_VOID_RETURN; } void Item_maxmin_subselect::cleanup() { DBUG_ENTER("Item_maxmin_subselect::cleanup"); Item_singlerow_subselect::cleanup(); was_values= false; DBUG_VOID_RETURN; } void Item_maxmin_subselect::print(String *str, enum_query_type query_type) { str->append(max?"<max>":"<min>", 5); Item_singlerow_subselect::print(str, query_type); } void Item_singlerow_subselect::reset() { null_value= TRUE; if (value) value->null_value= TRUE; } /** @todo - We cant change name of Item_field or Item_ref, because it will prevent it's correct resolving, but we should save name of removed item => we do not make optimization if top item of list is field or reference. - switch off this optimization for prepare statement, because we do not rollback this changes. Make rollback for it, or special name resolving mode in 5.0. */ Item_subselect::trans_res Item_singlerow_subselect::select_transformer(JOIN *join) { DBUG_ENTER("Item_singlerow_subselect::select_transformer"); if (changed) DBUG_RETURN(RES_OK); SELECT_LEX *select_lex= join->select_lex; THD * const thd= unit->thd; Query_arena *arena= thd->stmt_arena; if (!select_lex->master_unit()->is_union() && !select_lex->table_list.elements && select_lex->item_list.elements == 1 && !select_lex->item_list.head()->with_sum_func && /* We cant change name of Item_field or Item_ref, because it will prevent it's correct resolving, but we should save name of removed item => we do not make optimization if top item of list is field or reference. TODO: solve above problem */ !(select_lex->item_list.head()->type() == FIELD_ITEM || select_lex->item_list.head()->type() == REF_ITEM) && !join->conds && !join->having && /* switch off this optimization for prepare statement, because we do not rollback this changes TODO: make rollback for it, or special name resolving mode in 5.0. */ !arena->is_stmt_prepare_or_first_sp_execute() ) { have_to_be_excluded= 1; if (thd->lex->describe) { char warn_buff[MYSQL_ERRMSG_SIZE]; sprintf(warn_buff, ER(ER_SELECT_REDUCED), select_lex->select_number); push_warning(thd, Sql_condition::WARN_LEVEL_NOTE, ER_SELECT_REDUCED, warn_buff); } substitution= select_lex->item_list.head(); /* as far as we moved content to upper level, field which depend of 'upper' select is not really dependent => we remove this dependence */ substitution->walk(&Item::remove_dependence_processor, 0, (uchar *) select_lex->outer_select()); DBUG_RETURN(RES_REDUCE); } DBUG_RETURN(RES_OK); } void Item_singlerow_subselect::store(uint i, Item *item) { row[i]->store(item); row[i]->cache_value(); } enum Item_result Item_singlerow_subselect::result_type() const { return engine->type(); } /* Don't rely on the result type to calculate field type. Ask the engine instead. */ enum_field_types Item_singlerow_subselect::field_type() const { return engine->field_type(); } void Item_singlerow_subselect::fix_length_and_dec() { if ((max_columns= engine->cols()) == 1) { engine->fix_length_and_dec(row= &value); } else { if (!(row= (Item_cache**) sql_alloc(sizeof(Item_cache*)*max_columns))) return; engine->fix_length_and_dec(row); value= *row; } unsigned_flag= value->unsigned_flag; /* If there are not tables in subquery then ability to have NULL value depends on SELECT list (if single row subquery have tables then it always can be NULL if there are not records fetched). */ if (engine->no_tables()) maybe_null= engine->may_be_null(); } void Item_singlerow_subselect::no_rows_in_result() { /* This is only possible if we have a dependent subquery in the SELECT list and an aggregated outer query based on zero rows, which is an illegal query according to the SQL standard. ONLY_FULL_GROUP_BY rejects such queries. */ if (unit->uncacheable & UNCACHEABLE_DEPENDENT) no_rows= true; } uint Item_singlerow_subselect::cols() { return engine->cols(); } bool Item_singlerow_subselect::check_cols(uint c) { if (c != engine->cols()) { my_error(ER_OPERAND_COLUMNS, MYF(0), c); return 1; } return 0; } bool Item_singlerow_subselect::null_inside() { for (uint i= 0; i < max_columns ; i++) { if (row[i]->null_value) return 1; } return 0; } void Item_singlerow_subselect::bring_value() { if (!exec() && assigned()) null_value= 0; else reset(); } double Item_singlerow_subselect::val_real() { DBUG_ASSERT(fixed == 1); if (!no_rows && !exec() && !value->null_value) { null_value= FALSE; return value->val_real(); } else { reset(); return 0; } } longlong Item_singlerow_subselect::val_int() { DBUG_ASSERT(fixed == 1); if (!no_rows && !exec() && !value->null_value) { null_value= FALSE; return value->val_int(); } else { reset(); return 0; } } String *Item_singlerow_subselect::val_str(String *str) { if (!no_rows && !exec() && !value->null_value) { null_value= FALSE; return value->val_str(str); } else { reset(); return 0; } } my_decimal *Item_singlerow_subselect::val_decimal(my_decimal *decimal_value) { if (!no_rows && !exec() && !value->null_value) { null_value= FALSE; return value->val_decimal(decimal_value); } else { reset(); return 0; } } bool Item_singlerow_subselect::get_date(MYSQL_TIME *ltime, uint fuzzydate) { if (!no_rows && !exec() && !value->null_value) { null_value= false; return value->get_date(ltime, fuzzydate); } else { reset(); return true; } } bool Item_singlerow_subselect::get_time(MYSQL_TIME *ltime) { if (!no_rows && !exec() && !value->null_value) { null_value= false; return value->get_time(ltime); } else { reset(); return true; } } bool Item_singlerow_subselect::val_bool() { if (!no_rows && !exec() && !value->null_value) { null_value= FALSE; return value->val_bool(); } else { reset(); return 0; } } Item_exists_subselect::Item_exists_subselect(st_select_lex *select_lex): Item_subselect(), value(FALSE), exec_method(EXEC_UNSPECIFIED), sj_convert_priority(0), embedding_join_nest(NULL) { DBUG_ENTER("Item_exists_subselect::Item_exists_subselect"); init(select_lex, new select_exists_subselect(this)); max_columns= UINT_MAX; null_value= FALSE; //can't be NULL maybe_null= 0; //can't be NULL DBUG_VOID_RETURN; } void Item_exists_subselect::print(String *str, enum_query_type query_type) { str->append(STRING_WITH_LEN("exists")); Item_subselect::print(str, query_type); } bool Item_in_subselect::test_limit(st_select_lex_unit *unit_arg) { if (unit_arg->fake_select_lex && unit_arg->fake_select_lex->test_limit()) return(1); SELECT_LEX *sl= unit_arg->first_select(); for (; sl; sl= sl->next_select()) { if (sl->test_limit()) return(1); } return(0); } Item_in_subselect::Item_in_subselect(Item * left_exp, st_select_lex *select_lex): Item_exists_subselect(), left_expr(left_exp), left_expr_cache(NULL), left_expr_cache_filled(false), need_expr_cache(TRUE), expr(NULL), optimizer(NULL), was_null(FALSE), abort_on_null(FALSE), in2exists_info(NULL), pushed_cond_guards(NULL), upper_item(NULL) { DBUG_ENTER("Item_in_subselect::Item_in_subselect"); init(select_lex, new select_exists_subselect(this)); max_columns= UINT_MAX; maybe_null= 1; reset(); //if test_limit will fail then error will be reported to client test_limit(select_lex->master_unit()); DBUG_VOID_RETURN; } Item_allany_subselect::Item_allany_subselect(Item * left_exp, chooser_compare_func_creator fc, st_select_lex *select_lex, bool all_arg) :Item_in_subselect(), func_creator(fc), all(all_arg) { DBUG_ENTER("Item_allany_subselect::Item_allany_subselect"); left_expr= left_exp; func= func_creator(all_arg); init(select_lex, new select_exists_subselect(this)); max_columns= 1; abort_on_null= 0; reset(); //if test_limit will fail then error will be reported to client test_limit(select_lex->master_unit()); DBUG_VOID_RETURN; } void Item_exists_subselect::fix_length_and_dec() { decimals= 0; max_length= 1; max_columns= engine->cols(); if (exec_method == EXEC_EXISTS) { /* We need only 1 row to determine existence. Note that if the subquery is "SELECT1 UNION SELECT2" then this is not working optimally (Bug#14215895). */ unit->global_parameters->select_limit= new Item_int((int32) 1); } } double Item_exists_subselect::val_real() { DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } return (double) value; } longlong Item_exists_subselect::val_int() { DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } return value; } /** Return the result of EXISTS as a string value Converts the true/false result into a string value. Note that currently this cannot be NULL, so if the query exection fails it will return 0. @param decimal_value[out] buffer to hold the resulting string value @retval Pointer to the converted string. Can't be a NULL pointer, as currently EXISTS cannot return NULL. */ String *Item_exists_subselect::val_str(String *str) { DBUG_ASSERT(fixed == 1); if (exec()) reset(); str->set((ulonglong)value,&my_charset_bin); return str; } /** Return the result of EXISTS as a decimal value Converts the true/false result into a decimal value. Note that currently this cannot be NULL, so if the query exection fails it will return 0. @param decimal_value[out] Buffer to hold the resulting decimal value @retval Pointer to the converted decimal. Can't be a NULL pointer, as currently EXISTS cannot return NULL. */ my_decimal *Item_exists_subselect::val_decimal(my_decimal *decimal_value) { DBUG_ASSERT(fixed == 1); if (exec()) reset(); int2my_decimal(E_DEC_FATAL_ERROR, value, 0, decimal_value); return decimal_value; } bool Item_exists_subselect::val_bool() { DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } return value != 0; } double Item_in_subselect::val_real() { /* As far as Item_in_subselect called only from Item_in_optimizer this method should not be used */ DBUG_ASSERT(0); DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } if (was_null && !value) null_value= TRUE; return (double) value; } longlong Item_in_subselect::val_int() { /* As far as Item_in_subselect called only from Item_in_optimizer this method should not be used */ DBUG_ASSERT(0); DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } if (was_null && !value) null_value= TRUE; return value; } String *Item_in_subselect::val_str(String *str) { /* As far as Item_in_subselect called only from Item_in_optimizer this method should not be used */ DBUG_ASSERT(0); DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } if (was_null && !value) { null_value= TRUE; return 0; } str->set((ulonglong)value, &my_charset_bin); return str; } bool Item_in_subselect::val_bool() { DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } if (was_null && !value) null_value= TRUE; return value; } my_decimal *Item_in_subselect::val_decimal(my_decimal *decimal_value) { /* As far as Item_in_subselect called only from Item_in_optimizer this method should not be used */ DBUG_ASSERT(0); DBUG_ASSERT(fixed == 1); if (exec()) { reset(); return 0; } if (was_null && !value) null_value= TRUE; int2my_decimal(E_DEC_FATAL_ERROR, value, 0, decimal_value); return decimal_value; } /* Rewrite a single-column IN/ALL/ANY subselect SYNOPSIS Item_in_subselect::single_value_transformer() join Join object of the subquery (i.e. 'child' join). func Subquery comparison creator DESCRIPTION Rewrite a single-column subquery using rule-based approach. The subquery oe $cmp$ (SELECT ie FROM ... WHERE subq_where ... HAVING subq_having) First, try to convert the subquery to scalar-result subquery in one of the forms: - oe $cmp$ (SELECT MAX(...) ) // handled by Item_singlerow_subselect - oe $cmp$ <max>(SELECT ...) // handled by Item_maxmin_subselect If that fails, the subquery will be handled with class Item_in_optimizer. There are two possibilites: - If the subquery execution method is materialization, then the subquery is not transformed any further. - Otherwise the IN predicates is transformed into EXISTS by injecting equi-join predicates and possibly other helper predicates. For details see method single_value_in_like_transformer(). RETURN RES_OK Either subquery was transformed, or appopriate predicates where injected into it. RES_REDUCE The subquery was reduced to non-subquery RES_ERROR Error */ Item_subselect::trans_res Item_in_subselect::single_value_transformer(JOIN *join, Comp_creator *func) { SELECT_LEX *select_lex= join->select_lex; bool subquery_maybe_null= false; DBUG_ENTER("Item_in_subselect::single_value_transformer"); /* Check that the right part of the subselect contains no more than one column. E.g. in SELECT 1 IN (SELECT * ..) the right part is (SELECT * ...) */ // psergey: duplicated_subselect_card_check if (select_lex->item_list.elements > 1) { my_error(ER_OPERAND_COLUMNS, MYF(0), 1); DBUG_RETURN(RES_ERROR); } THD * const thd= unit->thd; /* Check the nullability of the subquery. The subquery should return only one column, so we check the nullability of the first item in SELECT_LEX::item_list. In case the subquery is a union, check the nullability of the first item of each SELECT_LEX belonging to the union. */ for (SELECT_LEX* lex= select_lex->master_unit()->first_select(); lex != NULL && lex->master_unit() == select_lex->master_unit(); lex= lex->next_select()) if (lex->item_list.head()->maybe_null) subquery_maybe_null= true; /* If this is an ALL/ANY single-value subquery predicate, try to rewrite it with a MIN/MAX subquery. E.g. SELECT * FROM t1 WHERE b > ANY (SELECT a FROM t2) can be rewritten with SELECT * FROM t1 WHERE b > (SELECT MIN(a) FROM t2). A predicate may be transformed to use a MIN/MAX subquery if it: 1. has a greater than/less than comparison operator, and 2. is not correlated with the outer query, and 3. UNKNOWN results are treated as FALSE, or can never be generated, and */ if (!func->eqne_op() && // 1 !select_lex->master_unit()->uncacheable && // 2 (abort_on_null || (upper_item && upper_item->top_level()) || // 3 (!left_expr->maybe_null && !subquery_maybe_null))) { if (substitution) { // It is second (third, ...) SELECT of UNION => All is done DBUG_RETURN(RES_OK); } Item *subs; if (!select_lex->group_list.elements && !select_lex->having && !select_lex->with_sum_func && !(select_lex->next_select()) && select_lex->table_list.elements && !(substype() == ALL_SUBS && subquery_maybe_null)) { OPT_TRACE_TRANSFORM(&thd->opt_trace, oto0, oto1, select_lex->select_number, "> ALL/ANY (SELECT)", "SELECT(MIN)"); oto1.add("chosen", true); Item_sum_hybrid *item; nesting_map save_allow_sum_func; if (func->l_op()) { /* (ALL && (> || =>)) || (ANY && (< || =<)) for ALL condition is inverted */ item= new Item_sum_max(join->ref_ptrs[0]); } else { /* (ALL && (< || =<)) || (ANY && (> || =>)) for ALL condition is inverted */ item= new Item_sum_min(join->ref_ptrs[0]); } if (upper_item) upper_item->set_sum_test(item); join->ref_ptrs[0]= item; { List_iterator<Item> it(select_lex->item_list); it++; it.replace(item); } DBUG_EXECUTE("where", print_where(item, "rewrite with MIN/MAX", QT_ORDINARY);); if (thd->variables.sql_mode & MODE_ONLY_FULL_GROUP_BY) { /* If the argument is a field, we assume that fix_fields() has tagged the select_lex with non_agg_field_used. We reverse that decision after this rewrite with MIN/MAX. */ if (item->get_arg(0)->type() == Item::FIELD_ITEM) DBUG_ASSERT(select_lex->non_agg_field_used()); select_lex->set_non_agg_field_used(false); } save_allow_sum_func= thd->lex->allow_sum_func; thd->lex->allow_sum_func|= (nesting_map)1 << thd->lex->current_select->nest_level; /* Item_sum_(max|min) can't substitute other item => we can use 0 as reference, also Item_sum_(max|min) can't be fixed after creation, so we do not check item->fixed */ if (item->fix_fields(thd, 0)) DBUG_RETURN(RES_ERROR); thd->lex->allow_sum_func= save_allow_sum_func; /* we added aggregate function => we have to change statistic */ count_field_types(select_lex, &join->tmp_table_param, join->all_fields, 0); subs= new Item_singlerow_subselect(select_lex); } else { OPT_TRACE_TRANSFORM(&thd->opt_trace, oto0, oto1, select_lex->select_number, "> ALL/ANY (SELECT)", "MIN (SELECT)"); oto1.add("chosen", true); Item_maxmin_subselect *item; subs= item= new Item_maxmin_subselect(thd, this, select_lex, func->l_op(), substype()==ANY_SUBS); if (upper_item) upper_item->set_sub_test(item); } if (upper_item) upper_item->set_subselect(this); /* fix fields is already called for left expression. Note that real_item() should be used for all the runtime created Ref items instead of original left expression because these items would be deleted at the end of the statement. Thus one of 'substitution' arguments can be broken in case of PS. @todo Why do we use real_item()/substitutional_item() instead of the plain left_expr? Because left_expr might be a rollbackable item, and we fail to properly rollback all copies of left_expr at end of execution, so we want to avoid creating copies of left_expr as much as possible, so we use real_item() instead. Doing a proper rollback is difficult: the change was registered for the original item which was the left argument of IN. Then this item was copied to left_expr, which is copied below to substitution->args[0]. To do a proper rollback, we would have to restore the content of both copies as well as the original item. There might be more copies, if AND items have been constructed. The same applies to the right expression. However, using real_item()/substitutional_item() brings its own problems: for example, we lose information that the item is an outer reference; the item can thus wrongly be considered for a Keyuse (causing bug#17766653). When WL#6570 removes the "rolling back" system, all real_item()/substitutional_item() in this file should be removed. */ substitution= func->create(left_expr->substitutional_item(), subs); DBUG_RETURN(RES_OK); } if (!substitution) { /* We're invoked for the 1st (or the only) SELECT in the subquery UNION */ SELECT_LEX_UNIT *master_unit= select_lex->master_unit(); substitution= optimizer; SELECT_LEX *current= thd->lex->current_select; thd->lex->current_select= current->outer_select(); //optimizer never use Item **ref => we can pass 0 as parameter if (!optimizer || optimizer->fix_left(thd, 0)) { thd->lex->current_select= current; DBUG_RETURN(RES_ERROR); } thd->lex->current_select= current; /* We will refer to upper level cache array => we have to save it for SP */ optimizer->keep_top_level_cache(); /* As far as Item_ref_in_optimizer do not substitute itself on fix_fields we can use same item for all selects. */ Item_ref *const left= new Item_direct_ref(&select_lex->context, (Item**)optimizer->get_cache(), (char *)"<no matter>", (char *)in_left_expr_name); if (left == NULL) DBUG_RETURN(RES_ERROR); // Make the left expression "outer" relative to the subquery if (!left_expr->const_item()) left->depended_from= select_lex->outer_select(); expr= left; DBUG_ASSERT(in2exists_info == NULL); in2exists_info= new In2exists_info; in2exists_info->originally_dependent= master_unit->uncacheable & UNCACHEABLE_DEPENDENT; master_unit->uncacheable|= UNCACHEABLE_DEPENDENT; } if (!abort_on_null && left_expr->maybe_null && !pushed_cond_guards) { if (!(pushed_cond_guards= (bool*)join->thd->alloc(sizeof(bool)))) DBUG_RETURN(RES_ERROR); pushed_cond_guards[0]= TRUE; } /* Perform the IN=>EXISTS transformation. */ const trans_res retval= single_value_in_to_exists_transformer(join, func); DBUG_RETURN(retval); } /** Transofrm an IN predicate into EXISTS via predicate injection. @details The transformation injects additional predicates into the subquery (and makes the subquery correlated) as follows. - If the subquery has aggregates, GROUP BY, or HAVING, convert to SELECT ie FROM ... HAVING subq_having AND trigcond(oe $cmp$ ref_or_null_helper<ie>) the addition is wrapped into trigger only when we want to distinguish between NULL and FALSE results. - Otherwise (no aggregates/GROUP BY/HAVING) convert it to one of the following: = If we don't need to distinguish between NULL and FALSE subquery: SELECT 1 FROM ... WHERE (oe $cmp$ ie) AND subq_where = If we need to distinguish between those: SELECT 1 FROM ... WHERE subq_where AND trigcond((oe $cmp$ ie) OR (ie IS NULL)) HAVING trigcond(<is_not_null_test>(ie)) At JOIN::optimize() we will compare costs of materialization and EXISTS; if the former is cheaper we will switch to it. @param join Join object of the subquery (i.e. 'child' join). @param func Subquery comparison creator @retval RES_OK Either subquery was transformed, or appopriate predicates where injected into it. @retval RES_REDUCE The subquery was reduced to non-subquery @retval RES_ERROR Error */ Item_subselect::trans_res Item_in_subselect::single_value_in_to_exists_transformer(JOIN * join, Comp_creator *func) { SELECT_LEX *select_lex= join->select_lex; THD * const thd= unit->thd; DBUG_ENTER("Item_in_subselect::single_value_in_to_exists_transformer"); OPT_TRACE_TRANSFORM(&thd->opt_trace, oto0, oto1, select_lex->select_number, "IN (SELECT)", "EXISTS (CORRELATED SELECT)"); oto1.add("chosen", true); select_lex->uncacheable|= UNCACHEABLE_DEPENDENT; in2exists_info->added_to_where= false; if (join->having || select_lex->with_sum_func || select_lex->group_list.elements) { bool tmp; Item_bool_func *item= func->create(expr, new Item_ref_null_helper(&select_lex->context, this, &join->ref_ptrs[0], (char *)"<ref>", this->full_name())); item->set_created_by_in2exists(); if (!abort_on_null && left_expr->maybe_null) { /* We can encounter "NULL IN (SELECT ...)". Wrap the added condition within a trig_cond. */ item= new Item_func_trig_cond(item, get_cond_guard(0), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL); item->set_created_by_in2exists(); } /* AND and comparison functions can't be changed during fix_fields() we can assign select_lex->having here, and pass 0 as last argument (reference) to fix_fields() */ select_lex->having= join->having= and_items(join->having, item); if (join->having == item) item->item_name.set(in_having_cond); select_lex->having->top_level_item(); select_lex->having_fix_field= 1; /* we do not check join->having->fixed, because Item_and (from and_items) or comparison function (from func->create) can't be fixed after creation */ Opt_trace_array having_trace(&thd->opt_trace, "evaluating_constant_having_conditions"); tmp= join->having->fix_fields(thd, 0); select_lex->having_fix_field= 0; if (tmp) DBUG_RETURN(RES_ERROR); } else { /* Grep for "WL#6570" to see the relevant comment about real_item. */ Item *orig_item= select_lex->item_list.head()->real_item(); if (select_lex->table_list.elements) { bool tmp; Item_bool_func *item= func->create(expr, orig_item); /* We may soon add a 'OR inner IS NULL' to 'item', but that may later be removed if 'inner' is not nullable, so the in2exists mark must be on 'item' too. Not only on the OR node. */ item->set_created_by_in2exists(); if (!abort_on_null && orig_item->maybe_null) { Item_bool_func *having= new Item_is_not_null_test(this, orig_item); having->set_created_by_in2exists(); if (left_expr->maybe_null) { if (!(having= new Item_func_trig_cond(having, get_cond_guard(0), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL))) DBUG_RETURN(RES_ERROR); having->set_created_by_in2exists(); } /* Item_is_not_null_test can't be changed during fix_fields() we can assign select_lex->having here, and pass 0 as last argument (reference) to fix_fields() */ having->item_name.set(in_having_cond); select_lex->having= join->having= having; select_lex->having_fix_field= 1; /* we do not check join->having->fixed, because Item_and (from and_items) or comparison function (from func->create) can't be fixed after creation */ Opt_trace_array having_trace(&thd->opt_trace, "evaluating_constant_having_conditions"); tmp= join->having->fix_fields(thd, 0); select_lex->having_fix_field= 0; if (tmp) DBUG_RETURN(RES_ERROR); item= new Item_cond_or(item, new Item_func_isnull(orig_item)); item->set_created_by_in2exists(); } /* If we may encounter NULL IN (SELECT ...) and care whether subquery result is NULL or FALSE, wrap condition in a trig_cond. */ if (!abort_on_null && left_expr->maybe_null) { if (!(item= new Item_func_trig_cond(item, get_cond_guard(0), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL))) DBUG_RETURN(RES_ERROR); item->set_created_by_in2exists(); } /* The following is intentionally not done in row_value_transformer(), see comment of JOIN::remove_subq_pushed_predicates(). */ item->item_name.set(in_additional_cond); /* AND can't be changed during fix_fields() we can assign select_lex->having here, and pass 0 as last argument (reference) to fix_fields() */ select_lex->where= join->conds= and_items(join->conds, item); select_lex->where->top_level_item(); in2exists_info->added_to_where= true; /* we do not check join->conds->fixed, because Item_and can't be fixed after creation */ Opt_trace_array where_trace(&thd->opt_trace, "evaluating_constant_where_conditions"); if (join->conds->fix_fields(thd, 0)) DBUG_RETURN(RES_ERROR); } else { bool tmp; if (select_lex->master_unit()->is_union()) { /* comparison functions can't be changed during fix_fields() we can assign select_lex->having here, and pass 0 as last argument (reference) to fix_fields() */ Item_bool_func *new_having= func->create(expr, new Item_ref_null_helper(&select_lex->context, this, &join->ref_ptrs[0], (char *)"<no matter>", (char *)"<result>")); new_having->set_created_by_in2exists(); if (!abort_on_null && left_expr->maybe_null) { if (!(new_having= new Item_func_trig_cond(new_having, get_cond_guard(0), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL))) DBUG_RETURN(RES_ERROR); new_having->set_created_by_in2exists(); } new_having->item_name.set(in_having_cond); select_lex->having= join->having= new_having; select_lex->having_fix_field= 1; /* we do not check join->having->fixed, because comparison function (from func->create) can't be fixed after creation */ Opt_trace_array having_trace(&thd->opt_trace, "evaluating_constant_having_conditions"); tmp= join->having->fix_fields(thd, 0); select_lex->having_fix_field= 0; if (tmp) DBUG_RETURN(RES_ERROR); } else { // it is single select without tables => possible optimization // remove the dependence mark since the item is moved to upper // select and is not outer anymore. orig_item->walk(&Item::remove_dependence_processor, 0, (uchar *) select_lex->outer_select()); /* fix_field of substitution item will be done in time of substituting. Note that real_item() should be used for all the runtime created Ref items instead of original left expression because these items would be deleted at the end of the statement. Thus one of 'substitution' arguments can be broken in case of PS. */ substitution= func->create(left_expr->substitutional_item(), orig_item); have_to_be_excluded= 1; if (thd->lex->describe) { char warn_buff[MYSQL_ERRMSG_SIZE]; sprintf(warn_buff, ER(ER_SELECT_REDUCED), select_lex->select_number); push_warning(thd, Sql_condition::WARN_LEVEL_NOTE, ER_SELECT_REDUCED, warn_buff); } DBUG_RETURN(RES_REDUCE); } } } join->having_for_explain= join->having; DBUG_RETURN(RES_OK); } Item_subselect::trans_res Item_in_subselect::row_value_transformer(JOIN *join) { SELECT_LEX *select_lex= join->select_lex; uint cols_num= left_expr->cols(); DBUG_ENTER("Item_in_subselect::row_value_transformer"); // psergey: duplicated_subselect_card_check if (select_lex->item_list.elements != left_expr->cols()) { my_error(ER_OPERAND_COLUMNS, MYF(0), left_expr->cols()); DBUG_RETURN(RES_ERROR); } /* Wrap the current IN predicate in an Item_in_optimizer. The actual substitution in the Item tree takes place in Item_subselect::fix_fields. */ if (!substitution) { //first call for this unit SELECT_LEX_UNIT *master_unit= select_lex->master_unit(); substitution= optimizer; THD * const thd= unit->thd; SELECT_LEX *current= thd->lex->current_select; thd->lex->current_select= current->outer_select(); //optimizer never use Item **ref => we can pass 0 as parameter if (!optimizer || optimizer->fix_left(thd, 0)) { thd->lex->current_select= current; DBUG_RETURN(RES_ERROR); } // we will refer to upper level cache array => we have to save it in PS optimizer->keep_top_level_cache(); thd->lex->current_select= current; DBUG_ASSERT(in2exists_info == NULL); in2exists_info= new In2exists_info; in2exists_info->originally_dependent= master_unit->uncacheable & UNCACHEABLE_DEPENDENT; master_unit->uncacheable|= UNCACHEABLE_DEPENDENT; if (!abort_on_null && left_expr->maybe_null && !pushed_cond_guards) { if (!(pushed_cond_guards= (bool*)join->thd->alloc(sizeof(bool) * left_expr->cols()))) DBUG_RETURN(RES_ERROR); for (uint i= 0; i < cols_num; i++) pushed_cond_guards[i]= TRUE; } } /* Perform the IN=>EXISTS transformation. */ DBUG_RETURN(row_value_in_to_exists_transformer(join)); } /** Tranform a (possibly non-correlated) IN subquery into a correlated EXISTS. @todo The IF-ELSE below can be refactored so that there is no duplication of the statements that create the new conditions. For this we have to invert the IF and the FOR statements as this: for (each left operand) create the equi-join condition if (is_having_used || !abort_on_null) create the "is null" and is_not_null_test items if (is_having_used) add the equi-join and the null tests to HAVING else add the equi-join and the "is null" to WHERE add the is_not_null_test to HAVING */ Item_subselect::trans_res Item_in_subselect::row_value_in_to_exists_transformer(JOIN * join) { SELECT_LEX *select_lex= join->select_lex; THD * const thd= unit->thd; Item *having_item= 0; uint cols_num= left_expr->cols(); bool is_having_used= (join->having || select_lex->with_sum_func || select_lex->group_list.first || !select_lex->table_list.elements); DBUG_ENTER("Item_in_subselect::row_value_in_to_exists_transformer"); OPT_TRACE_TRANSFORM(&thd->opt_trace, oto0, oto1, select_lex->select_number, "IN (SELECT)", "EXISTS (CORRELATED SELECT)"); oto1.add("chosen", true); select_lex->uncacheable|= UNCACHEABLE_DEPENDENT; in2exists_info->added_to_where= false; if (is_having_used) { /* (l1, l2, l3) IN (SELECT v1, v2, v3 ... HAVING having) => EXISTS (SELECT ... HAVING having and (l1 = v1 or is null v1) and (l2 = v2 or is null v2) and (l3 = v3 or is null v3) and is_not_null_test(v1) and is_not_null_test(v2) and is_not_null_test(v3)) where is_not_null_test used to register nulls in case if we have not found matching to return correct NULL value TODO: say here explicitly if the order of AND parts matters or not. */ Item *item_having_part2= 0; for (uint i= 0; i < cols_num; i++) { Item *item_i= join->ref_ptrs[i]; Item **pitem_i= &join->ref_ptrs[i]; DBUG_ASSERT((left_expr->fixed && item_i->fixed) || (item_i->type() == REF_ITEM && ((Item_ref*)(item_i))->ref_type() == Item_ref::OUTER_REF)); if (item_i-> check_cols(left_expr->element_index(i)->cols())) DBUG_RETURN(RES_ERROR); Item_bool_func *item_eq= new Item_func_eq(new Item_ref(&select_lex->context, (*optimizer->get_cache())-> addr(i), (char *)"<no matter>", (char *)in_left_expr_name), new Item_ref(&select_lex->context, pitem_i, (char *)"<no matter>", (char *)"<list ref>") ); item_eq->set_created_by_in2exists(); Item_bool_func *item_isnull= new Item_func_isnull(new Item_ref(&select_lex->context, pitem_i, (char *)"<no matter>", (char *)"<list ref>") ); item_isnull->set_created_by_in2exists(); Item_bool_func *col_item= new Item_cond_or(item_eq, item_isnull); col_item->set_created_by_in2exists(); if (!abort_on_null && left_expr->element_index(i)->maybe_null) { if (!(col_item= new Item_func_trig_cond(col_item, get_cond_guard(i), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL))) DBUG_RETURN(RES_ERROR); col_item->set_created_by_in2exists(); } having_item= and_items(having_item, col_item); Item_bool_func *item_nnull_test= new Item_is_not_null_test(this, new Item_ref(&select_lex->context, pitem_i, (char *)"<no matter>", (char *)"<list ref>")); item_nnull_test->set_created_by_in2exists(); if (!abort_on_null && left_expr->element_index(i)->maybe_null) { if (!(item_nnull_test= new Item_func_trig_cond(item_nnull_test, get_cond_guard(i), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL))) DBUG_RETURN(RES_ERROR); item_nnull_test->set_created_by_in2exists(); } item_having_part2= and_items(item_having_part2, item_nnull_test); item_having_part2->top_level_item(); } having_item= and_items(having_item, item_having_part2); having_item->top_level_item(); } else { /* (l1, l2, l3) IN (SELECT v1, v2, v3 ... WHERE where) => EXISTS (SELECT ... WHERE where and (l1 = v1 or is null v1) and (l2 = v2 or is null v2) and (l3 = v3 or is null v3) HAVING is_not_null_test(v1) and is_not_null_test(v2) and is_not_null_test(v3)) where is_not_null_test register NULLs values but reject rows in case when we do not need correct NULL, we have simplier construction: EXISTS (SELECT ... WHERE where and (l1 = v1) and (l2 = v2) and (l3 = v3) */ Item *where_item= 0; for (uint i= 0; i < cols_num; i++) { Item *item_i= join->ref_ptrs[i]; Item **pitem_i= &join->ref_ptrs[i]; DBUG_ASSERT((left_expr->fixed && item_i->fixed) || (item_i->type() == REF_ITEM && ((Item_ref*)(item_i))->ref_type() == Item_ref::OUTER_REF)); if (item_i->check_cols(left_expr->element_index(i)->cols())) DBUG_RETURN(RES_ERROR); Item_ref *const left= new Item_direct_ref(&select_lex->context, (*optimizer->get_cache())->addr(i), (char *)"<no matter>", (char *)in_left_expr_name); if (left == NULL) DBUG_RETURN(RES_ERROR); // Make the left expression "outer" relative to the subquery if (!left_expr->element_index(i)->const_item()) left->depended_from= select_lex->outer_select(); Item_bool_func *item= new Item_func_eq(left, new Item_direct_ref(&select_lex->context, pitem_i, (char *)"<no matter>", (char *)"<list ref>") ); item->set_created_by_in2exists(); if (!abort_on_null) { Item_bool_func *having_col_item= new Item_is_not_null_test(this, new Item_ref(&select_lex->context, pitem_i, (char *)"<no matter>", (char *)"<list ref>")); having_col_item->set_created_by_in2exists(); Item_bool_func *item_isnull= new Item_func_isnull(new Item_direct_ref(&select_lex->context, pitem_i, (char *)"<no matter>", (char *)"<list ref>") ); item_isnull->set_created_by_in2exists(); item= new Item_cond_or(item, item_isnull); item->set_created_by_in2exists(); /* TODO: why we create the above for cases where the right part cant be NULL? */ if (left_expr->element_index(i)->maybe_null) { if (!(item= new Item_func_trig_cond(item, get_cond_guard(i), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL))) DBUG_RETURN(RES_ERROR); item->set_created_by_in2exists(); if (!(having_col_item= new Item_func_trig_cond(having_col_item, get_cond_guard(i), NULL, Item_func_trig_cond:: OUTER_FIELD_IS_NOT_NULL))) DBUG_RETURN(RES_ERROR); having_col_item->set_created_by_in2exists(); } having_item= and_items(having_item, having_col_item); } where_item= and_items(where_item, item); } /* AND can't be changed during fix_fields() we can assign select_lex->where here, and pass 0 as last argument (reference) to fix_fields() */ select_lex->where= join->conds= and_items(join->conds, where_item); select_lex->where->top_level_item(); in2exists_info->added_to_where= true; Opt_trace_array where_trace(&thd->opt_trace, "evaluating_constant_where_conditions"); if (join->conds->fix_fields(thd, 0)) DBUG_RETURN(RES_ERROR); } if (having_item) { bool res; select_lex->having= join->having= join->having_for_explain= and_items(join->having, having_item); if (having_item == select_lex->having) having_item->item_name.set(in_having_cond); select_lex->having->top_level_item(); /* AND can't be changed during fix_fields() we can assign select_lex->having here, and pass 0 as last argument (reference) to fix_fields() */ select_lex->having_fix_field= 1; Opt_trace_array having_trace(&thd->opt_trace, "evaluating_constant_having_conditions"); res= join->having->fix_fields(thd, 0); select_lex->having_fix_field= 0; if (res) { DBUG_RETURN(RES_ERROR); } } DBUG_RETURN(RES_OK); } Item_subselect::trans_res Item_in_subselect::select_transformer(JOIN *join) { return select_in_like_transformer(join, &eq_creator); } /** Prepare IN/ALL/ANY/SOME subquery transformation and call appropriate transformation function. To decide which transformation procedure (scalar or row) applicable here we have to call fix_fields() for left expression to be able to call cols() method on it. Also this method make arena management for underlying transformation methods. @param join JOIN object of transforming subquery @param func creator of condition function of subquery @retval RES_OK OK @retval RES_REDUCE OK, and current subquery was reduced during transformation @retval RES_ERROR Error */ Item_subselect::trans_res Item_in_subselect::select_in_like_transformer(JOIN *join, Comp_creator *func) { THD * const thd= unit->thd; SELECT_LEX *current= thd->lex->current_select; const char *save_where= thd->where; Item_subselect::trans_res res= RES_ERROR; bool result; DBUG_ENTER("Item_in_subselect::select_in_like_transformer"); #ifndef DBUG_OFF { /* IN/SOME/ALL/ANY subqueries don't support LIMIT clause. Without it, ORDER BY becomes meaningless and should already have been removed in resolve_subquery() */ SELECT_LEX *sl= current->master_unit()->first_select(); for (; sl; sl= sl->next_select()) if (sl->join) DBUG_ASSERT(!sl->join->order || sl->join->order.src == ESC_GROUP_BY); } #endif if (changed) DBUG_RETURN(RES_OK); thd->where= "IN/ALL/ANY subquery"; /* In some optimisation cases we will not need this Item_in_optimizer object, but we can't know it here, but here we need address correct reference on left expresion. //psergey: he means confluent cases like "... IN (SELECT 1)" */ if (!optimizer) { Prepared_stmt_arena_holder ps_arena_holder(thd); optimizer= new Item_in_optimizer(left_expr, this); if (!optimizer) goto err; } thd->lex->current_select= current->outer_select(); result= (!left_expr->fixed && left_expr->fix_fields(thd, optimizer->arguments())); /* fix_fields can change reference to left_expr, we need reassign it */ left_expr= optimizer->arguments()[0]; thd->lex->current_select= current; if (result) goto err; /* If we didn't choose an execution method up to this point, we choose the IN=>EXISTS transformation, at least temporarily. */ if (exec_method == EXEC_UNSPECIFIED) exec_method= EXEC_EXISTS_OR_MAT; /* Both transformers call fix_fields() only for Items created inside them, and all those items do not make permanent changes in the current item arena which allows us to call them with changed arena (if we do not know the nature of Item, we have to call fix_fields() for it only with the original arena to avoid memory leak). */ { Prepared_stmt_arena_holder ps_arena_holder(thd); if (left_expr->cols() == 1) res= single_value_transformer(join, func); else { /* we do not support row operation for ALL/ANY/SOME */ if (func != &eq_creator) { my_error(ER_OPERAND_COLUMNS, MYF(0), 1); DBUG_RETURN(RES_ERROR); } res= row_value_transformer(join); } } err: thd->where= save_where; DBUG_RETURN(res); } void Item_in_subselect::print(String *str, enum_query_type query_type) { if (exec_method == EXEC_EXISTS_OR_MAT || exec_method == EXEC_EXISTS) str->append(STRING_WITH_LEN("<exists>")); else { left_expr->print(str, query_type); str->append(STRING_WITH_LEN(" in ")); } Item_subselect::print(str, query_type); } bool Item_in_subselect::fix_fields(THD *thd_arg, Item **ref) { bool result = 0; if (exec_method == EXEC_SEMI_JOIN) return !( (*ref)= new Item_int(1)); if ((thd_arg->lex->context_analysis_only & CONTEXT_ANALYSIS_ONLY_VIEW) && left_expr && !left_expr->fixed) result = left_expr->fix_fields(thd_arg, &left_expr); return result || Item_subselect::fix_fields(thd_arg, ref); } void Item_in_subselect::fix_after_pullout(st_select_lex *parent_select, st_select_lex *removed_select) { Item_subselect::fix_after_pullout(parent_select, removed_select); left_expr->fix_after_pullout(parent_select, removed_select); used_tables_cache|= left_expr->used_tables(); } /** Initialize the cache of the left operand of the IN predicate. @note This method has the same purpose as alloc_group_fields(), but it takes a different kind of collection of items, and the list we push to is dynamically allocated. @retval TRUE if a memory allocation error occurred @retval FALSE if success */ bool Item_in_subselect::init_left_expr_cache() { JOIN *outer_join; Next_select_func end_select; bool use_result_field= FALSE; outer_join= unit->outer_select()->join; /* An IN predicate might be evaluated in a query for which all tables have been optimzied away. */ if (!outer_join || !outer_join->tables || !outer_join->tables_list) { need_expr_cache= FALSE; return FALSE; } /* If we use end_[send | write]_group to handle complete rows of the outer query, make the cache of the left IN operand use Item_field::result_field instead of Item_field::field. We need this because normally Cached_item_field uses Item::field to fetch field data, while copy_ref_key() that copies the left IN operand into a lookup key uses Item::result_field. In the case end_[send | write]_group result_field is one row behind field. */ end_select= outer_join->join_tab[outer_join->primary_tables-1].next_select; if (end_select == end_send_group || end_select == end_write_group) use_result_field= TRUE; if (!(left_expr_cache= new List<Cached_item>)) return TRUE; for (uint i= 0; i < left_expr->cols(); i++) { Cached_item *cur_item_cache= new_Cached_item(unit->thd, left_expr->element_index(i), use_result_field); if (!cur_item_cache || left_expr_cache->push_front(cur_item_cache)) return TRUE; } return FALSE; } /** Tells an Item that it is in the condition of a JOIN_TAB @param 'join_tab_index' index of JOIN_TAB in JOIN's array The Item records this fact and can deduce from it the estimated number of times that it will be evaluated. */ bool Item_subselect::inform_item_in_cond_of_tab(uchar *join_tab_index) { in_cond_of_tab= *reinterpret_cast<int *>(join_tab_index); return false; } /** Clean up after removing the subquery from the item tree. Call st_select_lex_unit::exclude_tree() to unlink it from its master and to unlink direct st_select_lex children from all_selects_list. Don't unlink subqueries that are not descendants of the starting point (root) of the removal and cleanup. */ bool Item_subselect::clean_up_after_removal(uchar *arg) { st_select_lex *root= static_cast<st_select_lex*>(static_cast<void*>(arg)); st_select_lex *sl= unit->outer_select(); /* While traversing the item tree with Item::walk(), Item_refs may point to Item_subselects at different positions in the query. We should only exclude units that are descendants of the starting point for the walk. Traverse the tree towards the root. Afterwards, we have: 1) sl == root: unit is a descendant of the starting point, or 2) sl == NULL: unit is not a descendant of the starting point */ while (sl != root && sl != NULL) sl= sl->outer_select(); if (sl == root) unit->exclude_tree(); return false; } Item_subselect::trans_res Item_allany_subselect::select_transformer(JOIN *join) { DBUG_ENTER("Item_allany_subselect::select_transformer"); if (upper_item) upper_item->show= 1; trans_res retval= select_in_like_transformer(join, func); DBUG_RETURN(retval); } void Item_allany_subselect::print(String *str, enum_query_type query_type) { if (exec_method == EXEC_EXISTS_OR_MAT || exec_method == EXEC_EXISTS) str->append(STRING_WITH_LEN("<exists>")); else { left_expr->print(str, query_type); str->append(' '); str->append(func->symbol(all)); str->append(all ? " all " : " any ", 5); } Item_subselect::print(str, query_type); } void subselect_engine::set_thd_for_result() { /* select_result's constructor sets neither select_result::thd nor select_result::unit. */ if (result) result->set_thd(item->unit->thd); } subselect_single_select_engine:: subselect_single_select_engine(st_select_lex *select, select_result_interceptor *result_arg, Item_subselect *item_arg) :subselect_engine(item_arg, result_arg), prepared(0), executed(0), optimize_error(0), select_lex(select), join(0) { select_lex->master_unit()->item= item_arg; } void subselect_single_select_engine::cleanup() { DBUG_ENTER("subselect_single_select_engine::cleanup"); prepared= executed= optimize_error= false; join= 0; result->cleanup(); DBUG_VOID_RETURN; } void subselect_union_engine::cleanup() { DBUG_ENTER("subselect_union_engine::cleanup"); result->cleanup(); DBUG_VOID_RETURN; } bool subselect_union_engine::is_executed() const { return unit->executed; } subselect_union_engine::subselect_union_engine(st_select_lex_unit *u, select_result_interceptor *result_arg, Item_subselect *item_arg) :subselect_engine(item_arg, result_arg) { unit= u; unit->item= item_arg; } /** Create and prepare the JOIN object that represents the query execution plan for the subquery. @detail This method is called from Item_subselect::fix_fields. For prepared statements it is called both during the PREPARE and EXECUTE phases in the following ways: - During PREPARE the optimizer needs some properties (join->fields_list.elements) of the JOIN to proceed with preparation of the remaining query (namely to complete ::fix_fields for the subselect related classes. In the end of PREPARE the JOIN is deleted. - When we EXECUTE the query, Item_subselect::fix_fields is called again, and the JOIN object is re-created again, prepared and executed. In the end of execution it is deleted. In all cases the JOIN is created in runtime memory (not in the permanent memory root). @todo Re-check what properties of 'join' are needed during prepare, and see if we can avoid creating a JOIN during JOIN::prepare of the outer join. @retval 0 if success @retval 1 if error */ bool subselect_single_select_engine::prepare() { if (prepared) return 0; THD * const thd= item->unit->thd; join= new JOIN(thd, select_lex->item_list, select_lex->options | SELECT_NO_UNLOCK, result); if (!join || !result) return 1; /* Fatal error is set already. */ prepared= 1; SELECT_LEX *save_select= thd->lex->current_select; thd->lex->current_select= select_lex; if (join->prepare(select_lex->table_list.first, select_lex->with_wild, select_lex->where, select_lex->order_list.elements + select_lex->group_list.elements, select_lex->order_list.first, select_lex->group_list.first, select_lex->having, select_lex, select_lex->master_unit())) return 1; thd->lex->current_select= save_select; return 0; } bool subselect_union_engine::prepare() { THD * const thd= unit->thd; // We can access THD as above, or via 'item', verify equality: DBUG_ASSERT(thd == item->unit->thd); return unit->prepare(thd, result, SELECT_NO_UNLOCK); } bool subselect_indexsubquery_engine::prepare() { /* Should never be called. */ DBUG_ASSERT(FALSE); return 1; } /* makes storage for the output values for the subquery and calcuates their data and column types and their nullability. */ void subselect_engine::set_row(List<Item> &item_list, Item_cache **row) { Item *sel_item; List_iterator_fast<Item> li(item_list); res_type= STRING_RESULT; res_field_type= MYSQL_TYPE_VAR_STRING; for (uint i= 0; (sel_item= li++); i++) { item->max_length= sel_item->max_length; res_type= sel_item->result_type(); res_field_type= sel_item->field_type(); item->decimals= sel_item->decimals; item->unsigned_flag= sel_item->unsigned_flag; maybe_null= sel_item->maybe_null; if (!(row[i]= Item_cache::get_cache(sel_item))) return; row[i]->setup(sel_item); row[i]->store(sel_item); } if (item_list.elements > 1) res_type= ROW_RESULT; } void subselect_single_select_engine::fix_length_and_dec(Item_cache **row) { DBUG_ASSERT(row || select_lex->item_list.elements==1); set_row(select_lex->item_list, row); item->collation.set(row[0]->collation); if (cols() != 1) maybe_null= 0; } void subselect_union_engine::fix_length_and_dec(Item_cache **row) { DBUG_ASSERT(row || unit->first_select()->item_list.elements==1); if (unit->first_select()->item_list.elements == 1) { set_row(unit->types, row); item->collation.set(row[0]->collation); } else { bool maybe_null_saved= maybe_null; set_row(unit->types, row); maybe_null= maybe_null_saved; } } void subselect_indexsubquery_engine::fix_length_and_dec(Item_cache **row) { //this never should be called DBUG_ASSERT(0); } int read_first_record_seq(JOIN_TAB *tab); int rr_sequential(READ_RECORD *info); bool subselect_single_select_engine::exec() { DBUG_ENTER("subselect_single_select_engine::exec"); if (optimize_error) DBUG_RETURN(true); int rc= 0; THD * const thd= item->unit->thd; char const *save_where= thd->where; SELECT_LEX *save_select= thd->lex->current_select; thd->lex->current_select= select_lex; if (!join->optimized) { SELECT_LEX_UNIT *unit= select_lex->master_unit(); unit->set_limit(unit->global_parameters); DBUG_EXECUTE_IF("bug11747970_simulate_error", DBUG_SET("+d,bug11747970_raise_error");); if (join->optimize()) { optimize_error= true; rc= 1; goto exit; } if (item->engine_changed) { rc= 1; goto exit; } } if (select_lex->uncacheable && select_lex->uncacheable != UNCACHEABLE_EXPLAIN && executed) { join->reset(); item->reset(); item->assigned((executed= 0)); } if (!executed) { item->reset_value_registration(); JOIN_TAB *changed_tabs[MAX_TABLES]; JOIN_TAB **last_changed_tab= changed_tabs; if (item->have_guarded_conds()) { /* For at least one of the pushed predicates the following is true: We should not apply optimizations based on the condition that was pushed down into the subquery. Those optimizations are ref[_or_null] acceses. Change them to be full table scans. */ for (uint i= join->const_tables; i < join->primary_tables; i++) { JOIN_TAB *tab=join->join_tab+i; if (tab && tab->keyuse) { for (uint i= 0; i < tab->ref.key_parts; i++) { bool *cond_guard= tab->ref.cond_guards[i]; if (cond_guard && !*cond_guard) { /* Can't use BKA if switching from ref to "full scan on NULL key" @see Item_in_optimizer::val_int() @see TABLE_REF::cond_guards @see push_index_cond() @see setup_join_buffering() */ DBUG_ASSERT(tab->use_join_cache != JOIN_CACHE::ALG_BKA); DBUG_ASSERT(tab->use_join_cache != JOIN_CACHE::ALG_BKA_UNIQUE); /* Change the access method to full table scan */ tab->save_read_first_record= tab->read_first_record; tab->save_read_record= tab->read_record.read_record; tab->read_record.read_record= rr_sequential; tab->read_first_record= read_first_record_seq; tab->read_record.record= tab->table->record[0]; tab->read_record.thd= join->thd; tab->read_record.ref_length= tab->table->file->ref_length; tab->read_record.unlock_row= rr_unlock_row; *(last_changed_tab++)= tab; break; } } } } } join->exec(); /* Enable the optimizations back */ for (JOIN_TAB **ptab= changed_tabs; ptab != last_changed_tab; ptab++) { JOIN_TAB *tab= *ptab; tab->read_record.record= 0; tab->read_record.ref_length= 0; tab->read_first_record= tab->save_read_first_record; tab->read_record.read_record= tab->save_read_record; tab->save_read_first_record= NULL; } executed= true; rc= join->error || thd->is_fatal_error; } exit: thd->where= save_where; thd->lex->current_select= save_select; DBUG_RETURN(rc); } bool subselect_union_engine::exec() { THD * const thd= unit->thd; DBUG_ASSERT(thd == item->unit->thd); char const *save_where= thd->where; const bool res= (unit->optimize() || unit->exec()); thd->where= save_where; return res; } /** Search, using a table scan, for at least one row satisfying select condition. The caller must set item's 'value' to 'false' before calling this function. This function will set it to 'true' if it finds a matching row. @returns false if ok, true if read error. */ bool subselect_indexsubquery_engine::scan_table() { int error; TABLE *table= tab->table; DBUG_ENTER("subselect_indexsubquery_engine::scan_table"); // We never need to do a table scan of the materialized table. DBUG_ASSERT(engine_type() != HASH_SJ_ENGINE); if ((table->file->inited && (error= table->file->ha_index_end())) || (error= table->file->ha_rnd_init(1))) { (void) report_handler_error(table, error); DBUG_RETURN(true); } table->file->extra_opt(HA_EXTRA_CACHE, current_thd->variables.read_buff_size); table->null_row= 0; for (;;) { error=table->file->ha_rnd_next(table->record[0]); if (error && error != HA_ERR_END_OF_FILE) { error= report_handler_error(table, error); break; } /* No more rows */ if (table->status) break; if (!cond || cond->val_int()) { static_cast<Item_in_subselect*>(item)->value= true; break; } } table->file->ha_rnd_end(); DBUG_RETURN(error != 0); } /** Copy ref key and check for null parts in it Construct a search tuple to be used for index lookup. If one of the key parts have a NULL value, the following logic applies: For top level items, e.g. "WHERE <outer_value_list> IN (SELECT <inner_value_list>...)" where one of the outer values are NULL, the IN predicate evaluates to false/UNKNOWN (we don't care) and it's not necessary to evaluate the subquery. That shortcut is taken in Item_in_optimizer::val_int(). Thus, if a key part with a NULL value is found here, the NULL is either not outer or this subquery is not top level. Therefore we cannot shortcut subquery execution if a NULL is found here. Thus, if one of the key parts have a NULL value there are two possibilities: a) The NULL is from the outer_value_list. Since this is not a top level item (see above) we need to check whether this predicate evaluates to NULL or false. That is done by checking if the subquery has a row if the conditions based on outer NULL values are disabled. Index lookup cannot be used for this, so a table scan must be done. b) The NULL is local to the subquery, e.g.: "WHERE ... IN (SELECT ... WHERE inner_col IS NULL)" In this case we're looking for rows with the exact inner_col value of NULL, not rows that match if the "inner_col IS NULL" condition is disabled. Index lookup can be used for this. @see subselect_indexsubquery_engine::exec() @see Item_in_optimizer::val_int() @param[out] require_scan true if a NULL value is found that falls into category a) above, false if index lookup can be used. @param[out] convert_error true if an error occured during conversion of values from one type to another, false otherwise. */ void subselect_indexsubquery_engine::copy_ref_key(bool *require_scan, bool *convert_error) { DBUG_ENTER("subselect_indexsubquery_engine::copy_ref_key"); *require_scan= false; *convert_error= false; for (uint part_no= 0; part_no < tab->ref.key_parts; part_no++) { store_key *s_key= tab->ref.key_copy[part_no]; if (s_key == NULL) continue; // key is const and does not need to be reevaluated const enum store_key::store_key_result store_res= s_key->copy(); tab->ref.key_err= store_res; if (s_key->null_key) { /* If we have materialized the subquery: - this NULL ref item cannot be local to the subquery (any such conditions was handled during materialization) - neither can it be outer, because this case is separately managed in subselect_hash_sj_engine::exec(). */ DBUG_ASSERT(engine_type() != HASH_SJ_ENGINE); const bool *cond_guard= tab->ref.cond_guards[part_no]; /* NULL value is from the outer_value_list if the key part has a cond guard that deactivates the condition. @see TABLE_REF::cond_guards */ if (cond_guard && !*cond_guard) { DBUG_ASSERT(!(static_cast <Item_in_subselect*>(item) ->is_top_level_item())); *require_scan= true; DBUG_VOID_RETURN; } } /* Check if the error is equal to STORE_KEY_FATAL. This is not expressed using the store_key::store_key_result enum because ref.key_err is a boolean and we want to detect both TRUE and STORE_KEY_FATAL from the space of the union of the values of [TRUE, FALSE] and store_key::store_key_result. TODO: fix the variable an return types. */ if (store_res == store_key::STORE_KEY_FATAL) { /* Error converting the left IN operand to the column type of the right IN operand. */ tab->table->status= STATUS_NOT_FOUND; *convert_error= true; DBUG_VOID_RETURN; } } DBUG_VOID_RETURN; } /* Index-lookup subselect 'engine' - run the subquery SYNOPSIS subselect_indexsubquery_engine:exec() full_scan DESCRIPTION The engine is used to resolve subqueries in form oe IN (SELECT key FROM tbl WHERE subq_where) The value of the predicate is calculated as follows: 1. If oe IS NULL, this is a special case, do a full table scan on table tbl and search for row that satisfies subq_where. If such row is found, return NULL, otherwise return FALSE. 2. Make an index lookup via key=oe, search for a row that satisfies subq_where. If found, return TRUE. 3. If check_null==TRUE, make another lookup via key=NULL, search for a row that satisfies subq_where. If found, return NULL, otherwise return FALSE. 4. If unique==true, there can be only one row with key=oe and only one row with key=NULL, we use that fact to shorten the search process. TODO The step #1 can be optimized further when the index has several key parts. Consider a subquery: (oe1, oe2) IN (SELECT keypart1, keypart2 FROM tbl WHERE subq_where) and suppose we need to evaluate it for {oe1, oe2}=={const1, NULL}. Current code will do a full table scan and obtain correct result. There is a better option: instead of evaluating SELECT keypart1, keypart2 FROM tbl WHERE subq_where (1) and checking if it has produced any matching rows, evaluate SELECT keypart2 FROM tbl WHERE subq_where AND keypart1=const1 (2) If this query produces a row, the result is NULL (as we're evaluating "(const1, NULL) IN { (const1, X), ... }", which has a value of UNKNOWN, i.e. NULL). If the query produces no rows, the result is FALSE. We currently evaluate (1) by doing a full table scan. (2) can be evaluated by doing a "ref" scan on "keypart1=const1", which can be much cheaper. We can use index statistics to quickly check whether "ref" scan will be cheaper than full table scan. RETURN 0 1 */ bool subselect_indexsubquery_engine::exec() { DBUG_ENTER("subselect_indexsubquery_engine::exec"); int error; bool null_finding= 0; TABLE *table= tab->table; // 'tl' is NULL if this is a tmp table created by subselect_hash_sj_engine. TABLE_LIST *tl= table->pos_in_table_list; Item_in_subselect *const item_in= static_cast<Item_in_subselect*>(item); item_in->value= false; table->status= 0; if (tl && tl->uses_materialization() && !tab->materialized) { bool err= mysql_handle_single_derived(table->in_use->lex, tl, mysql_derived_create) || mysql_handle_single_derived(table->in_use->lex, tl, mysql_derived_materialize); if (!tab->table->in_use->lex->describe) mysql_handle_single_derived(table->in_use->lex, tl, mysql_derived_cleanup); if (err) DBUG_RETURN(1); tab->materialized= true; } if (check_null) { /* We need to check for NULL if there wasn't a matching value */ *tab->ref.null_ref_key= 0; // Search first for not null item_in->was_null= false; } /* Copy the ref key and check for nulls... */ bool require_scan, convert_error; copy_ref_key(&require_scan, &convert_error); if (convert_error) DBUG_RETURN(0); if (require_scan) { const bool scan_result= scan_table(); DBUG_RETURN(scan_result); } if (!table->file->inited && (error= table->file->ha_index_init(tab->ref.key, !unique /* sorted */))) { (void) report_handler_error(table, error); DBUG_RETURN(true); } error= table->file->ha_index_read_map(table->record[0], tab->ref.key_buff, make_prev_keypart_map(tab->ref.key_parts), HA_READ_KEY_EXACT); if (error && error != HA_ERR_KEY_NOT_FOUND && error != HA_ERR_END_OF_FILE) error= report_handler_error(table, error); else { for (;;) { error= 0; table->null_row= 0; if (!table->status) { if ((!cond || cond->val_int()) && (!having || having->val_int())) { item_in->value= true; if (null_finding) { /* This is dead code; subqueries with check_null==true are always transformed with IN-to-EXISTS and thus their artificial HAVING rejects NULL values... */ DBUG_ASSERT(false); item_in->was_null= true; } break; } if (unique) break; error= table->file->ha_index_next_same(table->record[0], tab->ref.key_buff, tab->ref.key_length); if (error && error != HA_ERR_END_OF_FILE) { error= report_handler_error(table, error); break; } } else { if (!check_null || null_finding) break; /* We don't need to check nulls */ /* Check if there exists a row with a null value in the index. We come here only if ref_or_null, and ref_or_null is always on a single column (first keypart of the index). So we have only one NULL bit to turn on: */ *tab->ref.null_ref_key= 1; null_finding= 1; if ((error= (safe_index_read(tab) == 1))) break; } } } DBUG_RETURN(error != 0); } uint subselect_single_select_engine::cols() const { return select_lex->item_list.elements; } uint subselect_union_engine::cols() const { DBUG_ASSERT(unit->is_prepared()); // should be called after fix_fields() return unit->types.elements; } uint8 subselect_single_select_engine::uncacheable() const { return select_lex->uncacheable; } uint8 subselect_union_engine::uncacheable() const { return unit->uncacheable; } void subselect_single_select_engine::exclude() { select_lex->master_unit()->exclude_level(); } void subselect_union_engine::exclude() { unit->exclude_level(); } void subselect_indexsubquery_engine::exclude() { //this never should be called DBUG_ASSERT(0); } table_map subselect_engine::calc_const_tables(TABLE_LIST *table) { table_map map= 0; for (; table; table= table->next_leaf) { TABLE *tbl= table->table; if (tbl && tbl->const_table) map|= tbl->map; } return map; } table_map subselect_single_select_engine::upper_select_const_tables() const { return calc_const_tables(select_lex->outer_select()->leaf_tables); } table_map subselect_union_engine::upper_select_const_tables() const { return calc_const_tables(unit->outer_select()->leaf_tables); } void subselect_single_select_engine::print(String *str, enum_query_type query_type) { select_lex->print(item->unit->thd, str, query_type); } void subselect_union_engine::print(String *str, enum_query_type query_type) { unit->print(str, query_type); } /* TODO: The ::print method below should be changed as follows. Do it after all other tests pass. void subselect_indexsubquery_engine::print(String *str) { KEY *key_info= tab->table->key_info + tab->ref.key; str->append(STRING_WITH_LEN("<primary_index_lookup>(")); for (uint i= 0; i < key_info->key_parts; i++) tab->ref.items[i]->print(str); str->append(STRING_WITH_LEN(" in ")); str->append(tab->table->s->table_name.str, tab->table->s->table_name.length); str->append(STRING_WITH_LEN(" on ")); str->append(key_info->name); if (cond) { str->append(STRING_WITH_LEN(" where ")); cond->print(str); } str->append(')'); } */ void subselect_indexsubquery_engine::print(String *str, enum_query_type query_type) { if (unique) str->append(STRING_WITH_LEN("<primary_index_lookup>(")); else str->append(STRING_WITH_LEN("<index_lookup>(")); tab->ref.items[0]->print(str, query_type); str->append(STRING_WITH_LEN(" in ")); if (tab->table->pos_in_table_list && tab->table->pos_in_table_list->uses_materialization()) { /* For materialized derived tables/views use table/view alias instead of temporary table name, as it changes on each run and not acceptable for EXPLAIN EXTENDED. */ str->append(tab->table->alias, strlen(tab->table->alias)); } else if (tab->table->s->table_category == TABLE_CATEGORY_TEMPORARY) { // Could be from subselect_hash_sj_engine. str->append(STRING_WITH_LEN("<temporary table>")); } else str->append(tab->table->s->table_name.str, tab->table->s->table_name.length); KEY *key_info= tab->table->key_info+ tab->ref.key; str->append(STRING_WITH_LEN(" on ")); str->append(key_info->name); if (check_null) str->append(STRING_WITH_LEN(" checking NULL")); if (cond) { str->append(STRING_WITH_LEN(" where ")); cond->print(str, query_type); } if (having) { str->append(STRING_WITH_LEN(" having ")); having->print(str, query_type); } str->append(')'); } /** change select_result object of engine. @param si new subselect Item @param res new select_result object @retval FALSE OK @retval TRUE error */ bool subselect_single_select_engine::change_result(Item_subselect *si, select_result_interceptor *res) { item= si; result= res; return select_lex->join->change_result(result, NULL); } /** change select_result object of engine. @param si new subselect Item @param res new select_result object @retval FALSE OK @retval TRUE error */ bool subselect_union_engine::change_result(Item_subselect *si, select_result_interceptor *res) { item= si; int rc= unit->change_result(res, result); result= res; return rc; } /** change select_result emulation, never should be called. @param si new subselect Item @param res new select_result object @retval FALSE OK @retval TRUE error */ bool subselect_indexsubquery_engine::change_result(Item_subselect *si, select_result_interceptor *res) { DBUG_ASSERT(0); return TRUE; } /** Report about presence of tables in subquery. @retval TRUE there are not tables used in subquery @retval FALSE there are some tables in subquery */ bool subselect_single_select_engine::no_tables() const { return(select_lex->table_list.elements == 0); } /* Check statically whether the subquery can return NULL SINOPSYS subselect_single_select_engine::may_be_null() RETURN FALSE can guarantee that the subquery never return NULL TRUE otherwise */ bool subselect_single_select_engine::may_be_null() const { return ((no_tables() && !join->conds && !join->having) ? maybe_null : 1); } /** Report about presence of tables in subquery. @retval TRUE there are not tables used in subquery @retval FALSE there are some tables in subquery */ bool subselect_union_engine::no_tables() const { for (SELECT_LEX *sl= unit->first_select(); sl; sl= sl->next_select()) { if (sl->table_list.elements) return FALSE; } return TRUE; } /** Report about presence of tables in subquery. @retval TRUE there are not tables used in subquery @retval FALSE there are some tables in subquery */ bool subselect_indexsubquery_engine::no_tables() const { /* returning value is correct, but this method should never be called */ return 0; } /****************************************************************************** WL#1110 - Implementation of class subselect_hash_sj_engine ******************************************************************************/ /** Create all structures needed for subquery execution using hash semijoin. @detail - Create a temporary table to store the result of the IN subquery. The temporary table has one hash index on all its columns. If single-column, the index allows at most one NULL row. - Create a new result sink that sends the result stream of the subquery to the temporary table, - Create and initialize a new JOIN_TAB, and TABLE_REF objects to perform lookups into the indexed temporary table. @param tmp_columns columns of temporary table @notice: Currently Item_subselect::init() already chooses and creates at parse time an engine with a corresponding JOIN to execute the subquery. @retval TRUE if error @retval FALSE otherwise */ bool subselect_hash_sj_engine::setup(List<Item> *tmp_columns) { /* The result sink where we will materialize the subquery result. */ select_union *tmp_result_sink; /* The table into which the subquery is materialized. */ TABLE *tmp_table; KEY *tmp_key; /* The only index on the temporary table. */ uint tmp_key_parts; /* Number of keyparts in tmp_key. */ Item_in_subselect *item_in= (Item_in_subselect *) item; DBUG_ENTER("subselect_hash_sj_engine::setup"); /* 1. Create/initialize materialization related objects. */ /* Create and initialize a select result interceptor that stores the result stream in a temporary table. The temporary table itself is managed (created/filled/etc) internally by the interceptor. */ if (!(tmp_result_sink= new select_union)) DBUG_RETURN(TRUE); THD * const thd= item->unit->thd; if (tmp_result_sink->create_result_table( thd, tmp_columns, true, thd->variables.option_bits | TMP_TABLE_ALL_COLUMNS, "materialized-subquery", true, true)) DBUG_RETURN(TRUE); tmp_table= tmp_result_sink->table; tmp_key= tmp_table->key_info; tmp_key_parts= tmp_key->user_defined_key_parts; /* If the subquery has blobs, or the total key lenght is bigger than some length, then the created index cannot be used for lookups and we can't use hash semi join. If this is the case, delete the temporary table since it will not be used, and tell the caller we failed to initialize the engine. */ if (tmp_table->s->keys == 0) { DBUG_ASSERT(tmp_table->s->db_type() == myisam_hton); DBUG_ASSERT( tmp_table->s->uniques || tmp_table->key_info->key_length >= tmp_table->file->max_key_length() || tmp_table->key_info->user_defined_key_parts > tmp_table->file->max_key_parts()); free_tmp_table(thd, tmp_table); delete result; result= NULL; DBUG_RETURN(TRUE); } result= tmp_result_sink; /* Make sure there is only one index on the temp table, and it doesn't have the extra key part created when s->uniques > 0. */ DBUG_ASSERT(tmp_table->s->keys == 1 && tmp_columns->elements == tmp_key_parts); /* 2. Create/initialize execution related objects. */ /* Create and initialize the JOIN_TAB that represents an index lookup plan operator into the materialized subquery result. Notice that: - this JOIN_TAB has no corresponding JOIN (and doesn't need one), and - here we initialize only those members that are used by subselect_indexsubquery_engine, so these objects are incomplete. */ if (!(tab= new (thd->mem_root) JOIN_TAB)) DBUG_RETURN(TRUE); tab->table= tmp_table; tab->ref.key= 0; /* The only temp table index. */ tab->ref.key_length= tmp_key->key_length; if (!(tab->ref.key_buff= (uchar*) thd->calloc(ALIGN_SIZE(tmp_key->key_length) * 2)) || !(tab->ref.key_copy= (store_key**) thd->alloc((sizeof(store_key*) * tmp_key_parts))) || !(tab->ref.items= (Item**) thd->alloc(sizeof(Item*) * tmp_key_parts))) DBUG_RETURN(TRUE); uchar *cur_ref_buff= tab->ref.key_buff; /* Like semijoin-materialization-lookup (see create_subquery_equalities()), create an artificial condition to post-filter those rows matched by index lookups that cannot be distinguished by the index lookup procedure, e.g. because of truncation (if the outer column type's length is bigger than the inner column type's, index lookup will use a truncated outer value as search key, yielding false positives). Prepared statements execution requires that fix_fields is called for every execution. In order to call fix_fields we need to create a Name_resolution_context and a corresponding TABLE_LIST for the temporary table for the subquery, so that all column references to the materialized subquery table can be resolved correctly. */ DBUG_ASSERT(cond == NULL); if (!(cond= new Item_cond_and)) DBUG_RETURN(TRUE); /* Table reference for tmp_table that is used to resolve column references (Item_fields) to columns in tmp_table. */ TABLE_LIST *tmp_table_ref; if (!(tmp_table_ref= (TABLE_LIST*) thd->calloc(sizeof(TABLE_LIST)))) DBUG_RETURN(TRUE); tmp_table_ref->init_one_table("", 0, "materialized-subquery", 21, "materialized-subquery", TL_READ); tmp_table_ref->table= tmp_table; /* Name resolution context for all tmp_table columns created below. */ Name_resolution_context *context= new Name_resolution_context; context->init(); context->first_name_resolution_table= context->last_name_resolution_table= tmp_table_ref; KEY_PART_INFO *key_parts= tmp_key->key_part; for (uint part_no= 0; part_no < tmp_key_parts; part_no++) { /* New equi-join condition for the current column. */ Item_func_eq *eq_cond; /* Item for the corresponding field from the materialized temp table. */ Item_field *right_col_item; const bool nullable= key_parts[part_no].field->real_maybe_null(); tab->ref.items[part_no]= item_in->left_expr->element_index(part_no); if (!(right_col_item= new Item_field(thd, context, key_parts[part_no].field)) || !(eq_cond= new Item_func_eq(tab->ref.items[part_no], right_col_item)) || ((Item_cond_and*)cond)->add(eq_cond)) { delete cond; cond= NULL; DBUG_RETURN(TRUE); } tab->ref.key_copy[part_no]= new store_key_item(thd, key_parts[part_no].field, /* TODO: the NULL byte is taken into account in key_parts[part_no].store_length, so instead of cur_ref_buff + MY_TEST(maybe_null), we could use that information instead. */ cur_ref_buff + (nullable ? 1 : 0), nullable ? cur_ref_buff : 0, key_parts[part_no].length, tab->ref.items[part_no]); if (nullable && // nullable column in tmp table, // and UNKNOWN should not be interpreted as FALSE !item_in->is_top_level_item()) { // It must be the single column, or we wouldn't be here DBUG_ASSERT(tmp_key_parts == 1); // Be ready to search for NULL into inner column: tab->ref.null_ref_key= cur_ref_buff; mat_table_has_nulls= NEX_UNKNOWN; } else { tab->ref.null_ref_key= NULL; mat_table_has_nulls= NEX_IRRELEVANT_OR_FALSE; } cur_ref_buff+= key_parts[part_no].store_length; } tab->ref.key_err= 1; tab->ref.key_parts= tmp_key_parts; if (cond->fix_fields(thd, &cond)) DBUG_RETURN(TRUE); /* Create and optimize the JOIN that will be used to materialize the subquery if not yet created. */ materialize_engine->prepare(); /* Let our engine reuse this query plan for materialization. */ materialize_engine->join->change_result(result, NULL); DBUG_RETURN(FALSE); } subselect_hash_sj_engine::~subselect_hash_sj_engine() { /* Assure that cleanup has been called for this engine. */ DBUG_ASSERT(!tab); delete result; } /** Cleanup performed after each PS execution. @detail Called in the end of JOIN::prepare for PS from Item_subselect::cleanup. */ void subselect_hash_sj_engine::cleanup() { DBUG_ENTER("subselect_hash_sj_engine::cleanup"); is_materialized= false; result->cleanup(); /* Resets the temp table as well. */ THD * const thd= item->unit->thd; DEBUG_SYNC(thd, "before_index_end_in_subselect"); if (tab->table->file->inited) tab->table->file->ha_index_end(); // Close the scan over the index free_tmp_table(thd, tab->table); tab= NULL; materialize_engine->cleanup(); DBUG_VOID_RETURN; } /** Execute a subquery IN predicate via materialization. @detail If needed materialize the subquery into a temporary table, then copmpute the predicate via a lookup into this table. @retval TRUE if error @retval FALSE otherwise */ bool subselect_hash_sj_engine::exec() { Item_in_subselect *item_in= (Item_in_subselect *) item; TABLE *const table= tab->table; DBUG_ENTER("subselect_hash_sj_engine::exec"); /* Optimize and materialize the subquery during the first execution of the subquery predicate. */ if (!is_materialized) { bool res; THD * const thd= item->unit->thd; SELECT_LEX *save_select= thd->lex->current_select; thd->lex->current_select= materialize_engine->select_lex; if ((res= materialize_engine->join->optimize())) goto err; /* purecov: inspected */ materialize_engine->join->exec(); if ((res= MY_TEST(materialize_engine->join->error || thd->is_fatal_error))) goto err; /* TODO: - Unlock all subquery tables as we don't need them. To implement this we need to add new functionality to JOIN::join_free that can unlock all tables in a subquery (and all its subqueries). - The temp table used for grouping in the subquery can be freed immediately after materialization (yet it's done together with unlocking). */ is_materialized= TRUE; // Calculate row count: table->file->info(HA_STATUS_VARIABLE); /* Set tmp_param only if its usable, i.e. tmp_param->copy_field != NULL. */ tmp_param= &(item_in->unit->outer_select()->join->tmp_table_param); if (tmp_param && !tmp_param->copy_field) tmp_param= NULL; err: thd->lex->current_select= save_select; if (res) DBUG_RETURN(res); } // if (!is_materialized) if (table->file->stats.records == 0) { // The correct answer is FALSE. item_in->value= false; DBUG_RETURN(false); } /* Here we could be brutal and set item_in->null_value. But we prefer to be well-behaved and rather set the properties which Item_in_subselect::val_bool() and Item_in_optimizer::val_int() expect, and then those functions will set null_value based on those properties. */ if (item_in->left_expr->element_index(0)->null_value) { /* The first outer expression oe1 is NULL. It is the single outer expression because if there would be more ((oe1,oe2,...)IN(...)) then either they would be non-nullable (so we wouldn't be here) or the predicate would be top-level (so we wouldn't be here, Item_in_optimizer::val_int() would have short-cut). The correct answer is UNKNOWN. Do as if searching with all triggered conditions disabled: this would surely find a row. The caller will translate this to UNKNOWN. */ DBUG_ASSERT(item_in->left_expr->cols() == 1); item_in->value= true; DBUG_RETURN(false); } if (subselect_indexsubquery_engine::exec()) // Search with index DBUG_RETURN(true); if (!item_in->value && // no exact match mat_table_has_nulls != NEX_IRRELEVANT_OR_FALSE) { /* There is only one outer expression. It's not NULL. exec() above has set the answer to FALSE, but if there exists an inner NULL in the temporary table, then the correct answer is UNKNOWN, so let's find out. */ if (mat_table_has_nulls == NEX_UNKNOWN) // We do not know yet { // Search for NULL inside tmp table, and remember the outcome. *tab->ref.null_ref_key= 1; if (!table->file->inited && table->file->ha_index_init(tab->ref.key, false /* sorted */)) DBUG_RETURN(true); if (safe_index_read(tab) == 1) DBUG_RETURN(true); *tab->ref.null_ref_key= 0; // prepare for next searches of non-NULL mat_table_has_nulls= (table->status == 0) ? NEX_TRUE : NEX_IRRELEVANT_OR_FALSE; } if (mat_table_has_nulls == NEX_TRUE) { /* There exists an inner NULL. The correct answer is UNKNOWN. Do as if searching with all triggered conditions enabled; that would not find any match, but Item_is_not_null_test would notice a NULL: */ item_in->value= false; item_in->was_null= true; } } DBUG_RETURN(false); } /** Print the state of this engine into a string for debugging and views. */ void subselect_hash_sj_engine::print(String *str, enum_query_type query_type) { str->append(STRING_WITH_LEN(" <materialize> (")); materialize_engine->print(str, query_type); str->append(STRING_WITH_LEN(" ), ")); if (tab) subselect_indexsubquery_engine::print(str, query_type); else str->append(STRING_WITH_LEN( "<the access method for lookups is not yet created>" )); }

sql/item_subselect.cc (2,283 lines of code) (raw):