mirror of
https://github.com/FirebirdSQL/firebird.git
synced 2025-01-27 20:03:03 +01:00
09c51110b4
Notes: 1) Some optimizations will follow after more deep analysis. 2) The syntax "==" is not yet agreed on. I'd prefer it to be changed.
7608 lines
217 KiB
C++
7608 lines
217 KiB
C++
/*
|
||
* PROGRAM: JRD Access Method
|
||
* MODULE: opt.cpp
|
||
* DESCRIPTION: Optimizer / record selection expression compiler
|
||
*
|
||
* The contents of this file are subject to the Interbase Public
|
||
* License Version 1.0 (the "License"); you may not use this file
|
||
* except in compliance with the License. You may obtain a copy
|
||
* of the License at http://www.Inprise.com/IPL.html
|
||
*
|
||
* Software distributed under the License is distributed on an
|
||
* "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express
|
||
* or implied. See the License for the specific language governing
|
||
* rights and limitations under the License.
|
||
*
|
||
* The Original Code was created by Inprise Corporation
|
||
* and its predecessors. Portions created by Inprise Corporation are
|
||
* Copyright (C) Inprise Corporation.
|
||
*
|
||
* All Rights Reserved.
|
||
* Contributor(s): ______________________________________.
|
||
* 2002.10.12: Nickolay Samofatov: Fixed problems with wrong results produced by
|
||
* outer joins
|
||
* 2001.07.28: John Bellardo: Added code to handle rse_skip nodes.
|
||
* 2001.07.17 Claudio Valderrama: Stop crash with indices and recursive calls
|
||
* of OPT_compile: indicator csb_indices set to zero after used memory is
|
||
* returned to the free pool.
|
||
* 2001.02.15: Claudio Valderrama: Don't obfuscate the plan output if a selectable
|
||
* stored procedure doesn't access tables, views or other procedures directly.
|
||
* 2002.10.29 Sean Leyne - Removed obsolete "Netware" port
|
||
* 2002.10.30: Arno Brinkman: Changes made to gen_retrieval, OPT_compile and make_inversion.
|
||
* Procedure sort_indices added. The changes in gen_retrieval are that now
|
||
* an index with high field-count has priority to build an index from.
|
||
* Procedure make_inversion is changed so that it not pick every index
|
||
* that comes away, this was slow performance with bad selectivity indices
|
||
* which most are foreign_keys with a reference to a few records.
|
||
* 2002.11.01: Arno Brinkman: Added match_indices for better support of OR handling
|
||
* in INNER JOIN (gen_join) statements.
|
||
* 2002.12.15: Arno Brinkman: Added find_used_streams, so that inside opt_compile all the
|
||
* streams are marked active. This causes that more indices can be used for
|
||
* a retrieval. With this change BUG SF #219525 is solved too.
|
||
*
|
||
*/
|
||
|
||
#include "firebird.h"
|
||
#include "../jrd/common.h"
|
||
#include <stdio.h>
|
||
#include <string.h>
|
||
#include "../jrd/ibase.h"
|
||
#include "../jrd/jrd.h"
|
||
#include "../jrd/align.h"
|
||
#include "../jrd/val.h"
|
||
#include "../jrd/req.h"
|
||
#include "../jrd/exe.h"
|
||
#include "../jrd/lls.h"
|
||
#include "../jrd/ods.h"
|
||
#include "../jrd/btr.h"
|
||
#include "../jrd/sort.h"
|
||
#include "../jrd/rse.h"
|
||
#include "../jrd/intl.h"
|
||
#include "../jrd/thd.h"
|
||
#include "../jrd/gdsassert.h"
|
||
#include "../jrd/all_proto.h"
|
||
#include "../jrd/btr_proto.h"
|
||
#include "../jrd/cch_proto.h"
|
||
#include "../jrd/cmp_proto.h"
|
||
#include "../jrd/dpm_proto.h"
|
||
#include "../jrd/err_proto.h"
|
||
#include "../jrd/ext_proto.h"
|
||
#include "../jrd/evl_proto.h"
|
||
#include "../jrd/intl_proto.h"
|
||
|
||
#include "../jrd/lck_proto.h"
|
||
#include "../jrd/met_proto.h"
|
||
#include "../jrd/mov_proto.h"
|
||
#include "../jrd/opt_proto.h"
|
||
#include "../jrd/par_proto.h"
|
||
#include "../jrd/gds_proto.h"
|
||
#include "../jrd/dbg_proto.h"
|
||
#include "../common/classes/array.h"
|
||
#include "../common/classes/objects_array.h"
|
||
|
||
using namespace Jrd;
|
||
|
||
#ifdef DEV_BUILD
|
||
#define OPT_DEBUG
|
||
#endif
|
||
|
||
static bool augment_stack(jrd_nod*, NodeStack&);
|
||
static UINT64 calculate_priority_level(const OptimizerBlk*, const index_desc*);
|
||
static void check_indices(const CompilerScratch::csb_repeat*);
|
||
static bool check_relationship(const OptimizerBlk*, USHORT, USHORT);
|
||
static void check_sorts(RecordSelExpr*);
|
||
static void class_mask(USHORT, jrd_nod**, ULONG *);
|
||
static void clear_bounds(OptimizerBlk*, const index_desc*);
|
||
static jrd_nod* compose(jrd_nod**, jrd_nod*, NOD_T);
|
||
static bool computable(CompilerScratch*, jrd_nod*, SSHORT, bool, bool);
|
||
static void compute_dependencies(const jrd_nod*, ULONG*);
|
||
static void compute_dbkey_streams(const CompilerScratch*, const jrd_nod*, UCHAR*);
|
||
static void compute_rse_streams(const CompilerScratch*, const RecordSelExpr*, UCHAR*);
|
||
static bool check_for_nod_from(const jrd_nod*);
|
||
static SLONG decompose(thread_db*, jrd_nod*, NodeStack&, CompilerScratch*);
|
||
static USHORT distribute_equalities(NodeStack&, CompilerScratch*, USHORT);
|
||
static bool dump_index(const jrd_nod*, SCHAR**, SSHORT*);
|
||
static bool dump_rsb(const jrd_req*, const RecordSource*, SCHAR**, SSHORT*);
|
||
static bool estimate_cost(thread_db*, OptimizerBlk*, USHORT, double *, double *);
|
||
static bool expression_contains(const jrd_nod*, NOD_T);
|
||
static bool expression_contains_stream(const jrd_nod*, UCHAR);
|
||
#ifdef EXPRESSION_INDICES
|
||
static bool expression_equal(thread_db*, OptimizerBlk*, const index_desc*,
|
||
jrd_nod*, USHORT);
|
||
static bool expression_equal2(thread_db*, OptimizerBlk*, jrd_nod*,
|
||
jrd_nod*, USHORT);
|
||
#endif
|
||
static void find_best(thread_db*, OptimizerBlk*, USHORT, USHORT, UCHAR*, const jrd_nod*,
|
||
double, double);
|
||
static jrd_nod* find_dbkey(jrd_nod*, USHORT, SLONG*);
|
||
static USHORT find_order(thread_db*, OptimizerBlk*, UCHAR*, const jrd_nod*);
|
||
static void find_rsbs(RecordSource*, StreamStack*, RsbStack*);
|
||
static void find_used_streams(const RecordSource*, UCHAR*);
|
||
static void form_rivers(thread_db*, OptimizerBlk*, UCHAR*, RiverStack&, jrd_nod**, jrd_nod**, jrd_nod*);
|
||
static bool form_river(thread_db*, OptimizerBlk*, USHORT, UCHAR *, UCHAR *, RiverStack&, jrd_nod**,
|
||
jrd_nod**, jrd_nod*);
|
||
static RecordSource* gen_aggregate(thread_db*, OptimizerBlk*, jrd_nod*);
|
||
static RecordSource* gen_boolean(thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*);
|
||
static RecordSource* gen_first(thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*);
|
||
static void gen_join(thread_db*, OptimizerBlk*, UCHAR*, RiverStack&, jrd_nod**, jrd_nod**, jrd_nod*);
|
||
static RecordSource* gen_navigation(thread_db*, OptimizerBlk*, USHORT, jrd_rel*, str*, index_desc*, jrd_nod**);
|
||
#ifdef SCROLLABLE_CURSORS
|
||
static RecordSource* gen_nav_rsb(thread_db*, OptimizerBlk*, USHORT, jrd_rel*, str*, index_desc*, RSE_GET_MODE);
|
||
#else
|
||
static RecordSource* gen_nav_rsb(thread_db*, OptimizerBlk*, USHORT, jrd_rel*, str*, index_desc*);
|
||
#endif
|
||
static RecordSource* gen_outer(thread_db*, OptimizerBlk*, RecordSelExpr*, RiverStack&, jrd_nod**, jrd_nod**);
|
||
static RecordSource* gen_procedure(thread_db*, OptimizerBlk*, jrd_nod*);
|
||
static RecordSource* gen_residual_boolean(thread_db*, OptimizerBlk*, RecordSource*);
|
||
static RecordSource* gen_retrieval(thread_db*, OptimizerBlk*, SSHORT, jrd_nod**, jrd_nod**, bool, bool,
|
||
jrd_nod**);
|
||
static RecordSource* gen_rsb(thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*, SSHORT, jrd_rel*, str*, jrd_nod*, float);
|
||
static RecordSource* gen_skip (thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*);
|
||
static RecordSource* gen_sort(thread_db*, OptimizerBlk*, UCHAR *, UCHAR *, RecordSource*, jrd_nod*, bool);
|
||
static bool gen_sort_merge(thread_db*, OptimizerBlk*, RiverStack&);
|
||
static RecordSource* gen_union(thread_db*, OptimizerBlk*, jrd_nod*, UCHAR *, USHORT);
|
||
static void get_inactivities(const CompilerScratch*, ULONG*);
|
||
static IndexedRelationship* indexed_relationship(thread_db*, OptimizerBlk*, USHORT);
|
||
static str* make_alias(thread_db*, CompilerScratch*, CompilerScratch::csb_repeat*);
|
||
static jrd_nod* make_binary_node(NOD_T, jrd_nod*, jrd_nod*, bool);
|
||
static RecordSource* make_cross(thread_db*, OptimizerBlk*, RiverStack&);
|
||
static jrd_nod* make_index_node(thread_db*, jrd_rel*, CompilerScratch*, index_desc*);
|
||
static jrd_nod* make_inference_node(CompilerScratch*, jrd_nod*, jrd_nod*, jrd_nod*);
|
||
static jrd_nod* make_inversion(thread_db*, OptimizerBlk*, jrd_nod*, USHORT);
|
||
static jrd_nod* make_missing(thread_db*, OptimizerBlk*, jrd_rel*, jrd_nod*, USHORT, index_desc*);
|
||
static jrd_nod* make_starts(thread_db*, OptimizerBlk*, jrd_rel*, jrd_nod*, USHORT, index_desc*);
|
||
static bool map_equal(const jrd_nod*, const jrd_nod*, const jrd_nod*);
|
||
static void mark_indices(CompilerScratch::csb_repeat*, SSHORT);
|
||
static SSHORT match_index(thread_db*, OptimizerBlk*, SSHORT, jrd_nod*, index_desc*);
|
||
static bool match_indices(thread_db*, OptimizerBlk*, SSHORT, jrd_nod*, index_desc*);
|
||
static USHORT nav_rsb_size(RecordSource*, USHORT, USHORT);
|
||
static bool node_equality(const jrd_nod*, const jrd_nod*);
|
||
static jrd_nod* optimize_like(thread_db*, jrd_nod*);
|
||
#ifdef OPT_DEBUG
|
||
static void print_order(OptimizerBlk*, USHORT, double, double);
|
||
#endif
|
||
static USHORT river_count(USHORT, jrd_nod**);
|
||
static bool river_reference(const River*, const jrd_nod*, bool* field_found = NULL);
|
||
static bool search_stack(const jrd_nod*, const NodeStack&);
|
||
static void set_active(OptimizerBlk*, const River*);
|
||
static void set_direction(const jrd_nod*, jrd_nod*);
|
||
static void set_inactive(OptimizerBlk*, const River*);
|
||
static void set_made_river(OptimizerBlk*, const River*);
|
||
static void set_position(const jrd_nod*, jrd_nod*, const jrd_nod*);
|
||
static void set_rse_inactive(CompilerScratch*, const RecordSelExpr*);
|
||
static void sort_indices_by_selectivity(CompilerScratch::csb_repeat*);
|
||
static SSHORT sort_indices_by_priority(CompilerScratch::csb_repeat*, index_desc**, UINT64*);
|
||
|
||
|
||
/* macro definitions */
|
||
|
||
#ifdef OPT_DEBUG
|
||
const int DEBUG_PUNT = 5;
|
||
const int DEBUG_RELATIONSHIPS = 4;
|
||
const int DEBUG_ALL = 3;
|
||
const int DEBUG_CANDIDATE = 2;
|
||
const int DEBUG_BEST = 1;
|
||
const int DEBUG_NONE = 0;
|
||
|
||
FILE *opt_debug_file = 0;
|
||
static int opt_debug_flag = DEBUG_NONE;
|
||
#endif
|
||
|
||
inline void SET_DEP_BIT(ULONG* array, const SLONG bit)
|
||
{
|
||
array[bit / 32] |= (1L << (bit % 32));
|
||
}
|
||
|
||
inline void CLEAR_DEP_BIT(ULONG* array, const SLONG bit)
|
||
{
|
||
array[bit / 32] &= ~(1L << (bit % 32));
|
||
}
|
||
|
||
inline bool TEST_DEP_BIT(const ULONG* array, const ULONG bit)
|
||
{
|
||
return (array[bit / 32] & (1L << (bit % 32))) != 0;
|
||
}
|
||
|
||
inline bool TEST_DEP_ARRAYS(const ULONG* ar1, const ULONG* ar2)
|
||
{ return (ar1[0] & ar2[0]) || (ar1[1] & ar2[1]) ||
|
||
(ar1[2] & ar2[2]) || (ar1[3] & ar2[3]) ||
|
||
(ar1[4] & ar2[4]) || (ar1[5] & ar2[5]) ||
|
||
(ar1[6] & ar2[6]) || (ar1[7] & ar2[7]);
|
||
}
|
||
|
||
inline int STREAM_INDEX(const jrd_nod* node)
|
||
{
|
||
switch (node->nod_type)
|
||
{
|
||
case nod_relation:
|
||
return e_rel_stream;
|
||
case nod_procedure:
|
||
return e_prc_stream;
|
||
case nod_union:
|
||
return e_uni_stream;
|
||
default:
|
||
return e_agg_stream;
|
||
}
|
||
}
|
||
|
||
/* some arbitrary fudge factors for calculating costs, etc.--
|
||
these could probably be better tuned someday */
|
||
|
||
const double ESTIMATED_SELECTIVITY = 0.01;
|
||
const int INVERSE_ESTIMATE = 10;
|
||
const double INDEX_COST = 30.0;
|
||
const int CACHE_PAGES_PER_STREAM = 15;
|
||
const int SELECTIVITY_THRESHOLD_FACTOR = 10;
|
||
const int OR_SELECTIVITY_THRESHOLD_FACTOR = 2000;
|
||
const UINT64 LOWEST_PRIORITY_LEVEL = 0;
|
||
|
||
/* enumeration of sort datatypes */
|
||
|
||
static const UCHAR sort_dtypes[] =
|
||
{
|
||
0, /* dtype_unknown */
|
||
SKD_text, /* dtype_text */
|
||
SKD_cstring, /* dtype_cstring */
|
||
SKD_varying, /* dtype_varying */
|
||
0,
|
||
0,
|
||
0, /* dtype_packed */
|
||
0, /* dtype_byte */
|
||
SKD_short, /* dtype_short */
|
||
SKD_long, /* dtype_long */
|
||
SKD_quad, /* dtype_quad */
|
||
SKD_float, /* dtype_real */
|
||
SKD_double, /* dtype_double */
|
||
SKD_double, /* dtype_d_float */
|
||
SKD_sql_date, /* dtype_sql_date */
|
||
SKD_sql_time, /* dtype_sql_time */
|
||
SKD_timestamp2, /* dtype_timestamp */
|
||
0, /* dtype_blob */
|
||
0, /* dtype_array */
|
||
SKD_int64 /* dtype_int64 */
|
||
};
|
||
|
||
typedef UCHAR stream_array_t[MAX_STREAMS + 1];
|
||
|
||
|
||
bool OPT_access_path(const jrd_req* request,
|
||
SCHAR* buffer,
|
||
SSHORT buffer_length, USHORT* return_length)
|
||
{
|
||
/**************************************
|
||
*
|
||
* O P T _ a c c e s s _ p a t h
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Returns a formatted access path for all
|
||
* RecordSelExpr's in the specified request.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(request, type_req);
|
||
|
||
SCHAR* begin = buffer;
|
||
|
||
/* loop through all RSEs in the request,
|
||
and describe the rsb tree for that rsb */
|
||
|
||
size_t i;
|
||
for (i = 0; i < request->req_fors.getCount(); i++) {
|
||
RecordSource* rsb = request->req_fors[i];
|
||
if (rsb && !dump_rsb(request, rsb, &buffer, &buffer_length))
|
||
break;
|
||
}
|
||
|
||
*return_length = buffer - begin;
|
||
|
||
return (i >= request->req_fors.getCount());
|
||
}
|
||
|
||
|
||
RecordSource* OPT_compile(thread_db* tdbb,
|
||
CompilerScratch* csb,
|
||
RecordSelExpr* rse,
|
||
NodeStack* parent_stack)
|
||
{
|
||
/**************************************
|
||
*
|
||
* O P T _ c o m p i l e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Compile and optimize a record selection expression into a
|
||
* set of record source blocks (rsb's).
|
||
*
|
||
**************************************/
|
||
stream_array_t streams, beds, local_streams, outer_streams, sub_streams,
|
||
key_streams;
|
||
|
||
DEV_BLKCHK(csb, type_csb);
|
||
DEV_BLKCHK(rse, type_nod);
|
||
|
||
SET_TDBB(tdbb);
|
||
Database* dbb = tdbb->tdbb_database;
|
||
|
||
#ifdef OPT_DEBUG
|
||
if (opt_debug_flag != DEBUG_NONE && !opt_debug_file)
|
||
opt_debug_file = fopen("opt_debug.out", "w");
|
||
#endif
|
||
|
||
|
||
/* If there is a boolean, there is some work to be done. First,
|
||
decompose the boolean into conjunctions. Then get descriptions
|
||
of all indices for all relations in the RecordSelExpr. This will give
|
||
us the info necessary to allocate a optimizer block big
|
||
enough to hold this crud. */
|
||
|
||
|
||
/* Do not allocate the index_desc struct. Let BTR_all do the job. The allocated
|
||
memory will then be in csb->csb_rpt[stream].csb_idx_allocation, which
|
||
gets cleaned up before this function exits. */
|
||
|
||
index_desc* idx = NULL;
|
||
|
||
OptimizerBlk* opt = FB_NEW(*tdbb->getDefaultPool()) OptimizerBlk(tdbb->getDefaultPool());
|
||
opt->opt_streams.grow(csb->csb_n_stream);
|
||
RecordSource* rsb = 0;
|
||
|
||
try {
|
||
|
||
opt->opt_csb = csb;
|
||
if (rse->nod_flags & rse_stream)
|
||
opt->opt_g_flags |= opt_g_stream;
|
||
|
||
beds[0] = streams[0] = key_streams[0] = outer_streams[0] = sub_streams[0] = 0;
|
||
NodeStack conjunct_stack;
|
||
RiverStack rivers_stack;
|
||
SLONG conjunct_count = 0;
|
||
|
||
check_sorts(rse);
|
||
jrd_nod* sort = rse->rse_sorted;
|
||
jrd_nod* project = rse->rse_projection;
|
||
jrd_nod* aggregate = rse->rse_aggregate;
|
||
|
||
// put any additional booleans on the conjunct stack, and see if we
|
||
// can generate additional booleans by associativity--this will help
|
||
// to utilize indices that we might not have noticed
|
||
if (rse->rse_boolean) {
|
||
conjunct_count =
|
||
decompose(tdbb, rse->rse_boolean, conjunct_stack, csb);
|
||
}
|
||
|
||
conjunct_count += distribute_equalities(conjunct_stack, csb, conjunct_count);
|
||
|
||
// AB: If we have limit our retrieval with FIRST / SKIP syntax then
|
||
// we may not deliver above conditions (from higher rse's) to this
|
||
// rse, because the results should be consistent.
|
||
if (rse->rse_skip || rse->rse_first) {
|
||
parent_stack = NULL;
|
||
}
|
||
|
||
// clear the csb_active flag of all streams in the RecordSelExpr
|
||
set_rse_inactive(csb, rse);
|
||
|
||
UCHAR* p = streams + 1;
|
||
|
||
// go through the record selection expression generating
|
||
// record source blocks for all streams
|
||
|
||
// CVC: I defined this var here because it's assigned inside an if() shortly
|
||
// below but it's used later in the loop always, so I assume the idea is that
|
||
// iterations where nod_type != nod_rse are the ones that set up a new stream.
|
||
// Hope this isn't some kind of logic error.
|
||
SSHORT stream = -1;
|
||
jrd_nod** ptr = rse->rse_relation;
|
||
for (const jrd_nod* const* const end = ptr + rse->rse_count; ptr < end;
|
||
ptr++)
|
||
{
|
||
jrd_nod* node = *ptr;
|
||
|
||
// find the stream number and place it at the end of the beds array
|
||
// (if this is really a stream and not another RecordSelExpr)
|
||
|
||
if (node->nod_type != nod_rse)
|
||
{
|
||
stream = (USHORT)(IPTR) node->nod_arg[STREAM_INDEX(node)];
|
||
fb_assert(stream <= MAX_UCHAR);
|
||
fb_assert(beds[0] < MAX_STREAMS && beds[0] < MAX_UCHAR);
|
||
beds[++beds[0]] = (UCHAR) stream;
|
||
}
|
||
|
||
// for nodes which are not relations, generate an rsb to
|
||
// represent that work has to be done to retrieve them;
|
||
// find all the substreams involved and compile them as well
|
||
|
||
rsb = NULL;
|
||
local_streams[0] = 0;
|
||
|
||
switch (node->nod_type)
|
||
{
|
||
case nod_union:
|
||
{
|
||
const SSHORT i = (SSHORT) key_streams[0];
|
||
compute_dbkey_streams(csb, node, key_streams);
|
||
rsb =
|
||
gen_union(tdbb, opt, node, key_streams + i + 1,
|
||
(USHORT) (key_streams[0] - i));
|
||
fb_assert(local_streams[0] < MAX_STREAMS && local_streams[0] < MAX_UCHAR);
|
||
local_streams[++local_streams[0]] =
|
||
(UCHAR)(IPTR) node->nod_arg[e_uni_stream];
|
||
break;
|
||
}
|
||
case nod_aggregate:
|
||
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_STREAMS);
|
||
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_UCHAR);
|
||
rsb = gen_aggregate(tdbb, opt, node);
|
||
fb_assert(local_streams[0] < MAX_STREAMS && local_streams[0] < MAX_UCHAR);
|
||
local_streams[++local_streams[0]] =
|
||
(UCHAR)(IPTR) node->nod_arg[e_agg_stream];
|
||
break;
|
||
case nod_procedure:
|
||
rsb = gen_procedure(tdbb, opt, node);
|
||
fb_assert(local_streams[0] < MAX_STREAMS && local_streams[0] < MAX_UCHAR);
|
||
local_streams[++local_streams[0]] =
|
||
(UCHAR)(IPTR) node->nod_arg[e_prc_stream];
|
||
break;
|
||
case nod_rse:
|
||
compute_rse_streams(csb, (RecordSelExpr*) node, beds);
|
||
compute_rse_streams(csb, (RecordSelExpr*) node, local_streams);
|
||
compute_dbkey_streams(csb, node, key_streams);
|
||
// pass RecordSelExpr boolean only to inner substreams because join condition
|
||
// should never exclude records from outer substreams
|
||
if (rse->rse_jointype == blr_inner ||
|
||
(rse->rse_jointype == blr_left && (ptr - rse->rse_relation) == 1) )
|
||
{
|
||
// AB: For an (X LEFT JOIN Y) mark the outer-streams (X) as
|
||
// active because the inner-streams (Y) are always "dependent"
|
||
// on the outer-streams. So that index retrieval nodes could be made.
|
||
// For an INNER JOIN mark previous generated RecordSource's as active.
|
||
if (rse->rse_jointype == blr_left) {
|
||
for (SSHORT i = 1; i <= outer_streams[0]; i++) {
|
||
csb->csb_rpt[outer_streams[i]].csb_flags |= csb_active;
|
||
}
|
||
}
|
||
|
||
const NodeStack::iterator stackSavepoint(conjunct_stack);
|
||
NodeStack::const_iterator stack_end;
|
||
NodeStack deliverStack;
|
||
|
||
if (rse->rse_jointype != blr_inner) {
|
||
// Make list of nodes that can be delivered to a outer-stream.
|
||
// In fact this are all nodes except when a IS NULL (nod_missing)
|
||
// comparision is done.
|
||
// Note! Don't forget that this can be burried inside a expression
|
||
// such as "CASE WHEN (FieldX IS NULL) THEN 0 ELSE 1 END = 0"
|
||
NodeStack::iterator stackItem;
|
||
if (parent_stack)
|
||
{
|
||
stackItem = *parent_stack;
|
||
}
|
||
for (; stackItem.hasData(); ++stackItem) {
|
||
jrd_nod* deliverNode = stackItem.object();
|
||
if (!expression_contains(deliverNode, nod_missing)) {
|
||
deliverStack.push(deliverNode);
|
||
}
|
||
}
|
||
stack_end = conjunct_stack.merge(deliverStack);
|
||
}
|
||
else {
|
||
if (parent_stack)
|
||
{
|
||
stack_end = conjunct_stack.merge(*parent_stack);
|
||
}
|
||
}
|
||
|
||
rsb = OPT_compile(tdbb, csb, (RecordSelExpr*) node, &conjunct_stack);
|
||
|
||
if (rse->rse_jointype != blr_inner) {
|
||
// Remove previously added parent conjuctions from the stack.
|
||
conjunct_stack.split(stack_end, deliverStack);
|
||
}
|
||
else {
|
||
if (parent_stack)
|
||
{
|
||
conjunct_stack.split(stack_end, *parent_stack);
|
||
}
|
||
}
|
||
|
||
if (rse->rse_jointype == blr_left) {
|
||
for (SSHORT i = 1; i <= outer_streams[0]; i++) {
|
||
csb->csb_rpt[outer_streams[i]].csb_flags &= ~csb_active;
|
||
}
|
||
}
|
||
}
|
||
else {
|
||
rsb = OPT_compile(tdbb, csb, (RecordSelExpr*) node, parent_stack);
|
||
if (rse->rse_jointype == blr_left)
|
||
find_used_streams(rsb, outer_streams);
|
||
}
|
||
break;
|
||
}
|
||
|
||
// if an rsb has been generated, we have a non-relation;
|
||
// so it forms a river of its own since it is separately
|
||
// optimized from the streams in this rsb
|
||
|
||
if (rsb) {
|
||
const SSHORT i = local_streams[0];
|
||
River* river = FB_NEW_RPT(*tdbb->getDefaultPool(), i) River();
|
||
river->riv_count = (UCHAR) i;
|
||
river->riv_rsb = rsb;
|
||
MOVE_FAST(local_streams + 1, river->riv_streams, i);
|
||
// AB: Save all inner-part streams
|
||
if (rse->rse_jointype == blr_inner ||
|
||
(rse->rse_jointype == blr_left && (ptr - rse->rse_relation)==0))
|
||
{
|
||
find_used_streams(rsb, sub_streams);
|
||
}
|
||
set_made_river(opt, river);
|
||
set_inactive(opt, river);
|
||
rivers_stack.push(river);
|
||
continue;
|
||
}
|
||
|
||
// we have found a base relation; record its stream
|
||
// number in the streams array as a candidate for
|
||
// merging into a river
|
||
|
||
// TMN: Is the intention really to allow streams[0] to overflow?
|
||
// I must assume that is indeed not the intention (not to mention
|
||
// it would make code later on fail), so I added the following fb_assert.
|
||
fb_assert(streams[0] < MAX_STREAMS && streams[0] < MAX_UCHAR);
|
||
|
||
++streams[0];
|
||
*p++ = (UCHAR) stream;
|
||
|
||
if (rse->rse_jointype == blr_left) {
|
||
fb_assert(outer_streams[0] < MAX_STREAMS && outer_streams[0] < MAX_UCHAR);
|
||
outer_streams[++outer_streams[0]] = stream;
|
||
}
|
||
|
||
// if we have seen any booleans or sort fields, we may be able to
|
||
// use an index to optimize them; retrieve the current format of
|
||
// all indices at this time so we can determine if it's possible
|
||
// AB: if a parent_stack was available and conjunct_count was 0
|
||
// then no indices where retrieved. Added also OR check on
|
||
// parent_stack below. SF BUG # [ 508594 ]
|
||
|
||
if (conjunct_count || sort || project || aggregate || parent_stack)
|
||
{
|
||
jrd_rel* relation = (jrd_rel*) node->nod_arg[e_rel_relation];
|
||
if (relation && !relation->rel_file)
|
||
{
|
||
csb->csb_rpt[stream].csb_indices =
|
||
BTR_all(tdbb, relation,
|
||
&csb->csb_rpt[stream].csb_idx);
|
||
sort_indices_by_selectivity(&csb->csb_rpt[stream]);
|
||
mark_indices(&csb->csb_rpt[stream], relation->rel_id);
|
||
}
|
||
else
|
||
csb->csb_rpt[stream].csb_indices = 0;
|
||
}
|
||
}
|
||
|
||
// this is an attempt to make sure we have a large enough cache to
|
||
// efficiently retrieve this query; make sure the cache has a minimum
|
||
// number of pages for each stream in the RecordSelExpr (the number is just a guess)
|
||
if (streams[0] > 5) {
|
||
CCH_expand(tdbb, (ULONG) (streams[0] * CACHE_PAGES_PER_STREAM));
|
||
}
|
||
|
||
// At this point we are ready to start optimizing.
|
||
// We will use the opt block to hold information of
|
||
// a global nature, meaning that it needs to stick
|
||
// around for the rest of the optimization process.
|
||
|
||
// Set base-point before the parent/distributed nodes begin.
|
||
opt->opt_base_conjuncts = (SSHORT) conjunct_count;
|
||
|
||
// AB: Add parent conjunctions to conjunct_stack, keep in mind
|
||
// the outer-streams! For outer streams put missing (IS NULL)
|
||
// conjunctions in the missingStack.
|
||
SLONG distributed_count = 0;
|
||
NodeStack missingStack;
|
||
if (parent_stack && parent_stack->getCount())
|
||
{
|
||
NodeStack::iterator iter(*parent_stack);
|
||
for (; iter.hasData() && conjunct_count < MAX_CONJUNCTS; ++iter)
|
||
{
|
||
jrd_nod* node = iter.object();
|
||
if ((rse->rse_jointype != blr_inner) &&
|
||
expression_contains(node, nod_missing))
|
||
{
|
||
// parent missing conjunctions shouldn't be
|
||
// distributed to FULL OUTER JOIN streams at all
|
||
if (rse->rse_jointype != blr_full)
|
||
{
|
||
missingStack.push(node);
|
||
}
|
||
}
|
||
else
|
||
{
|
||
conjunct_stack.push(node);
|
||
conjunct_count++;
|
||
}
|
||
}
|
||
// We've now merged parent, try again to make more conjunctions.
|
||
distributed_count = distribute_equalities(conjunct_stack, csb, conjunct_count);
|
||
conjunct_count += distributed_count;
|
||
}
|
||
// The newly created conjunctions belong to the base conjunctions.
|
||
// After them are starting the parent conjunctions.
|
||
opt->opt_base_parent_conjuncts = opt->opt_base_conjuncts + (SSHORT) distributed_count;
|
||
|
||
// Set base-point before the parent IS NULL nodes begin
|
||
opt->opt_base_missing_conjuncts = (SSHORT) conjunct_count;
|
||
|
||
// Check if size of optimizer block exceeded.
|
||
if (conjunct_count > MAX_CONJUNCTS)
|
||
{
|
||
ERR_post(isc_optimizer_blk_exc, 0);
|
||
// Msg442: size of optimizer block exceeded
|
||
}
|
||
|
||
// Put conjunctions in opt structure.
|
||
// Note that it's a stack and we get the nodes in reversed order from the stack.
|
||
opt->opt_conjuncts.grow(conjunct_count);
|
||
SSHORT i, j, nodeBase;
|
||
for (i = conjunct_count; i > 0; i--)
|
||
{
|
||
jrd_nod* node = conjunct_stack.pop();
|
||
|
||
if (i == opt->opt_base_conjuncts)
|
||
{
|
||
// The base conjunctions.
|
||
j = 0;
|
||
nodeBase = 0;
|
||
}
|
||
else if (i == conjunct_count)
|
||
{
|
||
// The new conjunctions created by "distribution" from the stack.
|
||
j = 0;
|
||
nodeBase = opt->opt_base_conjuncts;
|
||
}
|
||
else if (i == (conjunct_count - distributed_count))
|
||
{
|
||
// The parent conjunctions.
|
||
j = 0;
|
||
nodeBase = opt->opt_base_conjuncts + distributed_count;
|
||
}
|
||
|
||
opt->opt_conjuncts[nodeBase + j].opt_conjunct_node = node;
|
||
compute_dependencies(node, opt->opt_conjuncts[nodeBase + j].opt_dependencies);
|
||
j++;
|
||
}
|
||
|
||
// Put the parent missing nodes on the stack.
|
||
for (i = 0; (i < missingStack.getCount()) && (conjunct_count < MAX_CONJUNCTS); i++)
|
||
{
|
||
opt->opt_conjuncts.grow(conjunct_count + 1);
|
||
jrd_nod* node = missingStack.pop();
|
||
opt->opt_conjuncts[conjunct_count].opt_conjunct_node = node;
|
||
compute_dependencies(node,
|
||
opt->opt_conjuncts[conjunct_count].opt_dependencies);
|
||
conjunct_count++;
|
||
}
|
||
|
||
// attempt to optimize aggregates via an index, if possible
|
||
if (aggregate && !sort && !project) {
|
||
sort = aggregate;
|
||
}
|
||
else {
|
||
rse->rse_aggregate = aggregate = NULL;
|
||
}
|
||
|
||
// AB: Mark the previous used streams (sub-RecordSelExpr's) as active
|
||
for (i = 1; i <= sub_streams[0]; i++) {
|
||
csb->csb_rpt[sub_streams[i]].csb_flags |= csb_active;
|
||
}
|
||
|
||
// outer joins require some extra processing
|
||
if (rse->rse_jointype != blr_inner) {
|
||
rsb = gen_outer(tdbb, opt, rse, rivers_stack, &sort, &project);
|
||
}
|
||
else {
|
||
bool sort_present = (sort);
|
||
bool outer_rivers = false;
|
||
jrd_nod* const saved_sort_node = sort;
|
||
|
||
// AB: If previous rsb's are already on the stack we can't use
|
||
// an navigational-retrieval for an ORDER BY cause the next
|
||
// streams are JOINed to the previous ones
|
||
if (rivers_stack.hasData()) {
|
||
sort = NULL;
|
||
outer_rivers = true;
|
||
// AB: We could already have multiple rivers at this
|
||
// point so try to do some sort/merging now.
|
||
while (rivers_stack.hasMore(1)
|
||
&& gen_sort_merge(tdbb, opt, rivers_stack));
|
||
// AB: Mark the previous used streams (sub-RecordSelExpr's) again
|
||
// as active, because an SORT/MERGE could reset the flags
|
||
for (i = 1; i <= sub_streams[0]; i++) {
|
||
csb->csb_rpt[sub_streams[i]].csb_flags |= csb_active;
|
||
}
|
||
}
|
||
|
||
// attempt to form joins in decreasing order of desirability
|
||
fb_assert(streams[0] != 1 || csb->csb_rpt[streams[1]].csb_relation != 0);
|
||
gen_join(tdbb, opt, streams, rivers_stack, &sort, &project,
|
||
rse->rse_plan);
|
||
|
||
// If there are multiple rivers, try some sort/merging
|
||
while (rivers_stack.hasMore(1)
|
||
&& gen_sort_merge(tdbb, opt, rivers_stack));
|
||
|
||
rsb = make_cross(tdbb, opt, rivers_stack);
|
||
|
||
// AB: When we have a merge then a previous made ordering with
|
||
// an index doesn't guarantee that the result will be in that
|
||
// order. So we assigned the sort node back.
|
||
// SF BUG # [ 221921 ] ORDER BY has no effect
|
||
RecordSource* test_rsb = rsb;
|
||
if ((rsb) && (rsb->rsb_type == rsb_boolean) && (rsb->rsb_next)) {
|
||
test_rsb = rsb->rsb_next;
|
||
}
|
||
if ((sort_present && outer_rivers) ||
|
||
((test_rsb) && (test_rsb->rsb_type == rsb_merge) && !sort && sort_present)) {
|
||
sort = saved_sort_node;
|
||
}
|
||
|
||
// Pick up any residual boolean that may have fallen thru the cracks
|
||
rsb = gen_residual_boolean(tdbb, opt, rsb);
|
||
}
|
||
|
||
// if the aggregate was not optimized via an index, get rid of the
|
||
// sort and flag the fact to the calling routine
|
||
if (aggregate && sort) {
|
||
rse->rse_aggregate = NULL;
|
||
sort = NULL;
|
||
}
|
||
|
||
// check index usage in all the base streams to ensure
|
||
// that any user-specified access plan is followed
|
||
|
||
for (i = 1; i <= streams[0]; i++) {
|
||
check_indices(&csb->csb_rpt[streams[i]]);
|
||
}
|
||
|
||
if (project || sort) {
|
||
// Eliminate any duplicate dbkey streams
|
||
const UCHAR* const b_end = beds + beds[0];
|
||
const UCHAR* const k_end = key_streams + key_streams[0];
|
||
UCHAR* k = &key_streams[1];
|
||
for (const UCHAR* p2 = k; p2 <= k_end; p2++) {
|
||
const UCHAR* q = &beds[1];
|
||
while (q <= b_end && *q != *p2) {
|
||
q++;
|
||
}
|
||
if (q > b_end) {
|
||
*k++ = *p2;
|
||
}
|
||
}
|
||
key_streams[0] = k - &key_streams[1];
|
||
|
||
// Handle project clause, if present.
|
||
if (project) {
|
||
rsb = gen_sort(tdbb, opt, beds, key_streams, rsb, project, true);
|
||
}
|
||
|
||
// Handle sort clause if present
|
||
if (sort) {
|
||
rsb = gen_sort(tdbb, opt, beds, key_streams, rsb, sort, false);
|
||
}
|
||
}
|
||
|
||
// Handle first and/or skip. The skip MUST (if present)
|
||
// appear in the rsb list AFTER the first. Since the gen_first and gen_skip
|
||
// functions add their nodes at the beginning of the rsb list we MUST call
|
||
// gen_skip before gen_first.
|
||
//
|
||
|
||
if (rse->rse_skip) {
|
||
rsb = gen_skip(tdbb, opt, rsb, rse->rse_skip);
|
||
}
|
||
|
||
if (rse->rse_first) {
|
||
rsb = gen_first(tdbb, opt, rsb, rse->rse_first);
|
||
}
|
||
|
||
// release memory allocated for index descriptions
|
||
for (i = 0; i < streams[0]; i++) {
|
||
stream = streams[i + 1];
|
||
delete csb->csb_rpt[stream].csb_idx;
|
||
csb->csb_rpt[stream].csb_idx = 0;
|
||
|
||
// CVC: The following line added because OPT_compile is recursive, both directly
|
||
// and through gen_union(), too. Otherwise, we happen to step on deallocated memory
|
||
// and this is the cause of the crashes with indices that have plagued IB since v4.
|
||
|
||
csb->csb_rpt[stream].csb_indices = 0;
|
||
}
|
||
|
||
DEBUG
|
||
// free up memory for optimizer structures
|
||
delete opt;
|
||
|
||
#ifdef OPT_DEBUG
|
||
if (opt_debug_file) {
|
||
fflush(opt_debug_file);
|
||
//fclose(opt_debug_file);
|
||
//opt_debug_file = 0;
|
||
}
|
||
#endif
|
||
|
||
} // try
|
||
catch (const std::exception&) {
|
||
for (SSHORT i = 0; i < streams[0]; i++) {
|
||
const SSHORT stream = streams[i + 1];
|
||
delete csb->csb_rpt[stream].csb_idx;
|
||
csb->csb_rpt[stream].csb_idx = 0;
|
||
csb->csb_rpt[stream].csb_indices = 0; // Probably needed to be safe
|
||
}
|
||
delete opt;
|
||
throw;
|
||
}
|
||
|
||
if (rse->rse_writelock)
|
||
rsb->rsb_flags |= rsb_writelock;
|
||
|
||
// Assign pointer to list of dependent invariant values
|
||
rsb->rsb_invariants = rse->rse_invariants;
|
||
|
||
return rsb;
|
||
}
|
||
|
||
|
||
jrd_nod* OPT_make_dbkey(OptimizerBlk* opt, jrd_nod* boolean, USHORT stream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* O P T _ m a k e _ d b k e y
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* If boolean is an equality comparison on the proper dbkey,
|
||
* make a "bit_dbkey" operator (makes bitmap out of dbkey
|
||
* expression.
|
||
*
|
||
* This is a little hairy, since view dbkeys are expressed as
|
||
* concatenations of primitive dbkeys.
|
||
*
|
||
**************************************/
|
||
thread_db* tdbb = JRD_get_thread_data();
|
||
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
|
||
/* If this isn't an equality, it isn't even interesting */
|
||
|
||
if (boolean->nod_type != nod_eql)
|
||
return NULL;
|
||
|
||
/* Find the side of the equality that is potentially a dbkey. If
|
||
neither, make the obvious deduction */
|
||
|
||
jrd_nod* dbkey = boolean->nod_arg[0];
|
||
jrd_nod* value = boolean->nod_arg[1];
|
||
SLONG n = 0;
|
||
|
||
if (dbkey->nod_type != nod_dbkey && dbkey->nod_type != nod_concatenate)
|
||
{
|
||
if (value->nod_type != nod_dbkey &&
|
||
value->nod_type != nod_concatenate)
|
||
{
|
||
return NULL;
|
||
}
|
||
dbkey = value;
|
||
value = boolean->nod_arg[0];
|
||
}
|
||
|
||
/* If the value isn't computable, this has been a waste of time */
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
if (!computable(csb, value, stream, false, false)) {
|
||
return NULL;
|
||
}
|
||
|
||
/* If this is a concatenation, find an appropriate dbkey */
|
||
|
||
if (dbkey->nod_type == nod_concatenate) {
|
||
dbkey = find_dbkey(dbkey, stream, &n);
|
||
if (!dbkey) {
|
||
return NULL;
|
||
}
|
||
}
|
||
|
||
/* Make sure we have the correct stream */
|
||
|
||
if ((USHORT)(IPTR) dbkey->nod_arg[0] != stream)
|
||
return NULL;
|
||
|
||
/* If this is a dbkey for the appropriate stream, it's invertable */
|
||
|
||
dbkey = PAR_make_node(tdbb, 2);
|
||
dbkey->nod_count = 1;
|
||
dbkey->nod_type = nod_bit_dbkey;
|
||
dbkey->nod_arg[0] = value;
|
||
dbkey->nod_arg[1] = (jrd_nod*) (IPTR) n;
|
||
dbkey->nod_impure = CMP_impure(csb, sizeof(impure_inversion));
|
||
|
||
return dbkey;
|
||
}
|
||
|
||
|
||
jrd_nod* OPT_make_index(thread_db* tdbb, OptimizerBlk* opt, jrd_rel* relation,
|
||
index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* O P T _ m a k e _ i n d e x
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Build node for index scan.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(relation, type_rel);
|
||
|
||
/* Allocate both a index retrieval node and block. */
|
||
|
||
jrd_nod* node = make_index_node(tdbb, relation, opt->opt_csb, idx);
|
||
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
|
||
retrieval->irb_relation = relation;
|
||
|
||
/* Pick up lower bound segment values */
|
||
|
||
jrd_nod** lower = retrieval->irb_value;
|
||
jrd_nod** upper = retrieval->irb_value + idx->idx_count;
|
||
const OptimizerBlk::opt_segment* const end = opt->opt_segments + idx->idx_count;
|
||
OptimizerBlk::opt_segment* tail;
|
||
|
||
if (idx->idx_flags & idx_descending) {
|
||
for (tail = opt->opt_segments; tail->opt_lower && tail < end; tail++)
|
||
*upper++ = tail->opt_lower;
|
||
for (tail = opt->opt_segments; tail->opt_upper && tail < end; tail++)
|
||
*lower++ = tail->opt_upper;
|
||
retrieval->irb_generic |= irb_descending;
|
||
}
|
||
else {
|
||
for (tail = opt->opt_segments; tail->opt_lower && tail < end; tail++)
|
||
*lower++ = tail->opt_lower;
|
||
for (tail = opt->opt_segments; tail->opt_upper && tail < end; tail++)
|
||
*upper++ = tail->opt_upper;
|
||
}
|
||
|
||
retrieval->irb_lower_count = lower - retrieval->irb_value;
|
||
retrieval->irb_upper_count =
|
||
(upper - retrieval->irb_value) - idx->idx_count;
|
||
|
||
bool equiv = false;
|
||
|
||
for (tail = opt->opt_segments; tail->opt_match && tail < end; tail++)
|
||
{
|
||
if (tail->opt_match->nod_type == nod_equiv)
|
||
{
|
||
equiv = true;
|
||
break;
|
||
}
|
||
}
|
||
|
||
// This index is never used for IS NULL, thus we can ignore NULLs
|
||
// already at index scan. But this rule doesn't apply to nod_equiv
|
||
// which requires NULLs to be found in the index.
|
||
if (!equiv)
|
||
{
|
||
retrieval->irb_generic |= irb_ignore_null_value_key;
|
||
}
|
||
|
||
/* Check to see if this is really an equality retrieval */
|
||
|
||
if (retrieval->irb_lower_count == retrieval->irb_upper_count) {
|
||
retrieval->irb_generic |= irb_equality;
|
||
lower = retrieval->irb_value;
|
||
upper = retrieval->irb_value + idx->idx_count;
|
||
for (const jrd_nod* const* const end_node = lower + retrieval->irb_lower_count;
|
||
lower < end_node;)
|
||
{
|
||
if (*upper++ != *lower++) {
|
||
retrieval->irb_generic &= ~irb_equality;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
|
||
/* If we are matching less than the full index, this is a partial match */
|
||
|
||
if (retrieval->irb_upper_count < idx->idx_count)
|
||
retrieval->irb_generic |= irb_partial;
|
||
|
||
/* mark the index as utilized for the purposes of this compile */
|
||
|
||
idx->idx_runtime_flags |= idx_used;
|
||
|
||
return node;
|
||
}
|
||
|
||
|
||
int OPT_match_index(OptimizerBlk* opt, USHORT stream, index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* O P T _ m a t c h _ i n d e x
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Match any active (computable but not consumed) boolean
|
||
* conjunctions against a given index. This is used by
|
||
* the external relation modules to do index optimization.
|
||
* Return the number of matching items.
|
||
*
|
||
**************************************/
|
||
thread_db* tdbb = JRD_get_thread_data();
|
||
DEV_BLKCHK(opt, type_opt);
|
||
|
||
/* If there are not conjunctions, don't waste our time */
|
||
|
||
if (!opt->opt_base_conjuncts) {
|
||
return 0;
|
||
}
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
const OptimizerBlk::opt_conjunct* const opt_end =
|
||
opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
|
||
USHORT n = 0;
|
||
clear_bounds(opt, idx);
|
||
|
||
for (OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
|
||
tail < opt_end; tail++)
|
||
{
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
|
||
&& computable(csb, node, -1, true, false))
|
||
{
|
||
n += match_index(tdbb, opt, stream, node, idx);
|
||
}
|
||
}
|
||
|
||
return n; // implicit USHORT -> int
|
||
}
|
||
|
||
|
||
#ifdef PC_ENGINE
|
||
void OPT_set_index(thread_db* tdbb,
|
||
jrd_req* request, RecordSource** rsb_ptr, jrd_rel* relation, index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* O P T _ s e t _ i n d e x
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Reset the navigational order of a stream.
|
||
* Given a sequential or navigational rsb,
|
||
* reset the rsb to be a navigational rsb
|
||
* on the specified index.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(request, type_req);
|
||
DEV_BLKCHK(*rsb_ptr, type_rsb);
|
||
DEV_BLKCHK(relation, type_rel);
|
||
|
||
SET_TDBB(tdbb);
|
||
Database* dbb = tdbb->tdbb_database;
|
||
|
||
RecordSource* old_rsb = *rsb_ptr;
|
||
|
||
/* fix up a boolean rsb to point to the actual stream rsb */
|
||
|
||
if (old_rsb->rsb_type == rsb_boolean) {
|
||
rsb_ptr = &old_rsb->rsb_next;
|
||
old_rsb = old_rsb->rsb_next;
|
||
}
|
||
|
||
/* check if there is an existing inversion for
|
||
a boolean expression mapped to an index */
|
||
jrd_nod* inversion = NULL;
|
||
if (old_rsb->rsb_type == rsb_indexed) {
|
||
inversion = (jrd_nod*) old_rsb->rsb_arg[0];
|
||
}
|
||
else if (old_rsb->rsb_type == rsb_navigate) {
|
||
inversion = (jrd_nod*) old_rsb->rsb_arg[RSB_NAV_inversion];
|
||
}
|
||
|
||
/* set up a dummy optimizer block just for the purposes
|
||
of the set index, to pass information to subroutines */
|
||
|
||
OptimizerBlk* opt = FB_NEW(*tdbb->getDefaultPool()) OptimizerBlk(tdbb->getDefaultPool());
|
||
opt->opt_g_flags |= opt_g_stream;
|
||
|
||
/* generate a new rsb for the retrieval, making sure to
|
||
preserve the inversion generated for the last rsb; note
|
||
that if the bitmap for the inversion has already been
|
||
generated, it will be reused since it is already part of
|
||
the impure area--I can't think of any reason not to reuse it--deej */
|
||
RecordSource* new_rsb;
|
||
if (idx) {
|
||
new_rsb = gen_nav_rsb(tdbb, opt, old_rsb->rsb_stream, relation, 0, idx
|
||
#ifdef SCROLLABLE_CURSORS
|
||
, RSE_get_forward
|
||
#endif
|
||
);
|
||
new_rsb->rsb_arg[RSB_NAV_inversion] = (RecordSource*) inversion;
|
||
new_rsb->rsb_cardinality = old_rsb->rsb_cardinality;
|
||
}
|
||
else {
|
||
new_rsb = gen_rsb(tdbb, opt, 0, inversion, old_rsb->rsb_stream,
|
||
relation, 0, 0, (float) old_rsb->rsb_cardinality);
|
||
}
|
||
|
||
/* point the impure area of the new rsb to the impure area of the
|
||
old; since impure area is pre-allocated it would be difficult
|
||
to change now, so just use the same area; NOTE: this implies
|
||
that we must take some pains to ensure that the impure area is
|
||
always large enough to handle a maximum-key index */
|
||
|
||
new_rsb->rsb_impure = old_rsb->rsb_impure;
|
||
|
||
/* find index node if the old rsb was navigational */
|
||
|
||
jrd_nod* index_node = NULL;
|
||
if (old_rsb->rsb_type == rsb_navigate) {
|
||
index_node = (jrd_nod*) old_rsb->rsb_arg[RSB_NAV_index];
|
||
}
|
||
|
||
/* if the new rsb is navigational, set up impure space in request
|
||
for new index node; to convert from non-navigational to navigational,
|
||
we need to adjust the impure area upwards to make room for an impure_inversion
|
||
structure, and vice versa to convert the other way */
|
||
|
||
if (idx) {
|
||
jrd_nod* new_index_node = (jrd_nod*) new_rsb->rsb_arg[RSB_NAV_index];
|
||
if (old_rsb->rsb_type == rsb_navigate)
|
||
new_index_node->nod_impure = index_node->nod_impure;
|
||
else {
|
||
new_index_node->nod_impure = old_rsb->rsb_impure;
|
||
new_rsb->rsb_impure += sizeof(impure_inversion);
|
||
}
|
||
}
|
||
else if (old_rsb->rsb_type == rsb_navigate) {
|
||
new_rsb->rsb_impure -= sizeof(impure_inversion);
|
||
}
|
||
|
||
/* if there was a previous index, release its lock
|
||
and remove its resource from the request */
|
||
|
||
if (old_rsb->rsb_type == rsb_navigate) {
|
||
IndexRetrieval* retrieval =
|
||
(IndexRetrieval*) index_node->nod_arg[e_idx_retrieval];
|
||
const USHORT index_id = retrieval->irb_index;
|
||
IndexLock* index = CMP_get_index_lock(tdbb, relation, index_id);
|
||
if (index) {
|
||
if (index->idl_count)
|
||
--index->idl_count;
|
||
if (!index->idl_count) {
|
||
LCK_release(tdbb, index->idl_lock);
|
||
}
|
||
}
|
||
CMP_release_resource(&request->req_resources, Resource::rsc_index, index_id);
|
||
}
|
||
|
||
/* get lock on new index */
|
||
|
||
if (idx) {
|
||
IndexLock* index = CMP_get_index_lock(tdbb, relation, idx->idx_id);
|
||
if (index) {
|
||
if (!index->idl_count) {
|
||
LCK_lock_non_blocking(tdbb, index->idl_lock, LCK_SR, LCK_WAIT);
|
||
}
|
||
++index->idl_count;
|
||
}
|
||
}
|
||
|
||
/* go out to the vector which stores all rsbs for the
|
||
request, and replace the old with the new */
|
||
|
||
for (size_t i = 0; i < request->req_fors.getCount(); i++) {
|
||
if (request->req_fors[i] == old_rsb) {
|
||
request->req_fors[i] = new_rsb;
|
||
break;
|
||
}
|
||
}
|
||
|
||
/* release unneeded blocks */
|
||
|
||
delete opt;
|
||
if (index_node) {
|
||
delete index_node;
|
||
}
|
||
delete old_rsb;
|
||
|
||
*rsb_ptr = new_rsb;
|
||
}
|
||
#endif
|
||
|
||
|
||
static bool augment_stack(jrd_nod* node, NodeStack& stack)
|
||
{
|
||
/**************************************
|
||
*
|
||
* a u g m e n t _ s t a c k
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Add node to stack unless node is already on stack.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
for (NodeStack::const_iterator temp(stack); temp.hasData(); ++temp) {
|
||
if (node_equality(node, temp.object())) {
|
||
return false;
|
||
}
|
||
}
|
||
|
||
stack.push(node);
|
||
|
||
return true;
|
||
}
|
||
|
||
|
||
static UINT64 calculate_priority_level(const OptimizerBlk* opt, const index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c a l c u l a t e _ p r i o r i t y _ l e v e l
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Return an calculated value based on
|
||
* how nodes where matched on the index.
|
||
* Before calling this function the
|
||
* match_index function must be called first!
|
||
*
|
||
**************************************/
|
||
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
|
||
|
||
// Count how many fields can be used in this index and
|
||
// count the maximum equals that matches at the begin.
|
||
USHORT idx_eql_count = 0;
|
||
USHORT idx_field_count = 0;
|
||
const OptimizerBlk::opt_segment* idx_tail = opt->opt_segments;
|
||
const OptimizerBlk::opt_segment* const idx_end = idx_tail + idx->idx_count;
|
||
for (;idx_tail < idx_end &&
|
||
(idx_tail->opt_lower || idx_tail->opt_upper); idx_tail++)
|
||
{
|
||
idx_field_count++;
|
||
const jrd_nod* node = idx_tail->opt_match;
|
||
if (node->nod_type == nod_eql) {
|
||
idx_eql_count++;
|
||
}
|
||
else {
|
||
break;
|
||
}
|
||
}
|
||
|
||
// Note: dbb->dbb_max_idx = 1022 for the largest supported page of 16K and
|
||
// 62 for the smallest page of 1K
|
||
const UINT64 max_idx = JRD_get_thread_data()->tdbb_database->dbb_max_idx + 1;
|
||
UINT64 unique_prefix = 0;
|
||
if ((idx->idx_flags & idx_unique) && (idx_eql_count == idx->idx_count)) {
|
||
unique_prefix = (max_idx - idx->idx_count) * max_idx * max_idx * max_idx;
|
||
}
|
||
// Calculate our priority level.
|
||
return unique_prefix + ((idx_eql_count * max_idx * max_idx) +
|
||
(idx_field_count * max_idx) + (max_idx - idx->idx_count));
|
||
|
||
}
|
||
else {
|
||
return LOWEST_PRIORITY_LEVEL;
|
||
}
|
||
}
|
||
|
||
|
||
static void check_indices(const CompilerScratch::csb_repeat* csb_tail)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c h e c k _ i n d i c e s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Check to make sure that the user-specified
|
||
* indices were actually utilized by the optimizer.
|
||
*
|
||
**************************************/
|
||
thread_db* tdbb = JRD_get_thread_data();
|
||
|
||
const jrd_nod* plan = csb_tail->csb_plan;
|
||
if (!plan) {
|
||
return;
|
||
}
|
||
|
||
if (plan->nod_type != nod_retrieve) {
|
||
return;
|
||
}
|
||
|
||
const jrd_rel* relation = csb_tail->csb_relation;
|
||
|
||
/* if there were no indices fetched at all but the
|
||
user specified some, error out using the first
|
||
index specified */
|
||
const jrd_nod* access_type = 0;
|
||
if (!csb_tail->csb_indices &&
|
||
(access_type = plan->nod_arg[e_retrieve_access_type]))
|
||
{
|
||
/* index %s cannot be used in the specified plan */
|
||
ERR_post(isc_index_unused, isc_arg_string, access_type->nod_arg[2],
|
||
0);
|
||
}
|
||
|
||
/* check to make sure that all indices are either used or marked not to be used,
|
||
and that there are no unused navigational indices */
|
||
SqlIdentifier index_name;
|
||
|
||
const index_desc* idx = csb_tail->csb_idx->items;
|
||
for (USHORT i = 0; i < csb_tail->csb_indices; i++) {
|
||
if (!(idx->idx_runtime_flags & (idx_plan_dont_use | idx_used)) ||
|
||
((idx->idx_runtime_flags & idx_plan_navigate)
|
||
&& !(idx->idx_runtime_flags & idx_navigate)))
|
||
{
|
||
if (!
|
||
(idx->idx_runtime_flags &
|
||
(idx_plan_missing | idx_plan_starts)))
|
||
{
|
||
if (relation) {
|
||
MET_lookup_index(tdbb, index_name, relation->rel_name,
|
||
(USHORT) (idx->idx_id + 1));
|
||
}
|
||
else {
|
||
index_name[0] = 0;
|
||
}
|
||
|
||
/* index %s cannot be used in the specified plan */
|
||
ERR_post(isc_index_unused, isc_arg_string,
|
||
ERR_cstring(index_name), 0);
|
||
}
|
||
}
|
||
++idx;
|
||
}
|
||
}
|
||
|
||
|
||
static bool check_relationship(const OptimizerBlk* opt, USHORT position, USHORT stream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c h e c k _ r e l a t i o n s h i p
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Check for a potential indexed relationship.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
|
||
const OptimizerBlk::opt_stream* tail = opt->opt_streams.begin();
|
||
for (const OptimizerBlk::opt_stream* const end = tail + position; tail < end; tail++)
|
||
{
|
||
const USHORT n = tail->opt_stream_number;
|
||
for (const IndexedRelationship* relationship = opt->opt_streams[n].opt_relationships;
|
||
relationship;
|
||
relationship = relationship->irl_next)
|
||
{
|
||
if (stream == relationship->irl_stream) {
|
||
return true;
|
||
}
|
||
}
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
|
||
static void check_sorts(RecordSelExpr* rse)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c h e c k _ s o r t s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Try to optimize out unnecessary sorting.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(rse, type_nod);
|
||
|
||
jrd_nod* sort = rse->rse_sorted;
|
||
jrd_nod* project = rse->rse_projection;
|
||
|
||
// check if a GROUP BY exists using the same fields as the project or sort:
|
||
// if so, the projection can be eliminated; if no projection exists, then
|
||
// the sort can be eliminated.
|
||
|
||
jrd_nod *group, *sub_rse;
|
||
if ((project || sort) &&
|
||
(rse->rse_count == 1) &&
|
||
(sub_rse = rse->rse_relation[0]) &&
|
||
(sub_rse->nod_type == nod_aggregate) &&
|
||
(group = sub_rse->nod_arg[e_agg_group]))
|
||
{
|
||
// if all the fields of the project are the same as all the fields
|
||
// of the group by, get rid of the project.
|
||
|
||
if (project && (project->nod_count == group->nod_count)) {
|
||
jrd_nod** project_ptr = project->nod_arg;
|
||
const jrd_nod* const* const project_end = project_ptr + project->nod_count;
|
||
for (; project_ptr < project_end; project_ptr++)
|
||
{
|
||
const jrd_nod* const* group_ptr = group->nod_arg;
|
||
const jrd_nod* const* const group_end = group_ptr + group->nod_count;
|
||
for (; group_ptr < group_end; group_ptr++)
|
||
{
|
||
if (map_equal(*group_ptr, *project_ptr, sub_rse->nod_arg[e_agg_map])) {
|
||
break;
|
||
}
|
||
}
|
||
if (group_ptr == group_end) {
|
||
break;
|
||
}
|
||
}
|
||
|
||
// we can now ignore the project, but in case the project is being done
|
||
// in descending order because of an order by, do the group by the same way.
|
||
if (project_ptr == project_end) {
|
||
set_direction(project, group);
|
||
project = rse->rse_projection = NULL;
|
||
}
|
||
}
|
||
|
||
// if there is no projection, then we can make a similar optimization
|
||
// for sort, except that sort may have fewer fields than group by.
|
||
if (!project && sort && (sort->nod_count <= group->nod_count)) {
|
||
const jrd_nod* const* sort_ptr = sort->nod_arg;
|
||
const jrd_nod* const* const sort_end = sort_ptr + sort->nod_count;
|
||
for (; sort_ptr < sort_end; sort_ptr++)
|
||
{
|
||
const jrd_nod* const* group_ptr = group->nod_arg;
|
||
const jrd_nod* const* const group_end = group_ptr + sort->nod_count;
|
||
for (; group_ptr < group_end; group_ptr++)
|
||
{
|
||
if (map_equal(*group_ptr, *sort_ptr, sub_rse->nod_arg[e_agg_map])) {
|
||
break;
|
||
}
|
||
}
|
||
if (group_ptr == group_end) {
|
||
break;
|
||
}
|
||
}
|
||
|
||
// if all the fields in the sort list match the first n fields in the
|
||
// project list, we can ignore the sort, but update the sort order
|
||
// (ascending/descending) to match that in the sort list
|
||
|
||
if (sort_ptr == sort_end) {
|
||
set_direction(sort, group);
|
||
set_position(sort, group, sub_rse->nod_arg[e_agg_map]);
|
||
sort = rse->rse_sorted = NULL;
|
||
}
|
||
}
|
||
|
||
}
|
||
|
||
// examine the ORDER BY and DISTINCT clauses; if all the fields in the
|
||
// ORDER BY match the first n fields in the DISTINCT in any order, the
|
||
// ORDER BY can be removed, changing the fields in the DISTINCT to match
|
||
// the ordering of fields in the ORDER BY.
|
||
|
||
if (sort && project && (sort->nod_count <= project->nod_count)) {
|
||
const jrd_nod* const* sort_ptr = sort->nod_arg;
|
||
const jrd_nod* const* const sort_end = sort_ptr + sort->nod_count;
|
||
for (; sort_ptr < sort_end; sort_ptr++)
|
||
{
|
||
const jrd_nod* const* project_ptr = project->nod_arg;
|
||
const jrd_nod* const* const project_end = project_ptr + sort->nod_count;
|
||
for (; project_ptr < project_end; project_ptr++)
|
||
{
|
||
if ((*sort_ptr)->nod_type == nod_field
|
||
&& (*project_ptr)->nod_type == nod_field
|
||
&& (*sort_ptr)->nod_arg[e_fld_stream] ==
|
||
(*project_ptr)->nod_arg[e_fld_stream]
|
||
&& (*sort_ptr)->nod_arg[e_fld_id] ==
|
||
(*project_ptr)->nod_arg[e_fld_id])
|
||
{
|
||
break;
|
||
}
|
||
}
|
||
|
||
if (project_ptr == project_end) {
|
||
break;
|
||
}
|
||
}
|
||
|
||
// if all the fields in the sort list match the first n fields
|
||
// in the project list, we can ignore the sort, but update
|
||
// the project to match the sort.
|
||
if (sort_ptr == sort_end) {
|
||
set_direction(sort, project);
|
||
set_position(sort, project, NULL);
|
||
sort = rse->rse_sorted = NULL;
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
static void class_mask(USHORT count, jrd_nod** eq_class, ULONG* mask)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c l a s s _ m a s k
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Given an sort/merge join equivalence class (vector of node pointers
|
||
* of representative values for rivers), return a bit mask of rivers
|
||
* with values.
|
||
*
|
||
**************************************/
|
||
#ifdef DEV_BUILD
|
||
if (*eq_class) {
|
||
DEV_BLKCHK(*eq_class, type_nod);
|
||
}
|
||
#endif
|
||
|
||
if (count > MAX_CONJUNCTS) {
|
||
ERR_post(isc_optimizer_blk_exc, 0);
|
||
/* Msg442: size of optimizer block exceeded */
|
||
}
|
||
|
||
SLONG i;
|
||
for (i = 0; i < OPT_STREAM_BITS; i++) {
|
||
mask[i] = 0;
|
||
}
|
||
|
||
for (i = 0; i < count; i++, eq_class++) {
|
||
if (*eq_class) {
|
||
SET_DEP_BIT(mask, i);
|
||
DEV_BLKCHK(*eq_class, type_nod);
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
static void clear_bounds(OptimizerBlk* opt, const index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c l e a r _ b o u n d s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Clear upper and lower value slots before matching booleans to
|
||
* indices.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
|
||
const OptimizerBlk::opt_segment* const opt_end = &opt->opt_segments[idx->idx_count];
|
||
|
||
for (OptimizerBlk::opt_segment* tail = opt->opt_segments; tail < opt_end; tail++) {
|
||
tail->opt_lower = NULL;
|
||
tail->opt_upper = NULL;
|
||
tail->opt_match = NULL;
|
||
}
|
||
}
|
||
|
||
|
||
static jrd_nod* compose(jrd_nod** node1, jrd_nod* node2, NOD_T node_type)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c o m p o s e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Build and AND out of two conjuncts.
|
||
*
|
||
**************************************/
|
||
|
||
DEV_BLKCHK(*node1, type_nod);
|
||
DEV_BLKCHK(node2, type_nod);
|
||
|
||
if (!node2) {
|
||
return *node1;
|
||
}
|
||
|
||
if (!*node1) {
|
||
return (*node1 = node2);
|
||
}
|
||
|
||
return *node1 = make_binary_node(node_type, *node1, node2, false);
|
||
}
|
||
|
||
|
||
static bool computable(CompilerScratch* csb,
|
||
jrd_nod* node,
|
||
SSHORT stream,
|
||
bool idx_use,
|
||
bool allowOnlyCurrentStream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c o m p u t a b l e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* See if node is presently computable.
|
||
* Note that a field is not computable
|
||
* with respect to its own stream.
|
||
*
|
||
* There are two different uses of computable().
|
||
* (a) idx_use == false: when an unused conjunct is to be picked for making
|
||
* into a boolean and in making a db_key.
|
||
* In this case, a node is said to be computable, if all the streams
|
||
* involved in that node are csb_active. The csb_active flag
|
||
* defines all the streams available in the current scope of the
|
||
* query.
|
||
* (b) idx_use == true: to determine if we can use an
|
||
* index on the conjunct we have already chosen.
|
||
* In order to use an index on a conjunct, it is required that the
|
||
* all the streams involved in the conjunct are currently active
|
||
* or have been already processed before and made into rivers.
|
||
* Because, here we want to differentiate between streams we have
|
||
* not yet worked on and those that we have worked on or are currently
|
||
* working on.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(csb, type_csb);
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
/* Recurse thru interesting sub-nodes */
|
||
|
||
jrd_nod** ptr = node->nod_arg;
|
||
|
||
if (node->nod_type == nod_procedure) {
|
||
return false;
|
||
}
|
||
|
||
if (node->nod_type == nod_union) {
|
||
jrd_nod* clauses = node->nod_arg[e_uni_clauses];
|
||
ptr = clauses->nod_arg;
|
||
for (const jrd_nod* const* const end = ptr + clauses->nod_count;
|
||
ptr < end; ptr += 2)
|
||
{
|
||
if (!computable(csb, *ptr, stream, idx_use, allowOnlyCurrentStream)) {
|
||
return false;
|
||
}
|
||
}
|
||
}
|
||
else {
|
||
for (const jrd_nod* const* const end = ptr + node->nod_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
if (!computable(csb, *ptr, stream, idx_use, allowOnlyCurrentStream)) {
|
||
return false;
|
||
}
|
||
}
|
||
}
|
||
|
||
RecordSelExpr* rse;
|
||
jrd_nod* sub;
|
||
jrd_nod* value;
|
||
USHORT n;
|
||
|
||
switch (node->nod_type) {
|
||
case nod_field:
|
||
|
||
n = (USHORT)(IPTR) node->nod_arg[e_fld_stream];
|
||
|
||
if (allowOnlyCurrentStream) {
|
||
if (n != stream) {
|
||
return false;
|
||
}
|
||
}
|
||
else {
|
||
if (n == stream) {
|
||
return false;
|
||
}
|
||
}
|
||
// AB: cbs_made_river has been replaced by find_used_streams()
|
||
//if (idx_use &&
|
||
// !(csb->csb_rpt[n].csb_flags & (csb_made_river | csb_active)))
|
||
return csb->csb_rpt[n].csb_flags & csb_active;
|
||
|
||
case nod_rec_version:
|
||
case nod_dbkey:
|
||
|
||
n = (USHORT)(IPTR) node->nod_arg[0];
|
||
|
||
if (allowOnlyCurrentStream) {
|
||
if (n != stream) {
|
||
return false;
|
||
}
|
||
}
|
||
else {
|
||
if (n == stream) {
|
||
return false;
|
||
}
|
||
}
|
||
// AB: cbs_made_river has been replaced by find_used_streams()
|
||
//if (idx_use &&
|
||
// !(csb->csb_rpt[n].
|
||
// csb_flags & (csb_made_river | csb_active)))
|
||
return csb->csb_rpt[n].csb_flags & csb_active;
|
||
|
||
case nod_min:
|
||
case nod_max:
|
||
case nod_average:
|
||
case nod_total:
|
||
case nod_count:
|
||
case nod_from:
|
||
if ((sub = node->nod_arg[e_stat_default]) &&
|
||
!computable(csb, sub, stream, idx_use, allowOnlyCurrentStream))
|
||
{
|
||
return false;
|
||
}
|
||
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
|
||
value = node->nod_arg[e_stat_value];
|
||
break;
|
||
|
||
case nod_rse:
|
||
rse = (RecordSelExpr*) node;
|
||
value = NULL;
|
||
break;
|
||
|
||
case nod_aggregate:
|
||
rse = (RecordSelExpr*) node->nod_arg[e_agg_rse];
|
||
rse->rse_sorted = node->nod_arg[e_agg_group];
|
||
value = NULL;
|
||
break;
|
||
|
||
default:
|
||
return true;
|
||
}
|
||
|
||
/* Node is a record selection expression. */
|
||
|
||
bool result = true;
|
||
|
||
if ((sub = rse->rse_first) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) {
|
||
return false;
|
||
}
|
||
|
||
if ((sub = rse->rse_skip) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) {
|
||
return false;
|
||
}
|
||
|
||
/* Set sub-streams of rse active */
|
||
|
||
const jrd_nod* const* end;
|
||
|
||
for (ptr = rse->rse_relation, end = ptr + rse->rse_count; ptr < end; ptr++) {
|
||
if ((*ptr)->nod_type != nod_rse) {
|
||
n = (USHORT)(IPTR) (*ptr)->nod_arg[STREAM_INDEX((*ptr))];
|
||
csb->csb_rpt[n].csb_flags |= csb_active;
|
||
}
|
||
}
|
||
|
||
/* Check sub-stream */
|
||
|
||
if (((sub = rse->rse_boolean) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) ||
|
||
((sub = rse->rse_sorted) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) ||
|
||
((sub = rse->rse_projection) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)))
|
||
{
|
||
result = false;
|
||
}
|
||
|
||
for (ptr = rse->rse_relation, end = ptr + rse->rse_count;
|
||
((ptr < end) && (result)); ptr++)
|
||
{
|
||
if ((*ptr)->nod_type != nod_rse) {
|
||
if (!computable(csb, (*ptr), stream, idx_use, allowOnlyCurrentStream)) {
|
||
result = false;
|
||
}
|
||
}
|
||
}
|
||
|
||
/* Check value expression, if any */
|
||
|
||
if (result && value && !computable(csb, value, stream, idx_use, allowOnlyCurrentStream)) {
|
||
result = false;
|
||
}
|
||
|
||
/* Reset streams inactive */
|
||
|
||
for (ptr = rse->rse_relation, end = ptr + rse->rse_count; ptr < end;
|
||
ptr++)
|
||
{
|
||
if ((*ptr)->nod_type != nod_rse)
|
||
{
|
||
n = (USHORT)(IPTR) (*ptr)->nod_arg[STREAM_INDEX((*ptr))];
|
||
csb->csb_rpt[n].csb_flags &= ~csb_active;
|
||
}
|
||
}
|
||
|
||
return result;
|
||
}
|
||
|
||
|
||
static void compute_dependencies(const jrd_nod* node, ULONG* dependencies)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c o m p u t e _ d e p e n d e n c i e s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Compute stream dependencies for evaluation of an expression.
|
||
*
|
||
**************************************/
|
||
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
/* Recurse thru interesting sub-nodes */
|
||
|
||
const jrd_nod* const* ptr = node->nod_arg;
|
||
|
||
if (node->nod_type == nod_procedure) {
|
||
return;
|
||
}
|
||
|
||
{ // scope for MSVC6
|
||
for (const jrd_nod* const* const end = ptr + node->nod_count; ptr < end; ptr++)
|
||
{
|
||
compute_dependencies(*ptr, dependencies);
|
||
}
|
||
} // scope
|
||
|
||
const RecordSelExpr* rse;
|
||
const jrd_nod* sub;
|
||
const jrd_nod* value;
|
||
|
||
switch (node->nod_type) {
|
||
case nod_field:
|
||
{
|
||
const SLONG n = (SLONG)(IPTR) node->nod_arg[e_fld_stream];
|
||
SET_DEP_BIT(dependencies, n);
|
||
return;
|
||
}
|
||
|
||
case nod_rec_version:
|
||
case nod_dbkey:
|
||
{
|
||
const SLONG n = (SLONG)(IPTR) node->nod_arg[0];
|
||
SET_DEP_BIT(dependencies, n);
|
||
return;
|
||
}
|
||
|
||
case nod_min:
|
||
case nod_max:
|
||
case nod_average:
|
||
case nod_total:
|
||
case nod_count:
|
||
case nod_from:
|
||
if ( (sub = node->nod_arg[e_stat_default]) ) {
|
||
compute_dependencies(sub, dependencies);
|
||
}
|
||
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
|
||
value = node->nod_arg[e_stat_value];
|
||
break;
|
||
|
||
case nod_rse:
|
||
rse = (RecordSelExpr*) node;
|
||
value = NULL;
|
||
break;
|
||
|
||
default:
|
||
return;
|
||
}
|
||
|
||
/* Node is a record selection expression. Groan. Ugh. Yuck. */
|
||
|
||
if ( (sub = rse->rse_first) ) {
|
||
compute_dependencies(sub, dependencies);
|
||
}
|
||
|
||
/* Check sub-expressions */
|
||
|
||
if ( (sub = rse->rse_boolean) ) {
|
||
compute_dependencies(sub, dependencies);
|
||
}
|
||
|
||
if ( (sub = rse->rse_sorted) ) {
|
||
compute_dependencies(sub, dependencies);
|
||
}
|
||
|
||
if ( (sub = rse->rse_projection) ) {
|
||
compute_dependencies(sub, dependencies);
|
||
}
|
||
|
||
/* Check value expression, if any */
|
||
|
||
if (value) {
|
||
compute_dependencies(value, dependencies);
|
||
}
|
||
|
||
/* Reset streams inactive */
|
||
|
||
ptr = rse->rse_relation;
|
||
for (const jrd_nod* const* const end = ptr + rse->rse_count; ptr < end; ptr++)
|
||
{
|
||
if ((*ptr)->nod_type != nod_rse) {
|
||
const SLONG n = (SLONG)(IPTR) (*ptr)->nod_arg[STREAM_INDEX((*ptr))];
|
||
CLEAR_DEP_BIT(dependencies, n);
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
static void compute_dbkey_streams(const CompilerScratch* csb, const jrd_nod* node, UCHAR* streams)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c o m p u t e _ d b k e y _ s t r e a m s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Identify all of the streams for which a
|
||
* dbkey may need to be carried through a sort.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(csb, type_csb);
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
if (node->nod_type == nod_relation) {
|
||
fb_assert(streams[0] < MAX_STREAMS && streams[0] < MAX_UCHAR);
|
||
streams[++streams[0]] = (UCHAR)(IPTR) node->nod_arg[e_rel_stream];
|
||
}
|
||
else if (node->nod_type == nod_union) {
|
||
const jrd_nod* clauses = node->nod_arg[e_uni_clauses];
|
||
if (clauses->nod_type != nod_procedure) {
|
||
const jrd_nod* const* ptr = clauses->nod_arg;
|
||
for (const jrd_nod* const* const end = ptr + clauses->nod_count;
|
||
ptr < end; ptr += 2)
|
||
{
|
||
compute_dbkey_streams(csb, *ptr, streams);
|
||
}
|
||
}
|
||
}
|
||
else if (node->nod_type == nod_rse) {
|
||
const RecordSelExpr* rse = (RecordSelExpr*) node;
|
||
const jrd_nod* const* ptr = rse->rse_relation;
|
||
for (const jrd_nod* const* const end = ptr + rse->rse_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
compute_dbkey_streams(csb, *ptr, streams);
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
static void compute_rse_streams(const CompilerScratch* csb, const RecordSelExpr* rse, UCHAR* streams)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c o m p u t e _ r s e _ s t r e a m s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Identify the streams that make up an RecordSelExpr.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(csb, type_csb);
|
||
DEV_BLKCHK(rse, type_nod);
|
||
|
||
const jrd_nod* const* ptr = rse->rse_relation;
|
||
for (const jrd_nod* const* const end = ptr + rse->rse_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
const jrd_nod* node = *ptr;
|
||
if (node->nod_type != nod_rse) {
|
||
fb_assert(streams[0] < MAX_STREAMS && streams[0] < MAX_UCHAR);
|
||
streams[++streams[0]] = (UCHAR)(IPTR) node->nod_arg[STREAM_INDEX(node)];
|
||
}
|
||
else {
|
||
compute_rse_streams(csb, (const RecordSelExpr*) node, streams);
|
||
}
|
||
}
|
||
}
|
||
|
||
static bool check_for_nod_from(const jrd_nod* node)
|
||
{
|
||
/**************************************
|
||
*
|
||
* c h e c k _ f o r _ n o d _ f r o m
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Check for nod_from under >=0 nod_cast nodes.
|
||
*
|
||
**************************************/
|
||
if (node->nod_type == nod_from)
|
||
return true;
|
||
if (node->nod_type == nod_cast)
|
||
return check_for_nod_from(node->nod_arg[e_cast_source]);
|
||
return false;
|
||
}
|
||
|
||
static SLONG decompose(thread_db* tdbb,
|
||
jrd_nod* boolean_node,
|
||
NodeStack& stack,
|
||
CompilerScratch* csb)
|
||
{
|
||
/**************************************
|
||
*
|
||
* d e c o m p o s e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Decompose a boolean into a stack of conjuctions.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(boolean_node, type_nod);
|
||
DEV_BLKCHK(csb, type_csb);
|
||
|
||
|
||
if (boolean_node->nod_type == nod_and) {
|
||
return decompose(tdbb, boolean_node->nod_arg[0], stack, csb) +
|
||
decompose(tdbb, boolean_node->nod_arg[1], stack, csb);
|
||
}
|
||
|
||
/* turn a between into (a greater than or equal) AND (a less than or equal) */
|
||
|
||
if (boolean_node->nod_type == nod_between) {
|
||
jrd_nod* arg = boolean_node->nod_arg[0];
|
||
if (check_for_nod_from(arg)) {
|
||
/* Without this ERR_punt(), server was crashing with sub queries
|
||
* under "between" predicate, Bug No. 73766 */
|
||
ERR_post(isc_optimizer_between_err, 0);
|
||
/* Msg 493: Unsupported field type specified in BETWEEN predicate */
|
||
}
|
||
jrd_nod* node = make_binary_node(nod_geq, arg, boolean_node->nod_arg[1], true);
|
||
stack.push(node);
|
||
arg = CMP_clone_node(tdbb, csb, arg);
|
||
node = make_binary_node(nod_leq, arg, boolean_node->nod_arg[2], true);
|
||
stack.push(node);
|
||
return 2;
|
||
}
|
||
|
||
/* turn a LIKE into a LIKE and a STARTING WITH, if it starts
|
||
with anything other than a pattern-matching character */
|
||
|
||
jrd_nod* arg;
|
||
if ((boolean_node->nod_type == nod_like) &&
|
||
(arg = optimize_like(tdbb, boolean_node)))
|
||
{
|
||
stack.push(make_binary_node(nod_starts,
|
||
boolean_node->nod_arg[0], arg, false));
|
||
stack.push(boolean_node);
|
||
return 2;
|
||
}
|
||
|
||
stack.push(boolean_node);
|
||
|
||
return 1;
|
||
}
|
||
|
||
|
||
static USHORT distribute_equalities(NodeStack& org_stack, CompilerScratch* csb, USHORT base_count)
|
||
{
|
||
/**************************************
|
||
*
|
||
* d i s t r i b u t e _ e q u a l i t i e s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Given a stack of conjunctions, generate some simple
|
||
* inferences. In general, find classes of equalities,
|
||
* then find operations based on members of those classes.
|
||
* If we find any, generate additional conjunctions. In
|
||
* short:
|
||
*
|
||
* If (a == b) and (a $ c) --> (b $ c) for any
|
||
* operation '$'.
|
||
*
|
||
**************************************/
|
||
Firebird::ObjectsArray<NodeStack> classes;
|
||
Firebird::ObjectsArray<NodeStack>::iterator eq_class;
|
||
|
||
DEV_BLKCHK(csb, type_csb);
|
||
|
||
/* Zip thru stack of booleans looking for field equalities */
|
||
|
||
for (NodeStack::iterator stack1(org_stack); stack1.hasData(); ++stack1) {
|
||
jrd_nod* boolean = stack1.object();
|
||
if (boolean->nod_type != nod_eql)
|
||
continue;
|
||
jrd_nod* node1 = boolean->nod_arg[0];
|
||
if (node1->nod_type != nod_field)
|
||
continue;
|
||
jrd_nod* node2 = boolean->nod_arg[1];
|
||
if (node2->nod_type != nod_field)
|
||
continue;
|
||
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class)
|
||
{
|
||
if (search_stack(node1, *eq_class)) {
|
||
augment_stack(node2, *eq_class);
|
||
break;
|
||
}
|
||
else if (search_stack(node2, *eq_class)) {
|
||
eq_class->push(node1);
|
||
break;
|
||
}
|
||
}
|
||
if (eq_class == classes.end()) {
|
||
NodeStack& s = classes.add();
|
||
s.push(node1);
|
||
s.push(node2);
|
||
eq_class = classes.back();
|
||
}
|
||
}
|
||
|
||
if (classes.getCount() == 0)
|
||
return 0;
|
||
|
||
/* Make another pass looking for any equality relationships that may
|
||
have crept in between classes (this could result from the
|
||
sequence (A = B, C = D, B = C) */
|
||
|
||
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class) {
|
||
for (NodeStack::const_iterator stack2(*eq_class); stack2.hasData(); ++stack2) {
|
||
for (Firebird::ObjectsArray<NodeStack>::iterator eq_class2(eq_class);
|
||
++eq_class2 != classes.end();)
|
||
{
|
||
if (search_stack(stack2.object(), *eq_class2)) {
|
||
DEBUG;
|
||
while (eq_class2->hasData()) {
|
||
augment_stack(eq_class2->pop(), *eq_class);
|
||
}
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
USHORT count = 0;
|
||
|
||
/* Start by making a pass distributing field equalities */
|
||
|
||
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class) {
|
||
if (eq_class->hasMore(3)) {
|
||
for (NodeStack::iterator outer(*eq_class); outer.hasData(); ++outer) {
|
||
for (NodeStack::iterator inner(outer); (++inner).hasData(); ) {
|
||
jrd_nod* boolean =
|
||
make_binary_node(nod_eql, outer.object(),
|
||
inner.object(), true);
|
||
if ((base_count + count < MAX_CONJUNCTS) &&
|
||
augment_stack(boolean, org_stack))
|
||
{
|
||
DEBUG;
|
||
count++;
|
||
}
|
||
else
|
||
delete boolean;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
/* Now make a second pass looking for non-field equalities */
|
||
|
||
for (NodeStack::iterator stack3(org_stack); stack3.hasData(); ++stack3) {
|
||
jrd_nod* boolean = stack3.object();
|
||
if (boolean->nod_type != nod_eql &&
|
||
boolean->nod_type != nod_gtr &&
|
||
boolean->nod_type != nod_geq &&
|
||
boolean->nod_type != nod_leq &&
|
||
boolean->nod_type != nod_lss &&
|
||
boolean->nod_type != nod_matches &&
|
||
boolean->nod_type != nod_contains &&
|
||
boolean->nod_type != nod_like)
|
||
{
|
||
continue;
|
||
}
|
||
const jrd_nod* node1 = boolean->nod_arg[0];
|
||
const jrd_nod* node2 = boolean->nod_arg[1];
|
||
bool reverse = false;
|
||
if (node1->nod_type != nod_field) {
|
||
const jrd_nod* swap_node = node1;
|
||
node1 = node2;
|
||
node2 = swap_node;
|
||
reverse = true;
|
||
}
|
||
if (node1->nod_type != nod_field) {
|
||
continue;
|
||
}
|
||
if (node2->nod_type != nod_literal &&
|
||
node2->nod_type != nod_variable &&
|
||
node2->nod_type != nod_argument)
|
||
{
|
||
continue;
|
||
}
|
||
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class) {
|
||
if (search_stack(node1, *eq_class)) {
|
||
for (NodeStack::iterator temp(*eq_class); temp.hasData(); ++temp) {
|
||
if (!node_equality(node1, temp.object())) {
|
||
jrd_nod* arg1;
|
||
jrd_nod* arg2;
|
||
if (reverse) {
|
||
arg1 = boolean->nod_arg[0];
|
||
arg2 = temp.object();
|
||
}
|
||
else {
|
||
arg1 = temp.object();
|
||
arg2 = boolean->nod_arg[1];
|
||
}
|
||
|
||
/* From the conjuncts X(A,B) and A=C, infer the
|
||
* conjunct X(C,B)
|
||
*/
|
||
jrd_nod* new_node =
|
||
make_inference_node(csb, boolean, arg1, arg2);
|
||
if ((base_count + count < MAX_CONJUNCTS) &&
|
||
augment_stack(new_node, org_stack))
|
||
{
|
||
count++;
|
||
}
|
||
}
|
||
}
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
|
||
return count;
|
||
}
|
||
|
||
|
||
static bool dump_index(const jrd_nod* node,
|
||
SCHAR** buffer_ptr, SSHORT* buffer_length)
|
||
{
|
||
/**************************************
|
||
*
|
||
* d u m p _ i n d e x
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Dump an index inversion tree to
|
||
* an info buffer.
|
||
*
|
||
**************************************/
|
||
thread_db* tdbb = JRD_get_thread_data();
|
||
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
SCHAR* buffer = *buffer_ptr;
|
||
|
||
if (--(*buffer_length) < 0) {
|
||
return false;
|
||
}
|
||
|
||
// spit out the node type
|
||
switch (node->nod_type)
|
||
{
|
||
case nod_bit_and:
|
||
*buffer++ = isc_info_rsb_and;
|
||
break;
|
||
case nod_bit_or:
|
||
case nod_bit_in:
|
||
*buffer++ = isc_info_rsb_or;
|
||
break;
|
||
case nod_bit_dbkey:
|
||
*buffer++ = isc_info_rsb_dbkey;
|
||
break;
|
||
case nod_index:
|
||
*buffer++ = isc_info_rsb_index;
|
||
break;
|
||
}
|
||
|
||
SqlIdentifier index_name;
|
||
// dump sub-nodes or the actual index info
|
||
if ((node->nod_type == nod_bit_and) ||
|
||
(node->nod_type == nod_bit_or) ||
|
||
(node->nod_type == nod_bit_in))
|
||
{
|
||
if (!dump_index(node->nod_arg[0], &buffer, buffer_length)) {
|
||
return false;
|
||
}
|
||
if (!dump_index(node->nod_arg[1], &buffer, buffer_length)) {
|
||
return false;
|
||
}
|
||
}
|
||
else if (node->nod_type == nod_index) {
|
||
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
|
||
MET_lookup_index(tdbb, index_name, retrieval->irb_relation->rel_name,
|
||
(USHORT) (retrieval->irb_index + 1));
|
||
SSHORT length = strlen(index_name);
|
||
|
||
*buffer_length -= 1 + length;
|
||
if (*buffer_length < 0) {
|
||
return false;
|
||
}
|
||
*buffer++ = (SCHAR) length;
|
||
const TEXT* i = index_name;
|
||
while (length--) {
|
||
*buffer++ = *i++;
|
||
}
|
||
}
|
||
|
||
*buffer_ptr = buffer;
|
||
|
||
return true;
|
||
}
|
||
|
||
|
||
static bool dump_rsb(const jrd_req* request,
|
||
const RecordSource* rsb, SCHAR** buffer_ptr, SSHORT* buffer_length)
|
||
{
|
||
/**************************************
|
||
*
|
||
* d u m p _ r s b
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Returns a formatted access path for
|
||
* a particular rsb.
|
||
*
|
||
**************************************/
|
||
SSHORT return_length;
|
||
jrd_prc* procedure;
|
||
|
||
DEV_BLKCHK(rsb, type_rsb);
|
||
|
||
SCHAR* buffer = *buffer_ptr;
|
||
|
||
// leave room for the rsb begin, type, and end.
|
||
*buffer_length -= 4;
|
||
if (*buffer_length < 0) {
|
||
return false;
|
||
}
|
||
*buffer++ = isc_info_rsb_begin;
|
||
|
||
// dump out the alias or relation name if it exists.
|
||
const jrd_rel* relation = rsb->rsb_relation;
|
||
USHORT length = 0;
|
||
const SCHAR* name = NULL;
|
||
|
||
const str* alias = rsb->rsb_alias;
|
||
if (alias) {
|
||
length = alias->str_length;
|
||
name = (SCHAR *) alias->str_data;
|
||
}
|
||
else if (relation) {
|
||
length = strlen(relation->rel_name);
|
||
name = relation->rel_name;
|
||
}
|
||
|
||
if (name) {
|
||
*buffer_length -= 2 + length;
|
||
if (*buffer_length < 0) {
|
||
return false;
|
||
}
|
||
*buffer++ = isc_info_rsb_relation;
|
||
*buffer++ = (SCHAR) length;
|
||
while (length--) {
|
||
*buffer++ = *name++;
|
||
}
|
||
}
|
||
|
||
/* print out the type followed immediately by any
|
||
type-specific data */
|
||
|
||
*buffer++ = isc_info_rsb_type;
|
||
switch (rsb->rsb_type) {
|
||
case rsb_indexed:
|
||
*buffer++ = isc_info_rsb_indexed;
|
||
if (!dump_index((jrd_nod*) rsb->rsb_arg[0], &buffer, buffer_length)) {
|
||
return false;
|
||
}
|
||
break;
|
||
|
||
case rsb_navigate:
|
||
*buffer++ = isc_info_rsb_navigate;
|
||
if (!dump_index((jrd_nod*) rsb->rsb_arg[RSB_NAV_index],
|
||
&buffer, buffer_length))
|
||
{
|
||
return false;
|
||
}
|
||
// dimitr: here we report indicies used to limit
|
||
// the navigational-based retrieval
|
||
if (rsb->rsb_arg[RSB_NAV_inversion]) {
|
||
*buffer_length -= 2;
|
||
if (*buffer_length < 0) {
|
||
return false;
|
||
}
|
||
*buffer++ = isc_info_rsb_type;
|
||
*buffer++ = isc_info_rsb_indexed;
|
||
if (!dump_index((jrd_nod*) rsb->rsb_arg[RSB_NAV_inversion],
|
||
&buffer, buffer_length))
|
||
{
|
||
return false;
|
||
}
|
||
}
|
||
break;
|
||
|
||
case rsb_sequential:
|
||
*buffer++ = isc_info_rsb_sequential;
|
||
break;
|
||
|
||
case rsb_cross:
|
||
*buffer++ = isc_info_rsb_cross;
|
||
break;
|
||
|
||
case rsb_sort:
|
||
*buffer++ = isc_info_rsb_sort;
|
||
break;
|
||
|
||
case rsb_procedure:
|
||
*buffer++ = isc_info_rsb_procedure;
|
||
|
||
// don't try to print out plans of procedures called by procedures, since
|
||
// we could get into a recursive situation; if the customer wants to know
|
||
// the plan produced by the sub-procedure, they can invoke it directly.
|
||
if (request->req_procedure) {
|
||
break;
|
||
}
|
||
|
||
procedure = rsb->rsb_procedure;
|
||
if (!procedure || !procedure->prc_request) {
|
||
return false;
|
||
}
|
||
|
||
// CVC: This is becoming trickier. There are procedures that don't have a plan
|
||
// because they don't access tables. In this case, the engine gives up and swallows
|
||
// the whole plan. Not acceptable.
|
||
|
||
if (procedure->prc_request->req_fors.getCount() == 0) {
|
||
const Firebird::string& n = procedure->prc_name;
|
||
*buffer_length -= 6 + n.length();
|
||
if (*buffer_length < 0) {
|
||
return false;
|
||
}
|
||
*buffer++ = isc_info_rsb_begin;
|
||
*buffer++ = isc_info_rsb_relation;
|
||
*buffer++ = (SCHAR) n.length();
|
||
memcpy(buffer, n.c_str(), n.length());
|
||
buffer += n.length();
|
||
*buffer++ = isc_info_rsb_type;
|
||
*buffer++ = isc_info_rsb_sequential;
|
||
*buffer++ = isc_info_rsb_end;
|
||
break;
|
||
}
|
||
|
||
if (!OPT_access_path(procedure->prc_request, buffer, *buffer_length,
|
||
reinterpret_cast<USHORT*>(&return_length)))
|
||
{
|
||
return false;
|
||
}
|
||
*buffer_length -= return_length;
|
||
if (*buffer_length < 0) {
|
||
return false;
|
||
}
|
||
buffer += return_length;
|
||
break;
|
||
|
||
case rsb_first:
|
||
*buffer++ = isc_info_rsb_first;
|
||
break;
|
||
|
||
case rsb_skip:
|
||
*buffer++ = isc_info_rsb_skip;
|
||
break;
|
||
|
||
case rsb_boolean:
|
||
*buffer++ = isc_info_rsb_boolean;
|
||
break;
|
||
|
||
case rsb_union:
|
||
*buffer++ = isc_info_rsb_union;
|
||
break;
|
||
|
||
case rsb_aggregate:
|
||
*buffer++ = isc_info_rsb_aggregate;
|
||
break;
|
||
|
||
case rsb_merge:
|
||
*buffer++ = isc_info_rsb_merge;
|
||
break;
|
||
|
||
case rsb_ext_sequential:
|
||
*buffer++ = isc_info_rsb_ext_sequential;
|
||
break;
|
||
|
||
case rsb_ext_indexed:
|
||
*buffer++ = isc_info_rsb_ext_indexed;
|
||
break;
|
||
|
||
case rsb_ext_dbkey:
|
||
*buffer++ = isc_info_rsb_ext_dbkey;
|
||
break;
|
||
|
||
case rsb_left_cross:
|
||
*buffer++ = isc_info_rsb_left_cross;
|
||
break;
|
||
|
||
default:
|
||
*buffer++ = isc_info_rsb_unknown;
|
||
break;
|
||
}
|
||
|
||
// dump out any sub-rsbs; for join-type rses like cross
|
||
// and merge, dump out the count of streams first, then
|
||
// loop through the substreams and dump them out.
|
||
|
||
if (--(*buffer_length) < 0) {
|
||
return false;
|
||
}
|
||
|
||
const RecordSource* const* ptr;
|
||
const RecordSource* const* end;
|
||
|
||
switch (rsb->rsb_type) {
|
||
case rsb_cross:
|
||
*buffer++ = (UCHAR) rsb->rsb_count;
|
||
ptr = rsb->rsb_arg;
|
||
for (end = ptr + rsb->rsb_count; ptr < end; ptr++) {
|
||
if (!dump_rsb(request, *ptr, &buffer, buffer_length)) {
|
||
return false;
|
||
}
|
||
}
|
||
break;
|
||
|
||
case rsb_union:
|
||
*buffer++ = rsb->rsb_count / 2;
|
||
ptr = rsb->rsb_arg;
|
||
for (end = ptr + rsb->rsb_count; ptr < end; ptr++) {
|
||
if (!dump_rsb(request, *ptr, &buffer, buffer_length)) {
|
||
return false;
|
||
}
|
||
ptr++;
|
||
}
|
||
break;
|
||
|
||
case rsb_merge:
|
||
*buffer++ = (SCHAR) rsb->rsb_count;
|
||
ptr = rsb->rsb_arg;
|
||
for (end = ptr + rsb->rsb_count * 2; ptr < end;
|
||
ptr += 2)
|
||
{
|
||
if (!dump_rsb(request, *ptr, &buffer, buffer_length)) {
|
||
return false;
|
||
}
|
||
}
|
||
break;
|
||
|
||
case rsb_left_cross:
|
||
*buffer++ = 2;
|
||
if (!dump_rsb(request, rsb->rsb_arg[RSB_LEFT_outer], &buffer,
|
||
buffer_length))
|
||
{
|
||
return false;
|
||
}
|
||
if (!dump_rsb(request, rsb->rsb_arg[RSB_LEFT_inner], &buffer,
|
||
buffer_length))
|
||
{
|
||
return false;
|
||
}
|
||
break;
|
||
|
||
default: // Shut up compiler warnings.
|
||
break;
|
||
}
|
||
|
||
// dump out the next rsb.
|
||
if (rsb->rsb_next) {
|
||
if (!dump_rsb(request, rsb->rsb_next, &buffer, buffer_length)) {
|
||
return false;
|
||
}
|
||
}
|
||
|
||
*buffer++ = isc_info_rsb_end;
|
||
|
||
*buffer_ptr = buffer;
|
||
|
||
return true;
|
||
}
|
||
|
||
|
||
static bool estimate_cost(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
USHORT stream,
|
||
double *cost, double *resulting_cardinality)
|
||
{
|
||
/**************************************
|
||
*
|
||
* e s t i m a t e _ c o s t
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Make an estimate of the cost to fetch a stream. The cost
|
||
* is a function of estimated cardinality of the relation, index
|
||
* selectivity, and total boolean selectivity. Since none of
|
||
* this information is available, the estimates are likely to
|
||
* be a bit weak. Return true if the relation is index
|
||
* retrievable.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
SET_TDBB(tdbb);
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[stream];
|
||
csb_tail->csb_flags |= csb_active;
|
||
double cardinality = MAX(csb_tail->csb_cardinality, 10);
|
||
double index_selectivity = 1.0;
|
||
USHORT indexes = 0, equalities = 0, inequalities = 0, index_hits = 0;
|
||
bool unique = false;
|
||
ULONG inactivities[OPT_STREAM_BITS];
|
||
get_inactivities(csb, inactivities);
|
||
|
||
// Compute index selectivity. This involves finding the indices
|
||
// to be utilized and making a crude guess of selectivities.
|
||
|
||
if (opt->opt_conjuncts.getCount()) {
|
||
index_desc* idx = csb_tail->csb_idx->items;
|
||
for (USHORT i = 0; i < csb_tail->csb_indices; i++) {
|
||
SSHORT n = 0;
|
||
clear_bounds(opt, idx);
|
||
const OptimizerBlk::opt_conjunct* const opt_end =
|
||
opt->opt_conjuncts.end();
|
||
for (const OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
|
||
tail < opt_end; tail++)
|
||
{
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
|
||
!(TEST_DEP_ARRAYS(tail->opt_dependencies, inactivities)))
|
||
{
|
||
n += match_index(tdbb, opt, stream, node, idx);
|
||
}
|
||
}
|
||
OptimizerBlk::opt_segment* segment = opt->opt_segments;
|
||
if (segment->opt_lower || segment->opt_upper) {
|
||
indexes++;
|
||
USHORT count;
|
||
for (count = 0; count < idx->idx_count; count++, segment++) {
|
||
if (!segment->opt_lower || segment->opt_lower != segment->opt_upper) {
|
||
break;
|
||
}
|
||
}
|
||
double s = idx->idx_selectivity;
|
||
if (s <= 0 || s >= 1) {
|
||
s = ESTIMATED_SELECTIVITY;
|
||
}
|
||
if (count == idx->idx_count) {
|
||
if (idx->idx_flags & idx_unique) {
|
||
unique = true;
|
||
s = 1 / cardinality;
|
||
}
|
||
}
|
||
else {
|
||
s *= INVERSE_ESTIMATE;
|
||
}
|
||
index_selectivity *= s;
|
||
index_hits += MAX(count, n);
|
||
}
|
||
++idx;
|
||
}
|
||
}
|
||
|
||
// We now known the relation cardinality, the combined index selectivity,
|
||
// and the number of index lookups required. From this we can compute the
|
||
// cost of executing the record selection expression (cost of index lookups
|
||
// plus the number of records fetched).
|
||
|
||
if (indexes) {
|
||
*cost = cardinality * index_selectivity + indexes * INDEX_COST;
|
||
}
|
||
else {
|
||
*cost = cardinality;
|
||
}
|
||
|
||
/* Next, we need to estimate the number of records coming out of the
|
||
record stream. This is based on conjunctions without regard to whether
|
||
or not they were the result of index operations. */
|
||
|
||
const OptimizerBlk::opt_conjunct* const opt_end =
|
||
opt->opt_conjuncts.end();
|
||
|
||
for (OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
|
||
tail < opt_end; tail++)
|
||
{
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
|
||
!(TEST_DEP_ARRAYS(tail->opt_dependencies, inactivities)))
|
||
{
|
||
if (node->nod_type == nod_eql) {
|
||
++equalities;
|
||
}
|
||
else {
|
||
++inequalities;
|
||
}
|
||
tail->opt_conjunct_flags |= opt_conjunct_used;
|
||
}
|
||
}
|
||
|
||
double selectivity;
|
||
const SSHORT n = inequalities + 3 * (equalities - index_hits);
|
||
if (n > 0) {
|
||
selectivity = 0.3 / n;
|
||
if (selectivity > index_selectivity) {
|
||
selectivity = index_selectivity;
|
||
}
|
||
}
|
||
else {
|
||
selectivity = index_selectivity;
|
||
}
|
||
|
||
cardinality *= selectivity;
|
||
|
||
if (unique) {
|
||
*resulting_cardinality = cardinality;
|
||
}
|
||
else {
|
||
*resulting_cardinality = MAX(cardinality, 1.0);
|
||
}
|
||
|
||
csb_tail->csb_flags |= csb_active;
|
||
|
||
// AB: Nice that we return a boolean, but do we ever need it?
|
||
return (indexes != 0);
|
||
}
|
||
|
||
|
||
static bool expression_contains(const jrd_nod* node, NOD_T node_type)
|
||
{
|
||
/**************************************
|
||
*
|
||
* e x p r e s s i o n _ c o n t a i n s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Search if somewhere in the expression the give
|
||
* node_type is buried. Return true if a unknown
|
||
* node is passed.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
if (!node) {
|
||
return false;
|
||
}
|
||
|
||
if (node->nod_type == node_type) {
|
||
return true;
|
||
}
|
||
else {
|
||
|
||
RecordSelExpr* rse = NULL;
|
||
|
||
switch (node->nod_type) {
|
||
|
||
case nod_cast:
|
||
return expression_contains(node->nod_arg[e_cast_source], node_type);
|
||
|
||
case nod_extract:
|
||
return expression_contains(node->nod_arg[e_extract_value], node_type);
|
||
|
||
case nod_function:
|
||
return expression_contains(node->nod_arg[e_fun_args], node_type);
|
||
|
||
case nod_procedure:
|
||
return expression_contains(node->nod_arg[e_prc_inputs], node_type);
|
||
|
||
case nod_any:
|
||
case nod_unique:
|
||
case nod_ansi_any:
|
||
case nod_ansi_all:
|
||
case nod_exists:
|
||
return expression_contains(node->nod_arg[e_any_rse], node_type);
|
||
|
||
case nod_field:
|
||
case nod_rec_version:
|
||
case nod_dbkey:
|
||
case nod_argument:
|
||
case nod_current_date:
|
||
case nod_current_role:
|
||
case nod_current_time:
|
||
case nod_current_timestamp:
|
||
case nod_gen_id:
|
||
case nod_gen_id2:
|
||
case nod_internal_info:
|
||
case nod_literal:
|
||
case nod_null:
|
||
case nod_user_name:
|
||
case nod_variable:
|
||
return false;
|
||
|
||
case nod_rse:
|
||
rse = (RecordSelExpr*) node;
|
||
break;
|
||
|
||
case nod_average:
|
||
case nod_count:
|
||
case nod_count2:
|
||
case nod_from:
|
||
case nod_max:
|
||
case nod_min:
|
||
case nod_total:
|
||
{
|
||
const jrd_nod* nodeDefault = node->nod_arg[e_stat_rse];
|
||
if (nodeDefault && expression_contains(nodeDefault, node_type)) {
|
||
return true;
|
||
}
|
||
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
|
||
const jrd_nod* value = node->nod_arg[e_stat_value];
|
||
if (value && expression_contains(value, node_type)) {
|
||
return true;
|
||
}
|
||
}
|
||
break;
|
||
|
||
case nod_or:
|
||
case nod_and:
|
||
|
||
case nod_add:
|
||
case nod_add2:
|
||
case nod_agg_average:
|
||
case nod_agg_average2:
|
||
case nod_agg_average_distinct:
|
||
case nod_agg_average_distinct2:
|
||
case nod_agg_max:
|
||
case nod_agg_min:
|
||
case nod_agg_total:
|
||
case nod_agg_total2:
|
||
case nod_agg_total_distinct:
|
||
case nod_agg_total_distinct2:
|
||
case nod_concatenate:
|
||
case nod_divide:
|
||
case nod_divide2:
|
||
case nod_multiply:
|
||
case nod_multiply2:
|
||
case nod_negate:
|
||
case nod_subtract:
|
||
case nod_subtract2:
|
||
|
||
case nod_upcase:
|
||
case nod_substr:
|
||
|
||
case nod_like:
|
||
case nod_between:
|
||
case nod_sleuth:
|
||
case nod_missing:
|
||
case nod_value_if:
|
||
case nod_matches:
|
||
case nod_contains:
|
||
case nod_starts:
|
||
case nod_equiv:
|
||
case nod_eql:
|
||
case nod_neq:
|
||
case nod_geq:
|
||
case nod_gtr:
|
||
case nod_lss:
|
||
case nod_leq:
|
||
{
|
||
const jrd_nod* const* ptr = node->nod_arg;
|
||
// Check all sub-nodes of this node.
|
||
for (const jrd_nod* const* const end = ptr + node->nod_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
if (expression_contains(*ptr, node_type)) {
|
||
return true;
|
||
}
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
|
||
default :
|
||
return true;
|
||
}
|
||
|
||
|
||
if (rse) {
|
||
|
||
jrd_nod* sub;
|
||
if ((sub = rse->rse_first) && expression_contains(sub, node_type)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_skip) && expression_contains(sub, node_type)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_boolean) && expression_contains(sub, node_type)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_sorted) && expression_contains(sub, node_type)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_projection) && expression_contains(sub, node_type)) {
|
||
return true;
|
||
}
|
||
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
}
|
||
|
||
|
||
static bool expression_contains_stream(const jrd_nod* node, UCHAR stream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* e x p r e s s i o n _ c o n t a i n s _ s t r e a m
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Search if somewhere in the expression the given stream
|
||
* is used. If a unknown node is found it will return true.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
if (!node) {
|
||
return false;
|
||
}
|
||
|
||
RecordSelExpr* rse = NULL;
|
||
|
||
switch (node->nod_type) {
|
||
|
||
case nod_field:
|
||
return ((USHORT)(IPTR) node->nod_arg[e_fld_stream] == stream);
|
||
|
||
case nod_rec_version:
|
||
case nod_dbkey:
|
||
return ((USHORT)(IPTR) node->nod_arg[0] == stream);
|
||
|
||
case nod_cast:
|
||
return expression_contains_stream(node->nod_arg[e_cast_source], stream);
|
||
|
||
case nod_extract:
|
||
return expression_contains_stream(node->nod_arg[e_extract_value], stream);
|
||
|
||
case nod_function:
|
||
return expression_contains_stream(node->nod_arg[e_fun_args], stream);
|
||
|
||
case nod_procedure:
|
||
return expression_contains_stream(node->nod_arg[e_prc_inputs], stream);
|
||
|
||
case nod_any:
|
||
case nod_unique:
|
||
case nod_ansi_any:
|
||
case nod_ansi_all:
|
||
case nod_exists:
|
||
return expression_contains_stream(node->nod_arg[e_any_rse], stream);
|
||
|
||
case nod_argument:
|
||
case nod_current_date:
|
||
case nod_current_role:
|
||
case nod_current_time:
|
||
case nod_current_timestamp:
|
||
case nod_gen_id:
|
||
case nod_gen_id2:
|
||
case nod_internal_info:
|
||
case nod_literal:
|
||
case nod_null:
|
||
case nod_user_name:
|
||
case nod_variable:
|
||
return false;
|
||
|
||
case nod_rse:
|
||
rse = (RecordSelExpr*) node;
|
||
break;
|
||
|
||
case nod_average:
|
||
case nod_count:
|
||
case nod_count2:
|
||
case nod_from:
|
||
case nod_max:
|
||
case nod_min:
|
||
case nod_total:
|
||
{
|
||
const jrd_nod* nodeDefault = node->nod_arg[e_stat_rse];
|
||
if (nodeDefault && expression_contains_stream(nodeDefault, stream)) {
|
||
return true;
|
||
}
|
||
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
|
||
const jrd_nod* value = node->nod_arg[e_stat_value];
|
||
if (value && expression_contains_stream(value, stream)) {
|
||
return true;
|
||
}
|
||
}
|
||
break;
|
||
|
||
// go into the node arguments
|
||
case nod_add:
|
||
case nod_add2:
|
||
case nod_agg_average:
|
||
case nod_agg_average2:
|
||
case nod_agg_average_distinct:
|
||
case nod_agg_average_distinct2:
|
||
case nod_agg_max:
|
||
case nod_agg_min:
|
||
case nod_agg_total:
|
||
case nod_agg_total2:
|
||
case nod_agg_total_distinct:
|
||
case nod_agg_total_distinct2:
|
||
case nod_concatenate:
|
||
case nod_divide:
|
||
case nod_divide2:
|
||
case nod_multiply:
|
||
case nod_multiply2:
|
||
case nod_negate:
|
||
case nod_subtract:
|
||
case nod_subtract2:
|
||
|
||
case nod_upcase:
|
||
case nod_substr:
|
||
|
||
case nod_like:
|
||
case nod_between:
|
||
case nod_sleuth:
|
||
case nod_missing:
|
||
case nod_value_if:
|
||
case nod_matches:
|
||
case nod_contains:
|
||
case nod_starts:
|
||
case nod_equiv:
|
||
case nod_eql:
|
||
case nod_neq:
|
||
case nod_geq:
|
||
case nod_gtr:
|
||
case nod_lss:
|
||
case nod_leq:
|
||
{
|
||
const jrd_nod* const* ptr = node->nod_arg;
|
||
// Check all sub-nodes of this node.
|
||
for (const jrd_nod* const* const end = ptr + node->nod_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
if (expression_contains_stream(*ptr, stream)) {
|
||
return true;
|
||
}
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
default :
|
||
return true;
|
||
}
|
||
|
||
if (rse) {
|
||
|
||
jrd_nod* sub;
|
||
if ((sub = rse->rse_first) && expression_contains_stream(sub, stream)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_skip) && expression_contains_stream(sub, stream)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_boolean) && expression_contains_stream(sub, stream)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_sorted) && expression_contains_stream(sub, stream)) {
|
||
return true;
|
||
}
|
||
|
||
if ((sub = rse->rse_projection) && expression_contains_stream(sub, stream)) {
|
||
return true;
|
||
}
|
||
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
|
||
#ifdef EXPRESSION_INDICES
|
||
|
||
// Try to merge this function with node_equality() into 1 function.
|
||
|
||
static bool expression_equal(thread_db* tdbb, OptimizerBlk* opt,
|
||
const index_desc* idx, jrd_nod* node,
|
||
USHORT stream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* e x p r e s s i o n _ e q u a l
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Wrapper for expression_equal2().
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
SET_TDBB(tdbb);
|
||
|
||
if (idx && idx->idx_expression_request && idx->idx_expression)
|
||
{
|
||
fb_assert(idx->idx_flags & idx_expressn);
|
||
fb_assert(idx->idx_expression_request->req_caller == NULL);
|
||
idx->idx_expression_request->req_caller = tdbb->tdbb_request;
|
||
tdbb->tdbb_request = idx->idx_expression_request;
|
||
bool result = false;
|
||
{
|
||
Jrd::ContextPoolHolder context(tdbb, tdbb->tdbb_request->req_pool);
|
||
|
||
result = expression_equal2(tdbb, opt, idx->idx_expression,
|
||
node, stream);
|
||
}
|
||
tdbb->tdbb_request = idx->idx_expression_request->req_caller;
|
||
idx->idx_expression_request->req_caller = NULL;
|
||
|
||
return result;
|
||
}
|
||
else
|
||
return false;
|
||
}
|
||
|
||
|
||
static bool expression_equal2(thread_db* tdbb, OptimizerBlk* opt,
|
||
jrd_nod* node1, jrd_nod* node2,
|
||
USHORT stream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* e x p r e s s i o n _ e q u a l 2
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Determine if two expression trees are the same for
|
||
* the purposes of matching one half of a boolean expression
|
||
* to an index.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(node1, type_nod);
|
||
DEV_BLKCHK(node2, type_nod);
|
||
|
||
SET_TDBB(tdbb);
|
||
|
||
if (!node1 || !node2)
|
||
{
|
||
BUGCHECK(303); // msg 303 Invalid expression for evaluation.
|
||
}
|
||
|
||
if (node1->nod_type != node2->nod_type)
|
||
{
|
||
dsc dsc1, dsc2;
|
||
dsc *desc1 = &dsc1, *desc2 = &dsc2;
|
||
|
||
if (node1->nod_type == nod_cast && node2->nod_type == nod_field)
|
||
{
|
||
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
|
||
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
|
||
|
||
if (DSC_EQUIV(desc1, desc2) &&
|
||
expression_equal2(tdbb, opt, node1->nod_arg[e_cast_source],
|
||
node2, stream))
|
||
{
|
||
return true;
|
||
}
|
||
}
|
||
|
||
if (node1->nod_type == nod_field && node2->nod_type == nod_cast)
|
||
{
|
||
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
|
||
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
|
||
|
||
if (DSC_EQUIV(desc1, desc2) &&
|
||
expression_equal2(tdbb, opt, node1,
|
||
node2->nod_arg[e_cast_source], stream))
|
||
{
|
||
return true;
|
||
}
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
switch (node1->nod_type) {
|
||
case nod_add:
|
||
case nod_multiply:
|
||
case nod_add2:
|
||
case nod_multiply2:
|
||
case nod_equiv:
|
||
case nod_eql:
|
||
case nod_neq:
|
||
case nod_and:
|
||
case nod_or:
|
||
// A+B is equivilant to B+A, ditto A*B==B*A
|
||
// Note: If one expression is A+B+C, but the other is B+C+A we won't
|
||
// necessarily match them.
|
||
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
|
||
node2->nod_arg[1], stream) &&
|
||
expression_equal2(tdbb, opt, node1->nod_arg[1],
|
||
node2->nod_arg[0], stream))
|
||
{
|
||
return true;
|
||
}
|
||
// Fall into ...
|
||
case nod_subtract:
|
||
case nod_divide:
|
||
case nod_subtract2:
|
||
case nod_divide2:
|
||
case nod_concatenate:
|
||
|
||
// TODO match A > B to B <= A, etc
|
||
case nod_gtr:
|
||
case nod_geq:
|
||
case nod_leq:
|
||
case nod_lss:
|
||
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
|
||
node2->nod_arg[0], stream) &&
|
||
expression_equal2(tdbb, opt, node1->nod_arg[1],
|
||
node2->nod_arg[1], stream))
|
||
{
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_rec_version:
|
||
case nod_dbkey:
|
||
if (node1->nod_arg[0] == node2->nod_arg[0])
|
||
{
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_field:
|
||
{
|
||
const USHORT fld_stream = (USHORT)(IPTR) node2->nod_arg[e_fld_stream];
|
||
if ((node1->nod_arg[e_fld_id] == node2->nod_arg[e_fld_id]) &&
|
||
(fld_stream == stream))
|
||
{
|
||
/*
|
||
dsc dsc1, dsc2;
|
||
dsc *desc1 = &dsc1, *desc2 = &dsc2;
|
||
|
||
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
|
||
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
|
||
|
||
if (DSC_GET_COLLATE(desc1) == DSC_GET_COLLATE(desc2))
|
||
*/
|
||
return true;
|
||
}
|
||
}
|
||
break;
|
||
|
||
case nod_function:
|
||
if (node1->nod_arg[e_fun_function] &&
|
||
(node1->nod_arg[e_fun_function] == node2->nod_arg[e_fun_function]) &&
|
||
expression_equal2(tdbb, opt, node1->nod_arg[e_fun_args],
|
||
node2->nod_arg[e_fun_args], stream))
|
||
{
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_literal:
|
||
{
|
||
const dsc* desc1 = EVL_expr(tdbb, node1);
|
||
const dsc* desc2 = EVL_expr(tdbb, node2);
|
||
if (desc1 && desc2 && !MOV_compare(desc1, desc2))
|
||
{
|
||
return true;
|
||
}
|
||
}
|
||
break;
|
||
|
||
case nod_null:
|
||
case nod_user_name:
|
||
case nod_current_role:
|
||
case nod_current_time:
|
||
case nod_current_date:
|
||
case nod_current_timestamp:
|
||
return true;
|
||
|
||
case nod_between:
|
||
case nod_like:
|
||
case nod_missing:
|
||
case nod_any:
|
||
case nod_ansi_any:
|
||
case nod_ansi_all:
|
||
case nod_not:
|
||
case nod_unique:
|
||
|
||
case nod_value_if:
|
||
case nod_substr:
|
||
{
|
||
if (node1->nod_count != node2->nod_count)
|
||
{
|
||
return false;
|
||
}
|
||
for (int i = 0; i < node1->nod_count; ++i)
|
||
{
|
||
if (!expression_equal2(tdbb, opt, node1->nod_arg[i],
|
||
node2->nod_arg[i], stream))
|
||
{
|
||
return false;
|
||
}
|
||
}
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_gen_id:
|
||
case nod_gen_id2:
|
||
if (node1->nod_arg[e_gen_id] == node2->nod_arg[e_gen_id])
|
||
{
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_negate:
|
||
case nod_internal_info:
|
||
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
|
||
node2->nod_arg[0], stream))
|
||
{
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_upcase:
|
||
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
|
||
node2->nod_arg[0], stream))
|
||
{
|
||
/*
|
||
dsc dsc1, dsc2;
|
||
dsc *desc1 = &dsc1, *desc2 = &dsc2;
|
||
|
||
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
|
||
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
|
||
|
||
if (DSC_GET_COLLATE(desc1) == DSC_GET_COLLATE(desc2))
|
||
*/
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_cast:
|
||
{
|
||
dsc dsc1, dsc2;
|
||
dsc *desc1 = &dsc1, *desc2 = &dsc2;
|
||
|
||
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
|
||
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
|
||
|
||
if (DSC_EQUIV(desc1, desc2) &&
|
||
expression_equal2(tdbb, opt, node1->nod_arg[e_cast_source],
|
||
node2->nod_arg[e_cast_source], stream))
|
||
{
|
||
return true;
|
||
}
|
||
}
|
||
break;
|
||
|
||
case nod_extract:
|
||
if (node1->nod_arg[e_extract_part] == node2->nod_arg[e_extract_part] &&
|
||
expression_equal2(tdbb, opt, node1->nod_arg[e_extract_value],
|
||
node2->nod_arg[e_extract_value], stream))
|
||
{
|
||
return true;
|
||
}
|
||
break;
|
||
|
||
case nod_list:
|
||
{
|
||
jrd_nod** ptr1 = node1->nod_arg;
|
||
jrd_nod** ptr2 = node2->nod_arg;
|
||
|
||
if (node1->nod_count != node2->nod_count)
|
||
{
|
||
return false;
|
||
}
|
||
|
||
ULONG count = node1->nod_count;
|
||
|
||
while (count--)
|
||
{
|
||
if (!expression_equal2(tdbb, opt, *ptr1++, *ptr2++, stream))
|
||
{
|
||
return false;
|
||
}
|
||
}
|
||
|
||
return true;
|
||
}
|
||
|
||
// AB: New nodes has to be added
|
||
|
||
default:
|
||
break;
|
||
}
|
||
|
||
return false;
|
||
}
|
||
#endif
|
||
|
||
|
||
static void find_best(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
USHORT stream,
|
||
USHORT position,
|
||
UCHAR* streams,
|
||
const jrd_nod* plan_node,
|
||
double cost,
|
||
double cardinality)
|
||
{
|
||
/**************************************
|
||
*
|
||
* f i n d _ b e s t
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Find the best join from the passed "stream" to
|
||
* the remaining "streams" in the RecordSelExpr. This routine
|
||
* uses recursion to successively consider all
|
||
* possible join orders which use indexed
|
||
* relationships to form joins.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(plan_node, type_nod);
|
||
#ifdef OPT_DEBUG
|
||
// this is used only in development so is not in the message file.
|
||
if (opt_debug_flag >= DEBUG_PUNT) {
|
||
ERR_post(isc_random, isc_arg_string, "punt", 0);
|
||
}
|
||
#endif
|
||
// if a plan was specified, check that this order matches the order
|
||
// that the user provided; this may seem like an ass-backwards way to
|
||
// enforce ordering, but I think it is important to follow the same
|
||
// code path for SET PLAN as for a normal optimization--it reduces
|
||
// chances for bugs to be introduced, and forces the person maintaining
|
||
// the optimizer to think about SET PLAN when new features are added --deej
|
||
if (plan_node)
|
||
{
|
||
if (streams[position + 1] == stream)
|
||
{
|
||
opt->opt_streams[position].opt_best_stream = stream;
|
||
++position;
|
||
if (position < streams[0])
|
||
{
|
||
find_best(tdbb, opt, streams[position + 1], position, streams, plan_node,
|
||
(double) 0, (double) 1);
|
||
}
|
||
else
|
||
{
|
||
opt->opt_best_count = streams[0];
|
||
}
|
||
}
|
||
return;
|
||
}
|
||
|
||
// do some initializations.
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
csb->csb_rpt[stream].csb_flags |= csb_active;
|
||
const UCHAR* stream_end = &streams[1] + streams[0];
|
||
opt->opt_streams[position].opt_stream_number = stream;
|
||
++position;
|
||
OptimizerBlk::opt_stream* order_end = opt->opt_streams.begin() + position;
|
||
OptimizerBlk::opt_stream* stream_data = opt->opt_streams.begin() + stream;
|
||
|
||
// Save the various flag bits from the optimizer block to reset its
|
||
// state after each test.
|
||
Firebird::HalfStaticArray<UCHAR, OPT_STATIC_ITEMS>
|
||
stream_flags(*tdbb->getDefaultPool()), conjunct_flags(*tdbb->getDefaultPool());
|
||
stream_flags.grow(csb->csb_n_stream);
|
||
conjunct_flags.grow(opt->opt_conjuncts.getCount());
|
||
size_t i;
|
||
for (i = 0; i < stream_flags.getCount(); i++)
|
||
stream_flags[i] = opt->opt_streams[i].opt_stream_flags & opt_stream_used;
|
||
for (i = 0; i < conjunct_flags.getCount(); i++)
|
||
conjunct_flags[i] = opt->opt_conjuncts[i].opt_conjunct_flags & opt_conjunct_used;
|
||
|
||
// Compute delta and total estimate cost to fetch this stream.
|
||
double position_cost, position_cardinality, new_cost = 0, new_cardinality = 0;
|
||
|
||
if (!plan_node) {
|
||
estimate_cost(tdbb, opt, stream, &position_cost,
|
||
&position_cardinality);
|
||
new_cost = cost + cardinality * position_cost;
|
||
new_cardinality = position_cardinality * cardinality;
|
||
}
|
||
|
||
++opt->opt_combinations;
|
||
// If the partial order is either longer than any previous partial order,
|
||
// or the same length and cheap, save order as "best".
|
||
if (position > opt->opt_best_count ||
|
||
(position == opt->opt_best_count && new_cost < opt->opt_best_cost))
|
||
{
|
||
opt->opt_best_count = position;
|
||
opt->opt_best_cost = new_cost;
|
||
for (OptimizerBlk::opt_stream* tail = opt->opt_streams.begin(); tail < order_end; tail++) {
|
||
tail->opt_best_stream = tail->opt_stream_number;
|
||
}
|
||
#ifdef OPT_DEBUG
|
||
if (opt_debug_flag >= DEBUG_CANDIDATE) {
|
||
print_order(opt, position, new_cardinality, new_cost);
|
||
}
|
||
}
|
||
else {
|
||
if (opt_debug_flag >= DEBUG_ALL) {
|
||
print_order(opt, position, new_cardinality, new_cost);
|
||
}
|
||
#endif
|
||
}
|
||
// mark this stream as "used" in the sense that it is already included
|
||
// in this particular proposed stream ordering.
|
||
stream_data->opt_stream_flags |= opt_stream_used;
|
||
bool done = false;
|
||
|
||
// if we've used up all the streams there's no reason to go any further.
|
||
if (position == streams[0]) {
|
||
done = true;
|
||
}
|
||
|
||
// We need to prune the combinations to avoid spending all of our time
|
||
// recursing through find_best(). Based on experimentation, the cost of
|
||
// recursion becomes significant at about a 7 table join. Therefore,
|
||
// make a simplifying assumption that if we have already seen a join
|
||
// ordering that is lower cost than this one, give up.
|
||
if (!done && position > 4) {
|
||
OptimizerBlk::opt_stream* tail = &opt->opt_streams[position];
|
||
/* If we are the new low-cost join ordering, record that
|
||
fact. Otherwise, give up. */
|
||
if (tail->opt_best_stream_cost == 0 ||
|
||
new_cost < tail->opt_best_stream_cost)
|
||
{
|
||
tail->opt_best_stream_cost = new_cost;
|
||
}
|
||
else {
|
||
if (!plan_node) {
|
||
done = true;
|
||
}
|
||
}
|
||
}
|
||
|
||
// First, handle any streams that have direct unique indexed
|
||
// relationships to this stream. If there are any, we
|
||
// won't consider (now) indirect relationships.
|
||
if (!done) {
|
||
for (IndexedRelationship* relationship = stream_data->opt_relationships;
|
||
relationship;
|
||
relationship = relationship->irl_next)
|
||
{
|
||
if (relationship->irl_unique &&
|
||
(!(opt->opt_streams[relationship->irl_stream].opt_stream_flags & opt_stream_used)))
|
||
{
|
||
for (const UCHAR* ptr = streams + 1; ptr < stream_end; ptr++) {
|
||
if (*ptr == relationship->irl_stream) {
|
||
if (!plan_node) {
|
||
done = true;
|
||
}
|
||
find_best(tdbb, opt, relationship->irl_stream,
|
||
position, streams, plan_node, new_cost, new_cardinality);
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
// Next, handle any streams that have direct indexed relationships to this
|
||
// stream. If there are any, we won't consider (now) indirect relationships
|
||
if (!done) {
|
||
for (IndexedRelationship* relationship = stream_data->opt_relationships;
|
||
relationship;
|
||
relationship = relationship->irl_next)
|
||
{
|
||
if (!(opt->opt_streams[relationship->irl_stream].opt_stream_flags & opt_stream_used))
|
||
{
|
||
for (const UCHAR* ptr = streams + 1; ptr < stream_end; ptr++) {
|
||
if (*ptr == relationship->irl_stream) {
|
||
if (!plan_node) {
|
||
done = true;
|
||
}
|
||
find_best(tdbb, opt, relationship->irl_stream,
|
||
position, streams, plan_node, new_cost,
|
||
new_cardinality);
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
// If there were no direct relationships, look for indirect relationships
|
||
if (!done) {
|
||
for (const UCHAR* ptr = streams + 1; ptr < stream_end; ptr++) {
|
||
if (!(opt->opt_streams[*ptr].opt_stream_flags & opt_stream_used) &&
|
||
check_relationship(opt, position, *ptr))
|
||
{
|
||
find_best(tdbb, opt, *ptr, position,
|
||
streams, plan_node, new_cost, new_cardinality);
|
||
}
|
||
}
|
||
}
|
||
|
||
// Clean up from any changes made for compute the cost for this stream
|
||
csb->csb_rpt[stream].csb_flags &= ~csb_active;
|
||
for (i = 0; i < stream_flags.getCount(); i++)
|
||
opt->opt_streams[i].opt_stream_flags &= stream_flags[i];
|
||
for (i = 0; i < conjunct_flags.getCount(); i++)
|
||
opt->opt_conjuncts[i].opt_conjunct_flags &= conjunct_flags[i];
|
||
}
|
||
|
||
|
||
static jrd_nod* find_dbkey(jrd_nod* dbkey, USHORT stream, SLONG* position)
|
||
{
|
||
/**************************************
|
||
*
|
||
* f i n d _ d b k e y
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Search a dbkey (possibly a concatenated one) for
|
||
* a dbkey for specified stream.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(dbkey, type_nod);
|
||
if (dbkey->nod_type == nod_dbkey) {
|
||
if ((USHORT)(IPTR) dbkey->nod_arg[0] == stream)
|
||
return dbkey;
|
||
else {
|
||
*position = *position + 1;
|
||
return NULL;
|
||
}
|
||
}
|
||
else if (dbkey->nod_type == nod_concatenate) {
|
||
jrd_nod** ptr = dbkey->nod_arg;
|
||
for (const jrd_nod* const* const end = ptr + dbkey->nod_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
jrd_nod* dbkey_temp = find_dbkey(*ptr, stream, position);
|
||
if (dbkey_temp)
|
||
return dbkey_temp;
|
||
}
|
||
}
|
||
return NULL;
|
||
}
|
||
|
||
|
||
static USHORT find_order(thread_db* tdbb,
|
||
OptimizerBlk* opt, UCHAR* streams, const jrd_nod* plan_node)
|
||
{
|
||
/**************************************
|
||
*
|
||
* f i n d _ o r d e r
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Given a set of streams, select the "best order" to join them.
|
||
* The "best order" is defined as longest, cheapest join order
|
||
* (length, of course, takes precedence over cost). The best
|
||
* order is developed and returned in the optimization block.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(plan_node, type_nod);
|
||
opt->opt_best_count = 0;
|
||
|
||
// if a plan was specified, the order is already
|
||
// present in the streams vector, so we only want
|
||
// to try one order.
|
||
const UCHAR* stream_end;
|
||
if (plan_node) {
|
||
stream_end = &streams[1] + 1;
|
||
}
|
||
else {
|
||
stream_end = &streams[1] + streams[0];
|
||
}
|
||
|
||
// Consider each stream as the leftmost stream in the join order;
|
||
// for each stream, the best order from that stream is considered,
|
||
// and the one which is best is placed into the opt block. Thus
|
||
// at the end of this loop the opt block holds the best order.
|
||
for (const UCHAR* stream = streams + 1; stream < stream_end; stream++) {
|
||
find_best(tdbb, opt, *stream, 0, streams, plan_node,
|
||
(double) 0, (double) 1);
|
||
}
|
||
#ifdef OPT_DEBUG
|
||
if (opt_debug_flag >= DEBUG_BEST) {
|
||
const OptimizerBlk::opt_stream* const order_end =
|
||
opt->opt_streams.begin() + opt->opt_best_count;
|
||
fprintf(opt_debug_file,
|
||
"find_order() -- best_count: %2.2d, best_streams: ",
|
||
opt->opt_best_count);
|
||
for (const OptimizerBlk::opt_stream* tail = opt->opt_streams.begin();
|
||
tail < order_end; tail++)
|
||
{
|
||
fprintf(opt_debug_file, "%2.2d ", tail->opt_best_stream);
|
||
}
|
||
fprintf(opt_debug_file,
|
||
"\n\t\t\tbest_cost: %g\tcombinations: %ld\n",
|
||
opt->opt_best_cost, opt->opt_combinations);
|
||
}
|
||
#endif
|
||
|
||
return opt->opt_best_count;
|
||
}
|
||
|
||
|
||
static void find_rsbs(RecordSource* rsb, StreamStack* stream_list, RsbStack* rsb_list)
|
||
{
|
||
/**************************************
|
||
*
|
||
* f i n d _ r s b s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Find all rsbs at or below the current one that map
|
||
* to a single stream. Save the stream numbers in a list.
|
||
* For unions/aggregates/procedures also save the rsb pointer.
|
||
*
|
||
**************************************/
|
||
#ifdef DEV_BUILD
|
||
DEV_BLKCHK(rsb, type_rsb);
|
||
#endif
|
||
|
||
if (!rsb) {
|
||
return;
|
||
}
|
||
|
||
RecordSource** ptr;
|
||
const RecordSource* const* end;
|
||
|
||
switch (rsb->rsb_type) {
|
||
case rsb_union:
|
||
case rsb_aggregate:
|
||
case rsb_procedure:
|
||
if (rsb_list) {
|
||
rsb_list->push(rsb);
|
||
}
|
||
case rsb_indexed:
|
||
case rsb_sequential:
|
||
case rsb_ext_sequential:
|
||
case rsb_ext_indexed:
|
||
// No need to go any farther down with these.
|
||
stream_list->push(rsb->rsb_stream);
|
||
return;
|
||
|
||
case rsb_cross:
|
||
// Loop through the sub-streams.
|
||
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count; ptr < end; ptr++) {
|
||
find_rsbs(*ptr, stream_list, rsb_list);
|
||
}
|
||
break;
|
||
|
||
case rsb_left_cross:
|
||
find_rsbs(rsb->rsb_arg[RSB_LEFT_outer], stream_list, rsb_list);
|
||
find_rsbs(rsb->rsb_arg[RSB_LEFT_inner], stream_list, rsb_list);
|
||
break;
|
||
|
||
case rsb_merge:
|
||
// Loop through the sub-streams
|
||
|
||
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count * 2;
|
||
ptr < end; ptr += 2)
|
||
{
|
||
find_rsbs(*ptr, stream_list, rsb_list);
|
||
}
|
||
break;
|
||
|
||
default: // Shut up compiler warnings
|
||
break;
|
||
}
|
||
|
||
find_rsbs(rsb->rsb_next, stream_list, rsb_list);
|
||
}
|
||
|
||
|
||
static void find_used_streams(const RecordSource* rsb, UCHAR* streams)
|
||
{
|
||
/**************************************
|
||
*
|
||
* f i n d _ u s e d _ s t r e a m s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Find all streams through the given rsb
|
||
* and add them to the stream list.
|
||
*
|
||
**************************************/
|
||
if (!(rsb)) {
|
||
return;
|
||
}
|
||
|
||
const RecordSource* const* ptr;
|
||
const RecordSource* const* end;
|
||
USHORT stream;
|
||
bool found = false;
|
||
|
||
switch (rsb->rsb_type) {
|
||
|
||
case rsb_aggregate:
|
||
case rsb_ext_indexed:
|
||
case rsb_ext_sequential:
|
||
case rsb_indexed:
|
||
case rsb_navigate:
|
||
case rsb_procedure:
|
||
case rsb_sequential:
|
||
case rsb_union:
|
||
stream = rsb->rsb_stream;
|
||
found = true;
|
||
break;
|
||
|
||
case rsb_cross:
|
||
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count; ptr < end; ptr++) {
|
||
find_used_streams(*ptr, streams);
|
||
}
|
||
break;
|
||
|
||
case rsb_merge:
|
||
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count * 2; ptr < end; ptr += 2) {
|
||
find_used_streams(*ptr, streams);
|
||
}
|
||
break;
|
||
|
||
case rsb_left_cross:
|
||
find_used_streams(rsb->rsb_arg[RSB_LEFT_inner], streams);
|
||
find_used_streams(rsb->rsb_arg[RSB_LEFT_outer], streams);
|
||
break;
|
||
|
||
default: // Shut up compiler warnings.
|
||
break;
|
||
}
|
||
|
||
if (rsb->rsb_next) {
|
||
find_used_streams(rsb->rsb_next, streams);
|
||
}
|
||
|
||
if (found) {
|
||
found = false;
|
||
for (USHORT i = 1; i <= streams[0]; i++) {
|
||
if (stream == streams[i]) {
|
||
found = true;
|
||
break;
|
||
}
|
||
}
|
||
if (!found) {
|
||
streams[++streams[0]] = stream;
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
static void form_rivers(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
UCHAR* streams,
|
||
RiverStack& river_stack,
|
||
jrd_nod** sort_clause,
|
||
jrd_nod** project_clause,
|
||
jrd_nod* plan_clause)
|
||
{
|
||
/**************************************
|
||
*
|
||
* f o r m _ r i v e r s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Form streams into rivers according
|
||
* to the user-specified plan.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
DEV_BLKCHK(opt, type_opt);
|
||
if (sort_clause) {
|
||
DEV_BLKCHK(*sort_clause, type_nod);
|
||
}
|
||
if (project_clause) {
|
||
DEV_BLKCHK(*project_clause, type_nod);
|
||
}
|
||
DEV_BLKCHK(plan_clause, type_nod);
|
||
|
||
stream_array_t temp;
|
||
temp[0] = 0;
|
||
USHORT count = plan_clause->nod_count;
|
||
|
||
// this must be a join or a merge node, so go through
|
||
// the substreams and place them into the temp vector
|
||
// for formation into a river.
|
||
jrd_nod* plan_node = 0;
|
||
jrd_nod** ptr = plan_clause->nod_arg;
|
||
for (const jrd_nod* const* const end = ptr + count; ptr < end; ptr++) {
|
||
plan_node = *ptr;
|
||
if (plan_node->nod_type == nod_merge || plan_node->nod_type == nod_join) {
|
||
form_rivers(tdbb, opt, streams, river_stack, sort_clause,
|
||
project_clause, plan_node);
|
||
continue;
|
||
}
|
||
|
||
// at this point we must have a retrieval node, so put
|
||
// the stream into the river.
|
||
temp[0]++;
|
||
const jrd_nod* relation_node = plan_node->nod_arg[e_retrieve_relation];
|
||
temp[temp[0]] = (UCHAR)(IPTR) relation_node->nod_arg[e_rel_stream];
|
||
}
|
||
|
||
// just because the user specified a join does not mean that
|
||
// we are able to form a river; thus form as many rivers out
|
||
// of the join are as necessary to exhaust the streams.
|
||
// AB: Only form rivers when any retrieval node is seen, for
|
||
// example a MERGE on two JOINs will come with no retrievals
|
||
// at this point.
|
||
// CVC: Notice "plan_node" is pointing to the last element in the loop above.
|
||
// If the loop didn't execute, we had garbage in "plan_node".
|
||
if (temp[0] != 0) {
|
||
do {
|
||
count = find_order(tdbb, opt, temp, plan_node);
|
||
} while (form_river
|
||
(tdbb, opt, count, streams, temp, river_stack, sort_clause,
|
||
project_clause, 0));
|
||
}
|
||
}
|
||
|
||
|
||
static bool form_river(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
USHORT count,
|
||
UCHAR* streams,
|
||
UCHAR* temp,
|
||
RiverStack& river_stack,
|
||
jrd_nod** sort_clause,
|
||
jrd_nod** project_clause,
|
||
jrd_nod* plan_clause)
|
||
{
|
||
/**************************************
|
||
*
|
||
* f o r m _ r i v e r
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Form streams into rivers (combinations of streams).
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
if (sort_clause) {
|
||
DEV_BLKCHK(*sort_clause, type_nod);
|
||
}
|
||
if (project_clause) {
|
||
DEV_BLKCHK(*project_clause, type_nod);
|
||
}
|
||
DEV_BLKCHK(plan_clause, type_nod);
|
||
|
||
SET_TDBB(tdbb);
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
|
||
// Allocate a river block and move the best order into it.
|
||
River* river = FB_NEW_RPT(*tdbb->getDefaultPool(), count) River();
|
||
river_stack.push(river);
|
||
river->riv_count = (UCHAR) count;
|
||
|
||
RecordSource* rsb;
|
||
RecordSource** ptr;
|
||
|
||
if (count == 1) {
|
||
rsb = NULL;
|
||
ptr = &river->riv_rsb;
|
||
}
|
||
else {
|
||
river->riv_rsb = rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), count) RecordSource();
|
||
rsb->rsb_type = rsb_cross;
|
||
rsb->rsb_count = count;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
|
||
ptr = rsb->rsb_arg;
|
||
}
|
||
|
||
UCHAR* stream = river->riv_streams;
|
||
const OptimizerBlk::opt_stream* const opt_end = opt->opt_streams.begin() + count;
|
||
if (count != streams[0]) {
|
||
sort_clause = project_clause = NULL;
|
||
}
|
||
|
||
OptimizerBlk::opt_stream* tail;
|
||
|
||
for (tail = opt->opt_streams.begin(); tail < opt_end; tail++, stream++, ptr++) {
|
||
*stream = (UCHAR) tail->opt_best_stream;
|
||
*ptr = gen_retrieval(tdbb, opt, *stream, sort_clause, project_clause,
|
||
false, false, NULL);
|
||
sort_clause = project_clause = NULL;
|
||
}
|
||
|
||
// determine whether the rsb we just made should be marked as a projection.
|
||
if (rsb && rsb->rsb_arg[0]
|
||
&& ((RecordSource*) rsb->rsb_arg[0])->rsb_flags & rsb_project)
|
||
{
|
||
rsb->rsb_flags |= rsb_project;
|
||
}
|
||
set_made_river(opt, river);
|
||
set_inactive(opt, river);
|
||
|
||
// Reform "temp" from streams not consumed.
|
||
stream = temp + 1;
|
||
UCHAR* end_stream = stream + temp[0];
|
||
if (!(temp[0] -= count)) {
|
||
return false;
|
||
}
|
||
|
||
for (UCHAR* t2 = stream; t2 < end_stream; t2++) {
|
||
for (tail = opt->opt_streams.begin(); tail < opt_end; tail++) {
|
||
if (*t2 == tail->opt_best_stream) {
|
||
goto used;
|
||
}
|
||
}
|
||
*stream++ = *t2;
|
||
used:;
|
||
}
|
||
|
||
return true;
|
||
}
|
||
|
||
|
||
|
||
static RecordSource* gen_aggregate(thread_db* tdbb, OptimizerBlk* opt, jrd_nod* node)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ a g g r e g a t e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Generate an RecordSource (Record Source Block) for each aggregate operation.
|
||
* Generate an AggregateSort (Aggregate Sort Block) for each DISTINCT aggregate.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(node, type_nod);
|
||
SET_TDBB(tdbb);
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
RecordSelExpr* rse = (RecordSelExpr*) node->nod_arg[e_agg_rse];
|
||
rse->rse_sorted = node->nod_arg[e_agg_group];
|
||
|
||
// try to optimize MAX and MIN to use an index; for now, optimize
|
||
// only the simplest case, although it is probably possible
|
||
// to use an index in more complex situations
|
||
|
||
jrd_nod** ptr;
|
||
jrd_nod* agg_operator;
|
||
jrd_nod* map = node->nod_arg[e_agg_map];
|
||
if ((map->nod_count == 1) &&
|
||
(ptr = map->nod_arg) &&
|
||
(agg_operator = (*ptr)->nod_arg[e_asgn_from]) &&
|
||
(agg_operator->nod_type == nod_agg_min ||
|
||
agg_operator->nod_type == nod_agg_max))
|
||
{
|
||
/* generate a sort block which the optimizer will try to map to an index */
|
||
|
||
jrd_nod* aggregate = PAR_make_node(tdbb, 3);
|
||
aggregate->nod_type = nod_sort;
|
||
aggregate->nod_count = 1;
|
||
aggregate->nod_arg[0] = agg_operator->nod_arg[e_asgn_from];
|
||
/* in the max case, flag the sort as descending */
|
||
if (agg_operator->nod_type == nod_agg_max) {
|
||
aggregate->nod_arg[1] = (jrd_nod*) TRUE;
|
||
}
|
||
/* 10-Aug-2004. Nickolay Samofatov
|
||
Unneeded nulls seem to be skipped somehow. */
|
||
aggregate->nod_arg[2] = (jrd_nod*) rse_nulls_default;
|
||
rse->rse_aggregate = aggregate;
|
||
}
|
||
|
||
// allocate and optimize the record source block
|
||
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
|
||
rsb->rsb_type = rsb_aggregate;
|
||
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_STREAMS);
|
||
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_UCHAR);
|
||
rsb->rsb_stream = (UCHAR) (IPTR) node->nod_arg[e_agg_stream];
|
||
rsb->rsb_format = csb->csb_rpt[rsb->rsb_stream].csb_format;
|
||
rsb->rsb_next = OPT_compile(tdbb, csb, rse, NULL);
|
||
rsb->rsb_arg[0] = (RecordSource*) node;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
|
||
|
||
if (rse->rse_aggregate)
|
||
{
|
||
// The rse_aggregate is still set. That means the optimizer
|
||
// was able to match the field to an index, so flag that fact
|
||
// so that it can be handled in EVL_group
|
||
if (agg_operator->nod_type == nod_agg_min) {
|
||
agg_operator->nod_type = nod_agg_min_indexed;
|
||
}
|
||
else if (agg_operator->nod_type == nod_agg_max) {
|
||
agg_operator->nod_type = nod_agg_max_indexed;
|
||
}
|
||
}
|
||
|
||
// Now generate a separate AggregateSort (Aggregate Sort Block) for each
|
||
// distinct operation;
|
||
// note that this should be optimized to use indices if possible
|
||
|
||
DSC descriptor;
|
||
DSC* desc = &descriptor;
|
||
ptr = map->nod_arg;
|
||
for (const jrd_nod* const* const end = ptr + map->nod_count; ptr < end; ptr++)
|
||
{
|
||
jrd_nod* from = (*ptr)->nod_arg[e_asgn_from];
|
||
if ((from->nod_type == nod_agg_count_distinct) ||
|
||
(from->nod_type == nod_agg_total_distinct) ||
|
||
(from->nod_type == nod_agg_total_distinct2) ||
|
||
(from->nod_type == nod_agg_average_distinct2) ||
|
||
(from->nod_type == nod_agg_average_distinct))
|
||
{
|
||
const USHORT count = asb_delta + 1 +
|
||
(sizeof(sort_key_def) + sizeof(jrd_nod**) - 1) / sizeof(jrd_nod**);
|
||
AggregateSort* asb = (AggregateSort*) PAR_make_node(tdbb, count);
|
||
asb->nod_type = nod_asb;
|
||
asb->nod_count = 0;
|
||
/* build the sort key definition. Turn varying text and
|
||
cstrings into text */
|
||
CMP_get_desc(tdbb, csb, from->nod_arg[0], desc);
|
||
if (desc->dsc_dtype == dtype_varying) {
|
||
desc->dsc_dtype = dtype_text;
|
||
desc->dsc_length -= sizeof(USHORT);
|
||
}
|
||
else if (desc->dsc_dtype == dtype_cstring) {
|
||
desc->dsc_dtype = dtype_text;
|
||
desc->dsc_length--;
|
||
}
|
||
|
||
sort_key_def* sort_key = asb->asb_key_desc = (sort_key_def*) asb->asb_key_data;
|
||
sort_key->skd_offset = 0;
|
||
// UCHAR desc->dsc_dtype is always >=0
|
||
// fb_assert(desc->dsc_dtype >= 0)
|
||
fb_assert(desc->dsc_dtype < FB_NELEM(sort_dtypes));
|
||
sort_key->skd_dtype = sort_dtypes[desc->dsc_dtype];
|
||
/* as it is legal to have skd_dtype = 0
|
||
I have removed these asserts, to avoid
|
||
server restarts in debug mode.
|
||
FSG 18.Dec.2000
|
||
*/
|
||
/*fb_assert (sort_key->skd_dtype != 0); */
|
||
sort_key->skd_length = desc->dsc_length;
|
||
sort_key->skd_flags = SKD_ascending;
|
||
asb->nod_impure = CMP_impure(csb, sizeof(impure_agg_sort));
|
||
asb->asb_desc = *desc;
|
||
from->nod_arg[1] = (jrd_nod*) asb;
|
||
from->nod_count = 2;
|
||
}
|
||
}
|
||
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_boolean(thread_db* tdbb, OptimizerBlk* opt,
|
||
RecordSource* prior_rsb, jrd_nod* node)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ b o o l e a n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Compile and optimize a record selection expression into a
|
||
* set of record source blocks (rsb's).
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(node, type_nod);
|
||
DEV_BLKCHK(prior_rsb, type_rsb);
|
||
SET_TDBB(tdbb);
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
|
||
rsb->rsb_count = 1;
|
||
rsb->rsb_type = rsb_boolean;
|
||
rsb->rsb_next = prior_rsb;
|
||
rsb->rsb_arg[0] = (RecordSource*) node;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_first(thread_db* tdbb, OptimizerBlk* opt,
|
||
RecordSource* prior_rsb, jrd_nod* node)
|
||
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ f i r s t
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Compile and optimize a record selection expression into a
|
||
* set of record source blocks (rsb's).
|
||
*
|
||
*
|
||
* NOTE: The rsb_first node MUST appear in the rsb list before the
|
||
* rsb_skip node. The calling code MUST call gen_first after
|
||
* gen_skip.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(prior_rsb, type_rsb);
|
||
DEV_BLKCHK(node, type_nod);
|
||
SET_TDBB(tdbb);
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
|
||
rsb->rsb_count = 1;
|
||
rsb->rsb_type = rsb_first;
|
||
rsb->rsb_next = prior_rsb;
|
||
rsb->rsb_arg[0] = (RecordSource*) node;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb_first_n));
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static void gen_join(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
UCHAR* streams,
|
||
RiverStack& river_stack,
|
||
jrd_nod** sort_clause,
|
||
jrd_nod** project_clause,
|
||
jrd_nod* plan_clause)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ j o i n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Find all indexed relationships between streams,
|
||
* then form streams into rivers (combinations of
|
||
* streams).
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(*sort_clause, type_nod);
|
||
DEV_BLKCHK(*project_clause, type_nod);
|
||
DEV_BLKCHK(plan_clause, type_nod);
|
||
SET_TDBB(tdbb);
|
||
|
||
Database* dbb = tdbb->tdbb_database;
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
|
||
if (!streams[0]) {
|
||
return;
|
||
}
|
||
|
||
// If there is only a single stream, don't bother with a join.
|
||
if (streams[0] == 1) {
|
||
// if a nod_cardinality references this stream,
|
||
// compute the cardinality even though we don't
|
||
// need it to optimize retrieval.
|
||
|
||
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[streams[1]];
|
||
fb_assert(csb_tail);
|
||
if (csb_tail->csb_flags & csb_compute) {
|
||
jrd_rel* relation = csb_tail->csb_relation;
|
||
fb_assert(relation);
|
||
const Format* format = CMP_format(tdbb, csb, streams[1]);
|
||
fb_assert(format);
|
||
csb_tail->csb_cardinality =
|
||
(float) DPM_data_pages(tdbb, relation) *
|
||
dbb->dbb_page_size / format->fmt_length;
|
||
}
|
||
|
||
River* river = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) River();
|
||
river->riv_count = 1;
|
||
|
||
fb_assert(csb->csb_rpt[streams[1]].csb_relation);
|
||
|
||
river->riv_rsb =
|
||
gen_retrieval(tdbb, opt, streams[1], sort_clause, project_clause,
|
||
false, false, NULL);
|
||
river->riv_streams[0] = streams[1];
|
||
river_stack.push(river);
|
||
return;
|
||
}
|
||
|
||
// Compute cardinality and indexed relationships for all streams.
|
||
const UCHAR* end_stream = streams + 1 + streams[0];
|
||
for (UCHAR* stream = streams + 1; stream < end_stream; stream++) {
|
||
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[*stream];
|
||
fb_assert(csb_tail);
|
||
jrd_rel* relation = csb_tail->csb_relation;
|
||
fb_assert(relation);
|
||
const Format* format = CMP_format(tdbb, csb, *stream);
|
||
// if this is an external file, set an arbitrary cardinality;
|
||
// if a plan was specified, don't bother computing cardinality;
|
||
// otherwise give a rough estimate based on the number of data
|
||
// pages times the estimated number of records per page -- note
|
||
// this is an upper limit since all pages are probably not full
|
||
// and many of the records on page may be back versions.
|
||
if (relation->rel_file) {
|
||
csb_tail->csb_cardinality = (float) 10000;
|
||
}
|
||
else if (plan_clause) {
|
||
csb_tail->csb_cardinality = (float) 0;
|
||
}
|
||
else {
|
||
fb_assert(format);
|
||
csb_tail->csb_cardinality =
|
||
(float) DPM_data_pages(tdbb, relation) *
|
||
dbb->dbb_page_size / format->fmt_length;
|
||
}
|
||
|
||
// find indexed relationships from this stream to every other stream
|
||
OptimizerBlk::opt_stream* tail = opt->opt_streams.begin() + *stream;
|
||
csb_tail->csb_flags |= csb_active;
|
||
for (UCHAR* t2 = streams + 1; t2 < end_stream; t2++) {
|
||
if (*t2 != *stream) {
|
||
CompilerScratch::csb_repeat* csb_tail2 = &csb->csb_rpt[*t2];
|
||
csb_tail2->csb_flags |= csb_active;
|
||
IndexedRelationship* relationship = indexed_relationship(tdbb, opt, *t2);
|
||
if (relationship) {
|
||
relationship->irl_next = tail->opt_relationships;
|
||
tail->opt_relationships = relationship;
|
||
relationship->irl_stream = *t2;
|
||
}
|
||
csb_tail2->csb_flags &= ~csb_active;
|
||
}
|
||
}
|
||
csb_tail->csb_flags &= ~csb_active;
|
||
|
||
#ifdef OPT_DEBUG
|
||
if (opt_debug_flag >= DEBUG_RELATIONSHIPS) {
|
||
fprintf(opt_debug_file,
|
||
"gen_join () -- relationships from stream %2.2d: ",
|
||
*stream);
|
||
for (IndexedRelationship* relationship = tail->opt_relationships;
|
||
relationship;
|
||
relationship = relationship->irl_next)
|
||
{
|
||
fprintf(opt_debug_file, "%2.2d %s ",
|
||
relationship->irl_stream,
|
||
(relationship->irl_unique) ? "(unique)" : "");
|
||
}
|
||
fprintf(opt_debug_file, "\n");
|
||
}
|
||
#endif
|
||
}
|
||
|
||
// if the user specified a plan, force a join order;
|
||
// otherwise try to find one
|
||
if (plan_clause) {
|
||
form_rivers(tdbb, opt, streams, river_stack, sort_clause,
|
||
project_clause, plan_clause);
|
||
}
|
||
else {
|
||
// copy the streams vector to a temporary space to be used
|
||
// to form rivers out of streams
|
||
stream_array_t temp;
|
||
MOVE_FAST(streams, temp, streams[0] + 1);
|
||
|
||
USHORT count;
|
||
do {
|
||
count = find_order(tdbb, opt, temp, 0);
|
||
} while (form_river
|
||
(tdbb, opt, count, streams, temp, river_stack,
|
||
sort_clause, project_clause, 0));
|
||
}
|
||
}
|
||
|
||
|
||
static RecordSource* gen_navigation(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
USHORT stream,
|
||
jrd_rel* relation, str* alias, index_desc* idx, jrd_nod** sort_ptr)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ n a v i g a t i o n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* See if a navigational walk of an index is in order. If so,
|
||
* generate the appropriate RecordSource and zap the sort pointer. If
|
||
* not, return NULL. Prior to ODS7, missing values sorted in
|
||
* the wrong place for ascending indices, so don't use them.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(relation, type_rel);
|
||
DEV_BLKCHK(alias, type_str);
|
||
DEV_BLKCHK(*sort_ptr, type_nod);
|
||
|
||
Database* dbb = tdbb->tdbb_database;
|
||
|
||
// Check sort order against index. If they don't match, give up and
|
||
// go home. Also don't bother if we have a non-unique index.
|
||
// This is because null values aren't placed in a "good" spot in
|
||
// the index in versions prior to V3.2.
|
||
jrd_nod* sort = *sort_ptr;
|
||
|
||
// if the number of fields in the sort is greater than the number of
|
||
// fields in the index, the index will not be used to optimize the
|
||
// sort--note that in the case where the first field is unique, this
|
||
// could be optimized, since the sort will be performed correctly by
|
||
// navigating on a unique index on the first field--deej
|
||
if (sort->nod_count > idx->idx_count) {
|
||
return NULL;
|
||
}
|
||
|
||
// not sure the significance of this magic number; if it's meant to
|
||
// signify that we shouldn't navigate on a system table, our catalog
|
||
// has grown beyond 16 tables--it doesn't seem like a problem
|
||
// to allow navigating through system tables, so I won't bump the
|
||
// number up, but I'll leave it at 16 for safety's sake--deej
|
||
if (relation->rel_id <= 16) {
|
||
return NULL;
|
||
}
|
||
|
||
// if the user-specified access plan for this request didn't
|
||
// mention this index, forget it
|
||
if ((idx->idx_runtime_flags & idx_plan_dont_use) &&
|
||
!(idx->idx_runtime_flags & idx_plan_navigate))
|
||
{
|
||
return NULL;
|
||
}
|
||
|
||
// check to see if the fields in the sort match the fields in the index
|
||
// in the exact same order--we used to check for ascending/descending prior
|
||
// to SCROLLABLE_CURSORS, but now descending sorts can use ascending indices
|
||
// and vice versa.
|
||
#ifdef SCROLLABLE_CURSORS
|
||
RSE_GET_MODE mode;
|
||
RSE_GET_MODE last_mode = RSE_get_next;
|
||
#endif
|
||
|
||
index_desc::idx_repeat* idx_tail = idx->idx_rpt;
|
||
jrd_nod** ptr = sort->nod_arg;
|
||
for (const jrd_nod* const* const end = ptr + sort->nod_count; ptr < end;
|
||
ptr++, idx_tail++)
|
||
{
|
||
jrd_nod* node = *ptr;
|
||
if (node->nod_type != nod_field
|
||
|| (USHORT)(IPTR) node->nod_arg[e_fld_stream] != stream
|
||
|| (USHORT)(IPTR) node->nod_arg[e_fld_id] != idx_tail->idx_field
|
||
// for ODS11 default nulls placement always may be matched to index
|
||
|| (dbb->dbb_ods_version >= ODS_VERSION11 && (
|
||
(reinterpret_cast<IPTR>(ptr[2*sort->nod_count]) == rse_nulls_first && ptr[sort->nod_count])
|
||
|| (reinterpret_cast<IPTR>(ptr[2*sort->nod_count]) == rse_nulls_last && !ptr[sort->nod_count])))
|
||
// for ODS10 and earlier indices always placed nulls at the end of dataset
|
||
|| (dbb->dbb_ods_version < ODS_VERSION11 &&
|
||
reinterpret_cast<IPTR>(ptr[2*sort->nod_count]) == rse_nulls_first)
|
||
#ifdef SCROLLABLE_CURSORS
|
||
)
|
||
#else
|
||
|| (ptr[sort->nod_count]
|
||
&& !(idx->idx_flags & idx_descending))
|
||
|| (!ptr[sort->nod_count]
|
||
&& (idx->idx_flags & idx_descending)) )
|
||
#endif
|
||
{
|
||
return NULL;
|
||
}
|
||
#ifdef SCROLLABLE_CURSORS
|
||
// determine whether we ought to navigate backwards or forwards through
|
||
// the index--we can't allow navigating one index in two different directions
|
||
// on two different fields at the same time!
|
||
mode = ((ptr[sort->nod_count] && !(idx->idx_flags & idx_descending))
|
||
|| (!ptr[sort->nod_count]
|
||
&& (idx->
|
||
idx_flags & idx_descending))) ? RSE_get_backward :
|
||
RSE_get_forward;
|
||
if (last_mode == RSE_get_next) {
|
||
last_mode = mode;
|
||
}
|
||
else if (last_mode != mode) {
|
||
return NULL;
|
||
}
|
||
#endif
|
||
}
|
||
|
||
// Looks like we can do a navigational walk. Flag that
|
||
// we have used this index for navigation, and allocate
|
||
// a navigational rsb for it.
|
||
*sort_ptr = NULL;
|
||
idx->idx_runtime_flags |= idx_navigate;
|
||
return gen_nav_rsb(tdbb, opt, stream, relation, alias, idx
|
||
#ifdef SCROLLABLE_CURSORS
|
||
, mode
|
||
#endif
|
||
);
|
||
}
|
||
|
||
|
||
static RecordSource* gen_nav_rsb(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
USHORT stream, jrd_rel* relation, str* alias, index_desc* idx
|
||
#ifdef SCROLLABLE_CURSORS
|
||
, RSE_GET_MODE mode
|
||
#endif
|
||
)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ n a v _ r s b
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Generate a navigational rsb, either
|
||
* for a compile or for a set index.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(relation, type_rel);
|
||
DEV_BLKCHK(alias, type_str);
|
||
SET_TDBB(tdbb);
|
||
|
||
USHORT key_length = ROUNDUP(BTR_key_length(relation, idx), sizeof(SLONG));
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), RSB_NAV_count) RecordSource();
|
||
rsb->rsb_type = rsb_navigate;
|
||
rsb->rsb_relation = relation;
|
||
rsb->rsb_stream = (UCHAR) stream;
|
||
rsb->rsb_alias = alias;
|
||
rsb->rsb_arg[RSB_NAV_index] = (RecordSource*) OPT_make_index(tdbb, opt, relation, idx);
|
||
rsb->rsb_arg[RSB_NAV_key_length] = (RecordSource*) (IPTR) key_length;
|
||
|
||
#ifdef SCROLLABLE_CURSORS
|
||
// indicate that the index needs to be navigated in a mirror-image
|
||
// fashion; that when the user wants to go backwards we actually go
|
||
// forwards and vice versa
|
||
if (mode == RSE_get_backward) {
|
||
rsb->rsb_flags |= rsb_descending;
|
||
}
|
||
#endif
|
||
|
||
// if this is a blr_stream, adjust the allocated impure area
|
||
// to be based on the maximum key size so that the index may be
|
||
// reset at any time to another index of larger key length
|
||
// without adjusting the impure area offsets
|
||
if (opt->opt_g_flags & opt_g_stream) {
|
||
key_length = MAX_KEY;
|
||
}
|
||
const USHORT size = nav_rsb_size(rsb, key_length, 0);
|
||
rsb->rsb_impure = CMP_impure(opt->opt_csb, size);
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_outer(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
RecordSelExpr* rse,
|
||
RiverStack& river_stack, jrd_nod** sort_clause, jrd_nod** project_clause)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ o u t e r
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Generate a top level outer join. The "outer" and "inner"
|
||
* sub-streams must be handled differently from each other.
|
||
* The inner is like other streams. The outer stream isn't
|
||
* because conjuncts may not eliminate records from the
|
||
* stream. They only determine if a join with an inner
|
||
* stream record is to be attempted.
|
||
*
|
||
**************************************/
|
||
struct {
|
||
RecordSource* stream_rsb;
|
||
USHORT stream_num;
|
||
} stream_o, stream_i, *stream_ptr[2];
|
||
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(rse, type_nod);
|
||
DEV_BLKCHK(*sort_clause, type_nod);
|
||
SET_TDBB(tdbb);
|
||
|
||
// Determine which stream should be outer and which is inner.
|
||
// In the case of a left join, the syntactically left stream is the
|
||
// outer, and the right stream is the inner. For all others, swap
|
||
// the sense of inner and outer, though for a full join it doesn't
|
||
// matter and we should probably try both orders to see which is
|
||
// more efficient.
|
||
if (rse->rse_jointype != blr_left) {
|
||
stream_ptr[1] = &stream_o;
|
||
stream_ptr[0] = &stream_i;
|
||
}
|
||
else {
|
||
stream_ptr[0] = &stream_o;
|
||
stream_ptr[1] = &stream_i;
|
||
}
|
||
|
||
// Loop through the outer join sub-streams in
|
||
// reverse order because rivers may have been PUSHed
|
||
River* river;
|
||
SSHORT i;
|
||
jrd_nod* node;
|
||
for (i = 1; i >= 0; i--) {
|
||
node = rse->rse_relation[i];
|
||
if (node->nod_type == nod_union ||
|
||
node->nod_type == nod_aggregate ||
|
||
node->nod_type == nod_procedure || node->nod_type == nod_rse)
|
||
{
|
||
river = river_stack.pop();
|
||
stream_ptr[i]->stream_rsb = river->riv_rsb;
|
||
}
|
||
else {
|
||
stream_ptr[i]->stream_rsb = NULL;
|
||
stream_ptr[i]->stream_num =
|
||
(USHORT)(IPTR) node->nod_arg[STREAM_INDEX(node)];
|
||
}
|
||
}
|
||
|
||
// Generate rsbs for the sub-streams. For the left sub-stream
|
||
// we also will get a boolean back
|
||
jrd_nod* boolean = NULL;
|
||
jrd_nod* inner_boolean = NULL;
|
||
if (!stream_o.stream_rsb) {
|
||
stream_o.stream_rsb =
|
||
gen_retrieval(tdbb, opt, stream_o.stream_num, sort_clause,
|
||
project_clause, true, false, &boolean);
|
||
}
|
||
|
||
// in the case of a full join, we must make sure we don't exclude record from
|
||
// the inner stream; otherwise just retrieve it as we would for an inner join
|
||
if (!stream_i.stream_rsb)
|
||
{
|
||
const bool bFullJoin = rse->rse_jointype == blr_full;
|
||
const bool bOuter = bFullJoin;
|
||
jrd_nod** ppNod = bFullJoin ? &inner_boolean : 0;
|
||
stream_i.stream_rsb =
|
||
gen_retrieval(tdbb,
|
||
opt,
|
||
stream_i.stream_num,
|
||
sort_clause,
|
||
project_clause,
|
||
bOuter,
|
||
true,
|
||
ppNod);
|
||
}
|
||
|
||
// generate a parent boolean rsb for any remaining booleans that
|
||
// were not satisfied via an index lookup
|
||
stream_i.stream_rsb = gen_residual_boolean(tdbb, opt, stream_i.stream_rsb);
|
||
|
||
// Allocate and fill in the rsb
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), RSB_LEFT_count) RecordSource();
|
||
rsb->rsb_type = rsb_left_cross;
|
||
rsb->rsb_count = 2;
|
||
rsb->rsb_impure = CMP_impure(opt->opt_csb, sizeof(struct irsb));
|
||
rsb->rsb_arg[RSB_LEFT_outer] = stream_o.stream_rsb;
|
||
rsb->rsb_arg[RSB_LEFT_inner] = stream_i.stream_rsb;
|
||
rsb->rsb_arg[RSB_LEFT_boolean] = (RecordSource*) boolean;
|
||
rsb->rsb_arg[RSB_LEFT_inner_boolean] = (RecordSource*) inner_boolean;
|
||
rsb->rsb_left_streams =
|
||
FB_NEW(*tdbb->getDefaultPool()) StreamStack(*tdbb->getDefaultPool());
|
||
rsb->rsb_left_inner_streams =
|
||
FB_NEW(*tdbb->getDefaultPool()) StreamStack(*tdbb->getDefaultPool());
|
||
rsb->rsb_left_rsbs =
|
||
FB_NEW(*tdbb->getDefaultPool()) RsbStack(*tdbb->getDefaultPool());
|
||
// find all the outer and inner substreams and push them on a stack.
|
||
find_rsbs(stream_i.stream_rsb,
|
||
rsb->rsb_left_streams,
|
||
rsb->rsb_left_rsbs);
|
||
if (rse->rse_jointype == blr_full) {
|
||
find_rsbs(stream_o.stream_rsb,
|
||
rsb->rsb_left_inner_streams, NULL);
|
||
}
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_procedure(thread_db* tdbb, OptimizerBlk* opt, jrd_nod* node)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ p r o c e d u r e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Compile and optimize a record selection expression into a
|
||
* set of record source blocks (rsb's).
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(node, type_nod);
|
||
SET_TDBB(tdbb);
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
jrd_prc* procedure = MET_lookup_procedure_id(tdbb,
|
||
(SSHORT)(IPTR)node->nod_arg[e_prc_procedure], false, false, 0);
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), RSB_PRC_count) RecordSource();
|
||
rsb->rsb_type = rsb_procedure;
|
||
rsb->rsb_stream = (UCHAR)(IPTR) node->nod_arg[e_prc_stream];
|
||
rsb->rsb_procedure = procedure;
|
||
rsb->rsb_format = procedure->prc_format;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb_procedure));
|
||
rsb->rsb_arg[RSB_PRC_inputs] = (RecordSource*) node->nod_arg[e_prc_inputs];
|
||
rsb->rsb_arg[RSB_PRC_in_msg] = (RecordSource*) node->nod_arg[e_prc_in_msg];
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_residual_boolean(thread_db* tdbb, OptimizerBlk* opt,
|
||
RecordSource* prior_rsb)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ r e s i d u a l _ b o o l e a n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Pick up any residual boolean remaining,
|
||
* meaning those that have not been used
|
||
* as part of some join. These booleans
|
||
* must still be applied to the result stream.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(prior_rsb, type_rsb);
|
||
|
||
jrd_nod* boolean = NULL;
|
||
const OptimizerBlk::opt_conjunct* const opt_end =
|
||
opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
|
||
for (OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++)
|
||
{
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used)) {
|
||
compose(&boolean, node, nod_and);
|
||
tail->opt_conjunct_flags |= opt_conjunct_used;
|
||
}
|
||
}
|
||
|
||
if (!boolean) {
|
||
return prior_rsb;
|
||
}
|
||
return gen_boolean(tdbb, opt, prior_rsb, boolean);
|
||
}
|
||
|
||
|
||
static RecordSource* gen_retrieval(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
SSHORT stream,
|
||
jrd_nod** sort_ptr,
|
||
jrd_nod** project_ptr,
|
||
bool outer_flag,
|
||
bool inner_flag,
|
||
jrd_nod** return_boolean)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ r e t r i e v a l
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Compile and optimize a record selection expression into a
|
||
* set of record source blocks (rsb's).
|
||
*
|
||
**************************************/
|
||
SSHORT i, position;
|
||
OptimizerBlk::opt_conjunct* tail;
|
||
OptimizerBlk::opt_segment* idx_tail;
|
||
bool full = false;
|
||
|
||
SET_TDBB(tdbb);
|
||
|
||
#ifdef DEV_BUILD
|
||
DEV_BLKCHK(opt, type_opt);
|
||
if (sort_ptr) {
|
||
DEV_BLKCHK(*sort_ptr, type_nod);
|
||
}
|
||
if (project_ptr) {
|
||
DEV_BLKCHK(*project_ptr, type_nod);
|
||
}
|
||
if (return_boolean) {
|
||
DEV_BLKCHK(*return_boolean, type_nod);
|
||
}
|
||
#endif
|
||
|
||
// since a full outer join is a special case for us, as we have 2 outer
|
||
// streams, recoginze this condition and set the full flag, also reset the
|
||
// inner flag. This condition is only statisfied for the second stream in
|
||
// the full join. This condition is only set from the call in gen_outer() in
|
||
// case of a full join.
|
||
if ((inner_flag == true) && (outer_flag == true)) {
|
||
/* the inner flag back to false and set the full flag */
|
||
inner_flag = false;
|
||
full = true;
|
||
}
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[stream];
|
||
jrd_rel* relation = csb_tail->csb_relation;
|
||
|
||
fb_assert(relation);
|
||
|
||
str* alias = make_alias(tdbb, csb, csb_tail);
|
||
csb_tail->csb_flags |= csb_active;
|
||
/* bug #8180 reported by Bill Karwin: when a DISTINCT and an ORDER BY
|
||
are done on different fields, and the ORDER BY can be mapped to an
|
||
index, then the records are returned in the wrong order because the
|
||
DISTINCT sort is performed after the navigational walk of the index;
|
||
for that reason, we need to de-optimize this case so that the ORDER
|
||
BY does not use an index; if desired, we could re-optimize by doing
|
||
the DISTINCT first, using a sparse bit map to store the DISTINCT
|
||
records, then perform the navigational walk for the ORDER BY and
|
||
filter the records out with the sparse bitmap. However, that is a
|
||
task for another day. --deej */
|
||
/* Bug #8958: comment out anything having to do with mapping a DISTINCT
|
||
to an index, for now. The fix for this bug was going to be so involved
|
||
that it made more sense to deoptimize this case for the time being until
|
||
we can determine whether it really makes sense to optimize a DISTINCT,
|
||
or for that matter, and ORDER BY, via an index--there is a case
|
||
to be made that it is a deoptimization and more testing needs to be done
|
||
to determine that; see more comments in the bug description
|
||
*/
|
||
if (sort_ptr && *sort_ptr && project_ptr && *project_ptr) {
|
||
sort_ptr = NULL;
|
||
}
|
||
/* Time to find inversions. For each index on the relation
|
||
match all unused booleans against the index looking for upper
|
||
and lower bounds that can be computed by the index. When
|
||
all unused conjunctions are exhausted, see if there is enough
|
||
information for an index retrieval. If so, build up an
|
||
inversion component of the boolean. */
|
||
|
||
jrd_nod* inversion = NULL;
|
||
// It's recalculated later.
|
||
const OptimizerBlk::opt_conjunct* opt_end =
|
||
opt->opt_conjuncts.begin() + (inner_flag ? opt->opt_base_missing_conjuncts : opt->opt_conjuncts.getCount());
|
||
RecordSource* rsb = NULL;
|
||
bool index_used = false;
|
||
|
||
if (relation->rel_file)
|
||
{
|
||
rsb = EXT_optimize(opt, stream, sort_ptr ? sort_ptr : project_ptr);
|
||
}
|
||
else if (opt->opt_conjuncts.getCount() || (sort_ptr && *sort_ptr)
|
||
/***|| (project_ptr && *project_ptr)***/
|
||
)
|
||
{
|
||
/* we want to start with indices which have more index segments, attempting to match
|
||
all the conjuncts possible to these indices, on the theory that one index matched
|
||
to n booleans is more selective and uses less resources than using n indices;
|
||
therefore find out which index has the most segments and proceed backwards from there;
|
||
NOTE: it's possible that a boolean might be matched to an index and then later it could
|
||
have been paired with another boolean to match another index such that both booleans
|
||
could be calculated via the index; currently we won't detect that case
|
||
*/
|
||
|
||
Firebird::HalfStaticArray<index_desc*, OPT_STATIC_ITEMS> idx_walk_vector(*tdbb->getDefaultPool());
|
||
idx_walk_vector.grow(csb_tail->csb_indices);
|
||
index_desc** idx_walk = idx_walk_vector.begin();
|
||
Firebird::HalfStaticArray<UINT64, OPT_STATIC_ITEMS> idx_priority_level_vector(*tdbb->getDefaultPool());
|
||
idx_priority_level_vector.grow(csb_tail->csb_indices);
|
||
UINT64* idx_priority_level = idx_priority_level_vector.begin();
|
||
|
||
i = 0;
|
||
for (index_desc* idx = csb_tail->csb_idx->items; i < csb_tail->csb_indices;
|
||
++i, ++idx)
|
||
{
|
||
|
||
idx_walk[i] = idx;
|
||
idx_priority_level[i] = LOWEST_PRIORITY_LEVEL;
|
||
/* skip this part if the index wasn't specified for indexed
|
||
retrieval (still need to look for navigational retrieval) */
|
||
if ((idx->idx_runtime_flags & idx_plan_dont_use) &&
|
||
!(idx->idx_runtime_flags & idx_plan_navigate))
|
||
{
|
||
continue;
|
||
}
|
||
|
||
/* go through all the unused conjuncts and see if
|
||
any of them are computable using this index */
|
||
clear_bounds(opt, idx);
|
||
tail = opt->opt_conjuncts.begin();
|
||
if (outer_flag) {
|
||
tail += opt->opt_base_parent_conjuncts;
|
||
}
|
||
for (; tail < opt_end; tail++)
|
||
{
|
||
if (tail->opt_conjunct_flags & opt_conjunct_matched) {
|
||
continue;
|
||
}
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
|
||
computable(csb, node, -1, (inner_flag || outer_flag), false))
|
||
{
|
||
match_index(tdbb, opt, stream, node, idx);
|
||
}
|
||
if (node->nod_type == nod_starts)
|
||
compose(&inversion,
|
||
make_starts(tdbb, opt, relation, node, stream,
|
||
idx), nod_bit_and);
|
||
if (node->nod_type == nod_missing)
|
||
compose(&inversion,
|
||
make_missing(tdbb, opt, relation, node,
|
||
stream, idx), nod_bit_and);
|
||
}
|
||
|
||
/* look for a navigational retrieval (unless one was already found or
|
||
there is no sort block); if no navigational retrieval on this index,
|
||
add an indexed retrieval to the inversion tree */
|
||
if (!rsb)
|
||
{
|
||
if (sort_ptr && *sort_ptr)
|
||
{
|
||
rsb = gen_navigation(tdbb, opt, stream, relation, alias,
|
||
idx, sort_ptr);
|
||
if (rsb) {
|
||
continue;
|
||
}
|
||
}
|
||
|
||
/* for now, make sure that we only map a DISTINCT to an index if they contain
|
||
the same number of fields; it should be possible to map a DISTINCT to an
|
||
index which has extra fields to the right, but we need to add some code
|
||
in NAV_get_record() to check when the relevant fields change, rather than
|
||
the whole index key */
|
||
|
||
/***if (project_ptr && *project_ptr)
|
||
|
||
if ((idx->idx_count == (*project_ptr)->nod_count) &&
|
||
(rsb = gen_navigation (tdbb, opt, stream, relation, alias, idx, project_ptr)))
|
||
{
|
||
rsb->rsb_flags |= rsb_project;
|
||
continue;
|
||
}***/
|
||
}
|
||
|
||
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
|
||
|
||
// Calculate the priority level for this index.
|
||
idx_priority_level[i] = calculate_priority_level(opt, idx);
|
||
}
|
||
|
||
}
|
||
|
||
// Sort indices based on the priority level into idx_walk.
|
||
SSHORT idx_walk_count =
|
||
sort_indices_by_priority(csb_tail, idx_walk, idx_priority_level);
|
||
|
||
// Walk through the indicies based on earlier calculated count and
|
||
// when necessary build the index
|
||
|
||
Firebird::HalfStaticArray<SSHORT, OPT_STATIC_ITEMS>
|
||
conjunct_position_vector(*tdbb->getDefaultPool());
|
||
|
||
Firebird::HalfStaticArray<OptimizerBlk::opt_conjunct*, OPT_STATIC_ITEMS>
|
||
matching_nodes_vector(*tdbb->getDefaultPool());
|
||
|
||
for (i = 0; i < idx_walk_count; i++)
|
||
{
|
||
|
||
index_desc* idx = idx_walk[i];
|
||
if (idx->idx_runtime_flags & idx_plan_dont_use) {
|
||
continue;
|
||
}
|
||
|
||
conjunct_position_vector.shrink(0);
|
||
matching_nodes_vector.shrink(0);
|
||
clear_bounds(opt, idx);
|
||
tail = opt->opt_conjuncts.begin();
|
||
if (outer_flag) {
|
||
tail += opt->opt_base_parent_conjuncts;
|
||
}
|
||
for (; tail < opt_end; tail++) {
|
||
// Test if this conjunction is available for this index.
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_matched)) {
|
||
// Setting opt_lower and/or opt_upper values
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
|
||
computable(csb,
|
||
node,
|
||
-1,
|
||
(inner_flag || outer_flag),
|
||
false))
|
||
{
|
||
if (match_index(tdbb, opt, stream, node, idx)) {
|
||
position = 0;
|
||
idx_tail = opt->opt_segments;
|
||
const OptimizerBlk::opt_segment* const idx_end =
|
||
idx_tail + idx->idx_count;
|
||
for (; idx_tail < idx_end; idx_tail++, position++) {
|
||
if (idx_tail->opt_match == node)
|
||
break;
|
||
}
|
||
if (idx_tail >= idx_end && !csb_tail->csb_plan) {
|
||
// Nevertheless we have a resulting count
|
||
// from match_index, still a node could not
|
||
// be assigned, because equal nodes are
|
||
// preferred against other ones.
|
||
// Flag this node as used, so that no other
|
||
// index is used with this bad one.
|
||
// example: WHERE (ID = 100) and (ID >= 1)
|
||
tail->opt_conjunct_flags |= opt_conjunct_matched;
|
||
}
|
||
else {
|
||
matching_nodes_vector.add(tail);
|
||
conjunct_position_vector.add(position);
|
||
}
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
|
||
// Use a different marking if a PLAN was specified, this is
|
||
// for backwards compatibility. Juck...
|
||
if (csb_tail->csb_plan) {
|
||
// Mark only used conjuncts in this index as used
|
||
idx_tail = opt->opt_segments;
|
||
const OptimizerBlk::opt_segment* const idx_end =
|
||
idx_tail + idx->idx_count;
|
||
for (; idx_tail < idx_end &&
|
||
(idx_tail->opt_lower || idx_tail->opt_upper); idx_tail++)
|
||
{
|
||
for (tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++) {
|
||
if (idx_tail->opt_match == tail->opt_conjunct_node) {
|
||
tail->opt_conjunct_flags |= opt_conjunct_matched;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
else {
|
||
// No plan
|
||
// Mark all conjuncts that could be calculated against the
|
||
// index as used. For example if you have :
|
||
// (node1 >= constant) and (node1 <= constant) be sure both
|
||
// conjuncts will be marked as opt_conjunct_matched
|
||
position = 0;
|
||
idx_tail = opt->opt_segments;
|
||
const OptimizerBlk::opt_segment* const idx_end =
|
||
idx_tail + idx->idx_count;
|
||
for (; idx_tail < idx_end &&
|
||
(idx_tail->opt_lower || idx_tail->opt_upper);
|
||
idx_tail++, position++)
|
||
{
|
||
for (size_t j = 0; j < conjunct_position_vector.getCount(); j++) {
|
||
if (conjunct_position_vector[j] == position) {
|
||
matching_nodes_vector[j]->opt_conjunct_flags |= opt_conjunct_matched;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
jrd_nod* idx_node = OPT_make_index(tdbb, opt, relation, idx);
|
||
IndexRetrieval* retrieval =
|
||
(IndexRetrieval*) idx_node->nod_arg[e_idx_retrieval];
|
||
compose(&inversion, idx_node, nod_bit_and);
|
||
idx->idx_runtime_flags |= idx_used_with_and;
|
||
index_used = true;
|
||
|
||
// When we composed a UNIQUE index stop composing, because
|
||
// this is the best we can get, but only when full used.
|
||
if ((idx->idx_flags & idx_unique) && !(csb_tail->csb_plan) &&
|
||
!(retrieval->irb_generic & irb_partial))
|
||
{
|
||
break; // Go out of idx_walk loop
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
if (outer_flag) {
|
||
// Now make another pass thru the outer conjuncts only, finding unused,
|
||
// computable booleans. When one is found, roll it into a final
|
||
// boolean and mark it used.
|
||
*return_boolean = NULL;
|
||
opt_end = opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
|
||
for (tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++) {
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
|
||
&& computable(csb, node, -1, false, false))
|
||
{
|
||
compose(return_boolean, node, nod_and);
|
||
tail->opt_conjunct_flags |= opt_conjunct_used;
|
||
}
|
||
}
|
||
}
|
||
|
||
// Now make another pass thru the conjuncts finding unused, computable
|
||
// booleans. When one is found, roll it into a final boolean and mark
|
||
// it used. If a computable boolean didn't match against an index then
|
||
// mark the stream to denote unmatched booleans.
|
||
jrd_nod* opt_boolean = NULL;
|
||
opt_end = opt->opt_conjuncts.begin() + (inner_flag ? opt->opt_base_parent_conjuncts : opt->opt_conjuncts.getCount());
|
||
tail = opt->opt_conjuncts.begin();
|
||
if (outer_flag) {
|
||
tail += opt->opt_base_parent_conjuncts;
|
||
}
|
||
|
||
for (; tail < opt_end; tail++)
|
||
{
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!relation->rel_file) {
|
||
compose(&inversion, OPT_make_dbkey(opt, node, stream), nod_bit_and);
|
||
}
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
|
||
&& computable(csb, node, -1, false, false))
|
||
{
|
||
if (node->nod_type == nod_or) {
|
||
compose(&inversion, make_inversion(tdbb, opt, node, stream),
|
||
nod_bit_and);
|
||
}
|
||
// If no index is used then leave other nodes alone, because they
|
||
// could be used for building a SORT/MERGE.
|
||
if ((inversion && expression_contains_stream(node, stream)) ||
|
||
(!inversion && computable(csb, node, stream, false, true)))
|
||
{
|
||
// Don't allow adding IS NULL conjunction to outer stream
|
||
// from parent node, because a FULL OUTER JOIN could return
|
||
// wrong results with it.
|
||
if (!outer_flag ||
|
||
(outer_flag && !expression_contains(node, nod_missing)))
|
||
{
|
||
compose(&opt_boolean, node, nod_and);
|
||
tail->opt_conjunct_flags |= opt_conjunct_used;
|
||
|
||
if (!outer_flag && !(tail->opt_conjunct_flags & opt_conjunct_matched)) {
|
||
csb_tail->csb_flags |= csb_unmatched;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
if (full) {
|
||
return gen_rsb(tdbb, opt, rsb, inversion, stream, relation, alias,
|
||
*return_boolean, csb_tail->csb_cardinality);
|
||
}
|
||
else {
|
||
return gen_rsb(tdbb, opt, rsb, inversion, stream, relation, alias,
|
||
opt_boolean, csb_tail->csb_cardinality);
|
||
}
|
||
}
|
||
|
||
|
||
static RecordSource* gen_rsb(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
RecordSource* rsb,
|
||
jrd_nod* inversion,
|
||
SSHORT stream,
|
||
jrd_rel* relation, str* alias, jrd_nod* boolean, float cardinality)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ r s b
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Generate a record source block to handle either a sort or a project.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(rsb, type_rsb);
|
||
DEV_BLKCHK(inversion, type_nod);
|
||
DEV_BLKCHK(relation, type_rel);
|
||
DEV_BLKCHK(alias, type_str);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
SET_TDBB(tdbb);
|
||
if (rsb) {
|
||
if (rsb->rsb_type == rsb_navigate && inversion)
|
||
rsb->rsb_arg[RSB_NAV_inversion] = (RecordSource*) inversion;
|
||
}
|
||
else {
|
||
SSHORT size;
|
||
if (inversion) {
|
||
rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
|
||
rsb->rsb_type = rsb_indexed;
|
||
rsb->rsb_count = 1;
|
||
size = sizeof(struct irsb_index);
|
||
rsb->rsb_arg[0] = (RecordSource*) inversion;
|
||
}
|
||
else {
|
||
rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 0) RecordSource();
|
||
rsb->rsb_type = rsb_sequential;
|
||
size = sizeof(struct irsb);
|
||
if (boolean)
|
||
opt->opt_csb->csb_rpt[stream].csb_flags |= csb_unmatched;
|
||
}
|
||
|
||
rsb->rsb_stream = (UCHAR) stream;
|
||
rsb->rsb_relation = relation;
|
||
rsb->rsb_alias = alias;
|
||
// if this is a blr_stream, we need to leave room
|
||
// in the impure area for a navigational-type rsb;
|
||
// even if this is not currently a navigational rsb,
|
||
// OPT_set_index() could be used to convert it to one.
|
||
if (opt->opt_g_flags & opt_g_stream) {
|
||
size = sizeof(impure_inversion);
|
||
size = nav_rsb_size(rsb, MAX_KEY, size);
|
||
}
|
||
|
||
rsb->rsb_impure = CMP_impure(opt->opt_csb, size);
|
||
}
|
||
|
||
if (boolean) {
|
||
rsb = gen_boolean(tdbb, opt, rsb, boolean);
|
||
}
|
||
|
||
// retain the cardinality for use at runtime by blr_cardinality
|
||
rsb->rsb_cardinality = (ULONG) cardinality;
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_skip(thread_db* tdbb, OptimizerBlk* opt,
|
||
RecordSource* prior_rsb, jrd_nod* node)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ s k i p
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Compile and optimize a record selection expression into a
|
||
* set of record source blocks (rsb's).
|
||
*
|
||
* NOTE: The rsb_skip node MUST appear in the rsb list after the
|
||
* rsb_first node. The calling code MUST call gen_skip before
|
||
* gen_first.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK (opt, type_opt);
|
||
DEV_BLKCHK (prior_rsb, type_rsb);
|
||
DEV_BLKCHK (node, type_nod);
|
||
|
||
SET_TDBB (tdbb);
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
// was : rsb = (RecordSource*) ALLOCDV (type_rsb, 1);
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 0) RecordSource();
|
||
rsb->rsb_count = 1;
|
||
rsb->rsb_type = rsb_skip;
|
||
rsb->rsb_next = prior_rsb;
|
||
rsb->rsb_arg[0] = (RecordSource*) node;
|
||
rsb->rsb_impure = CMP_impure (csb, sizeof (struct irsb_skip_n));
|
||
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_sort(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
UCHAR * streams,
|
||
UCHAR * dbkey_streams,
|
||
RecordSource* prior_rsb, jrd_nod* sort, bool project_flag)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ s o r t
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Generate a record source block to handle either a sort or a project.
|
||
* The two case are virtual identical -- the only difference is that
|
||
* project eliminates duplicates. However, since duplicates are
|
||
* recognized and handled by sort, the JRD processing is identical.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(prior_rsb, type_rsb);
|
||
DEV_BLKCHK(sort, type_nod);
|
||
SET_TDBB(tdbb);
|
||
/* We already know the number of keys, but we also need to compute the
|
||
total number of fields, keys and non-keys, to be pumped thru sort. Starting
|
||
with the number of keys, count the other field referenced. Since a field
|
||
is often a key, check for overlap to keep the length of the sort record
|
||
down. */
|
||
/* Along with the record number, the transaction id of the
|
||
* record will also be stored in the sort file. This will
|
||
* be used to detect update conflict in read committed
|
||
* transactions.
|
||
*/
|
||
|
||
UCHAR* ptr;
|
||
dsc descriptor;
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
USHORT items =
|
||
sort->nod_count + (streams[0] * 2) +
|
||
(dbkey_streams ? dbkey_streams[0] : 0);
|
||
const UCHAR* const end_ptr = streams + streams[0];
|
||
const jrd_nod* const* const end_node = sort->nod_arg + sort->nod_count;
|
||
Firebird::Stack<SLONG> id_stack;
|
||
StreamStack stream_stack;
|
||
|
||
for (ptr = &streams[1]; ptr <= end_ptr; ptr++) {
|
||
UInt32Bitmap::Accessor accessor(csb->csb_rpt[*ptr].csb_fields);
|
||
|
||
if (accessor.getFirst()) do {
|
||
ULONG id = accessor.current();
|
||
items++;
|
||
id_stack.push(id);
|
||
stream_stack.push(*ptr);
|
||
for (jrd_nod** node_ptr = sort->nod_arg; node_ptr < end_node; node_ptr++)
|
||
{
|
||
jrd_nod* node = *node_ptr;
|
||
if (node->nod_type == nod_field
|
||
&& (USHORT)(IPTR) node->nod_arg[e_fld_stream] == *ptr
|
||
&& (USHORT)(IPTR) node->nod_arg[e_fld_id] == id)
|
||
{
|
||
dsc* desc = &descriptor;
|
||
CMP_get_desc(tdbb, csb, node, desc);
|
||
/* International type text has a computed key */
|
||
if (IS_INTL_DATA(desc))
|
||
break;
|
||
--items;
|
||
id_stack.pop();
|
||
stream_stack.pop();
|
||
break;
|
||
}
|
||
}
|
||
} while (accessor.getNext());
|
||
}
|
||
|
||
/* Now that we know the number of items, allocate a sort map block. Allocate
|
||
it sufficiently large that there is room for a sort key descriptor on the
|
||
end. */
|
||
|
||
const USHORT count = items +
|
||
(sizeof(sort_key_def) * 2 * sort->nod_count + sizeof(smb_repeat) -
|
||
1) / sizeof(smb_repeat);
|
||
SortMap* map = FB_NEW_RPT(*tdbb->getDefaultPool(), count) SortMap();
|
||
map->smb_keys = sort->nod_count * 2;
|
||
map->smb_count = items;
|
||
if (project_flag) {
|
||
map->smb_flags |= SMB_project;
|
||
}
|
||
|
||
ULONG map_length = 0;
|
||
|
||
// Loop thru sort keys building sort keys. Actually, to handle null values
|
||
// correctly, two sort keys are made for each field, one for the null flag
|
||
// and one for field itself.
|
||
smb_repeat* map_item = map->smb_rpt;
|
||
sort_key_def* sort_key = (sort_key_def*) & map->smb_rpt[items];
|
||
map->smb_key_desc = sort_key;
|
||
for (jrd_nod** node_ptr = sort->nod_arg; node_ptr < end_node;
|
||
node_ptr++, map_item++)
|
||
{
|
||
/* Pick up sort key expression. */
|
||
|
||
jrd_nod* node = *node_ptr;
|
||
dsc* desc = &descriptor;
|
||
CMP_get_desc(tdbb, csb, node, desc);
|
||
/* Allow for "key" forms of International text to grow */
|
||
if (IS_INTL_DATA(desc)) {
|
||
/* Turn varying text and cstrings into text. */
|
||
|
||
if (desc->dsc_dtype == dtype_varying) {
|
||
desc->dsc_dtype = dtype_text;
|
||
desc->dsc_length -= sizeof(USHORT);
|
||
}
|
||
else if (desc->dsc_dtype == dtype_cstring) {
|
||
desc->dsc_dtype = dtype_text;
|
||
desc->dsc_length--;
|
||
}
|
||
desc->dsc_length =
|
||
INTL_key_length(tdbb, INTL_INDEX_TYPE(desc),
|
||
desc->dsc_length);}
|
||
|
||
/* Make key for null flag */
|
||
|
||
#ifndef WORDS_BIGENDIAN
|
||
map_length = ROUNDUP(map_length, sizeof(SLONG));
|
||
#endif
|
||
sort_key->skd_offset = map_item->smb_flag_offset =
|
||
(USHORT) map_length++;
|
||
sort_key->skd_dtype = SKD_text;
|
||
sort_key->skd_length = 1;
|
||
// Handle nulls placement
|
||
sort_key->skd_flags = SKD_ascending;
|
||
if (tdbb->tdbb_database->dbb_ods_version < ODS_VERSION11) {
|
||
// Put nulls at the tail for ODS10 and earlier
|
||
if ((IPTR)*(node_ptr + sort->nod_count*2) == rse_nulls_first)
|
||
sort_key->skd_flags |= SKD_descending;
|
||
}
|
||
else {
|
||
// Have SQL-compliant nulls ordering for ODS11+
|
||
if (((IPTR)*(node_ptr + sort->nod_count*2) == rse_nulls_default && !*(node_ptr + sort->nod_count)) ||
|
||
(IPTR)*(node_ptr + sort->nod_count*2) == rse_nulls_first)
|
||
{
|
||
sort_key->skd_flags |= SKD_descending;
|
||
}
|
||
}
|
||
++sort_key;
|
||
/* Make key for sort key proper */
|
||
#ifndef WORDS_BIGENDIAN
|
||
map_length = ROUNDUP(map_length, sizeof(SLONG));
|
||
#else
|
||
if (desc->dsc_dtype >= dtype_aligned)
|
||
map_length =
|
||
FB_ALIGN(map_length, type_alignments[desc->dsc_dtype]);
|
||
#endif
|
||
sort_key->skd_offset = (USHORT) map_length;
|
||
sort_key->skd_flags = SKD_ascending;
|
||
if (*(node_ptr + sort->nod_count))
|
||
sort_key->skd_flags |= SKD_descending;
|
||
// UCHAR desc->dsc_dtype is always >=0
|
||
// fb_assert(desc->dsc_dtype >= 0);
|
||
fb_assert(desc->dsc_dtype < FB_NELEM(sort_dtypes));
|
||
sort_key->skd_dtype = sort_dtypes[desc->dsc_dtype];
|
||
/*fb_assert (sort_key->skd_dtype != 0); */
|
||
if (sort_key->skd_dtype == SKD_varying ||
|
||
sort_key->skd_dtype == SKD_cstring)
|
||
{
|
||
if (desc->dsc_ttype() == ttype_binary)
|
||
sort_key->skd_flags |= SKD_binary;
|
||
}
|
||
sort_key->skd_length = desc->dsc_length;
|
||
++sort_key;
|
||
map_item->smb_node = node;
|
||
map_item->smb_desc = *desc;
|
||
map_item->smb_desc.dsc_address = (UCHAR *) (IPTR) map_length;
|
||
map_length += desc->dsc_length;
|
||
if (node->nod_type == nod_field) {
|
||
map_item->smb_stream = (USHORT)(IPTR) node->nod_arg[e_fld_stream];
|
||
map_item->smb_field_id = (USHORT)(IPTR) node->nod_arg[e_fld_id];
|
||
}
|
||
}
|
||
|
||
map_length = ROUNDUP(map_length, sizeof(SLONG));
|
||
map->smb_key_length = (USHORT) map_length >> SHIFTLONG;
|
||
USHORT flag_offset = (USHORT) map_length;
|
||
map_length += items - sort->nod_count;
|
||
/* Now go back and process all to fields involved with the sort. If the
|
||
field has already been mentioned as a sort key, don't bother to repeat
|
||
it. */
|
||
while (stream_stack.hasData()) {
|
||
const SLONG id = id_stack.pop();
|
||
// AP: why USHORT - we pushed UCHAR
|
||
const USHORT stream = stream_stack.pop();
|
||
const Format* format = CMP_format(tdbb, csb, stream);
|
||
const dsc* desc = &format->fmt_desc[id];
|
||
if (id >= format->fmt_count || desc->dsc_length == 0)
|
||
IBERROR(157); /* msg 157 cannot sort on a field that does not exist */
|
||
if (desc->dsc_dtype >= dtype_aligned)
|
||
map_length =
|
||
FB_ALIGN(map_length, type_alignments[desc->dsc_dtype]);
|
||
map_item->smb_field_id = (SSHORT) id;
|
||
map_item->smb_stream = stream;
|
||
map_item->smb_flag_offset = flag_offset++;
|
||
map_item->smb_desc = *desc;
|
||
map_item->smb_desc.dsc_address = (UCHAR *) (IPTR)map_length;
|
||
map_length += desc->dsc_length;
|
||
map_item++;
|
||
}
|
||
|
||
/* Make fields for record numbers record for all streams */
|
||
|
||
map_length = ROUNDUP(map_length, sizeof(SLONG));
|
||
for (ptr = &streams[1]; ptr <= end_ptr; ptr++, map_item++) {
|
||
map_item->smb_field_id = SMB_DBKEY;
|
||
map_item->smb_stream = *ptr;
|
||
dsc* desc = &map_item->smb_desc;
|
||
desc->dsc_dtype = dtype_int64;
|
||
desc->dsc_length = sizeof(SINT64);
|
||
desc->dsc_address = (UCHAR *)(IPTR)map_length;
|
||
map_length += desc->dsc_length;
|
||
}
|
||
|
||
/* Make fields for transaction id of record for all streams */
|
||
|
||
for (ptr = &streams[1]; ptr <= end_ptr; ptr++, map_item++) {
|
||
map_item->smb_field_id = SMB_TRANS_ID;
|
||
map_item->smb_stream = *ptr;
|
||
dsc* desc = &map_item->smb_desc;
|
||
desc->dsc_dtype = dtype_long;
|
||
desc->dsc_length = sizeof(SLONG);
|
||
desc->dsc_address = (UCHAR *) (IPTR)map_length;
|
||
map_length += desc->dsc_length;
|
||
}
|
||
|
||
if (dbkey_streams) {
|
||
ptr = &dbkey_streams[1];
|
||
for (const UCHAR* const end_ptrL = dbkey_streams + dbkey_streams[0];
|
||
ptr <= end_ptrL; ptr++, map_item++)
|
||
{
|
||
map_item->smb_field_id = SMB_DBKEY;
|
||
map_item->smb_stream = *ptr;
|
||
dsc* desc = &map_item->smb_desc;
|
||
desc->dsc_dtype = dtype_int64;
|
||
desc->dsc_length = sizeof(SINT64);
|
||
desc->dsc_address = (UCHAR *)(IPTR)map_length;
|
||
map_length += desc->dsc_length;
|
||
}
|
||
}
|
||
|
||
/* Make fields to store varying and cstring length. */
|
||
|
||
const sort_key_def* const end_key = sort_key;
|
||
for (sort_key = map->smb_key_desc; sort_key < end_key; sort_key++) {
|
||
/* fb_assert (sort_key->skd_dtype != 0); */
|
||
if (sort_key->skd_dtype == SKD_varying ||
|
||
sort_key->skd_dtype == SKD_cstring)
|
||
{
|
||
sort_key->skd_vary_offset = (USHORT) map_length;
|
||
map_length += sizeof(USHORT);
|
||
}
|
||
}
|
||
|
||
if (map_length > MAX_SORT_RECORD)
|
||
ERR_post(isc_sort_rec_size_err, isc_arg_number, map_length, 0);
|
||
/* Msg438: sort record size of %ld bytes is too big */
|
||
map->smb_length = (USHORT) map_length;
|
||
/* That was most unpleasant. Never the less, it's done (except for
|
||
the debugging). All that remains is to build the record source
|
||
block for the sort. */
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
|
||
rsb->rsb_type = rsb_sort;
|
||
rsb->rsb_next = prior_rsb;
|
||
rsb->rsb_arg[0] = (RecordSource*) map;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb_sort));
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static bool gen_sort_merge(thread_db* tdbb, OptimizerBlk* opt, RiverStack& org_rivers)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ s o r t _ m e r g e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* We've got a set of rivers that may or may not be amenable to
|
||
* a sort/merge join, and it's time to find out. If there are,
|
||
* build a sort/merge RecordSource, push it on the rsb stack, and update
|
||
* rivers accordingly. If two or more rivers were successfully
|
||
* joined, return true. If the whole things is a moby no-op,
|
||
* return false.
|
||
*
|
||
**************************************/
|
||
USHORT i;
|
||
ULONG selected_rivers[OPT_STREAM_BITS], selected_rivers2[OPT_STREAM_BITS];
|
||
jrd_nod **eq_class, **ptr;
|
||
DEV_BLKCHK(opt, type_opt);
|
||
SET_TDBB(tdbb);
|
||
Database* dbb = tdbb->tdbb_database;
|
||
|
||
// Count the number of "rivers" involved in the operation, then allocate
|
||
// a scratch block large enough to hold values to compute equality
|
||
// classes.
|
||
USHORT cnt = 0;
|
||
for (RiverStack::iterator stack1(org_rivers); stack1.hasData(); ++stack1) {
|
||
stack1.object()->riv_number = cnt++;
|
||
}
|
||
|
||
Firebird::HalfStaticArray<jrd_nod*, OPT_STATIC_ITEMS> scratch(*tdbb->getDefaultPool());
|
||
scratch.grow(opt->opt_base_conjuncts * cnt);
|
||
jrd_nod** classes = scratch.begin();
|
||
|
||
// Compute equivalence classes among streams. This involves finding groups
|
||
// of streams joined by field equalities.
|
||
jrd_nod** last_class = classes;
|
||
OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
|
||
const OptimizerBlk::opt_conjunct* const end = tail + opt->opt_base_conjuncts;
|
||
for (; tail < end; tail++)
|
||
{
|
||
if (tail->opt_conjunct_flags & opt_conjunct_used) {
|
||
continue;
|
||
}
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (node->nod_type != nod_eql) {
|
||
continue;
|
||
}
|
||
jrd_nod* node1 = node->nod_arg[0];
|
||
jrd_nod* node2 = node->nod_arg[1];
|
||
for (RiverStack::iterator stack0(org_rivers); stack0.hasData(); ++stack0) {
|
||
River* river1 = stack0.object();
|
||
if (!river_reference(river1, node1)) {
|
||
if (river_reference(river1, node2)) {
|
||
node = node1;
|
||
node1 = node2;
|
||
node2 = node;
|
||
}
|
||
else {
|
||
continue;
|
||
}
|
||
}
|
||
for (RiverStack::iterator stack2(stack0); (++stack2).hasData();)
|
||
{
|
||
River* river2 = stack2.object();
|
||
if (river_reference(river2, node2)) {
|
||
for (eq_class = classes; eq_class < last_class; eq_class += cnt)
|
||
{
|
||
if (node_equality(node1, classes[river1->riv_number])
|
||
|| node_equality(node2, classes[river2->riv_number]))
|
||
{
|
||
break;
|
||
}
|
||
}
|
||
eq_class[river1->riv_number] = node1;
|
||
eq_class[river2->riv_number] = node2;
|
||
if (eq_class == last_class) {
|
||
last_class += cnt;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
/* Pick both a set of classes and a set of rivers on which to join with
|
||
sort merge. Obviously, if the set of classes is empty, return false
|
||
to indicate that nothing could be done. */
|
||
|
||
USHORT river_cnt = 0, stream_cnt = 0;
|
||
Firebird::HalfStaticArray<jrd_nod**, OPT_STATIC_ITEMS> selected_classes(*tdbb->getDefaultPool(), cnt);
|
||
for (eq_class = classes; eq_class < last_class; eq_class += cnt) {
|
||
i = river_count(cnt, eq_class);
|
||
if (i > river_cnt) {
|
||
river_cnt = i;
|
||
selected_classes.shrink(0);
|
||
selected_classes.add(eq_class);
|
||
class_mask(cnt, eq_class, selected_rivers);
|
||
}
|
||
else {
|
||
class_mask(cnt, eq_class, selected_rivers2);
|
||
for (i = 0; i < OPT_STREAM_BITS; i++) {
|
||
if ((selected_rivers[i] & selected_rivers2[i]) != selected_rivers[i]) {
|
||
break;
|
||
}
|
||
}
|
||
if (i == OPT_STREAM_BITS) {
|
||
selected_classes.add(eq_class);
|
||
}
|
||
}
|
||
}
|
||
|
||
if (!river_cnt)
|
||
return false;
|
||
|
||
// Build a sort stream.
|
||
RecordSource* merge_rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), river_cnt * 2) RecordSource();
|
||
merge_rsb->rsb_count = river_cnt;
|
||
merge_rsb->rsb_type = rsb_merge;
|
||
merge_rsb->rsb_impure =
|
||
CMP_impure(opt->opt_csb, (USHORT) (sizeof(struct irsb_mrg) +
|
||
river_cnt * sizeof(irsb_mrg::irsb_mrg_repeat)));
|
||
|
||
RecordSource** rsb_tail = merge_rsb->rsb_arg;
|
||
stream_cnt = 0;
|
||
for (RiverStack::iterator stack3(org_rivers); stack3.hasData(); ++stack3) {
|
||
River* river1 = stack3.object();
|
||
if (!(TEST_DEP_BIT(selected_rivers, river1->riv_number))) {
|
||
continue;
|
||
}
|
||
stream_cnt += river1->riv_count;
|
||
jrd_nod* sort = FB_NEW_RPT(*tdbb->getDefaultPool(), selected_classes.getCount() * 3) jrd_nod();
|
||
sort->nod_type = nod_sort;
|
||
sort->nod_count = selected_classes.getCount();
|
||
jrd_nod*** selected_class;
|
||
for (selected_class = selected_classes.begin(), ptr = sort->nod_arg;
|
||
selected_class < selected_classes.end(); selected_class++)
|
||
{
|
||
ptr[sort->nod_count] = (jrd_nod*) FALSE; // Ascending sort
|
||
ptr[sort->nod_count * 2] = (jrd_nod*) rse_nulls_default; // Default nulls placement
|
||
*ptr++ = (*selected_class)[river1->riv_number];
|
||
}
|
||
|
||
RecordSource* rsb =
|
||
gen_sort(tdbb, opt, &river1->riv_count, NULL, river1->riv_rsb, sort, false);
|
||
*rsb_tail++ = rsb;
|
||
*rsb_tail++ = (RecordSource*) sort;
|
||
}
|
||
|
||
// Finally, merge selected rivers into a single river, and rebuild
|
||
// original river stack.
|
||
River* river1 = FB_NEW_RPT(*tdbb->getDefaultPool(), stream_cnt) River();
|
||
river1->riv_count = (UCHAR) stream_cnt;
|
||
river1->riv_rsb = merge_rsb;
|
||
UCHAR* stream = river1->riv_streams;
|
||
RiverStack newRivers(org_rivers.getPool());
|
||
while (org_rivers.hasData()) {
|
||
River* river2 = org_rivers.pop();
|
||
if (TEST_DEP_BIT(selected_rivers, river2->riv_number)) {
|
||
MOVE_FAST(river2->riv_streams, stream, river2->riv_count);
|
||
stream += river2->riv_count;
|
||
}
|
||
else {
|
||
// AB: Be sure that the rivers 'order' will be kept.
|
||
if (newRivers.hasData()) {
|
||
River* river3 = newRivers.pop();
|
||
newRivers.push(river2);
|
||
newRivers.push(river3);
|
||
}
|
||
else {
|
||
newRivers.push(river2);
|
||
}
|
||
}
|
||
}
|
||
// AB: Moved LLS_PUSH() from before the while (*org_rivers) loop to here, because
|
||
// the merged rivers could be refering to other streams on the list.
|
||
newRivers.push(river1);
|
||
|
||
// Pick up any boolean that may apply.
|
||
{
|
||
USHORT flag_vector[MAX_STREAMS + 1], *fv;
|
||
UCHAR stream_nr;
|
||
// AB: Inactivate currently all streams from every river, because we
|
||
// need to know which nodes are computable between the rivers used
|
||
// for the merge.
|
||
for (stream_nr = 0, fv = flag_vector; stream_nr < opt->opt_csb->csb_n_stream; stream_nr++) {
|
||
*fv++ = opt->opt_csb->csb_rpt[stream_nr].csb_flags & csb_active;
|
||
opt->opt_csb->csb_rpt[stream_nr].csb_flags &= ~csb_active;
|
||
}
|
||
|
||
set_active(opt, river1);
|
||
jrd_nod* node = NULL;
|
||
for (tail = opt->opt_conjuncts.begin(); tail < end; tail++)
|
||
{
|
||
jrd_nod* node1 = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
|
||
&& computable(opt->opt_csb, node1, -1, false, false))
|
||
{
|
||
compose(&node, node1, nod_and);
|
||
tail->opt_conjunct_flags |= opt_conjunct_used;
|
||
}
|
||
}
|
||
|
||
if (node) {
|
||
river1->riv_rsb = gen_boolean(tdbb, opt, river1->riv_rsb, node);
|
||
}
|
||
set_inactive(opt, river1);
|
||
org_rivers.takeOwnership(newRivers);
|
||
|
||
for (stream_nr = 0, fv = flag_vector;
|
||
stream_nr < opt->opt_csb->csb_n_stream; stream_nr++)
|
||
{
|
||
opt->opt_csb->csb_rpt[stream_nr].csb_flags |= *fv++;
|
||
}
|
||
}
|
||
|
||
return true;
|
||
}
|
||
|
||
|
||
static RecordSource* gen_union(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
jrd_nod* union_node, UCHAR * streams, USHORT nstreams)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e n _ u n i o n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Generate a union complex.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(union_node, type_nod);
|
||
|
||
SET_TDBB(tdbb);
|
||
jrd_nod* clauses = union_node->nod_arg[e_uni_clauses];
|
||
const USHORT count = clauses->nod_count;
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), count + nstreams + 1) RecordSource();
|
||
rsb->rsb_type = rsb_union;
|
||
rsb->rsb_count = count;
|
||
rsb->rsb_stream = (UCHAR)(IPTR) union_node->nod_arg[e_uni_stream];
|
||
rsb->rsb_format = csb->csb_rpt[rsb->rsb_stream].csb_format;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
|
||
RecordSource** rsb_ptr = rsb->rsb_arg;
|
||
jrd_nod** ptr = clauses->nod_arg;
|
||
for (const jrd_nod* const* const end = ptr + count; ptr < end;) {
|
||
*rsb_ptr++ = OPT_compile(tdbb, csb, (RecordSelExpr*) * ptr++, NULL);
|
||
*rsb_ptr++ = (RecordSource*) * ptr++;
|
||
}
|
||
|
||
/* Save the count and numbers of the streams that make up the union */
|
||
|
||
*rsb_ptr++ = (RecordSource*)(IPTR) nstreams;
|
||
while (nstreams--) {
|
||
*rsb_ptr++ = (RecordSource*)(IPTR) *streams++;
|
||
}
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static void get_inactivities(const CompilerScratch* csb, ULONG* dependencies)
|
||
{
|
||
/**************************************
|
||
*
|
||
* g e t _ i n a c t i v i t i e s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Find any streams not explicitily active.
|
||
*
|
||
**************************************/
|
||
SLONG n;
|
||
DEV_BLKCHK(csb, type_csb);
|
||
for (n = 0; n < OPT_STREAM_BITS; n++)
|
||
dependencies[n] = (ULONG) - 1;
|
||
n = 0;
|
||
CompilerScratch::rpt_const_itr tail = csb->csb_rpt.begin();
|
||
for (const CompilerScratch::rpt_const_itr end = tail + csb->csb_n_stream;
|
||
tail < end; n++, tail++)
|
||
{
|
||
if (tail->csb_flags & csb_active)
|
||
CLEAR_DEP_BIT(dependencies, n);
|
||
}
|
||
}
|
||
|
||
|
||
static IndexedRelationship* indexed_relationship(thread_db* tdbb, OptimizerBlk* opt,
|
||
USHORT stream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* i n d e x e d _ r e l a t i o n s h i p
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* See if two streams are related by an index.
|
||
* An indexed relationship is a means of joining two
|
||
* streams via an index, which is possible when a field from
|
||
* each of the streams is compared with a field from the other,
|
||
* and there is an index on one stream to retrieve the value
|
||
* of the other field.
|
||
*
|
||
**************************************/
|
||
|
||
DEV_BLKCHK(opt, type_opt);
|
||
SET_TDBB(tdbb);
|
||
|
||
if (!opt->opt_base_conjuncts) {
|
||
return NULL;
|
||
}
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[stream];
|
||
OptimizerBlk::opt_conjunct* opt_end =
|
||
opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
|
||
IndexedRelationship* relationship = NULL;
|
||
|
||
/* Loop thru indexes looking for a match */
|
||
index_desc* idx = csb_tail->csb_idx->items;
|
||
for (USHORT i = 0; i < csb_tail->csb_indices;
|
||
++i, ++idx)
|
||
{
|
||
/* skip this part if the index wasn't specified for indexed retrieval */
|
||
if (idx->idx_runtime_flags & idx_plan_dont_use) {
|
||
continue;
|
||
}
|
||
clear_bounds(opt, idx);
|
||
OptimizerBlk::opt_conjunct* tail;
|
||
for (tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++)
|
||
{
|
||
jrd_nod* node = tail->opt_conjunct_node;
|
||
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
|
||
&& computable(csb, node, -1, false, false))
|
||
{
|
||
// AB: Why only check for AND structures ?
|
||
// Added match_indices for support of "OR" with INNER JOINs */
|
||
|
||
// match_index(tdbb, opt, stream, node, idx);
|
||
match_indices(tdbb, opt, stream, node, idx);
|
||
// AB: Why should we look further?
|
||
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
|
||
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
|
||
if (!relationship) {
|
||
relationship = FB_NEW(*tdbb->getDefaultPool()) IndexedRelationship();
|
||
}
|
||
if (idx->idx_flags & idx_unique) {
|
||
relationship->irl_unique = TRUE;
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
|
||
return relationship;
|
||
}
|
||
|
||
|
||
static str* make_alias(thread_db* tdbb, CompilerScratch* csb,
|
||
CompilerScratch::csb_repeat* base_tail)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ a l i a s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Make an alias string suitable for printing
|
||
* as part of the plan. For views, this means
|
||
* multiple aliases to distinguish the base
|
||
* table.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(csb, type_csb);
|
||
SET_TDBB(tdbb);
|
||
if (!base_tail->csb_view && !base_tail->csb_alias)
|
||
return NULL;
|
||
|
||
const CompilerScratch::csb_repeat* csb_tail;
|
||
/* calculate the length of the alias by going up through
|
||
the view stack to find the lengths of all aliases;
|
||
adjust for spaces and a null terminator */
|
||
USHORT alias_length = 0;
|
||
for (csb_tail = base_tail;;
|
||
csb_tail = &csb->csb_rpt[csb_tail->csb_view_stream])
|
||
{
|
||
if (csb_tail->csb_alias)
|
||
alias_length += csb_tail->csb_alias->length();
|
||
else {
|
||
alias_length +=
|
||
(!(csb_tail->csb_relation) || !(csb_tail->csb_relation->rel_name))
|
||
? 0 : strlen(csb_tail->csb_relation->rel_name);
|
||
}
|
||
alias_length++;
|
||
if (!csb_tail->csb_view)
|
||
break;
|
||
}
|
||
|
||
/* allocate a string block to hold the concatenated alias */
|
||
|
||
str* alias = FB_NEW_RPT(*tdbb->getDefaultPool(), alias_length) str();
|
||
alias->str_length = alias_length - 1;
|
||
/* now concatenate the individual aliases into the string block,
|
||
beginning at the end and copying back to the beginning */
|
||
TEXT* p = (TEXT *) alias->str_data + alias->str_length;
|
||
*p-- = 0;
|
||
for (csb_tail = base_tail;;
|
||
csb_tail = &csb->csb_rpt[csb_tail->csb_view_stream])
|
||
{
|
||
const TEXT* q;
|
||
if (csb_tail->csb_alias)
|
||
q = (TEXT *) csb_tail->csb_alias->c_str();
|
||
else {
|
||
q = (!(csb_tail->csb_relation) || !(csb_tail->csb_relation->rel_name))
|
||
? NULL : csb_tail->csb_relation->rel_name;
|
||
}
|
||
/* go to the end of the alias and copy it backwards */
|
||
if (q) {
|
||
for (alias_length = 0; *q; alias_length++)
|
||
q++;
|
||
while (alias_length--)
|
||
*p-- = *--q;
|
||
}
|
||
|
||
if (!csb_tail->csb_view)
|
||
break;
|
||
*p-- = ' ';
|
||
}
|
||
|
||
return alias;
|
||
}
|
||
|
||
|
||
static jrd_nod* make_binary_node(NOD_T type, jrd_nod* arg1, jrd_nod* arg2, bool flag)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ b i n a r y _ n o d e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Make a binary node.
|
||
*
|
||
**************************************/
|
||
thread_db* tdbb = JRD_get_thread_data();
|
||
DEV_BLKCHK(arg1, type_nod);
|
||
DEV_BLKCHK(arg2, type_nod);
|
||
jrd_nod* node = PAR_make_node(tdbb, 2);
|
||
node->nod_type = type;
|
||
node->nod_arg[0] = arg1;
|
||
node->nod_arg[1] = arg2;
|
||
if (flag) {
|
||
node->nod_flags |= nod_comparison;
|
||
}
|
||
return node;
|
||
}
|
||
|
||
|
||
static RecordSource* make_cross(thread_db* tdbb, OptimizerBlk* opt, RiverStack& stack)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ c r o s s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Generate a cross block.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
SET_TDBB(tdbb);
|
||
const int count = stack.getCount();
|
||
if (count == 1) {
|
||
return stack.pop()->riv_rsb;
|
||
}
|
||
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), count) RecordSource();
|
||
rsb->rsb_type = rsb_cross;
|
||
rsb->rsb_count = count;
|
||
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
|
||
RecordSource** ptr = rsb->rsb_arg + count;
|
||
while (stack.hasData()) {
|
||
*--ptr = stack.pop()->riv_rsb;
|
||
}
|
||
|
||
return rsb;
|
||
}
|
||
|
||
|
||
static jrd_nod* make_index_node(thread_db* tdbb, jrd_rel* relation,
|
||
CompilerScratch* csb, index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ i n d e x _ n o d e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Make an index node and an index retrieval block.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(relation, type_rel);
|
||
DEV_BLKCHK(csb, type_csb);
|
||
SET_TDBB(tdbb);
|
||
/* check whether this is during a compile or during
|
||
a SET INDEX operation */
|
||
if (csb)
|
||
CMP_post_resource(&csb->csb_resources,
|
||
relation, Resource::rsc_index,
|
||
idx->idx_id);
|
||
else
|
||
CMP_post_resource(&tdbb->tdbb_request->req_resources,
|
||
relation, Resource::rsc_index,
|
||
idx->idx_id);
|
||
|
||
jrd_nod* node = PAR_make_node(tdbb, e_idx_length);
|
||
node->nod_type = nod_index;
|
||
node->nod_count = 0;
|
||
IndexRetrieval* retrieval =
|
||
FB_NEW_RPT(*tdbb->getDefaultPool(), idx->idx_count * 2) IndexRetrieval();
|
||
node->nod_arg[e_idx_retrieval] = (jrd_nod*) retrieval;
|
||
retrieval->irb_index = idx->idx_id;
|
||
MOVE_FAST(idx, &retrieval->irb_desc, sizeof(retrieval->irb_desc));
|
||
if (csb)
|
||
node->nod_impure = CMP_impure(csb, sizeof(impure_inversion));
|
||
return node;
|
||
}
|
||
|
||
|
||
static jrd_nod* make_inference_node(CompilerScratch* csb, jrd_nod* boolean,
|
||
jrd_nod* arg1, jrd_nod* arg2)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ i n f e r e n c e _ n o d e
|
||
*
|
||
**************************************
|
||
*
|
||
* Defined
|
||
* 1996-Jan-15 David Schnepper
|
||
*
|
||
* Functional description
|
||
* From the predicate, boolean, and infer a new
|
||
* predicate using arg1 & arg2 as the first two
|
||
* parameters to the predicate.
|
||
*
|
||
* This is used when the engine knows A<B and A=C, and
|
||
* creates a new node to represent the infered knowledge C<B.
|
||
*
|
||
* Note that this may be sometimes incorrect with 3-value
|
||
* logic (per Chris Date's Object & Relations seminar).
|
||
* Later stages of query evaluation evaluate exactly
|
||
* the originally specified query, so 3-value issues are
|
||
* caught there. Making this inference might cause us to
|
||
* examine more records than needed, but would not result
|
||
* in incorrect results.
|
||
*
|
||
* Note that some nodes, specifically nod_like, have
|
||
* more than two parameters for a boolean operation.
|
||
* (nod_like has an optional 3rd parameter for the ESCAPE character
|
||
* option of SQL)
|
||
* Nod_sleuth also has an optional 3rd parameter (for the GDML
|
||
* matching ESCAPE character language). But nod_sleuth is
|
||
* (apparently) not considered during optimization.
|
||
*
|
||
*
|
||
**************************************/
|
||
thread_db* tdbb = JRD_get_thread_data();
|
||
DEV_BLKCHK(csb, type_csb);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
DEV_BLKCHK(arg1, type_nod);
|
||
DEV_BLKCHK(arg2, type_nod);
|
||
fb_assert(boolean->nod_count >= 2); /* must be a conjunction boolean */
|
||
/* Clone the input predicate */
|
||
jrd_nod* node = PAR_make_node(tdbb, boolean->nod_count);
|
||
node->nod_type = boolean->nod_type;
|
||
|
||
// We may safely copy invariantness flag because
|
||
// (1) we only distribute field equalities
|
||
// (2) invariantness of second argument of STARTING WITH or LIKE is solely
|
||
// determined by its dependency on any of the fields
|
||
// If provisions above change the line below will have to be modified
|
||
node->nod_flags = boolean->nod_flags;
|
||
/* But substitute new values for some of the predicate arguments */
|
||
node->nod_arg[0] = CMP_clone_node(tdbb, csb, arg1);
|
||
node->nod_arg[1] = CMP_clone_node(tdbb, csb, arg2);
|
||
/* Arguments after the first two are just cloned (eg: LIKE ESCAPE clause) */
|
||
for (USHORT n = 2; n < boolean->nod_count; n++)
|
||
node->nod_arg[n] = CMP_clone_node(tdbb, csb, boolean->nod_arg[n]);
|
||
// Share impure area for cached invariant value used to hold pre-compiled
|
||
// pattern for new LIKE and CONTAINING algorithms.
|
||
// Proper cloning of impure area for this node would require careful accounting
|
||
// of new invariant dependencies - we avoid such hassles via using single
|
||
// cached pattern value for all node clones. This is faster too.
|
||
if (node->nod_flags & nod_invariant)
|
||
node->nod_impure = boolean->nod_impure;
|
||
return node;
|
||
}
|
||
|
||
|
||
static jrd_nod* make_inversion(thread_db* tdbb, OptimizerBlk* opt,
|
||
jrd_nod* boolean, USHORT stream)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ i n v e r s i o n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Build an inversion for a boolean, if possible. Otherwise,
|
||
* return NULL. Make inversion is call initially from
|
||
* gen_retrieval to handle "or" nodes, but may be called
|
||
* recursively for almost anything.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
|
||
CompilerScratch::csb_repeat* csb_tail = &opt->opt_csb->csb_rpt[stream];
|
||
jrd_rel* relation = csb_tail->csb_relation;
|
||
|
||
if ((!relation) || (relation->rel_file)) {
|
||
return NULL;
|
||
}
|
||
|
||
// Handle the "OR" case up front
|
||
jrd_nod* inversion;
|
||
if (boolean->nod_type == nod_or)
|
||
{
|
||
inversion = make_inversion(tdbb, opt, boolean->nod_arg[0], stream);
|
||
if (!inversion)
|
||
{
|
||
return NULL;
|
||
}
|
||
jrd_nod* inversion2 = make_inversion(tdbb, opt, boolean->nod_arg[1], stream);
|
||
if (inversion2)
|
||
{
|
||
if ((inversion->nod_type == nod_index) &&
|
||
(inversion2->nod_type == nod_index) &&
|
||
(reinterpret_cast<IndexRetrieval*>(inversion->nod_arg[e_idx_retrieval])->irb_index ==
|
||
reinterpret_cast<IndexRetrieval*>(inversion2->nod_arg[e_idx_retrieval])->irb_index))
|
||
{
|
||
return compose(&inversion, inversion2, nod_bit_in);
|
||
}
|
||
else if ((inversion->nod_type == nod_bit_in) &&
|
||
(inversion2->nod_type == nod_index) &&
|
||
(reinterpret_cast<IndexRetrieval*>(inversion->nod_arg[1]->nod_arg[e_idx_retrieval])->irb_index ==
|
||
reinterpret_cast<IndexRetrieval*>(inversion2->nod_arg[e_idx_retrieval])->irb_index))
|
||
{
|
||
return compose(&inversion, inversion2, nod_bit_in);
|
||
}
|
||
else
|
||
{
|
||
return compose(&inversion, inversion2, nod_bit_or);
|
||
}
|
||
}
|
||
if (inversion->nod_type == nod_index) {
|
||
delete inversion->nod_arg[e_idx_retrieval];
|
||
}
|
||
delete inversion;
|
||
return NULL;
|
||
}
|
||
|
||
// Time to find inversions. For each index on the relation
|
||
// match all unused booleans against the index looking for upper
|
||
// and lower bounds that can be computed by the index. When
|
||
// all unused conjunctions are exhausted, see if there is enough
|
||
// information for an index retrieval. If so, build up and
|
||
// inversion component of the boolean.
|
||
|
||
// AB: If the boolean is a part of an earlier created index
|
||
// retrieval check with the compound_selectivity if it's
|
||
// really interresting to use.
|
||
inversion = NULL;
|
||
bool accept_starts = true;
|
||
bool accept_missing = true;
|
||
bool used_in_compound = false;
|
||
float compound_selectivity = 1; // Real maximum selectivity possible is 1.
|
||
|
||
// TMN: Shouldn't this be allocated from the tdbb->getDefaultPool() pool?
|
||
Firebird::HalfStaticArray<index_desc*, OPT_STATIC_ITEMS>
|
||
idx_walk_vector(*tdbb->getDefaultPool());
|
||
idx_walk_vector.grow(csb_tail->csb_indices);
|
||
index_desc** idx_walk = idx_walk_vector.begin();
|
||
Firebird::HalfStaticArray<UINT64, OPT_STATIC_ITEMS>
|
||
idx_priority_level_vector(*tdbb->getDefaultPool());
|
||
idx_priority_level_vector.grow(csb_tail->csb_indices);
|
||
UINT64* idx_priority_level = idx_priority_level_vector.begin();
|
||
|
||
index_desc* idx = csb_tail->csb_idx->items;
|
||
SSHORT i;
|
||
if (opt->opt_base_conjuncts) {
|
||
for (i = 0; i < csb_tail->csb_indices; i++) {
|
||
|
||
idx_walk[i] = idx;
|
||
idx_priority_level[i] = LOWEST_PRIORITY_LEVEL;
|
||
|
||
clear_bounds(opt, idx);
|
||
if (match_index(tdbb, opt, stream, boolean, idx) &&
|
||
!(idx->idx_runtime_flags & idx_plan_dont_use))
|
||
{
|
||
// Calculate the priority level of this index.
|
||
idx_priority_level[i] = calculate_priority_level(opt, idx);
|
||
}
|
||
|
||
// If the index was already used in an AND node check
|
||
// if this node is also present in this index
|
||
if (idx->idx_runtime_flags & idx_used_with_and) {
|
||
if ((match_index(tdbb, opt, stream, boolean, idx)) &&
|
||
(idx->idx_selectivity < compound_selectivity))
|
||
{
|
||
compound_selectivity = idx->idx_selectivity;
|
||
used_in_compound = true;
|
||
}
|
||
}
|
||
|
||
/* Because indices are already sort based on their selectivity
|
||
it's not needed to more then 1 index for a node */
|
||
if ((boolean->nod_type == nod_starts) && accept_starts) {
|
||
jrd_nod* node = make_starts(tdbb, opt, relation, boolean, stream, idx);
|
||
if (node) {
|
||
compose(&inversion, node, nod_bit_and);
|
||
accept_starts = false;
|
||
}
|
||
}
|
||
|
||
if ((boolean->nod_type == nod_missing) && accept_missing) {
|
||
jrd_nod* node = make_missing(tdbb, opt, relation, boolean, stream, idx);
|
||
if (node) {
|
||
compose(&inversion, node, nod_bit_and);
|
||
accept_missing = false;
|
||
}
|
||
}
|
||
|
||
++idx;
|
||
}
|
||
}
|
||
|
||
/* Sort indices based on the priority level into idx_walk */
|
||
|
||
const SSHORT idx_walk_count =
|
||
sort_indices_by_priority(csb_tail, idx_walk, idx_priority_level);
|
||
|
||
bool accept = true;
|
||
idx = csb_tail->csb_idx->items;
|
||
if (opt->opt_base_conjuncts) {
|
||
for (i = 0; i < idx_walk_count; i++) {
|
||
idx = idx_walk[i];
|
||
if (idx->idx_runtime_flags & idx_plan_dont_use) {
|
||
continue;
|
||
}
|
||
|
||
clear_bounds(opt, idx);
|
||
if (((accept || used_in_compound) &&
|
||
(idx->idx_selectivity < compound_selectivity * OR_SELECTIVITY_THRESHOLD_FACTOR)) ||
|
||
(csb_tail->csb_plan))
|
||
{
|
||
match_index(tdbb, opt, stream, boolean, idx);
|
||
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
|
||
compose(&inversion, OPT_make_index(tdbb, opt, relation, idx),
|
||
nod_bit_and);
|
||
accept = false;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
if (!inversion) {
|
||
inversion = OPT_make_dbkey(opt, boolean, stream);
|
||
}
|
||
|
||
return inversion;
|
||
}
|
||
|
||
|
||
static jrd_nod* make_missing(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
jrd_rel* relation, jrd_nod* boolean, USHORT stream, index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ m i s s i n g
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* If the a given boolean is an index optimizable, build and
|
||
* return a inversion type node. Indexes built before minor
|
||
* version 3 (V3.2) have unreliable representations for missing
|
||
* character string fields, so they won't be used.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
Database* dbb = tdbb->tdbb_database;
|
||
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(relation, type_rel);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
|
||
jrd_nod* field = boolean->nod_arg[0];
|
||
|
||
#ifdef EXPRESSION_INDICES
|
||
if (idx->idx_flags & idx_expressn)
|
||
{
|
||
fb_assert(idx->idx_expression != NULL);
|
||
if (!expression_equal(tdbb, opt, idx, field, stream))
|
||
{
|
||
return NULL;
|
||
}
|
||
}
|
||
else
|
||
{
|
||
#endif
|
||
if (field->nod_type != nod_field)
|
||
{
|
||
return NULL;
|
||
}
|
||
|
||
if ((USHORT)(IPTR) field->nod_arg[e_fld_stream] != stream ||
|
||
(USHORT)(IPTR) field->nod_arg[e_fld_id] != idx->idx_rpt[0].idx_field)
|
||
{
|
||
return NULL;
|
||
}
|
||
#ifdef EXPRESSION_INDICES
|
||
}
|
||
#endif
|
||
|
||
jrd_nod* node = make_index_node(tdbb, relation, opt->opt_csb, idx);
|
||
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
|
||
retrieval->irb_relation = relation;
|
||
|
||
if ((dbb->dbb_ods_version < ODS_VERSION11) || (idx->idx_flags & idx_descending)) {
|
||
// AB: irb_starting? Why?
|
||
// Commenting myself. Because we don't know exact length for the field.
|
||
// For ascending NULLs in ODS 11 and higher this doesn't matter, because
|
||
// a NULL is always stored as a key with length 0 (zero).
|
||
retrieval->irb_generic = irb_starting;
|
||
}
|
||
|
||
retrieval->irb_lower_count = retrieval->irb_upper_count = 1;
|
||
|
||
// If we are matching less than the full index, this is a partial match
|
||
if (retrieval->irb_upper_count < idx->idx_count) {
|
||
retrieval->irb_generic |= irb_partial;
|
||
}
|
||
|
||
// Set descending flag on retrieval if index is descending
|
||
if (idx->idx_flags & idx_descending) {
|
||
retrieval->irb_generic |= irb_descending;
|
||
}
|
||
|
||
jrd_nod* value = PAR_make_node(tdbb, 0);
|
||
retrieval->irb_value[0] = retrieval->irb_value[idx->idx_count] = value;
|
||
value->nod_type = nod_null;
|
||
idx->idx_runtime_flags |= idx_plan_missing;
|
||
|
||
return node;
|
||
}
|
||
|
||
|
||
static jrd_nod* make_starts(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
jrd_rel* relation, jrd_nod* boolean, USHORT stream, index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a k e _ s t a r t s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* If the given boolean is an index optimizable, build and
|
||
* return a inversion type node.
|
||
*
|
||
**************************************/
|
||
SET_TDBB(tdbb);
|
||
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(relation, type_rel);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
|
||
if (boolean->nod_type != nod_starts)
|
||
return NULL;
|
||
|
||
jrd_nod* field = boolean->nod_arg[0];
|
||
jrd_nod* value = boolean->nod_arg[1];
|
||
|
||
#ifdef EXPRESSION_INDICES
|
||
if (idx->idx_flags & idx_expressn)
|
||
{
|
||
fb_assert(idx->idx_expression != NULL);
|
||
if (!(expression_equal(tdbb, opt, idx, field, stream) &&
|
||
computable(opt->opt_csb, value, stream, true, false)))
|
||
{
|
||
if (expression_equal(tdbb, opt, idx, value, stream) &&
|
||
computable(opt->opt_csb, field, stream, true, false))
|
||
{
|
||
field = value;
|
||
value = boolean->nod_arg[0];
|
||
}
|
||
else
|
||
{
|
||
return NULL;
|
||
}
|
||
}
|
||
}
|
||
else
|
||
#endif
|
||
{
|
||
if (field->nod_type != nod_field)
|
||
{
|
||
// dimitr: any idea how we can use an index in this case?
|
||
// The code below produced wrong results.
|
||
return NULL;
|
||
/*
|
||
if (value->nod_type != nod_field)
|
||
return NULL;
|
||
field = value;
|
||
value = boolean->nod_arg[0];
|
||
*/
|
||
}
|
||
|
||
/* Every string starts with an empty string so
|
||
don't bother using an index in that case. */
|
||
|
||
if (value->nod_type == nod_literal)
|
||
{
|
||
const dsc* literal_desc = &((Literal*) value)->lit_desc;
|
||
if ((literal_desc->dsc_dtype == dtype_text &&
|
||
literal_desc->dsc_length == 0) ||
|
||
(literal_desc->dsc_dtype == dtype_varying &&
|
||
literal_desc->dsc_length == sizeof(USHORT)))
|
||
{
|
||
return NULL;
|
||
}
|
||
}
|
||
|
||
if ((USHORT)(IPTR) field->nod_arg[e_fld_stream] != stream ||
|
||
(USHORT)(IPTR) field->nod_arg[e_fld_id] != idx->idx_rpt[0].idx_field
|
||
|| !(idx->idx_rpt[0].idx_itype == idx_string
|
||
|| idx->idx_rpt[0].idx_itype == idx_byte_array
|
||
|| idx->idx_rpt[0].idx_itype == idx_metadata
|
||
|| idx->idx_rpt[0].idx_itype >= idx_first_intl_string)
|
||
|| !computable(opt->opt_csb, value, stream, false, false))
|
||
{
|
||
return NULL;
|
||
}
|
||
}
|
||
|
||
jrd_nod* node = make_index_node(tdbb, relation, opt->opt_csb, idx);
|
||
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
|
||
retrieval->irb_relation = relation;
|
||
retrieval->irb_generic = irb_starting;
|
||
|
||
// STARTING WITH can never include NULL values, thus ignore
|
||
// them already at index scan
|
||
retrieval->irb_generic |= irb_ignore_null_value_key;
|
||
|
||
retrieval->irb_lower_count = retrieval->irb_upper_count = 1;
|
||
// If we are matching less than the full index, this is a partial match
|
||
if (retrieval->irb_upper_count < idx->idx_count) {
|
||
retrieval->irb_generic |= irb_partial;
|
||
}
|
||
|
||
// Set descending flag on retrieval if index is descending
|
||
if (idx->idx_flags & idx_descending) {
|
||
retrieval->irb_generic |= irb_descending;
|
||
}
|
||
retrieval->irb_value[0] = retrieval->irb_value[idx->idx_count] = value;
|
||
idx->idx_runtime_flags |= idx_plan_starts;
|
||
|
||
return node;
|
||
}
|
||
|
||
|
||
static bool map_equal(const jrd_nod* field1, const jrd_nod* field2, const jrd_nod* map)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a p _ e q u a l
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Test to see if two fields are equal, where the fields
|
||
* are in two different streams possibly mapped to each other.
|
||
* Order of the input fields is important.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(field1, type_nod);
|
||
DEV_BLKCHK(field2, type_nod);
|
||
DEV_BLKCHK(map, type_nod);
|
||
if (field1->nod_type != nod_field) {
|
||
return false;
|
||
}
|
||
if (field2->nod_type != nod_field) {
|
||
return false;
|
||
}
|
||
|
||
// look through the mapping and see if we can find an equivalence.
|
||
const jrd_nod* const* map_ptr = map->nod_arg;
|
||
for (const jrd_nod* const* const map_end = map_ptr + map->nod_count;
|
||
map_ptr < map_end; map_ptr++)
|
||
{
|
||
const jrd_nod* map_from = (*map_ptr)->nod_arg[e_asgn_from];
|
||
const jrd_nod* map_to = (*map_ptr)->nod_arg[e_asgn_to];
|
||
if (map_from->nod_type != nod_field || map_to->nod_type != nod_field) {
|
||
continue;
|
||
}
|
||
if (field1->nod_arg[e_fld_stream] != map_from->nod_arg[e_fld_stream]
|
||
|| field1->nod_arg[e_fld_id] != map_from->nod_arg[e_fld_id])
|
||
{
|
||
continue;
|
||
}
|
||
if (field2->nod_arg[e_fld_stream] != map_to->nod_arg[e_fld_stream]
|
||
|| field2->nod_arg[e_fld_id] != map_to->nod_arg[e_fld_id])
|
||
{
|
||
continue;
|
||
}
|
||
return true;
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
|
||
|
||
static void mark_indices(CompilerScratch::csb_repeat* csb_tail, SSHORT relation_id)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a r k _ i n d i c e s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Mark indices that were not included
|
||
* in the user-specified access plan.
|
||
*
|
||
**************************************/
|
||
const jrd_nod* plan = csb_tail->csb_plan;
|
||
if (!plan)
|
||
return;
|
||
if (plan->nod_type != nod_retrieve)
|
||
return;
|
||
/* find out how many indices were specified; if
|
||
there were none, this is a sequential retrieval */
|
||
USHORT plan_count = 0;
|
||
const jrd_nod* access_type = plan->nod_arg[e_retrieve_access_type];
|
||
if (access_type)
|
||
plan_count = access_type->nod_count;
|
||
/* go through each of the indices and mark it unusable
|
||
for indexed retrieval unless it was specifically mentioned
|
||
in the plan; also mark indices for navigational access */
|
||
index_desc* idx = csb_tail->csb_idx->items;
|
||
for (USHORT i = 0; i < csb_tail->csb_indices; i++) {
|
||
if (access_type) {
|
||
const jrd_nod* const* arg = access_type->nod_arg;
|
||
const jrd_nod* const* const end = arg + plan_count;
|
||
for (; arg < end; arg += 3) {
|
||
if (relation_id != (SSHORT)(IPTR) * arg) {
|
||
/* index %s cannot be used in the specified plan */
|
||
ERR_post(isc_index_unused, isc_arg_string, *(arg + 2), 0);
|
||
}
|
||
if (idx->idx_id == (USHORT)(IPTR) * (arg + 1)) {
|
||
if (access_type->nod_type == nod_navigational &&
|
||
arg == access_type->nod_arg)
|
||
{
|
||
// dimitr: navigational access can use only one index,
|
||
// hence the extra check added (see the line above)
|
||
idx->idx_runtime_flags |= idx_plan_navigate;
|
||
}
|
||
else { // nod_indices
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
|
||
if (arg == end)
|
||
idx->idx_runtime_flags |= idx_plan_dont_use;
|
||
}
|
||
else {
|
||
idx->idx_runtime_flags |= idx_plan_dont_use;
|
||
}
|
||
++idx;
|
||
}
|
||
}
|
||
|
||
|
||
static SSHORT match_index(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
SSHORT stream, jrd_nod* boolean,
|
||
index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a t c h _ i n d e x
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Match a boolean against an index location lower and upper
|
||
* bounds. Return the number of relational nodes that were
|
||
* matched. In ODS versions prior to 7, descending indexes
|
||
* were not reliable and will not be used.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
SET_TDBB(tdbb);
|
||
|
||
if (boolean->nod_type == nod_and)
|
||
{
|
||
return match_index(tdbb, opt, stream, boolean->nod_arg[0], idx) +
|
||
match_index(tdbb, opt, stream, boolean->nod_arg[1], idx);
|
||
}
|
||
|
||
bool forward = true;
|
||
|
||
jrd_nod* match = boolean->nod_arg[0];
|
||
jrd_nod* value = (boolean->nod_count < 2) ? NULL : boolean->nod_arg[1];
|
||
|
||
#ifdef EXPRESSION_INDICES
|
||
if (idx->idx_flags & idx_expressn)
|
||
{
|
||
// see if one side or the other is matchable to the index expression
|
||
|
||
fb_assert(idx->idx_expression != NULL);
|
||
|
||
if (!expression_equal(tdbb, opt, idx, match, stream) ||
|
||
(value && !computable(opt->opt_csb, value, stream, true, false)))
|
||
{
|
||
if (value &&
|
||
expression_equal(tdbb, opt, idx, value, stream) &&
|
||
computable(opt->opt_csb, match, stream, true, false))
|
||
{
|
||
match = boolean->nod_arg[1];
|
||
value = boolean->nod_arg[0];
|
||
}
|
||
else
|
||
return 0;
|
||
}
|
||
}
|
||
else {
|
||
#endif
|
||
// If left side is not a field, swap sides.
|
||
// If left side is still not a field, give up
|
||
|
||
if (match->nod_type != nod_field ||
|
||
(USHORT)(IPTR) match->nod_arg[e_fld_stream] != stream ||
|
||
(value && !computable(opt->opt_csb, value, stream, true, false)))
|
||
{
|
||
match = value;
|
||
value = boolean->nod_arg[0];
|
||
if (!match ||
|
||
match->nod_type != nod_field ||
|
||
(USHORT)(IPTR) match->nod_arg[e_fld_stream] != stream ||
|
||
!computable(opt->opt_csb, value, stream, true, false))
|
||
{
|
||
return 0;
|
||
}
|
||
forward = false;
|
||
}
|
||
#ifdef EXPRESSION_INDICES
|
||
}
|
||
#endif
|
||
|
||
/* match the field to an index, if possible, and save the value to be matched
|
||
as either the lower or upper bound for retrieval, or both */
|
||
|
||
SSHORT count = 0;
|
||
SSHORT i = 0;
|
||
for (OptimizerBlk::opt_segment* ptr = opt->opt_segments; i < idx->idx_count;
|
||
i++, ptr++)
|
||
{
|
||
if (
|
||
#ifdef EXPRESSION_INDICES
|
||
(idx->idx_flags & idx_expressn) ||
|
||
#endif
|
||
(USHORT)(IPTR) match->nod_arg[e_fld_id] == idx->idx_rpt[i].idx_field)
|
||
{
|
||
++count;
|
||
/* AB: If we have already an exact match don't
|
||
override it with worser matches, but increment the
|
||
count so that the node will be marked as matched! */
|
||
if (ptr->opt_match && ptr->opt_match->nod_type == nod_eql) {
|
||
break;
|
||
}
|
||
switch (boolean->nod_type) {
|
||
case nod_between:
|
||
if (!forward ||
|
||
!computable(opt->opt_csb,
|
||
boolean->nod_arg[2],
|
||
stream,
|
||
true,
|
||
false))
|
||
{
|
||
return 0;
|
||
}
|
||
ptr->opt_lower = value;
|
||
ptr->opt_upper = boolean->nod_arg[2];
|
||
ptr->opt_match = boolean;
|
||
break;
|
||
case nod_equiv:
|
||
case nod_eql:
|
||
ptr->opt_lower = ptr->opt_upper = value;
|
||
ptr->opt_match = boolean;
|
||
break;
|
||
case nod_gtr:
|
||
case nod_geq:
|
||
if (forward) {
|
||
ptr->opt_lower = value;
|
||
}
|
||
else {
|
||
ptr->opt_upper = value;
|
||
}
|
||
ptr->opt_match = boolean;
|
||
break;
|
||
case nod_lss:
|
||
case nod_leq:
|
||
if (forward) {
|
||
ptr->opt_upper = value;
|
||
}
|
||
else {
|
||
ptr->opt_lower = value;
|
||
}
|
||
ptr->opt_match = boolean;
|
||
break;
|
||
default: /* Shut up compiler warnings */
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
|
||
return count;
|
||
}
|
||
|
||
|
||
static bool match_indices(thread_db* tdbb,
|
||
OptimizerBlk* opt,
|
||
SSHORT stream, jrd_nod* boolean,
|
||
index_desc* idx)
|
||
{
|
||
/**************************************
|
||
*
|
||
* m a t c h _ i n d i c e s
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Match a boolean against an index location lower and upper
|
||
* bounds. Return the number of relational nodes that were
|
||
* matched. In ODS versions prior to 7, descending indexes
|
||
* were not reliable and will not be used.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(boolean, type_nod);
|
||
SET_TDBB(tdbb);
|
||
|
||
if (boolean->nod_count < 2) {
|
||
return false;
|
||
}
|
||
|
||
if (boolean->nod_type == nod_or) {
|
||
if (match_indices(tdbb, opt, stream, boolean->nod_arg[0], idx) &&
|
||
match_indices(tdbb, opt, stream, boolean->nod_arg[1], idx))
|
||
{
|
||
opt->opt_segments[0].opt_match = NULL;
|
||
return true;
|
||
}
|
||
}
|
||
else {
|
||
if (match_index(tdbb, opt, stream, boolean, idx)) {
|
||
opt->opt_segments[0].opt_match = NULL;
|
||
return true;
|
||
}
|
||
}
|
||
opt->opt_segments[0].opt_match = NULL;
|
||
opt->opt_segments[0].opt_upper = NULL;
|
||
opt->opt_segments[0].opt_lower = NULL;
|
||
return false;
|
||
}
|
||
|
||
|
||
static USHORT nav_rsb_size(RecordSource* rsb, USHORT key_length, USHORT size)
|
||
{
|
||
/**************************************
|
||
*
|
||
* n a v _ r s b _ s i z e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Calculate the size of a navigational rsb.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(rsb, type_rsb);
|
||
#ifdef SCROLLABLE_CURSORS
|
||
/* allocate extra impure area to hold the current key,
|
||
plus an upper and lower bound key value, for a total
|
||
of three times the key length for the index */
|
||
size += sizeof(struct irsb_nav) + 3 * key_length;
|
||
#else
|
||
size += sizeof(struct irsb_nav) + 2 * key_length;
|
||
#endif
|
||
size = FB_ALIGN(size, ALIGNMENT);
|
||
/* make room for an idx structure to describe the index
|
||
that was used to generate this rsb */
|
||
if (rsb->rsb_type == rsb_navigate)
|
||
rsb->rsb_arg[RSB_NAV_idx_offset] = (RecordSource*) (IPTR) size;
|
||
size += sizeof(index_desc);
|
||
return size;
|
||
}
|
||
|
||
|
||
static bool node_equality(const jrd_nod* node1, const jrd_nod* node2)
|
||
{
|
||
/**************************************
|
||
*
|
||
* n o d e _ e q u a l i t y
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Test two field node pointers for symbolic equality.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(node1, type_nod);
|
||
DEV_BLKCHK(node2, type_nod);
|
||
if (!node1 || !node2) {
|
||
return false;
|
||
}
|
||
if (node1->nod_type != node2->nod_type) {
|
||
return false;
|
||
}
|
||
if (node1 == node2) {
|
||
return true;
|
||
}
|
||
switch (node1->nod_type) {
|
||
case nod_field:
|
||
return (node1->nod_arg[e_fld_stream] == node2->nod_arg[e_fld_stream]
|
||
&& node1->nod_arg[e_fld_id] == node2->nod_arg[e_fld_id]);
|
||
case nod_equiv:
|
||
case nod_eql:
|
||
if (node_equality(node1->nod_arg[0], node2->nod_arg[0])
|
||
&& node_equality(node1->nod_arg[1], node2->nod_arg[1]))
|
||
{
|
||
return true;
|
||
}
|
||
if (node_equality(node1->nod_arg[0], node2->nod_arg[1])
|
||
&& node_equality(node1->nod_arg[1], node2->nod_arg[0]))
|
||
{
|
||
return true;
|
||
}
|
||
return false;
|
||
|
||
case nod_gtr:
|
||
case nod_geq:
|
||
case nod_leq:
|
||
case nod_lss:
|
||
case nod_matches:
|
||
case nod_contains:
|
||
case nod_like:
|
||
default:
|
||
break;
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
|
||
static jrd_nod* optimize_like(thread_db* tdbb, jrd_nod* like_node)
|
||
{
|
||
/**************************************
|
||
*
|
||
* o p t i m i z e _ l i k e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Optimize a LIKE expression, if possible,
|
||
* into a "starting with" AND a "like". This
|
||
* will allow us to use the index for the
|
||
* starting with, and the LIKE can just tag
|
||
* aSLONG for the ride.
|
||
* But on the ride it does useful work, consider
|
||
* match LIKE "ab%c". This is optimized by adding
|
||
* AND starting_with "ab", but the LIKE clause is
|
||
* still needed.
|
||
*
|
||
**************************************/
|
||
UCHAR tmp_buffer[32]; /* large enough to hold 1 ch of escape string */
|
||
SET_TDBB(tdbb);
|
||
DEV_BLKCHK(like_node, type_nod);
|
||
|
||
jrd_nod* search_node = like_node->nod_arg[1];
|
||
jrd_nod* escape_node = (like_node->nod_count > 2) ? like_node->nod_arg[2] : NULL;
|
||
/* if the matching string or the escape string can't
|
||
be evaluated at compile time, forget it */
|
||
if ((search_node->nod_type != nod_literal) ||
|
||
(escape_node && escape_node->nod_type != nod_literal))
|
||
{
|
||
return NULL;
|
||
}
|
||
dsc* search_desc = &((Literal*) search_node)->lit_desc;
|
||
dsc* escape_desc = 0;
|
||
if (escape_node)
|
||
escape_desc = &((Literal*) escape_node)->lit_desc;
|
||
|
||
/* if either is not a character expression, forget it */
|
||
if ((search_desc->dsc_dtype > dtype_any_text) ||
|
||
(escape_node && escape_desc->dsc_dtype > dtype_any_text))
|
||
{
|
||
return NULL;
|
||
}
|
||
|
||
/* Get the escape character, if any */
|
||
TextType text_obj = NULL;
|
||
USHORT escape_ch = 0;
|
||
if (escape_node)
|
||
{
|
||
/* Ensure escape string is same character set as search string
|
||
* Error report on Overflow is OK, as sql only allows a single
|
||
* character escape string */
|
||
|
||
const char* p2;
|
||
USHORT p_count =
|
||
MOV_make_string(escape_desc, INTL_TTYPE(search_desc), &p2,
|
||
reinterpret_cast<vary*>(tmp_buffer),
|
||
sizeof(tmp_buffer));
|
||
const UCHAR* p = reinterpret_cast<const UCHAR*>(p2);
|
||
/* Now get first character from escape string */
|
||
escape_ch =
|
||
INTL_getch(tdbb, &text_obj,
|
||
INTL_TTYPE(search_desc), &p, &p_count);
|
||
}
|
||
|
||
// If the first character is a wildcard char, forget it.
|
||
// CVC: Beware, if INTL doesn't understand the next character, p_count is zero.
|
||
// No check is done. We must handle this failure.
|
||
const UCHAR* p = search_desc->dsc_address;
|
||
USHORT p_count = search_desc->dsc_length;
|
||
USHORT ch =
|
||
INTL_getch(tdbb, &text_obj,
|
||
INTL_TTYPE(search_desc), &p, &p_count);
|
||
if ((!escape_node || ch != escape_ch)
|
||
&& (ch == SQL_MATCH_1_CHAR || ch == SQL_MATCH_ANY_CHARS))
|
||
{
|
||
return NULL;
|
||
}
|
||
// allocate a literal node to store the starting with string;
|
||
// assume it will be shorter than the search string
|
||
// CVC: This assumption may not be true if we use "value like field".
|
||
const SSHORT count = lit_delta +
|
||
(search_desc->dsc_length + sizeof(jrd_nod*) - 1) / sizeof(jrd_nod*);
|
||
jrd_nod* node = PAR_make_node(tdbb, count);
|
||
node->nod_type = nod_literal;
|
||
node->nod_count = 0;
|
||
Literal* literal = (Literal*) node;
|
||
literal->lit_desc = *search_desc;
|
||
UCHAR* q = reinterpret_cast<UCHAR*>(literal->lit_data);
|
||
literal->lit_desc.dsc_address = q;
|
||
/* copy the string into the starting with literal, up to the first wildcard character */
|
||
p_count = search_desc->dsc_length;
|
||
p = search_desc->dsc_address;
|
||
for (const UCHAR* const end = p + search_desc->dsc_length; p < end;)
|
||
{
|
||
// if there are escape characters, skip past them and
|
||
// don't treat the next char as a wildcard
|
||
// CVC: Beware, if INTL doesn't understand the next character, p_count is zero. No check is done.
|
||
// Same than above, but worse, since it will enter an infinite loop. Example: Spanish <20> against unicode.
|
||
// Reported also on Portuguese characters that aren't ASCII < 128.
|
||
const UCHAR* p_start = p;
|
||
ch =
|
||
INTL_getch(tdbb, &text_obj,
|
||
INTL_TTYPE(search_desc), &p, &p_count);
|
||
if (escape_node && (ch == escape_ch))
|
||
{
|
||
/* Check for Escape character at end of string */
|
||
|
||
if (!(p < end))
|
||
break;
|
||
p_start = p;
|
||
ch =
|
||
INTL_getch(tdbb, &text_obj,
|
||
INTL_TTYPE(search_desc), &p, &p_count);
|
||
}
|
||
else if (ch == SQL_MATCH_1_CHAR || ch == SQL_MATCH_ANY_CHARS)
|
||
{
|
||
break;
|
||
}
|
||
/* copy the bytes of the character */
|
||
while (p_start < p) {
|
||
*q++ = *p_start++;
|
||
}
|
||
}
|
||
|
||
literal->lit_desc.dsc_length = q - literal->lit_desc.dsc_address;
|
||
return node;
|
||
}
|
||
|
||
|
||
|
||
#ifdef OPT_DEBUG
|
||
static void print_order(OptimizerBlk* opt,
|
||
USHORT position, double cardinality, double cost)
|
||
{
|
||
/**************************************
|
||
*
|
||
* p r i n t _ o r d e r
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
fprintf(opt_debug_file, "print_order() -- position %2.2d: ", position);
|
||
const OptimizerBlk::opt_stream* tail = opt->opt_streams.begin();
|
||
for (const OptimizerBlk::opt_stream* const order_end = opt->opt_streams.begin() + position;
|
||
tail < order_end; tail++)
|
||
{
|
||
fprintf(opt_debug_file, "stream %2.2d, ", tail->opt_stream_number);
|
||
}
|
||
fprintf(opt_debug_file, "\n\t\t\tcardinality: %g\tcost: %g\n",
|
||
cardinality, cost);
|
||
}
|
||
#endif
|
||
|
||
|
||
static USHORT river_count(USHORT count, jrd_nod** eq_class)
|
||
{
|
||
/**************************************
|
||
*
|
||
* r i v e r _ c o u n t
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Given an sort/merge join equivalence class (vector of node pointers
|
||
* of representative values for rivers), return the count of rivers
|
||
* with values.
|
||
*
|
||
**************************************/
|
||
#ifdef DEV_BUILD
|
||
if (*eq_class) {
|
||
DEV_BLKCHK(*eq_class, type_nod);
|
||
}
|
||
#endif
|
||
USHORT cnt = 0;
|
||
for (USHORT i = 0; i < count; i++, eq_class++)
|
||
if (*eq_class) {
|
||
cnt++;
|
||
DEV_BLKCHK(*eq_class, type_nod);
|
||
}
|
||
|
||
return cnt;
|
||
}
|
||
|
||
|
||
static bool river_reference(const River* river, const jrd_nod* node, bool* field_found)
|
||
{
|
||
/**************************************
|
||
*
|
||
* r i v e r _ r e f e r e n c e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* See if a value node is a reference to a given river.
|
||
* AB: Handle also expressions (F1 + F2 * 3, etc..)
|
||
* The expression is checked if all fields that are
|
||
* buried inside are pointing to the the given river.
|
||
* If a passed field isn't referenced by the river then
|
||
* we have an expression with 2 fields pointing to
|
||
* different rivers and then the result is always false.
|
||
* NOTE! The first time this function is called
|
||
* field_found should be NULL.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(river, type_riv);
|
||
DEV_BLKCHK(node, type_nod);
|
||
|
||
bool lfield_found = false;
|
||
bool root_caller = false;
|
||
|
||
// If no boolean parameter is given then this is the first call
|
||
// to this function and we use the local boolean to pass to
|
||
// itselfs. The boolean is used to see if any field has passed
|
||
// that references to the river.
|
||
if (!field_found) {
|
||
root_caller = true;
|
||
field_found = &lfield_found;
|
||
}
|
||
|
||
switch (node->nod_type) {
|
||
|
||
case nod_field :
|
||
{
|
||
// Check if field references to the river.
|
||
const UCHAR* streams = river->riv_streams;
|
||
for (const UCHAR* const end = streams + river->riv_count;
|
||
streams < end; streams++)
|
||
{
|
||
if ((USHORT)(IPTR) node->nod_arg[e_fld_stream] == *streams) {
|
||
*field_found = true;
|
||
return true;
|
||
}
|
||
}
|
||
return false;
|
||
}
|
||
|
||
default :
|
||
{
|
||
const jrd_nod* const* ptr = node->nod_arg;
|
||
// Check all sub-nodes of this node.
|
||
for (const jrd_nod* const* const end = ptr + node->nod_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
if (!river_reference(river, *ptr, field_found)) {
|
||
return false;
|
||
}
|
||
}
|
||
// if this was the first call then field_found tells
|
||
// us if any field (referenced by river) was found.
|
||
if (root_caller) {
|
||
return *field_found;
|
||
}
|
||
else {
|
||
return true;
|
||
}
|
||
}
|
||
}
|
||
/*
|
||
// AB: Original code FB1.0 , just left as reference for a while
|
||
UCHAR *streams, *end;
|
||
DEV_BLKCHK(river, type_riv);
|
||
DEV_BLKCHK(node, type_nod);
|
||
if (node->nod_type != nod_field)
|
||
return false;
|
||
for (streams = river->riv_streams, end =
|
||
streams + river->riv_count; streams < end; streams++)
|
||
if ((USHORT) node->nod_arg[e_fld_stream] == *streams)
|
||
return true;
|
||
return false;
|
||
*/
|
||
return false;
|
||
}
|
||
|
||
|
||
static bool search_stack(const jrd_nod* node, const NodeStack& stack)
|
||
{
|
||
/**************************************
|
||
*
|
||
* s e a r c h _ s t a c k
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Search a stack for the presence of a particular value.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(node, type_nod);
|
||
for (NodeStack::const_iterator iter(stack); iter.hasData(); ++iter) {
|
||
if (node_equality(node, iter.object())) {
|
||
return true;
|
||
}
|
||
}
|
||
return false;
|
||
}
|
||
|
||
|
||
static void set_active(OptimizerBlk* opt, const River* river)
|
||
{
|
||
/**************************************
|
||
*
|
||
* s e t _ a c t i v e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Set a group of streams active.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(river, type_riv);
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
const UCHAR* streams = river->riv_streams;
|
||
for (const UCHAR* const end = streams + river->riv_count; streams < end;
|
||
streams++)
|
||
{
|
||
csb->csb_rpt[*streams].csb_flags |= csb_active;
|
||
}
|
||
}
|
||
|
||
|
||
static void set_direction(const jrd_nod* from_clause, jrd_nod* to_clause)
|
||
{
|
||
/**************************************
|
||
*
|
||
* s e t _ d i r e c t i o n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Update the direction of a GROUP BY, DISTINCT, or ORDER BY
|
||
* clause to the same direction as another clause.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(from_clause, type_nod);
|
||
DEV_BLKCHK(to_clause, type_nod);
|
||
/* all three clauses are allocated with thrice the number of arguments to
|
||
leave room at the end for an ascending/descending and nulls placement flags,
|
||
one for each field */
|
||
jrd_nod* const* from_ptr = from_clause->nod_arg + from_clause->nod_count;
|
||
jrd_nod** to_ptr = to_clause->nod_arg + to_clause->nod_count;
|
||
for (const jrd_nod* const* const end = from_ptr + from_clause->nod_count * 2;
|
||
from_ptr < end; from_ptr++)
|
||
{
|
||
*to_ptr++ = *from_ptr;
|
||
}
|
||
}
|
||
|
||
|
||
|
||
static void set_inactive(OptimizerBlk* opt, const River* river)
|
||
{
|
||
/**************************************
|
||
*
|
||
* s e t _ i n a c t i v e
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Set a group of streams inactive.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(river, type_riv);
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
const UCHAR* streams = river->riv_streams;
|
||
for (const UCHAR* const end = streams + river->riv_count; streams < end;
|
||
streams++)
|
||
{
|
||
csb->csb_rpt[*streams].csb_flags &= ~csb_active;
|
||
}
|
||
}
|
||
|
||
|
||
static void set_made_river(OptimizerBlk* opt, const River* river)
|
||
{
|
||
/**************************************
|
||
*
|
||
* s e t _ m a d e _ r i v e r
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Mark all the streams in a river with the csb_made_river flag.
|
||
*
|
||
* A stream with this flag set, incicates that this stream has
|
||
* already been made into a river. Currently, this flag is used
|
||
* in computable() to decide if we can use the an index to
|
||
* optimise retrieving the streams involved in the conjunct.
|
||
*
|
||
* We can use an index in retrieving the streams involved in a
|
||
* conjunct if both of the streams are currently active or have
|
||
* been processed (and made into rivers) before.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(opt, type_opt);
|
||
DEV_BLKCHK(river, type_riv);
|
||
CompilerScratch* csb = opt->opt_csb;
|
||
const UCHAR* streams = river->riv_streams;
|
||
for (const UCHAR* const end = streams + river->riv_count; streams < end;
|
||
streams++)
|
||
{
|
||
csb->csb_rpt[*streams].csb_flags |= csb_made_river;
|
||
}
|
||
}
|
||
|
||
|
||
static void set_position(const jrd_nod* from_clause, jrd_nod* to_clause,
|
||
const jrd_nod* map)
|
||
{
|
||
/**************************************
|
||
*
|
||
* s e t _ p o s i t i o n
|
||
*
|
||
**************************************
|
||
*
|
||
* Functional description
|
||
* Update the fields in a GROUP BY, DISTINCT, or ORDER BY
|
||
* clause to the same position as another clause, possibly
|
||
* using a mapping between the streams.
|
||
*
|
||
**************************************/
|
||
DEV_BLKCHK(from_clause, type_nod);
|
||
DEV_BLKCHK(to_clause, type_nod);
|
||
DEV_BLKCHK(map, type_nod);
|
||
/* Track the position in the from list with "to_swap", and find the corresponding
|
||
field in the from list with "to_ptr", then swap the two fields. By the time
|
||
we get to the end of the from list, all fields in the to list will be reordered. */
|
||
jrd_nod** to_swap = to_clause->nod_arg;
|
||
const jrd_nod* const* from_ptr = from_clause->nod_arg;
|
||
for (const jrd_nod* const* const from_end =
|
||
from_ptr + from_clause->nod_count; from_ptr < from_end; from_ptr++)
|
||
{
|
||
jrd_nod** to_ptr = to_clause->nod_arg;
|
||
for (const jrd_nod* const* const to_end =
|
||
to_ptr + from_clause->nod_count; to_ptr < to_end; to_ptr++)
|
||
{
|
||
if ((map && map_equal(*to_ptr, *from_ptr, map))
|
||
|| (!map
|
||
&& (*from_ptr)->nod_arg[e_fld_stream] ==
|
||
(*to_ptr)->nod_arg[e_fld_stream]
|
||
&& (*from_ptr)->nod_arg[e_fld_id] ==
|
||
(*to_ptr)->nod_arg[e_fld_id]))
|
||
{
|
||
jrd_nod* swap = *to_swap;
|
||
*to_swap = *to_ptr;
|
||
*to_ptr = swap;
|
||
}
|
||
}
|
||
|
||
to_swap++;
|
||
}
|
||
|
||
}
|
||
|
||
|
||
static void set_rse_inactive(CompilerScratch* csb, const RecordSelExpr* rse)
|
||
{
|
||
/***************************************************
|
||
*
|
||
* s e t _ r s e _ i n a c t i v e
|
||
*
|
||
***************************************************
|
||
*
|
||
* Functional Description:
|
||
* Set all the streams involved in an RecordSelExpr as inactive. Do it recursively.
|
||
*
|
||
***************************************************/
|
||
const jrd_nod* const* ptr = rse->rse_relation;
|
||
for (const jrd_nod* const* const end = ptr + rse->rse_count;
|
||
ptr < end; ptr++)
|
||
{
|
||
const jrd_nod* node = *ptr;
|
||
if (node->nod_type != nod_rse) {
|
||
const SSHORT stream = (USHORT)(IPTR) node->nod_arg[STREAM_INDEX(node)];
|
||
csb->csb_rpt[stream].csb_flags &= ~csb_active;
|
||
}
|
||
else
|
||
set_rse_inactive(csb, (const RecordSelExpr*) node);
|
||
}
|
||
}
|
||
|
||
|
||
static void sort_indices_by_selectivity(CompilerScratch::csb_repeat* csb_tail)
|
||
{
|
||
/***************************************************
|
||
*
|
||
* s o r t _ i n d i c e s _ b y _ s e l e c t i v i t y
|
||
*
|
||
***************************************************
|
||
*
|
||
* Functional Description:
|
||
* Sort indices based on there selectivity.
|
||
* Lowest selectivy as first, highest as last.
|
||
*
|
||
***************************************************/
|
||
|
||
if (csb_tail->csb_plan) {
|
||
return;
|
||
}
|
||
|
||
index_desc* selected_idx = NULL;
|
||
USHORT i, j;
|
||
Firebird::Array<index_desc> idx_sort(*JRD_get_thread_data()->getDefaultPool(), csb_tail->csb_indices);
|
||
bool same_selectivity = false;
|
||
|
||
// Walk through the indices and sort them into into idx_sort
|
||
// where idx_sort[0] contains the lowest selectivity (best) and
|
||
// idx_sort[csb_tail->csb_indices - 1] the highest (worst)
|
||
|
||
if (csb_tail->csb_idx && (csb_tail->csb_indices > 1)) {
|
||
for (j = 0; j < csb_tail->csb_indices; j++) {
|
||
float selectivity = 1; // Maximum selectivity is 1 (when all keys are the same)
|
||
index_desc* idx = csb_tail->csb_idx->items;
|
||
for (i = 0; i < csb_tail->csb_indices; i++) {
|
||
// Prefer ASC indices in the case of almost the same selectivities
|
||
if (selectivity > idx->idx_selectivity) {
|
||
same_selectivity = ((selectivity - idx->idx_selectivity) <= 0.00001);
|
||
}
|
||
else {
|
||
same_selectivity = ((idx->idx_selectivity - selectivity) <= 0.00001);
|
||
}
|
||
if (!(idx->idx_runtime_flags & idx_marker) &&
|
||
(idx->idx_selectivity <= selectivity) &&
|
||
!((idx->idx_flags & idx_descending) && same_selectivity))
|
||
{
|
||
selectivity = idx->idx_selectivity;
|
||
selected_idx = idx;
|
||
}
|
||
++idx;
|
||
}
|
||
// If no index was found than pick the first one available out of the list
|
||
if ((!selected_idx) || (selected_idx->idx_runtime_flags & idx_marker))
|
||
{
|
||
idx = csb_tail->csb_idx->items;
|
||
for (i = 0; i < csb_tail->csb_indices; i++) {
|
||
if (!(idx->idx_runtime_flags & idx_marker)) {
|
||
selected_idx = idx;
|
||
break;
|
||
}
|
||
++idx;
|
||
}
|
||
}
|
||
selected_idx->idx_runtime_flags |= idx_marker;
|
||
idx_sort.add(*selected_idx);
|
||
}
|
||
|
||
// Finally store the right order in cbs_tail->csb_idx
|
||
index_desc* idx = csb_tail->csb_idx->items;
|
||
for (j = 0; j < csb_tail->csb_indices; j++) {
|
||
idx->idx_runtime_flags &= ~idx_marker;
|
||
MOVE_FAST(&idx_sort[j], idx, sizeof(index_desc));
|
||
++idx;
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
static SSHORT sort_indices_by_priority(CompilerScratch::csb_repeat* csb_tail,
|
||
index_desc** idx_walk,
|
||
UINT64* idx_priority_level)
|
||
{
|
||
/***************************************************
|
||
*
|
||
* s o r t _ i n d i c e s _ b y _ p r i o r i t y
|
||
*
|
||
***************************************************
|
||
*
|
||
* Functional Description:
|
||
* Sort indices based on the priority level.
|
||
*
|
||
***************************************************/
|
||
Firebird::HalfStaticArray<index_desc*, OPT_STATIC_ITEMS> idx_csb(*JRD_get_thread_data()->getDefaultPool());
|
||
idx_csb.grow(csb_tail->csb_indices);
|
||
memcpy(idx_csb.begin(), idx_walk, csb_tail->csb_indices * sizeof(index_desc*));
|
||
|
||
SSHORT idx_walk_count = 0;
|
||
float selectivity = 1; /* Real maximum selectivity possible is 1 */
|
||
|
||
for (SSHORT i = 0; i < csb_tail->csb_indices; i++)
|
||
{
|
||
SSHORT last_idx = -1;
|
||
UINT64 last_priority_level = 0;
|
||
|
||
for (SSHORT j = csb_tail->csb_indices - 1; j >= 0; j--)
|
||
{
|
||
if (!(idx_priority_level[j] == 0) &&
|
||
(idx_priority_level[j] >= last_priority_level))
|
||
{
|
||
last_priority_level = idx_priority_level[j];
|
||
last_idx = j;
|
||
}
|
||
}
|
||
|
||
if (last_idx >= 0) {
|
||
/* dimitr: Empirically, it's better to use less indices with very good selectivity
|
||
than using all available ones. Here we're deciding how many indices we
|
||
should use. Since all indices are already ordered by their selectivity,
|
||
it becomes a trivial task. But note that indices with zero (unknown)
|
||
selectivity are always used, because we don't have a clue how useful
|
||
they are in fact, so we should be optimistic in this case. Unique
|
||
indices are also always used, because they are good by definition,
|
||
regardless of their (probably old) selectivity values. */
|
||
index_desc* idx = idx_csb[last_idx];
|
||
bool should_be_used = true;
|
||
if (idx->idx_selectivity && !(csb_tail->csb_plan)) {
|
||
if (!(idx->idx_flags & idx_unique) &&
|
||
(selectivity * SELECTIVITY_THRESHOLD_FACTOR < idx->idx_selectivity))
|
||
{
|
||
should_be_used = false;
|
||
}
|
||
selectivity = idx->idx_selectivity;
|
||
}
|
||
idx_priority_level[last_idx] = 0; /* Mark as used by setting priority_level to 0 */
|
||
if (should_be_used) {
|
||
idx_walk[idx_walk_count] = idx_csb[last_idx];
|
||
idx_walk_count++;
|
||
}
|
||
}
|
||
}
|
||
|
||
return idx_walk_count;
|
||
}
|
||
|