8
0
mirror of https://github.com/FirebirdSQL/firebird.git synced 2025-01-27 20:03:03 +01:00
firebird-mirror/src/jrd/opt.cpp
dimitr 09c51110b4 Added the equivalence operator. The major index optimizations are done.
Notes:
1) Some optimizations will follow after more deep analysis.
2) The syntax "==" is not yet agreed on. I'd prefer it to be changed.
2004-10-14 19:09:19 +00:00

7608 lines
217 KiB
C++
Raw Blame History

/*
* PROGRAM: JRD Access Method
* MODULE: opt.cpp
* DESCRIPTION: Optimizer / record selection expression compiler
*
* The contents of this file are subject to the Interbase Public
* License Version 1.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy
* of the License at http://www.Inprise.com/IPL.html
*
* Software distributed under the License is distributed on an
* "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express
* or implied. See the License for the specific language governing
* rights and limitations under the License.
*
* The Original Code was created by Inprise Corporation
* and its predecessors. Portions created by Inprise Corporation are
* Copyright (C) Inprise Corporation.
*
* All Rights Reserved.
* Contributor(s): ______________________________________.
* 2002.10.12: Nickolay Samofatov: Fixed problems with wrong results produced by
* outer joins
* 2001.07.28: John Bellardo: Added code to handle rse_skip nodes.
* 2001.07.17 Claudio Valderrama: Stop crash with indices and recursive calls
* of OPT_compile: indicator csb_indices set to zero after used memory is
* returned to the free pool.
* 2001.02.15: Claudio Valderrama: Don't obfuscate the plan output if a selectable
* stored procedure doesn't access tables, views or other procedures directly.
* 2002.10.29 Sean Leyne - Removed obsolete "Netware" port
* 2002.10.30: Arno Brinkman: Changes made to gen_retrieval, OPT_compile and make_inversion.
* Procedure sort_indices added. The changes in gen_retrieval are that now
* an index with high field-count has priority to build an index from.
* Procedure make_inversion is changed so that it not pick every index
* that comes away, this was slow performance with bad selectivity indices
* which most are foreign_keys with a reference to a few records.
* 2002.11.01: Arno Brinkman: Added match_indices for better support of OR handling
* in INNER JOIN (gen_join) statements.
* 2002.12.15: Arno Brinkman: Added find_used_streams, so that inside opt_compile all the
* streams are marked active. This causes that more indices can be used for
* a retrieval. With this change BUG SF #219525 is solved too.
*
*/
#include "firebird.h"
#include "../jrd/common.h"
#include <stdio.h>
#include <string.h>
#include "../jrd/ibase.h"
#include "../jrd/jrd.h"
#include "../jrd/align.h"
#include "../jrd/val.h"
#include "../jrd/req.h"
#include "../jrd/exe.h"
#include "../jrd/lls.h"
#include "../jrd/ods.h"
#include "../jrd/btr.h"
#include "../jrd/sort.h"
#include "../jrd/rse.h"
#include "../jrd/intl.h"
#include "../jrd/thd.h"
#include "../jrd/gdsassert.h"
#include "../jrd/all_proto.h"
#include "../jrd/btr_proto.h"
#include "../jrd/cch_proto.h"
#include "../jrd/cmp_proto.h"
#include "../jrd/dpm_proto.h"
#include "../jrd/err_proto.h"
#include "../jrd/ext_proto.h"
#include "../jrd/evl_proto.h"
#include "../jrd/intl_proto.h"
#include "../jrd/lck_proto.h"
#include "../jrd/met_proto.h"
#include "../jrd/mov_proto.h"
#include "../jrd/opt_proto.h"
#include "../jrd/par_proto.h"
#include "../jrd/gds_proto.h"
#include "../jrd/dbg_proto.h"
#include "../common/classes/array.h"
#include "../common/classes/objects_array.h"
using namespace Jrd;
#ifdef DEV_BUILD
#define OPT_DEBUG
#endif
static bool augment_stack(jrd_nod*, NodeStack&);
static UINT64 calculate_priority_level(const OptimizerBlk*, const index_desc*);
static void check_indices(const CompilerScratch::csb_repeat*);
static bool check_relationship(const OptimizerBlk*, USHORT, USHORT);
static void check_sorts(RecordSelExpr*);
static void class_mask(USHORT, jrd_nod**, ULONG *);
static void clear_bounds(OptimizerBlk*, const index_desc*);
static jrd_nod* compose(jrd_nod**, jrd_nod*, NOD_T);
static bool computable(CompilerScratch*, jrd_nod*, SSHORT, bool, bool);
static void compute_dependencies(const jrd_nod*, ULONG*);
static void compute_dbkey_streams(const CompilerScratch*, const jrd_nod*, UCHAR*);
static void compute_rse_streams(const CompilerScratch*, const RecordSelExpr*, UCHAR*);
static bool check_for_nod_from(const jrd_nod*);
static SLONG decompose(thread_db*, jrd_nod*, NodeStack&, CompilerScratch*);
static USHORT distribute_equalities(NodeStack&, CompilerScratch*, USHORT);
static bool dump_index(const jrd_nod*, SCHAR**, SSHORT*);
static bool dump_rsb(const jrd_req*, const RecordSource*, SCHAR**, SSHORT*);
static bool estimate_cost(thread_db*, OptimizerBlk*, USHORT, double *, double *);
static bool expression_contains(const jrd_nod*, NOD_T);
static bool expression_contains_stream(const jrd_nod*, UCHAR);
#ifdef EXPRESSION_INDICES
static bool expression_equal(thread_db*, OptimizerBlk*, const index_desc*,
jrd_nod*, USHORT);
static bool expression_equal2(thread_db*, OptimizerBlk*, jrd_nod*,
jrd_nod*, USHORT);
#endif
static void find_best(thread_db*, OptimizerBlk*, USHORT, USHORT, UCHAR*, const jrd_nod*,
double, double);
static jrd_nod* find_dbkey(jrd_nod*, USHORT, SLONG*);
static USHORT find_order(thread_db*, OptimizerBlk*, UCHAR*, const jrd_nod*);
static void find_rsbs(RecordSource*, StreamStack*, RsbStack*);
static void find_used_streams(const RecordSource*, UCHAR*);
static void form_rivers(thread_db*, OptimizerBlk*, UCHAR*, RiverStack&, jrd_nod**, jrd_nod**, jrd_nod*);
static bool form_river(thread_db*, OptimizerBlk*, USHORT, UCHAR *, UCHAR *, RiverStack&, jrd_nod**,
jrd_nod**, jrd_nod*);
static RecordSource* gen_aggregate(thread_db*, OptimizerBlk*, jrd_nod*);
static RecordSource* gen_boolean(thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*);
static RecordSource* gen_first(thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*);
static void gen_join(thread_db*, OptimizerBlk*, UCHAR*, RiverStack&, jrd_nod**, jrd_nod**, jrd_nod*);
static RecordSource* gen_navigation(thread_db*, OptimizerBlk*, USHORT, jrd_rel*, str*, index_desc*, jrd_nod**);
#ifdef SCROLLABLE_CURSORS
static RecordSource* gen_nav_rsb(thread_db*, OptimizerBlk*, USHORT, jrd_rel*, str*, index_desc*, RSE_GET_MODE);
#else
static RecordSource* gen_nav_rsb(thread_db*, OptimizerBlk*, USHORT, jrd_rel*, str*, index_desc*);
#endif
static RecordSource* gen_outer(thread_db*, OptimizerBlk*, RecordSelExpr*, RiverStack&, jrd_nod**, jrd_nod**);
static RecordSource* gen_procedure(thread_db*, OptimizerBlk*, jrd_nod*);
static RecordSource* gen_residual_boolean(thread_db*, OptimizerBlk*, RecordSource*);
static RecordSource* gen_retrieval(thread_db*, OptimizerBlk*, SSHORT, jrd_nod**, jrd_nod**, bool, bool,
jrd_nod**);
static RecordSource* gen_rsb(thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*, SSHORT, jrd_rel*, str*, jrd_nod*, float);
static RecordSource* gen_skip (thread_db*, OptimizerBlk*, RecordSource*, jrd_nod*);
static RecordSource* gen_sort(thread_db*, OptimizerBlk*, UCHAR *, UCHAR *, RecordSource*, jrd_nod*, bool);
static bool gen_sort_merge(thread_db*, OptimizerBlk*, RiverStack&);
static RecordSource* gen_union(thread_db*, OptimizerBlk*, jrd_nod*, UCHAR *, USHORT);
static void get_inactivities(const CompilerScratch*, ULONG*);
static IndexedRelationship* indexed_relationship(thread_db*, OptimizerBlk*, USHORT);
static str* make_alias(thread_db*, CompilerScratch*, CompilerScratch::csb_repeat*);
static jrd_nod* make_binary_node(NOD_T, jrd_nod*, jrd_nod*, bool);
static RecordSource* make_cross(thread_db*, OptimizerBlk*, RiverStack&);
static jrd_nod* make_index_node(thread_db*, jrd_rel*, CompilerScratch*, index_desc*);
static jrd_nod* make_inference_node(CompilerScratch*, jrd_nod*, jrd_nod*, jrd_nod*);
static jrd_nod* make_inversion(thread_db*, OptimizerBlk*, jrd_nod*, USHORT);
static jrd_nod* make_missing(thread_db*, OptimizerBlk*, jrd_rel*, jrd_nod*, USHORT, index_desc*);
static jrd_nod* make_starts(thread_db*, OptimizerBlk*, jrd_rel*, jrd_nod*, USHORT, index_desc*);
static bool map_equal(const jrd_nod*, const jrd_nod*, const jrd_nod*);
static void mark_indices(CompilerScratch::csb_repeat*, SSHORT);
static SSHORT match_index(thread_db*, OptimizerBlk*, SSHORT, jrd_nod*, index_desc*);
static bool match_indices(thread_db*, OptimizerBlk*, SSHORT, jrd_nod*, index_desc*);
static USHORT nav_rsb_size(RecordSource*, USHORT, USHORT);
static bool node_equality(const jrd_nod*, const jrd_nod*);
static jrd_nod* optimize_like(thread_db*, jrd_nod*);
#ifdef OPT_DEBUG
static void print_order(OptimizerBlk*, USHORT, double, double);
#endif
static USHORT river_count(USHORT, jrd_nod**);
static bool river_reference(const River*, const jrd_nod*, bool* field_found = NULL);
static bool search_stack(const jrd_nod*, const NodeStack&);
static void set_active(OptimizerBlk*, const River*);
static void set_direction(const jrd_nod*, jrd_nod*);
static void set_inactive(OptimizerBlk*, const River*);
static void set_made_river(OptimizerBlk*, const River*);
static void set_position(const jrd_nod*, jrd_nod*, const jrd_nod*);
static void set_rse_inactive(CompilerScratch*, const RecordSelExpr*);
static void sort_indices_by_selectivity(CompilerScratch::csb_repeat*);
static SSHORT sort_indices_by_priority(CompilerScratch::csb_repeat*, index_desc**, UINT64*);
/* macro definitions */
#ifdef OPT_DEBUG
const int DEBUG_PUNT = 5;
const int DEBUG_RELATIONSHIPS = 4;
const int DEBUG_ALL = 3;
const int DEBUG_CANDIDATE = 2;
const int DEBUG_BEST = 1;
const int DEBUG_NONE = 0;
FILE *opt_debug_file = 0;
static int opt_debug_flag = DEBUG_NONE;
#endif
inline void SET_DEP_BIT(ULONG* array, const SLONG bit)
{
array[bit / 32] |= (1L << (bit % 32));
}
inline void CLEAR_DEP_BIT(ULONG* array, const SLONG bit)
{
array[bit / 32] &= ~(1L << (bit % 32));
}
inline bool TEST_DEP_BIT(const ULONG* array, const ULONG bit)
{
return (array[bit / 32] & (1L << (bit % 32))) != 0;
}
inline bool TEST_DEP_ARRAYS(const ULONG* ar1, const ULONG* ar2)
{ return (ar1[0] & ar2[0]) || (ar1[1] & ar2[1]) ||
(ar1[2] & ar2[2]) || (ar1[3] & ar2[3]) ||
(ar1[4] & ar2[4]) || (ar1[5] & ar2[5]) ||
(ar1[6] & ar2[6]) || (ar1[7] & ar2[7]);
}
inline int STREAM_INDEX(const jrd_nod* node)
{
switch (node->nod_type)
{
case nod_relation:
return e_rel_stream;
case nod_procedure:
return e_prc_stream;
case nod_union:
return e_uni_stream;
default:
return e_agg_stream;
}
}
/* some arbitrary fudge factors for calculating costs, etc.--
these could probably be better tuned someday */
const double ESTIMATED_SELECTIVITY = 0.01;
const int INVERSE_ESTIMATE = 10;
const double INDEX_COST = 30.0;
const int CACHE_PAGES_PER_STREAM = 15;
const int SELECTIVITY_THRESHOLD_FACTOR = 10;
const int OR_SELECTIVITY_THRESHOLD_FACTOR = 2000;
const UINT64 LOWEST_PRIORITY_LEVEL = 0;
/* enumeration of sort datatypes */
static const UCHAR sort_dtypes[] =
{
0, /* dtype_unknown */
SKD_text, /* dtype_text */
SKD_cstring, /* dtype_cstring */
SKD_varying, /* dtype_varying */
0,
0,
0, /* dtype_packed */
0, /* dtype_byte */
SKD_short, /* dtype_short */
SKD_long, /* dtype_long */
SKD_quad, /* dtype_quad */
SKD_float, /* dtype_real */
SKD_double, /* dtype_double */
SKD_double, /* dtype_d_float */
SKD_sql_date, /* dtype_sql_date */
SKD_sql_time, /* dtype_sql_time */
SKD_timestamp2, /* dtype_timestamp */
0, /* dtype_blob */
0, /* dtype_array */
SKD_int64 /* dtype_int64 */
};
typedef UCHAR stream_array_t[MAX_STREAMS + 1];
bool OPT_access_path(const jrd_req* request,
SCHAR* buffer,
SSHORT buffer_length, USHORT* return_length)
{
/**************************************
*
* O P T _ a c c e s s _ p a t h
*
**************************************
*
* Functional description
* Returns a formatted access path for all
* RecordSelExpr's in the specified request.
*
**************************************/
DEV_BLKCHK(request, type_req);
SCHAR* begin = buffer;
/* loop through all RSEs in the request,
and describe the rsb tree for that rsb */
size_t i;
for (i = 0; i < request->req_fors.getCount(); i++) {
RecordSource* rsb = request->req_fors[i];
if (rsb && !dump_rsb(request, rsb, &buffer, &buffer_length))
break;
}
*return_length = buffer - begin;
return (i >= request->req_fors.getCount());
}
RecordSource* OPT_compile(thread_db* tdbb,
CompilerScratch* csb,
RecordSelExpr* rse,
NodeStack* parent_stack)
{
/**************************************
*
* O P T _ c o m p i l e
*
**************************************
*
* Functional description
* Compile and optimize a record selection expression into a
* set of record source blocks (rsb's).
*
**************************************/
stream_array_t streams, beds, local_streams, outer_streams, sub_streams,
key_streams;
DEV_BLKCHK(csb, type_csb);
DEV_BLKCHK(rse, type_nod);
SET_TDBB(tdbb);
Database* dbb = tdbb->tdbb_database;
#ifdef OPT_DEBUG
if (opt_debug_flag != DEBUG_NONE && !opt_debug_file)
opt_debug_file = fopen("opt_debug.out", "w");
#endif
/* If there is a boolean, there is some work to be done. First,
decompose the boolean into conjunctions. Then get descriptions
of all indices for all relations in the RecordSelExpr. This will give
us the info necessary to allocate a optimizer block big
enough to hold this crud. */
/* Do not allocate the index_desc struct. Let BTR_all do the job. The allocated
memory will then be in csb->csb_rpt[stream].csb_idx_allocation, which
gets cleaned up before this function exits. */
index_desc* idx = NULL;
OptimizerBlk* opt = FB_NEW(*tdbb->getDefaultPool()) OptimizerBlk(tdbb->getDefaultPool());
opt->opt_streams.grow(csb->csb_n_stream);
RecordSource* rsb = 0;
try {
opt->opt_csb = csb;
if (rse->nod_flags & rse_stream)
opt->opt_g_flags |= opt_g_stream;
beds[0] = streams[0] = key_streams[0] = outer_streams[0] = sub_streams[0] = 0;
NodeStack conjunct_stack;
RiverStack rivers_stack;
SLONG conjunct_count = 0;
check_sorts(rse);
jrd_nod* sort = rse->rse_sorted;
jrd_nod* project = rse->rse_projection;
jrd_nod* aggregate = rse->rse_aggregate;
// put any additional booleans on the conjunct stack, and see if we
// can generate additional booleans by associativity--this will help
// to utilize indices that we might not have noticed
if (rse->rse_boolean) {
conjunct_count =
decompose(tdbb, rse->rse_boolean, conjunct_stack, csb);
}
conjunct_count += distribute_equalities(conjunct_stack, csb, conjunct_count);
// AB: If we have limit our retrieval with FIRST / SKIP syntax then
// we may not deliver above conditions (from higher rse's) to this
// rse, because the results should be consistent.
if (rse->rse_skip || rse->rse_first) {
parent_stack = NULL;
}
// clear the csb_active flag of all streams in the RecordSelExpr
set_rse_inactive(csb, rse);
UCHAR* p = streams + 1;
// go through the record selection expression generating
// record source blocks for all streams
// CVC: I defined this var here because it's assigned inside an if() shortly
// below but it's used later in the loop always, so I assume the idea is that
// iterations where nod_type != nod_rse are the ones that set up a new stream.
// Hope this isn't some kind of logic error.
SSHORT stream = -1;
jrd_nod** ptr = rse->rse_relation;
for (const jrd_nod* const* const end = ptr + rse->rse_count; ptr < end;
ptr++)
{
jrd_nod* node = *ptr;
// find the stream number and place it at the end of the beds array
// (if this is really a stream and not another RecordSelExpr)
if (node->nod_type != nod_rse)
{
stream = (USHORT)(IPTR) node->nod_arg[STREAM_INDEX(node)];
fb_assert(stream <= MAX_UCHAR);
fb_assert(beds[0] < MAX_STREAMS && beds[0] < MAX_UCHAR);
beds[++beds[0]] = (UCHAR) stream;
}
// for nodes which are not relations, generate an rsb to
// represent that work has to be done to retrieve them;
// find all the substreams involved and compile them as well
rsb = NULL;
local_streams[0] = 0;
switch (node->nod_type)
{
case nod_union:
{
const SSHORT i = (SSHORT) key_streams[0];
compute_dbkey_streams(csb, node, key_streams);
rsb =
gen_union(tdbb, opt, node, key_streams + i + 1,
(USHORT) (key_streams[0] - i));
fb_assert(local_streams[0] < MAX_STREAMS && local_streams[0] < MAX_UCHAR);
local_streams[++local_streams[0]] =
(UCHAR)(IPTR) node->nod_arg[e_uni_stream];
break;
}
case nod_aggregate:
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_STREAMS);
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_UCHAR);
rsb = gen_aggregate(tdbb, opt, node);
fb_assert(local_streams[0] < MAX_STREAMS && local_streams[0] < MAX_UCHAR);
local_streams[++local_streams[0]] =
(UCHAR)(IPTR) node->nod_arg[e_agg_stream];
break;
case nod_procedure:
rsb = gen_procedure(tdbb, opt, node);
fb_assert(local_streams[0] < MAX_STREAMS && local_streams[0] < MAX_UCHAR);
local_streams[++local_streams[0]] =
(UCHAR)(IPTR) node->nod_arg[e_prc_stream];
break;
case nod_rse:
compute_rse_streams(csb, (RecordSelExpr*) node, beds);
compute_rse_streams(csb, (RecordSelExpr*) node, local_streams);
compute_dbkey_streams(csb, node, key_streams);
// pass RecordSelExpr boolean only to inner substreams because join condition
// should never exclude records from outer substreams
if (rse->rse_jointype == blr_inner ||
(rse->rse_jointype == blr_left && (ptr - rse->rse_relation) == 1) )
{
// AB: For an (X LEFT JOIN Y) mark the outer-streams (X) as
// active because the inner-streams (Y) are always "dependent"
// on the outer-streams. So that index retrieval nodes could be made.
// For an INNER JOIN mark previous generated RecordSource's as active.
if (rse->rse_jointype == blr_left) {
for (SSHORT i = 1; i <= outer_streams[0]; i++) {
csb->csb_rpt[outer_streams[i]].csb_flags |= csb_active;
}
}
const NodeStack::iterator stackSavepoint(conjunct_stack);
NodeStack::const_iterator stack_end;
NodeStack deliverStack;
if (rse->rse_jointype != blr_inner) {
// Make list of nodes that can be delivered to a outer-stream.
// In fact this are all nodes except when a IS NULL (nod_missing)
// comparision is done.
// Note! Don't forget that this can be burried inside a expression
// such as "CASE WHEN (FieldX IS NULL) THEN 0 ELSE 1 END = 0"
NodeStack::iterator stackItem;
if (parent_stack)
{
stackItem = *parent_stack;
}
for (; stackItem.hasData(); ++stackItem) {
jrd_nod* deliverNode = stackItem.object();
if (!expression_contains(deliverNode, nod_missing)) {
deliverStack.push(deliverNode);
}
}
stack_end = conjunct_stack.merge(deliverStack);
}
else {
if (parent_stack)
{
stack_end = conjunct_stack.merge(*parent_stack);
}
}
rsb = OPT_compile(tdbb, csb, (RecordSelExpr*) node, &conjunct_stack);
if (rse->rse_jointype != blr_inner) {
// Remove previously added parent conjuctions from the stack.
conjunct_stack.split(stack_end, deliverStack);
}
else {
if (parent_stack)
{
conjunct_stack.split(stack_end, *parent_stack);
}
}
if (rse->rse_jointype == blr_left) {
for (SSHORT i = 1; i <= outer_streams[0]; i++) {
csb->csb_rpt[outer_streams[i]].csb_flags &= ~csb_active;
}
}
}
else {
rsb = OPT_compile(tdbb, csb, (RecordSelExpr*) node, parent_stack);
if (rse->rse_jointype == blr_left)
find_used_streams(rsb, outer_streams);
}
break;
}
// if an rsb has been generated, we have a non-relation;
// so it forms a river of its own since it is separately
// optimized from the streams in this rsb
if (rsb) {
const SSHORT i = local_streams[0];
River* river = FB_NEW_RPT(*tdbb->getDefaultPool(), i) River();
river->riv_count = (UCHAR) i;
river->riv_rsb = rsb;
MOVE_FAST(local_streams + 1, river->riv_streams, i);
// AB: Save all inner-part streams
if (rse->rse_jointype == blr_inner ||
(rse->rse_jointype == blr_left && (ptr - rse->rse_relation)==0))
{
find_used_streams(rsb, sub_streams);
}
set_made_river(opt, river);
set_inactive(opt, river);
rivers_stack.push(river);
continue;
}
// we have found a base relation; record its stream
// number in the streams array as a candidate for
// merging into a river
// TMN: Is the intention really to allow streams[0] to overflow?
// I must assume that is indeed not the intention (not to mention
// it would make code later on fail), so I added the following fb_assert.
fb_assert(streams[0] < MAX_STREAMS && streams[0] < MAX_UCHAR);
++streams[0];
*p++ = (UCHAR) stream;
if (rse->rse_jointype == blr_left) {
fb_assert(outer_streams[0] < MAX_STREAMS && outer_streams[0] < MAX_UCHAR);
outer_streams[++outer_streams[0]] = stream;
}
// if we have seen any booleans or sort fields, we may be able to
// use an index to optimize them; retrieve the current format of
// all indices at this time so we can determine if it's possible
// AB: if a parent_stack was available and conjunct_count was 0
// then no indices where retrieved. Added also OR check on
// parent_stack below. SF BUG # [ 508594 ]
if (conjunct_count || sort || project || aggregate || parent_stack)
{
jrd_rel* relation = (jrd_rel*) node->nod_arg[e_rel_relation];
if (relation && !relation->rel_file)
{
csb->csb_rpt[stream].csb_indices =
BTR_all(tdbb, relation,
&csb->csb_rpt[stream].csb_idx);
sort_indices_by_selectivity(&csb->csb_rpt[stream]);
mark_indices(&csb->csb_rpt[stream], relation->rel_id);
}
else
csb->csb_rpt[stream].csb_indices = 0;
}
}
// this is an attempt to make sure we have a large enough cache to
// efficiently retrieve this query; make sure the cache has a minimum
// number of pages for each stream in the RecordSelExpr (the number is just a guess)
if (streams[0] > 5) {
CCH_expand(tdbb, (ULONG) (streams[0] * CACHE_PAGES_PER_STREAM));
}
// At this point we are ready to start optimizing.
// We will use the opt block to hold information of
// a global nature, meaning that it needs to stick
// around for the rest of the optimization process.
// Set base-point before the parent/distributed nodes begin.
opt->opt_base_conjuncts = (SSHORT) conjunct_count;
// AB: Add parent conjunctions to conjunct_stack, keep in mind
// the outer-streams! For outer streams put missing (IS NULL)
// conjunctions in the missingStack.
SLONG distributed_count = 0;
NodeStack missingStack;
if (parent_stack && parent_stack->getCount())
{
NodeStack::iterator iter(*parent_stack);
for (; iter.hasData() && conjunct_count < MAX_CONJUNCTS; ++iter)
{
jrd_nod* node = iter.object();
if ((rse->rse_jointype != blr_inner) &&
expression_contains(node, nod_missing))
{
// parent missing conjunctions shouldn't be
// distributed to FULL OUTER JOIN streams at all
if (rse->rse_jointype != blr_full)
{
missingStack.push(node);
}
}
else
{
conjunct_stack.push(node);
conjunct_count++;
}
}
// We've now merged parent, try again to make more conjunctions.
distributed_count = distribute_equalities(conjunct_stack, csb, conjunct_count);
conjunct_count += distributed_count;
}
// The newly created conjunctions belong to the base conjunctions.
// After them are starting the parent conjunctions.
opt->opt_base_parent_conjuncts = opt->opt_base_conjuncts + (SSHORT) distributed_count;
// Set base-point before the parent IS NULL nodes begin
opt->opt_base_missing_conjuncts = (SSHORT) conjunct_count;
// Check if size of optimizer block exceeded.
if (conjunct_count > MAX_CONJUNCTS)
{
ERR_post(isc_optimizer_blk_exc, 0);
// Msg442: size of optimizer block exceeded
}
// Put conjunctions in opt structure.
// Note that it's a stack and we get the nodes in reversed order from the stack.
opt->opt_conjuncts.grow(conjunct_count);
SSHORT i, j, nodeBase;
for (i = conjunct_count; i > 0; i--)
{
jrd_nod* node = conjunct_stack.pop();
if (i == opt->opt_base_conjuncts)
{
// The base conjunctions.
j = 0;
nodeBase = 0;
}
else if (i == conjunct_count)
{
// The new conjunctions created by "distribution" from the stack.
j = 0;
nodeBase = opt->opt_base_conjuncts;
}
else if (i == (conjunct_count - distributed_count))
{
// The parent conjunctions.
j = 0;
nodeBase = opt->opt_base_conjuncts + distributed_count;
}
opt->opt_conjuncts[nodeBase + j].opt_conjunct_node = node;
compute_dependencies(node, opt->opt_conjuncts[nodeBase + j].opt_dependencies);
j++;
}
// Put the parent missing nodes on the stack.
for (i = 0; (i < missingStack.getCount()) && (conjunct_count < MAX_CONJUNCTS); i++)
{
opt->opt_conjuncts.grow(conjunct_count + 1);
jrd_nod* node = missingStack.pop();
opt->opt_conjuncts[conjunct_count].opt_conjunct_node = node;
compute_dependencies(node,
opt->opt_conjuncts[conjunct_count].opt_dependencies);
conjunct_count++;
}
// attempt to optimize aggregates via an index, if possible
if (aggregate && !sort && !project) {
sort = aggregate;
}
else {
rse->rse_aggregate = aggregate = NULL;
}
// AB: Mark the previous used streams (sub-RecordSelExpr's) as active
for (i = 1; i <= sub_streams[0]; i++) {
csb->csb_rpt[sub_streams[i]].csb_flags |= csb_active;
}
// outer joins require some extra processing
if (rse->rse_jointype != blr_inner) {
rsb = gen_outer(tdbb, opt, rse, rivers_stack, &sort, &project);
}
else {
bool sort_present = (sort);
bool outer_rivers = false;
jrd_nod* const saved_sort_node = sort;
// AB: If previous rsb's are already on the stack we can't use
// an navigational-retrieval for an ORDER BY cause the next
// streams are JOINed to the previous ones
if (rivers_stack.hasData()) {
sort = NULL;
outer_rivers = true;
// AB: We could already have multiple rivers at this
// point so try to do some sort/merging now.
while (rivers_stack.hasMore(1)
&& gen_sort_merge(tdbb, opt, rivers_stack));
// AB: Mark the previous used streams (sub-RecordSelExpr's) again
// as active, because an SORT/MERGE could reset the flags
for (i = 1; i <= sub_streams[0]; i++) {
csb->csb_rpt[sub_streams[i]].csb_flags |= csb_active;
}
}
// attempt to form joins in decreasing order of desirability
fb_assert(streams[0] != 1 || csb->csb_rpt[streams[1]].csb_relation != 0);
gen_join(tdbb, opt, streams, rivers_stack, &sort, &project,
rse->rse_plan);
// If there are multiple rivers, try some sort/merging
while (rivers_stack.hasMore(1)
&& gen_sort_merge(tdbb, opt, rivers_stack));
rsb = make_cross(tdbb, opt, rivers_stack);
// AB: When we have a merge then a previous made ordering with
// an index doesn't guarantee that the result will be in that
// order. So we assigned the sort node back.
// SF BUG # [ 221921 ] ORDER BY has no effect
RecordSource* test_rsb = rsb;
if ((rsb) && (rsb->rsb_type == rsb_boolean) && (rsb->rsb_next)) {
test_rsb = rsb->rsb_next;
}
if ((sort_present && outer_rivers) ||
((test_rsb) && (test_rsb->rsb_type == rsb_merge) && !sort && sort_present)) {
sort = saved_sort_node;
}
// Pick up any residual boolean that may have fallen thru the cracks
rsb = gen_residual_boolean(tdbb, opt, rsb);
}
// if the aggregate was not optimized via an index, get rid of the
// sort and flag the fact to the calling routine
if (aggregate && sort) {
rse->rse_aggregate = NULL;
sort = NULL;
}
// check index usage in all the base streams to ensure
// that any user-specified access plan is followed
for (i = 1; i <= streams[0]; i++) {
check_indices(&csb->csb_rpt[streams[i]]);
}
if (project || sort) {
// Eliminate any duplicate dbkey streams
const UCHAR* const b_end = beds + beds[0];
const UCHAR* const k_end = key_streams + key_streams[0];
UCHAR* k = &key_streams[1];
for (const UCHAR* p2 = k; p2 <= k_end; p2++) {
const UCHAR* q = &beds[1];
while (q <= b_end && *q != *p2) {
q++;
}
if (q > b_end) {
*k++ = *p2;
}
}
key_streams[0] = k - &key_streams[1];
// Handle project clause, if present.
if (project) {
rsb = gen_sort(tdbb, opt, beds, key_streams, rsb, project, true);
}
// Handle sort clause if present
if (sort) {
rsb = gen_sort(tdbb, opt, beds, key_streams, rsb, sort, false);
}
}
// Handle first and/or skip. The skip MUST (if present)
// appear in the rsb list AFTER the first. Since the gen_first and gen_skip
// functions add their nodes at the beginning of the rsb list we MUST call
// gen_skip before gen_first.
//
if (rse->rse_skip) {
rsb = gen_skip(tdbb, opt, rsb, rse->rse_skip);
}
if (rse->rse_first) {
rsb = gen_first(tdbb, opt, rsb, rse->rse_first);
}
// release memory allocated for index descriptions
for (i = 0; i < streams[0]; i++) {
stream = streams[i + 1];
delete csb->csb_rpt[stream].csb_idx;
csb->csb_rpt[stream].csb_idx = 0;
// CVC: The following line added because OPT_compile is recursive, both directly
// and through gen_union(), too. Otherwise, we happen to step on deallocated memory
// and this is the cause of the crashes with indices that have plagued IB since v4.
csb->csb_rpt[stream].csb_indices = 0;
}
DEBUG
// free up memory for optimizer structures
delete opt;
#ifdef OPT_DEBUG
if (opt_debug_file) {
fflush(opt_debug_file);
//fclose(opt_debug_file);
//opt_debug_file = 0;
}
#endif
} // try
catch (const std::exception&) {
for (SSHORT i = 0; i < streams[0]; i++) {
const SSHORT stream = streams[i + 1];
delete csb->csb_rpt[stream].csb_idx;
csb->csb_rpt[stream].csb_idx = 0;
csb->csb_rpt[stream].csb_indices = 0; // Probably needed to be safe
}
delete opt;
throw;
}
if (rse->rse_writelock)
rsb->rsb_flags |= rsb_writelock;
// Assign pointer to list of dependent invariant values
rsb->rsb_invariants = rse->rse_invariants;
return rsb;
}
jrd_nod* OPT_make_dbkey(OptimizerBlk* opt, jrd_nod* boolean, USHORT stream)
{
/**************************************
*
* O P T _ m a k e _ d b k e y
*
**************************************
*
* Functional description
* If boolean is an equality comparison on the proper dbkey,
* make a "bit_dbkey" operator (makes bitmap out of dbkey
* expression.
*
* This is a little hairy, since view dbkeys are expressed as
* concatenations of primitive dbkeys.
*
**************************************/
thread_db* tdbb = JRD_get_thread_data();
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(boolean, type_nod);
/* If this isn't an equality, it isn't even interesting */
if (boolean->nod_type != nod_eql)
return NULL;
/* Find the side of the equality that is potentially a dbkey. If
neither, make the obvious deduction */
jrd_nod* dbkey = boolean->nod_arg[0];
jrd_nod* value = boolean->nod_arg[1];
SLONG n = 0;
if (dbkey->nod_type != nod_dbkey && dbkey->nod_type != nod_concatenate)
{
if (value->nod_type != nod_dbkey &&
value->nod_type != nod_concatenate)
{
return NULL;
}
dbkey = value;
value = boolean->nod_arg[0];
}
/* If the value isn't computable, this has been a waste of time */
CompilerScratch* csb = opt->opt_csb;
if (!computable(csb, value, stream, false, false)) {
return NULL;
}
/* If this is a concatenation, find an appropriate dbkey */
if (dbkey->nod_type == nod_concatenate) {
dbkey = find_dbkey(dbkey, stream, &n);
if (!dbkey) {
return NULL;
}
}
/* Make sure we have the correct stream */
if ((USHORT)(IPTR) dbkey->nod_arg[0] != stream)
return NULL;
/* If this is a dbkey for the appropriate stream, it's invertable */
dbkey = PAR_make_node(tdbb, 2);
dbkey->nod_count = 1;
dbkey->nod_type = nod_bit_dbkey;
dbkey->nod_arg[0] = value;
dbkey->nod_arg[1] = (jrd_nod*) (IPTR) n;
dbkey->nod_impure = CMP_impure(csb, sizeof(impure_inversion));
return dbkey;
}
jrd_nod* OPT_make_index(thread_db* tdbb, OptimizerBlk* opt, jrd_rel* relation,
index_desc* idx)
{
/**************************************
*
* O P T _ m a k e _ i n d e x
*
**************************************
*
* Functional description
* Build node for index scan.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(relation, type_rel);
/* Allocate both a index retrieval node and block. */
jrd_nod* node = make_index_node(tdbb, relation, opt->opt_csb, idx);
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
retrieval->irb_relation = relation;
/* Pick up lower bound segment values */
jrd_nod** lower = retrieval->irb_value;
jrd_nod** upper = retrieval->irb_value + idx->idx_count;
const OptimizerBlk::opt_segment* const end = opt->opt_segments + idx->idx_count;
OptimizerBlk::opt_segment* tail;
if (idx->idx_flags & idx_descending) {
for (tail = opt->opt_segments; tail->opt_lower && tail < end; tail++)
*upper++ = tail->opt_lower;
for (tail = opt->opt_segments; tail->opt_upper && tail < end; tail++)
*lower++ = tail->opt_upper;
retrieval->irb_generic |= irb_descending;
}
else {
for (tail = opt->opt_segments; tail->opt_lower && tail < end; tail++)
*lower++ = tail->opt_lower;
for (tail = opt->opt_segments; tail->opt_upper && tail < end; tail++)
*upper++ = tail->opt_upper;
}
retrieval->irb_lower_count = lower - retrieval->irb_value;
retrieval->irb_upper_count =
(upper - retrieval->irb_value) - idx->idx_count;
bool equiv = false;
for (tail = opt->opt_segments; tail->opt_match && tail < end; tail++)
{
if (tail->opt_match->nod_type == nod_equiv)
{
equiv = true;
break;
}
}
// This index is never used for IS NULL, thus we can ignore NULLs
// already at index scan. But this rule doesn't apply to nod_equiv
// which requires NULLs to be found in the index.
if (!equiv)
{
retrieval->irb_generic |= irb_ignore_null_value_key;
}
/* Check to see if this is really an equality retrieval */
if (retrieval->irb_lower_count == retrieval->irb_upper_count) {
retrieval->irb_generic |= irb_equality;
lower = retrieval->irb_value;
upper = retrieval->irb_value + idx->idx_count;
for (const jrd_nod* const* const end_node = lower + retrieval->irb_lower_count;
lower < end_node;)
{
if (*upper++ != *lower++) {
retrieval->irb_generic &= ~irb_equality;
break;
}
}
}
/* If we are matching less than the full index, this is a partial match */
if (retrieval->irb_upper_count < idx->idx_count)
retrieval->irb_generic |= irb_partial;
/* mark the index as utilized for the purposes of this compile */
idx->idx_runtime_flags |= idx_used;
return node;
}
int OPT_match_index(OptimizerBlk* opt, USHORT stream, index_desc* idx)
{
/**************************************
*
* O P T _ m a t c h _ i n d e x
*
**************************************
*
* Functional description
* Match any active (computable but not consumed) boolean
* conjunctions against a given index. This is used by
* the external relation modules to do index optimization.
* Return the number of matching items.
*
**************************************/
thread_db* tdbb = JRD_get_thread_data();
DEV_BLKCHK(opt, type_opt);
/* If there are not conjunctions, don't waste our time */
if (!opt->opt_base_conjuncts) {
return 0;
}
CompilerScratch* csb = opt->opt_csb;
const OptimizerBlk::opt_conjunct* const opt_end =
opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
USHORT n = 0;
clear_bounds(opt, idx);
for (OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
tail < opt_end; tail++)
{
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
&& computable(csb, node, -1, true, false))
{
n += match_index(tdbb, opt, stream, node, idx);
}
}
return n; // implicit USHORT -> int
}
#ifdef PC_ENGINE
void OPT_set_index(thread_db* tdbb,
jrd_req* request, RecordSource** rsb_ptr, jrd_rel* relation, index_desc* idx)
{
/**************************************
*
* O P T _ s e t _ i n d e x
*
**************************************
*
* Functional description
* Reset the navigational order of a stream.
* Given a sequential or navigational rsb,
* reset the rsb to be a navigational rsb
* on the specified index.
*
**************************************/
DEV_BLKCHK(request, type_req);
DEV_BLKCHK(*rsb_ptr, type_rsb);
DEV_BLKCHK(relation, type_rel);
SET_TDBB(tdbb);
Database* dbb = tdbb->tdbb_database;
RecordSource* old_rsb = *rsb_ptr;
/* fix up a boolean rsb to point to the actual stream rsb */
if (old_rsb->rsb_type == rsb_boolean) {
rsb_ptr = &old_rsb->rsb_next;
old_rsb = old_rsb->rsb_next;
}
/* check if there is an existing inversion for
a boolean expression mapped to an index */
jrd_nod* inversion = NULL;
if (old_rsb->rsb_type == rsb_indexed) {
inversion = (jrd_nod*) old_rsb->rsb_arg[0];
}
else if (old_rsb->rsb_type == rsb_navigate) {
inversion = (jrd_nod*) old_rsb->rsb_arg[RSB_NAV_inversion];
}
/* set up a dummy optimizer block just for the purposes
of the set index, to pass information to subroutines */
OptimizerBlk* opt = FB_NEW(*tdbb->getDefaultPool()) OptimizerBlk(tdbb->getDefaultPool());
opt->opt_g_flags |= opt_g_stream;
/* generate a new rsb for the retrieval, making sure to
preserve the inversion generated for the last rsb; note
that if the bitmap for the inversion has already been
generated, it will be reused since it is already part of
the impure area--I can't think of any reason not to reuse it--deej */
RecordSource* new_rsb;
if (idx) {
new_rsb = gen_nav_rsb(tdbb, opt, old_rsb->rsb_stream, relation, 0, idx
#ifdef SCROLLABLE_CURSORS
, RSE_get_forward
#endif
);
new_rsb->rsb_arg[RSB_NAV_inversion] = (RecordSource*) inversion;
new_rsb->rsb_cardinality = old_rsb->rsb_cardinality;
}
else {
new_rsb = gen_rsb(tdbb, opt, 0, inversion, old_rsb->rsb_stream,
relation, 0, 0, (float) old_rsb->rsb_cardinality);
}
/* point the impure area of the new rsb to the impure area of the
old; since impure area is pre-allocated it would be difficult
to change now, so just use the same area; NOTE: this implies
that we must take some pains to ensure that the impure area is
always large enough to handle a maximum-key index */
new_rsb->rsb_impure = old_rsb->rsb_impure;
/* find index node if the old rsb was navigational */
jrd_nod* index_node = NULL;
if (old_rsb->rsb_type == rsb_navigate) {
index_node = (jrd_nod*) old_rsb->rsb_arg[RSB_NAV_index];
}
/* if the new rsb is navigational, set up impure space in request
for new index node; to convert from non-navigational to navigational,
we need to adjust the impure area upwards to make room for an impure_inversion
structure, and vice versa to convert the other way */
if (idx) {
jrd_nod* new_index_node = (jrd_nod*) new_rsb->rsb_arg[RSB_NAV_index];
if (old_rsb->rsb_type == rsb_navigate)
new_index_node->nod_impure = index_node->nod_impure;
else {
new_index_node->nod_impure = old_rsb->rsb_impure;
new_rsb->rsb_impure += sizeof(impure_inversion);
}
}
else if (old_rsb->rsb_type == rsb_navigate) {
new_rsb->rsb_impure -= sizeof(impure_inversion);
}
/* if there was a previous index, release its lock
and remove its resource from the request */
if (old_rsb->rsb_type == rsb_navigate) {
IndexRetrieval* retrieval =
(IndexRetrieval*) index_node->nod_arg[e_idx_retrieval];
const USHORT index_id = retrieval->irb_index;
IndexLock* index = CMP_get_index_lock(tdbb, relation, index_id);
if (index) {
if (index->idl_count)
--index->idl_count;
if (!index->idl_count) {
LCK_release(tdbb, index->idl_lock);
}
}
CMP_release_resource(&request->req_resources, Resource::rsc_index, index_id);
}
/* get lock on new index */
if (idx) {
IndexLock* index = CMP_get_index_lock(tdbb, relation, idx->idx_id);
if (index) {
if (!index->idl_count) {
LCK_lock_non_blocking(tdbb, index->idl_lock, LCK_SR, LCK_WAIT);
}
++index->idl_count;
}
}
/* go out to the vector which stores all rsbs for the
request, and replace the old with the new */
for (size_t i = 0; i < request->req_fors.getCount(); i++) {
if (request->req_fors[i] == old_rsb) {
request->req_fors[i] = new_rsb;
break;
}
}
/* release unneeded blocks */
delete opt;
if (index_node) {
delete index_node;
}
delete old_rsb;
*rsb_ptr = new_rsb;
}
#endif
static bool augment_stack(jrd_nod* node, NodeStack& stack)
{
/**************************************
*
* a u g m e n t _ s t a c k
*
**************************************
*
* Functional description
* Add node to stack unless node is already on stack.
*
**************************************/
DEV_BLKCHK(node, type_nod);
for (NodeStack::const_iterator temp(stack); temp.hasData(); ++temp) {
if (node_equality(node, temp.object())) {
return false;
}
}
stack.push(node);
return true;
}
static UINT64 calculate_priority_level(const OptimizerBlk* opt, const index_desc* idx)
{
/**************************************
*
* c a l c u l a t e _ p r i o r i t y _ l e v e l
*
**************************************
*
* Functional description
* Return an calculated value based on
* how nodes where matched on the index.
* Before calling this function the
* match_index function must be called first!
*
**************************************/
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
// Count how many fields can be used in this index and
// count the maximum equals that matches at the begin.
USHORT idx_eql_count = 0;
USHORT idx_field_count = 0;
const OptimizerBlk::opt_segment* idx_tail = opt->opt_segments;
const OptimizerBlk::opt_segment* const idx_end = idx_tail + idx->idx_count;
for (;idx_tail < idx_end &&
(idx_tail->opt_lower || idx_tail->opt_upper); idx_tail++)
{
idx_field_count++;
const jrd_nod* node = idx_tail->opt_match;
if (node->nod_type == nod_eql) {
idx_eql_count++;
}
else {
break;
}
}
// Note: dbb->dbb_max_idx = 1022 for the largest supported page of 16K and
// 62 for the smallest page of 1K
const UINT64 max_idx = JRD_get_thread_data()->tdbb_database->dbb_max_idx + 1;
UINT64 unique_prefix = 0;
if ((idx->idx_flags & idx_unique) && (idx_eql_count == idx->idx_count)) {
unique_prefix = (max_idx - idx->idx_count) * max_idx * max_idx * max_idx;
}
// Calculate our priority level.
return unique_prefix + ((idx_eql_count * max_idx * max_idx) +
(idx_field_count * max_idx) + (max_idx - idx->idx_count));
}
else {
return LOWEST_PRIORITY_LEVEL;
}
}
static void check_indices(const CompilerScratch::csb_repeat* csb_tail)
{
/**************************************
*
* c h e c k _ i n d i c e s
*
**************************************
*
* Functional description
* Check to make sure that the user-specified
* indices were actually utilized by the optimizer.
*
**************************************/
thread_db* tdbb = JRD_get_thread_data();
const jrd_nod* plan = csb_tail->csb_plan;
if (!plan) {
return;
}
if (plan->nod_type != nod_retrieve) {
return;
}
const jrd_rel* relation = csb_tail->csb_relation;
/* if there were no indices fetched at all but the
user specified some, error out using the first
index specified */
const jrd_nod* access_type = 0;
if (!csb_tail->csb_indices &&
(access_type = plan->nod_arg[e_retrieve_access_type]))
{
/* index %s cannot be used in the specified plan */
ERR_post(isc_index_unused, isc_arg_string, access_type->nod_arg[2],
0);
}
/* check to make sure that all indices are either used or marked not to be used,
and that there are no unused navigational indices */
SqlIdentifier index_name;
const index_desc* idx = csb_tail->csb_idx->items;
for (USHORT i = 0; i < csb_tail->csb_indices; i++) {
if (!(idx->idx_runtime_flags & (idx_plan_dont_use | idx_used)) ||
((idx->idx_runtime_flags & idx_plan_navigate)
&& !(idx->idx_runtime_flags & idx_navigate)))
{
if (!
(idx->idx_runtime_flags &
(idx_plan_missing | idx_plan_starts)))
{
if (relation) {
MET_lookup_index(tdbb, index_name, relation->rel_name,
(USHORT) (idx->idx_id + 1));
}
else {
index_name[0] = 0;
}
/* index %s cannot be used in the specified plan */
ERR_post(isc_index_unused, isc_arg_string,
ERR_cstring(index_name), 0);
}
}
++idx;
}
}
static bool check_relationship(const OptimizerBlk* opt, USHORT position, USHORT stream)
{
/**************************************
*
* c h e c k _ r e l a t i o n s h i p
*
**************************************
*
* Functional description
* Check for a potential indexed relationship.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
const OptimizerBlk::opt_stream* tail = opt->opt_streams.begin();
for (const OptimizerBlk::opt_stream* const end = tail + position; tail < end; tail++)
{
const USHORT n = tail->opt_stream_number;
for (const IndexedRelationship* relationship = opt->opt_streams[n].opt_relationships;
relationship;
relationship = relationship->irl_next)
{
if (stream == relationship->irl_stream) {
return true;
}
}
}
return false;
}
static void check_sorts(RecordSelExpr* rse)
{
/**************************************
*
* c h e c k _ s o r t s
*
**************************************
*
* Functional description
* Try to optimize out unnecessary sorting.
*
**************************************/
DEV_BLKCHK(rse, type_nod);
jrd_nod* sort = rse->rse_sorted;
jrd_nod* project = rse->rse_projection;
// check if a GROUP BY exists using the same fields as the project or sort:
// if so, the projection can be eliminated; if no projection exists, then
// the sort can be eliminated.
jrd_nod *group, *sub_rse;
if ((project || sort) &&
(rse->rse_count == 1) &&
(sub_rse = rse->rse_relation[0]) &&
(sub_rse->nod_type == nod_aggregate) &&
(group = sub_rse->nod_arg[e_agg_group]))
{
// if all the fields of the project are the same as all the fields
// of the group by, get rid of the project.
if (project && (project->nod_count == group->nod_count)) {
jrd_nod** project_ptr = project->nod_arg;
const jrd_nod* const* const project_end = project_ptr + project->nod_count;
for (; project_ptr < project_end; project_ptr++)
{
const jrd_nod* const* group_ptr = group->nod_arg;
const jrd_nod* const* const group_end = group_ptr + group->nod_count;
for (; group_ptr < group_end; group_ptr++)
{
if (map_equal(*group_ptr, *project_ptr, sub_rse->nod_arg[e_agg_map])) {
break;
}
}
if (group_ptr == group_end) {
break;
}
}
// we can now ignore the project, but in case the project is being done
// in descending order because of an order by, do the group by the same way.
if (project_ptr == project_end) {
set_direction(project, group);
project = rse->rse_projection = NULL;
}
}
// if there is no projection, then we can make a similar optimization
// for sort, except that sort may have fewer fields than group by.
if (!project && sort && (sort->nod_count <= group->nod_count)) {
const jrd_nod* const* sort_ptr = sort->nod_arg;
const jrd_nod* const* const sort_end = sort_ptr + sort->nod_count;
for (; sort_ptr < sort_end; sort_ptr++)
{
const jrd_nod* const* group_ptr = group->nod_arg;
const jrd_nod* const* const group_end = group_ptr + sort->nod_count;
for (; group_ptr < group_end; group_ptr++)
{
if (map_equal(*group_ptr, *sort_ptr, sub_rse->nod_arg[e_agg_map])) {
break;
}
}
if (group_ptr == group_end) {
break;
}
}
// if all the fields in the sort list match the first n fields in the
// project list, we can ignore the sort, but update the sort order
// (ascending/descending) to match that in the sort list
if (sort_ptr == sort_end) {
set_direction(sort, group);
set_position(sort, group, sub_rse->nod_arg[e_agg_map]);
sort = rse->rse_sorted = NULL;
}
}
}
// examine the ORDER BY and DISTINCT clauses; if all the fields in the
// ORDER BY match the first n fields in the DISTINCT in any order, the
// ORDER BY can be removed, changing the fields in the DISTINCT to match
// the ordering of fields in the ORDER BY.
if (sort && project && (sort->nod_count <= project->nod_count)) {
const jrd_nod* const* sort_ptr = sort->nod_arg;
const jrd_nod* const* const sort_end = sort_ptr + sort->nod_count;
for (; sort_ptr < sort_end; sort_ptr++)
{
const jrd_nod* const* project_ptr = project->nod_arg;
const jrd_nod* const* const project_end = project_ptr + sort->nod_count;
for (; project_ptr < project_end; project_ptr++)
{
if ((*sort_ptr)->nod_type == nod_field
&& (*project_ptr)->nod_type == nod_field
&& (*sort_ptr)->nod_arg[e_fld_stream] ==
(*project_ptr)->nod_arg[e_fld_stream]
&& (*sort_ptr)->nod_arg[e_fld_id] ==
(*project_ptr)->nod_arg[e_fld_id])
{
break;
}
}
if (project_ptr == project_end) {
break;
}
}
// if all the fields in the sort list match the first n fields
// in the project list, we can ignore the sort, but update
// the project to match the sort.
if (sort_ptr == sort_end) {
set_direction(sort, project);
set_position(sort, project, NULL);
sort = rse->rse_sorted = NULL;
}
}
}
static void class_mask(USHORT count, jrd_nod** eq_class, ULONG* mask)
{
/**************************************
*
* c l a s s _ m a s k
*
**************************************
*
* Functional description
* Given an sort/merge join equivalence class (vector of node pointers
* of representative values for rivers), return a bit mask of rivers
* with values.
*
**************************************/
#ifdef DEV_BUILD
if (*eq_class) {
DEV_BLKCHK(*eq_class, type_nod);
}
#endif
if (count > MAX_CONJUNCTS) {
ERR_post(isc_optimizer_blk_exc, 0);
/* Msg442: size of optimizer block exceeded */
}
SLONG i;
for (i = 0; i < OPT_STREAM_BITS; i++) {
mask[i] = 0;
}
for (i = 0; i < count; i++, eq_class++) {
if (*eq_class) {
SET_DEP_BIT(mask, i);
DEV_BLKCHK(*eq_class, type_nod);
}
}
}
static void clear_bounds(OptimizerBlk* opt, const index_desc* idx)
{
/**************************************
*
* c l e a r _ b o u n d s
*
**************************************
*
* Functional description
* Clear upper and lower value slots before matching booleans to
* indices.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
const OptimizerBlk::opt_segment* const opt_end = &opt->opt_segments[idx->idx_count];
for (OptimizerBlk::opt_segment* tail = opt->opt_segments; tail < opt_end; tail++) {
tail->opt_lower = NULL;
tail->opt_upper = NULL;
tail->opt_match = NULL;
}
}
static jrd_nod* compose(jrd_nod** node1, jrd_nod* node2, NOD_T node_type)
{
/**************************************
*
* c o m p o s e
*
**************************************
*
* Functional description
* Build and AND out of two conjuncts.
*
**************************************/
DEV_BLKCHK(*node1, type_nod);
DEV_BLKCHK(node2, type_nod);
if (!node2) {
return *node1;
}
if (!*node1) {
return (*node1 = node2);
}
return *node1 = make_binary_node(node_type, *node1, node2, false);
}
static bool computable(CompilerScratch* csb,
jrd_nod* node,
SSHORT stream,
bool idx_use,
bool allowOnlyCurrentStream)
{
/**************************************
*
* c o m p u t a b l e
*
**************************************
*
* Functional description
* See if node is presently computable.
* Note that a field is not computable
* with respect to its own stream.
*
* There are two different uses of computable().
* (a) idx_use == false: when an unused conjunct is to be picked for making
* into a boolean and in making a db_key.
* In this case, a node is said to be computable, if all the streams
* involved in that node are csb_active. The csb_active flag
* defines all the streams available in the current scope of the
* query.
* (b) idx_use == true: to determine if we can use an
* index on the conjunct we have already chosen.
* In order to use an index on a conjunct, it is required that the
* all the streams involved in the conjunct are currently active
* or have been already processed before and made into rivers.
* Because, here we want to differentiate between streams we have
* not yet worked on and those that we have worked on or are currently
* working on.
*
**************************************/
DEV_BLKCHK(csb, type_csb);
DEV_BLKCHK(node, type_nod);
/* Recurse thru interesting sub-nodes */
jrd_nod** ptr = node->nod_arg;
if (node->nod_type == nod_procedure) {
return false;
}
if (node->nod_type == nod_union) {
jrd_nod* clauses = node->nod_arg[e_uni_clauses];
ptr = clauses->nod_arg;
for (const jrd_nod* const* const end = ptr + clauses->nod_count;
ptr < end; ptr += 2)
{
if (!computable(csb, *ptr, stream, idx_use, allowOnlyCurrentStream)) {
return false;
}
}
}
else {
for (const jrd_nod* const* const end = ptr + node->nod_count;
ptr < end; ptr++)
{
if (!computable(csb, *ptr, stream, idx_use, allowOnlyCurrentStream)) {
return false;
}
}
}
RecordSelExpr* rse;
jrd_nod* sub;
jrd_nod* value;
USHORT n;
switch (node->nod_type) {
case nod_field:
n = (USHORT)(IPTR) node->nod_arg[e_fld_stream];
if (allowOnlyCurrentStream) {
if (n != stream) {
return false;
}
}
else {
if (n == stream) {
return false;
}
}
// AB: cbs_made_river has been replaced by find_used_streams()
//if (idx_use &&
// !(csb->csb_rpt[n].csb_flags & (csb_made_river | csb_active)))
return csb->csb_rpt[n].csb_flags & csb_active;
case nod_rec_version:
case nod_dbkey:
n = (USHORT)(IPTR) node->nod_arg[0];
if (allowOnlyCurrentStream) {
if (n != stream) {
return false;
}
}
else {
if (n == stream) {
return false;
}
}
// AB: cbs_made_river has been replaced by find_used_streams()
//if (idx_use &&
// !(csb->csb_rpt[n].
// csb_flags & (csb_made_river | csb_active)))
return csb->csb_rpt[n].csb_flags & csb_active;
case nod_min:
case nod_max:
case nod_average:
case nod_total:
case nod_count:
case nod_from:
if ((sub = node->nod_arg[e_stat_default]) &&
!computable(csb, sub, stream, idx_use, allowOnlyCurrentStream))
{
return false;
}
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
value = node->nod_arg[e_stat_value];
break;
case nod_rse:
rse = (RecordSelExpr*) node;
value = NULL;
break;
case nod_aggregate:
rse = (RecordSelExpr*) node->nod_arg[e_agg_rse];
rse->rse_sorted = node->nod_arg[e_agg_group];
value = NULL;
break;
default:
return true;
}
/* Node is a record selection expression. */
bool result = true;
if ((sub = rse->rse_first) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) {
return false;
}
if ((sub = rse->rse_skip) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) {
return false;
}
/* Set sub-streams of rse active */
const jrd_nod* const* end;
for (ptr = rse->rse_relation, end = ptr + rse->rse_count; ptr < end; ptr++) {
if ((*ptr)->nod_type != nod_rse) {
n = (USHORT)(IPTR) (*ptr)->nod_arg[STREAM_INDEX((*ptr))];
csb->csb_rpt[n].csb_flags |= csb_active;
}
}
/* Check sub-stream */
if (((sub = rse->rse_boolean) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) ||
((sub = rse->rse_sorted) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)) ||
((sub = rse->rse_projection) && !computable(csb, sub, stream, idx_use, allowOnlyCurrentStream)))
{
result = false;
}
for (ptr = rse->rse_relation, end = ptr + rse->rse_count;
((ptr < end) && (result)); ptr++)
{
if ((*ptr)->nod_type != nod_rse) {
if (!computable(csb, (*ptr), stream, idx_use, allowOnlyCurrentStream)) {
result = false;
}
}
}
/* Check value expression, if any */
if (result && value && !computable(csb, value, stream, idx_use, allowOnlyCurrentStream)) {
result = false;
}
/* Reset streams inactive */
for (ptr = rse->rse_relation, end = ptr + rse->rse_count; ptr < end;
ptr++)
{
if ((*ptr)->nod_type != nod_rse)
{
n = (USHORT)(IPTR) (*ptr)->nod_arg[STREAM_INDEX((*ptr))];
csb->csb_rpt[n].csb_flags &= ~csb_active;
}
}
return result;
}
static void compute_dependencies(const jrd_nod* node, ULONG* dependencies)
{
/**************************************
*
* c o m p u t e _ d e p e n d e n c i e s
*
**************************************
*
* Functional description
* Compute stream dependencies for evaluation of an expression.
*
**************************************/
DEV_BLKCHK(node, type_nod);
/* Recurse thru interesting sub-nodes */
const jrd_nod* const* ptr = node->nod_arg;
if (node->nod_type == nod_procedure) {
return;
}
{ // scope for MSVC6
for (const jrd_nod* const* const end = ptr + node->nod_count; ptr < end; ptr++)
{
compute_dependencies(*ptr, dependencies);
}
} // scope
const RecordSelExpr* rse;
const jrd_nod* sub;
const jrd_nod* value;
switch (node->nod_type) {
case nod_field:
{
const SLONG n = (SLONG)(IPTR) node->nod_arg[e_fld_stream];
SET_DEP_BIT(dependencies, n);
return;
}
case nod_rec_version:
case nod_dbkey:
{
const SLONG n = (SLONG)(IPTR) node->nod_arg[0];
SET_DEP_BIT(dependencies, n);
return;
}
case nod_min:
case nod_max:
case nod_average:
case nod_total:
case nod_count:
case nod_from:
if ( (sub = node->nod_arg[e_stat_default]) ) {
compute_dependencies(sub, dependencies);
}
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
value = node->nod_arg[e_stat_value];
break;
case nod_rse:
rse = (RecordSelExpr*) node;
value = NULL;
break;
default:
return;
}
/* Node is a record selection expression. Groan. Ugh. Yuck. */
if ( (sub = rse->rse_first) ) {
compute_dependencies(sub, dependencies);
}
/* Check sub-expressions */
if ( (sub = rse->rse_boolean) ) {
compute_dependencies(sub, dependencies);
}
if ( (sub = rse->rse_sorted) ) {
compute_dependencies(sub, dependencies);
}
if ( (sub = rse->rse_projection) ) {
compute_dependencies(sub, dependencies);
}
/* Check value expression, if any */
if (value) {
compute_dependencies(value, dependencies);
}
/* Reset streams inactive */
ptr = rse->rse_relation;
for (const jrd_nod* const* const end = ptr + rse->rse_count; ptr < end; ptr++)
{
if ((*ptr)->nod_type != nod_rse) {
const SLONG n = (SLONG)(IPTR) (*ptr)->nod_arg[STREAM_INDEX((*ptr))];
CLEAR_DEP_BIT(dependencies, n);
}
}
}
static void compute_dbkey_streams(const CompilerScratch* csb, const jrd_nod* node, UCHAR* streams)
{
/**************************************
*
* c o m p u t e _ d b k e y _ s t r e a m s
*
**************************************
*
* Functional description
* Identify all of the streams for which a
* dbkey may need to be carried through a sort.
*
**************************************/
DEV_BLKCHK(csb, type_csb);
DEV_BLKCHK(node, type_nod);
if (node->nod_type == nod_relation) {
fb_assert(streams[0] < MAX_STREAMS && streams[0] < MAX_UCHAR);
streams[++streams[0]] = (UCHAR)(IPTR) node->nod_arg[e_rel_stream];
}
else if (node->nod_type == nod_union) {
const jrd_nod* clauses = node->nod_arg[e_uni_clauses];
if (clauses->nod_type != nod_procedure) {
const jrd_nod* const* ptr = clauses->nod_arg;
for (const jrd_nod* const* const end = ptr + clauses->nod_count;
ptr < end; ptr += 2)
{
compute_dbkey_streams(csb, *ptr, streams);
}
}
}
else if (node->nod_type == nod_rse) {
const RecordSelExpr* rse = (RecordSelExpr*) node;
const jrd_nod* const* ptr = rse->rse_relation;
for (const jrd_nod* const* const end = ptr + rse->rse_count;
ptr < end; ptr++)
{
compute_dbkey_streams(csb, *ptr, streams);
}
}
}
static void compute_rse_streams(const CompilerScratch* csb, const RecordSelExpr* rse, UCHAR* streams)
{
/**************************************
*
* c o m p u t e _ r s e _ s t r e a m s
*
**************************************
*
* Functional description
* Identify the streams that make up an RecordSelExpr.
*
**************************************/
DEV_BLKCHK(csb, type_csb);
DEV_BLKCHK(rse, type_nod);
const jrd_nod* const* ptr = rse->rse_relation;
for (const jrd_nod* const* const end = ptr + rse->rse_count;
ptr < end; ptr++)
{
const jrd_nod* node = *ptr;
if (node->nod_type != nod_rse) {
fb_assert(streams[0] < MAX_STREAMS && streams[0] < MAX_UCHAR);
streams[++streams[0]] = (UCHAR)(IPTR) node->nod_arg[STREAM_INDEX(node)];
}
else {
compute_rse_streams(csb, (const RecordSelExpr*) node, streams);
}
}
}
static bool check_for_nod_from(const jrd_nod* node)
{
/**************************************
*
* c h e c k _ f o r _ n o d _ f r o m
*
**************************************
*
* Functional description
* Check for nod_from under >=0 nod_cast nodes.
*
**************************************/
if (node->nod_type == nod_from)
return true;
if (node->nod_type == nod_cast)
return check_for_nod_from(node->nod_arg[e_cast_source]);
return false;
}
static SLONG decompose(thread_db* tdbb,
jrd_nod* boolean_node,
NodeStack& stack,
CompilerScratch* csb)
{
/**************************************
*
* d e c o m p o s e
*
**************************************
*
* Functional description
* Decompose a boolean into a stack of conjuctions.
*
**************************************/
DEV_BLKCHK(boolean_node, type_nod);
DEV_BLKCHK(csb, type_csb);
if (boolean_node->nod_type == nod_and) {
return decompose(tdbb, boolean_node->nod_arg[0], stack, csb) +
decompose(tdbb, boolean_node->nod_arg[1], stack, csb);
}
/* turn a between into (a greater than or equal) AND (a less than or equal) */
if (boolean_node->nod_type == nod_between) {
jrd_nod* arg = boolean_node->nod_arg[0];
if (check_for_nod_from(arg)) {
/* Without this ERR_punt(), server was crashing with sub queries
* under "between" predicate, Bug No. 73766 */
ERR_post(isc_optimizer_between_err, 0);
/* Msg 493: Unsupported field type specified in BETWEEN predicate */
}
jrd_nod* node = make_binary_node(nod_geq, arg, boolean_node->nod_arg[1], true);
stack.push(node);
arg = CMP_clone_node(tdbb, csb, arg);
node = make_binary_node(nod_leq, arg, boolean_node->nod_arg[2], true);
stack.push(node);
return 2;
}
/* turn a LIKE into a LIKE and a STARTING WITH, if it starts
with anything other than a pattern-matching character */
jrd_nod* arg;
if ((boolean_node->nod_type == nod_like) &&
(arg = optimize_like(tdbb, boolean_node)))
{
stack.push(make_binary_node(nod_starts,
boolean_node->nod_arg[0], arg, false));
stack.push(boolean_node);
return 2;
}
stack.push(boolean_node);
return 1;
}
static USHORT distribute_equalities(NodeStack& org_stack, CompilerScratch* csb, USHORT base_count)
{
/**************************************
*
* d i s t r i b u t e _ e q u a l i t i e s
*
**************************************
*
* Functional description
* Given a stack of conjunctions, generate some simple
* inferences. In general, find classes of equalities,
* then find operations based on members of those classes.
* If we find any, generate additional conjunctions. In
* short:
*
* If (a == b) and (a $ c) --> (b $ c) for any
* operation '$'.
*
**************************************/
Firebird::ObjectsArray<NodeStack> classes;
Firebird::ObjectsArray<NodeStack>::iterator eq_class;
DEV_BLKCHK(csb, type_csb);
/* Zip thru stack of booleans looking for field equalities */
for (NodeStack::iterator stack1(org_stack); stack1.hasData(); ++stack1) {
jrd_nod* boolean = stack1.object();
if (boolean->nod_type != nod_eql)
continue;
jrd_nod* node1 = boolean->nod_arg[0];
if (node1->nod_type != nod_field)
continue;
jrd_nod* node2 = boolean->nod_arg[1];
if (node2->nod_type != nod_field)
continue;
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class)
{
if (search_stack(node1, *eq_class)) {
augment_stack(node2, *eq_class);
break;
}
else if (search_stack(node2, *eq_class)) {
eq_class->push(node1);
break;
}
}
if (eq_class == classes.end()) {
NodeStack& s = classes.add();
s.push(node1);
s.push(node2);
eq_class = classes.back();
}
}
if (classes.getCount() == 0)
return 0;
/* Make another pass looking for any equality relationships that may
have crept in between classes (this could result from the
sequence (A = B, C = D, B = C) */
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class) {
for (NodeStack::const_iterator stack2(*eq_class); stack2.hasData(); ++stack2) {
for (Firebird::ObjectsArray<NodeStack>::iterator eq_class2(eq_class);
++eq_class2 != classes.end();)
{
if (search_stack(stack2.object(), *eq_class2)) {
DEBUG;
while (eq_class2->hasData()) {
augment_stack(eq_class2->pop(), *eq_class);
}
}
}
}
}
USHORT count = 0;
/* Start by making a pass distributing field equalities */
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class) {
if (eq_class->hasMore(3)) {
for (NodeStack::iterator outer(*eq_class); outer.hasData(); ++outer) {
for (NodeStack::iterator inner(outer); (++inner).hasData(); ) {
jrd_nod* boolean =
make_binary_node(nod_eql, outer.object(),
inner.object(), true);
if ((base_count + count < MAX_CONJUNCTS) &&
augment_stack(boolean, org_stack))
{
DEBUG;
count++;
}
else
delete boolean;
}
}
}
}
/* Now make a second pass looking for non-field equalities */
for (NodeStack::iterator stack3(org_stack); stack3.hasData(); ++stack3) {
jrd_nod* boolean = stack3.object();
if (boolean->nod_type != nod_eql &&
boolean->nod_type != nod_gtr &&
boolean->nod_type != nod_geq &&
boolean->nod_type != nod_leq &&
boolean->nod_type != nod_lss &&
boolean->nod_type != nod_matches &&
boolean->nod_type != nod_contains &&
boolean->nod_type != nod_like)
{
continue;
}
const jrd_nod* node1 = boolean->nod_arg[0];
const jrd_nod* node2 = boolean->nod_arg[1];
bool reverse = false;
if (node1->nod_type != nod_field) {
const jrd_nod* swap_node = node1;
node1 = node2;
node2 = swap_node;
reverse = true;
}
if (node1->nod_type != nod_field) {
continue;
}
if (node2->nod_type != nod_literal &&
node2->nod_type != nod_variable &&
node2->nod_type != nod_argument)
{
continue;
}
for (eq_class = classes.begin(); eq_class != classes.end(); ++eq_class) {
if (search_stack(node1, *eq_class)) {
for (NodeStack::iterator temp(*eq_class); temp.hasData(); ++temp) {
if (!node_equality(node1, temp.object())) {
jrd_nod* arg1;
jrd_nod* arg2;
if (reverse) {
arg1 = boolean->nod_arg[0];
arg2 = temp.object();
}
else {
arg1 = temp.object();
arg2 = boolean->nod_arg[1];
}
/* From the conjuncts X(A,B) and A=C, infer the
* conjunct X(C,B)
*/
jrd_nod* new_node =
make_inference_node(csb, boolean, arg1, arg2);
if ((base_count + count < MAX_CONJUNCTS) &&
augment_stack(new_node, org_stack))
{
count++;
}
}
}
break;
}
}
}
return count;
}
static bool dump_index(const jrd_nod* node,
SCHAR** buffer_ptr, SSHORT* buffer_length)
{
/**************************************
*
* d u m p _ i n d e x
*
**************************************
*
* Functional description
* Dump an index inversion tree to
* an info buffer.
*
**************************************/
thread_db* tdbb = JRD_get_thread_data();
DEV_BLKCHK(node, type_nod);
SCHAR* buffer = *buffer_ptr;
if (--(*buffer_length) < 0) {
return false;
}
// spit out the node type
switch (node->nod_type)
{
case nod_bit_and:
*buffer++ = isc_info_rsb_and;
break;
case nod_bit_or:
case nod_bit_in:
*buffer++ = isc_info_rsb_or;
break;
case nod_bit_dbkey:
*buffer++ = isc_info_rsb_dbkey;
break;
case nod_index:
*buffer++ = isc_info_rsb_index;
break;
}
SqlIdentifier index_name;
// dump sub-nodes or the actual index info
if ((node->nod_type == nod_bit_and) ||
(node->nod_type == nod_bit_or) ||
(node->nod_type == nod_bit_in))
{
if (!dump_index(node->nod_arg[0], &buffer, buffer_length)) {
return false;
}
if (!dump_index(node->nod_arg[1], &buffer, buffer_length)) {
return false;
}
}
else if (node->nod_type == nod_index) {
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
MET_lookup_index(tdbb, index_name, retrieval->irb_relation->rel_name,
(USHORT) (retrieval->irb_index + 1));
SSHORT length = strlen(index_name);
*buffer_length -= 1 + length;
if (*buffer_length < 0) {
return false;
}
*buffer++ = (SCHAR) length;
const TEXT* i = index_name;
while (length--) {
*buffer++ = *i++;
}
}
*buffer_ptr = buffer;
return true;
}
static bool dump_rsb(const jrd_req* request,
const RecordSource* rsb, SCHAR** buffer_ptr, SSHORT* buffer_length)
{
/**************************************
*
* d u m p _ r s b
*
**************************************
*
* Functional description
* Returns a formatted access path for
* a particular rsb.
*
**************************************/
SSHORT return_length;
jrd_prc* procedure;
DEV_BLKCHK(rsb, type_rsb);
SCHAR* buffer = *buffer_ptr;
// leave room for the rsb begin, type, and end.
*buffer_length -= 4;
if (*buffer_length < 0) {
return false;
}
*buffer++ = isc_info_rsb_begin;
// dump out the alias or relation name if it exists.
const jrd_rel* relation = rsb->rsb_relation;
USHORT length = 0;
const SCHAR* name = NULL;
const str* alias = rsb->rsb_alias;
if (alias) {
length = alias->str_length;
name = (SCHAR *) alias->str_data;
}
else if (relation) {
length = strlen(relation->rel_name);
name = relation->rel_name;
}
if (name) {
*buffer_length -= 2 + length;
if (*buffer_length < 0) {
return false;
}
*buffer++ = isc_info_rsb_relation;
*buffer++ = (SCHAR) length;
while (length--) {
*buffer++ = *name++;
}
}
/* print out the type followed immediately by any
type-specific data */
*buffer++ = isc_info_rsb_type;
switch (rsb->rsb_type) {
case rsb_indexed:
*buffer++ = isc_info_rsb_indexed;
if (!dump_index((jrd_nod*) rsb->rsb_arg[0], &buffer, buffer_length)) {
return false;
}
break;
case rsb_navigate:
*buffer++ = isc_info_rsb_navigate;
if (!dump_index((jrd_nod*) rsb->rsb_arg[RSB_NAV_index],
&buffer, buffer_length))
{
return false;
}
// dimitr: here we report indicies used to limit
// the navigational-based retrieval
if (rsb->rsb_arg[RSB_NAV_inversion]) {
*buffer_length -= 2;
if (*buffer_length < 0) {
return false;
}
*buffer++ = isc_info_rsb_type;
*buffer++ = isc_info_rsb_indexed;
if (!dump_index((jrd_nod*) rsb->rsb_arg[RSB_NAV_inversion],
&buffer, buffer_length))
{
return false;
}
}
break;
case rsb_sequential:
*buffer++ = isc_info_rsb_sequential;
break;
case rsb_cross:
*buffer++ = isc_info_rsb_cross;
break;
case rsb_sort:
*buffer++ = isc_info_rsb_sort;
break;
case rsb_procedure:
*buffer++ = isc_info_rsb_procedure;
// don't try to print out plans of procedures called by procedures, since
// we could get into a recursive situation; if the customer wants to know
// the plan produced by the sub-procedure, they can invoke it directly.
if (request->req_procedure) {
break;
}
procedure = rsb->rsb_procedure;
if (!procedure || !procedure->prc_request) {
return false;
}
// CVC: This is becoming trickier. There are procedures that don't have a plan
// because they don't access tables. In this case, the engine gives up and swallows
// the whole plan. Not acceptable.
if (procedure->prc_request->req_fors.getCount() == 0) {
const Firebird::string& n = procedure->prc_name;
*buffer_length -= 6 + n.length();
if (*buffer_length < 0) {
return false;
}
*buffer++ = isc_info_rsb_begin;
*buffer++ = isc_info_rsb_relation;
*buffer++ = (SCHAR) n.length();
memcpy(buffer, n.c_str(), n.length());
buffer += n.length();
*buffer++ = isc_info_rsb_type;
*buffer++ = isc_info_rsb_sequential;
*buffer++ = isc_info_rsb_end;
break;
}
if (!OPT_access_path(procedure->prc_request, buffer, *buffer_length,
reinterpret_cast<USHORT*>(&return_length)))
{
return false;
}
*buffer_length -= return_length;
if (*buffer_length < 0) {
return false;
}
buffer += return_length;
break;
case rsb_first:
*buffer++ = isc_info_rsb_first;
break;
case rsb_skip:
*buffer++ = isc_info_rsb_skip;
break;
case rsb_boolean:
*buffer++ = isc_info_rsb_boolean;
break;
case rsb_union:
*buffer++ = isc_info_rsb_union;
break;
case rsb_aggregate:
*buffer++ = isc_info_rsb_aggregate;
break;
case rsb_merge:
*buffer++ = isc_info_rsb_merge;
break;
case rsb_ext_sequential:
*buffer++ = isc_info_rsb_ext_sequential;
break;
case rsb_ext_indexed:
*buffer++ = isc_info_rsb_ext_indexed;
break;
case rsb_ext_dbkey:
*buffer++ = isc_info_rsb_ext_dbkey;
break;
case rsb_left_cross:
*buffer++ = isc_info_rsb_left_cross;
break;
default:
*buffer++ = isc_info_rsb_unknown;
break;
}
// dump out any sub-rsbs; for join-type rses like cross
// and merge, dump out the count of streams first, then
// loop through the substreams and dump them out.
if (--(*buffer_length) < 0) {
return false;
}
const RecordSource* const* ptr;
const RecordSource* const* end;
switch (rsb->rsb_type) {
case rsb_cross:
*buffer++ = (UCHAR) rsb->rsb_count;
ptr = rsb->rsb_arg;
for (end = ptr + rsb->rsb_count; ptr < end; ptr++) {
if (!dump_rsb(request, *ptr, &buffer, buffer_length)) {
return false;
}
}
break;
case rsb_union:
*buffer++ = rsb->rsb_count / 2;
ptr = rsb->rsb_arg;
for (end = ptr + rsb->rsb_count; ptr < end; ptr++) {
if (!dump_rsb(request, *ptr, &buffer, buffer_length)) {
return false;
}
ptr++;
}
break;
case rsb_merge:
*buffer++ = (SCHAR) rsb->rsb_count;
ptr = rsb->rsb_arg;
for (end = ptr + rsb->rsb_count * 2; ptr < end;
ptr += 2)
{
if (!dump_rsb(request, *ptr, &buffer, buffer_length)) {
return false;
}
}
break;
case rsb_left_cross:
*buffer++ = 2;
if (!dump_rsb(request, rsb->rsb_arg[RSB_LEFT_outer], &buffer,
buffer_length))
{
return false;
}
if (!dump_rsb(request, rsb->rsb_arg[RSB_LEFT_inner], &buffer,
buffer_length))
{
return false;
}
break;
default: // Shut up compiler warnings.
break;
}
// dump out the next rsb.
if (rsb->rsb_next) {
if (!dump_rsb(request, rsb->rsb_next, &buffer, buffer_length)) {
return false;
}
}
*buffer++ = isc_info_rsb_end;
*buffer_ptr = buffer;
return true;
}
static bool estimate_cost(thread_db* tdbb,
OptimizerBlk* opt,
USHORT stream,
double *cost, double *resulting_cardinality)
{
/**************************************
*
* e s t i m a t e _ c o s t
*
**************************************
*
* Functional description
* Make an estimate of the cost to fetch a stream. The cost
* is a function of estimated cardinality of the relation, index
* selectivity, and total boolean selectivity. Since none of
* this information is available, the estimates are likely to
* be a bit weak. Return true if the relation is index
* retrievable.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
SET_TDBB(tdbb);
CompilerScratch* csb = opt->opt_csb;
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[stream];
csb_tail->csb_flags |= csb_active;
double cardinality = MAX(csb_tail->csb_cardinality, 10);
double index_selectivity = 1.0;
USHORT indexes = 0, equalities = 0, inequalities = 0, index_hits = 0;
bool unique = false;
ULONG inactivities[OPT_STREAM_BITS];
get_inactivities(csb, inactivities);
// Compute index selectivity. This involves finding the indices
// to be utilized and making a crude guess of selectivities.
if (opt->opt_conjuncts.getCount()) {
index_desc* idx = csb_tail->csb_idx->items;
for (USHORT i = 0; i < csb_tail->csb_indices; i++) {
SSHORT n = 0;
clear_bounds(opt, idx);
const OptimizerBlk::opt_conjunct* const opt_end =
opt->opt_conjuncts.end();
for (const OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
tail < opt_end; tail++)
{
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
!(TEST_DEP_ARRAYS(tail->opt_dependencies, inactivities)))
{
n += match_index(tdbb, opt, stream, node, idx);
}
}
OptimizerBlk::opt_segment* segment = opt->opt_segments;
if (segment->opt_lower || segment->opt_upper) {
indexes++;
USHORT count;
for (count = 0; count < idx->idx_count; count++, segment++) {
if (!segment->opt_lower || segment->opt_lower != segment->opt_upper) {
break;
}
}
double s = idx->idx_selectivity;
if (s <= 0 || s >= 1) {
s = ESTIMATED_SELECTIVITY;
}
if (count == idx->idx_count) {
if (idx->idx_flags & idx_unique) {
unique = true;
s = 1 / cardinality;
}
}
else {
s *= INVERSE_ESTIMATE;
}
index_selectivity *= s;
index_hits += MAX(count, n);
}
++idx;
}
}
// We now known the relation cardinality, the combined index selectivity,
// and the number of index lookups required. From this we can compute the
// cost of executing the record selection expression (cost of index lookups
// plus the number of records fetched).
if (indexes) {
*cost = cardinality * index_selectivity + indexes * INDEX_COST;
}
else {
*cost = cardinality;
}
/* Next, we need to estimate the number of records coming out of the
record stream. This is based on conjunctions without regard to whether
or not they were the result of index operations. */
const OptimizerBlk::opt_conjunct* const opt_end =
opt->opt_conjuncts.end();
for (OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
tail < opt_end; tail++)
{
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
!(TEST_DEP_ARRAYS(tail->opt_dependencies, inactivities)))
{
if (node->nod_type == nod_eql) {
++equalities;
}
else {
++inequalities;
}
tail->opt_conjunct_flags |= opt_conjunct_used;
}
}
double selectivity;
const SSHORT n = inequalities + 3 * (equalities - index_hits);
if (n > 0) {
selectivity = 0.3 / n;
if (selectivity > index_selectivity) {
selectivity = index_selectivity;
}
}
else {
selectivity = index_selectivity;
}
cardinality *= selectivity;
if (unique) {
*resulting_cardinality = cardinality;
}
else {
*resulting_cardinality = MAX(cardinality, 1.0);
}
csb_tail->csb_flags |= csb_active;
// AB: Nice that we return a boolean, but do we ever need it?
return (indexes != 0);
}
static bool expression_contains(const jrd_nod* node, NOD_T node_type)
{
/**************************************
*
* e x p r e s s i o n _ c o n t a i n s
*
**************************************
*
* Functional description
* Search if somewhere in the expression the give
* node_type is buried. Return true if a unknown
* node is passed.
*
**************************************/
DEV_BLKCHK(node, type_nod);
if (!node) {
return false;
}
if (node->nod_type == node_type) {
return true;
}
else {
RecordSelExpr* rse = NULL;
switch (node->nod_type) {
case nod_cast:
return expression_contains(node->nod_arg[e_cast_source], node_type);
case nod_extract:
return expression_contains(node->nod_arg[e_extract_value], node_type);
case nod_function:
return expression_contains(node->nod_arg[e_fun_args], node_type);
case nod_procedure:
return expression_contains(node->nod_arg[e_prc_inputs], node_type);
case nod_any:
case nod_unique:
case nod_ansi_any:
case nod_ansi_all:
case nod_exists:
return expression_contains(node->nod_arg[e_any_rse], node_type);
case nod_field:
case nod_rec_version:
case nod_dbkey:
case nod_argument:
case nod_current_date:
case nod_current_role:
case nod_current_time:
case nod_current_timestamp:
case nod_gen_id:
case nod_gen_id2:
case nod_internal_info:
case nod_literal:
case nod_null:
case nod_user_name:
case nod_variable:
return false;
case nod_rse:
rse = (RecordSelExpr*) node;
break;
case nod_average:
case nod_count:
case nod_count2:
case nod_from:
case nod_max:
case nod_min:
case nod_total:
{
const jrd_nod* nodeDefault = node->nod_arg[e_stat_rse];
if (nodeDefault && expression_contains(nodeDefault, node_type)) {
return true;
}
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
const jrd_nod* value = node->nod_arg[e_stat_value];
if (value && expression_contains(value, node_type)) {
return true;
}
}
break;
case nod_or:
case nod_and:
case nod_add:
case nod_add2:
case nod_agg_average:
case nod_agg_average2:
case nod_agg_average_distinct:
case nod_agg_average_distinct2:
case nod_agg_max:
case nod_agg_min:
case nod_agg_total:
case nod_agg_total2:
case nod_agg_total_distinct:
case nod_agg_total_distinct2:
case nod_concatenate:
case nod_divide:
case nod_divide2:
case nod_multiply:
case nod_multiply2:
case nod_negate:
case nod_subtract:
case nod_subtract2:
case nod_upcase:
case nod_substr:
case nod_like:
case nod_between:
case nod_sleuth:
case nod_missing:
case nod_value_if:
case nod_matches:
case nod_contains:
case nod_starts:
case nod_equiv:
case nod_eql:
case nod_neq:
case nod_geq:
case nod_gtr:
case nod_lss:
case nod_leq:
{
const jrd_nod* const* ptr = node->nod_arg;
// Check all sub-nodes of this node.
for (const jrd_nod* const* const end = ptr + node->nod_count;
ptr < end; ptr++)
{
if (expression_contains(*ptr, node_type)) {
return true;
}
}
return false;
}
default :
return true;
}
if (rse) {
jrd_nod* sub;
if ((sub = rse->rse_first) && expression_contains(sub, node_type)) {
return true;
}
if ((sub = rse->rse_skip) && expression_contains(sub, node_type)) {
return true;
}
if ((sub = rse->rse_boolean) && expression_contains(sub, node_type)) {
return true;
}
if ((sub = rse->rse_sorted) && expression_contains(sub, node_type)) {
return true;
}
if ((sub = rse->rse_projection) && expression_contains(sub, node_type)) {
return true;
}
}
return false;
}
}
static bool expression_contains_stream(const jrd_nod* node, UCHAR stream)
{
/**************************************
*
* e x p r e s s i o n _ c o n t a i n s _ s t r e a m
*
**************************************
*
* Functional description
* Search if somewhere in the expression the given stream
* is used. If a unknown node is found it will return true.
*
**************************************/
DEV_BLKCHK(node, type_nod);
if (!node) {
return false;
}
RecordSelExpr* rse = NULL;
switch (node->nod_type) {
case nod_field:
return ((USHORT)(IPTR) node->nod_arg[e_fld_stream] == stream);
case nod_rec_version:
case nod_dbkey:
return ((USHORT)(IPTR) node->nod_arg[0] == stream);
case nod_cast:
return expression_contains_stream(node->nod_arg[e_cast_source], stream);
case nod_extract:
return expression_contains_stream(node->nod_arg[e_extract_value], stream);
case nod_function:
return expression_contains_stream(node->nod_arg[e_fun_args], stream);
case nod_procedure:
return expression_contains_stream(node->nod_arg[e_prc_inputs], stream);
case nod_any:
case nod_unique:
case nod_ansi_any:
case nod_ansi_all:
case nod_exists:
return expression_contains_stream(node->nod_arg[e_any_rse], stream);
case nod_argument:
case nod_current_date:
case nod_current_role:
case nod_current_time:
case nod_current_timestamp:
case nod_gen_id:
case nod_gen_id2:
case nod_internal_info:
case nod_literal:
case nod_null:
case nod_user_name:
case nod_variable:
return false;
case nod_rse:
rse = (RecordSelExpr*) node;
break;
case nod_average:
case nod_count:
case nod_count2:
case nod_from:
case nod_max:
case nod_min:
case nod_total:
{
const jrd_nod* nodeDefault = node->nod_arg[e_stat_rse];
if (nodeDefault && expression_contains_stream(nodeDefault, stream)) {
return true;
}
rse = (RecordSelExpr*) node->nod_arg[e_stat_rse];
const jrd_nod* value = node->nod_arg[e_stat_value];
if (value && expression_contains_stream(value, stream)) {
return true;
}
}
break;
// go into the node arguments
case nod_add:
case nod_add2:
case nod_agg_average:
case nod_agg_average2:
case nod_agg_average_distinct:
case nod_agg_average_distinct2:
case nod_agg_max:
case nod_agg_min:
case nod_agg_total:
case nod_agg_total2:
case nod_agg_total_distinct:
case nod_agg_total_distinct2:
case nod_concatenate:
case nod_divide:
case nod_divide2:
case nod_multiply:
case nod_multiply2:
case nod_negate:
case nod_subtract:
case nod_subtract2:
case nod_upcase:
case nod_substr:
case nod_like:
case nod_between:
case nod_sleuth:
case nod_missing:
case nod_value_if:
case nod_matches:
case nod_contains:
case nod_starts:
case nod_equiv:
case nod_eql:
case nod_neq:
case nod_geq:
case nod_gtr:
case nod_lss:
case nod_leq:
{
const jrd_nod* const* ptr = node->nod_arg;
// Check all sub-nodes of this node.
for (const jrd_nod* const* const end = ptr + node->nod_count;
ptr < end; ptr++)
{
if (expression_contains_stream(*ptr, stream)) {
return true;
}
}
return false;
}
default :
return true;
}
if (rse) {
jrd_nod* sub;
if ((sub = rse->rse_first) && expression_contains_stream(sub, stream)) {
return true;
}
if ((sub = rse->rse_skip) && expression_contains_stream(sub, stream)) {
return true;
}
if ((sub = rse->rse_boolean) && expression_contains_stream(sub, stream)) {
return true;
}
if ((sub = rse->rse_sorted) && expression_contains_stream(sub, stream)) {
return true;
}
if ((sub = rse->rse_projection) && expression_contains_stream(sub, stream)) {
return true;
}
}
return false;
}
#ifdef EXPRESSION_INDICES
// Try to merge this function with node_equality() into 1 function.
static bool expression_equal(thread_db* tdbb, OptimizerBlk* opt,
const index_desc* idx, jrd_nod* node,
USHORT stream)
{
/**************************************
*
* e x p r e s s i o n _ e q u a l
*
**************************************
*
* Functional description
* Wrapper for expression_equal2().
*
**************************************/
DEV_BLKCHK(node, type_nod);
SET_TDBB(tdbb);
if (idx && idx->idx_expression_request && idx->idx_expression)
{
fb_assert(idx->idx_flags & idx_expressn);
fb_assert(idx->idx_expression_request->req_caller == NULL);
idx->idx_expression_request->req_caller = tdbb->tdbb_request;
tdbb->tdbb_request = idx->idx_expression_request;
bool result = false;
{
Jrd::ContextPoolHolder context(tdbb, tdbb->tdbb_request->req_pool);
result = expression_equal2(tdbb, opt, idx->idx_expression,
node, stream);
}
tdbb->tdbb_request = idx->idx_expression_request->req_caller;
idx->idx_expression_request->req_caller = NULL;
return result;
}
else
return false;
}
static bool expression_equal2(thread_db* tdbb, OptimizerBlk* opt,
jrd_nod* node1, jrd_nod* node2,
USHORT stream)
{
/**************************************
*
* e x p r e s s i o n _ e q u a l 2
*
**************************************
*
* Functional description
* Determine if two expression trees are the same for
* the purposes of matching one half of a boolean expression
* to an index.
*
**************************************/
DEV_BLKCHK(node1, type_nod);
DEV_BLKCHK(node2, type_nod);
SET_TDBB(tdbb);
if (!node1 || !node2)
{
BUGCHECK(303); // msg 303 Invalid expression for evaluation.
}
if (node1->nod_type != node2->nod_type)
{
dsc dsc1, dsc2;
dsc *desc1 = &dsc1, *desc2 = &dsc2;
if (node1->nod_type == nod_cast && node2->nod_type == nod_field)
{
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
if (DSC_EQUIV(desc1, desc2) &&
expression_equal2(tdbb, opt, node1->nod_arg[e_cast_source],
node2, stream))
{
return true;
}
}
if (node1->nod_type == nod_field && node2->nod_type == nod_cast)
{
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
if (DSC_EQUIV(desc1, desc2) &&
expression_equal2(tdbb, opt, node1,
node2->nod_arg[e_cast_source], stream))
{
return true;
}
}
return false;
}
switch (node1->nod_type) {
case nod_add:
case nod_multiply:
case nod_add2:
case nod_multiply2:
case nod_equiv:
case nod_eql:
case nod_neq:
case nod_and:
case nod_or:
// A+B is equivilant to B+A, ditto A*B==B*A
// Note: If one expression is A+B+C, but the other is B+C+A we won't
// necessarily match them.
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
node2->nod_arg[1], stream) &&
expression_equal2(tdbb, opt, node1->nod_arg[1],
node2->nod_arg[0], stream))
{
return true;
}
// Fall into ...
case nod_subtract:
case nod_divide:
case nod_subtract2:
case nod_divide2:
case nod_concatenate:
// TODO match A > B to B <= A, etc
case nod_gtr:
case nod_geq:
case nod_leq:
case nod_lss:
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
node2->nod_arg[0], stream) &&
expression_equal2(tdbb, opt, node1->nod_arg[1],
node2->nod_arg[1], stream))
{
return true;
}
break;
case nod_rec_version:
case nod_dbkey:
if (node1->nod_arg[0] == node2->nod_arg[0])
{
return true;
}
break;
case nod_field:
{
const USHORT fld_stream = (USHORT)(IPTR) node2->nod_arg[e_fld_stream];
if ((node1->nod_arg[e_fld_id] == node2->nod_arg[e_fld_id]) &&
(fld_stream == stream))
{
/*
dsc dsc1, dsc2;
dsc *desc1 = &dsc1, *desc2 = &dsc2;
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
if (DSC_GET_COLLATE(desc1) == DSC_GET_COLLATE(desc2))
*/
return true;
}
}
break;
case nod_function:
if (node1->nod_arg[e_fun_function] &&
(node1->nod_arg[e_fun_function] == node2->nod_arg[e_fun_function]) &&
expression_equal2(tdbb, opt, node1->nod_arg[e_fun_args],
node2->nod_arg[e_fun_args], stream))
{
return true;
}
break;
case nod_literal:
{
const dsc* desc1 = EVL_expr(tdbb, node1);
const dsc* desc2 = EVL_expr(tdbb, node2);
if (desc1 && desc2 && !MOV_compare(desc1, desc2))
{
return true;
}
}
break;
case nod_null:
case nod_user_name:
case nod_current_role:
case nod_current_time:
case nod_current_date:
case nod_current_timestamp:
return true;
case nod_between:
case nod_like:
case nod_missing:
case nod_any:
case nod_ansi_any:
case nod_ansi_all:
case nod_not:
case nod_unique:
case nod_value_if:
case nod_substr:
{
if (node1->nod_count != node2->nod_count)
{
return false;
}
for (int i = 0; i < node1->nod_count; ++i)
{
if (!expression_equal2(tdbb, opt, node1->nod_arg[i],
node2->nod_arg[i], stream))
{
return false;
}
}
return true;
}
break;
case nod_gen_id:
case nod_gen_id2:
if (node1->nod_arg[e_gen_id] == node2->nod_arg[e_gen_id])
{
return true;
}
break;
case nod_negate:
case nod_internal_info:
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
node2->nod_arg[0], stream))
{
return true;
}
break;
case nod_upcase:
if (expression_equal2(tdbb, opt, node1->nod_arg[0],
node2->nod_arg[0], stream))
{
/*
dsc dsc1, dsc2;
dsc *desc1 = &dsc1, *desc2 = &dsc2;
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
if (DSC_GET_COLLATE(desc1) == DSC_GET_COLLATE(desc2))
*/
return true;
}
break;
case nod_cast:
{
dsc dsc1, dsc2;
dsc *desc1 = &dsc1, *desc2 = &dsc2;
CMP_get_desc(tdbb, opt->opt_csb, node1, desc1);
CMP_get_desc(tdbb, opt->opt_csb, node2, desc2);
if (DSC_EQUIV(desc1, desc2) &&
expression_equal2(tdbb, opt, node1->nod_arg[e_cast_source],
node2->nod_arg[e_cast_source], stream))
{
return true;
}
}
break;
case nod_extract:
if (node1->nod_arg[e_extract_part] == node2->nod_arg[e_extract_part] &&
expression_equal2(tdbb, opt, node1->nod_arg[e_extract_value],
node2->nod_arg[e_extract_value], stream))
{
return true;
}
break;
case nod_list:
{
jrd_nod** ptr1 = node1->nod_arg;
jrd_nod** ptr2 = node2->nod_arg;
if (node1->nod_count != node2->nod_count)
{
return false;
}
ULONG count = node1->nod_count;
while (count--)
{
if (!expression_equal2(tdbb, opt, *ptr1++, *ptr2++, stream))
{
return false;
}
}
return true;
}
// AB: New nodes has to be added
default:
break;
}
return false;
}
#endif
static void find_best(thread_db* tdbb,
OptimizerBlk* opt,
USHORT stream,
USHORT position,
UCHAR* streams,
const jrd_nod* plan_node,
double cost,
double cardinality)
{
/**************************************
*
* f i n d _ b e s t
*
**************************************
*
* Functional description
* Find the best join from the passed "stream" to
* the remaining "streams" in the RecordSelExpr. This routine
* uses recursion to successively consider all
* possible join orders which use indexed
* relationships to form joins.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(plan_node, type_nod);
#ifdef OPT_DEBUG
// this is used only in development so is not in the message file.
if (opt_debug_flag >= DEBUG_PUNT) {
ERR_post(isc_random, isc_arg_string, "punt", 0);
}
#endif
// if a plan was specified, check that this order matches the order
// that the user provided; this may seem like an ass-backwards way to
// enforce ordering, but I think it is important to follow the same
// code path for SET PLAN as for a normal optimization--it reduces
// chances for bugs to be introduced, and forces the person maintaining
// the optimizer to think about SET PLAN when new features are added --deej
if (plan_node)
{
if (streams[position + 1] == stream)
{
opt->opt_streams[position].opt_best_stream = stream;
++position;
if (position < streams[0])
{
find_best(tdbb, opt, streams[position + 1], position, streams, plan_node,
(double) 0, (double) 1);
}
else
{
opt->opt_best_count = streams[0];
}
}
return;
}
// do some initializations.
CompilerScratch* csb = opt->opt_csb;
csb->csb_rpt[stream].csb_flags |= csb_active;
const UCHAR* stream_end = &streams[1] + streams[0];
opt->opt_streams[position].opt_stream_number = stream;
++position;
OptimizerBlk::opt_stream* order_end = opt->opt_streams.begin() + position;
OptimizerBlk::opt_stream* stream_data = opt->opt_streams.begin() + stream;
// Save the various flag bits from the optimizer block to reset its
// state after each test.
Firebird::HalfStaticArray<UCHAR, OPT_STATIC_ITEMS>
stream_flags(*tdbb->getDefaultPool()), conjunct_flags(*tdbb->getDefaultPool());
stream_flags.grow(csb->csb_n_stream);
conjunct_flags.grow(opt->opt_conjuncts.getCount());
size_t i;
for (i = 0; i < stream_flags.getCount(); i++)
stream_flags[i] = opt->opt_streams[i].opt_stream_flags & opt_stream_used;
for (i = 0; i < conjunct_flags.getCount(); i++)
conjunct_flags[i] = opt->opt_conjuncts[i].opt_conjunct_flags & opt_conjunct_used;
// Compute delta and total estimate cost to fetch this stream.
double position_cost, position_cardinality, new_cost = 0, new_cardinality = 0;
if (!plan_node) {
estimate_cost(tdbb, opt, stream, &position_cost,
&position_cardinality);
new_cost = cost + cardinality * position_cost;
new_cardinality = position_cardinality * cardinality;
}
++opt->opt_combinations;
// If the partial order is either longer than any previous partial order,
// or the same length and cheap, save order as "best".
if (position > opt->opt_best_count ||
(position == opt->opt_best_count && new_cost < opt->opt_best_cost))
{
opt->opt_best_count = position;
opt->opt_best_cost = new_cost;
for (OptimizerBlk::opt_stream* tail = opt->opt_streams.begin(); tail < order_end; tail++) {
tail->opt_best_stream = tail->opt_stream_number;
}
#ifdef OPT_DEBUG
if (opt_debug_flag >= DEBUG_CANDIDATE) {
print_order(opt, position, new_cardinality, new_cost);
}
}
else {
if (opt_debug_flag >= DEBUG_ALL) {
print_order(opt, position, new_cardinality, new_cost);
}
#endif
}
// mark this stream as "used" in the sense that it is already included
// in this particular proposed stream ordering.
stream_data->opt_stream_flags |= opt_stream_used;
bool done = false;
// if we've used up all the streams there's no reason to go any further.
if (position == streams[0]) {
done = true;
}
// We need to prune the combinations to avoid spending all of our time
// recursing through find_best(). Based on experimentation, the cost of
// recursion becomes significant at about a 7 table join. Therefore,
// make a simplifying assumption that if we have already seen a join
// ordering that is lower cost than this one, give up.
if (!done && position > 4) {
OptimizerBlk::opt_stream* tail = &opt->opt_streams[position];
/* If we are the new low-cost join ordering, record that
fact. Otherwise, give up. */
if (tail->opt_best_stream_cost == 0 ||
new_cost < tail->opt_best_stream_cost)
{
tail->opt_best_stream_cost = new_cost;
}
else {
if (!plan_node) {
done = true;
}
}
}
// First, handle any streams that have direct unique indexed
// relationships to this stream. If there are any, we
// won't consider (now) indirect relationships.
if (!done) {
for (IndexedRelationship* relationship = stream_data->opt_relationships;
relationship;
relationship = relationship->irl_next)
{
if (relationship->irl_unique &&
(!(opt->opt_streams[relationship->irl_stream].opt_stream_flags & opt_stream_used)))
{
for (const UCHAR* ptr = streams + 1; ptr < stream_end; ptr++) {
if (*ptr == relationship->irl_stream) {
if (!plan_node) {
done = true;
}
find_best(tdbb, opt, relationship->irl_stream,
position, streams, plan_node, new_cost, new_cardinality);
break;
}
}
}
}
}
// Next, handle any streams that have direct indexed relationships to this
// stream. If there are any, we won't consider (now) indirect relationships
if (!done) {
for (IndexedRelationship* relationship = stream_data->opt_relationships;
relationship;
relationship = relationship->irl_next)
{
if (!(opt->opt_streams[relationship->irl_stream].opt_stream_flags & opt_stream_used))
{
for (const UCHAR* ptr = streams + 1; ptr < stream_end; ptr++) {
if (*ptr == relationship->irl_stream) {
if (!plan_node) {
done = true;
}
find_best(tdbb, opt, relationship->irl_stream,
position, streams, plan_node, new_cost,
new_cardinality);
break;
}
}
}
}
}
// If there were no direct relationships, look for indirect relationships
if (!done) {
for (const UCHAR* ptr = streams + 1; ptr < stream_end; ptr++) {
if (!(opt->opt_streams[*ptr].opt_stream_flags & opt_stream_used) &&
check_relationship(opt, position, *ptr))
{
find_best(tdbb, opt, *ptr, position,
streams, plan_node, new_cost, new_cardinality);
}
}
}
// Clean up from any changes made for compute the cost for this stream
csb->csb_rpt[stream].csb_flags &= ~csb_active;
for (i = 0; i < stream_flags.getCount(); i++)
opt->opt_streams[i].opt_stream_flags &= stream_flags[i];
for (i = 0; i < conjunct_flags.getCount(); i++)
opt->opt_conjuncts[i].opt_conjunct_flags &= conjunct_flags[i];
}
static jrd_nod* find_dbkey(jrd_nod* dbkey, USHORT stream, SLONG* position)
{
/**************************************
*
* f i n d _ d b k e y
*
**************************************
*
* Functional description
* Search a dbkey (possibly a concatenated one) for
* a dbkey for specified stream.
*
**************************************/
DEV_BLKCHK(dbkey, type_nod);
if (dbkey->nod_type == nod_dbkey) {
if ((USHORT)(IPTR) dbkey->nod_arg[0] == stream)
return dbkey;
else {
*position = *position + 1;
return NULL;
}
}
else if (dbkey->nod_type == nod_concatenate) {
jrd_nod** ptr = dbkey->nod_arg;
for (const jrd_nod* const* const end = ptr + dbkey->nod_count;
ptr < end; ptr++)
{
jrd_nod* dbkey_temp = find_dbkey(*ptr, stream, position);
if (dbkey_temp)
return dbkey_temp;
}
}
return NULL;
}
static USHORT find_order(thread_db* tdbb,
OptimizerBlk* opt, UCHAR* streams, const jrd_nod* plan_node)
{
/**************************************
*
* f i n d _ o r d e r
*
**************************************
*
* Functional description
* Given a set of streams, select the "best order" to join them.
* The "best order" is defined as longest, cheapest join order
* (length, of course, takes precedence over cost). The best
* order is developed and returned in the optimization block.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(plan_node, type_nod);
opt->opt_best_count = 0;
// if a plan was specified, the order is already
// present in the streams vector, so we only want
// to try one order.
const UCHAR* stream_end;
if (plan_node) {
stream_end = &streams[1] + 1;
}
else {
stream_end = &streams[1] + streams[0];
}
// Consider each stream as the leftmost stream in the join order;
// for each stream, the best order from that stream is considered,
// and the one which is best is placed into the opt block. Thus
// at the end of this loop the opt block holds the best order.
for (const UCHAR* stream = streams + 1; stream < stream_end; stream++) {
find_best(tdbb, opt, *stream, 0, streams, plan_node,
(double) 0, (double) 1);
}
#ifdef OPT_DEBUG
if (opt_debug_flag >= DEBUG_BEST) {
const OptimizerBlk::opt_stream* const order_end =
opt->opt_streams.begin() + opt->opt_best_count;
fprintf(opt_debug_file,
"find_order() -- best_count: %2.2d, best_streams: ",
opt->opt_best_count);
for (const OptimizerBlk::opt_stream* tail = opt->opt_streams.begin();
tail < order_end; tail++)
{
fprintf(opt_debug_file, "%2.2d ", tail->opt_best_stream);
}
fprintf(opt_debug_file,
"\n\t\t\tbest_cost: %g\tcombinations: %ld\n",
opt->opt_best_cost, opt->opt_combinations);
}
#endif
return opt->opt_best_count;
}
static void find_rsbs(RecordSource* rsb, StreamStack* stream_list, RsbStack* rsb_list)
{
/**************************************
*
* f i n d _ r s b s
*
**************************************
*
* Functional description
* Find all rsbs at or below the current one that map
* to a single stream. Save the stream numbers in a list.
* For unions/aggregates/procedures also save the rsb pointer.
*
**************************************/
#ifdef DEV_BUILD
DEV_BLKCHK(rsb, type_rsb);
#endif
if (!rsb) {
return;
}
RecordSource** ptr;
const RecordSource* const* end;
switch (rsb->rsb_type) {
case rsb_union:
case rsb_aggregate:
case rsb_procedure:
if (rsb_list) {
rsb_list->push(rsb);
}
case rsb_indexed:
case rsb_sequential:
case rsb_ext_sequential:
case rsb_ext_indexed:
// No need to go any farther down with these.
stream_list->push(rsb->rsb_stream);
return;
case rsb_cross:
// Loop through the sub-streams.
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count; ptr < end; ptr++) {
find_rsbs(*ptr, stream_list, rsb_list);
}
break;
case rsb_left_cross:
find_rsbs(rsb->rsb_arg[RSB_LEFT_outer], stream_list, rsb_list);
find_rsbs(rsb->rsb_arg[RSB_LEFT_inner], stream_list, rsb_list);
break;
case rsb_merge:
// Loop through the sub-streams
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count * 2;
ptr < end; ptr += 2)
{
find_rsbs(*ptr, stream_list, rsb_list);
}
break;
default: // Shut up compiler warnings
break;
}
find_rsbs(rsb->rsb_next, stream_list, rsb_list);
}
static void find_used_streams(const RecordSource* rsb, UCHAR* streams)
{
/**************************************
*
* f i n d _ u s e d _ s t r e a m s
*
**************************************
*
* Functional description
* Find all streams through the given rsb
* and add them to the stream list.
*
**************************************/
if (!(rsb)) {
return;
}
const RecordSource* const* ptr;
const RecordSource* const* end;
USHORT stream;
bool found = false;
switch (rsb->rsb_type) {
case rsb_aggregate:
case rsb_ext_indexed:
case rsb_ext_sequential:
case rsb_indexed:
case rsb_navigate:
case rsb_procedure:
case rsb_sequential:
case rsb_union:
stream = rsb->rsb_stream;
found = true;
break;
case rsb_cross:
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count; ptr < end; ptr++) {
find_used_streams(*ptr, streams);
}
break;
case rsb_merge:
for (ptr = rsb->rsb_arg, end = ptr + rsb->rsb_count * 2; ptr < end; ptr += 2) {
find_used_streams(*ptr, streams);
}
break;
case rsb_left_cross:
find_used_streams(rsb->rsb_arg[RSB_LEFT_inner], streams);
find_used_streams(rsb->rsb_arg[RSB_LEFT_outer], streams);
break;
default: // Shut up compiler warnings.
break;
}
if (rsb->rsb_next) {
find_used_streams(rsb->rsb_next, streams);
}
if (found) {
found = false;
for (USHORT i = 1; i <= streams[0]; i++) {
if (stream == streams[i]) {
found = true;
break;
}
}
if (!found) {
streams[++streams[0]] = stream;
}
}
}
static void form_rivers(thread_db* tdbb,
OptimizerBlk* opt,
UCHAR* streams,
RiverStack& river_stack,
jrd_nod** sort_clause,
jrd_nod** project_clause,
jrd_nod* plan_clause)
{
/**************************************
*
* f o r m _ r i v e r s
*
**************************************
*
* Functional description
* Form streams into rivers according
* to the user-specified plan.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
if (sort_clause) {
DEV_BLKCHK(*sort_clause, type_nod);
}
if (project_clause) {
DEV_BLKCHK(*project_clause, type_nod);
}
DEV_BLKCHK(plan_clause, type_nod);
stream_array_t temp;
temp[0] = 0;
USHORT count = plan_clause->nod_count;
// this must be a join or a merge node, so go through
// the substreams and place them into the temp vector
// for formation into a river.
jrd_nod* plan_node = 0;
jrd_nod** ptr = plan_clause->nod_arg;
for (const jrd_nod* const* const end = ptr + count; ptr < end; ptr++) {
plan_node = *ptr;
if (plan_node->nod_type == nod_merge || plan_node->nod_type == nod_join) {
form_rivers(tdbb, opt, streams, river_stack, sort_clause,
project_clause, plan_node);
continue;
}
// at this point we must have a retrieval node, so put
// the stream into the river.
temp[0]++;
const jrd_nod* relation_node = plan_node->nod_arg[e_retrieve_relation];
temp[temp[0]] = (UCHAR)(IPTR) relation_node->nod_arg[e_rel_stream];
}
// just because the user specified a join does not mean that
// we are able to form a river; thus form as many rivers out
// of the join are as necessary to exhaust the streams.
// AB: Only form rivers when any retrieval node is seen, for
// example a MERGE on two JOINs will come with no retrievals
// at this point.
// CVC: Notice "plan_node" is pointing to the last element in the loop above.
// If the loop didn't execute, we had garbage in "plan_node".
if (temp[0] != 0) {
do {
count = find_order(tdbb, opt, temp, plan_node);
} while (form_river
(tdbb, opt, count, streams, temp, river_stack, sort_clause,
project_clause, 0));
}
}
static bool form_river(thread_db* tdbb,
OptimizerBlk* opt,
USHORT count,
UCHAR* streams,
UCHAR* temp,
RiverStack& river_stack,
jrd_nod** sort_clause,
jrd_nod** project_clause,
jrd_nod* plan_clause)
{
/**************************************
*
* f o r m _ r i v e r
*
**************************************
*
* Functional description
* Form streams into rivers (combinations of streams).
*
**************************************/
DEV_BLKCHK(opt, type_opt);
if (sort_clause) {
DEV_BLKCHK(*sort_clause, type_nod);
}
if (project_clause) {
DEV_BLKCHK(*project_clause, type_nod);
}
DEV_BLKCHK(plan_clause, type_nod);
SET_TDBB(tdbb);
CompilerScratch* csb = opt->opt_csb;
// Allocate a river block and move the best order into it.
River* river = FB_NEW_RPT(*tdbb->getDefaultPool(), count) River();
river_stack.push(river);
river->riv_count = (UCHAR) count;
RecordSource* rsb;
RecordSource** ptr;
if (count == 1) {
rsb = NULL;
ptr = &river->riv_rsb;
}
else {
river->riv_rsb = rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), count) RecordSource();
rsb->rsb_type = rsb_cross;
rsb->rsb_count = count;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
ptr = rsb->rsb_arg;
}
UCHAR* stream = river->riv_streams;
const OptimizerBlk::opt_stream* const opt_end = opt->opt_streams.begin() + count;
if (count != streams[0]) {
sort_clause = project_clause = NULL;
}
OptimizerBlk::opt_stream* tail;
for (tail = opt->opt_streams.begin(); tail < opt_end; tail++, stream++, ptr++) {
*stream = (UCHAR) tail->opt_best_stream;
*ptr = gen_retrieval(tdbb, opt, *stream, sort_clause, project_clause,
false, false, NULL);
sort_clause = project_clause = NULL;
}
// determine whether the rsb we just made should be marked as a projection.
if (rsb && rsb->rsb_arg[0]
&& ((RecordSource*) rsb->rsb_arg[0])->rsb_flags & rsb_project)
{
rsb->rsb_flags |= rsb_project;
}
set_made_river(opt, river);
set_inactive(opt, river);
// Reform "temp" from streams not consumed.
stream = temp + 1;
UCHAR* end_stream = stream + temp[0];
if (!(temp[0] -= count)) {
return false;
}
for (UCHAR* t2 = stream; t2 < end_stream; t2++) {
for (tail = opt->opt_streams.begin(); tail < opt_end; tail++) {
if (*t2 == tail->opt_best_stream) {
goto used;
}
}
*stream++ = *t2;
used:;
}
return true;
}
static RecordSource* gen_aggregate(thread_db* tdbb, OptimizerBlk* opt, jrd_nod* node)
{
/**************************************
*
* g e n _ a g g r e g a t e
*
**************************************
*
* Functional description
* Generate an RecordSource (Record Source Block) for each aggregate operation.
* Generate an AggregateSort (Aggregate Sort Block) for each DISTINCT aggregate.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(node, type_nod);
SET_TDBB(tdbb);
CompilerScratch* csb = opt->opt_csb;
RecordSelExpr* rse = (RecordSelExpr*) node->nod_arg[e_agg_rse];
rse->rse_sorted = node->nod_arg[e_agg_group];
// try to optimize MAX and MIN to use an index; for now, optimize
// only the simplest case, although it is probably possible
// to use an index in more complex situations
jrd_nod** ptr;
jrd_nod* agg_operator;
jrd_nod* map = node->nod_arg[e_agg_map];
if ((map->nod_count == 1) &&
(ptr = map->nod_arg) &&
(agg_operator = (*ptr)->nod_arg[e_asgn_from]) &&
(agg_operator->nod_type == nod_agg_min ||
agg_operator->nod_type == nod_agg_max))
{
/* generate a sort block which the optimizer will try to map to an index */
jrd_nod* aggregate = PAR_make_node(tdbb, 3);
aggregate->nod_type = nod_sort;
aggregate->nod_count = 1;
aggregate->nod_arg[0] = agg_operator->nod_arg[e_asgn_from];
/* in the max case, flag the sort as descending */
if (agg_operator->nod_type == nod_agg_max) {
aggregate->nod_arg[1] = (jrd_nod*) TRUE;
}
/* 10-Aug-2004. Nickolay Samofatov
Unneeded nulls seem to be skipped somehow. */
aggregate->nod_arg[2] = (jrd_nod*) rse_nulls_default;
rse->rse_aggregate = aggregate;
}
// allocate and optimize the record source block
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
rsb->rsb_type = rsb_aggregate;
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_STREAMS);
fb_assert((int) (IPTR)node->nod_arg[e_agg_stream] <= MAX_UCHAR);
rsb->rsb_stream = (UCHAR) (IPTR) node->nod_arg[e_agg_stream];
rsb->rsb_format = csb->csb_rpt[rsb->rsb_stream].csb_format;
rsb->rsb_next = OPT_compile(tdbb, csb, rse, NULL);
rsb->rsb_arg[0] = (RecordSource*) node;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
if (rse->rse_aggregate)
{
// The rse_aggregate is still set. That means the optimizer
// was able to match the field to an index, so flag that fact
// so that it can be handled in EVL_group
if (agg_operator->nod_type == nod_agg_min) {
agg_operator->nod_type = nod_agg_min_indexed;
}
else if (agg_operator->nod_type == nod_agg_max) {
agg_operator->nod_type = nod_agg_max_indexed;
}
}
// Now generate a separate AggregateSort (Aggregate Sort Block) for each
// distinct operation;
// note that this should be optimized to use indices if possible
DSC descriptor;
DSC* desc = &descriptor;
ptr = map->nod_arg;
for (const jrd_nod* const* const end = ptr + map->nod_count; ptr < end; ptr++)
{
jrd_nod* from = (*ptr)->nod_arg[e_asgn_from];
if ((from->nod_type == nod_agg_count_distinct) ||
(from->nod_type == nod_agg_total_distinct) ||
(from->nod_type == nod_agg_total_distinct2) ||
(from->nod_type == nod_agg_average_distinct2) ||
(from->nod_type == nod_agg_average_distinct))
{
const USHORT count = asb_delta + 1 +
(sizeof(sort_key_def) + sizeof(jrd_nod**) - 1) / sizeof(jrd_nod**);
AggregateSort* asb = (AggregateSort*) PAR_make_node(tdbb, count);
asb->nod_type = nod_asb;
asb->nod_count = 0;
/* build the sort key definition. Turn varying text and
cstrings into text */
CMP_get_desc(tdbb, csb, from->nod_arg[0], desc);
if (desc->dsc_dtype == dtype_varying) {
desc->dsc_dtype = dtype_text;
desc->dsc_length -= sizeof(USHORT);
}
else if (desc->dsc_dtype == dtype_cstring) {
desc->dsc_dtype = dtype_text;
desc->dsc_length--;
}
sort_key_def* sort_key = asb->asb_key_desc = (sort_key_def*) asb->asb_key_data;
sort_key->skd_offset = 0;
// UCHAR desc->dsc_dtype is always >=0
// fb_assert(desc->dsc_dtype >= 0)
fb_assert(desc->dsc_dtype < FB_NELEM(sort_dtypes));
sort_key->skd_dtype = sort_dtypes[desc->dsc_dtype];
/* as it is legal to have skd_dtype = 0
I have removed these asserts, to avoid
server restarts in debug mode.
FSG 18.Dec.2000
*/
/*fb_assert (sort_key->skd_dtype != 0); */
sort_key->skd_length = desc->dsc_length;
sort_key->skd_flags = SKD_ascending;
asb->nod_impure = CMP_impure(csb, sizeof(impure_agg_sort));
asb->asb_desc = *desc;
from->nod_arg[1] = (jrd_nod*) asb;
from->nod_count = 2;
}
}
return rsb;
}
static RecordSource* gen_boolean(thread_db* tdbb, OptimizerBlk* opt,
RecordSource* prior_rsb, jrd_nod* node)
{
/**************************************
*
* g e n _ b o o l e a n
*
**************************************
*
* Functional description
* Compile and optimize a record selection expression into a
* set of record source blocks (rsb's).
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(node, type_nod);
DEV_BLKCHK(prior_rsb, type_rsb);
SET_TDBB(tdbb);
CompilerScratch* csb = opt->opt_csb;
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
rsb->rsb_count = 1;
rsb->rsb_type = rsb_boolean;
rsb->rsb_next = prior_rsb;
rsb->rsb_arg[0] = (RecordSource*) node;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
return rsb;
}
static RecordSource* gen_first(thread_db* tdbb, OptimizerBlk* opt,
RecordSource* prior_rsb, jrd_nod* node)
{
/**************************************
*
* g e n _ f i r s t
*
**************************************
*
* Functional description
* Compile and optimize a record selection expression into a
* set of record source blocks (rsb's).
*
*
* NOTE: The rsb_first node MUST appear in the rsb list before the
* rsb_skip node. The calling code MUST call gen_first after
* gen_skip.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(prior_rsb, type_rsb);
DEV_BLKCHK(node, type_nod);
SET_TDBB(tdbb);
CompilerScratch* csb = opt->opt_csb;
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
rsb->rsb_count = 1;
rsb->rsb_type = rsb_first;
rsb->rsb_next = prior_rsb;
rsb->rsb_arg[0] = (RecordSource*) node;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb_first_n));
return rsb;
}
static void gen_join(thread_db* tdbb,
OptimizerBlk* opt,
UCHAR* streams,
RiverStack& river_stack,
jrd_nod** sort_clause,
jrd_nod** project_clause,
jrd_nod* plan_clause)
{
/**************************************
*
* g e n _ j o i n
*
**************************************
*
* Functional description
* Find all indexed relationships between streams,
* then form streams into rivers (combinations of
* streams).
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(*sort_clause, type_nod);
DEV_BLKCHK(*project_clause, type_nod);
DEV_BLKCHK(plan_clause, type_nod);
SET_TDBB(tdbb);
Database* dbb = tdbb->tdbb_database;
CompilerScratch* csb = opt->opt_csb;
if (!streams[0]) {
return;
}
// If there is only a single stream, don't bother with a join.
if (streams[0] == 1) {
// if a nod_cardinality references this stream,
// compute the cardinality even though we don't
// need it to optimize retrieval.
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[streams[1]];
fb_assert(csb_tail);
if (csb_tail->csb_flags & csb_compute) {
jrd_rel* relation = csb_tail->csb_relation;
fb_assert(relation);
const Format* format = CMP_format(tdbb, csb, streams[1]);
fb_assert(format);
csb_tail->csb_cardinality =
(float) DPM_data_pages(tdbb, relation) *
dbb->dbb_page_size / format->fmt_length;
}
River* river = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) River();
river->riv_count = 1;
fb_assert(csb->csb_rpt[streams[1]].csb_relation);
river->riv_rsb =
gen_retrieval(tdbb, opt, streams[1], sort_clause, project_clause,
false, false, NULL);
river->riv_streams[0] = streams[1];
river_stack.push(river);
return;
}
// Compute cardinality and indexed relationships for all streams.
const UCHAR* end_stream = streams + 1 + streams[0];
for (UCHAR* stream = streams + 1; stream < end_stream; stream++) {
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[*stream];
fb_assert(csb_tail);
jrd_rel* relation = csb_tail->csb_relation;
fb_assert(relation);
const Format* format = CMP_format(tdbb, csb, *stream);
// if this is an external file, set an arbitrary cardinality;
// if a plan was specified, don't bother computing cardinality;
// otherwise give a rough estimate based on the number of data
// pages times the estimated number of records per page -- note
// this is an upper limit since all pages are probably not full
// and many of the records on page may be back versions.
if (relation->rel_file) {
csb_tail->csb_cardinality = (float) 10000;
}
else if (plan_clause) {
csb_tail->csb_cardinality = (float) 0;
}
else {
fb_assert(format);
csb_tail->csb_cardinality =
(float) DPM_data_pages(tdbb, relation) *
dbb->dbb_page_size / format->fmt_length;
}
// find indexed relationships from this stream to every other stream
OptimizerBlk::opt_stream* tail = opt->opt_streams.begin() + *stream;
csb_tail->csb_flags |= csb_active;
for (UCHAR* t2 = streams + 1; t2 < end_stream; t2++) {
if (*t2 != *stream) {
CompilerScratch::csb_repeat* csb_tail2 = &csb->csb_rpt[*t2];
csb_tail2->csb_flags |= csb_active;
IndexedRelationship* relationship = indexed_relationship(tdbb, opt, *t2);
if (relationship) {
relationship->irl_next = tail->opt_relationships;
tail->opt_relationships = relationship;
relationship->irl_stream = *t2;
}
csb_tail2->csb_flags &= ~csb_active;
}
}
csb_tail->csb_flags &= ~csb_active;
#ifdef OPT_DEBUG
if (opt_debug_flag >= DEBUG_RELATIONSHIPS) {
fprintf(opt_debug_file,
"gen_join () -- relationships from stream %2.2d: ",
*stream);
for (IndexedRelationship* relationship = tail->opt_relationships;
relationship;
relationship = relationship->irl_next)
{
fprintf(opt_debug_file, "%2.2d %s ",
relationship->irl_stream,
(relationship->irl_unique) ? "(unique)" : "");
}
fprintf(opt_debug_file, "\n");
}
#endif
}
// if the user specified a plan, force a join order;
// otherwise try to find one
if (plan_clause) {
form_rivers(tdbb, opt, streams, river_stack, sort_clause,
project_clause, plan_clause);
}
else {
// copy the streams vector to a temporary space to be used
// to form rivers out of streams
stream_array_t temp;
MOVE_FAST(streams, temp, streams[0] + 1);
USHORT count;
do {
count = find_order(tdbb, opt, temp, 0);
} while (form_river
(tdbb, opt, count, streams, temp, river_stack,
sort_clause, project_clause, 0));
}
}
static RecordSource* gen_navigation(thread_db* tdbb,
OptimizerBlk* opt,
USHORT stream,
jrd_rel* relation, str* alias, index_desc* idx, jrd_nod** sort_ptr)
{
/**************************************
*
* g e n _ n a v i g a t i o n
*
**************************************
*
* Functional description
* See if a navigational walk of an index is in order. If so,
* generate the appropriate RecordSource and zap the sort pointer. If
* not, return NULL. Prior to ODS7, missing values sorted in
* the wrong place for ascending indices, so don't use them.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(relation, type_rel);
DEV_BLKCHK(alias, type_str);
DEV_BLKCHK(*sort_ptr, type_nod);
Database* dbb = tdbb->tdbb_database;
// Check sort order against index. If they don't match, give up and
// go home. Also don't bother if we have a non-unique index.
// This is because null values aren't placed in a "good" spot in
// the index in versions prior to V3.2.
jrd_nod* sort = *sort_ptr;
// if the number of fields in the sort is greater than the number of
// fields in the index, the index will not be used to optimize the
// sort--note that in the case where the first field is unique, this
// could be optimized, since the sort will be performed correctly by
// navigating on a unique index on the first field--deej
if (sort->nod_count > idx->idx_count) {
return NULL;
}
// not sure the significance of this magic number; if it's meant to
// signify that we shouldn't navigate on a system table, our catalog
// has grown beyond 16 tables--it doesn't seem like a problem
// to allow navigating through system tables, so I won't bump the
// number up, but I'll leave it at 16 for safety's sake--deej
if (relation->rel_id <= 16) {
return NULL;
}
// if the user-specified access plan for this request didn't
// mention this index, forget it
if ((idx->idx_runtime_flags & idx_plan_dont_use) &&
!(idx->idx_runtime_flags & idx_plan_navigate))
{
return NULL;
}
// check to see if the fields in the sort match the fields in the index
// in the exact same order--we used to check for ascending/descending prior
// to SCROLLABLE_CURSORS, but now descending sorts can use ascending indices
// and vice versa.
#ifdef SCROLLABLE_CURSORS
RSE_GET_MODE mode;
RSE_GET_MODE last_mode = RSE_get_next;
#endif
index_desc::idx_repeat* idx_tail = idx->idx_rpt;
jrd_nod** ptr = sort->nod_arg;
for (const jrd_nod* const* const end = ptr + sort->nod_count; ptr < end;
ptr++, idx_tail++)
{
jrd_nod* node = *ptr;
if (node->nod_type != nod_field
|| (USHORT)(IPTR) node->nod_arg[e_fld_stream] != stream
|| (USHORT)(IPTR) node->nod_arg[e_fld_id] != idx_tail->idx_field
// for ODS11 default nulls placement always may be matched to index
|| (dbb->dbb_ods_version >= ODS_VERSION11 && (
(reinterpret_cast<IPTR>(ptr[2*sort->nod_count]) == rse_nulls_first && ptr[sort->nod_count])
|| (reinterpret_cast<IPTR>(ptr[2*sort->nod_count]) == rse_nulls_last && !ptr[sort->nod_count])))
// for ODS10 and earlier indices always placed nulls at the end of dataset
|| (dbb->dbb_ods_version < ODS_VERSION11 &&
reinterpret_cast<IPTR>(ptr[2*sort->nod_count]) == rse_nulls_first)
#ifdef SCROLLABLE_CURSORS
)
#else
|| (ptr[sort->nod_count]
&& !(idx->idx_flags & idx_descending))
|| (!ptr[sort->nod_count]
&& (idx->idx_flags & idx_descending)) )
#endif
{
return NULL;
}
#ifdef SCROLLABLE_CURSORS
// determine whether we ought to navigate backwards or forwards through
// the index--we can't allow navigating one index in two different directions
// on two different fields at the same time!
mode = ((ptr[sort->nod_count] && !(idx->idx_flags & idx_descending))
|| (!ptr[sort->nod_count]
&& (idx->
idx_flags & idx_descending))) ? RSE_get_backward :
RSE_get_forward;
if (last_mode == RSE_get_next) {
last_mode = mode;
}
else if (last_mode != mode) {
return NULL;
}
#endif
}
// Looks like we can do a navigational walk. Flag that
// we have used this index for navigation, and allocate
// a navigational rsb for it.
*sort_ptr = NULL;
idx->idx_runtime_flags |= idx_navigate;
return gen_nav_rsb(tdbb, opt, stream, relation, alias, idx
#ifdef SCROLLABLE_CURSORS
, mode
#endif
);
}
static RecordSource* gen_nav_rsb(thread_db* tdbb,
OptimizerBlk* opt,
USHORT stream, jrd_rel* relation, str* alias, index_desc* idx
#ifdef SCROLLABLE_CURSORS
, RSE_GET_MODE mode
#endif
)
{
/**************************************
*
* g e n _ n a v _ r s b
*
**************************************
*
* Functional description
* Generate a navigational rsb, either
* for a compile or for a set index.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(relation, type_rel);
DEV_BLKCHK(alias, type_str);
SET_TDBB(tdbb);
USHORT key_length = ROUNDUP(BTR_key_length(relation, idx), sizeof(SLONG));
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), RSB_NAV_count) RecordSource();
rsb->rsb_type = rsb_navigate;
rsb->rsb_relation = relation;
rsb->rsb_stream = (UCHAR) stream;
rsb->rsb_alias = alias;
rsb->rsb_arg[RSB_NAV_index] = (RecordSource*) OPT_make_index(tdbb, opt, relation, idx);
rsb->rsb_arg[RSB_NAV_key_length] = (RecordSource*) (IPTR) key_length;
#ifdef SCROLLABLE_CURSORS
// indicate that the index needs to be navigated in a mirror-image
// fashion; that when the user wants to go backwards we actually go
// forwards and vice versa
if (mode == RSE_get_backward) {
rsb->rsb_flags |= rsb_descending;
}
#endif
// if this is a blr_stream, adjust the allocated impure area
// to be based on the maximum key size so that the index may be
// reset at any time to another index of larger key length
// without adjusting the impure area offsets
if (opt->opt_g_flags & opt_g_stream) {
key_length = MAX_KEY;
}
const USHORT size = nav_rsb_size(rsb, key_length, 0);
rsb->rsb_impure = CMP_impure(opt->opt_csb, size);
return rsb;
}
static RecordSource* gen_outer(thread_db* tdbb,
OptimizerBlk* opt,
RecordSelExpr* rse,
RiverStack& river_stack, jrd_nod** sort_clause, jrd_nod** project_clause)
{
/**************************************
*
* g e n _ o u t e r
*
**************************************
*
* Functional description
* Generate a top level outer join. The "outer" and "inner"
* sub-streams must be handled differently from each other.
* The inner is like other streams. The outer stream isn't
* because conjuncts may not eliminate records from the
* stream. They only determine if a join with an inner
* stream record is to be attempted.
*
**************************************/
struct {
RecordSource* stream_rsb;
USHORT stream_num;
} stream_o, stream_i, *stream_ptr[2];
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(rse, type_nod);
DEV_BLKCHK(*sort_clause, type_nod);
SET_TDBB(tdbb);
// Determine which stream should be outer and which is inner.
// In the case of a left join, the syntactically left stream is the
// outer, and the right stream is the inner. For all others, swap
// the sense of inner and outer, though for a full join it doesn't
// matter and we should probably try both orders to see which is
// more efficient.
if (rse->rse_jointype != blr_left) {
stream_ptr[1] = &stream_o;
stream_ptr[0] = &stream_i;
}
else {
stream_ptr[0] = &stream_o;
stream_ptr[1] = &stream_i;
}
// Loop through the outer join sub-streams in
// reverse order because rivers may have been PUSHed
River* river;
SSHORT i;
jrd_nod* node;
for (i = 1; i >= 0; i--) {
node = rse->rse_relation[i];
if (node->nod_type == nod_union ||
node->nod_type == nod_aggregate ||
node->nod_type == nod_procedure || node->nod_type == nod_rse)
{
river = river_stack.pop();
stream_ptr[i]->stream_rsb = river->riv_rsb;
}
else {
stream_ptr[i]->stream_rsb = NULL;
stream_ptr[i]->stream_num =
(USHORT)(IPTR) node->nod_arg[STREAM_INDEX(node)];
}
}
// Generate rsbs for the sub-streams. For the left sub-stream
// we also will get a boolean back
jrd_nod* boolean = NULL;
jrd_nod* inner_boolean = NULL;
if (!stream_o.stream_rsb) {
stream_o.stream_rsb =
gen_retrieval(tdbb, opt, stream_o.stream_num, sort_clause,
project_clause, true, false, &boolean);
}
// in the case of a full join, we must make sure we don't exclude record from
// the inner stream; otherwise just retrieve it as we would for an inner join
if (!stream_i.stream_rsb)
{
const bool bFullJoin = rse->rse_jointype == blr_full;
const bool bOuter = bFullJoin;
jrd_nod** ppNod = bFullJoin ? &inner_boolean : 0;
stream_i.stream_rsb =
gen_retrieval(tdbb,
opt,
stream_i.stream_num,
sort_clause,
project_clause,
bOuter,
true,
ppNod);
}
// generate a parent boolean rsb for any remaining booleans that
// were not satisfied via an index lookup
stream_i.stream_rsb = gen_residual_boolean(tdbb, opt, stream_i.stream_rsb);
// Allocate and fill in the rsb
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), RSB_LEFT_count) RecordSource();
rsb->rsb_type = rsb_left_cross;
rsb->rsb_count = 2;
rsb->rsb_impure = CMP_impure(opt->opt_csb, sizeof(struct irsb));
rsb->rsb_arg[RSB_LEFT_outer] = stream_o.stream_rsb;
rsb->rsb_arg[RSB_LEFT_inner] = stream_i.stream_rsb;
rsb->rsb_arg[RSB_LEFT_boolean] = (RecordSource*) boolean;
rsb->rsb_arg[RSB_LEFT_inner_boolean] = (RecordSource*) inner_boolean;
rsb->rsb_left_streams =
FB_NEW(*tdbb->getDefaultPool()) StreamStack(*tdbb->getDefaultPool());
rsb->rsb_left_inner_streams =
FB_NEW(*tdbb->getDefaultPool()) StreamStack(*tdbb->getDefaultPool());
rsb->rsb_left_rsbs =
FB_NEW(*tdbb->getDefaultPool()) RsbStack(*tdbb->getDefaultPool());
// find all the outer and inner substreams and push them on a stack.
find_rsbs(stream_i.stream_rsb,
rsb->rsb_left_streams,
rsb->rsb_left_rsbs);
if (rse->rse_jointype == blr_full) {
find_rsbs(stream_o.stream_rsb,
rsb->rsb_left_inner_streams, NULL);
}
return rsb;
}
static RecordSource* gen_procedure(thread_db* tdbb, OptimizerBlk* opt, jrd_nod* node)
{
/**************************************
*
* g e n _ p r o c e d u r e
*
**************************************
*
* Functional description
* Compile and optimize a record selection expression into a
* set of record source blocks (rsb's).
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(node, type_nod);
SET_TDBB(tdbb);
CompilerScratch* csb = opt->opt_csb;
jrd_prc* procedure = MET_lookup_procedure_id(tdbb,
(SSHORT)(IPTR)node->nod_arg[e_prc_procedure], false, false, 0);
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), RSB_PRC_count) RecordSource();
rsb->rsb_type = rsb_procedure;
rsb->rsb_stream = (UCHAR)(IPTR) node->nod_arg[e_prc_stream];
rsb->rsb_procedure = procedure;
rsb->rsb_format = procedure->prc_format;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb_procedure));
rsb->rsb_arg[RSB_PRC_inputs] = (RecordSource*) node->nod_arg[e_prc_inputs];
rsb->rsb_arg[RSB_PRC_in_msg] = (RecordSource*) node->nod_arg[e_prc_in_msg];
return rsb;
}
static RecordSource* gen_residual_boolean(thread_db* tdbb, OptimizerBlk* opt,
RecordSource* prior_rsb)
{
/**************************************
*
* g e n _ r e s i d u a l _ b o o l e a n
*
**************************************
*
* Functional description
* Pick up any residual boolean remaining,
* meaning those that have not been used
* as part of some join. These booleans
* must still be applied to the result stream.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(prior_rsb, type_rsb);
jrd_nod* boolean = NULL;
const OptimizerBlk::opt_conjunct* const opt_end =
opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
for (OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++)
{
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used)) {
compose(&boolean, node, nod_and);
tail->opt_conjunct_flags |= opt_conjunct_used;
}
}
if (!boolean) {
return prior_rsb;
}
return gen_boolean(tdbb, opt, prior_rsb, boolean);
}
static RecordSource* gen_retrieval(thread_db* tdbb,
OptimizerBlk* opt,
SSHORT stream,
jrd_nod** sort_ptr,
jrd_nod** project_ptr,
bool outer_flag,
bool inner_flag,
jrd_nod** return_boolean)
{
/**************************************
*
* g e n _ r e t r i e v a l
*
**************************************
*
* Functional description
* Compile and optimize a record selection expression into a
* set of record source blocks (rsb's).
*
**************************************/
SSHORT i, position;
OptimizerBlk::opt_conjunct* tail;
OptimizerBlk::opt_segment* idx_tail;
bool full = false;
SET_TDBB(tdbb);
#ifdef DEV_BUILD
DEV_BLKCHK(opt, type_opt);
if (sort_ptr) {
DEV_BLKCHK(*sort_ptr, type_nod);
}
if (project_ptr) {
DEV_BLKCHK(*project_ptr, type_nod);
}
if (return_boolean) {
DEV_BLKCHK(*return_boolean, type_nod);
}
#endif
// since a full outer join is a special case for us, as we have 2 outer
// streams, recoginze this condition and set the full flag, also reset the
// inner flag. This condition is only statisfied for the second stream in
// the full join. This condition is only set from the call in gen_outer() in
// case of a full join.
if ((inner_flag == true) && (outer_flag == true)) {
/* the inner flag back to false and set the full flag */
inner_flag = false;
full = true;
}
CompilerScratch* csb = opt->opt_csb;
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[stream];
jrd_rel* relation = csb_tail->csb_relation;
fb_assert(relation);
str* alias = make_alias(tdbb, csb, csb_tail);
csb_tail->csb_flags |= csb_active;
/* bug #8180 reported by Bill Karwin: when a DISTINCT and an ORDER BY
are done on different fields, and the ORDER BY can be mapped to an
index, then the records are returned in the wrong order because the
DISTINCT sort is performed after the navigational walk of the index;
for that reason, we need to de-optimize this case so that the ORDER
BY does not use an index; if desired, we could re-optimize by doing
the DISTINCT first, using a sparse bit map to store the DISTINCT
records, then perform the navigational walk for the ORDER BY and
filter the records out with the sparse bitmap. However, that is a
task for another day. --deej */
/* Bug #8958: comment out anything having to do with mapping a DISTINCT
to an index, for now. The fix for this bug was going to be so involved
that it made more sense to deoptimize this case for the time being until
we can determine whether it really makes sense to optimize a DISTINCT,
or for that matter, and ORDER BY, via an index--there is a case
to be made that it is a deoptimization and more testing needs to be done
to determine that; see more comments in the bug description
*/
if (sort_ptr && *sort_ptr && project_ptr && *project_ptr) {
sort_ptr = NULL;
}
/* Time to find inversions. For each index on the relation
match all unused booleans against the index looking for upper
and lower bounds that can be computed by the index. When
all unused conjunctions are exhausted, see if there is enough
information for an index retrieval. If so, build up an
inversion component of the boolean. */
jrd_nod* inversion = NULL;
// It's recalculated later.
const OptimizerBlk::opt_conjunct* opt_end =
opt->opt_conjuncts.begin() + (inner_flag ? opt->opt_base_missing_conjuncts : opt->opt_conjuncts.getCount());
RecordSource* rsb = NULL;
bool index_used = false;
if (relation->rel_file)
{
rsb = EXT_optimize(opt, stream, sort_ptr ? sort_ptr : project_ptr);
}
else if (opt->opt_conjuncts.getCount() || (sort_ptr && *sort_ptr)
/***|| (project_ptr && *project_ptr)***/
)
{
/* we want to start with indices which have more index segments, attempting to match
all the conjuncts possible to these indices, on the theory that one index matched
to n booleans is more selective and uses less resources than using n indices;
therefore find out which index has the most segments and proceed backwards from there;
NOTE: it's possible that a boolean might be matched to an index and then later it could
have been paired with another boolean to match another index such that both booleans
could be calculated via the index; currently we won't detect that case
*/
Firebird::HalfStaticArray<index_desc*, OPT_STATIC_ITEMS> idx_walk_vector(*tdbb->getDefaultPool());
idx_walk_vector.grow(csb_tail->csb_indices);
index_desc** idx_walk = idx_walk_vector.begin();
Firebird::HalfStaticArray<UINT64, OPT_STATIC_ITEMS> idx_priority_level_vector(*tdbb->getDefaultPool());
idx_priority_level_vector.grow(csb_tail->csb_indices);
UINT64* idx_priority_level = idx_priority_level_vector.begin();
i = 0;
for (index_desc* idx = csb_tail->csb_idx->items; i < csb_tail->csb_indices;
++i, ++idx)
{
idx_walk[i] = idx;
idx_priority_level[i] = LOWEST_PRIORITY_LEVEL;
/* skip this part if the index wasn't specified for indexed
retrieval (still need to look for navigational retrieval) */
if ((idx->idx_runtime_flags & idx_plan_dont_use) &&
!(idx->idx_runtime_flags & idx_plan_navigate))
{
continue;
}
/* go through all the unused conjuncts and see if
any of them are computable using this index */
clear_bounds(opt, idx);
tail = opt->opt_conjuncts.begin();
if (outer_flag) {
tail += opt->opt_base_parent_conjuncts;
}
for (; tail < opt_end; tail++)
{
if (tail->opt_conjunct_flags & opt_conjunct_matched) {
continue;
}
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
computable(csb, node, -1, (inner_flag || outer_flag), false))
{
match_index(tdbb, opt, stream, node, idx);
}
if (node->nod_type == nod_starts)
compose(&inversion,
make_starts(tdbb, opt, relation, node, stream,
idx), nod_bit_and);
if (node->nod_type == nod_missing)
compose(&inversion,
make_missing(tdbb, opt, relation, node,
stream, idx), nod_bit_and);
}
/* look for a navigational retrieval (unless one was already found or
there is no sort block); if no navigational retrieval on this index,
add an indexed retrieval to the inversion tree */
if (!rsb)
{
if (sort_ptr && *sort_ptr)
{
rsb = gen_navigation(tdbb, opt, stream, relation, alias,
idx, sort_ptr);
if (rsb) {
continue;
}
}
/* for now, make sure that we only map a DISTINCT to an index if they contain
the same number of fields; it should be possible to map a DISTINCT to an
index which has extra fields to the right, but we need to add some code
in NAV_get_record() to check when the relevant fields change, rather than
the whole index key */
/***if (project_ptr && *project_ptr)
if ((idx->idx_count == (*project_ptr)->nod_count) &&
(rsb = gen_navigation (tdbb, opt, stream, relation, alias, idx, project_ptr)))
{
rsb->rsb_flags |= rsb_project;
continue;
}***/
}
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
// Calculate the priority level for this index.
idx_priority_level[i] = calculate_priority_level(opt, idx);
}
}
// Sort indices based on the priority level into idx_walk.
SSHORT idx_walk_count =
sort_indices_by_priority(csb_tail, idx_walk, idx_priority_level);
// Walk through the indicies based on earlier calculated count and
// when necessary build the index
Firebird::HalfStaticArray<SSHORT, OPT_STATIC_ITEMS>
conjunct_position_vector(*tdbb->getDefaultPool());
Firebird::HalfStaticArray<OptimizerBlk::opt_conjunct*, OPT_STATIC_ITEMS>
matching_nodes_vector(*tdbb->getDefaultPool());
for (i = 0; i < idx_walk_count; i++)
{
index_desc* idx = idx_walk[i];
if (idx->idx_runtime_flags & idx_plan_dont_use) {
continue;
}
conjunct_position_vector.shrink(0);
matching_nodes_vector.shrink(0);
clear_bounds(opt, idx);
tail = opt->opt_conjuncts.begin();
if (outer_flag) {
tail += opt->opt_base_parent_conjuncts;
}
for (; tail < opt_end; tail++) {
// Test if this conjunction is available for this index.
if (!(tail->opt_conjunct_flags & opt_conjunct_matched)) {
// Setting opt_lower and/or opt_upper values
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used) &&
computable(csb,
node,
-1,
(inner_flag || outer_flag),
false))
{
if (match_index(tdbb, opt, stream, node, idx)) {
position = 0;
idx_tail = opt->opt_segments;
const OptimizerBlk::opt_segment* const idx_end =
idx_tail + idx->idx_count;
for (; idx_tail < idx_end; idx_tail++, position++) {
if (idx_tail->opt_match == node)
break;
}
if (idx_tail >= idx_end && !csb_tail->csb_plan) {
// Nevertheless we have a resulting count
// from match_index, still a node could not
// be assigned, because equal nodes are
// preferred against other ones.
// Flag this node as used, so that no other
// index is used with this bad one.
// example: WHERE (ID = 100) and (ID >= 1)
tail->opt_conjunct_flags |= opt_conjunct_matched;
}
else {
matching_nodes_vector.add(tail);
conjunct_position_vector.add(position);
}
}
}
}
}
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
// Use a different marking if a PLAN was specified, this is
// for backwards compatibility. Juck...
if (csb_tail->csb_plan) {
// Mark only used conjuncts in this index as used
idx_tail = opt->opt_segments;
const OptimizerBlk::opt_segment* const idx_end =
idx_tail + idx->idx_count;
for (; idx_tail < idx_end &&
(idx_tail->opt_lower || idx_tail->opt_upper); idx_tail++)
{
for (tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++) {
if (idx_tail->opt_match == tail->opt_conjunct_node) {
tail->opt_conjunct_flags |= opt_conjunct_matched;
}
}
}
}
else {
// No plan
// Mark all conjuncts that could be calculated against the
// index as used. For example if you have :
// (node1 >= constant) and (node1 <= constant) be sure both
// conjuncts will be marked as opt_conjunct_matched
position = 0;
idx_tail = opt->opt_segments;
const OptimizerBlk::opt_segment* const idx_end =
idx_tail + idx->idx_count;
for (; idx_tail < idx_end &&
(idx_tail->opt_lower || idx_tail->opt_upper);
idx_tail++, position++)
{
for (size_t j = 0; j < conjunct_position_vector.getCount(); j++) {
if (conjunct_position_vector[j] == position) {
matching_nodes_vector[j]->opt_conjunct_flags |= opt_conjunct_matched;
}
}
}
}
jrd_nod* idx_node = OPT_make_index(tdbb, opt, relation, idx);
IndexRetrieval* retrieval =
(IndexRetrieval*) idx_node->nod_arg[e_idx_retrieval];
compose(&inversion, idx_node, nod_bit_and);
idx->idx_runtime_flags |= idx_used_with_and;
index_used = true;
// When we composed a UNIQUE index stop composing, because
// this is the best we can get, but only when full used.
if ((idx->idx_flags & idx_unique) && !(csb_tail->csb_plan) &&
!(retrieval->irb_generic & irb_partial))
{
break; // Go out of idx_walk loop
}
}
}
}
if (outer_flag) {
// Now make another pass thru the outer conjuncts only, finding unused,
// computable booleans. When one is found, roll it into a final
// boolean and mark it used.
*return_boolean = NULL;
opt_end = opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
for (tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++) {
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
&& computable(csb, node, -1, false, false))
{
compose(return_boolean, node, nod_and);
tail->opt_conjunct_flags |= opt_conjunct_used;
}
}
}
// Now make another pass thru the conjuncts finding unused, computable
// booleans. When one is found, roll it into a final boolean and mark
// it used. If a computable boolean didn't match against an index then
// mark the stream to denote unmatched booleans.
jrd_nod* opt_boolean = NULL;
opt_end = opt->opt_conjuncts.begin() + (inner_flag ? opt->opt_base_parent_conjuncts : opt->opt_conjuncts.getCount());
tail = opt->opt_conjuncts.begin();
if (outer_flag) {
tail += opt->opt_base_parent_conjuncts;
}
for (; tail < opt_end; tail++)
{
jrd_nod* node = tail->opt_conjunct_node;
if (!relation->rel_file) {
compose(&inversion, OPT_make_dbkey(opt, node, stream), nod_bit_and);
}
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
&& computable(csb, node, -1, false, false))
{
if (node->nod_type == nod_or) {
compose(&inversion, make_inversion(tdbb, opt, node, stream),
nod_bit_and);
}
// If no index is used then leave other nodes alone, because they
// could be used for building a SORT/MERGE.
if ((inversion && expression_contains_stream(node, stream)) ||
(!inversion && computable(csb, node, stream, false, true)))
{
// Don't allow adding IS NULL conjunction to outer stream
// from parent node, because a FULL OUTER JOIN could return
// wrong results with it.
if (!outer_flag ||
(outer_flag && !expression_contains(node, nod_missing)))
{
compose(&opt_boolean, node, nod_and);
tail->opt_conjunct_flags |= opt_conjunct_used;
if (!outer_flag && !(tail->opt_conjunct_flags & opt_conjunct_matched)) {
csb_tail->csb_flags |= csb_unmatched;
}
}
}
}
}
if (full) {
return gen_rsb(tdbb, opt, rsb, inversion, stream, relation, alias,
*return_boolean, csb_tail->csb_cardinality);
}
else {
return gen_rsb(tdbb, opt, rsb, inversion, stream, relation, alias,
opt_boolean, csb_tail->csb_cardinality);
}
}
static RecordSource* gen_rsb(thread_db* tdbb,
OptimizerBlk* opt,
RecordSource* rsb,
jrd_nod* inversion,
SSHORT stream,
jrd_rel* relation, str* alias, jrd_nod* boolean, float cardinality)
{
/**************************************
*
* g e n _ r s b
*
**************************************
*
* Functional description
* Generate a record source block to handle either a sort or a project.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(rsb, type_rsb);
DEV_BLKCHK(inversion, type_nod);
DEV_BLKCHK(relation, type_rel);
DEV_BLKCHK(alias, type_str);
DEV_BLKCHK(boolean, type_nod);
SET_TDBB(tdbb);
if (rsb) {
if (rsb->rsb_type == rsb_navigate && inversion)
rsb->rsb_arg[RSB_NAV_inversion] = (RecordSource*) inversion;
}
else {
SSHORT size;
if (inversion) {
rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
rsb->rsb_type = rsb_indexed;
rsb->rsb_count = 1;
size = sizeof(struct irsb_index);
rsb->rsb_arg[0] = (RecordSource*) inversion;
}
else {
rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 0) RecordSource();
rsb->rsb_type = rsb_sequential;
size = sizeof(struct irsb);
if (boolean)
opt->opt_csb->csb_rpt[stream].csb_flags |= csb_unmatched;
}
rsb->rsb_stream = (UCHAR) stream;
rsb->rsb_relation = relation;
rsb->rsb_alias = alias;
// if this is a blr_stream, we need to leave room
// in the impure area for a navigational-type rsb;
// even if this is not currently a navigational rsb,
// OPT_set_index() could be used to convert it to one.
if (opt->opt_g_flags & opt_g_stream) {
size = sizeof(impure_inversion);
size = nav_rsb_size(rsb, MAX_KEY, size);
}
rsb->rsb_impure = CMP_impure(opt->opt_csb, size);
}
if (boolean) {
rsb = gen_boolean(tdbb, opt, rsb, boolean);
}
// retain the cardinality for use at runtime by blr_cardinality
rsb->rsb_cardinality = (ULONG) cardinality;
return rsb;
}
static RecordSource* gen_skip(thread_db* tdbb, OptimizerBlk* opt,
RecordSource* prior_rsb, jrd_nod* node)
{
/**************************************
*
* g e n _ s k i p
*
**************************************
*
* Functional description
* Compile and optimize a record selection expression into a
* set of record source blocks (rsb's).
*
* NOTE: The rsb_skip node MUST appear in the rsb list after the
* rsb_first node. The calling code MUST call gen_skip before
* gen_first.
*
**************************************/
DEV_BLKCHK (opt, type_opt);
DEV_BLKCHK (prior_rsb, type_rsb);
DEV_BLKCHK (node, type_nod);
SET_TDBB (tdbb);
CompilerScratch* csb = opt->opt_csb;
// was : rsb = (RecordSource*) ALLOCDV (type_rsb, 1);
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 0) RecordSource();
rsb->rsb_count = 1;
rsb->rsb_type = rsb_skip;
rsb->rsb_next = prior_rsb;
rsb->rsb_arg[0] = (RecordSource*) node;
rsb->rsb_impure = CMP_impure (csb, sizeof (struct irsb_skip_n));
return rsb;
}
static RecordSource* gen_sort(thread_db* tdbb,
OptimizerBlk* opt,
UCHAR * streams,
UCHAR * dbkey_streams,
RecordSource* prior_rsb, jrd_nod* sort, bool project_flag)
{
/**************************************
*
* g e n _ s o r t
*
**************************************
*
* Functional description
* Generate a record source block to handle either a sort or a project.
* The two case are virtual identical -- the only difference is that
* project eliminates duplicates. However, since duplicates are
* recognized and handled by sort, the JRD processing is identical.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(prior_rsb, type_rsb);
DEV_BLKCHK(sort, type_nod);
SET_TDBB(tdbb);
/* We already know the number of keys, but we also need to compute the
total number of fields, keys and non-keys, to be pumped thru sort. Starting
with the number of keys, count the other field referenced. Since a field
is often a key, check for overlap to keep the length of the sort record
down. */
/* Along with the record number, the transaction id of the
* record will also be stored in the sort file. This will
* be used to detect update conflict in read committed
* transactions.
*/
UCHAR* ptr;
dsc descriptor;
CompilerScratch* csb = opt->opt_csb;
USHORT items =
sort->nod_count + (streams[0] * 2) +
(dbkey_streams ? dbkey_streams[0] : 0);
const UCHAR* const end_ptr = streams + streams[0];
const jrd_nod* const* const end_node = sort->nod_arg + sort->nod_count;
Firebird::Stack<SLONG> id_stack;
StreamStack stream_stack;
for (ptr = &streams[1]; ptr <= end_ptr; ptr++) {
UInt32Bitmap::Accessor accessor(csb->csb_rpt[*ptr].csb_fields);
if (accessor.getFirst()) do {
ULONG id = accessor.current();
items++;
id_stack.push(id);
stream_stack.push(*ptr);
for (jrd_nod** node_ptr = sort->nod_arg; node_ptr < end_node; node_ptr++)
{
jrd_nod* node = *node_ptr;
if (node->nod_type == nod_field
&& (USHORT)(IPTR) node->nod_arg[e_fld_stream] == *ptr
&& (USHORT)(IPTR) node->nod_arg[e_fld_id] == id)
{
dsc* desc = &descriptor;
CMP_get_desc(tdbb, csb, node, desc);
/* International type text has a computed key */
if (IS_INTL_DATA(desc))
break;
--items;
id_stack.pop();
stream_stack.pop();
break;
}
}
} while (accessor.getNext());
}
/* Now that we know the number of items, allocate a sort map block. Allocate
it sufficiently large that there is room for a sort key descriptor on the
end. */
const USHORT count = items +
(sizeof(sort_key_def) * 2 * sort->nod_count + sizeof(smb_repeat) -
1) / sizeof(smb_repeat);
SortMap* map = FB_NEW_RPT(*tdbb->getDefaultPool(), count) SortMap();
map->smb_keys = sort->nod_count * 2;
map->smb_count = items;
if (project_flag) {
map->smb_flags |= SMB_project;
}
ULONG map_length = 0;
// Loop thru sort keys building sort keys. Actually, to handle null values
// correctly, two sort keys are made for each field, one for the null flag
// and one for field itself.
smb_repeat* map_item = map->smb_rpt;
sort_key_def* sort_key = (sort_key_def*) & map->smb_rpt[items];
map->smb_key_desc = sort_key;
for (jrd_nod** node_ptr = sort->nod_arg; node_ptr < end_node;
node_ptr++, map_item++)
{
/* Pick up sort key expression. */
jrd_nod* node = *node_ptr;
dsc* desc = &descriptor;
CMP_get_desc(tdbb, csb, node, desc);
/* Allow for "key" forms of International text to grow */
if (IS_INTL_DATA(desc)) {
/* Turn varying text and cstrings into text. */
if (desc->dsc_dtype == dtype_varying) {
desc->dsc_dtype = dtype_text;
desc->dsc_length -= sizeof(USHORT);
}
else if (desc->dsc_dtype == dtype_cstring) {
desc->dsc_dtype = dtype_text;
desc->dsc_length--;
}
desc->dsc_length =
INTL_key_length(tdbb, INTL_INDEX_TYPE(desc),
desc->dsc_length);}
/* Make key for null flag */
#ifndef WORDS_BIGENDIAN
map_length = ROUNDUP(map_length, sizeof(SLONG));
#endif
sort_key->skd_offset = map_item->smb_flag_offset =
(USHORT) map_length++;
sort_key->skd_dtype = SKD_text;
sort_key->skd_length = 1;
// Handle nulls placement
sort_key->skd_flags = SKD_ascending;
if (tdbb->tdbb_database->dbb_ods_version < ODS_VERSION11) {
// Put nulls at the tail for ODS10 and earlier
if ((IPTR)*(node_ptr + sort->nod_count*2) == rse_nulls_first)
sort_key->skd_flags |= SKD_descending;
}
else {
// Have SQL-compliant nulls ordering for ODS11+
if (((IPTR)*(node_ptr + sort->nod_count*2) == rse_nulls_default && !*(node_ptr + sort->nod_count)) ||
(IPTR)*(node_ptr + sort->nod_count*2) == rse_nulls_first)
{
sort_key->skd_flags |= SKD_descending;
}
}
++sort_key;
/* Make key for sort key proper */
#ifndef WORDS_BIGENDIAN
map_length = ROUNDUP(map_length, sizeof(SLONG));
#else
if (desc->dsc_dtype >= dtype_aligned)
map_length =
FB_ALIGN(map_length, type_alignments[desc->dsc_dtype]);
#endif
sort_key->skd_offset = (USHORT) map_length;
sort_key->skd_flags = SKD_ascending;
if (*(node_ptr + sort->nod_count))
sort_key->skd_flags |= SKD_descending;
// UCHAR desc->dsc_dtype is always >=0
// fb_assert(desc->dsc_dtype >= 0);
fb_assert(desc->dsc_dtype < FB_NELEM(sort_dtypes));
sort_key->skd_dtype = sort_dtypes[desc->dsc_dtype];
/*fb_assert (sort_key->skd_dtype != 0); */
if (sort_key->skd_dtype == SKD_varying ||
sort_key->skd_dtype == SKD_cstring)
{
if (desc->dsc_ttype() == ttype_binary)
sort_key->skd_flags |= SKD_binary;
}
sort_key->skd_length = desc->dsc_length;
++sort_key;
map_item->smb_node = node;
map_item->smb_desc = *desc;
map_item->smb_desc.dsc_address = (UCHAR *) (IPTR) map_length;
map_length += desc->dsc_length;
if (node->nod_type == nod_field) {
map_item->smb_stream = (USHORT)(IPTR) node->nod_arg[e_fld_stream];
map_item->smb_field_id = (USHORT)(IPTR) node->nod_arg[e_fld_id];
}
}
map_length = ROUNDUP(map_length, sizeof(SLONG));
map->smb_key_length = (USHORT) map_length >> SHIFTLONG;
USHORT flag_offset = (USHORT) map_length;
map_length += items - sort->nod_count;
/* Now go back and process all to fields involved with the sort. If the
field has already been mentioned as a sort key, don't bother to repeat
it. */
while (stream_stack.hasData()) {
const SLONG id = id_stack.pop();
// AP: why USHORT - we pushed UCHAR
const USHORT stream = stream_stack.pop();
const Format* format = CMP_format(tdbb, csb, stream);
const dsc* desc = &format->fmt_desc[id];
if (id >= format->fmt_count || desc->dsc_length == 0)
IBERROR(157); /* msg 157 cannot sort on a field that does not exist */
if (desc->dsc_dtype >= dtype_aligned)
map_length =
FB_ALIGN(map_length, type_alignments[desc->dsc_dtype]);
map_item->smb_field_id = (SSHORT) id;
map_item->smb_stream = stream;
map_item->smb_flag_offset = flag_offset++;
map_item->smb_desc = *desc;
map_item->smb_desc.dsc_address = (UCHAR *) (IPTR)map_length;
map_length += desc->dsc_length;
map_item++;
}
/* Make fields for record numbers record for all streams */
map_length = ROUNDUP(map_length, sizeof(SLONG));
for (ptr = &streams[1]; ptr <= end_ptr; ptr++, map_item++) {
map_item->smb_field_id = SMB_DBKEY;
map_item->smb_stream = *ptr;
dsc* desc = &map_item->smb_desc;
desc->dsc_dtype = dtype_int64;
desc->dsc_length = sizeof(SINT64);
desc->dsc_address = (UCHAR *)(IPTR)map_length;
map_length += desc->dsc_length;
}
/* Make fields for transaction id of record for all streams */
for (ptr = &streams[1]; ptr <= end_ptr; ptr++, map_item++) {
map_item->smb_field_id = SMB_TRANS_ID;
map_item->smb_stream = *ptr;
dsc* desc = &map_item->smb_desc;
desc->dsc_dtype = dtype_long;
desc->dsc_length = sizeof(SLONG);
desc->dsc_address = (UCHAR *) (IPTR)map_length;
map_length += desc->dsc_length;
}
if (dbkey_streams) {
ptr = &dbkey_streams[1];
for (const UCHAR* const end_ptrL = dbkey_streams + dbkey_streams[0];
ptr <= end_ptrL; ptr++, map_item++)
{
map_item->smb_field_id = SMB_DBKEY;
map_item->smb_stream = *ptr;
dsc* desc = &map_item->smb_desc;
desc->dsc_dtype = dtype_int64;
desc->dsc_length = sizeof(SINT64);
desc->dsc_address = (UCHAR *)(IPTR)map_length;
map_length += desc->dsc_length;
}
}
/* Make fields to store varying and cstring length. */
const sort_key_def* const end_key = sort_key;
for (sort_key = map->smb_key_desc; sort_key < end_key; sort_key++) {
/* fb_assert (sort_key->skd_dtype != 0); */
if (sort_key->skd_dtype == SKD_varying ||
sort_key->skd_dtype == SKD_cstring)
{
sort_key->skd_vary_offset = (USHORT) map_length;
map_length += sizeof(USHORT);
}
}
if (map_length > MAX_SORT_RECORD)
ERR_post(isc_sort_rec_size_err, isc_arg_number, map_length, 0);
/* Msg438: sort record size of %ld bytes is too big */
map->smb_length = (USHORT) map_length;
/* That was most unpleasant. Never the less, it's done (except for
the debugging). All that remains is to build the record source
block for the sort. */
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), 1) RecordSource();
rsb->rsb_type = rsb_sort;
rsb->rsb_next = prior_rsb;
rsb->rsb_arg[0] = (RecordSource*) map;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb_sort));
return rsb;
}
static bool gen_sort_merge(thread_db* tdbb, OptimizerBlk* opt, RiverStack& org_rivers)
{
/**************************************
*
* g e n _ s o r t _ m e r g e
*
**************************************
*
* Functional description
* We've got a set of rivers that may or may not be amenable to
* a sort/merge join, and it's time to find out. If there are,
* build a sort/merge RecordSource, push it on the rsb stack, and update
* rivers accordingly. If two or more rivers were successfully
* joined, return true. If the whole things is a moby no-op,
* return false.
*
**************************************/
USHORT i;
ULONG selected_rivers[OPT_STREAM_BITS], selected_rivers2[OPT_STREAM_BITS];
jrd_nod **eq_class, **ptr;
DEV_BLKCHK(opt, type_opt);
SET_TDBB(tdbb);
Database* dbb = tdbb->tdbb_database;
// Count the number of "rivers" involved in the operation, then allocate
// a scratch block large enough to hold values to compute equality
// classes.
USHORT cnt = 0;
for (RiverStack::iterator stack1(org_rivers); stack1.hasData(); ++stack1) {
stack1.object()->riv_number = cnt++;
}
Firebird::HalfStaticArray<jrd_nod*, OPT_STATIC_ITEMS> scratch(*tdbb->getDefaultPool());
scratch.grow(opt->opt_base_conjuncts * cnt);
jrd_nod** classes = scratch.begin();
// Compute equivalence classes among streams. This involves finding groups
// of streams joined by field equalities.
jrd_nod** last_class = classes;
OptimizerBlk::opt_conjunct* tail = opt->opt_conjuncts.begin();
const OptimizerBlk::opt_conjunct* const end = tail + opt->opt_base_conjuncts;
for (; tail < end; tail++)
{
if (tail->opt_conjunct_flags & opt_conjunct_used) {
continue;
}
jrd_nod* node = tail->opt_conjunct_node;
if (node->nod_type != nod_eql) {
continue;
}
jrd_nod* node1 = node->nod_arg[0];
jrd_nod* node2 = node->nod_arg[1];
for (RiverStack::iterator stack0(org_rivers); stack0.hasData(); ++stack0) {
River* river1 = stack0.object();
if (!river_reference(river1, node1)) {
if (river_reference(river1, node2)) {
node = node1;
node1 = node2;
node2 = node;
}
else {
continue;
}
}
for (RiverStack::iterator stack2(stack0); (++stack2).hasData();)
{
River* river2 = stack2.object();
if (river_reference(river2, node2)) {
for (eq_class = classes; eq_class < last_class; eq_class += cnt)
{
if (node_equality(node1, classes[river1->riv_number])
|| node_equality(node2, classes[river2->riv_number]))
{
break;
}
}
eq_class[river1->riv_number] = node1;
eq_class[river2->riv_number] = node2;
if (eq_class == last_class) {
last_class += cnt;
}
}
}
}
}
/* Pick both a set of classes and a set of rivers on which to join with
sort merge. Obviously, if the set of classes is empty, return false
to indicate that nothing could be done. */
USHORT river_cnt = 0, stream_cnt = 0;
Firebird::HalfStaticArray<jrd_nod**, OPT_STATIC_ITEMS> selected_classes(*tdbb->getDefaultPool(), cnt);
for (eq_class = classes; eq_class < last_class; eq_class += cnt) {
i = river_count(cnt, eq_class);
if (i > river_cnt) {
river_cnt = i;
selected_classes.shrink(0);
selected_classes.add(eq_class);
class_mask(cnt, eq_class, selected_rivers);
}
else {
class_mask(cnt, eq_class, selected_rivers2);
for (i = 0; i < OPT_STREAM_BITS; i++) {
if ((selected_rivers[i] & selected_rivers2[i]) != selected_rivers[i]) {
break;
}
}
if (i == OPT_STREAM_BITS) {
selected_classes.add(eq_class);
}
}
}
if (!river_cnt)
return false;
// Build a sort stream.
RecordSource* merge_rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), river_cnt * 2) RecordSource();
merge_rsb->rsb_count = river_cnt;
merge_rsb->rsb_type = rsb_merge;
merge_rsb->rsb_impure =
CMP_impure(opt->opt_csb, (USHORT) (sizeof(struct irsb_mrg) +
river_cnt * sizeof(irsb_mrg::irsb_mrg_repeat)));
RecordSource** rsb_tail = merge_rsb->rsb_arg;
stream_cnt = 0;
for (RiverStack::iterator stack3(org_rivers); stack3.hasData(); ++stack3) {
River* river1 = stack3.object();
if (!(TEST_DEP_BIT(selected_rivers, river1->riv_number))) {
continue;
}
stream_cnt += river1->riv_count;
jrd_nod* sort = FB_NEW_RPT(*tdbb->getDefaultPool(), selected_classes.getCount() * 3) jrd_nod();
sort->nod_type = nod_sort;
sort->nod_count = selected_classes.getCount();
jrd_nod*** selected_class;
for (selected_class = selected_classes.begin(), ptr = sort->nod_arg;
selected_class < selected_classes.end(); selected_class++)
{
ptr[sort->nod_count] = (jrd_nod*) FALSE; // Ascending sort
ptr[sort->nod_count * 2] = (jrd_nod*) rse_nulls_default; // Default nulls placement
*ptr++ = (*selected_class)[river1->riv_number];
}
RecordSource* rsb =
gen_sort(tdbb, opt, &river1->riv_count, NULL, river1->riv_rsb, sort, false);
*rsb_tail++ = rsb;
*rsb_tail++ = (RecordSource*) sort;
}
// Finally, merge selected rivers into a single river, and rebuild
// original river stack.
River* river1 = FB_NEW_RPT(*tdbb->getDefaultPool(), stream_cnt) River();
river1->riv_count = (UCHAR) stream_cnt;
river1->riv_rsb = merge_rsb;
UCHAR* stream = river1->riv_streams;
RiverStack newRivers(org_rivers.getPool());
while (org_rivers.hasData()) {
River* river2 = org_rivers.pop();
if (TEST_DEP_BIT(selected_rivers, river2->riv_number)) {
MOVE_FAST(river2->riv_streams, stream, river2->riv_count);
stream += river2->riv_count;
}
else {
// AB: Be sure that the rivers 'order' will be kept.
if (newRivers.hasData()) {
River* river3 = newRivers.pop();
newRivers.push(river2);
newRivers.push(river3);
}
else {
newRivers.push(river2);
}
}
}
// AB: Moved LLS_PUSH() from before the while (*org_rivers) loop to here, because
// the merged rivers could be refering to other streams on the list.
newRivers.push(river1);
// Pick up any boolean that may apply.
{
USHORT flag_vector[MAX_STREAMS + 1], *fv;
UCHAR stream_nr;
// AB: Inactivate currently all streams from every river, because we
// need to know which nodes are computable between the rivers used
// for the merge.
for (stream_nr = 0, fv = flag_vector; stream_nr < opt->opt_csb->csb_n_stream; stream_nr++) {
*fv++ = opt->opt_csb->csb_rpt[stream_nr].csb_flags & csb_active;
opt->opt_csb->csb_rpt[stream_nr].csb_flags &= ~csb_active;
}
set_active(opt, river1);
jrd_nod* node = NULL;
for (tail = opt->opt_conjuncts.begin(); tail < end; tail++)
{
jrd_nod* node1 = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
&& computable(opt->opt_csb, node1, -1, false, false))
{
compose(&node, node1, nod_and);
tail->opt_conjunct_flags |= opt_conjunct_used;
}
}
if (node) {
river1->riv_rsb = gen_boolean(tdbb, opt, river1->riv_rsb, node);
}
set_inactive(opt, river1);
org_rivers.takeOwnership(newRivers);
for (stream_nr = 0, fv = flag_vector;
stream_nr < opt->opt_csb->csb_n_stream; stream_nr++)
{
opt->opt_csb->csb_rpt[stream_nr].csb_flags |= *fv++;
}
}
return true;
}
static RecordSource* gen_union(thread_db* tdbb,
OptimizerBlk* opt,
jrd_nod* union_node, UCHAR * streams, USHORT nstreams)
{
/**************************************
*
* g e n _ u n i o n
*
**************************************
*
* Functional description
* Generate a union complex.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(union_node, type_nod);
SET_TDBB(tdbb);
jrd_nod* clauses = union_node->nod_arg[e_uni_clauses];
const USHORT count = clauses->nod_count;
CompilerScratch* csb = opt->opt_csb;
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), count + nstreams + 1) RecordSource();
rsb->rsb_type = rsb_union;
rsb->rsb_count = count;
rsb->rsb_stream = (UCHAR)(IPTR) union_node->nod_arg[e_uni_stream];
rsb->rsb_format = csb->csb_rpt[rsb->rsb_stream].csb_format;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
RecordSource** rsb_ptr = rsb->rsb_arg;
jrd_nod** ptr = clauses->nod_arg;
for (const jrd_nod* const* const end = ptr + count; ptr < end;) {
*rsb_ptr++ = OPT_compile(tdbb, csb, (RecordSelExpr*) * ptr++, NULL);
*rsb_ptr++ = (RecordSource*) * ptr++;
}
/* Save the count and numbers of the streams that make up the union */
*rsb_ptr++ = (RecordSource*)(IPTR) nstreams;
while (nstreams--) {
*rsb_ptr++ = (RecordSource*)(IPTR) *streams++;
}
return rsb;
}
static void get_inactivities(const CompilerScratch* csb, ULONG* dependencies)
{
/**************************************
*
* g e t _ i n a c t i v i t i e s
*
**************************************
*
* Functional description
* Find any streams not explicitily active.
*
**************************************/
SLONG n;
DEV_BLKCHK(csb, type_csb);
for (n = 0; n < OPT_STREAM_BITS; n++)
dependencies[n] = (ULONG) - 1;
n = 0;
CompilerScratch::rpt_const_itr tail = csb->csb_rpt.begin();
for (const CompilerScratch::rpt_const_itr end = tail + csb->csb_n_stream;
tail < end; n++, tail++)
{
if (tail->csb_flags & csb_active)
CLEAR_DEP_BIT(dependencies, n);
}
}
static IndexedRelationship* indexed_relationship(thread_db* tdbb, OptimizerBlk* opt,
USHORT stream)
{
/**************************************
*
* i n d e x e d _ r e l a t i o n s h i p
*
**************************************
*
* Functional description
* See if two streams are related by an index.
* An indexed relationship is a means of joining two
* streams via an index, which is possible when a field from
* each of the streams is compared with a field from the other,
* and there is an index on one stream to retrieve the value
* of the other field.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
SET_TDBB(tdbb);
if (!opt->opt_base_conjuncts) {
return NULL;
}
CompilerScratch* csb = opt->opt_csb;
CompilerScratch::csb_repeat* csb_tail = &csb->csb_rpt[stream];
OptimizerBlk::opt_conjunct* opt_end =
opt->opt_conjuncts.begin() + opt->opt_base_conjuncts;
IndexedRelationship* relationship = NULL;
/* Loop thru indexes looking for a match */
index_desc* idx = csb_tail->csb_idx->items;
for (USHORT i = 0; i < csb_tail->csb_indices;
++i, ++idx)
{
/* skip this part if the index wasn't specified for indexed retrieval */
if (idx->idx_runtime_flags & idx_plan_dont_use) {
continue;
}
clear_bounds(opt, idx);
OptimizerBlk::opt_conjunct* tail;
for (tail = opt->opt_conjuncts.begin(); tail < opt_end; tail++)
{
jrd_nod* node = tail->opt_conjunct_node;
if (!(tail->opt_conjunct_flags & opt_conjunct_used)
&& computable(csb, node, -1, false, false))
{
// AB: Why only check for AND structures ?
// Added match_indices for support of "OR" with INNER JOINs */
// match_index(tdbb, opt, stream, node, idx);
match_indices(tdbb, opt, stream, node, idx);
// AB: Why should we look further?
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
break;
}
}
}
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
if (!relationship) {
relationship = FB_NEW(*tdbb->getDefaultPool()) IndexedRelationship();
}
if (idx->idx_flags & idx_unique) {
relationship->irl_unique = TRUE;
break;
}
}
}
return relationship;
}
static str* make_alias(thread_db* tdbb, CompilerScratch* csb,
CompilerScratch::csb_repeat* base_tail)
{
/**************************************
*
* m a k e _ a l i a s
*
**************************************
*
* Functional description
* Make an alias string suitable for printing
* as part of the plan. For views, this means
* multiple aliases to distinguish the base
* table.
*
**************************************/
DEV_BLKCHK(csb, type_csb);
SET_TDBB(tdbb);
if (!base_tail->csb_view && !base_tail->csb_alias)
return NULL;
const CompilerScratch::csb_repeat* csb_tail;
/* calculate the length of the alias by going up through
the view stack to find the lengths of all aliases;
adjust for spaces and a null terminator */
USHORT alias_length = 0;
for (csb_tail = base_tail;;
csb_tail = &csb->csb_rpt[csb_tail->csb_view_stream])
{
if (csb_tail->csb_alias)
alias_length += csb_tail->csb_alias->length();
else {
alias_length +=
(!(csb_tail->csb_relation) || !(csb_tail->csb_relation->rel_name))
? 0 : strlen(csb_tail->csb_relation->rel_name);
}
alias_length++;
if (!csb_tail->csb_view)
break;
}
/* allocate a string block to hold the concatenated alias */
str* alias = FB_NEW_RPT(*tdbb->getDefaultPool(), alias_length) str();
alias->str_length = alias_length - 1;
/* now concatenate the individual aliases into the string block,
beginning at the end and copying back to the beginning */
TEXT* p = (TEXT *) alias->str_data + alias->str_length;
*p-- = 0;
for (csb_tail = base_tail;;
csb_tail = &csb->csb_rpt[csb_tail->csb_view_stream])
{
const TEXT* q;
if (csb_tail->csb_alias)
q = (TEXT *) csb_tail->csb_alias->c_str();
else {
q = (!(csb_tail->csb_relation) || !(csb_tail->csb_relation->rel_name))
? NULL : csb_tail->csb_relation->rel_name;
}
/* go to the end of the alias and copy it backwards */
if (q) {
for (alias_length = 0; *q; alias_length++)
q++;
while (alias_length--)
*p-- = *--q;
}
if (!csb_tail->csb_view)
break;
*p-- = ' ';
}
return alias;
}
static jrd_nod* make_binary_node(NOD_T type, jrd_nod* arg1, jrd_nod* arg2, bool flag)
{
/**************************************
*
* m a k e _ b i n a r y _ n o d e
*
**************************************
*
* Functional description
* Make a binary node.
*
**************************************/
thread_db* tdbb = JRD_get_thread_data();
DEV_BLKCHK(arg1, type_nod);
DEV_BLKCHK(arg2, type_nod);
jrd_nod* node = PAR_make_node(tdbb, 2);
node->nod_type = type;
node->nod_arg[0] = arg1;
node->nod_arg[1] = arg2;
if (flag) {
node->nod_flags |= nod_comparison;
}
return node;
}
static RecordSource* make_cross(thread_db* tdbb, OptimizerBlk* opt, RiverStack& stack)
{
/**************************************
*
* m a k e _ c r o s s
*
**************************************
*
* Functional description
* Generate a cross block.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
SET_TDBB(tdbb);
const int count = stack.getCount();
if (count == 1) {
return stack.pop()->riv_rsb;
}
CompilerScratch* csb = opt->opt_csb;
RecordSource* rsb = FB_NEW_RPT(*tdbb->getDefaultPool(), count) RecordSource();
rsb->rsb_type = rsb_cross;
rsb->rsb_count = count;
rsb->rsb_impure = CMP_impure(csb, sizeof(struct irsb));
RecordSource** ptr = rsb->rsb_arg + count;
while (stack.hasData()) {
*--ptr = stack.pop()->riv_rsb;
}
return rsb;
}
static jrd_nod* make_index_node(thread_db* tdbb, jrd_rel* relation,
CompilerScratch* csb, index_desc* idx)
{
/**************************************
*
* m a k e _ i n d e x _ n o d e
*
**************************************
*
* Functional description
* Make an index node and an index retrieval block.
*
**************************************/
DEV_BLKCHK(relation, type_rel);
DEV_BLKCHK(csb, type_csb);
SET_TDBB(tdbb);
/* check whether this is during a compile or during
a SET INDEX operation */
if (csb)
CMP_post_resource(&csb->csb_resources,
relation, Resource::rsc_index,
idx->idx_id);
else
CMP_post_resource(&tdbb->tdbb_request->req_resources,
relation, Resource::rsc_index,
idx->idx_id);
jrd_nod* node = PAR_make_node(tdbb, e_idx_length);
node->nod_type = nod_index;
node->nod_count = 0;
IndexRetrieval* retrieval =
FB_NEW_RPT(*tdbb->getDefaultPool(), idx->idx_count * 2) IndexRetrieval();
node->nod_arg[e_idx_retrieval] = (jrd_nod*) retrieval;
retrieval->irb_index = idx->idx_id;
MOVE_FAST(idx, &retrieval->irb_desc, sizeof(retrieval->irb_desc));
if (csb)
node->nod_impure = CMP_impure(csb, sizeof(impure_inversion));
return node;
}
static jrd_nod* make_inference_node(CompilerScratch* csb, jrd_nod* boolean,
jrd_nod* arg1, jrd_nod* arg2)
{
/**************************************
*
* m a k e _ i n f e r e n c e _ n o d e
*
**************************************
*
* Defined
* 1996-Jan-15 David Schnepper
*
* Functional description
* From the predicate, boolean, and infer a new
* predicate using arg1 & arg2 as the first two
* parameters to the predicate.
*
* This is used when the engine knows A<B and A=C, and
* creates a new node to represent the infered knowledge C<B.
*
* Note that this may be sometimes incorrect with 3-value
* logic (per Chris Date's Object & Relations seminar).
* Later stages of query evaluation evaluate exactly
* the originally specified query, so 3-value issues are
* caught there. Making this inference might cause us to
* examine more records than needed, but would not result
* in incorrect results.
*
* Note that some nodes, specifically nod_like, have
* more than two parameters for a boolean operation.
* (nod_like has an optional 3rd parameter for the ESCAPE character
* option of SQL)
* Nod_sleuth also has an optional 3rd parameter (for the GDML
* matching ESCAPE character language). But nod_sleuth is
* (apparently) not considered during optimization.
*
*
**************************************/
thread_db* tdbb = JRD_get_thread_data();
DEV_BLKCHK(csb, type_csb);
DEV_BLKCHK(boolean, type_nod);
DEV_BLKCHK(arg1, type_nod);
DEV_BLKCHK(arg2, type_nod);
fb_assert(boolean->nod_count >= 2); /* must be a conjunction boolean */
/* Clone the input predicate */
jrd_nod* node = PAR_make_node(tdbb, boolean->nod_count);
node->nod_type = boolean->nod_type;
// We may safely copy invariantness flag because
// (1) we only distribute field equalities
// (2) invariantness of second argument of STARTING WITH or LIKE is solely
// determined by its dependency on any of the fields
// If provisions above change the line below will have to be modified
node->nod_flags = boolean->nod_flags;
/* But substitute new values for some of the predicate arguments */
node->nod_arg[0] = CMP_clone_node(tdbb, csb, arg1);
node->nod_arg[1] = CMP_clone_node(tdbb, csb, arg2);
/* Arguments after the first two are just cloned (eg: LIKE ESCAPE clause) */
for (USHORT n = 2; n < boolean->nod_count; n++)
node->nod_arg[n] = CMP_clone_node(tdbb, csb, boolean->nod_arg[n]);
// Share impure area for cached invariant value used to hold pre-compiled
// pattern for new LIKE and CONTAINING algorithms.
// Proper cloning of impure area for this node would require careful accounting
// of new invariant dependencies - we avoid such hassles via using single
// cached pattern value for all node clones. This is faster too.
if (node->nod_flags & nod_invariant)
node->nod_impure = boolean->nod_impure;
return node;
}
static jrd_nod* make_inversion(thread_db* tdbb, OptimizerBlk* opt,
jrd_nod* boolean, USHORT stream)
{
/**************************************
*
* m a k e _ i n v e r s i o n
*
**************************************
*
* Functional description
* Build an inversion for a boolean, if possible. Otherwise,
* return NULL. Make inversion is call initially from
* gen_retrieval to handle "or" nodes, but may be called
* recursively for almost anything.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(boolean, type_nod);
CompilerScratch::csb_repeat* csb_tail = &opt->opt_csb->csb_rpt[stream];
jrd_rel* relation = csb_tail->csb_relation;
if ((!relation) || (relation->rel_file)) {
return NULL;
}
// Handle the "OR" case up front
jrd_nod* inversion;
if (boolean->nod_type == nod_or)
{
inversion = make_inversion(tdbb, opt, boolean->nod_arg[0], stream);
if (!inversion)
{
return NULL;
}
jrd_nod* inversion2 = make_inversion(tdbb, opt, boolean->nod_arg[1], stream);
if (inversion2)
{
if ((inversion->nod_type == nod_index) &&
(inversion2->nod_type == nod_index) &&
(reinterpret_cast<IndexRetrieval*>(inversion->nod_arg[e_idx_retrieval])->irb_index ==
reinterpret_cast<IndexRetrieval*>(inversion2->nod_arg[e_idx_retrieval])->irb_index))
{
return compose(&inversion, inversion2, nod_bit_in);
}
else if ((inversion->nod_type == nod_bit_in) &&
(inversion2->nod_type == nod_index) &&
(reinterpret_cast<IndexRetrieval*>(inversion->nod_arg[1]->nod_arg[e_idx_retrieval])->irb_index ==
reinterpret_cast<IndexRetrieval*>(inversion2->nod_arg[e_idx_retrieval])->irb_index))
{
return compose(&inversion, inversion2, nod_bit_in);
}
else
{
return compose(&inversion, inversion2, nod_bit_or);
}
}
if (inversion->nod_type == nod_index) {
delete inversion->nod_arg[e_idx_retrieval];
}
delete inversion;
return NULL;
}
// Time to find inversions. For each index on the relation
// match all unused booleans against the index looking for upper
// and lower bounds that can be computed by the index. When
// all unused conjunctions are exhausted, see if there is enough
// information for an index retrieval. If so, build up and
// inversion component of the boolean.
// AB: If the boolean is a part of an earlier created index
// retrieval check with the compound_selectivity if it's
// really interresting to use.
inversion = NULL;
bool accept_starts = true;
bool accept_missing = true;
bool used_in_compound = false;
float compound_selectivity = 1; // Real maximum selectivity possible is 1.
// TMN: Shouldn't this be allocated from the tdbb->getDefaultPool() pool?
Firebird::HalfStaticArray<index_desc*, OPT_STATIC_ITEMS>
idx_walk_vector(*tdbb->getDefaultPool());
idx_walk_vector.grow(csb_tail->csb_indices);
index_desc** idx_walk = idx_walk_vector.begin();
Firebird::HalfStaticArray<UINT64, OPT_STATIC_ITEMS>
idx_priority_level_vector(*tdbb->getDefaultPool());
idx_priority_level_vector.grow(csb_tail->csb_indices);
UINT64* idx_priority_level = idx_priority_level_vector.begin();
index_desc* idx = csb_tail->csb_idx->items;
SSHORT i;
if (opt->opt_base_conjuncts) {
for (i = 0; i < csb_tail->csb_indices; i++) {
idx_walk[i] = idx;
idx_priority_level[i] = LOWEST_PRIORITY_LEVEL;
clear_bounds(opt, idx);
if (match_index(tdbb, opt, stream, boolean, idx) &&
!(idx->idx_runtime_flags & idx_plan_dont_use))
{
// Calculate the priority level of this index.
idx_priority_level[i] = calculate_priority_level(opt, idx);
}
// If the index was already used in an AND node check
// if this node is also present in this index
if (idx->idx_runtime_flags & idx_used_with_and) {
if ((match_index(tdbb, opt, stream, boolean, idx)) &&
(idx->idx_selectivity < compound_selectivity))
{
compound_selectivity = idx->idx_selectivity;
used_in_compound = true;
}
}
/* Because indices are already sort based on their selectivity
it's not needed to more then 1 index for a node */
if ((boolean->nod_type == nod_starts) && accept_starts) {
jrd_nod* node = make_starts(tdbb, opt, relation, boolean, stream, idx);
if (node) {
compose(&inversion, node, nod_bit_and);
accept_starts = false;
}
}
if ((boolean->nod_type == nod_missing) && accept_missing) {
jrd_nod* node = make_missing(tdbb, opt, relation, boolean, stream, idx);
if (node) {
compose(&inversion, node, nod_bit_and);
accept_missing = false;
}
}
++idx;
}
}
/* Sort indices based on the priority level into idx_walk */
const SSHORT idx_walk_count =
sort_indices_by_priority(csb_tail, idx_walk, idx_priority_level);
bool accept = true;
idx = csb_tail->csb_idx->items;
if (opt->opt_base_conjuncts) {
for (i = 0; i < idx_walk_count; i++) {
idx = idx_walk[i];
if (idx->idx_runtime_flags & idx_plan_dont_use) {
continue;
}
clear_bounds(opt, idx);
if (((accept || used_in_compound) &&
(idx->idx_selectivity < compound_selectivity * OR_SELECTIVITY_THRESHOLD_FACTOR)) ||
(csb_tail->csb_plan))
{
match_index(tdbb, opt, stream, boolean, idx);
if (opt->opt_segments[0].opt_lower || opt->opt_segments[0].opt_upper) {
compose(&inversion, OPT_make_index(tdbb, opt, relation, idx),
nod_bit_and);
accept = false;
}
}
}
}
if (!inversion) {
inversion = OPT_make_dbkey(opt, boolean, stream);
}
return inversion;
}
static jrd_nod* make_missing(thread_db* tdbb,
OptimizerBlk* opt,
jrd_rel* relation, jrd_nod* boolean, USHORT stream, index_desc* idx)
{
/**************************************
*
* m a k e _ m i s s i n g
*
**************************************
*
* Functional description
* If the a given boolean is an index optimizable, build and
* return a inversion type node. Indexes built before minor
* version 3 (V3.2) have unreliable representations for missing
* character string fields, so they won't be used.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->tdbb_database;
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(relation, type_rel);
DEV_BLKCHK(boolean, type_nod);
jrd_nod* field = boolean->nod_arg[0];
#ifdef EXPRESSION_INDICES
if (idx->idx_flags & idx_expressn)
{
fb_assert(idx->idx_expression != NULL);
if (!expression_equal(tdbb, opt, idx, field, stream))
{
return NULL;
}
}
else
{
#endif
if (field->nod_type != nod_field)
{
return NULL;
}
if ((USHORT)(IPTR) field->nod_arg[e_fld_stream] != stream ||
(USHORT)(IPTR) field->nod_arg[e_fld_id] != idx->idx_rpt[0].idx_field)
{
return NULL;
}
#ifdef EXPRESSION_INDICES
}
#endif
jrd_nod* node = make_index_node(tdbb, relation, opt->opt_csb, idx);
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
retrieval->irb_relation = relation;
if ((dbb->dbb_ods_version < ODS_VERSION11) || (idx->idx_flags & idx_descending)) {
// AB: irb_starting? Why?
// Commenting myself. Because we don't know exact length for the field.
// For ascending NULLs in ODS 11 and higher this doesn't matter, because
// a NULL is always stored as a key with length 0 (zero).
retrieval->irb_generic = irb_starting;
}
retrieval->irb_lower_count = retrieval->irb_upper_count = 1;
// If we are matching less than the full index, this is a partial match
if (retrieval->irb_upper_count < idx->idx_count) {
retrieval->irb_generic |= irb_partial;
}
// Set descending flag on retrieval if index is descending
if (idx->idx_flags & idx_descending) {
retrieval->irb_generic |= irb_descending;
}
jrd_nod* value = PAR_make_node(tdbb, 0);
retrieval->irb_value[0] = retrieval->irb_value[idx->idx_count] = value;
value->nod_type = nod_null;
idx->idx_runtime_flags |= idx_plan_missing;
return node;
}
static jrd_nod* make_starts(thread_db* tdbb,
OptimizerBlk* opt,
jrd_rel* relation, jrd_nod* boolean, USHORT stream, index_desc* idx)
{
/**************************************
*
* m a k e _ s t a r t s
*
**************************************
*
* Functional description
* If the given boolean is an index optimizable, build and
* return a inversion type node.
*
**************************************/
SET_TDBB(tdbb);
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(relation, type_rel);
DEV_BLKCHK(boolean, type_nod);
if (boolean->nod_type != nod_starts)
return NULL;
jrd_nod* field = boolean->nod_arg[0];
jrd_nod* value = boolean->nod_arg[1];
#ifdef EXPRESSION_INDICES
if (idx->idx_flags & idx_expressn)
{
fb_assert(idx->idx_expression != NULL);
if (!(expression_equal(tdbb, opt, idx, field, stream) &&
computable(opt->opt_csb, value, stream, true, false)))
{
if (expression_equal(tdbb, opt, idx, value, stream) &&
computable(opt->opt_csb, field, stream, true, false))
{
field = value;
value = boolean->nod_arg[0];
}
else
{
return NULL;
}
}
}
else
#endif
{
if (field->nod_type != nod_field)
{
// dimitr: any idea how we can use an index in this case?
// The code below produced wrong results.
return NULL;
/*
if (value->nod_type != nod_field)
return NULL;
field = value;
value = boolean->nod_arg[0];
*/
}
/* Every string starts with an empty string so
don't bother using an index in that case. */
if (value->nod_type == nod_literal)
{
const dsc* literal_desc = &((Literal*) value)->lit_desc;
if ((literal_desc->dsc_dtype == dtype_text &&
literal_desc->dsc_length == 0) ||
(literal_desc->dsc_dtype == dtype_varying &&
literal_desc->dsc_length == sizeof(USHORT)))
{
return NULL;
}
}
if ((USHORT)(IPTR) field->nod_arg[e_fld_stream] != stream ||
(USHORT)(IPTR) field->nod_arg[e_fld_id] != idx->idx_rpt[0].idx_field
|| !(idx->idx_rpt[0].idx_itype == idx_string
|| idx->idx_rpt[0].idx_itype == idx_byte_array
|| idx->idx_rpt[0].idx_itype == idx_metadata
|| idx->idx_rpt[0].idx_itype >= idx_first_intl_string)
|| !computable(opt->opt_csb, value, stream, false, false))
{
return NULL;
}
}
jrd_nod* node = make_index_node(tdbb, relation, opt->opt_csb, idx);
IndexRetrieval* retrieval = (IndexRetrieval*) node->nod_arg[e_idx_retrieval];
retrieval->irb_relation = relation;
retrieval->irb_generic = irb_starting;
// STARTING WITH can never include NULL values, thus ignore
// them already at index scan
retrieval->irb_generic |= irb_ignore_null_value_key;
retrieval->irb_lower_count = retrieval->irb_upper_count = 1;
// If we are matching less than the full index, this is a partial match
if (retrieval->irb_upper_count < idx->idx_count) {
retrieval->irb_generic |= irb_partial;
}
// Set descending flag on retrieval if index is descending
if (idx->idx_flags & idx_descending) {
retrieval->irb_generic |= irb_descending;
}
retrieval->irb_value[0] = retrieval->irb_value[idx->idx_count] = value;
idx->idx_runtime_flags |= idx_plan_starts;
return node;
}
static bool map_equal(const jrd_nod* field1, const jrd_nod* field2, const jrd_nod* map)
{
/**************************************
*
* m a p _ e q u a l
*
**************************************
*
* Functional description
* Test to see if two fields are equal, where the fields
* are in two different streams possibly mapped to each other.
* Order of the input fields is important.
*
**************************************/
DEV_BLKCHK(field1, type_nod);
DEV_BLKCHK(field2, type_nod);
DEV_BLKCHK(map, type_nod);
if (field1->nod_type != nod_field) {
return false;
}
if (field2->nod_type != nod_field) {
return false;
}
// look through the mapping and see if we can find an equivalence.
const jrd_nod* const* map_ptr = map->nod_arg;
for (const jrd_nod* const* const map_end = map_ptr + map->nod_count;
map_ptr < map_end; map_ptr++)
{
const jrd_nod* map_from = (*map_ptr)->nod_arg[e_asgn_from];
const jrd_nod* map_to = (*map_ptr)->nod_arg[e_asgn_to];
if (map_from->nod_type != nod_field || map_to->nod_type != nod_field) {
continue;
}
if (field1->nod_arg[e_fld_stream] != map_from->nod_arg[e_fld_stream]
|| field1->nod_arg[e_fld_id] != map_from->nod_arg[e_fld_id])
{
continue;
}
if (field2->nod_arg[e_fld_stream] != map_to->nod_arg[e_fld_stream]
|| field2->nod_arg[e_fld_id] != map_to->nod_arg[e_fld_id])
{
continue;
}
return true;
}
return false;
}
static void mark_indices(CompilerScratch::csb_repeat* csb_tail, SSHORT relation_id)
{
/**************************************
*
* m a r k _ i n d i c e s
*
**************************************
*
* Functional description
* Mark indices that were not included
* in the user-specified access plan.
*
**************************************/
const jrd_nod* plan = csb_tail->csb_plan;
if (!plan)
return;
if (plan->nod_type != nod_retrieve)
return;
/* find out how many indices were specified; if
there were none, this is a sequential retrieval */
USHORT plan_count = 0;
const jrd_nod* access_type = plan->nod_arg[e_retrieve_access_type];
if (access_type)
plan_count = access_type->nod_count;
/* go through each of the indices and mark it unusable
for indexed retrieval unless it was specifically mentioned
in the plan; also mark indices for navigational access */
index_desc* idx = csb_tail->csb_idx->items;
for (USHORT i = 0; i < csb_tail->csb_indices; i++) {
if (access_type) {
const jrd_nod* const* arg = access_type->nod_arg;
const jrd_nod* const* const end = arg + plan_count;
for (; arg < end; arg += 3) {
if (relation_id != (SSHORT)(IPTR) * arg) {
/* index %s cannot be used in the specified plan */
ERR_post(isc_index_unused, isc_arg_string, *(arg + 2), 0);
}
if (idx->idx_id == (USHORT)(IPTR) * (arg + 1)) {
if (access_type->nod_type == nod_navigational &&
arg == access_type->nod_arg)
{
// dimitr: navigational access can use only one index,
// hence the extra check added (see the line above)
idx->idx_runtime_flags |= idx_plan_navigate;
}
else { // nod_indices
break;
}
}
}
if (arg == end)
idx->idx_runtime_flags |= idx_plan_dont_use;
}
else {
idx->idx_runtime_flags |= idx_plan_dont_use;
}
++idx;
}
}
static SSHORT match_index(thread_db* tdbb,
OptimizerBlk* opt,
SSHORT stream, jrd_nod* boolean,
index_desc* idx)
{
/**************************************
*
* m a t c h _ i n d e x
*
**************************************
*
* Functional description
* Match a boolean against an index location lower and upper
* bounds. Return the number of relational nodes that were
* matched. In ODS versions prior to 7, descending indexes
* were not reliable and will not be used.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(boolean, type_nod);
SET_TDBB(tdbb);
if (boolean->nod_type == nod_and)
{
return match_index(tdbb, opt, stream, boolean->nod_arg[0], idx) +
match_index(tdbb, opt, stream, boolean->nod_arg[1], idx);
}
bool forward = true;
jrd_nod* match = boolean->nod_arg[0];
jrd_nod* value = (boolean->nod_count < 2) ? NULL : boolean->nod_arg[1];
#ifdef EXPRESSION_INDICES
if (idx->idx_flags & idx_expressn)
{
// see if one side or the other is matchable to the index expression
fb_assert(idx->idx_expression != NULL);
if (!expression_equal(tdbb, opt, idx, match, stream) ||
(value && !computable(opt->opt_csb, value, stream, true, false)))
{
if (value &&
expression_equal(tdbb, opt, idx, value, stream) &&
computable(opt->opt_csb, match, stream, true, false))
{
match = boolean->nod_arg[1];
value = boolean->nod_arg[0];
}
else
return 0;
}
}
else {
#endif
// If left side is not a field, swap sides.
// If left side is still not a field, give up
if (match->nod_type != nod_field ||
(USHORT)(IPTR) match->nod_arg[e_fld_stream] != stream ||
(value && !computable(opt->opt_csb, value, stream, true, false)))
{
match = value;
value = boolean->nod_arg[0];
if (!match ||
match->nod_type != nod_field ||
(USHORT)(IPTR) match->nod_arg[e_fld_stream] != stream ||
!computable(opt->opt_csb, value, stream, true, false))
{
return 0;
}
forward = false;
}
#ifdef EXPRESSION_INDICES
}
#endif
/* match the field to an index, if possible, and save the value to be matched
as either the lower or upper bound for retrieval, or both */
SSHORT count = 0;
SSHORT i = 0;
for (OptimizerBlk::opt_segment* ptr = opt->opt_segments; i < idx->idx_count;
i++, ptr++)
{
if (
#ifdef EXPRESSION_INDICES
(idx->idx_flags & idx_expressn) ||
#endif
(USHORT)(IPTR) match->nod_arg[e_fld_id] == idx->idx_rpt[i].idx_field)
{
++count;
/* AB: If we have already an exact match don't
override it with worser matches, but increment the
count so that the node will be marked as matched! */
if (ptr->opt_match && ptr->opt_match->nod_type == nod_eql) {
break;
}
switch (boolean->nod_type) {
case nod_between:
if (!forward ||
!computable(opt->opt_csb,
boolean->nod_arg[2],
stream,
true,
false))
{
return 0;
}
ptr->opt_lower = value;
ptr->opt_upper = boolean->nod_arg[2];
ptr->opt_match = boolean;
break;
case nod_equiv:
case nod_eql:
ptr->opt_lower = ptr->opt_upper = value;
ptr->opt_match = boolean;
break;
case nod_gtr:
case nod_geq:
if (forward) {
ptr->opt_lower = value;
}
else {
ptr->opt_upper = value;
}
ptr->opt_match = boolean;
break;
case nod_lss:
case nod_leq:
if (forward) {
ptr->opt_upper = value;
}
else {
ptr->opt_lower = value;
}
ptr->opt_match = boolean;
break;
default: /* Shut up compiler warnings */
break;
}
}
}
return count;
}
static bool match_indices(thread_db* tdbb,
OptimizerBlk* opt,
SSHORT stream, jrd_nod* boolean,
index_desc* idx)
{
/**************************************
*
* m a t c h _ i n d i c e s
*
**************************************
*
* Functional description
* Match a boolean against an index location lower and upper
* bounds. Return the number of relational nodes that were
* matched. In ODS versions prior to 7, descending indexes
* were not reliable and will not be used.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(boolean, type_nod);
SET_TDBB(tdbb);
if (boolean->nod_count < 2) {
return false;
}
if (boolean->nod_type == nod_or) {
if (match_indices(tdbb, opt, stream, boolean->nod_arg[0], idx) &&
match_indices(tdbb, opt, stream, boolean->nod_arg[1], idx))
{
opt->opt_segments[0].opt_match = NULL;
return true;
}
}
else {
if (match_index(tdbb, opt, stream, boolean, idx)) {
opt->opt_segments[0].opt_match = NULL;
return true;
}
}
opt->opt_segments[0].opt_match = NULL;
opt->opt_segments[0].opt_upper = NULL;
opt->opt_segments[0].opt_lower = NULL;
return false;
}
static USHORT nav_rsb_size(RecordSource* rsb, USHORT key_length, USHORT size)
{
/**************************************
*
* n a v _ r s b _ s i z e
*
**************************************
*
* Functional description
* Calculate the size of a navigational rsb.
*
**************************************/
DEV_BLKCHK(rsb, type_rsb);
#ifdef SCROLLABLE_CURSORS
/* allocate extra impure area to hold the current key,
plus an upper and lower bound key value, for a total
of three times the key length for the index */
size += sizeof(struct irsb_nav) + 3 * key_length;
#else
size += sizeof(struct irsb_nav) + 2 * key_length;
#endif
size = FB_ALIGN(size, ALIGNMENT);
/* make room for an idx structure to describe the index
that was used to generate this rsb */
if (rsb->rsb_type == rsb_navigate)
rsb->rsb_arg[RSB_NAV_idx_offset] = (RecordSource*) (IPTR) size;
size += sizeof(index_desc);
return size;
}
static bool node_equality(const jrd_nod* node1, const jrd_nod* node2)
{
/**************************************
*
* n o d e _ e q u a l i t y
*
**************************************
*
* Functional description
* Test two field node pointers for symbolic equality.
*
**************************************/
DEV_BLKCHK(node1, type_nod);
DEV_BLKCHK(node2, type_nod);
if (!node1 || !node2) {
return false;
}
if (node1->nod_type != node2->nod_type) {
return false;
}
if (node1 == node2) {
return true;
}
switch (node1->nod_type) {
case nod_field:
return (node1->nod_arg[e_fld_stream] == node2->nod_arg[e_fld_stream]
&& node1->nod_arg[e_fld_id] == node2->nod_arg[e_fld_id]);
case nod_equiv:
case nod_eql:
if (node_equality(node1->nod_arg[0], node2->nod_arg[0])
&& node_equality(node1->nod_arg[1], node2->nod_arg[1]))
{
return true;
}
if (node_equality(node1->nod_arg[0], node2->nod_arg[1])
&& node_equality(node1->nod_arg[1], node2->nod_arg[0]))
{
return true;
}
return false;
case nod_gtr:
case nod_geq:
case nod_leq:
case nod_lss:
case nod_matches:
case nod_contains:
case nod_like:
default:
break;
}
return false;
}
static jrd_nod* optimize_like(thread_db* tdbb, jrd_nod* like_node)
{
/**************************************
*
* o p t i m i z e _ l i k e
*
**************************************
*
* Functional description
* Optimize a LIKE expression, if possible,
* into a "starting with" AND a "like". This
* will allow us to use the index for the
* starting with, and the LIKE can just tag
* aSLONG for the ride.
* But on the ride it does useful work, consider
* match LIKE "ab%c". This is optimized by adding
* AND starting_with "ab", but the LIKE clause is
* still needed.
*
**************************************/
UCHAR tmp_buffer[32]; /* large enough to hold 1 ch of escape string */
SET_TDBB(tdbb);
DEV_BLKCHK(like_node, type_nod);
jrd_nod* search_node = like_node->nod_arg[1];
jrd_nod* escape_node = (like_node->nod_count > 2) ? like_node->nod_arg[2] : NULL;
/* if the matching string or the escape string can't
be evaluated at compile time, forget it */
if ((search_node->nod_type != nod_literal) ||
(escape_node && escape_node->nod_type != nod_literal))
{
return NULL;
}
dsc* search_desc = &((Literal*) search_node)->lit_desc;
dsc* escape_desc = 0;
if (escape_node)
escape_desc = &((Literal*) escape_node)->lit_desc;
/* if either is not a character expression, forget it */
if ((search_desc->dsc_dtype > dtype_any_text) ||
(escape_node && escape_desc->dsc_dtype > dtype_any_text))
{
return NULL;
}
/* Get the escape character, if any */
TextType text_obj = NULL;
USHORT escape_ch = 0;
if (escape_node)
{
/* Ensure escape string is same character set as search string
* Error report on Overflow is OK, as sql only allows a single
* character escape string */
const char* p2;
USHORT p_count =
MOV_make_string(escape_desc, INTL_TTYPE(search_desc), &p2,
reinterpret_cast<vary*>(tmp_buffer),
sizeof(tmp_buffer));
const UCHAR* p = reinterpret_cast<const UCHAR*>(p2);
/* Now get first character from escape string */
escape_ch =
INTL_getch(tdbb, &text_obj,
INTL_TTYPE(search_desc), &p, &p_count);
}
// If the first character is a wildcard char, forget it.
// CVC: Beware, if INTL doesn't understand the next character, p_count is zero.
// No check is done. We must handle this failure.
const UCHAR* p = search_desc->dsc_address;
USHORT p_count = search_desc->dsc_length;
USHORT ch =
INTL_getch(tdbb, &text_obj,
INTL_TTYPE(search_desc), &p, &p_count);
if ((!escape_node || ch != escape_ch)
&& (ch == SQL_MATCH_1_CHAR || ch == SQL_MATCH_ANY_CHARS))
{
return NULL;
}
// allocate a literal node to store the starting with string;
// assume it will be shorter than the search string
// CVC: This assumption may not be true if we use "value like field".
const SSHORT count = lit_delta +
(search_desc->dsc_length + sizeof(jrd_nod*) - 1) / sizeof(jrd_nod*);
jrd_nod* node = PAR_make_node(tdbb, count);
node->nod_type = nod_literal;
node->nod_count = 0;
Literal* literal = (Literal*) node;
literal->lit_desc = *search_desc;
UCHAR* q = reinterpret_cast<UCHAR*>(literal->lit_data);
literal->lit_desc.dsc_address = q;
/* copy the string into the starting with literal, up to the first wildcard character */
p_count = search_desc->dsc_length;
p = search_desc->dsc_address;
for (const UCHAR* const end = p + search_desc->dsc_length; p < end;)
{
// if there are escape characters, skip past them and
// don't treat the next char as a wildcard
// CVC: Beware, if INTL doesn't understand the next character, p_count is zero. No check is done.
// Same than above, but worse, since it will enter an infinite loop. Example: Spanish <20> against unicode.
// Reported also on Portuguese characters that aren't ASCII < 128.
const UCHAR* p_start = p;
ch =
INTL_getch(tdbb, &text_obj,
INTL_TTYPE(search_desc), &p, &p_count);
if (escape_node && (ch == escape_ch))
{
/* Check for Escape character at end of string */
if (!(p < end))
break;
p_start = p;
ch =
INTL_getch(tdbb, &text_obj,
INTL_TTYPE(search_desc), &p, &p_count);
}
else if (ch == SQL_MATCH_1_CHAR || ch == SQL_MATCH_ANY_CHARS)
{
break;
}
/* copy the bytes of the character */
while (p_start < p) {
*q++ = *p_start++;
}
}
literal->lit_desc.dsc_length = q - literal->lit_desc.dsc_address;
return node;
}
#ifdef OPT_DEBUG
static void print_order(OptimizerBlk* opt,
USHORT position, double cardinality, double cost)
{
/**************************************
*
* p r i n t _ o r d e r
*
**************************************
*
* Functional description
*
**************************************/
DEV_BLKCHK(opt, type_opt);
fprintf(opt_debug_file, "print_order() -- position %2.2d: ", position);
const OptimizerBlk::opt_stream* tail = opt->opt_streams.begin();
for (const OptimizerBlk::opt_stream* const order_end = opt->opt_streams.begin() + position;
tail < order_end; tail++)
{
fprintf(opt_debug_file, "stream %2.2d, ", tail->opt_stream_number);
}
fprintf(opt_debug_file, "\n\t\t\tcardinality: %g\tcost: %g\n",
cardinality, cost);
}
#endif
static USHORT river_count(USHORT count, jrd_nod** eq_class)
{
/**************************************
*
* r i v e r _ c o u n t
*
**************************************
*
* Functional description
* Given an sort/merge join equivalence class (vector of node pointers
* of representative values for rivers), return the count of rivers
* with values.
*
**************************************/
#ifdef DEV_BUILD
if (*eq_class) {
DEV_BLKCHK(*eq_class, type_nod);
}
#endif
USHORT cnt = 0;
for (USHORT i = 0; i < count; i++, eq_class++)
if (*eq_class) {
cnt++;
DEV_BLKCHK(*eq_class, type_nod);
}
return cnt;
}
static bool river_reference(const River* river, const jrd_nod* node, bool* field_found)
{
/**************************************
*
* r i v e r _ r e f e r e n c e
*
**************************************
*
* Functional description
* See if a value node is a reference to a given river.
* AB: Handle also expressions (F1 + F2 * 3, etc..)
* The expression is checked if all fields that are
* buried inside are pointing to the the given river.
* If a passed field isn't referenced by the river then
* we have an expression with 2 fields pointing to
* different rivers and then the result is always false.
* NOTE! The first time this function is called
* field_found should be NULL.
*
**************************************/
DEV_BLKCHK(river, type_riv);
DEV_BLKCHK(node, type_nod);
bool lfield_found = false;
bool root_caller = false;
// If no boolean parameter is given then this is the first call
// to this function and we use the local boolean to pass to
// itselfs. The boolean is used to see if any field has passed
// that references to the river.
if (!field_found) {
root_caller = true;
field_found = &lfield_found;
}
switch (node->nod_type) {
case nod_field :
{
// Check if field references to the river.
const UCHAR* streams = river->riv_streams;
for (const UCHAR* const end = streams + river->riv_count;
streams < end; streams++)
{
if ((USHORT)(IPTR) node->nod_arg[e_fld_stream] == *streams) {
*field_found = true;
return true;
}
}
return false;
}
default :
{
const jrd_nod* const* ptr = node->nod_arg;
// Check all sub-nodes of this node.
for (const jrd_nod* const* const end = ptr + node->nod_count;
ptr < end; ptr++)
{
if (!river_reference(river, *ptr, field_found)) {
return false;
}
}
// if this was the first call then field_found tells
// us if any field (referenced by river) was found.
if (root_caller) {
return *field_found;
}
else {
return true;
}
}
}
/*
// AB: Original code FB1.0 , just left as reference for a while
UCHAR *streams, *end;
DEV_BLKCHK(river, type_riv);
DEV_BLKCHK(node, type_nod);
if (node->nod_type != nod_field)
return false;
for (streams = river->riv_streams, end =
streams + river->riv_count; streams < end; streams++)
if ((USHORT) node->nod_arg[e_fld_stream] == *streams)
return true;
return false;
*/
return false;
}
static bool search_stack(const jrd_nod* node, const NodeStack& stack)
{
/**************************************
*
* s e a r c h _ s t a c k
*
**************************************
*
* Functional description
* Search a stack for the presence of a particular value.
*
**************************************/
DEV_BLKCHK(node, type_nod);
for (NodeStack::const_iterator iter(stack); iter.hasData(); ++iter) {
if (node_equality(node, iter.object())) {
return true;
}
}
return false;
}
static void set_active(OptimizerBlk* opt, const River* river)
{
/**************************************
*
* s e t _ a c t i v e
*
**************************************
*
* Functional description
* Set a group of streams active.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(river, type_riv);
CompilerScratch* csb = opt->opt_csb;
const UCHAR* streams = river->riv_streams;
for (const UCHAR* const end = streams + river->riv_count; streams < end;
streams++)
{
csb->csb_rpt[*streams].csb_flags |= csb_active;
}
}
static void set_direction(const jrd_nod* from_clause, jrd_nod* to_clause)
{
/**************************************
*
* s e t _ d i r e c t i o n
*
**************************************
*
* Functional description
* Update the direction of a GROUP BY, DISTINCT, or ORDER BY
* clause to the same direction as another clause.
*
**************************************/
DEV_BLKCHK(from_clause, type_nod);
DEV_BLKCHK(to_clause, type_nod);
/* all three clauses are allocated with thrice the number of arguments to
leave room at the end for an ascending/descending and nulls placement flags,
one for each field */
jrd_nod* const* from_ptr = from_clause->nod_arg + from_clause->nod_count;
jrd_nod** to_ptr = to_clause->nod_arg + to_clause->nod_count;
for (const jrd_nod* const* const end = from_ptr + from_clause->nod_count * 2;
from_ptr < end; from_ptr++)
{
*to_ptr++ = *from_ptr;
}
}
static void set_inactive(OptimizerBlk* opt, const River* river)
{
/**************************************
*
* s e t _ i n a c t i v e
*
**************************************
*
* Functional description
* Set a group of streams inactive.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(river, type_riv);
CompilerScratch* csb = opt->opt_csb;
const UCHAR* streams = river->riv_streams;
for (const UCHAR* const end = streams + river->riv_count; streams < end;
streams++)
{
csb->csb_rpt[*streams].csb_flags &= ~csb_active;
}
}
static void set_made_river(OptimizerBlk* opt, const River* river)
{
/**************************************
*
* s e t _ m a d e _ r i v e r
*
**************************************
*
* Functional description
* Mark all the streams in a river with the csb_made_river flag.
*
* A stream with this flag set, incicates that this stream has
* already been made into a river. Currently, this flag is used
* in computable() to decide if we can use the an index to
* optimise retrieving the streams involved in the conjunct.
*
* We can use an index in retrieving the streams involved in a
* conjunct if both of the streams are currently active or have
* been processed (and made into rivers) before.
*
**************************************/
DEV_BLKCHK(opt, type_opt);
DEV_BLKCHK(river, type_riv);
CompilerScratch* csb = opt->opt_csb;
const UCHAR* streams = river->riv_streams;
for (const UCHAR* const end = streams + river->riv_count; streams < end;
streams++)
{
csb->csb_rpt[*streams].csb_flags |= csb_made_river;
}
}
static void set_position(const jrd_nod* from_clause, jrd_nod* to_clause,
const jrd_nod* map)
{
/**************************************
*
* s e t _ p o s i t i o n
*
**************************************
*
* Functional description
* Update the fields in a GROUP BY, DISTINCT, or ORDER BY
* clause to the same position as another clause, possibly
* using a mapping between the streams.
*
**************************************/
DEV_BLKCHK(from_clause, type_nod);
DEV_BLKCHK(to_clause, type_nod);
DEV_BLKCHK(map, type_nod);
/* Track the position in the from list with "to_swap", and find the corresponding
field in the from list with "to_ptr", then swap the two fields. By the time
we get to the end of the from list, all fields in the to list will be reordered. */
jrd_nod** to_swap = to_clause->nod_arg;
const jrd_nod* const* from_ptr = from_clause->nod_arg;
for (const jrd_nod* const* const from_end =
from_ptr + from_clause->nod_count; from_ptr < from_end; from_ptr++)
{
jrd_nod** to_ptr = to_clause->nod_arg;
for (const jrd_nod* const* const to_end =
to_ptr + from_clause->nod_count; to_ptr < to_end; to_ptr++)
{
if ((map && map_equal(*to_ptr, *from_ptr, map))
|| (!map
&& (*from_ptr)->nod_arg[e_fld_stream] ==
(*to_ptr)->nod_arg[e_fld_stream]
&& (*from_ptr)->nod_arg[e_fld_id] ==
(*to_ptr)->nod_arg[e_fld_id]))
{
jrd_nod* swap = *to_swap;
*to_swap = *to_ptr;
*to_ptr = swap;
}
}
to_swap++;
}
}
static void set_rse_inactive(CompilerScratch* csb, const RecordSelExpr* rse)
{
/***************************************************
*
* s e t _ r s e _ i n a c t i v e
*
***************************************************
*
* Functional Description:
* Set all the streams involved in an RecordSelExpr as inactive. Do it recursively.
*
***************************************************/
const jrd_nod* const* ptr = rse->rse_relation;
for (const jrd_nod* const* const end = ptr + rse->rse_count;
ptr < end; ptr++)
{
const jrd_nod* node = *ptr;
if (node->nod_type != nod_rse) {
const SSHORT stream = (USHORT)(IPTR) node->nod_arg[STREAM_INDEX(node)];
csb->csb_rpt[stream].csb_flags &= ~csb_active;
}
else
set_rse_inactive(csb, (const RecordSelExpr*) node);
}
}
static void sort_indices_by_selectivity(CompilerScratch::csb_repeat* csb_tail)
{
/***************************************************
*
* s o r t _ i n d i c e s _ b y _ s e l e c t i v i t y
*
***************************************************
*
* Functional Description:
* Sort indices based on there selectivity.
* Lowest selectivy as first, highest as last.
*
***************************************************/
if (csb_tail->csb_plan) {
return;
}
index_desc* selected_idx = NULL;
USHORT i, j;
Firebird::Array<index_desc> idx_sort(*JRD_get_thread_data()->getDefaultPool(), csb_tail->csb_indices);
bool same_selectivity = false;
// Walk through the indices and sort them into into idx_sort
// where idx_sort[0] contains the lowest selectivity (best) and
// idx_sort[csb_tail->csb_indices - 1] the highest (worst)
if (csb_tail->csb_idx && (csb_tail->csb_indices > 1)) {
for (j = 0; j < csb_tail->csb_indices; j++) {
float selectivity = 1; // Maximum selectivity is 1 (when all keys are the same)
index_desc* idx = csb_tail->csb_idx->items;
for (i = 0; i < csb_tail->csb_indices; i++) {
// Prefer ASC indices in the case of almost the same selectivities
if (selectivity > idx->idx_selectivity) {
same_selectivity = ((selectivity - idx->idx_selectivity) <= 0.00001);
}
else {
same_selectivity = ((idx->idx_selectivity - selectivity) <= 0.00001);
}
if (!(idx->idx_runtime_flags & idx_marker) &&
(idx->idx_selectivity <= selectivity) &&
!((idx->idx_flags & idx_descending) && same_selectivity))
{
selectivity = idx->idx_selectivity;
selected_idx = idx;
}
++idx;
}
// If no index was found than pick the first one available out of the list
if ((!selected_idx) || (selected_idx->idx_runtime_flags & idx_marker))
{
idx = csb_tail->csb_idx->items;
for (i = 0; i < csb_tail->csb_indices; i++) {
if (!(idx->idx_runtime_flags & idx_marker)) {
selected_idx = idx;
break;
}
++idx;
}
}
selected_idx->idx_runtime_flags |= idx_marker;
idx_sort.add(*selected_idx);
}
// Finally store the right order in cbs_tail->csb_idx
index_desc* idx = csb_tail->csb_idx->items;
for (j = 0; j < csb_tail->csb_indices; j++) {
idx->idx_runtime_flags &= ~idx_marker;
MOVE_FAST(&idx_sort[j], idx, sizeof(index_desc));
++idx;
}
}
}
static SSHORT sort_indices_by_priority(CompilerScratch::csb_repeat* csb_tail,
index_desc** idx_walk,
UINT64* idx_priority_level)
{
/***************************************************
*
* s o r t _ i n d i c e s _ b y _ p r i o r i t y
*
***************************************************
*
* Functional Description:
* Sort indices based on the priority level.
*
***************************************************/
Firebird::HalfStaticArray<index_desc*, OPT_STATIC_ITEMS> idx_csb(*JRD_get_thread_data()->getDefaultPool());
idx_csb.grow(csb_tail->csb_indices);
memcpy(idx_csb.begin(), idx_walk, csb_tail->csb_indices * sizeof(index_desc*));
SSHORT idx_walk_count = 0;
float selectivity = 1; /* Real maximum selectivity possible is 1 */
for (SSHORT i = 0; i < csb_tail->csb_indices; i++)
{
SSHORT last_idx = -1;
UINT64 last_priority_level = 0;
for (SSHORT j = csb_tail->csb_indices - 1; j >= 0; j--)
{
if (!(idx_priority_level[j] == 0) &&
(idx_priority_level[j] >= last_priority_level))
{
last_priority_level = idx_priority_level[j];
last_idx = j;
}
}
if (last_idx >= 0) {
/* dimitr: Empirically, it's better to use less indices with very good selectivity
than using all available ones. Here we're deciding how many indices we
should use. Since all indices are already ordered by their selectivity,
it becomes a trivial task. But note that indices with zero (unknown)
selectivity are always used, because we don't have a clue how useful
they are in fact, so we should be optimistic in this case. Unique
indices are also always used, because they are good by definition,
regardless of their (probably old) selectivity values. */
index_desc* idx = idx_csb[last_idx];
bool should_be_used = true;
if (idx->idx_selectivity && !(csb_tail->csb_plan)) {
if (!(idx->idx_flags & idx_unique) &&
(selectivity * SELECTIVITY_THRESHOLD_FACTOR < idx->idx_selectivity))
{
should_be_used = false;
}
selectivity = idx->idx_selectivity;
}
idx_priority_level[last_idx] = 0; /* Mark as used by setting priority_level to 0 */
if (should_be_used) {
idx_walk[idx_walk_count] = idx_csb[last_idx];
idx_walk_count++;
}
}
}
return idx_walk_count;
}