/* * PROGRAM: JRD Access Method * MODULE: nav.cpp * DESCRIPTION: Navigational index walking * * The contents of this file are subject to the Interbase Public * License Version 1.0 (the "License"); you may not use this file * except in compliance with the License. You may obtain a copy * of the License at http://www.Inprise.com/IPL.html * * Software distributed under the License is distributed on an * "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express * or implied. See the License for the specific language governing * rights and limitations under the License. * * The Original Code was created by Inprise Corporation * and its predecessors. Portions created by Inprise Corporation are * Copyright (C) Inprise Corporation. * * All Rights Reserved. * Contributor(s): ______________________________________. */ #include "firebird.h" #include #include "memory_routines.h" #include "../jrd/common.h" #include "../jrd/jrd.h" #include "../jrd/ods.h" #include "../jrd/val.h" #include "../jrd/btr.h" #include "../jrd/btn.h" #include "../jrd/req.h" #include "../jrd/exe.h" #include "../jrd/sbm.h" #include "../jrd/rse.h" #include "gen/iberror.h" #include "../jrd/lck.h" #include "../jrd/cch.h" #include "../jrd/blr.h" #include "../jrd/btr_proto.h" #include "../jrd/cch_proto.h" #include "../jrd/dbg_proto.h" #include "../jrd/err_proto.h" #include "../jrd/evl_proto.h" #include "../jrd/gds_proto.h" #include "../jrd/mov_proto.h" #include "../jrd/nav_proto.h" #include "../jrd/rse_proto.h" #include "../jrd/vio_proto.h" using namespace Jrd; //#define MOVE_BYTE(x_from, x_to) *x_to++ = *x_from++; static int compare_keys(const index_desc*, const UCHAR*, USHORT, const temporary_key*, USHORT); #ifdef SCROLLABLE_CURSORS static void expand_index(WIN *); #endif static btree_exp* find_current(exp_index_buf*, Ods::btree_page*, const UCHAR*); static bool find_saved_node(thread_db* tdbb, RecordSource*, IRSB_NAV, WIN*, UCHAR**); static UCHAR* get_position(thread_db*, RecordSource*, IRSB_NAV, WIN *, rse_get_mode, btree_exp**); static bool get_record(thread_db* tdbb, RecordSource*, IRSB_NAV, record_param*, temporary_key*, bool); static void init_fetch(IRSB_NAV); static UCHAR* nav_open(thread_db* tdbb, RecordSource*, IRSB_NAV, WIN *, rse_get_mode); //, btree_exp**); static void set_position(IRSB_NAV, record_param*, WIN*, const UCHAR*, btree_exp*, const UCHAR*, USHORT); static bool setup_bitmaps(thread_db* tdbb, RecordSource*, IRSB_NAV); #ifdef SCROLLABLE_CURSORS exp_index_buf* NAV_expand_index(WIN * window, IRSB_NAV impure) { /************************************** * * N A V _ e x p a n d _ i n d e x * ************************************** * * Functional description * Given a window with a btree leaf page loaded into it, * expand the index page into a form that facilitates walking * backward through it. Each node's data is decompressed. * Since the prefix field is not needed, it contains an offset to * the prior node. * * If an impure pointer is passed, set the current node on the * expanded page to match that on the corresponding btree page. * **************************************/ // allocate the expanded page to allow room for all nodes fully expanded, // plus leave room for an extra node with zero-length tail // (note that the difference in size of a btree_exp node versus a btree_nod node could // be deducted, but there is no easy way to get the no. of nodes on page) */ // if the right version of expanded page is available, there // is no work to be done exp_index_buf* expanded_page = window->win_expanded_buffer; if (expanded_page && (expanded_page->exp_incarnation == CCH_get_incarnation(window))) { return expanded_page; } // If different incarnation, reallocate the page if (expanded_page) { ALL_free(expanded_page); } Ods::btree_page* page = (Ods::btree_page*) window->win_buffer; expanded_page = (exp_index_buf*) ALL_malloc(EXP_SIZE + page->btr_prefix_total + (SLONG) page->btr_length + BTX_SIZE, ERR_jmp); window->win_expanded_buffer = expanded_page; expanded_page->exp_incarnation = -1; expand_index(window); if (!impure) { return expanded_page; } // go through the nodes on the original page and reposition UCHAR* pointer = BTreeNode::getPointerFirstNode(page); const UCHAR* const endPointer = ((UCHAR*) page + page->btr_length); btree_exp* expanded_node = (btree_exp*) expanded_page->exp_nodes; const UCHAR* current_pointer = ((UCHAR*) page + impure->irsb_nav_offset); impure->irsb_nav_expanded_offset = -1; Ods::IndexNode node; while (pointer < endPointer) { if (pointer == current_pointer) { impure->irsb_nav_expanded_offset = (UCHAR*) expanded_node - (UCHAR*) expanded_page; } pointer = BTreeNode::nextNode(pointer, &expanded_node); } return expanded_page; } #endif bool NAV_get_record(thread_db* tdbb, RecordSource* rsb, IRSB_NAV impure, record_param* rpb, rse_get_mode direction) { /************************************** * * N A V _ g e t _ r e c o r d * ************************************** * * Functional description * Get a record from a stream, either in * the forward or backward direction, or the * current record. This routine must set * BOF or EOF properly. * **************************************/ SET_TDBB(tdbb); #ifdef SCROLLABLE_CURSORS // before we do anything, check for the case where an ascending index // was used to optimize a descending sort, or a descending index was // used to optimize an ascending sort--in either case, we need to flip // the nominal direction of navigation if (rsb->rsb_flags & rsb_descending) { if (direction == RSE_get_forward) { direction = RSE_get_backward; } else if (direction == RSE_get_backward) { direction = RSE_get_forward; } } #endif init_fetch(impure); index_desc* idx = (index_desc*) ((SCHAR*) impure + (IPTR) rsb->rsb_arg[RSB_NAV_idx_offset]); // The bitmap is only valid when we are continuing on in one // direction. It is of no help when we change direction, // and so we need to reset in that case. #ifdef SCROLLABLE_CURSORS if (((impure->irsb_flags & irsb_backwards) && direction != RSE_get_backward) || (!(impure->irsb_flags & irsb_backwards) && direction != RSE_get_forward)) { RecordBitmap::reset(impure->irsb_nav_records_visited); } if (direction == RSE_get_forward) { impure->irsb_flags &= ~irsb_backwards; } else if (direction == RSE_get_backward) { impure->irsb_flags |= irsb_backwards; } #endif // find the last fetched position from the index const USHORT pageSpaceID = rpb->rpb_relation->getPages(tdbb)->rel_pg_space_id; WIN window(pageSpaceID, impure->irsb_nav_page); btree_exp* expanded_next = NULL; UCHAR* nextPointer = get_position(tdbb, rsb, impure, &window, direction, &expanded_next); if (!nextPointer) return false; temporary_key key; memcpy(key.key_data, impure->irsb_nav_data, impure->irsb_nav_length); jrd_nod* retrieval_node = (jrd_nod*) rsb->rsb_arg[RSB_NAV_index]; IndexRetrieval* retrieval = (IndexRetrieval*) retrieval_node->nod_arg[e_idx_retrieval]; // set the upper (or lower) limit for navigational retrieval temporary_key upper; #ifdef SCROLLABLE_CURSORS temporary_key lower; #endif if ((direction == RSE_get_forward) && retrieval->irb_upper_count) { upper.key_length = impure->irsb_nav_upper_length; #ifdef SCROLLABLE_CURSORS memcpy(upper.key_data, (impure->irsb_nav_data + (2 * (SLONG) rsb->rsb_arg[RSB_NAV_key_length])), upper.key_length); #else memcpy(upper.key_data, (impure->irsb_nav_data + (IPTR) rsb->rsb_arg[RSB_NAV_key_length]), upper.key_length); #endif } #ifdef SCROLLABLE_CURSORS else if ((direction == RSE_get_backward) && retrieval->irb_lower_count) { lower.key_length = impure->irsb_nav_lower_length; memcpy(lower.key_data, (impure->irsb_nav_data + (IPTR) rsb->rsb_arg[RSB_NAV_key_length]), lower.key_length); } #endif // In the case of a DISTINCT, we must detect whether the key changed since the last // time a record was returned from the rsb. It is not good enough to know whether the // key changed since the last node in the index, because the record represented // by the last index node may not have satisfied some boolean expression on the rsb. // So to find out whether the key has changed since the last time a record was actually // returned from the rsb, we save the record count each time we return a candidate record, // and see if the count is updated the next time we get here. // If the count has been updated, we know the record has been returned from the rsb, and // the index key must change before we can return another DISTINCT record candidate. If // the last candidate did not qualify, we know we should return another record no matter // what. if (rsb->rsb_record_count != impure->irsb_nav_count) { impure->irsb_flags &= ~irsb_key_changed; impure->irsb_nav_count = rsb->rsb_record_count; } else { impure->irsb_flags |= irsb_key_changed; } // Find the next interesting node. If necessary, skip to the next page bool page_changed = false; RecordNumber number; Ods::IndexNode node; while (true) { Ods::btree_page* page = (Ods::btree_page*) window.win_buffer; const UCHAR flags = page->btr_header.pag_flags; UCHAR* pointer = nextPointer; btree_exp* expanded_node = expanded_next; if (pointer) { BTreeNode::readNode(&node, pointer, flags, true); number = node.recordNumber; } #ifdef SCROLLABLE_CURSORS // in the backwards case, check to make sure we haven't hit the // beginning of a page, and if so fetch the left sibling page. if (direction == RSE_get_backward) { if (pointer < BTreeNode::getPointerFirstNode(page)) { exp_index_buf* expanded_page = window.win_expanded_buffer; if (!page->btr_left_sibling) { impure->irsb_flags |= irsb_bof; break; } page = BTR_left_handoff(tdbb, &window, page, LCK_read); expanded_page = NAV_expand_index(&window, 0); nextPointer = BTR_last_node(page, expanded_page, &expanded_next); page_changed = true; continue; } } else // In the forwards case, check for end of page. If we find // it, do a simple handoff to the right sibling page. #endif { if (node.isEndLevel) { #ifdef SCROLLABLE_CURSORS impure->irsb_flags |= irsb_eof; #endif break; } if (node.isEndBucket) { page = (Ods::btree_page*) window.win_buffer; page = (Ods::btree_page*) CCH_HANDOFF(tdbb, &window, page->btr_sibling, LCK_read, pag_index); nextPointer = BTreeNode::getPointerFirstNode(page); exp_index_buf* expanded_page = window.win_expanded_buffer; if (expanded_page) { expanded_next = (btree_exp*) expanded_page->exp_nodes; } page_changed = true; continue; } } // In the project (DISTINCT) case, we need to determine if the key has changed // since the last record that was returned from the rsb. That means that we must // know what the key was for that record // in the case where we are on the same page, // we simply check to see if there is any data in the node; if we are on a new // page, we must compare this node with the last key we saw // NOTE: the optimizer only uses indices which have the same number of fields as // those in the DISTINCT clause; there's no reason we couldn't use an index which // has extra fields to the right, we just need to add some code to check // when only the first n segment(s) of the key has changed, rather than the whole key if (rsb->rsb_flags & rsb_project) { if (page_changed) { if (node.length != key.key_length || (key.key_length && memcmp(key.key_data, node.data, key.key_length))) { impure->irsb_flags |= irsb_key_changed; } } else if (node.length) { impure->irsb_flags |= irsb_key_changed; } } page_changed = false; // Build the current key value from the prefix and current node data. if (expanded_node) { memcpy(key.key_data, expanded_node->btx_data, node.length + node.prefix); } else { memcpy(key.key_data + node.prefix, node.data, node.length); } key.key_length = node.length + node.prefix; // Make sure we haven't hit the upper (or lower) limit. if ((direction == RSE_get_forward) && retrieval->irb_upper_count && compare_keys(idx, key.key_data, key.key_length, &upper, retrieval->irb_generic & (irb_descending | irb_partial | irb_starting)) > 0) { break; } #ifdef SCROLLABLE_CURSORS if ((direction == RSE_get_backward) && retrieval->irb_lower_count && compare_keys(idx, key.key_data, key.key_length, &lower, retrieval->irb_generic & (irb_descending | irb_partial | irb_starting)) < 0) { break; } #endif // skip this record if: // 1) there is an inversion tree for this index and this record // is not in the bitmap for the inversion, or // 2) the record has already been visited, or // 3) this is a projection and the new node is the same as the last if ((rsb->rsb_arg[RSB_NAV_inversion] && (!impure->irsb_nav_bitmap || !RecordBitmap::test(*impure->irsb_nav_bitmap, number.getValue()))) || RecordBitmap::test(impure->irsb_nav_records_visited, number.getValue()) || ((rsb->rsb_flags & rsb_project) && !(impure->irsb_flags & irsb_key_changed))) { #ifdef SCROLLABLE_CURSORS if (direction == RSE_get_backward) { nextPointer = BTreeNode::previousNode(/*&node,*/ pointer, /*flags,*/ &expanded_node); expanded_next = expanded_node; continue; } #endif if (direction == RSE_get_forward) { nextPointer = BTreeNode::nextNode(&node, pointer, flags, &expanded_node); expanded_next = expanded_node; continue; } } // reset the current navigational position in the index rpb->rpb_number = number; set_position(impure, rpb, &window, pointer, expanded_node, key.key_data, key.key_length); CCH_RELEASE(tdbb, &window); if (get_record(tdbb, rsb, impure, rpb, &key, false)) { return true; } nextPointer = get_position(tdbb, rsb, impure, &window, direction, &expanded_next); if (!nextPointer) return false; } CCH_RELEASE(tdbb, &window); // bof or eof must have been set at this point return false; } static int compare_keys(const index_desc* idx, const UCHAR* key_string1, USHORT length1, const temporary_key* key2, USHORT flags) { /************************************** * * c o m p a r e _ k e y s * ************************************** * * Functional description * Compare two index keys. * If a partial key comparison is specified, * ensure that the shorter key (the second * one) matches segment-by-segment with the * index key. * **************************************/ const UCHAR* string1 = key_string1; const UCHAR* string2 = key2->key_data; const USHORT length2 = key2->key_length; USHORT l = MIN(length1, length2); if (l) { do { if (*string1++ != *string2++) { return (string1[-1] < string2[-1]) ? -1 : 1; } } while (--l); } // if the keys are identical, return 0 if (length1 == length2) { return 0; } // do a partial key search; if the index is a compound key, // check to see if the segments are matching--for character // fields, do partial matches within a segment if irb_starting // is specified, for other types do only matches on the entire segment if ((flags & (irb_partial | irb_starting)) && (length1 > length2)) { // figure out what segment we're on; if it's a // character segment we've matched the partial string const UCHAR* segment = 0; const index_desc::idx_repeat* tail; if (idx->idx_count > 1) { segment = key_string1 + ((length2 - 1) / (Ods::STUFF_COUNT + 1)) * (Ods::STUFF_COUNT + 1); tail = idx->idx_rpt + (idx->idx_count - *segment); } else { tail = &idx->idx_rpt[0]; } // If it's a string type key, and we're allowing "starting with" fuzzy // type matching, we're done if ((flags & irb_starting) && (tail->idx_itype == idx_string || tail->idx_itype == idx_byte_array || tail->idx_itype == idx_metadata || tail->idx_itype >= idx_first_intl_string)) { return 0; } if (idx->idx_count > 1) { // If we search for NULLs at the begin then we're done if the first // segment isn't the first one possible (0 for ASC, 255 for DESC). if (length2 == 0) { if (flags & irb_descending) { if (*segment != 255) { return 0; } } else { if (*segment != 0) { return 0; } } } // if we've exhausted the segment, we've found a match USHORT remainder = length2 % (Ods::STUFF_COUNT + 1); if (!remainder && (*string1 != *segment)) { return 0; } // if the rest of the key segment is 0's, we've found a match if (remainder) { for (remainder = Ods::STUFF_COUNT + 1 - remainder; remainder; remainder--) { if (*string1++) { break; } } if (!remainder) { return 0; } } } } if (flags & irb_descending) { return (length1 < length2) ? 1 : -1; } return (length1 < length2) ? -1 : 1; } #ifdef SCROLLABLE_CURSORS static void expand_index(WIN * window) { /************************************** * * e x p a n d _ i n d e x * ************************************** * * Functional description * Given a window with a btree leaf page loaded into it, * expand the index page into a form that facilitates walking * backward through it. Each node's data is decompressed. * Since the prefix field is not needed, it contains an offset to * the prior node. * **************************************/ Ods::btree_page* page = (Ods::btree_page*) window->win_buffer; exp_index_buf* expanded_page = window->win_expanded_buffer; expanded_page->exp_incarnation = CCH_get_incarnation(window); // go through the nodes on the original page and expand them temporary_key key; btree_exp* expanded_node = (btree_exp*) expanded_page->exp_nodes; bool priorPointer = false; UCHAR* pointer = BTreeNode::getPointerFirstNode(page); const UCHAR* const endPointer = ((UCHAR*) page + page->btr_length); const UCHAR flags = page->btr_header.pag_flags; Ods::IndexNode node, priorNode; while (pointer < endPointer) { if (!priorPointer) { pointer = BTreeNode::readNode(&node, pointer, flags, true); } memcpy(key.key_data + node.prefix, node.data, node.length); memcpy(expanded_node->btx_data, key.key_data, node.length + node.prefix); // point back to the prior nodes on the expanded page and the btree page expanded_node->btx_btr_previous_length = priorPointer ? BTreeNode::getLeafNodeSize(&priorNode, flags) : 0; expanded_node->btx_previous_length = priorPointer ? priorNode.length + priorNode.prefix : 0; priorPointer = true; priorNode = node; pointer = BTreeNode::nextNode(&node, pointer, flags, &expanded_node); } // insert one additional expanded node to keep track of the length of the // last node on page--this is necessary because the end of bucket marker // contains the length and key of the first node on the next page expanded_node->btx_btr_previous_length = priorPointer ? BTreeNode::getLeafNodeSize(&priorNode, flags) : 0; expanded_node->btx_previous_length = priorPointer ? priorNode.length + priorNode.prefix : 0; expanded_page->exp_length = (UCHAR*) expanded_node - (UCHAR*) expanded_page + BTX_SIZE; } #endif static btree_exp* find_current(exp_index_buf* expanded_page, Ods::btree_page* page, const UCHAR* current_pointer) { /************************************** * * f i n d _ c u r r e n t * ************************************** * * Functional description * Find the current location in the expanded * index buffer according to its corresponding * btree page. * **************************************/ if (!expanded_page) { return NULL; } btree_exp* expanded_node = expanded_page->exp_nodes; const UCHAR flags = page->btr_header.pag_flags; UCHAR* pointer = BTreeNode::getPointerFirstNode(page); const UCHAR* const endPointer = ((UCHAR*) page + page->btr_length); Ods::IndexNode node; while (pointer < endPointer) { if (pointer == current_pointer) { return expanded_node; } // AB: Together this looks pretty the same as BTreeNode::nextNode pointer = BTreeNode::readNode(&node, pointer, flags, true); expanded_node = (btree_exp*) ((UCHAR*) expanded_node->btx_data + node.prefix + node.length); } return NULL; } static bool find_saved_node(thread_db* tdbb, RecordSource* rsb, IRSB_NAV impure, WIN* window, UCHAR** return_pointer) { /************************************** * * f i n d _ s a v e d _ n o d e * ************************************** * * Functional description * A page has changed. Find the new position of the * previously stored node. The node could even be on * a sibling page if the page has split. If we find * the actual node, return true. * **************************************/ SET_TDBB(tdbb); index_desc* idx = (index_desc*) ((SCHAR*) impure + (IPTR) rsb->rsb_arg[RSB_NAV_idx_offset]); Ods::btree_page* page = (Ods::btree_page*) CCH_FETCH(tdbb, window, LCK_read, pag_index); // the outer loop goes through all the sibling pages // looking for the node (in case the page has split); // the inner loop goes through the nodes on each page temporary_key key; const UCHAR flags = page->btr_header.pag_flags; Ods::IndexNode node; while (true) { UCHAR* pointer = BTreeNode::getPointerFirstNode(page); const UCHAR* const endPointer = ((UCHAR*) page + page->btr_length); while (pointer < endPointer) { pointer = BTreeNode::readNode(&node, pointer, flags, true); if (node.isEndLevel) { *return_pointer = node.nodePointer; return false; } if (node.isEndBucket) { page = (Ods::btree_page*) CCH_HANDOFF(tdbb, window, page->btr_sibling, LCK_read, pag_index); break; } // maintain the running key value and compare it with the stored value memcpy(key.key_data + node.prefix, node.data, node.length); key.key_length = node.length + node.prefix; const int result = compare_keys(idx, impure->irsb_nav_data, impure->irsb_nav_length, &key, 0); // if the keys are equal, return this node even if it is just a duplicate node; // duplicate nodes that have already been returned will be filtered out at a // higher level by checking the sparse bit map of records already returned, and // duplicate nodes that were inserted before the stored node can be // safely returned since their position in the index is arbitrary if (!result) { *return_pointer = node.nodePointer; return node.recordNumber == impure->irsb_nav_number; } // if the stored key is less than the current key, then the stored key // has been deleted from the index and we should just return the next // key after it if (result < 0) { *return_pointer = node.nodePointer; return false; } } } } static UCHAR* get_position(thread_db* tdbb, RecordSource* rsb, IRSB_NAV impure, WIN* window, rse_get_mode direction, btree_exp** expanded_node) { /************************************** * * g e t _ p o s i t i o n * ************************************** * * Functional description * Re-fetch B-tree page and reposition the node pointer to where * we left off. If the page has been sitting in cache unchanged * since we were there last, this is easy and cheap. If there's * any chance the page has changed, we need to resynch. * **************************************/ SET_TDBB(tdbb); // If this is the first time, start at the beginning (or the end) #ifdef SCROLLABLE_CURSORS if (!window->win_page.getPageNum() || impure->irsb_flags & (irsb_bof | irsb_eof)) #else if (!window->win_page.getPageNum()) #endif { return nav_open(tdbb, rsb, impure, window, direction); //, expanded_node); } exp_index_buf* expanded_page = NULL; // Re-fetch page and get incarnation counter Ods::btree_page* page = (Ods::btree_page*) CCH_FETCH(tdbb, window, LCK_read, pag_index); #ifdef SCROLLABLE_CURSORS // we must ensure that if we are going backwards, we always // have an expanded buffer (and a valid position on that page) if (direction == RSE_get_backward) { NAV_expand_index(window, impure); } expanded_page = window->win_expanded_buffer; #endif UCHAR* pointer = 0; const UCHAR flags = page->btr_header.pag_flags; const SLONG incarnation = CCH_get_incarnation(window); Ods::IndexNode node; if (incarnation == impure->irsb_nav_incarnation) { pointer = ((UCHAR*) page + impure->irsb_nav_offset); if (!expanded_page) { // theoretically impossible *expanded_node = NULL; } else if (impure->irsb_nav_expanded_offset < 0) { // position unknown or invalid *expanded_node = find_current(expanded_page, page, pointer); } else { *expanded_node = (btree_exp*) ((UCHAR*) expanded_page + impure->irsb_nav_expanded_offset); } // The new way of doing things is to have the current // nav_offset be the last node fetched. Go forward or // backward from that point accordingly. #ifdef SCROLLABLE_CURSORS if (direction == RSE_get_backward) { pointer = BTreeNode::previousNode(/*&node,*/ pointer, /*flags,*/ expanded_node); //node = (btree_nod*) BTR_previous_node( (UCHAR*)node, expanded_node); } else #endif { if (direction == RSE_get_forward) pointer = BTreeNode::nextNode(&node, pointer, flags, expanded_node); } return pointer; } // Page is presumably changed. If there is a previous // stored position in the page, go back to it if possible. CCH_RELEASE(tdbb, window); if (!impure->irsb_nav_page) { return nav_open(tdbb, rsb, impure, window, direction); //, expanded_node); } const bool found = find_saved_node(tdbb, rsb, impure, window, &pointer); page = (Ods::btree_page*) window->win_buffer; if (pointer) { *expanded_node = find_current(window->win_expanded_buffer, page, pointer); #ifdef SCROLLABLE_CURSORS if (direction == RSE_get_backward) { pointer = BTreeNode::previousNode(/*&node,*/ pointer, /*flags,*/ expanded_node); //node = (btree_nod*) BTR_previous_node((UCHAR*) node, expanded_node); } else #endif { if (direction == RSE_get_forward && found) { // in the forward case, seek to the next node only if we found // the actual node on page; if we did not find it, we are already // at the next node (such as when the node is garbage collected) pointer = BTreeNode::nextNode(&node, pointer, flags, expanded_node); } } return pointer; } #ifdef SCROLLABLE_CURSORS // As a last resort, return the first (or last if backwards) // node on the page. The sparse bitmap will prevent us from // seeing records we have already visited before. if (direction == RSE_get_backward) { expanded_page = NAV_expand_index(window, 0); return BTR_last_node(page, expanded_page, expanded_node); } if (expanded_page = window->win_expanded_buffer) { *expanded_node = (btree_exp*) expanded_page->exp_nodes; } #endif return BTreeNode::getPointerFirstNode(page); } static bool get_record(thread_db* tdbb, RecordSource* rsb, IRSB_NAV impure, record_param* rpb, temporary_key* key, bool inhibit_cleanup) { /************************************** * * g e t _ r e c o r d * ************************************** * * Functional description * Get the record indicated by the passed rpb. * **************************************/ SET_TDBB(tdbb); jrd_req* request = tdbb->getRequest(); index_desc* idx = (index_desc*) ((SCHAR*) impure + (IPTR) rsb->rsb_arg[RSB_NAV_idx_offset]); ULONG old_att_flags = 0; bool result = false; try { if (inhibit_cleanup) { // Inhibit garbage collection & other housekeeping - // to prevent a deadlock when we visit the record. // There are cases when we are called here and have a window locked // HACK for bug 7041 old_att_flags = (tdbb->getAttachment()->att_flags & ATT_no_cleanup); tdbb->getAttachment()->att_flags |= ATT_no_cleanup; // HACK } #ifdef SCROLLABLE_CURSORS // the attempt to get a record, whether successful or not, takes // us off bof or eof (otherwise we will keep trying to retrieve // the first record) impure->irsb_flags &= ~(irsb_bof | irsb_eof); #endif result = VIO_get(tdbb, rpb, request->req_transaction, request->req_pool); temporary_key value; if (result) { BTR_key(tdbb, rpb->rpb_relation, rpb->rpb_record, reinterpret_cast((SCHAR*) impure + (IPTR) rsb->rsb_arg[RSB_NAV_idx_offset]), &value, 0, false); if (compare_keys(idx, key->key_data, key->key_length, &value, 0)) { result = false; } else { // mark in the navigational bitmap that we have visited this record RBM_SET(tdbb->getDefaultPool(), &impure->irsb_nav_records_visited, rpb->rpb_number.getValue()); } } if (inhibit_cleanup) { tdbb->getAttachment()->att_flags &= ~ATT_no_cleanup; tdbb->getAttachment()->att_flags |= old_att_flags; } } // try catch (const Firebird::Exception&) { // Cleanup the HACK should there be an error tdbb->getAttachment()->att_flags &= ~ATT_no_cleanup; tdbb->getAttachment()->att_flags |= old_att_flags; throw; } return result; } static void init_fetch(IRSB_NAV impure) { /************************************** * * i n i t _ f e t c h * ************************************** * * Functional description * Initialize for a fetch operation. * **************************************/ if (impure->irsb_flags & irsb_first) { impure->irsb_flags &= ~irsb_first; impure->irsb_nav_page = 0; } } static UCHAR* nav_open(thread_db* tdbb, RecordSource* rsb, IRSB_NAV impure, WIN* window, rse_get_mode direction) //, btree_exp** expanded_node) { /************************************** * * n a v _ o p e n * ************************************** * * Functional description * Open a stream to walk an index. * **************************************/ SET_TDBB(tdbb); // initialize for a retrieval if (!setup_bitmaps(tdbb, rsb, impure)) return NULL; impure->irsb_nav_page = 0; impure->irsb_nav_length = 0; #ifdef SCROLLABLE_CURSORS if (direction == RSE_get_forward) { impure->irsb_flags |= irsb_bof; } else if (direction == RSE_get_backward) { impure->irsb_flags |= irsb_eof; } #endif // Find the starting leaf page jrd_nod* retrieval_node = (jrd_nod*) rsb->rsb_arg[RSB_NAV_index]; IndexRetrieval* retrieval = (IndexRetrieval*) retrieval_node->nod_arg[e_idx_retrieval]; index_desc* idx = (index_desc*) ((SCHAR *) impure + (IPTR) rsb->rsb_arg[RSB_NAV_idx_offset]); temporary_key lower, upper; #ifdef SCROLLABLE_CURSORS Ods::btree_page* page = BTR_find_page(tdbb, retrieval, window, idx, &lower, &upper, (direction == RSE_get_backward)); #else Ods::btree_page* page = BTR_find_page(tdbb, retrieval, window, idx, &lower, &upper); #endif impure->irsb_nav_page = window->win_page.getPageNum(); #ifdef SCROLLABLE_CURSORS // store the upper and lower bounds for the search in the impure area for the rsb if (retrieval->irb_lower_count) { impure->irsb_nav_lower_length = lower.key_length; memcpy((impure->irsb_nav_data + (SLONG) rsb->rsb_arg[RSB_NAV_key_length]), lower.key_data, lower.key_length); } if (retrieval->irb_upper_count) { impure->irsb_nav_upper_length = upper.key_length; memcpy((impure->irsb_nav_data + (2 * (SLONG) rsb->rsb_arg[RSB_NAV_key_length])), upper.key_data, upper.key_length); } // find the limit the search needs to begin with, if any temporary_key* limit_ptr = NULL; if (direction == RSE_get_forward) { if (retrieval->irb_lower_count) limit_ptr = &lower; } else { if (retrieval->irb_upper_count) limit_ptr = &upper; } #else // find the upper limit for the search (or lower for backwards) temporary_key* limit_ptr = NULL; if (direction == RSE_get_forward) { if (retrieval->irb_upper_count) { impure->irsb_nav_upper_length = upper.key_length; memcpy((impure->irsb_nav_data + (IPTR) rsb->rsb_arg[RSB_NAV_key_length]), upper.key_data, upper.key_length); } if (retrieval->irb_lower_count) { limit_ptr = &lower; } } else { fb_assert(direction == RSE_get_forward); if (retrieval->irb_lower_count) { impure->irsb_nav_lower_length = lower.key_length; memcpy((impure->irsb_nav_data + (IPTR) rsb->rsb_arg[RSB_NAV_key_length]), lower.key_data, lower.key_length); } if (retrieval->irb_upper_count) { limit_ptr = &upper; } } #endif // If there is a starting descriptor, search down index to starting position. // This may involve sibling buckets if splits are in progress. If there // isn't a starting descriptor, walk down the left side of the index (or the // right side if backwards). #ifdef SCROLLABLE_CURSORS exp_index_buf* expanded_page = 0; #endif UCHAR* pointer = NULL; if (limit_ptr) { // If END_BUCKET is reached BTR_find_leaf will return NULL while (!(pointer = BTR_find_leaf(page, limit_ptr, impure->irsb_nav_data, 0, (idx->idx_flags & idx_descending) != 0, true))) { page = (Ods::btree_page*) CCH_HANDOFF(tdbb, window, page->btr_sibling, LCK_read, pag_index); } Ods::IndexNode node; BTreeNode::readNode(&node, pointer, page->btr_header.pag_flags, true); impure->irsb_nav_length = node.prefix + node.length; #ifdef SCROLLABLE_CURSORS // ensure that if we are going backward, there is an expanded page if (direction == RSE_get_backward && !window->win_expanded_buffer) NAV_expand_index(window, 0); // now find our current location on the expanded page if (expanded_node && (expanded_page = window->win_expanded_buffer)) { *expanded_node = find_current(expanded_page, page, pointer); } #endif } #ifdef SCROLLABLE_CURSORS else if (direction == RSE_get_backward) { expanded_page = NAV_expand_index(window, 0); pointer = BTR_last_node(page, expanded_page, expanded_node); } #endif else { pointer = BTreeNode::getPointerFirstNode(page); #ifdef SCROLLABLE_CURSORS if (expanded_node && (expanded_page = window->win_expanded_buffer)) { *expanded_node = (btree_exp*) expanded_page->exp_nodes; } else { *expanded_node = NULL; } #endif } return pointer; } static void set_position(IRSB_NAV impure, record_param* rpb, WIN* window, const UCHAR* pointer, btree_exp* expanded_node, const UCHAR* key_data, USHORT length) { /************************************** * * s e t _ p o s i t i o n * ************************************** * * Functional description * Setup the information about the current position * in the navigational index. Store all required data in the * impure area for the request. * **************************************/ // We can actually set position without having a data page // fetched; if not, just set the incarnation to the lowest possible impure->irsb_nav_incarnation = CCH_get_incarnation(window); impure->irsb_nav_page = window->win_page.getPageNum(); impure->irsb_nav_number = rpb->rpb_number; // save the current key value if it hasn't already been saved if (key_data) { impure->irsb_nav_length = length; memcpy(impure->irsb_nav_data, key_data, length); } // setup the offsets into the current index page and expanded index buffer impure->irsb_nav_offset = pointer - (UCHAR*) window->win_buffer; if (window->win_expanded_buffer) { impure->irsb_nav_expanded_offset = (UCHAR*) expanded_node - (UCHAR*) window->win_expanded_buffer; } else { impure->irsb_nav_expanded_offset = -1; } } static bool setup_bitmaps(thread_db* tdbb, RecordSource* rsb, IRSB_NAV impure) { /************************************** * * s e t u p _ b i t m a p s * ************************************** * * Functional description * Setup the various bitmaps associated * with a stream. * **************************************/ SET_TDBB(tdbb); // Start a bitmap which tells us we have already visited // this record; this is to handle the case where there is more // than one leaf node reference to the same record number; the // bitmap allows us to filter out the multiple references. RecordBitmap::reset(impure->irsb_nav_records_visited); // the first time we open the stream, compute a bitmap // for the inversion tree--this may cause problems for // read-committed transactions since they will get one // view of the database when the stream is opened if (rsb->rsb_arg[RSB_NAV_inversion]) { // There is no need to reset or release the bitmap, it is // done in EVL_bitmap (). impure->irsb_nav_bitmap = EVL_bitmap(tdbb, reinterpret_cast(rsb->rsb_arg[RSB_NAV_inversion]), NULL); return (*impure->irsb_nav_bitmap != NULL); } return true; }