/* * PROGRAM: JRD Access Method * MODULE: tra.cpp * DESCRIPTION: Transaction manager * * The contents of this file are subject to the Interbase Public * License Version 1.0 (the "License"); you may not use this file * except in compliance with the License. You may obtain a copy * of the License at http://www.Inprise.com/IPL.html * * Software distributed under the License is distributed on an * "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express * or implied. See the License for the specific language governing * rights and limitations under the License. * * The Original Code was created by Inprise Corporation * and its predecessors. Portions created by Inprise Corporation are * Copyright (C) Inprise Corporation. * * All Rights Reserved. * Contributor(s): ______________________________________. * 2001.07.06 Sean Leyne - Code Cleanup, removed "#ifdef READONLY_DATABASE" * conditionals, as the engine now fully supports * readonly databases. * 2002.10.29 Nickolay Samofatov: Added support for savepoints */ #include "firebird.h" #include #include "../jrd/jrd.h" #include "../jrd/tra.h" #include "../jrd/ods.h" #include "../jrd/pag.h" #include "../jrd/lck.h" #include "../jrd/lls.h" #include "../jrd/btr.h" #include "../jrd/req.h" #include "../jrd/exe.h" #include "../jrd/extds/ExtDS.h" #include "../jrd/rse.h" #include "../jrd/intl_classes.h" #include "../common/ThreadStart.h" #include "../jrd/UserManagement.h" #include "../jrd/blb_proto.h" #include "../jrd/cch_proto.h" #include "../jrd/cmp_proto.h" #include "../jrd/dfw_proto.h" #include "../jrd/dpm_proto.h" #include "../jrd/err_proto.h" #include "../jrd/exe_proto.h" #include "../jrd/ext_proto.h" #include "../jrd/idx_proto.h" #include "../yvalve/gds_proto.h" #include "../common/isc_proto.h" #include "../jrd/lck_proto.h" #include "../jrd/met_proto.h" #include "../jrd/mov_proto.h" #include "../jrd/pag_proto.h" #include "../jrd/rlck_proto.h" #include "../jrd/tpc_proto.h" #include "../jrd/tra_proto.h" #include "../jrd/vio_proto.h" #include "../jrd/jrd_proto.h" #include "../jrd/scl_proto.h" #include "../common/classes/ClumpletWriter.h" #include "../common/classes/TriState.h" #include "../common/utils_proto.h" #include "../lock/lock_proto.h" #include "../dsql/dsql.h" #include "../dsql/dsql_proto.h" #include "../common/StatusArg.h" #include "../jrd/trace/TraceManager.h" #include "../jrd/trace/TraceJrdHelpers.h" #include "../jrd/Function.h" #include "../jrd/Collation.h" #include "../jrd/Mapping.h" #include "../jrd/DbCreators.h" #include "../common/os/fbsyslog.h" const int DYN_MSG_FAC = 8; using namespace Jrd; using namespace Ods; using namespace Firebird; typedef Firebird::GenericMap > > RelationLockTypeMap; #ifdef SUPERSERVER_V2 static TraNumber bump_transaction_id(thread_db*, WIN*); #else static header_page* bump_transaction_id(thread_db*, WIN*, bool); #endif static void retain_context(thread_db* tdbb, jrd_tra* transaction, bool commit, int state); static void expand_view_lock(thread_db* tdbb, jrd_tra*, jrd_rel*, UCHAR lock_type, const char* option_name, RelationLockTypeMap& lockmap, const int level); static tx_inv_page* fetch_inventory_page(thread_db*, WIN* window, ULONG sequence, USHORT lock_level); static const char* get_lockname_v3(const UCHAR lock); static ULONG inventory_page(thread_db*, ULONG); static int limbo_transaction(thread_db*, TraNumber id); static void restart_requests(thread_db*, jrd_tra*); static void start_sweeper(thread_db*); static THREAD_ENTRY_DECLARE sweep_database(THREAD_ENTRY_PARAM); static void transaction_flush(thread_db* tdbb, USHORT flush_flag, TraNumber tra_number); static void transaction_options(thread_db*, jrd_tra*, const UCHAR*, USHORT); static void transaction_start(thread_db* tdbb, jrd_tra* temp); static const UCHAR sweep_tpb[] = { isc_tpb_version1, isc_tpb_read, isc_tpb_read_committed, isc_tpb_rec_version }; ActiveSnapshots::ActiveSnapshots(Firebird::MemoryPool& p) : m_snapshots(p), m_lastCommit(CN_ACTIVE), m_releaseCount(0) { } CommitNumber ActiveSnapshots::getSnapshotForVersion(CommitNumber version_cn) { if (version_cn > m_lastCommit) return CN_ACTIVE; if (m_snapshots.locate(locGreatEqual, version_cn)) return m_snapshots.current(); return m_lastCommit; } void TRA_setup_request_snapshot(Jrd::thread_db* tdbb, Jrd::jrd_req* request) { // This function is called whenever request is started in a transaction. // Setup context to preserve read consistency in READ COMMITTED transactions. Jrd::jrd_tra* transaction = request->req_transaction; // We assume that request is already attached to a transaction fb_assert(transaction); // Initialize or update list of active snapshots in a transaction // so this request can effectively perform intermediate GC if (TipCache* cache = tdbb->getDatabase()->dbb_tip_cache) cache->updateActiveSnapshots(tdbb, &transaction->tra_active_snapshots); // If we are not READ COMMITTED or stable cursors are not needed then nothing to do here if (!(transaction->tra_flags & TRA_read_committed) || !(transaction->tra_flags & TRA_read_consistency)) return; // See if there is any request right above us in the call stack jrd_req* org_request; thread_db* jrd_ctx = tdbb; do { // Check regular request call stack org_request = jrd_ctx->getRequest(); if (org_request) break; // Check for engine context switch (EXECUTE STATEMENT, etc) ThreadData* ctx = jrd_ctx; jrd_ctx = NULL; while( (ctx = ctx->getPriorContext()) ) { if (ctx->getType() == ThreadData::tddDBB) { jrd_ctx = static_cast(ctx); break; } } } while (jrd_ctx); if (org_request && org_request->req_transaction == transaction) { fb_assert(org_request->req_snapshot_owner); request->req_snapshot_owner = org_request->req_snapshot_owner; return; } // If we are a top-level request or caller is executed in a different transaction, // we need to set up statement snapshot for read consistency and own it request->req_snapshot_owner = request; request->req_snapshot_handle = tdbb->getDatabase()->dbb_tip_cache->beginSnapshot(tdbb, tdbb->getAttachment()->att_attachment_id, &request->req_snapshot_number); } void TRA_release_request_snapshot(Jrd::thread_db* tdbb, Jrd::jrd_req* request) { // This function is called whenever request has completed processing // in a transaction (normally or abnormally) if (!request->req_snapshot_owner) return; if (request->req_snapshot_handle) { tdbb->getDatabase()->dbb_tip_cache->endSnapshot(tdbb, request->req_snapshot_handle, request->req_attachment->att_attachment_id); request->req_snapshot_handle = 0; } request->req_snapshot_owner = NULL; } void TRA_attach_request(Jrd::jrd_tra* transaction, Jrd::jrd_req* request) { // When request finishes normally transaction reference is not cleared. // Then if afterwards request is restarted TRA_attach_request is called again. if (request->req_transaction) { if (request->req_transaction == transaction) return; TRA_detach_request(request); } fb_assert(request->req_transaction == NULL); fb_assert(request->req_tra_next == NULL); fb_assert(request->req_tra_prev == NULL); // Assign transaction reference request->req_transaction = transaction; // Add request to the doubly linked list if (transaction->tra_requests) { fb_assert(transaction->tra_requests->req_tra_prev == NULL); transaction->tra_requests->req_tra_prev = request; request->req_tra_next = transaction->tra_requests; } transaction->tra_requests = request; } void TRA_detach_request(Jrd::jrd_req* request) { if (!request->req_transaction) { fb_assert(!request->req_savepoints); return; } // Release stored looper savepoints Savepoint::destroy(request->req_savepoints); // Remove request from the doubly linked list if (request->req_tra_next) { fb_assert(request->req_tra_next->req_tra_prev == request); request->req_tra_next->req_tra_prev = request->req_tra_prev; } if (request->req_tra_prev) { fb_assert(request->req_tra_prev->req_tra_next == request); request->req_tra_prev->req_tra_next = request->req_tra_next; } else { fb_assert(request->req_transaction->tra_requests == request); request->req_transaction->tra_requests = request->req_tra_next; } // Clear references request->req_transaction = NULL; request->req_tra_next = NULL; request->req_tra_prev = NULL; } bool TRA_active_transactions(thread_db* tdbb, Database* dbb) { /************************************** * * T R A _ a c t i v e _ t r a n s a c t i o n s * ************************************** * * Functional description * Determine if any transactions are active. * Return true is active transactions; otherwise * return false if no active transactions. * **************************************/ SET_TDBB(tdbb); return LCK_query_data(tdbb, LCK_tra, LCK_ANY) ? true : false; } void TRA_cleanup(thread_db* tdbb) { /************************************** * * T R A _ c l e a n u p * ************************************** * * Functional description * TRA_cleanup is called at startup while an exclusive lock is * held on the database. Because we haven't started a transaction, * and we have an exclusive lock on the db, any transactions marked * as active on the transaction inventory pages are indeed dead. * Mark them so. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // Return without cleaning up the TIP's for a ReadOnly database if (dbb->readOnly()) return; // First, make damn sure there are no outstanding transactions for (Jrd::Attachment* attachment = dbb->dbb_attachments; attachment; attachment = attachment->att_next) { if (attachment->att_transactions) return; } const ULONG trans_per_tip = dbb->dbb_page_manager.transPerTIP; // Read header page and allocate transaction number. Since // the transaction inventory page was initialized to zero, it // transaction is automatically marked active. WIN window(HEADER_PAGE_NUMBER); const header_page* header = (header_page*) CCH_FETCH(tdbb, &window, LCK_read, pag_header); const TraNumber ceiling = Ods::getNT(header); const TraNumber active = Ods::getOAT(header); CCH_RELEASE(tdbb, &window); if (ceiling == 0) return; // Zip thru transactions from the "oldest active" to the next looking for // active transactions. When one is found, declare it dead. const ULONG last = ceiling / trans_per_tip; ULONG number = active % trans_per_tip; TraNumber limbo = 0; for (ULONG sequence = active / trans_per_tip; sequence <= last; sequence++, number = 0) { window.win_page = inventory_page(tdbb, sequence); tx_inv_page* tip = (tx_inv_page*) CCH_FETCH(tdbb, &window, LCK_write, pag_transactions); TraNumber max = ceiling - (TraNumber) sequence * trans_per_tip; if (max >= trans_per_tip) max = trans_per_tip - 1; for (; number <= max; number++) { const ULONG trans_offset = TRANS_OFFSET(number); UCHAR* byte = tip->tip_transactions + trans_offset; const USHORT shift = TRANS_SHIFT(number); const int state = (*byte >> shift) & TRA_MASK; if (state == tra_limbo && limbo == 0) limbo = (TraNumber) sequence * trans_per_tip + number; else if (state == tra_active) { CCH_MARK(tdbb, &window); *byte &= ~(TRA_MASK << shift); // hvlad: mark system transaction as committed if (sequence == 0 && number == 0) { *byte |= tra_committed << shift; } else { *byte |= tra_dead << shift; } } } #ifdef SUPERSERVER_V2 if (sequence == last) { CCH_MARK(tdbb, &window); for (; number < trans_per_tip; number++) { const ULONG trans_offset = TRANS_OFFSET(number); UCHAR* byte = tip->tip_transactions + trans_offset; const USHORT shift = TRANS_SHIFT(number); *byte &= ~(TRA_MASK << shift); if (tip->tip_next) *byte |= tra_committed << shift; else *byte |= tra_active << shift; } } #endif CCH_RELEASE(tdbb, &window); } #ifdef SUPERSERVER_V2 window.win_page = inventory_page(tdbb, last); tx_inv_page* tip = (tx_inv_page*) CCH_FETCH(tdbb, &window, LCK_write, pag_transactions); while (tip->tip_next) { CCH_RELEASE(tdbb, &window); window.win_page = inventory_page(tdbb, ++last); tip = (tx_inv_page*) CCH_FETCH(tdbb, &window, LCK_write, pag_transactions); CCH_MARK(tdbb, &window); for (number = 0; number < trans_per_tip; number++) { const ULONG trans_offset = TRANS_OFFSET(number); UCHAR* byte = tip->tip_transactions + trans_offset; const USHORT shift = TRANS_SHIFT(number); *byte &= ~(TRA_MASK << shift); if (tip->tip_next || !number) *byte |= tra_committed << shift; else *byte |= tra_active << shift; } if (!tip->tip_next) dbb->dbb_next_transaction = (TraNumber) last * trans_per_tip; } CCH_RELEASE(tdbb, &window); #endif } void TRA_commit(thread_db* tdbb, jrd_tra* transaction, const bool retaining_flag) { /************************************** * * T R A _ c o m m i t * ************************************** * * Functional description * Commit a transaction. * **************************************/ SET_TDBB(tdbb); TraceTransactionEnd trace(transaction, true, retaining_flag); EDS::Transaction::jrdTransactionEnd(tdbb, transaction, true, retaining_flag, false); jrd_tra* const sysTran = tdbb->getAttachment()->getSysTransaction(); // If this is a commit retaining, and no updates have been performed, // and no events have been posted (via stored procedures etc) // no-op the operation. if (retaining_flag && !((transaction->tra_flags & TRA_write) || transaction->tra_deferred_job)) { if (sysTran->tra_flags & TRA_write) transaction_flush(tdbb, FLUSH_SYSTEM, 0); transaction->tra_flags &= ~TRA_prepared; // Get rid of all user savepoints while (transaction->tra_save_point && !transaction->tra_save_point->isRoot()) transaction->rollforwardSavepoint(tdbb); trace.finish(ITracePlugin::RESULT_SUCCESS); return; } if (transaction->tra_flags & TRA_invalidated) ERR_post(Arg::Gds(isc_trans_invalid)); Jrd::ContextPoolHolder context(tdbb, transaction->tra_pool); // Perform any meta data work deferred if (!(transaction->tra_flags & TRA_prepared)) DFW_perform_work(tdbb, transaction); // Commit associated transaction in security DB SecDbContext* secContext = transaction->getSecDbContext(); if (secContext && secContext->tra) { LocalStatus ls; CheckStatusWrapper st(&ls); secContext->tra->commit(&st); if (st.getState() & IStatus::STATE_ERRORS) status_exception::raise(&st); secContext->tra = NULL; Mapping::clearCache(tdbb->getDatabase()->dbb_config->getSecurityDatabase(), Mapping::MAPPING_CACHE); transaction->eraseSecDbContext(); } if (transaction->tra_flags & (TRA_prepare2 | TRA_reconnected)) MET_update_transaction(tdbb, transaction, true); // Flush pages if transaction logically modified data if (transaction->tra_flags & TRA_write) { // Get rid of user savepoints to allow intermediate garbage collection // in indices and BLOBs after in-place updates while (transaction->tra_save_point) { transaction->rollforwardSavepoint(tdbb); } transaction_flush(tdbb, FLUSH_TRAN, transaction->tra_number); } else if ((transaction->tra_flags & (TRA_prepare2 | TRA_reconnected)) || (sysTran->tra_flags & TRA_write)) { // If the transaction only read data but is a member of a // multi-database transaction with a transaction description // message then flush RDB$TRANSACTIONS. transaction_flush(tdbb, FLUSH_SYSTEM, 0); } if (retaining_flag) { trace.finish(ITracePlugin::RESULT_SUCCESS); retain_context(tdbb, transaction, true, tra_committed); return; } // Set the state on the inventory page to be committed TRA_set_state(tdbb, transaction, transaction->tra_number, tra_committed); // Perform any post commit work DFW_perform_post_commit_work(transaction); // notify any waiting locks that this transaction is committing; // there could be no lock if this transaction is being reconnected ++transaction->tra_use_count; Lock* lock = transaction->tra_lock; if (lock && (lock->lck_logical < LCK_write)) LCK_convert(tdbb, lock, LCK_write, LCK_WAIT); --transaction->tra_use_count; TRA_release_transaction(tdbb, transaction, &trace); } void TRA_extend_tip(thread_db* tdbb, ULONG sequence) //, WIN* precedence_window) { /************************************** * * T R A _ e x t e n d _ t i p * ************************************** * * Functional description * Allocate and link in new TIP (transaction inventory page). * This is called from TRA_start and from validate/repair. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // Start by fetching prior transaction page, if any tx_inv_page* prior_tip = NULL; WIN prior_window(DB_PAGE_SPACE, -1); if (sequence) prior_tip = fetch_inventory_page(tdbb, &prior_window, (sequence - 1), LCK_write); // Allocate and format new page WIN window(DB_PAGE_SPACE, -1); tx_inv_page* tip = (tx_inv_page*) DPM_allocate(tdbb, &window); tip->tip_header.pag_type = pag_transactions; CCH_must_write(tdbb, &window); CCH_RELEASE(tdbb, &window); // Release prior page if (sequence) { CCH_MARK_MUST_WRITE(tdbb, &prior_window); prior_tip->tip_next = window.win_page.getPageNum(); CCH_RELEASE(tdbb, &prior_window); } // Link into internal data structures vcl* vector = dbb->dbb_t_pages = vcl::newVector(*dbb->dbb_permanent, dbb->dbb_t_pages, sequence + 1); (*vector)[sequence] = window.win_page.getPageNum(); // Write into pages relation DPM_pages(tdbb, 0, pag_transactions, sequence, window.win_page.getPageNum()); } int TRA_fetch_state(thread_db* tdbb, TraNumber number) { /************************************** * * T R A _ f e t c h _ s t a t e * ************************************** * * Functional description * Physically fetch the state of a given * transaction on the transaction inventory * page. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // locate and fetch the proper TIP page const ULONG trans_per_tip = dbb->dbb_page_manager.transPerTIP; const ULONG tip_seq = number / trans_per_tip; WIN window(DB_PAGE_SPACE, -1); const tx_inv_page* tip = fetch_inventory_page(tdbb, &window, tip_seq, LCK_read); // calculate the state of the desired transaction const ULONG byte = TRANS_OFFSET(number % trans_per_tip); const USHORT shift = TRANS_SHIFT(number); const int state = (tip->tip_transactions[byte] >> shift) & TRA_MASK; CCH_RELEASE(tdbb, &window); return state; } void TRA_get_inventory(thread_db* tdbb, UCHAR* bit_vector, TraNumber base, TraNumber top) { /************************************** * * T R A _ g e t _ i n v e n t o r y * ************************************** * * Functional description * Get an inventory of the state of all transactions * between the base and top (included) transactions passed. * To get a consistent view of the transaction * inventory (in case we ever implement sub-transactions), * do handoffs to read the pages in order. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // It does not make sence to call this function without bit_vector now fb_assert(bit_vector); const ULONG trans_per_tip = dbb->dbb_page_manager.transPerTIP; ULONG sequence = base / trans_per_tip; const ULONG last = top / trans_per_tip; // fetch the first inventory page WIN window(DB_PAGE_SPACE, -1); const tx_inv_page* tip = fetch_inventory_page(tdbb, &window, sequence++, LCK_read); // move the first page into the bit vector UCHAR* p = bit_vector; ULONG l = base % trans_per_tip; const UCHAR* q = tip->tip_transactions + TRANS_OFFSET(l); l = TRANS_OFFSET(MIN((top + TRA_MASK + 1 - base), trans_per_tip - l)); memcpy(p, q, l); p += l; // move successive pages into the bit vector while (sequence <= last) { base = (TraNumber) sequence * trans_per_tip; // release the read lock as we go, so that some one else can // commit without having to signal all other transactions. tip = (tx_inv_page*) CCH_HANDOFF(tdbb, &window, inventory_page(tdbb, sequence++), LCK_read, pag_transactions); l = TRANS_OFFSET(MIN((top + TRA_MASK + 1 - base), trans_per_tip)); memcpy(p, tip->tip_transactions, l); p += l; } CCH_RELEASE(tdbb, &window); } int TRA_get_state(thread_db* tdbb, TraNumber number) { /************************************** * * T R A _ g e t _ s t a t e * ************************************** * * Functional description * Get the state of a given transaction on the * transaction inventory page. * **************************************/ return TPC_snapshot_state(tdbb, number); } #ifdef SUPERSERVER_V2 void TRA_header_write(thread_db* tdbb, Database* dbb, TraNumber number) { /************************************** * * T R A _ h e a d e r _ w r i t e * ************************************** * * Functional description * Force transaction ID on header to disk. * Do post fetch check of the transaction * ID header write as a concurrent thread * might have written the header page * while blocked on the latch. * * The idea is to amortize the cost of * header page I/O across multiple transactions. * **************************************/ SET_TDBB(tdbb); // If transaction number is already on disk just return. if (!number || dbb->dbb_last_header_write < number) { WIN window(HEADER_PAGE_NUMBER); header_page* header = (header_page*) CCH_FETCH(tdbb, &window, LCK_write, pag_header); const TraNumber next_transaction = Ods::getNT(header); const TraNumber oldest_active = Ods::getOAT(header); const TraNumber oldest_transaction = Ods::getOIT(header); const TraNumber oldest_snapshot = Ods::getOST(header); if (next_transaction) { if (oldest_active > next_transaction) BUGCHECK(266); //next transaction older than oldest active if (oldest_transaction > next_transaction) BUGCHECK(267); // next transaction older than oldest transaction } // The header page might have been written while waiting // for the latch; perform a post fetch check and optimize // this case by not writing the page again. if (!number || dbb->dbb_last_header_write < number) { CCH_MARK_MUST_WRITE(tdbb, &window); if (dbb->dbb_next_transaction > next_transaction) Ods::writeNT(header, dbb->dbb_next_transaction); if (dbb->dbb_oldest_active > oldest_active) Ods::writeOAT(header, dbb->dbb_oldest_active); if (dbb->dbb_oldest_transaction > oldest_transaction) Ods::writeOIT(header, dbb->dbb_oldest_transaction); if (dbb->dbb_oldest_snapshot > oldest_snapshot) Ods::writeOST(header, dbb->dbb_oldest_snapshot); } CCH_RELEASE(tdbb, &window); } } #endif void TRA_init(Jrd::Attachment* attachment) { /************************************** * * T R A _ i n i t * ************************************** * * Functional description * "Start" the system transaction. * **************************************/ Database* dbb = attachment->att_database; CHECK_DBB(dbb); MemoryPool* const pool = dbb->dbb_permanent; jrd_tra* const trans = FB_NEW_POOL(*pool) jrd_tra(pool, &dbb->dbb_memory_stats, NULL, NULL); trans->tra_attachment = attachment; attachment->setSysTransaction(trans); trans->tra_flags |= TRA_system | TRA_ignore_limbo; } void TRA_invalidate(thread_db* tdbb, ULONG mask) { /************************************** * * T R A _ i n v a l i d a t e * ************************************** * * Functional description * Invalidate any active transactions that may have * modified a page that couldn't be written. * **************************************/ Database* const database = tdbb->getDatabase(); EngineCheckout cout(tdbb, FB_FUNCTION, true); SyncLockGuard dbbSync(&database->dbb_sync, SYNC_SHARED, "TRA_invalidate"); Jrd::Attachment* attachment = database->dbb_attachments; while (attachment) { Jrd::Attachment::SyncGuard attGuard(attachment, FB_FUNCTION); for (jrd_tra* transaction = attachment->att_transactions; transaction; transaction = transaction->tra_next) { const ULONG transaction_mask = 1L << (transaction->tra_number & (BITS_PER_LONG - 1)); if ((transaction_mask & mask) && (transaction->tra_flags & TRA_write)) transaction->tra_flags |= TRA_invalidated; } attachment = attachment->att_next; } } void TRA_link_cursor(jrd_tra* transaction, DsqlCursor* cursor) { /************************************** * * T R A _ l i n k _ c u r s o r * ************************************** * * Functional description * Add cursor to the list of open cursors belonging to this transaction. * **************************************/ fb_assert(!transaction->tra_open_cursors.exist(cursor)); transaction->tra_open_cursors.add(cursor); } void TRA_unlink_cursor(jrd_tra* transaction, DsqlCursor* cursor) { /************************************** * * T R A _ u n l i n k _ c u r s o r * ************************************** * * Functional description * Remove cursor from the list of open cursors. * **************************************/ FB_SIZE_T pos; if (transaction->tra_open_cursors.find(cursor, pos)) transaction->tra_open_cursors.remove(pos); } void TRA_update_counters(thread_db* tdbb, Database* dbb) { /************************************** * * T R A _ u p d a t e _ c o u n t e r s * ************************************** * * Functional description * Update header page using cached values of transactions counters * **************************************/ SET_TDBB(tdbb); if (!dbb || dbb->dbb_flags & DBB_read_only || dbb->dbb_flags & DBB_new || dbb->dbb_oldest_transaction == 0) { return; } WIN window(HEADER_PAGE_NUMBER); header_page* header = (header_page*)CCH_FETCH(tdbb, &window, LCK_write, pag_header); const TraNumber next_transaction = Ods::getNT(header); const TraNumber oldest_transaction = Ods::getOIT(header); const TraNumber oldest_active = Ods::getOAT(header); const TraNumber oldest_snapshot = Ods::getOST(header); fb_assert(dbb->dbb_next_transaction <= next_transaction); if (dbb->dbb_oldest_active > oldest_active || dbb->dbb_oldest_transaction > oldest_transaction || dbb->dbb_oldest_snapshot > oldest_snapshot || dbb->dbb_next_transaction > next_transaction) { CCH_MARK_MUST_WRITE(tdbb, &window); if (dbb->dbb_oldest_active > header->hdr_oldest_active) Ods::writeOAT(header, dbb->dbb_oldest_active); if (dbb->dbb_oldest_transaction > header->hdr_oldest_transaction) Ods::writeOIT(header, dbb->dbb_oldest_transaction); if (dbb->dbb_oldest_snapshot > header->hdr_oldest_snapshot) Ods::writeOST(header, dbb->dbb_oldest_snapshot); if (dbb->dbb_next_transaction > next_transaction) Ods::writeNT(header, dbb->dbb_next_transaction); } CCH_RELEASE(tdbb, &window); } void TRA_post_resources(thread_db* tdbb, jrd_tra* transaction, ResourceList& resources) { /************************************** * * T R A _ p o s t _ r e s o u r c e s * ************************************** * * Functional description * Post interest in relation/procedure/collation existence to transaction. * This guarantees that the relation/procedure/collation won't be dropped * out from under the transaction. * **************************************/ SET_TDBB(tdbb); Jrd::ContextPoolHolder context(tdbb, transaction->tra_pool); for (Resource* rsc = resources.begin(); rsc < resources.end(); rsc++) { if (rsc->rsc_type == Resource::rsc_relation || rsc->rsc_type == Resource::rsc_procedure || rsc->rsc_type == Resource::rsc_function || rsc->rsc_type == Resource::rsc_collation) { FB_SIZE_T i; if (!transaction->tra_resources.find(*rsc, i)) { transaction->tra_resources.insert(i, *rsc); switch (rsc->rsc_type) { case Resource::rsc_relation: MET_post_existence(tdbb, rsc->rsc_rel); if (rsc->rsc_rel->rel_file) { EXT_tra_attach(rsc->rsc_rel->rel_file, transaction); } break; case Resource::rsc_procedure: case Resource::rsc_function: rsc->rsc_routine->addRef(); #ifdef DEBUG_PROCS { char buffer[256]; sprintf(buffer, "Called from TRA_post_resources():\n\t Incrementing use count of %s\n", rsc->rsc_routine->prc_name->c_str()); JRD_print_procedure_info(tdbb, buffer); } #endif break; case Resource::rsc_collation: rsc->rsc_coll->incUseCount(tdbb); break; default: // shut up compiler warning break; } } } } } bool TRA_is_active(thread_db* tdbb, TraNumber number) { /************************************** * * T R A _ i s _ a c t i v e * ************************************** * * Functional description * Returns whether a given transaction * owned by some other guy active or not. * * If function return false - you can trust this value and be sure that transaction * is not active. However if function returns true - it might be inactive already, * but two engine threads are checking for its status at once. Callers need to * behave correctly when facing this behavior. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); Lock temp_lock(tdbb, sizeof(TraNumber), LCK_tra); temp_lock.setKey(number); // If we can't get a lock on the transaction, it must be active if (!LCK_lock(tdbb, &temp_lock, LCK_read, LCK_NO_WAIT)) { fb_utils::init_status(tdbb->tdbb_status_vector); return true; } LCK_release(tdbb, &temp_lock); return false; } void TRA_prepare(thread_db* tdbb, jrd_tra* transaction, USHORT length, const UCHAR* msg) { /************************************** * * T R A _ p r e p a r e * ************************************** * * Functional description * Put a transaction into limbo. * **************************************/ SET_TDBB(tdbb); if (transaction->tra_flags & TRA_prepared) return; if (transaction->tra_flags & TRA_invalidated) ERR_post(Arg::Gds(isc_trans_invalid)); /* If there's a transaction description message, log it to RDB$TRANSACTION We should only log a message to RDB$TRANSACTION if there is a message to log (if the length = 0, we won't log the transaction in RDB$TRANSACTION) These messages are used to recover transactions in limbo. The message indicates the action that is to be performed (hence, if nothing is getting logged, don't bother). */ /* Make sure that if msg is NULL there is no length. The two should go hand in hand msg == NULL || *msg == NULL */ fb_assert(!(!msg && length) || (msg && (!*msg && length))); if (msg && length) { MET_prepare(tdbb, transaction, length, msg); transaction->tra_flags |= TRA_prepare2; } // Prepare associated transaction in security DB SecDbContext* secContext = transaction->getSecDbContext(); if (secContext && secContext->tra) { LocalStatus ls; CheckStatusWrapper st(&ls); secContext->tra->prepare(&st, length, msg); if (st.getState() & IStatus::STATE_ERRORS) status_exception::raise(&st); } // Perform any meta data work deferred DFW_perform_work(tdbb, transaction); // Flush pages if transaction logically modified data jrd_tra* sysTran = tdbb->getAttachment()->getSysTransaction(); if (transaction->tra_flags & TRA_write) transaction_flush(tdbb, FLUSH_TRAN, transaction->tra_number); else if ((transaction->tra_flags & TRA_prepare2) || (sysTran->tra_flags & TRA_write)) { // If the transaction only read data but is a member of a // multi-database transaction with a transaction description // message then flush RDB$TRANSACTIONS. transaction_flush(tdbb, FLUSH_SYSTEM, 0); } // Set the state on the inventory page to be limbo transaction->tra_flags |= TRA_prepared; TRA_set_state(tdbb, transaction, transaction->tra_number, tra_limbo); } jrd_tra* TRA_reconnect(thread_db* tdbb, const UCHAR* id, USHORT length) { /************************************** * * T R A _ r e c o n n e c t * ************************************** * * Functional description * Reconnect to a transaction in limbo. * **************************************/ SET_TDBB(tdbb); Database* const dbb = tdbb->getDatabase(); CHECK_DBB(dbb); Jrd::Attachment* const attachment = tdbb->getAttachment(); // Cannot work on limbo transactions for ReadOnly database if (dbb->readOnly()) ERR_post(Arg::Gds(isc_read_only_database)); const TraNumber number = isc_portable_integer(id, length); if (number > dbb->dbb_next_transaction) PAG_header(tdbb, true); const int state = (number > dbb->dbb_next_transaction) ? 255 : limbo_transaction(tdbb, number); if (state != tra_limbo) { USHORT message; switch (state) { case tra_active: message = 262; // ACTIVE break; case tra_dead: message = 264; // ROLLED BACK break; case tra_committed: message = 263; // COMMITTED break; default: message = 265; // ILL DEFINED break; } TEXT text[128]; USHORT flags = 0; gds__msg_lookup(NULL, JRD_BUGCHK, message, sizeof(text), text, &flags); ERR_post(Arg::Gds(isc_no_recon) << Arg::Gds(isc_tra_state) << Arg::Num(number) << Arg::Str(text)); } MemoryPool* const pool = attachment->createPool(); Jrd::ContextPoolHolder context(tdbb, pool); jrd_tra* const trans = jrd_tra::create(pool, attachment, NULL); trans->tra_number = number; trans->tra_flags |= TRA_prepared | TRA_reconnected | TRA_write; trans->linkToAttachment(attachment); return trans; } void TRA_release_transaction(thread_db* tdbb, jrd_tra* transaction, Jrd::TraceTransactionEnd* trace) { /************************************** * * T R A _ r e l e a s e _ t r a n s a c t i o n * ************************************** * * Functional description * Cleanup a transaction. This is called by both COMMIT and * ROLLBACK as well as code in JRD to get rid of remote * transactions. * **************************************/ SET_TDBB(tdbb); Jrd::Attachment* const attachment = tdbb->getAttachment(); Database* const dbb = tdbb->getDatabase(); CHECK_DBB(dbb); if (!transaction->tra_outer) { if (transaction->tra_blobs->getFirst()) { while (true) { BlobIndex *current = &transaction->tra_blobs->current(); if (current->bli_materialized) { if (!transaction->tra_blobs->getNext()) break; } else { ULONG temp_id = current->bli_temp_id; current->bli_blob_object->BLB_cancel(tdbb); if (!transaction->tra_blobs->locate(Firebird::locGreat, temp_id)) break; } } } while (transaction->tra_arrays) blb::release_array(transaction->tra_arrays); } if (transaction->tra_pool) { // Iterate the doubly linked list of requests for transaction and null out the transaction references while (transaction->tra_requests) TRA_detach_request(transaction->tra_requests); } // Release interest in relation/procedure existence for transaction for (Resource* rsc = transaction->tra_resources.begin(); rsc < transaction->tra_resources.end(); rsc++) { switch (rsc->rsc_type) { case Resource::rsc_relation: MET_release_existence(tdbb, rsc->rsc_rel); if (rsc->rsc_rel->rel_file) { EXT_tra_detach(rsc->rsc_rel->rel_file, transaction); } break; case Resource::rsc_procedure: case Resource::rsc_function: rsc->rsc_routine->release(tdbb); break; case Resource::rsc_collation: rsc->rsc_coll->decUseCount(tdbb); break; default: fb_assert(false); } } { // scope vec& rels = *attachment->att_relations; for (FB_SIZE_T i = 0; i < rels.count(); i++) { jrd_rel* relation = rels[i]; if (relation && (relation->rel_flags & REL_temp_tran)) relation->delPages(tdbb, transaction->tra_number); } } // end scope // Release the locks associated with the transaction vec* vector = transaction->tra_relation_locks; if (vector) { vec::iterator lock = vector->begin(); for (ULONG i = 0; i < vector->count(); ++i, ++lock) { if (*lock) LCK_release(tdbb, *lock); } } ++transaction->tra_use_count; if (transaction->tra_lock) LCK_release(tdbb, transaction->tra_lock); --transaction->tra_use_count; // release the sparse bit map used for commit retain transaction delete transaction->tra_commit_sub_trans; if (trace) trace->finish(ITracePlugin::RESULT_SUCCESS); // Unlink the transaction from the attachment block transaction->unlinkFromAttachment(); // Release transaction's under-modification-rpb list delete transaction->tra_rpblist; // Release the database snapshot, if any delete transaction->tra_mon_snapshot; // Close all open DSQL cursors while (transaction->tra_open_cursors.hasData()) DsqlCursor::close(tdbb, transaction->tra_open_cursors.pop()); if (!(transaction->tra_flags & TRA_read_committed)) { dbb->dbb_tip_cache->endSnapshot(tdbb, transaction->tra_snapshot_handle, transaction->tra_attachment->att_attachment_id); } // Release the transaction and its pool tdbb->setTransaction(NULL); JTransaction* jTra = transaction->getInterface(true); // ASF: maybe it's better to pass false? if (jTra) { jTra->setHandle(NULL); } jrd_tra::destroy(attachment, transaction); } void TRA_rollback(thread_db* tdbb, jrd_tra* transaction, const bool retaining_flag, const bool force_flag) { /************************************** * * T R A _ r o l l b a c k * ************************************** * * Functional description * Rollback a transaction. * **************************************/ SET_TDBB(tdbb); TraceTransactionEnd trace(transaction, false, retaining_flag); EDS::Transaction::jrdTransactionEnd(tdbb, transaction, false, retaining_flag, false /*force_flag ?*/); Jrd::ContextPoolHolder context(tdbb, transaction->tra_pool); if (transaction->tra_flags & (TRA_prepare2 | TRA_reconnected)) MET_update_transaction(tdbb, transaction, false); // If force flag is true, get rid of all savepoints to mark the transaction as dead if (force_flag || (transaction->tra_flags & TRA_invalidated)) { // Free all savepoint data // Undo data space and BLOBs will be released in destructor Savepoint::destroy(transaction->tra_save_point); fb_assert(!transaction->tra_save_point); } else { // Remove undo data for GTT ON COMMIT DELETE ROWS as their data will be released // at transaction end anyway and we don't need to waste time backing it out for (Savepoint::Iterator iter(transaction->tra_save_point); *iter; ++iter) (*iter)->cleanupTempData(); } int state = tra_dead; if (transaction->tra_save_point) { // Make sure that any error during savepoint undo is handled by marking // the transaction as dead. try { // Release all user savepoints except transaction one // It will clean up blob ids and temporary space anyway but faster than rollback // because record data won't be updated with intermediate versions while (transaction->tra_save_point && !transaction->tra_save_point->isRoot()) transaction->rollforwardSavepoint(tdbb); if (transaction->tra_save_point) // we still can use undo log for rollback, it wasn't reset because of no_auto_undo flag or size { // In an attempt to avoid deadlocks, clear the precedence by writing // all dirty buffers for this transaction. if (transaction->tra_flags & TRA_write) { transaction_flush(tdbb, FLUSH_TRAN, transaction->tra_number); transaction->rollbackSavepoint(tdbb); transaction_flush(tdbb, FLUSH_TRAN, transaction->tra_number); } else transaction->rollbackSavepoint(tdbb); // All changes are undone, so we may mark the transaction // as committed state = tra_committed; } } catch (const Firebird::Exception&) { // Prevent a bugcheck in TRA_set_state to cause a loop // Clear the error because the rollback will succeed. fb_utils::init_status(tdbb->tdbb_status_vector); } } else if (!(transaction->tra_flags & TRA_write)) { // There were no changes within the transaction, so we may mark it // as committed state = tra_committed; } jrd_tra* const sysTran = tdbb->getAttachment()->getSysTransaction(); if (sysTran->tra_flags & TRA_write) transaction_flush(tdbb, FLUSH_SYSTEM, 0); // If this is a rollback retain abort this transaction and start a new one. if (retaining_flag) { trace.finish(ITracePlugin::RESULT_SUCCESS); retain_context(tdbb, transaction, false, state); return; } TRA_set_state(tdbb, transaction, transaction->tra_number, state); TRA_release_transaction(tdbb, transaction, &trace); } void TRA_set_state(thread_db* tdbb, jrd_tra* transaction, TraNumber number, int state) { /************************************** * * T R A _ s e t _ s t a t e * ************************************** * * Functional description * Set the state of a transaction in the inventory page. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // If it is a ReadOnly DB, set the new state in the TIP cache and return if (dbb->readOnly() && dbb->dbb_tip_cache) { TPC_set_state(tdbb, number, state); return; } // If we're terminating ourselves and we've been precommitted then just return. if (transaction && transaction->tra_number == number && (transaction->tra_flags & TRA_precommitted)) { return; } const ULONG trans_per_tip = dbb->dbb_page_manager.transPerTIP; const ULONG sequence = number / trans_per_tip; const ULONG byte = TRANS_OFFSET(number % trans_per_tip); const USHORT shift = TRANS_SHIFT(number); WIN window(DB_PAGE_SPACE, -1); tx_inv_page* tip = fetch_inventory_page(tdbb, &window, sequence, LCK_write); UCHAR* address = tip->tip_transactions + byte; const int old_state = ((*address) >> shift) & TRA_MASK; #ifdef SUPERSERVER_V2 CCH_MARK(tdbb, &window); const ULONG generation = tip->tip_header.pag_generation; #else if (!(dbb->dbb_flags & DBB_shared) || !transaction || (transaction->tra_flags & TRA_write) || old_state != tra_active || state != tra_committed) { CCH_MARK_MUST_WRITE(tdbb, &window); } else CCH_MARK(tdbb, &window); #endif // set the state on the TIP page *address &= ~(TRA_MASK << shift); *address |= state << shift; // set the new state in the TIP cache as well if (dbb->dbb_tip_cache) TPC_set_state(tdbb, number, state); CCH_RELEASE(tdbb, &window); #ifdef SUPERSERVER_V2 // Let the TIP be lazily updated for read-only queries. // To amortize write of TIP page for update transactions, // exit engine to allow other transactions to update the TIP // and use page generation to determine if page was written. if (transaction && !(transaction->tra_flags & TRA_write)) return; { //scope Database::Checkout dcoHolder(dbb, FB_FUNCTION); Thread::yield(); } tip = reinterpret_cast(CCH_FETCH(tdbb, &window, LCK_write, pag_transactions)); if (generation == tip->tip_header.pag_generation) CCH_MARK_MUST_WRITE(tdbb, &window); CCH_RELEASE(tdbb, &window); #endif } int TRA_snapshot_state(thread_db* tdbb, jrd_tra* trans, TraNumber number, CommitNumber *snapshot) { /************************************** * * T R A _ s n a p s h o t _ s t a t e * ************************************** * * Functional description * Get the state of a numbered transaction when a * transaction started. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // Inhibit intermediate GC by default if (snapshot) *snapshot = CN_ACTIVE; if (number == trans->tra_number) return tra_us; // If the transaction is older than the oldest // interesting transaction, it must be committed. if (number < trans->tra_oldest) { if (snapshot) *snapshot = trans->tra_active_snapshots.getSnapshotForVersion(CN_PREHISTORIC); return tra_committed; } // If the transaction is the system transaction, it is considered committed. if (number == TRA_system_transaction) { if (snapshot) *snapshot = trans->tra_active_snapshots.getSnapshotForVersion(CN_PREHISTORIC); return tra_committed; } // Determine transaction state and commit number if any int state; CommitNumber stateCn = CN_PREHISTORIC; if (TipCache* tip_cache = dbb->dbb_tip_cache) { stateCn = tip_cache->snapshotState(tdbb, number); switch(stateCn) { case CN_ACTIVE: state = tra_active; break; case CN_LIMBO: state = tra_limbo; break; case CN_DEAD: state = tra_dead; break; default: state = tra_committed; if (snapshot) *snapshot = trans->tra_active_snapshots.getSnapshotForVersion(stateCn); break; } } else state = TRA_fetch_state(tdbb, number); // If the transaction is a committed sub-transction - do the easy lookup. if (trans->tra_commit_sub_trans && trans->tra_commit_sub_trans->test(number)) return tra_committed; if (trans->tra_flags & TRA_read_committed) { if ((trans->tra_flags & TRA_read_consistency) && state == tra_committed) { // GC thread accesses data directly without any request if (jrd_req* current_request = tdbb->getRequest()) { // There is no request snapshot when we build expression index if (jrd_req* snapshot_request = current_request->req_snapshot_owner) { if (stateCn > snapshot_request->req_snapshot_number) return tra_active; } } } return state; } // The system transaction can read data from active transactions. if (trans->tra_flags & TRA_system) { if (state == tra_active) return tra_committed; return state; } if (state == tra_committed && stateCn > trans->tra_snapshot_number) return tra_active; return state; } jrd_tra* TRA_start(thread_db* tdbb, ULONG flags, SSHORT lock_timeout, Jrd::jrd_tra* outer) { /************************************** * * T R A _ s t a r t * ************************************** * * Functional description * Start a user transaction. * **************************************/ SET_TDBB(tdbb); Database* const dbb = tdbb->getDatabase(); Jrd::Attachment* const attachment = tdbb->getAttachment(); if (dbb->dbb_ast_flags & DBB_shut_tran) { ERR_post(Arg::Gds(isc_shutinprog) << Arg::Str(attachment->att_filename)); } // To handle the problems of relation locks, allocate a temporary // transaction block first, seize relation locks, then go ahead and // make up the real transaction block. MemoryPool* const pool = outer ? outer->getAutonomousPool() : attachment->createPool(); Jrd::ContextPoolHolder context(tdbb, pool); jrd_tra* const transaction = jrd_tra::create(pool, attachment, outer); transaction->tra_flags = flags & TRA_OPTIONS_MASK; transaction->tra_lock_timeout = lock_timeout; try { transaction_start(tdbb, transaction); } catch (const Exception&) { jrd_tra::destroy(attachment, transaction); throw; } if (attachment->att_trace_manager->needs(ITraceFactory::TRACE_EVENT_TRANSACTION_START)) { TraceConnectionImpl conn(attachment); TraceTransactionImpl tran(transaction); attachment->att_trace_manager->event_transaction_start(&conn, &tran, 0, NULL, ITracePlugin::RESULT_SUCCESS); } return transaction; } jrd_tra* TRA_start(thread_db* tdbb, int tpb_length, const UCHAR* tpb, Jrd::jrd_tra* outer) { /************************************** * * T R A _ s t a r t * ************************************** * * Functional description * Start a user transaction. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); Jrd::Attachment* attachment = tdbb->getAttachment(); if (dbb->dbb_ast_flags & DBB_shut_tran) { ERR_post(Arg::Gds(isc_shutinprog) << Arg::Str(attachment->att_filename)); } // To handle the problems of relation locks, allocate a temporary // transaction block first, seize relation locks, then go ahead and // make up the real transaction block. MemoryPool* const pool = outer ? outer->getAutonomousPool() : attachment->createPool(); Jrd::ContextPoolHolder context(tdbb, pool); jrd_tra* const transaction = jrd_tra::create(pool, attachment, outer); try { transaction_options(tdbb, transaction, tpb, tpb_length); transaction_start(tdbb, transaction); } catch (const Exception&) { jrd_tra::destroy(attachment, transaction); throw; } if (attachment->att_trace_manager->needs(ITraceFactory::TRACE_EVENT_TRANSACTION_START)) { TraceConnectionImpl conn(attachment); TraceTransactionImpl tran(transaction); attachment->att_trace_manager->event_transaction_start(&conn, &tran, tpb_length, tpb, ITracePlugin::RESULT_SUCCESS); } return transaction; } int TRA_state(const UCHAR* bit_vector, TraNumber oldest, TraNumber number) { /************************************** * * T R A _ s t a t e * ************************************** * * Functional description * Get the state of a transaction from a cached * bit vector. * NOTE: This code is reproduced elsewhere in * this module for speed. If changes are made * to this code make them in the replicated code also. * **************************************/ const TraNumber base = oldest & ~TRA_MASK; const ULONG byte = TRANS_OFFSET(number - base); const USHORT shift = TRANS_SHIFT(number); return (bit_vector[byte] >> shift) & TRA_MASK; } void TRA_sweep(thread_db* tdbb) { /************************************** * * T R A _ s w e e p * ************************************** * * Functional description * Make a garbage collection pass thru database. * **************************************/ SET_TDBB(tdbb); Database* const dbb = tdbb->getDatabase(); CHECK_DBB(dbb); if (!dbb->allowSweepRun(tdbb)) { dbb->clearSweepFlags(tdbb); return; } fb_assert(dbb->dbb_flags & DBB_sweep_in_progress); Jrd::Attachment* const attachment = tdbb->getAttachment(); jrd_tra* const tdbb_old_trans = tdbb->getTransaction(); jrd_tra* transaction = NULL; // Clean up the temporary locks we've gotten in case anything goes wrong try { // Identify ourselves as a sweeper thread. This accomplishes two goals: // 1) Sweep transaction is started "precommitted" and // 2) Execution is throttled in JRD_reschedule() by // yielding the processor when our quantum expires. tdbb->tdbb_flags |= TDBB_sweeper; TraceSweepEvent traceSweep(tdbb); // Start a transaction, if necessary, to perform the sweep. // Save the transaction's oldest snapshot as it is refreshed // during the course of the database sweep. Since it is used // below to advance the OIT we must save it before it changes. transaction = TRA_start(tdbb, sizeof(sweep_tpb), sweep_tpb); TraNumber transaction_oldest_active = transaction->tra_oldest_active; tdbb->setTransaction(transaction); // The garbage collector runs asynchronously with respect to // our database sweep. This isn't good enough since we must // be absolutely certain that all dead transactions have been // swept from the database before advancing the OIT. Turn off // the "notify garbage collector" flag for the attachment and // synchronously perform the garbage collection ourselves. attachment->att_flags &= ~ATT_notify_gc; if (VIO_sweep(tdbb, transaction, &traceSweep)) { // At this point, we know that no record versions belonging to dead // transactions remain anymore. However, there may still be limbo // transactions, so we need to find the oldest one between tra_oldest and tra_top. // As our transaction is read-committed (see sweep_tpb), we have to scan // the global TIP cache. int oldest_state = 0; const TraNumber oldest_limbo = TPC_find_states(tdbb, transaction->tra_oldest, transaction->tra_top - 1, 1 << tra_limbo, oldest_state); const TraNumber active = oldest_limbo ? oldest_limbo : transaction->tra_top; // Flush page buffers to insure that no dangling records from // dead transactions are left on-disk. This must be done before // the OIT is advanced and the header page is written to disk. // If the header page was written before flushing the page buffers // and there was a server crash, the dead records would appear // committed since their TID would now be less than the OIT recorded // in the database. CCH_flush(tdbb, FLUSH_SWEEP, 0); WIN window(HEADER_PAGE_NUMBER); header_page* const header = (header_page*) CCH_FETCH(tdbb, &window, LCK_write, pag_header); if (Ods::getOIT(header) < --transaction_oldest_active) { CCH_MARK_MUST_WRITE(tdbb, &window); Ods::writeOIT(header, MIN(active, transaction_oldest_active)); } traceSweep.update(header); CCH_RELEASE(tdbb, &window); traceSweep.finish(); } TRA_commit(tdbb, transaction, false); tdbb->tdbb_flags &= ~TDBB_sweeper; tdbb->setTransaction(tdbb_old_trans); dbb->clearSweepFlags(tdbb); } // try catch (const Firebird::Exception& ex) { iscLogException("Error during sweep:", ex); ex.stuffException(tdbb->tdbb_status_vector); if (transaction) { try { TRA_commit(tdbb, transaction, false); } catch (const Firebird::Exception& ex2) { ex2.stuffException(tdbb->tdbb_status_vector); } } tdbb->tdbb_flags &= ~TDBB_sweeper; tdbb->setTransaction(tdbb_old_trans); dbb->clearSweepFlags(tdbb); throw; } } int TRA_wait(thread_db* tdbb, jrd_tra* trans, TraNumber number, jrd_tra::wait_t wait) { /************************************** * * T R A _ w a i t * ************************************** * * Functional description * Wait for a given transaction to drop into a stable state (i.e. non-active) * state. To do this, we first wait on the transaction number. When we * are able to get the lock, the transaction is not longer bona fide * active. Next, we determine the state of the transaction from the * transaction inventory page. If either committed, dead, or limbo, * we return the state. If the transaction is still marked active, * however, declare the transaction dead, and mark the transaction * inventory page accordingly. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // Create, wait on, and release lock on target transaction. If // we can't get the lock due to deadlock if (wait != jrd_tra::tra_no_wait) { Lock temp_lock(tdbb, sizeof(TraNumber), LCK_tra); temp_lock.setKey(number); const SSHORT timeout = (wait == jrd_tra::tra_wait) ? trans->getLockWait() : 0; if (!LCK_lock(tdbb, &temp_lock, LCK_read, timeout)) { fb_utils::init_status(tdbb->tdbb_status_vector); return tra_active; } LCK_release(tdbb, &temp_lock); } int state = TRA_get_state(tdbb, number); if (wait != jrd_tra::tra_no_wait && state == tra_committed) return state; if (state == tra_precommitted) return state; // If the recorded state of the transaction is active, we know better. If // it were active, he'd be alive now. Mark him dead. if (state == tra_active) { state = tra_dead; TRA_set_state(tdbb, 0, number, tra_dead); } // If the transaction disappeared into limbo, died, for constructively // died, tweak the transaction state snapshot to reflect the new state. // This is guaranteed safe. TPC_set_state(tdbb, number, state); return state; } #ifdef SUPERSERVER_V2 static TraNumber bump_transaction_id(thread_db* tdbb, WIN* window) { /************************************** * * b u m p _ t r a n s a c t i o n _ i d * ************************************** * * Functional description * Fetch header and bump next transaction id. If necessary, * extend TIP. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); if (dbb->dbb_next_transaction >= MAX_TRA_NUMBER - 1) { CCH_RELEASE(tdbb, window); ERR_post(Arg::Gds(isc_imp_exc) << Arg::Gds(isc_tra_num_exc)); } const TraNumber number = ++dbb->dbb_next_transaction; dbb->assignLastestTransactionId(number); // No need to write TID onto the TIP page, for a RO DB if (dbb->readOnly()) return number; // If this is the first transaction on a TIP, allocate the TIP now. // Note, first TIP page is created with the database itself, // see JProvider::createDatabase. const bool new_tip = ((number % dbb->dbb_page_manager.transPerTIP) == 0); if (new_tip) TRA_extend_tip(tdbb, (number / dbb->dbb_page_manager.transPerTIP)); //, window); return number; } #else static header_page* bump_transaction_id(thread_db* tdbb, WIN* window, bool dontWrite) { /************************************** * * b u m p _ t r a n s a c t i o n _ i d * ************************************** * * Functional description * Fetch header and bump next transaction id. If necessary, * extend TIP. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); window->win_page = HEADER_PAGE_NUMBER; header_page* header = (header_page*) CCH_FETCH(tdbb, window, LCK_write, pag_header); const TraNumber next_transaction = Ods::getNT(header); const TraNumber oldest_active = Ods::getOAT(header); const TraNumber oldest_transaction = Ods::getOIT(header); const TraNumber oldest_snapshot = Ods::getOST(header); // Before incrementing the next transaction Id, make sure the current one is valid if (next_transaction) { if (oldest_active > next_transaction) BUGCHECK(266); //next transaction older than oldest active if (oldest_transaction > next_transaction) BUGCHECK(267); // next transaction older than oldest transaction } if (next_transaction >= MAX_TRA_NUMBER - 1) { CCH_RELEASE(tdbb, window); ERR_post(Arg::Gds(isc_imp_exc) << Arg::Gds(isc_tra_num_exc)); } const TraNumber number = next_transaction + 1; // If this is the first transaction on a TIP, allocate the TIP now. // Note, first TIP page is created with the database itself, // see JProvider::createDatabase. const bool new_tip = ((number % dbb->dbb_page_manager.transPerTIP) == 0); if (new_tip) TRA_extend_tip(tdbb, (number / dbb->dbb_page_manager.transPerTIP)); //, window); // Extend, if necessary, has apparently succeeded. Next, update header page if (dontWrite && !new_tip) CCH_MARK(tdbb, window); else CCH_MARK_MUST_WRITE(tdbb, window); //dbb->assignLatestTransactionId(number); dbb->dbb_next_transaction = number; Ods::writeNT(header, number); if (dbb->dbb_oldest_active > oldest_active) Ods::writeOAT(header, dbb->dbb_oldest_active); if (dbb->dbb_oldest_transaction > oldest_transaction) Ods::writeOIT(header, dbb->dbb_oldest_transaction); if (dbb->dbb_oldest_snapshot > oldest_snapshot) Ods::writeOST(header, dbb->dbb_oldest_snapshot); return header; } #endif static void expand_view_lock(thread_db* tdbb, jrd_tra* transaction, jrd_rel* relation, UCHAR lock_type, const char* option_name, RelationLockTypeMap& lockmap, const int level) { /************************************** * * e x p a n d _ v i e w _ l o c k * ************************************** * * Functional description * A view in a RESERVING will lead to all tables in the * view being locked. * Some checks only apply when the user reserved directly the table or view. * **************************************/ SET_TDBB(tdbb); if (level == 30) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_max_recursion) << Arg::Num(30)); } const char* const relation_name = relation->rel_name.c_str(); // LCK_none < LCK_SR < LCK_PR < LCK_SW < LCK_EX UCHAR oldlock; const bool found = lockmap.get(relation->rel_id, oldlock); if (found && oldlock > lock_type) { const char* newname = get_lockname_v3(lock_type); const char* oldname = get_lockname_v3(oldlock); if (level) { lock_type = oldlock; // Preserve the old, more powerful lock. ERR_post_warning(Arg::Warning(isc_tpb_reserv_stronger_wng) << Arg::Str(relation_name) << Arg::Str(oldname) << Arg::Str(newname)); } else { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_stronger) << Arg::Str(relation_name) << Arg::Str(oldname) << Arg::Str(newname)); } } if (level == 0) { fb_assert(!relation->rel_view_rse && !relation->rel_view_contexts.getCount()); // Reject explicit attempts to take locks on virtual tables. if (relation->isVirtual()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_virtualtbl) << Arg::Str(relation_name)); } // Reject explicit attempts to take locks on system tables. if (relation->isSystem()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_systbl) << Arg::Str(relation_name)); } if (relation->isTemporary() && (lock_type == LCK_PR || lock_type == LCK_EX)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_temptbl) << Arg::Str(get_lockname_v3(LCK_PR)) << Arg::Str(get_lockname_v3(LCK_EX)) << Arg::Str(relation_name)); } } else { fb_assert(relation->rel_view_rse && relation->rel_view_contexts.getCount()); // Ignore implicit attempts to take locks on special tables through views. if (relation->isVirtual() || relation->isSystem()) return; // We can't propagate a view's LCK_PR or LCK_EX to a temporary table. if (relation->isTemporary()) { switch (lock_type) { case LCK_PR: lock_type = LCK_SR; break; case LCK_EX: lock_type = LCK_SW; break; } } } // set up the lock on the relation/view Lock* lock = RLCK_transaction_relation_lock(tdbb, transaction, relation); lock->lck_logical = lock_type; if (!found) *lockmap.put(relation->rel_id) = lock_type; const ViewContexts& ctx = relation->rel_view_contexts; for (FB_SIZE_T i = 0; i < ctx.getCount(); ++i) { if (ctx[i]->vcx_type == VCT_PROCEDURE) continue; jrd_rel* base_rel = MET_lookup_relation(tdbb, ctx[i]->vcx_relation_name); if (!base_rel) { // should be a BUGCHECK ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_baserelnotfound) << Arg::Str(ctx[i]->vcx_relation_name) << Arg::Str(relation_name) << Arg::Str(option_name)); } // force a scan to read view information MET_scan_relation(tdbb, base_rel); expand_view_lock(tdbb, transaction, base_rel, lock_type, option_name, lockmap, level + 1); } } static tx_inv_page* fetch_inventory_page(thread_db* tdbb, WIN* window, ULONG sequence, USHORT lock_level) { /************************************** * * f e t c h _ i n v e n t o r y _ p a g e * ************************************** * * Functional description * Fetch a transaction inventory page. * Use the opportunity to cache the info * in the TIP cache. * **************************************/ SET_TDBB(tdbb); window->win_page = inventory_page(tdbb, sequence); tx_inv_page* tip = (tx_inv_page*) CCH_FETCH(tdbb, window, lock_level, pag_transactions); return tip; } static const char* get_lockname_v3(const UCHAR lock) { /************************************** * * g e t _ l o c k n a m e _ v 3 * ************************************** * * Functional description * Get the lock mnemonic, given its binary value. * This is for TPB versions 1 & 3. * **************************************/ const char* typestr = "unknown"; switch (lock) { case LCK_none: case LCK_SR: typestr = "isc_tpb_lock_read, isc_tpb_shared"; break; case LCK_PR: typestr = "isc_tpb_lock_read, isc_tpb_protected/isc_tpb_exclusive"; break; case LCK_SW: typestr = "isc_tpb_lock_write, isc_tpb_shared"; break; case LCK_EX: typestr = "isc_tpb_lock_write, isc_tpb_protected/isc_tpb_exclusive"; break; } return typestr; } static ULONG inventory_page(thread_db* tdbb, ULONG sequence) { /************************************** * * i n v e n t o r y _ p a g e * ************************************** * * Functional description * Get the physical page number of the n-th transaction inventory * page. If not found, try to reconstruct using sibling pointer * from last known TIP page. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); WIN window(DB_PAGE_SPACE, -1); vcl* vector = dbb->dbb_t_pages; while (!vector || sequence >= vector->count()) { DPM_scan_pages(tdbb); if ((vector = dbb->dbb_t_pages) && sequence < vector->count()) break; if (!vector) BUGCHECK(165); // msg 165 cannot find tip page window.win_page = (*vector)[vector->count() - 1]; tx_inv_page* tip = (tx_inv_page*) CCH_FETCH(tdbb, &window, LCK_read, pag_transactions); const ULONG next = tip->tip_next; CCH_RELEASE(tdbb, &window); if (!(window.win_page = next)) BUGCHECK(165); // msg 165 cannot find tip page // Type check it tip = (tx_inv_page*) CCH_FETCH(tdbb, &window, LCK_read, pag_transactions); CCH_RELEASE(tdbb, &window); DPM_pages(tdbb, 0, pag_transactions, vector->count(), window.win_page.getPageNum()); } return (*vector)[sequence]; } static int limbo_transaction(thread_db* tdbb, TraNumber id) { /************************************** * * l i m b o _ t r a n s a c t i o n * ************************************** * * Functional description * * limbo_state is called when reconnecting * to an existing transaction to assure that * the transaction is actually in limbo. * It returns the transaction state. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); const ULONG trans_per_tip = dbb->dbb_page_manager.transPerTIP; const ULONG page = id / trans_per_tip; const ULONG number = id % trans_per_tip; WIN window(DB_PAGE_SPACE, -1); const tx_inv_page* tip = fetch_inventory_page(tdbb, &window, page, LCK_write); const ULONG trans_offset = TRANS_OFFSET(number); const UCHAR* byte = tip->tip_transactions + trans_offset; const USHORT shift = TRANS_SHIFT(number); const int state = (*byte >> shift) & TRA_MASK; CCH_RELEASE(tdbb, &window); return state; } void jrd_tra::unlinkFromAttachment() { for (jrd_tra** ptr = &tra_attachment->att_transactions; *ptr; ptr = &(*ptr)->tra_next) { if (*ptr == this) { *ptr = tra_next; return; } } tra_abort("transaction to unlink is missing in the attachment"); } void jrd_tra::linkToAttachment(Attachment* attachment) { /************************************** * * l i n k _ t r a n s a c t i o n * ************************************** * * Functional description * Link transaction block into database attachment. * **************************************/ tra_next = attachment->att_transactions; attachment->att_transactions = this; } void jrd_tra::tra_abort(const char* reason) { string buff; buff.printf("Failure working with transactions list: %s", reason); Syslog::Record(Syslog::Error, buff.c_str()); gds__log(buff.c_str()); #ifdef DEV_BUILD abort(); #endif } static void restart_requests(thread_db* tdbb, jrd_tra* trans) { /************************************** * * r e s t a r t _ r e q u e s t s * ************************************** * * Functional description * Restart all requests in the current * attachment to utilize the passed * transaction. * **************************************/ SET_TDBB(tdbb); for (jrd_req** i = trans->tra_attachment->att_requests.begin(); i != trans->tra_attachment->att_requests.end(); ++i) { Array& requests = (*i)->getStatement()->requests; for (jrd_req** j = requests.begin(); j != requests.end(); ++j) { jrd_req* request = *j; if (request && request->req_transaction) { EXE_unwind(tdbb, request); EXE_start(tdbb, request, trans); } } } } static void retain_context(thread_db* tdbb, jrd_tra* transaction, bool commit, int state) { /************************************** * * r e t a i n _ c o n t e x t * ************************************** * * Functional description * If 'commit' flag is true, commit the transaction, * else rollback the transaction. * * Commit/rollback a transaction while preserving the * context, in particular, its snapshot. The * trick is to insure that the transaction's * oldest active is seen by other transactions * simultaneously starting up. * **************************************/ SET_TDBB(tdbb); Database* dbb = tdbb->getDatabase(); CHECK_DBB(dbb); // The new transaction needs to remember the 'commit-retained' transaction // because it must see the operations of the 'commit-retained' transaction and // its snapshot doesn't contain these operations. if (commit) TBM_SET(tdbb->getDefaultPool(), &transaction->tra_commit_sub_trans, transaction->tra_number); // Create a new transaction lock, inheriting oldest active from transaction being committed. WIN window(DB_PAGE_SPACE, -1); TraNumber new_number; #ifdef SUPERSERVER_V2 new_number = bump_transaction_id(tdbb, &window); #else if (dbb->readOnly()) new_number = dbb->generateTransactionId(); else { const bool dontWrite = (dbb->dbb_flags & DBB_shared) && (transaction->tra_flags & TRA_readonly); const header_page* const header = bump_transaction_id(tdbb, &window, dontWrite); new_number = Ods::getNT(header); } #endif Lock* new_lock = NULL; Lock* old_lock = transaction->tra_lock; if (old_lock) { new_lock = FB_NEW_RPT(*tdbb->getDefaultPool(), 0) Lock(tdbb, sizeof(TraNumber), LCK_tra); new_lock->setKey(new_number); new_lock->lck_data = transaction->tra_lock->lck_data; if (!LCK_lock(tdbb, new_lock, LCK_write, LCK_WAIT)) { #ifndef SUPERSERVER_V2 if (!dbb->readOnly()) CCH_RELEASE(tdbb, &window); #endif ERR_post(Arg::Gds(isc_lock_conflict)); } } #ifndef SUPERSERVER_V2 if (!dbb->readOnly()) CCH_RELEASE(tdbb, &window); #endif // Update database notion of the youngest commit retaining // transaction before committing the first transaction. This // secures the original snapshot by insuring the oldest active // is seen by other transactions. const TraNumber old_number = transaction->tra_number; if (!dbb->readOnly()) { // Set the state on the inventory page TRA_set_state(tdbb, transaction, old_number, state); } transaction->tra_number = new_number; // Release transaction lock since it isn't needed // anymore and the new one is already in place. if (old_lock) { ++transaction->tra_use_count; LCK_release(tdbb, old_lock); transaction->tra_lock = new_lock; --transaction->tra_use_count; delete old_lock; } // Perform any post commit work OR delete entries from deferred list if (commit) DFW_perform_post_commit_work(transaction); else DFW_delete_deferred(transaction, -1); transaction->tra_flags &= ~(TRA_write | TRA_prepared); // All savepoint were already released in TRA_commit/TRA_rollback except, may be, empty transaction-level one if (!transaction->tra_save_point && !(transaction->tra_flags & TRA_no_auto_undo)) transaction->startSavepoint(true); // start new savepoint if necessary if (transaction->tra_flags & TRA_precommitted) { if (!dbb->readOnly()) { transaction->tra_flags &= ~TRA_precommitted; TRA_set_state(tdbb, transaction, new_number, tra_committed); transaction->tra_flags |= TRA_precommitted; } } } static void start_sweeper(thread_db* tdbb) { /************************************** * * s t a r t _ s w e e p e r * ************************************** * * Functional description * Start a thread to sweep the database. * **************************************/ SET_TDBB(tdbb); Database* const dbb = tdbb->getDatabase(); if (!dbb->allowSweepThread(tdbb)) return; TRA_update_counters(tdbb, dbb); // allocate space for the string and a null at the end const char* pszFilename = tdbb->getAttachment()->att_filename.c_str(); char* database = (char*) gds__alloc(static_cast(strlen(pszFilename)) + 1); if (database) { strcpy(database, pszFilename); try { Thread::start(sweep_database, database, THREAD_medium); return; } catch (const Firebird::Exception& ex) { gds__free(database); iscLogException("cannot start sweep thread", ex); } } else { ERR_log(0, 0, "cannot start sweep thread, Out of Memory"); } dbb->clearSweepFlags(tdbb); } static THREAD_ENTRY_DECLARE sweep_database(THREAD_ENTRY_PARAM database) { /************************************** * * s w e e p _ d a t a b a s e * ************************************** * * Functional description * Sweep database. * **************************************/ Firebird::ClumpletWriter dpb(Firebird::ClumpletReader::Tagged, MAX_DPB_SIZE, isc_dpb_version1); dpb.insertByte(isc_dpb_sweep, isc_dpb_records); // use embedded authentication to attach database const char* szAuthenticator = "sweeper"; dpb.insertString(isc_dpb_user_name, szAuthenticator, fb_strlen(szAuthenticator)); ISC_STATUS_ARRAY status_vector = {0}; isc_db_handle db_handle = 0; isc_attach_database(status_vector, 0, (const char*) database, &db_handle, dpb.getBufferLength(), reinterpret_cast(dpb.getBuffer())); if (db_handle) { isc_detach_database(status_vector, &db_handle); } gds__free(database); return 0; } static void transaction_flush(thread_db* tdbb, USHORT flush_flag, TraNumber tra_number) { /************************************** * * t r a n s a c t i o n _ f l u s h * ************************************** * * Functional description * Flush pages modified by user and/or system transaction. * Note, flush of user transaction also flushed pages, * changed by system transaction. * **************************************/ fb_assert(flush_flag == FLUSH_TRAN || flush_flag == FLUSH_SYSTEM); CCH_flush(tdbb, flush_flag, tra_number); jrd_tra* const sysTran = tdbb->getAttachment()->getSysTransaction(); sysTran->tra_flags &= ~TRA_write; } static void transaction_options(thread_db* tdbb, jrd_tra* transaction, const UCHAR* tpb, USHORT tpb_length) { /************************************** * * t r a n s a c t i o n _ o p t i o n s * ************************************** * * Functional description * Process transaction options. * **************************************/ SET_TDBB(tdbb); if (!tpb_length) return; const UCHAR* const end = tpb + tpb_length; if (*tpb != isc_tpb_version3 && *tpb != isc_tpb_version1) ERR_post(Arg::Gds(isc_bad_tpb_form) << Arg::Gds(isc_wrotpbver)); Attachment* const attachment = tdbb->getAttachment(); RelationLockTypeMap lockmap; TriState wait, lock_timeout; TriState isolation, read_only, rec_version; bool anylock_write = false; ++tpb; while (tpb < end) { const USHORT op = *tpb++; switch (op) { case isc_tpb_consistency: if (!isolation.assignOnce(true)) ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_txn_isolation)); transaction->tra_flags |= TRA_degree3; transaction->tra_flags &= ~TRA_read_committed; break; case isc_tpb_concurrency: if (!isolation.assignOnce(true)) ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_txn_isolation)); transaction->tra_flags &= ~TRA_degree3; transaction->tra_flags &= ~TRA_read_committed; break; case isc_tpb_read_committed: if (!isolation.assignOnce(true)) ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_txn_isolation)); transaction->tra_flags &= ~TRA_degree3; transaction->tra_flags |= TRA_read_committed; break; case isc_tpb_shared: ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_before_table) << Arg::Str("isc_tpb_shared")); break; case isc_tpb_protected: ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_before_table) << Arg::Str("isc_tpb_protected")); break; case isc_tpb_exclusive: ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_before_table) << Arg::Str("isc_tpb_exclusive")); break; case isc_tpb_wait: if (!wait.assignOnce(true)) { if (!wait.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_conflicting_options) << Arg::Str("isc_tpb_wait") << Arg::Str("isc_tpb_nowait")); } else { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_wait")); } } break; case isc_tpb_rec_version: if (isolation.isAssigned() && !(transaction->tra_flags & TRA_read_committed)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_option_without_rc) << Arg::Str("isc_tpb_rec_version")); } if (!rec_version.assignOnce(true)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_rec_version")); } transaction->tra_flags &= ~TRA_read_consistency; transaction->tra_flags |= TRA_rec_version; break; case isc_tpb_no_rec_version: if (isolation.isAssigned() && !(transaction->tra_flags & TRA_read_committed)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_option_without_rc) << Arg::Str("isc_tpb_no_rec_version")); } if (!rec_version.assignOnce(false)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_no_rec_version")); } transaction->tra_flags &= ~(TRA_rec_version | TRA_read_consistency); ; break; case isc_tpb_read_consistency: if (isolation.isAssigned() && !(transaction->tra_flags & TRA_read_committed)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_option_without_rc) << Arg::Str("isc_tpb_read_consistency")); } if (!rec_version.assignOnce(false)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_read_consistency")); } transaction->tra_flags &= ~TRA_rec_version; transaction->tra_flags |= TRA_read_consistency; break; case isc_tpb_nowait: if (lock_timeout.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_conflicting_options) << Arg::Str("isc_tpb_nowait") << Arg::Str("isc_tpb_lock_timeout")); } if (!wait.assignOnce(false)) { if (wait.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_conflicting_options) << Arg::Str("isc_tpb_nowait") << Arg::Str("isc_tpb_wait")); } else { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_nowait")); } } transaction->tra_lock_timeout = 0; break; case isc_tpb_read: if (!read_only.assignOnce(true)) { if (!read_only.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_conflicting_options) << Arg::Str("isc_tpb_read") << Arg::Str("isc_tpb_write")); } else { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_read")); } } // Cannot set the whole txn to R/O if we already saw a R/W table reservation. if (anylock_write) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_readtxn_after_writelock)); } transaction->tra_flags |= TRA_readonly; break; case isc_tpb_write: if (!read_only.assignOnce(false)) { if (read_only.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_conflicting_options) << Arg::Str("isc_tpb_write") << Arg::Str("isc_tpb_read")); } else { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_write")); } } transaction->tra_flags &= ~TRA_readonly; break; case isc_tpb_ignore_limbo: transaction->tra_flags |= TRA_ignore_limbo; break; case isc_tpb_no_auto_undo: transaction->tra_flags |= TRA_no_auto_undo; break; case isc_tpb_lock_write: // Cannot set a R/W table reservation if the whole txn is R/O. if (read_only.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_writelock_after_readtxn)); } anylock_write = true; // fall into case isc_tpb_lock_read: { const char* option_name = (op == isc_tpb_lock_read) ? "isc_tpb_lock_read" : "isc_tpb_lock_write"; // Do we have space for the identifier length? if (tpb >= end) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_missing_tlen) << Arg::Str(option_name)); } const USHORT len = *tpb++; if (len > MAX_SQL_IDENTIFIER_LEN) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_long_tlen) << Arg::Num(len) << Arg::Str(option_name)); } if (!len) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_null_tlen) << Arg::Str(option_name)); } // Does the identifier length surpasses the remaining of the TPB? if (tpb >= end) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_missing_tname) << Arg::Num(len) << Arg::Str(option_name)); } if (end - tpb < len) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_corrup_tlen) << Arg::Num(len) << Arg::Str(option_name)); } const Firebird::MetaName orgName(reinterpret_cast(tpb), len); const Firebird::MetaName metaName = attachment->nameToMetaCharSet(tdbb, orgName); tpb += len; jrd_rel* relation = MET_lookup_relation(tdbb, metaName); if (!relation) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_reserv_relnotfound) << Arg::Str(metaName) << Arg::Str(option_name)); } // force a scan to read view information MET_scan_relation(tdbb, relation); UCHAR lock_type = (op == isc_tpb_lock_read) ? LCK_none : LCK_SW; if (tpb < end) { switch (*tpb) { case isc_tpb_shared: ++tpb; break; case isc_tpb_protected: case isc_tpb_exclusive: ++tpb; lock_type = (lock_type == LCK_SW) ? LCK_EX : LCK_PR; break; // We'll assume table reservation doesn't make the concurrency type mandatory. //default: // ERR_post(isc-arg-end); } } expand_view_lock(tdbb, transaction, relation, lock_type, option_name, lockmap, 0); } break; case isc_tpb_verb_time: case isc_tpb_commit_time: { const char* option_name = (op == isc_tpb_verb_time) ? "isc_tpb_verb_time" : "isc_tpb_commit_time"; // Harmless for now even if formally invalid. if (tpb >= end) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_missing_len) << Arg::Str(option_name)); } const USHORT len = *tpb++; if (tpb >= end && len > 0) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_missing_value) << Arg::Num(len) << Arg::Str(option_name)); } if (end - tpb < len) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_corrupt_len) << Arg::Num(len) << Arg::Str(option_name)); } tpb += len; } break; case isc_tpb_autocommit: transaction->tra_flags |= TRA_autocommit; break; case isc_tpb_restart_requests: transaction->tra_flags |= TRA_restart_requests; break; case isc_tpb_lock_timeout: { if (wait.isAssigned() && !wait.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_conflicting_options) << Arg::Str("isc_tpb_lock_timeout") << Arg::Str("isc_tpb_nowait")); } if (!lock_timeout.assignOnce(true)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_multiple_spec) << Arg::Str("isc_tpb_lock_timeout")); } // Do we have space for the identifier length? if (tpb >= end) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_missing_len) << Arg::Str("isc_tpb_lock_timeout")); } const USHORT len = *tpb++; // Does the encoded number's length surpasses the remaining of the TPB? if (tpb >= end) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_missing_value) << Arg::Num(len) << Arg::Str("isc_tpb_lock_timeout")); } if (end - tpb < len) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_corrupt_len) << Arg::Num(len) << Arg::Str("isc_tpb_lock_timeout")); } if (!len) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_null_len) << Arg::Str("isc_tpb_lock_timeout")); } if (len > sizeof(ULONG)) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_overflow_len) << Arg::Num(len) << Arg::Str("isc_tpb_lock_timeout")); } const SLONG value = gds__vax_integer(tpb, len); if (value <= 0 || value > MAX_SSHORT) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_invalid_value) << Arg::Num(value) << Arg::Str("isc_tpb_lock_timeout")); } transaction->tra_lock_timeout = (SSHORT) value; tpb += len; } break; default: ERR_post(Arg::Gds(isc_bad_tpb_form)); } } if (rec_version.isAssigned() && !(transaction->tra_flags & TRA_read_committed)) { if (rec_version.asBool()) { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_option_without_rc) << Arg::Str("isc_tpb_rec_version")); } else { ERR_post(Arg::Gds(isc_bad_tpb_content) << Arg::Gds(isc_tpb_option_without_rc) << Arg::Str("isc_tpb_no_rec_version")); } } if ((transaction->tra_flags & TRA_read_committed) && !(tdbb->tdbb_flags & TDBB_sweeper)) if (tdbb->getDatabase()->dbb_config->getReadConsistency()) transaction->tra_flags |= TRA_read_consistency | TRA_rec_version; // If there aren't any relation locks to seize, we're done. vec* vector = transaction->tra_relation_locks; if (!vector) return; // Try to seize all relation locks. If any can't be seized, release all and try again. for (ULONG id = 0; id < vector->count(); id++) { Lock* lock = (*vector)[id]; if (!lock) continue; USHORT level = lock->lck_logical; if (level == LCK_none || LCK_lock(tdbb, lock, level, transaction->getLockWait())) continue; for (ULONG l = 0; l < id; l++) { if ( (lock = (*vector)[l]) ) { level = lock->lck_logical; LCK_release(tdbb, lock); lock->lck_logical = level; } } id = 0; ERR_punt(); } } static void transaction_start(thread_db* tdbb, jrd_tra* trans) { /************************************** * * t r a n s a c t i o n _ s t a r t * ************************************** * * Functional description * Start a transaction. * **************************************/ SET_TDBB(tdbb); Database* const dbb = tdbb->getDatabase(); Jrd::Attachment* const attachment = tdbb->getAttachment(); WIN window(DB_PAGE_SPACE, -1); Lock* lock = FB_NEW_RPT(*tdbb->getDefaultPool(), 0) Lock(tdbb, sizeof(TraNumber), LCK_tra); // Read header page and allocate transaction number. Since // the transaction inventory page was initialized to zero, it // transaction is automatically marked active. TraNumber oldest, number, active, oldest_active, oldest_snapshot; #ifdef SUPERSERVER_V2 number = bump_transaction_id(tdbb, &window); oldest = dbb->dbb_oldest_transaction; active = MAX(dbb->dbb_oldest_active, dbb->dbb_oldest_transaction); oldest_active = dbb->dbb_oldest_active; oldest_snapshot = dbb->dbb_oldest_snapshot; #else // SUPERSERVER_V2 if (dbb->readOnly()) { number = dbb->generateTransactionId(); oldest = dbb->dbb_oldest_transaction; oldest_active = dbb->dbb_oldest_active; oldest_snapshot = dbb->dbb_oldest_snapshot; } else { const bool dontWrite = (dbb->dbb_flags & DBB_shared) && (trans->tra_flags & TRA_readonly); const header_page* header = bump_transaction_id(tdbb, &window, dontWrite); number = Ods::getNT(header); oldest = Ods::getOIT(header); oldest_active = Ods::getOAT(header); oldest_snapshot = Ods::getOST(header); } // oldest (OIT) > oldest_active (OAT) if OIT was advanced by sweep // and no transactions was started after the sweep starts active = MAX(oldest_active, oldest); #endif // SUPERSERVER_V2 // Allocate pool and transactions block. Since, by policy, // all transactions older than the oldest are either committed // or cleaned up, they can be all considered as committed. To // make everything simpler, round down the oldest to a multiple // of four, which puts the transaction on a byte boundary. trans->tra_number = number; trans->tra_top = number; trans->tra_oldest = oldest; trans->tra_oldest_active = active; trans->tra_lock = lock; lock->setKey(number); // Put the TID of the oldest active transaction (from the header page) // in the new transaction's lock. // hvlad: it is important to put transaction number for read-committed // transaction instead of oldest active to correctly calculate new oldest // active value (look at call to LCK_query_data below which will take into // account this new lock too) lock->lck_data = ((trans->tra_flags & TRA_read_committed) && !(trans->tra_flags & TRA_read_consistency)) ? number : active; lock->lck_object = trans; if (!LCK_lock(tdbb, lock, LCK_write, LCK_WAIT)) { #ifndef SUPERSERVER_V2 if (!dbb->readOnly()) CCH_RELEASE(tdbb, &window); #endif ERR_post(Arg::Gds(isc_lock_conflict)); } // Link the transaction to the attachment block before releasing // header page for handling signals. trans->linkToAttachment(attachment); try { #ifndef SUPERSERVER_V2 if (!dbb->readOnly()) CCH_RELEASE(tdbb, &window); #endif if (dbb->readOnly()) { // Set transaction flags to TRA_precommitted, TRA_readonly trans->tra_flags |= (TRA_readonly | TRA_precommitted); } // Next, take a snapshot of all transactions between the oldest interesting // transaction and the current. Don't bother to get a snapshot for // read-committed transactions; they use the snapshot off the dbb block // since they need to know what is currently committed. if (!(trans->tra_flags & TRA_read_committed)) { trans->tra_snapshot_handle = dbb->dbb_tip_cache->beginSnapshot(tdbb, attachment->att_attachment_id, &trans->tra_snapshot_number); } // Next task is to find the oldest active transaction on the system. This // is needed for garbage collection. Things are made ever so slightly // more complicated by the fact that existing transaction may have oldest // actives older than they are. Lock temp_lock(tdbb, sizeof(TraNumber), LCK_tra, trans); trans->tra_oldest_active = number; oldest_active = number; bool cleanup = !(number % TRA_ACTIVE_CLEANUP); int oldest_state; for (; active < number; active++) { //oldest_state = TPC_cache_state(tdbb, active); const ULONG mask = (1 << tra_active); active = TPC_find_states(tdbb, active, number, mask, oldest_state); if (!active) { active = number; break; } fb_assert(oldest_state == tra_active); if (oldest_state == tra_active) { temp_lock.setKey(active); TraNumber data = LCK_read_data(tdbb, &temp_lock); if (!data) { if (cleanup) { if (TRA_wait(tdbb, trans, active, jrd_tra::tra_no_wait) == tra_committed) cleanup = false; continue; } data = active; } oldest_active = active; break; } } // Calculate attachment-local oldest active and oldest snapshot numbers // looking at current attachment's transactions only. Calculated values // are used to determine garbage collection threshold for attachment-local // data such as temporary tables (GTT's). trans->tra_att_oldest_active = number; TraNumber att_oldest_active = number; TraNumber att_oldest_snapshot = number; for (jrd_tra* tx_att = attachment->att_transactions; tx_att; tx_att = tx_att->tra_next) { att_oldest_active = MIN(att_oldest_active, tx_att->tra_number); att_oldest_snapshot = MIN(att_oldest_snapshot, tx_att->tra_att_oldest_active); } trans->tra_att_oldest_active = ((trans->tra_flags & TRA_read_committed) && !(trans->tra_flags & TRA_read_consistency)) ? number : att_oldest_active; if (attachment->att_oldest_snapshot < att_oldest_snapshot) attachment->att_oldest_snapshot = att_oldest_snapshot; // Put the TID of the oldest active transaction (just calculated) // in the new transaction's lock. // hvlad: for read-committed transaction put tra_number to prevent // unnecessary blocking of garbage collection by read-committed // transactions const TraNumber lck_data = ((trans->tra_flags & TRA_read_committed) && !(trans->tra_flags & TRA_read_consistency)) ? number : oldest_active; static_assert(sizeof(lock->lck_data) == sizeof(lck_data), "Check lock data type !"); if (lock->lck_data != lck_data) LCK_write_data(tdbb, lock, lck_data); // Query the minimum lock data for all active transaction locks. // This will be the oldest active snapshot used for regulating garbage collection. const TraNumber data = LCK_query_data(tdbb, LCK_tra, LCK_MIN); if (data && data < trans->tra_oldest_active) trans->tra_oldest_active = data; // Finally, scan transactions looking for the oldest interesting transaction -- the oldest // non-commited transaction. This will not be updated immediately, but saved until the // next update access to the header page oldest_state = tra_committed; for (oldest = trans->tra_oldest; oldest < number; oldest++) { //oldest_state = TPC_cache_state(tdbb, oldest); const ULONG mask = ~((1 << tra_committed) | (1 << tra_precommitted)); oldest = TPC_find_states(tdbb, trans->tra_oldest, number, mask, oldest_state); if (!oldest) { oldest = number; break; } fb_assert(oldest_state != tra_committed && oldest_state != tra_precommitted); if (oldest_state != tra_committed && oldest_state != tra_precommitted) break; } if (oldest > number && dbb->dbb_flags & DBB_read_only) oldest = number; if (--oldest > dbb->dbb_oldest_transaction) dbb->dbb_oldest_transaction = oldest; if (oldest_active > dbb->dbb_oldest_active) dbb->dbb_oldest_active = oldest_active; if (trans->tra_oldest_active > dbb->dbb_oldest_snapshot) { dbb->dbb_oldest_snapshot = trans->tra_oldest_active; if (!(dbb->dbb_flags & DBB_gc_active) && (dbb->dbb_flags & DBB_gc_background)) { dbb->dbb_flags |= DBB_gc_pending; dbb->dbb_gc_sem.release(); } } // Release TPC shared memory if counters moved sufficently forward dbb->dbb_tip_cache->updateOldestTransaction(tdbb, dbb->dbb_oldest_transaction, dbb->dbb_oldest_snapshot); // If the transaction block is getting out of hand, force a sweep if (dbb->dbb_sweep_interval && (trans->tra_oldest_active > oldest) && (trans->tra_oldest_active - oldest > dbb->dbb_sweep_interval) && oldest_state != tra_limbo) { start_sweeper(tdbb); } // Start a 'transaction-level' savepoint, unless this is the // system transaction, or unless the transactions doesn't want // a savepoint to be started. This savepoint will be used to // undo the transaction if it rolls back. if (!(trans->tra_flags & TRA_system) && !(trans->tra_flags & TRA_no_auto_undo)) trans->startSavepoint(true); // if the user asked us to restart all requests in this attachment, // do so now using the new transaction if (trans->tra_flags & TRA_restart_requests) restart_requests(tdbb, trans); // If the transaction is read-only and read committed, it can be // precommitted because it can't modify any records. // 2014-08-26 NS XXX: with latest changes in TIP cache semantics and read // consistency changes precommitted transactions offer almost no benefit, but // complicate implementation considerably. It might make sense to remove // precommitted transactions logic completely. if ((trans->tra_flags & TRA_readonly) && (trans->tra_flags & TRA_read_committed)) { TRA_set_state(tdbb, trans, trans->tra_number, tra_committed); if (!(trans->tra_flags & TRA_read_consistency)) LCK_write_data(tdbb, lock, 0); // Fully disinhibit GC for this transaction trans->tra_flags |= TRA_precommitted; } } catch (const Firebird::Exception&) { trans->unlinkFromAttachment(); throw; } } jrd_tra::~jrd_tra() { while (tra_undo_records.hasData()) delete tra_undo_records.pop(); delete tra_undo_space; delete tra_user_management; delete tra_mapping_list; delete tra_gen_ids; if (!tra_outer) delete tra_blob_space; else fb_assert(!tra_arrays); DFW_delete_deferred(this, -1); if (tra_flags & TRA_own_interface) { tra_interface->setHandle(NULL); tra_interface->release(); } if (tra_autonomous_pool) MemoryPool::deletePool(tra_autonomous_pool); delete tra_sec_db_context; } JTransaction* jrd_tra::getInterface(bool create) { if (!tra_interface && create) { tra_flags |= TRA_own_interface; tra_interface = FB_NEW JTransaction(this, tra_attachment->getStable()); tra_interface->addRef(); } return tra_interface; } void jrd_tra::setInterface(JTransaction* jt) { fb_assert(tra_interface == NULL || tra_interface == jt); tra_interface = jt; } UserManagement* jrd_tra::getUserManagement() { if (!tra_user_management) tra_user_management = FB_NEW_POOL(*tra_pool) UserManagement(this); return tra_user_management; } MappingList* jrd_tra::getMappingList() { if (!tra_mapping_list) tra_mapping_list = FB_NEW_POOL(*tra_pool) MappingList(this); return tra_mapping_list; } DbCreatorsList* jrd_tra::getDbCreatorsList() { if (!tra_dbcreators_list) tra_dbcreators_list = FB_NEW_POOL(*tra_pool) DbCreatorsList(this); return tra_dbcreators_list; } jrd_tra* jrd_tra::getOuter() { jrd_tra* tra = this; while (tra->tra_outer) tra = tra->tra_outer; return tra; } MemoryPool* jrd_tra::getAutonomousPool() { if (!tra_autonomous_pool) { MemoryPool* pool = tra_pool; jrd_tra* outer = tra_outer; while (outer) { pool = outer->tra_pool; outer = outer->tra_outer; } tra_autonomous_pool = MemoryPool::createPool(pool, tra_memory_stats); tra_autonomous_cnt = 0; } return tra_autonomous_pool; } Record* jrd_tra::findNextUndo(VerbAction* stopAction, jrd_rel* relation, SINT64 number) /************************************** * * f i n d N e x t U n d o * ************************************** * * Functional description * For given record find next undo data in stack of savepoint (if any). * **************************************/ { UndoItem* result = NULL; for (Savepoint::Iterator iter(tra_save_point); *iter; ++iter) { VerbAction* const action = (*iter)->getAction(relation); if (action == stopAction) return result ? result->setupRecord(this) : NULL; if (action && action->vct_undo && action->vct_undo->locate(number)) result = &(action->vct_undo->current()); } fb_assert(false); // verb_action disappeared from savepoint stack return NULL; } void jrd_tra::listStayingUndo(jrd_rel* relation, SINT64 number, RecordStack &staying) /************************************** * * l i s t S t a y i n g U n d o * ************************************** * * Functional description * For given record find undo data in stack of savepoint (if any) and push it into list. * Except one from given verb action. * **************************************/ { for (Savepoint::Iterator iter(tra_save_point); *iter; ++iter) { VerbAction* const action = (*iter)->getAction(relation); if (action && action->vct_undo && action->vct_undo->locate(number)) staying.push(action->vct_undo->current().setupRecord(this)); } } void jrd_tra::releaseAutonomousPool(MemoryPool* toRelease) { fb_assert(tra_autonomous_pool == toRelease); if (++tra_autonomous_cnt > TRA_AUTONOMOUS_PER_POOL) { MemoryPool::deletePool(tra_autonomous_pool); tra_autonomous_pool = NULL; } } Savepoint* jrd_tra::startSavepoint(bool root) /************************************** * * s t a r t S a v e p o i n t * ************************************** * * Functional description * Start a new savepoint. Reuse some priorly allocated one, if exists. * **************************************/ { Savepoint* savepoint = tra_save_free; if (savepoint) tra_save_free = savepoint->getNext(); else savepoint = FB_NEW_POOL(*tra_pool) Savepoint(this); const SavNumber number = ++tra_save_point_number; savepoint->init(number, root, tra_save_point); tra_save_point = savepoint; return savepoint; } void jrd_tra::rollbackSavepoint(thread_db* tdbb) /************************************** * * r o l l b a c k S a v e p o i n t * ************************************** * * Functional description * Rollback last savepoint and free it. * **************************************/ { if (tra_save_point && !(tra_flags & TRA_system)) { Jrd::ContextPoolHolder context(tdbb, tra_pool); tra_save_point = tra_save_point->rollback(tdbb); } } void jrd_tra::rollbackToSavepoint(thread_db* tdbb, SavNumber number) /************************************** * * r o l l b a c k T o S a v e p o i n t * ************************************** * * Functional description * Rollback savepoints up to one with given number. * There may be cases when savepoint with given number does not exist. * Rollback all savepoints with bigger numbers then, but not more. * These cases most likely is a bug in logic somewhere, so assert is here. * **************************************/ { // Merge all but one folowing savepoints into one while (tra_save_point && tra_save_point->getNumber() > number && tra_save_point->getNext() && tra_save_point->getNext()->getNumber() >= number) { rollforwardSavepoint(tdbb); } // Check that savepoint with given number really exists fb_assert(tra_save_point && tra_save_point->getNumber() == number); if (tra_save_point && tra_save_point->getNumber() >= number) // second line of defence // under no circumstances a savepoint with smaller number should be rolled back { // Undo the savepoint rollbackSavepoint(tdbb); } } void jrd_tra::rollforwardSavepoint(thread_db* tdbb) /************************************** * * r o l l f o r w a r d S a v e p o i n t * ************************************** * * Functional description * Apply last savepoint and free it. * **************************************/ { if (tra_save_point && !(tra_flags & TRA_system)) { Jrd::ContextPoolHolder context(tdbb, tra_pool); tra_save_point = tra_save_point->rollforward(tdbb); } } void jrd_tra::checkBlob(thread_db* tdbb, const bid* blob_id) { USHORT rel_id = blob_id->bid_internal.bid_relation_id; if (tra_attachment->isGbak() || (tra_attachment->att_user && tra_attachment->att_user->locksmith(tdbb, SELECT_ANY_OBJECT_IN_DATABASE)) || rel_id == 0) { return; } if (!tra_blobs->locate(blob_id->bid_temp_id())) { vec* vector = tra_attachment->att_relations; jrd_rel* blb_relation; if (rel_id < vector->count() && (blb_relation = (*vector)[rel_id])) { if (blb_relation->rel_security_name.isEmpty()) MET_scan_relation(tdbb, blb_relation); SecurityClass* s_class = SCL_get_class(tdbb, blb_relation->rel_security_name.c_str()); if (s_class && !s_class->scl_blb_access) { SCL_check_access(tdbb, s_class, 0, 0, NULL, SCL_select, SCL_object_table, false, blb_relation->rel_name); s_class->scl_blb_access = true; } } } } /// class TraceSweepEvent TraceSweepEvent::TraceSweepEvent(thread_db* tdbb) { m_tdbb = tdbb; WIN window(HEADER_PAGE_NUMBER); Ods::header_page* header = (Ods::header_page*) CCH_FETCH(m_tdbb, &window, LCK_read, pag_header); m_sweep_info.update(header); CCH_RELEASE(m_tdbb, &window); Attachment* att = m_tdbb->getAttachment(); gds__log("Sweep is started by %s\n" "\tDatabase \"%s\" \n" "\tOIT %" SQUADFORMAT", OAT %" SQUADFORMAT", OST %" SQUADFORMAT", Next %" SQUADFORMAT, att->att_user ? att->att_user->getUserName().c_str() : "", att->att_filename.c_str(), m_sweep_info.getOIT(), m_sweep_info.getOAT(), m_sweep_info.getOST(), m_sweep_info.getNext()); TraceManager* trace_mgr = att->att_trace_manager; m_need_trace = trace_mgr->needs(ITraceFactory::TRACE_EVENT_SWEEP); if (!m_need_trace) return; m_start_clock = fb_utils::query_performance_counter(); TraceConnectionImpl conn(att); trace_mgr->event_sweep(&conn, &m_sweep_info, ITracePlugin::SWEEP_STATE_STARTED); } TraceSweepEvent::~TraceSweepEvent() { m_tdbb->setRequest(NULL); report(ITracePlugin::SWEEP_STATE_FAILED); } void TraceSweepEvent::beginSweepRelation(jrd_rel* relation) { if (!m_need_trace) return; if (relation && relation->rel_name.isEmpty()) { // don't accumulate per-relation stats for metadata query below MET_lookup_relation_id(m_tdbb, relation->rel_id, false); } m_relation_clock = fb_utils::query_performance_counter(); m_base_stats.assign(m_tdbb->getTransaction()->tra_stats); } void TraceSweepEvent::endSweepRelation(jrd_rel* relation) { if (!m_need_trace) return; Attachment* att = m_tdbb->getAttachment(); jrd_tra* tran = m_tdbb->getTransaction(); // don't report empty relation if (m_base_stats.getValue(RuntimeStatistics::RECORD_SEQ_READS) == tran->tra_stats.getValue(RuntimeStatistics::RECORD_SEQ_READS) && m_base_stats.getValue(RuntimeStatistics::RECORD_BACKOUTS) == tran->tra_stats.getValue(RuntimeStatistics::RECORD_BACKOUTS) && m_base_stats.getValue(RuntimeStatistics::RECORD_PURGES) == tran->tra_stats.getValue(RuntimeStatistics::RECORD_PURGES) && m_base_stats.getValue(RuntimeStatistics::RECORD_EXPUNGES) == tran->tra_stats.getValue(RuntimeStatistics::RECORD_EXPUNGES) ) { return; } TraceRuntimeStats stats(att, &m_base_stats, &tran->tra_stats, fb_utils::query_performance_counter() - m_relation_clock, 0); m_sweep_info.setPerf(stats.getPerf()); TraceConnectionImpl conn(att); TraceManager* trace_mgr = att->att_trace_manager; trace_mgr->event_sweep(&conn, &m_sweep_info, ITracePlugin::SWEEP_STATE_PROGRESS); } void TraceSweepEvent::report(ntrace_process_state_t state) { Attachment* att = m_tdbb->getAttachment(); if (state == ITracePlugin::SWEEP_STATE_FINISHED) { gds__log("Sweep is finished\n" "\tDatabase \"%s\" \n" "\tOIT %" SQUADFORMAT", OAT %" SQUADFORMAT", OST %" SQUADFORMAT", Next %" SQUADFORMAT, att->att_filename.c_str(), m_sweep_info.getOIT(), m_sweep_info.getOAT(), m_sweep_info.getOST(), m_sweep_info.getNext()); } if (!m_need_trace) return; Database* dbb = m_tdbb->getDatabase(); TraceManager* trace_mgr = att->att_trace_manager; TraceConnectionImpl conn(att); // we need to compare stats against zero base if (state != ITracePlugin::SWEEP_STATE_PROGRESS) m_base_stats.reset(); jrd_tra* tran = m_tdbb->getTransaction(); TraceRuntimeStats stats(att, &m_base_stats, &att->att_stats, fb_utils::query_performance_counter() - m_start_clock, 0); m_sweep_info.setPerf(stats.getPerf()); trace_mgr->event_sweep(&conn, &m_sweep_info, state); if (state == ITracePlugin::SWEEP_STATE_FAILED || state == ITracePlugin::SWEEP_STATE_FINISHED) m_need_trace = false; } SecDbContext::SecDbContext(IAttachment* a, ITransaction* t) : att(a), tra(t), savePoint(0) { } SecDbContext::~SecDbContext() { LocalStatus ls; CheckStatusWrapper st(&ls); if (tra) { tra->rollback(&st); tra = NULL; } if (att) { att->detach(&st); att = NULL; } } SecDbContext* jrd_tra::getSecDbContext() { return tra_sec_db_context; } SecDbContext* jrd_tra::setSecDbContext(IAttachment* att, ITransaction* tra) { fb_assert(!tra_sec_db_context); tra_sec_db_context = FB_NEW_POOL(*getDefaultMemoryPool()) SecDbContext(att, tra); return tra_sec_db_context; } void jrd_tra::eraseSecDbContext() { delete tra_sec_db_context; tra_sec_db_context = NULL; }