8
0
mirror of https://github.com/FirebirdSQL/firebird.git synced 2025-01-25 01:23:03 +01:00
firebird-mirror/src/jrd/cch.cpp

5412 lines
141 KiB
C++
Raw Normal View History

2001-05-23 15:26:42 +02:00
/*
* PROGRAM: JRD Access Method
* MODULE: cch.cpp
* DESCRIPTION: Disk cache manager
2001-05-23 15:26:42 +02:00
*
* The contents of this file are subject to the Interbase Public
* License Version 1.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy
* of the License at http://www.Inprise.com/IPL.html
*
* Software distributed under the License is distributed on an
* "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, either express
* or implied. See the License for the specific language governing
* rights and limitations under the License.
*
* The Original Code was created by Inprise Corporation
* and its predecessors. Portions created by Inprise Corporation are
* Copyright (C) Inprise Corporation.
*
* All Rights Reserved.
* Contributor(s): ______________________________________.
* 2001.07.06 Sean Leyne - Code Cleanup, removed "#ifdef READONLY_DATABASE"
* conditionals, as the engine now fully supports
* readonly databases.
2002-10-30 07:40:58 +01:00
*
* 2002.10.29 Sean Leyne - Removed obsolete "Netware" port
*
2001-05-23 15:26:42 +02:00
*/
#include "firebird.h"
2004-03-22 12:38:23 +01:00
#include "../jrd/common.h"
2004-04-29 00:43:34 +02:00
#include <stdio.h>
2001-05-23 15:26:42 +02:00
#include <string.h>
#include <stdlib.h>
#include "../jrd/jrd.h"
#include "../jrd/que.h"
#include "../jrd/lck.h"
#include "../jrd/ods.h"
2003-07-14 12:35:49 +02:00
#include "../jrd/os/pio.h"
2001-05-23 15:26:42 +02:00
#include "../jrd/cch.h"
#include "gen/iberror.h"
2001-05-23 15:26:42 +02:00
#include "../jrd/lls.h"
#include "../jrd/req.h"
#include "../jrd/sdw.h"
#include "../jrd/tra.h"
#include "../jrd/sbm.h"
#include "../jrd/nbak.h"
2001-05-23 15:26:42 +02:00
#include "../jrd/gdsassert.h"
#include "../jrd/cch_proto.h"
#include "../jrd/err_proto.h"
#include "../jrd/gds_proto.h"
#include "../jrd/isc_proto.h"
#include "../jrd/isc_s_proto.h"
#include "../jrd/jrd_proto.h"
#include "../jrd/lck_proto.h"
#include "../jrd/mov_proto.h"
#include "../jrd/pag_proto.h"
2003-07-14 12:35:49 +02:00
#include "../jrd/os/pio_proto.h"
2001-05-23 15:26:42 +02:00
#include "../jrd/sdw_proto.h"
#include "../jrd/shut_proto.h"
2008-01-16 09:31:31 +01:00
#include "../jrd/ThreadStart.h"
#include "../jrd/thread_proto.h"
2001-05-23 15:26:42 +02:00
#include "../jrd/tra_proto.h"
#include "../common/config/config.h"
#include "../common/classes/MsgPrint.h"
using namespace Jrd;
using namespace Ods;
using namespace Firebird;
2009-08-23 13:43:25 +02:00
// In the superserver mode, no page locks are acquired through the lock manager.
// Instead, a latching mechanism is used. So the calls to lock subsystem for
// database pages in the original code should not be made, lest they should cause
// any undesirable side-effects. The following defines help us achieve that.
#ifdef CCH_DEBUG
#include <stdarg.h>
IMPLEMENT_TRACE_ROUTINE(cch_trace, "CCH")
#endif
#ifdef SUPERSERVER
#define CACHE_WRITER
#endif
#ifdef SUPERSERVER_V2
#define CACHE_READER
#endif
#ifdef SUPERSERVER
#define PAGE_LOCK_RELEASE(lock)
#define PAGE_LOCK_ASSERT(lock)
#define PAGE_LOCK_RE_POST(lock)
2009-12-13 14:49:43 +01:00
#define PAGE_OVERHEAD (sizeof (bcb_repeat) + sizeof(BufferDesc) + (int) dbb->dbb_page_size)
#else
#define PAGE_LOCK_RELEASE(lock) LCK_release (tdbb, lock)
#define PAGE_LOCK_ASSERT(lock) LCK_assert (tdbb, lock)
#define PAGE_LOCK_RE_POST(lock) LCK_re_post (tdbb, lock)
#define PAGE_OVERHEAD (sizeof (bcb_repeat) + sizeof(BufferDesc) + \
sizeof (Lock) + (int) dbb->dbb_page_size)
#endif
2001-05-23 15:26:42 +02:00
static BufferDesc* alloc_bdb(thread_db*, BufferControl*, UCHAR **);
#ifndef SUPERSERVER
static Lock* alloc_page_lock(Jrd::thread_db*, BufferDesc*);
static int blocking_ast_bdb(void*);
#endif
#ifdef CACHE_READER
static THREAD_ENTRY_DECLARE cache_reader(THREAD_ENTRY_PARAM);
#endif
#ifdef CACHE_WRITER
static THREAD_ENTRY_DECLARE cache_writer(THREAD_ENTRY_PARAM);
#endif
2009-08-23 13:43:25 +02:00
static void check_precedence(thread_db*, WIN*, PageNumber);
static void clear_precedence(thread_db*, BufferDesc*);
static BufferDesc* dealloc_bdb(BufferDesc*);
#ifndef SUPERSERVER
static void down_grade(thread_db*, BufferDesc*);
#endif
static void expand_buffers(thread_db*, ULONG);
2006-05-22 00:07:35 +02:00
static BufferDesc* get_buffer(thread_db*, const PageNumber, LATCH, SSHORT);
static int get_related(BufferDesc*, PagesArray&, int, const ULONG);
static ULONG get_prec_walk_mark(BufferControl*);
2007-02-06 09:03:43 +01:00
static void invalidate_and_release_buffer(thread_db*, BufferDesc*);
2006-05-22 00:07:35 +02:00
static SSHORT latch_bdb(thread_db*, LATCH, BufferDesc*, const PageNumber, SSHORT);
2009-06-06 11:05:20 +02:00
static SSHORT lock_buffer(thread_db*, BufferDesc*, const SSHORT, const SCHAR);
2007-04-11 18:05:40 +02:00
static ULONG memory_init(thread_db*, BufferControl*, SLONG);
static void page_validation_error(thread_db*, win*, SSHORT);
#ifdef CACHE_READER
static void prefetch_epilogue(Prefetch*, ISC_STATUS *);
static void prefetch_init(Prefetch*, thread_db*);
static void prefetch_io(Prefetch*, ISC_STATUS *);
static void prefetch_prologue(Prefetch*, SLONG *);
#endif
static SSHORT related(BufferDesc*, const BufferDesc*, SSHORT, const ULONG);
static void release_bdb(thread_db*, BufferDesc*, const bool, const bool, const bool);
2009-08-23 13:43:25 +02:00
static void unmark(thread_db*, WIN*);
static bool writeable(BufferDesc*);
static bool is_writeable(BufferDesc*, const ULONG);
2009-12-13 14:49:43 +01:00
static int write_buffer(thread_db*, BufferDesc*, const PageNumber, const bool, ISC_STATUS* const,
const bool);
static bool write_page(thread_db*, BufferDesc*, ISC_STATUS* const, const bool);
static void set_diff_page(thread_db*, BufferDesc*);
static void set_dirty_flag(thread_db*, BufferDesc*);
static void clear_dirty_flag(thread_db*, BufferDesc*);
2001-05-23 15:26:42 +02:00
2007-05-20 05:25:52 +02:00
static inline void insertDirty(BufferControl* bcb, BufferDesc* bdb)
{
2008-12-05 02:20:14 +01:00
if (bdb->bdb_dirty.que_forward == &bdb->bdb_dirty)
{
bcb->bcb_dirty_count++;
QUE_INSERT(bcb->bcb_dirty, bdb->bdb_dirty);
}
}
2007-05-20 05:25:52 +02:00
static inline void removeDirty(BufferControl* bcb, BufferDesc* bdb)
{
2008-12-05 02:20:14 +01:00
if (bdb->bdb_dirty.que_forward != &bdb->bdb_dirty)
{
fb_assert(bcb->bcb_dirty_count > 0);
bcb->bcb_dirty_count--;
QUE_DELETE(bdb->bdb_dirty);
QUE_INIT(bdb->bdb_dirty);
}
}
static void flushDirty(thread_db* tdbb, SLONG transaction_mask, const bool sys_only, ISC_STATUS* status);
static void flushAll(thread_db* tdbb, USHORT flush_flag);
const SLONG MIN_BUFFER_SEGMENT = 65536;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Given pointer a field in the block, find the block
2001-05-23 15:26:42 +02:00
#define BLOCK(fld_ptr, type, fld) (type)((SCHAR*) fld_ptr - OFFSET (type, fld))
static inline SharedLatch* allocSharedLatch(thread_db* tdbb, BufferDesc* bdb)
{
2009-06-06 11:05:20 +02:00
BufferControl* const bcb = bdb->bdb_dbb->dbb_bcb;
SharedLatch* latch;
if (QUE_NOT_EMPTY(bcb->bcb_free_slt))
{
QUE que_inst = bcb->bcb_free_slt.que_forward;
QUE_DELETE(*que_inst);
latch = BLOCK(que_inst, SharedLatch*, slt_bdb_que);
}
else
{
const int BATCH_ALLOC = 64;
Database* dbb = bdb->bdb_dbb;
2008-06-07 00:40:15 +02:00
SharedLatch* latches = latch = FB_NEW(*dbb->dbb_bufferpool) SharedLatch[BATCH_ALLOC];
for (int i = 1; i < BATCH_ALLOC; i++) {
QUE_APPEND(bcb->bcb_free_slt, latches[i].slt_bdb_que);
}
}
latch->slt_bdb = bdb;
QUE_APPEND(bdb->bdb_shared, latch->slt_bdb_que);
latch->slt_tdbb = tdbb;
QUE_APPEND(tdbb->tdbb_latches, latch->slt_tdbb_que);
2008-12-05 02:20:14 +01:00
return latch;
}
static inline void freeSharedLatch(thread_db* tdbb, BufferControl* bcb, SharedLatch* latch)
{
latch->slt_bdb = NULL;
QUE_DELETE(latch->slt_bdb_que);
QUE_INSERT(bcb->bcb_free_slt, latch->slt_bdb_que);
latch->slt_tdbb = NULL;
QUE_DELETE(latch->slt_tdbb_que);
}
static inline SharedLatch* findSharedLatch(thread_db* tdbb, BufferDesc* bdb)
{
2008-12-05 02:20:14 +01:00
for (QUE que_inst = tdbb->tdbb_latches.que_forward; que_inst != &tdbb->tdbb_latches;
que_inst = que_inst->que_forward)
{
2008-06-07 00:40:15 +02:00
SharedLatch* latch = BLOCK(que_inst, SharedLatch*, slt_tdbb_que);
fb_assert(latch->slt_tdbb == tdbb);
if (latch->slt_bdb == bdb) {
return latch;
}
}
return NULL;
}
//
//#define BCB_MUTEX_ACQUIRE
//#define BCB_MUTEX_RELEASE
//
2008-12-05 02:20:14 +01:00
//#define PRE_MUTEX_ACQUIRE
//#define PRE_MUTEX_RELEASE
//
2008-12-05 02:20:14 +01:00
//#define BTC_MUTEX_ACQUIRE
//#define BTC_MUTEX_RELEASE
//
//#define LATCH_MUTEX_ACQUIRE
//#define LATCH_MUTEX_RELEASE
//
2001-05-23 15:26:42 +02:00
2006-05-22 00:07:35 +02:00
const PageNumber JOURNAL_PAGE(DB_PAGE_SPACE, -1);
const PageNumber SHADOW_PAGE(DB_PAGE_SPACE, -2);
const PageNumber FREE_PAGE(DB_PAGE_SPACE, -3);
const PageNumber CHECKPOINT_PAGE(DB_PAGE_SPACE, -4);
const PageNumber MIN_PAGE_NUMBER(DB_PAGE_SPACE, -5);
2001-05-23 15:26:42 +02:00
const int PRE_SEARCH_LIMIT = 256;
2004-04-29 16:51:02 +02:00
const int PRE_EXISTS = -1;
const int PRE_UNKNOWN = -2;
2001-05-23 15:26:42 +02:00
2003-12-22 11:00:59 +01:00
int CCH_down_grade_dbb(void* ast_object)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ d o w n _ g r a d e _ d b b
*
**************************************
*
* Functional description
* Down grade the lock on the database in response to a blocking
* AST.
*
**************************************/
2004-03-07 08:58:55 +01:00
Database* dbb = static_cast<Database*>(ast_object);
2001-05-23 15:26:42 +02:00
try
2003-12-22 11:00:59 +01:00
{
Database::SyncGuard dsGuard(dbb, true);
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
Lock* const lock = dbb->dbb_lock;
2001-05-23 15:26:42 +02:00
// Since this routine will be called asynchronously,
// we must establish a thread context
ThreadContextHolder tdbb;
tdbb->setDatabase(dbb);
tdbb->setAttachment(lock->lck_attachment);
2001-05-23 15:26:42 +02:00
dbb->dbb_ast_flags |= DBB_blocking;
2001-05-23 15:26:42 +02:00
// Database shutdown will release the database lock; just return
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (SHUT_blocking_ast(tdbb))
{
dbb->dbb_ast_flags &= ~DBB_blocking;
return 0;
}
2001-05-23 15:26:42 +02:00
// If we are already shared, there is nothing more we can do.
// If any case, the other guy probably wants exclusive access,
// and we can't give it anyway
2001-05-23 15:26:42 +02:00
if ((lock->lck_logical == LCK_SW) || (lock->lck_logical == LCK_SR)) {
return 0;
}
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (dbb->dbb_flags & DBB_bugcheck)
{
LCK_convert(tdbb, lock, LCK_SW, LCK_WAIT);
dbb->dbb_ast_flags &= ~DBB_blocking;
return 0;
}
2001-05-23 15:26:42 +02:00
// If we are supposed to be exclusive, stay exclusive
2001-05-23 15:26:42 +02:00
if ((dbb->dbb_flags & DBB_exclusive) || (dbb->dbb_ast_flags & DBB_shutdown_single)) {
return 0;
}
2001-05-23 15:26:42 +02:00
// Assert any page locks that have been requested, but not asserted
2001-05-23 15:26:42 +02:00
dbb->dbb_ast_flags |= DBB_assert_locks;
BufferControl* bcb = dbb->dbb_bcb;
2009-06-26 06:12:20 +02:00
if (bcb && bcb->bcb_count)
{
2008-06-05 13:02:42 +02:00
const bcb_repeat* tail = bcb->bcb_rpt;
for (const bcb_repeat* const end = tail + bcb->bcb_count; tail < end; ++tail)
{
PAGE_LOCK_ASSERT(tail->bcb_bdb->bdb_lock);
2003-12-22 11:00:59 +01:00
}
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Down grade the lock on the database itself
2001-05-23 15:26:42 +02:00
if (lock->lck_physical == LCK_EX) {
2009-08-23 13:43:25 +02:00
LCK_convert(tdbb, lock, LCK_PW, LCK_WAIT); // This lets waiting cache manager in first
}
else {
LCK_convert(tdbb, lock, LCK_SW, LCK_WAIT);
}
dbb->dbb_ast_flags &= ~DBB_blocking;
}
catch (const Firebird::Exception&)
{} // no-op
2001-05-23 15:26:42 +02:00
return 0;
2001-05-23 15:26:42 +02:00
}
bool CCH_exclusive(thread_db* tdbb, USHORT level, SSHORT wait_flag)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ e x c l u s i v e
*
**************************************
*
* Functional description
* Get exclusive access to a database. If we get it, return true.
* If the wait flag is FALSE, and we can't get it, give up and
* return false. There are two levels of database exclusivity: LCK_PW
2001-05-23 15:26:42 +02:00
* guarantees there are no normal users in the database while LCK_EX
* additionally guarantes background database processes like the
* shared cache manager have detached.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER
if (!CCH_exclusive_attachment(tdbb, level, wait_flag)) {
return false;
}
2001-05-23 15:26:42 +02:00
#endif
Lock* lock = dbb->dbb_lock;
if (!lock) {
return false;
}
2001-05-23 15:26:42 +02:00
dbb->dbb_flags |= DBB_exclusive;
2009-01-14 10:19:00 +01:00
switch (level)
{
2001-05-23 15:26:42 +02:00
case LCK_PW:
2008-12-20 20:57:43 +01:00
if (lock->lck_physical >= LCK_PW || LCK_convert(tdbb, lock, LCK_PW, wait_flag))
2003-12-22 11:00:59 +01:00
{
return true;
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
break;
case LCK_EX:
2008-12-18 11:47:25 +01:00
if (lock->lck_physical == LCK_EX || LCK_convert(tdbb, lock, LCK_EX, wait_flag))
2003-12-22 11:00:59 +01:00
{
return true;
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
break;
default:
break;
}
// Clear the status vector, as our callers check the return value
// and throw custom exceptions themselves
fb_utils::init_status(tdbb->tdbb_status_vector);
2009-08-23 13:43:25 +02:00
// If we are supposed to wait (presumably patiently),
// but can't get the lock, generate an error
2001-05-23 15:26:42 +02:00
if (wait_flag == LCK_WAIT) {
ERR_post(Arg::Gds(isc_deadlock));
}
2001-05-23 15:26:42 +02:00
dbb->dbb_flags &= ~DBB_exclusive;
return false;
2001-05-23 15:26:42 +02:00
}
bool CCH_exclusive_attachment(thread_db* tdbb, USHORT level, SSHORT wait_flag)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ e x c l u s i v e _ a t t a c h m e n t
*
**************************************
*
* Functional description
* Get exclusive access to a database. If we get it, return true.
* If the wait flag is FALSE, and we can't get it, give up and
* return false.
2001-05-23 15:26:42 +02:00
*
**************************************/
2009-08-23 13:43:25 +02:00
const int CCH_EXCLUSIVE_RETRY_INTERVAL = 1; // retry interval in seconds
2001-05-23 15:26:42 +02:00
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
Jrd::Attachment* attachment = tdbb->getAttachment();
if (attachment->att_flags & ATT_exclusive) {
return true;
}
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
attachment->att_flags |= (level == LCK_none) ? ATT_attach_pending : ATT_exclusive_pending;
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
const SLONG timeout = (SLONG) (wait_flag < 0) ?
-wait_flag : ((wait_flag == LCK_WAIT) ? 1L << 30 : CCH_EXCLUSIVE_RETRY_INTERVAL);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If requesting exclusive database access, then re-position attachment as the
// youngest so that pending attachments may pass.
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (level != LCK_none)
{
for (Jrd::Attachment** ptr = &dbb->dbb_attachments; *ptr; ptr = &(*ptr)->att_next)
2009-06-26 06:12:20 +02:00
{
if (*ptr == attachment)
{
2001-05-23 15:26:42 +02:00
*ptr = attachment->att_next;
break;
}
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
attachment->att_next = dbb->dbb_attachments;
dbb->dbb_attachments = attachment;
}
2008-12-18 11:47:25 +01:00
for (SLONG remaining = timeout; remaining > 0; remaining -= CCH_EXCLUSIVE_RETRY_INTERVAL)
2003-12-22 11:00:59 +01:00
{
if (tdbb->getAttachment()->att_flags & ATT_shutdown) {
2001-05-23 15:26:42 +02:00
break;
}
2001-05-23 15:26:42 +02:00
2003-12-22 11:00:59 +01:00
bool found = false;
for (attachment = tdbb->getAttachment()->att_next; attachment;
2008-12-18 11:47:25 +01:00
attachment = attachment->att_next)
2003-12-22 11:00:59 +01:00
{
if (attachment->att_flags & ATT_shutdown) {
2001-05-23 15:26:42 +02:00
continue;
}
2001-05-23 15:26:42 +02:00
if (level == LCK_none)
2009-08-23 13:43:25 +02:00
{
// Wait for other attachments requesting exclusive access
2008-12-18 11:47:25 +01:00
if (attachment->att_flags & (ATT_exclusive | ATT_exclusive_pending))
2003-12-22 11:00:59 +01:00
{
found = true;
2001-05-23 15:26:42 +02:00
break;
}
// Forbid multiple attachments in single-user maintenance mode
2008-12-18 11:47:25 +01:00
if (attachment != tdbb->getAttachment() && (dbb->dbb_ast_flags & DBB_shutdown_single) )
{
found = true;
break;
}
2001-05-23 15:26:42 +02:00
}
2008-01-16 09:31:31 +01:00
else
{
// Requesting exclusive database access
2003-12-22 11:00:59 +01:00
found = true;
if (attachment->att_flags & ATT_exclusive_pending)
{
2007-12-05 01:03:15 +01:00
tdbb->getAttachment()->att_flags &= ~ATT_exclusive_pending;
if (wait_flag == LCK_WAIT) {
ERR_post(Arg::Gds(isc_deadlock));
}
else {
return false;
}
2001-05-23 15:26:42 +02:00
}
break;
}
}
if (!found)
{
2008-12-18 11:47:25 +01:00
tdbb->getAttachment()->att_flags &= ~(ATT_exclusive_pending | ATT_attach_pending);
if (level != LCK_none) {
tdbb->getAttachment()->att_flags |= ATT_exclusive;
}
return true;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// Our thread needs to sleep for CCH_EXCLUSIVE_RETRY_INTERVAL seconds.
2001-05-23 15:26:42 +02:00
2002-04-29 13:14:46 +02:00
if (remaining > CCH_EXCLUSIVE_RETRY_INTERVAL)
{
Database::Checkout dcoHolder(dbb);
2002-04-29 13:14:46 +02:00
THREAD_SLEEP(CCH_EXCLUSIVE_RETRY_INTERVAL * 1000);
}
2001-05-23 15:26:42 +02:00
if (tdbb->getAttachment()->att_flags & ATT_cancel_raise)
{
2009-06-26 06:12:20 +02:00
if (JRD_reschedule(tdbb, 0, false))
{
2008-12-18 11:47:25 +01:00
tdbb->getAttachment()->att_flags &= ~(ATT_exclusive_pending | ATT_attach_pending);
2001-05-23 15:26:42 +02:00
ERR_punt();
}
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
}
2008-12-18 11:47:25 +01:00
tdbb->getAttachment()->att_flags &= ~(ATT_exclusive_pending | ATT_attach_pending);
return false;
2001-05-23 15:26:42 +02:00
}
void CCH_expand(thread_db* tdbb, ULONG number)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ e x p a n d
*
**************************************
*
* Functional description
* Expand the cache to at least a given number of buffers. If
* it's already that big, don't do anything.
*
**************************************/
SET_TDBB(tdbb);
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
expand_buffers(tdbb, number);
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
pag* CCH_fake(thread_db* tdbb, WIN* window, SSHORT latch_wait)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ f a k e
*
**************************************
*
* Functional description
* Fake a fetch to a page. Rather than reading it, however,
* zero it in memory. This is used when allocating a new page.
*
* input
* latch_wait: 1 => Wait as long as necessary to get the latch.
* This can cause deadlocks of course.
* 0 => If the latch can't be acquired immediately,
* or an IO would be necessary, then give
* up and return 0.
* <negative number> => Latch timeout interval in seconds.
*
* return
* pag pointer if successful.
* NULL pointer if timeout occurred (only possible if latch_wait <> 1).
* NULL pointer if latch_wait=0 and the faked page would have to be
* before reuse.
*
**************************************/
SET_TDBB(tdbb);
2009-06-06 11:05:20 +02:00
Database* const dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
CCH_TRACE(("FK %d:%06d", window->win_page.getPageSpaceID(), window->win_page.getPageNum()));
2009-08-23 13:43:25 +02:00
// if there has been a shadow added recently, go out and
// find it before we grant any more write locks
2001-05-23 15:26:42 +02:00
if (dbb->dbb_ast_flags & DBB_get_shadows) {
SDW_get_shadows(tdbb);
}
2001-05-23 15:26:42 +02:00
Jrd::Attachment* attachment = tdbb->getAttachment();
if (!attachment->backupStateReadLock(tdbb, latch_wait))
return NULL;
BufferDesc* bdb = get_buffer(tdbb, window->win_page, LATCH_exclusive, latch_wait);
2009-06-26 06:12:20 +02:00
if (!bdb)
{
attachment->backupStateReadUnLock(tdbb);
2009-08-23 13:43:25 +02:00
return NULL; // latch timeout occurred
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If a dirty orphaned page is being reused - better write it first
// to clear current precedences and checkpoint state. This would also
// update the bcb_free_pages field appropriately.
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (bdb->bdb_flags & (BDB_dirty | BDB_db_dirty))
{
2009-08-23 13:43:25 +02:00
// If the caller didn't want to wait at all, then
// return 'try to fake an other page' to the caller.
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (!latch_wait)
{
attachment->backupStateReadUnLock(tdbb);
release_bdb(tdbb, bdb, false, false, false);
return NULL;
2001-05-23 15:26:42 +02:00
}
2008-12-18 11:47:25 +01:00
if (!write_buffer(tdbb, bdb, bdb->bdb_page, true, tdbb->tdbb_status_vector, true))
2003-12-22 11:00:59 +01:00
{
attachment->backupStateReadUnLock(tdbb);
CCH_unwind(tdbb, true);
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
}
2009-01-14 10:19:00 +01:00
else if (QUE_NOT_EMPTY(bdb->bdb_lower))
{
2009-08-23 13:43:25 +02:00
// Clear residual precedence left over from AST-level I/O.
clear_precedence(tdbb, bdb);
2001-05-23 15:26:42 +02:00
}
// Here the page must not be dirty and have no backup lock owner
fb_assert((bdb->bdb_flags & (BDB_dirty | BDB_db_dirty)) == 0);
2001-05-23 15:26:42 +02:00
bdb->bdb_flags = (BDB_writer | BDB_faked);
bdb->bdb_scan_count = 0;
lock_buffer(tdbb, bdb, LCK_WAIT, pag_undefined);
MOVE_CLEAR(bdb->bdb_buffer, (SLONG) dbb->dbb_page_size);
window->win_buffer = bdb->bdb_buffer;
window->win_bdb = bdb;
window->win_flags = 0;
CCH_MARK(tdbb, window);
return bdb->bdb_buffer;
}
pag* CCH_fetch(thread_db* tdbb, WIN* window, USHORT lock_type, SCHAR page_type, SSHORT latch_wait,
const bool read_shadow, const bool merge_flag)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ f e t c h
*
**************************************
*
* Functional description
* Fetch a specific page. If it's already in cache,
* so much the better.
*
* input
* latch_wait: 1 => Wait as long as necessary to get the latch.
* This can cause deadlocks of course.
* 0 => If the latch can't be acquired immediately,
* give up and return 0.
* <negative number> => Latch timeout interval in seconds.
*
* return
* PAG if successful.
* NULL pointer if timeout occurred (only possible if latch_wait <> 1).
*
**************************************/
SET_TDBB(tdbb);
2009-04-28 15:08:04 +02:00
//Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
CCH_TRACE(("FE %d:%06d", window->win_page.getPageSpaceID(), window->win_page.getPageNum()));
2007-04-25 04:26:33 +02:00
// FETCH_LOCK will return 0, 1, -1 or -2
2008-12-05 02:20:14 +01:00
2008-12-18 11:47:25 +01:00
const SSHORT fetch_lock_return = CCH_FETCH_LOCK(tdbb, window, lock_type, latch_wait, page_type);
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
switch (fetch_lock_return)
{
2009-01-14 10:19:00 +01:00
case 1:
CCH_TRACE(("FE %d:%06d", window->win_page.getPageSpaceID(), window->win_page.getPageNum()));
CCH_FETCH_PAGE(tdbb, window, read_shadow, merge_flag); // must read page from disk
2009-01-14 10:19:00 +01:00
break;
case -2:
case -1:
2009-08-23 13:43:25 +02:00
return NULL; // latch or lock timeout
}
2001-05-23 15:26:42 +02:00
BufferDesc* bdb = window->win_bdb;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// if merge_flag is not set the page will be changed before or after merge
// and should be written into delta again
if (!merge_flag)
bdb->bdb_flags &= ~BDB_merge;
2009-08-23 13:43:25 +02:00
// If a page was read or prefetched on behalf of a large scan
// then load the window scan count into the buffer descriptor.
// This buffer scan count is decremented by releasing a buffer
// with CCH_RELEASE_TAIL.
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Otherwise zero the buffer scan count to prevent the buffer
// from being queued to the LRU tail.
2001-05-23 15:26:42 +02:00
if (window->win_flags & WIN_large_scan)
{
2008-12-18 11:47:25 +01:00
if (fetch_lock_return == 1 || bdb->bdb_flags & BDB_prefetch || bdb->bdb_scan_count < 0)
{
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = window->win_scans;
}
2001-05-23 15:26:42 +02:00
}
else if (window->win_flags & WIN_garbage_collector)
{
if (fetch_lock_return == 1) {
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = -1;
}
if (bdb->bdb_flags & BDB_garbage_collect) {
2001-05-23 15:26:42 +02:00
window->win_flags |= WIN_garbage_collect;
}
2001-05-23 15:26:42 +02:00
}
else if (window->win_flags & WIN_secondary)
{
if (fetch_lock_return == 1) {
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = -1;
}
2001-05-23 15:26:42 +02:00
}
else
{
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = 0;
2008-12-05 02:20:14 +01:00
if (bdb->bdb_flags & BDB_garbage_collect) {
2001-05-23 15:26:42 +02:00
bdb->bdb_flags &= ~BDB_garbage_collect;
2003-09-13 20:35:39 +02:00
}
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// Validate the fetched page matches the expected type
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if (bdb->bdb_buffer->pag_type != page_type && page_type != pag_undefined)
{
page_validation_error(tdbb, window, page_type);
}
2001-05-23 15:26:42 +02:00
return window->win_buffer;
}
2008-12-18 11:47:25 +01:00
SSHORT CCH_fetch_lock(thread_db* tdbb, WIN* window, USHORT lock_type, SSHORT wait, SCHAR page_type)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ f e t c h _ l o c k
*
**************************************
*
* Functional description
* Fetch a latch and lock for a specific page.
2001-05-23 15:26:42 +02:00
*
* input
*
2008-12-05 02:20:14 +01:00
* wait:
* LCK_WAIT (1) => Wait as long a necessary to get the lock.
* This can cause deadlocks of course.
2001-05-23 15:26:42 +02:00
*
2008-12-05 02:20:14 +01:00
* LCK_NO_WAIT (0) =>
* If the latch can't be acquired immediately, give up and return -2.
* If the lock can't be acquired immediately, give up and return -1.
*
* <negative number> => Lock (latch) timeout interval in seconds.
2001-05-23 15:26:42 +02:00
*
* return
* 0: fetch & lock were successful, page doesn't need to be read.
* 1: fetch & lock were successful, page needs to be read from disk.
* -1: lock timed out, fetch failed.
* -2: latch timed out, fetch failed, lock not attempted.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// if there has been a shadow added recently, go out and
// find it before we grant any more write locks
2001-05-23 15:26:42 +02:00
if (dbb->dbb_ast_flags & DBB_get_shadows) {
SDW_get_shadows(tdbb);
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Look for the page in the cache.
Jrd::Attachment* attachment = tdbb->getAttachment();
if (!attachment->backupStateReadLock(tdbb, wait))
return -2;
2001-05-23 15:26:42 +02:00
BufferDesc* bdb = get_buffer(tdbb, window->win_page,
((lock_type >= LCK_write) ? LATCH_exclusive : LATCH_shared), wait);
2009-01-14 10:19:00 +01:00
if (wait != 1 && bdb == 0) {
2009-08-23 13:43:25 +02:00
return -2; // latch timeout
}
2001-05-23 15:26:42 +02:00
2008-12-05 02:20:14 +01:00
if (lock_type >= LCK_write)
2008-08-13 11:02:35 +02:00
{
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_writer;
}
2001-05-23 15:26:42 +02:00
window->win_bdb = bdb;
window->win_buffer = bdb->bdb_buffer;
2009-08-23 13:43:25 +02:00
// lock_buffer returns 0 or 1 or -1.
const SSHORT lock_result = lock_buffer(tdbb, bdb, wait, page_type);
if (lock_result == -1)
attachment->backupStateReadUnLock(tdbb);
return lock_result;
2001-05-23 15:26:42 +02:00
}
void CCH_fetch_page(thread_db* tdbb, WIN* window, const bool read_shadow, const bool merge_flag)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ f e t c h _ p a g e
*
**************************************
*
* Functional description
* Fetch a specific page. If it's already in cache,
* so much the better. When "compute_checksum" is 1, compute
* the checksum of the page. When it is 2, compute
* the checksum only when the page type is nonzero.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
BufferDesc* bdb = window->win_bdb;
2001-05-23 15:26:42 +02:00
2008-04-26 16:35:12 +02:00
ISC_STATUS* const status = tdbb->tdbb_status_vector;
2001-05-23 15:26:42 +02:00
pag* page = bdb->bdb_buffer;
2001-05-23 15:26:42 +02:00
bdb->bdb_incarnation = ++dbb->dbb_page_incarnation;
tdbb->bumpStats(RuntimeStatistics::PAGE_READS);
2001-05-23 15:26:42 +02:00
page = bdb->bdb_buffer;
2008-12-18 11:47:25 +01:00
PageSpace* pageSpace = dbb->dbb_page_manager.findPageSpace(bdb->bdb_page.getPageSpaceID());
2006-05-22 00:07:35 +02:00
fb_assert(pageSpace);
jrd_file* file = pageSpace->file;
SSHORT retryCount = 0;
2006-05-22 00:07:35 +02:00
const bool isTempPage = pageSpace->isTemporary();
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
/*
We will read a page, and if there is an I/O error we will try to
use the shadow file, and try reading again, for a maximum of
3 tries, before it gives up.
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
The read_shadow flag is set to false only in the call to
FETCH_NO_SHADOW, which is only called from validate
code.
2009-08-23 13:43:25 +02:00
read_shadow = false -> IF an I/O error occurs give up (exit
the loop, clean up, and return). So the caller,
validate in most cases, can know about it and attempt
to remedy the situation.
2009-08-23 13:43:25 +02:00
read_shadow = true -> IF an I/O error occurs attempt
to rollover to the shadow file. If the I/O error is
persistant (more than 3 times) error out of the routine by
calling CCH_unwind, and eventually punting out.
*/
2009-03-18 03:43:15 +01:00
BackupManager* bm = dbb->dbb_backup_manager;
const int bak_state = bm->getState();
fb_assert(bak_state != nbak_state_unknown);
2008-12-05 02:20:14 +01:00
ULONG diff_page = 0;
2009-04-01 12:49:54 +02:00
if (!isTempPage && bak_state != nbak_state_normal)
{
BackupManager::AllocReadGuard allocGuard(tdbb, dbb->dbb_backup_manager);
diff_page = bm->getPageIndex(tdbb, bdb->bdb_page.getPageNum());
2009-04-01 12:49:54 +02:00
NBAK_TRACE(("Reading page %d:%06d, state=%d, diff page=%d",
bdb->bdb_page.getPageSpaceID(), bdb->bdb_page.getPageNum(), bak_state, diff_page));
}
2008-01-16 09:31:31 +01:00
// In merge mode, if we are reading past beyond old end of file and page is in .delta file
// then we maintain actual page in difference file. Always read it from there.
2009-04-01 12:49:54 +02:00
if (isTempPage || bak_state == nbak_state_normal || !diff_page)
{
NBAK_TRACE(("Reading page %d:%06d, state=%d, diff page=%d from DISK",
bdb->bdb_page.getPageSpaceID(), bdb->bdb_page.getPageNum(), bak_state, diff_page));
2009-03-18 03:43:15 +01:00
// Read page from disk as normal
2009-03-18 03:43:15 +01:00
while (!PIO_read(file, bdb, page, status))
{
if (isTempPage || !read_shadow) {
break;
}
2009-06-26 06:12:20 +02:00
if (!CCH_rollover_to_shadow(tdbb, dbb, file, false))
{
PAGE_LOCK_RELEASE(bdb->bdb_lock);
CCH_unwind(tdbb, true);
}
if (file != pageSpace->file) {
file = pageSpace->file;
}
else
{
2009-06-26 06:12:20 +02:00
if (retryCount++ == 3)
{
2009-04-01 12:49:54 +02:00
fprintf(stderr, "IO error loop Unwind to avoid a hang\n");
PAGE_LOCK_RELEASE(bdb->bdb_lock);
CCH_unwind(tdbb, true);
}
}
}
}
else
{
2009-04-01 12:49:54 +02:00
NBAK_TRACE(("Reading page %d, state=%d, diff page=%d from DIFFERENCE",
bdb->bdb_page, bak_state, diff_page));
2009-06-26 06:12:20 +02:00
if (!bm->readDifference(tdbb, diff_page, page))
{
PAGE_LOCK_RELEASE(bdb->bdb_lock);
CCH_unwind(tdbb, true);
}
// This is the first reading the page from delta and it must not be written into it again
if (merge_flag)
bdb->bdb_flags |= BDB_merge;
if ((page->pag_type == 0) && !merge_flag)
2009-04-01 12:49:54 +02:00
{
// We encountered a page which was allocated, but never written to the
// difference file. In this case we try to read the page from database. With
// this approach if the page was old we get it from DISK, and if the page
// was new IO error (EOF) or BUGCHECK (checksum error) will be the result.
// Engine is not supposed to read a page which was never written unless
// this is a merge process.
2009-04-01 12:49:54 +02:00
NBAK_TRACE(("Re-reading page %d, state=%d, diff page=%d from DISK",
bdb->bdb_page, bak_state, diff_page));
while (!PIO_read(file, bdb, page, status))
{
if (!read_shadow) {
break;
}
2008-01-16 09:31:31 +01:00
2009-06-26 06:12:20 +02:00
if (!CCH_rollover_to_shadow(tdbb, dbb, file, false))
{
PAGE_LOCK_RELEASE(bdb->bdb_lock);
CCH_unwind(tdbb, true);
}
2006-05-22 00:07:35 +02:00
if (file != pageSpace->file) {
file = pageSpace->file;
}
else
{
2009-06-26 06:12:20 +02:00
if (retryCount++ == 3)
{
fprintf(stderr, "IO error loop Unwind to avoid a hang\n");
PAGE_LOCK_RELEASE(bdb->bdb_lock);
CCH_unwind(tdbb, true);
}
}
}
}
}
2001-05-23 15:26:42 +02:00
bdb->bdb_flags &= ~(BDB_not_valid | BDB_read_pending);
window->win_buffer = bdb->bdb_buffer;
}
2009-08-23 13:43:25 +02:00
void CCH_forget_page(thread_db* tdbb, WIN* window)
{
/**************************************
*
* C C H _ f o r g e t _ p a g e
*
**************************************
*
* Functional description
* Page was faked but can't be written on disk. Most probably because
2007-04-27 04:28:57 +02:00
* of out of disk space. Release page buffer and others resources and
* unlink page from various queues
*
**************************************/
SET_TDBB(tdbb);
BufferDesc* bdb = window->win_bdb;
Database* dbb = tdbb->getDatabase();
if (window->win_page != bdb->bdb_page ||
2008-12-05 02:20:14 +01:00
bdb->bdb_buffer->pag_type != pag_undefined)
{
// buffer was reassigned or page was reused
return;
}
window->win_bdb = NULL;
if (tdbb->tdbb_flags & TDBB_no_cache_unwind) {
release_bdb(tdbb, bdb, false, false, false);
}
if (bdb->bdb_flags & BDB_io_error) {
dbb->dbb_flags &= ~DBB_suspend_bgio;
}
clear_dirty_flag(tdbb, bdb);
bdb->bdb_flags = 0;
BufferControl* bcb = dbb->dbb_bcb;
removeDirty(bcb, bdb);
QUE_DELETE(bdb->bdb_in_use);
QUE_DELETE(bdb->bdb_que);
QUE_INSERT(bcb->bcb_empty, bdb->bdb_que);
}
void CCH_fini(thread_db* tdbb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ f i n i
*
**************************************
*
* Functional description
* Shut down buffer operation.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2004-01-13 10:52:19 +01:00
bool flush_error = false;
2008-12-05 02:20:14 +01:00
2004-01-13 10:52:19 +01:00
// CVC: Patching a conversion error FB1->FB2 with crude logic
for (int i = 0; i < 2; ++i)
{
2004-01-13 10:52:19 +01:00
try {
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If we've been initialized, either flush buffers
// or release locks, depending on where we've been
// bug-checked; as a defensive programming measure,
// make sure that the buffers were actually allocated.
2001-05-23 15:26:42 +02:00
2004-01-13 10:52:19 +01:00
bcb_repeat* tail;
BufferControl* bcb = dbb->dbb_bcb;
if (bcb && (tail = bcb->bcb_rpt) && (tail->bcb_bdb))
{
if (dbb->dbb_flags & DBB_bugcheck || flush_error)
{
2008-12-18 11:47:25 +01:00
for (const bcb_repeat* const end = bcb->bcb_rpt + bcb->bcb_count; tail < end; tail++)
2004-01-13 10:52:19 +01:00
{
BufferDesc* bdb = tail->bcb_bdb;
2004-01-13 10:52:19 +01:00
PAGE_LOCK_RELEASE(bdb->bdb_lock);
2001-05-23 15:26:42 +02:00
}
2004-01-13 10:52:19 +01:00
}
else {
CCH_flush(tdbb, FLUSH_FINI, (SLONG) 0);
2001-05-23 15:26:42 +02:00
}
}
2001-05-23 15:26:42 +02:00
#ifdef CACHE_READER
2009-08-23 13:43:25 +02:00
// Shutdown the dedicated cache reader for this database.
2001-05-23 15:26:42 +02:00
if ((bcb = dbb->dbb_bcb) && (bcb->bcb_flags & BCB_cache_reader))
{
2004-01-13 10:52:19 +01:00
bcb->bcb_flags &= ~BCB_cache_reader;
dbb->dbb_reader_sem.release();
{ // scope
Database::Checkout dcoHolder(dbb);
dbb->dbb_reader_fini.enter();
}
2004-01-13 10:52:19 +01:00
}
2001-05-23 15:26:42 +02:00
#endif
#ifdef CACHE_WRITER
2009-08-23 13:43:25 +02:00
// Wait for cache writer startup to complete.
2007-01-18 16:50:18 +01:00
while ((bcb = dbb->dbb_bcb) && (bcb->bcb_flags & BCB_writer_start))
{
Database::Checkout dcoHolder(dbb);
2007-01-18 16:50:18 +01:00
THREAD_YIELD();
}
2009-08-23 13:43:25 +02:00
// Shutdown the dedicated cache writer for this database.
2001-05-23 15:26:42 +02:00
if ((bcb = dbb->dbb_bcb) && (bcb->bcb_flags & BCB_cache_writer))
{
2004-01-13 10:52:19 +01:00
bcb->bcb_flags &= ~BCB_cache_writer;
dbb->dbb_writer_sem.release(); // Wake up running thread
{ // scope
Database::Checkout dcoHolder(dbb);
dbb->dbb_writer_fini.enter();
}
2004-01-13 10:52:19 +01:00
}
2001-05-23 15:26:42 +02:00
#endif
2009-08-23 13:43:25 +02:00
// close the database file and all associated shadow files
2001-05-23 15:26:42 +02:00
2006-05-22 00:07:35 +02:00
//PIO_close(dbb->dbb_file);
dbb->dbb_page_manager.closeAll();
2004-01-13 10:52:19 +01:00
SDW_close();
2001-05-23 15:26:42 +02:00
2008-12-05 02:20:14 +01:00
if ( (bcb = dbb->dbb_bcb) )
{
2008-12-05 02:20:14 +01:00
while (bcb->bcb_memory.hasData())
{
2006-12-04 22:26:43 +01:00
dbb->dbb_bufferpool->deallocate(bcb->bcb_memory.pop());
2004-01-13 10:52:19 +01:00
}
2001-05-23 15:26:42 +02:00
#ifdef CACHE_WRITER
2009-08-23 13:43:25 +02:00
// Dispose off any associated latching semaphores
2008-12-05 02:20:14 +01:00
while (QUE_NOT_EMPTY(bcb->bcb_free_lwt))
{
QUE que_inst = bcb->bcb_free_lwt.que_forward;
2008-05-11 14:27:51 +02:00
QUE_DELETE(*que_inst);
2008-10-11 04:42:01 +02:00
// LatchWait* lwt = (LatchWait*) BLOCK(que_inst, LatchWait*, lwt_waiters);
2004-01-13 10:52:19 +01:00
}
2001-05-23 15:26:42 +02:00
#endif
2004-01-13 10:52:19 +01:00
}
2004-01-13 10:52:19 +01:00
} // try
catch (const Firebird::Exception& ex)
2004-01-13 10:52:19 +01:00
{
Firebird::stuff_exception(tdbb->tdbb_status_vector, ex);
2004-01-13 10:52:19 +01:00
if (!flush_error) {
flush_error = true;
}
else {
ERR_punt();
}
}
2008-12-05 02:20:14 +01:00
2009-11-16 09:06:31 +01:00
if (!flush_error) {
// wasn't set in the catch => no failure, just exit
2004-01-13 10:52:19 +01:00
break;
2001-12-24 03:51:06 +01:00
}
2004-01-13 10:52:19 +01:00
} // for
2001-05-23 15:26:42 +02:00
}
void CCH_flush(thread_db* tdbb, USHORT flush_flag, SLONG tra_number)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ f l u s h
*
**************************************
*
* Functional description
* Flush all buffers. If the release flag is set,
2001-05-23 15:26:42 +02:00
* release all locks.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
ISC_STATUS* status = tdbb->tdbb_status_vector;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// note that some of the code for btc_flush()
// replicates code in the for loop
// to minimize call overhead -- changes should be made in both places
2001-05-23 15:26:42 +02:00
if (flush_flag & (FLUSH_TRAN | FLUSH_SYSTEM))
{
2009-02-28 12:57:40 +01:00
const SLONG transaction_mask = tra_number ? 1L << (tra_number & (BITS_PER_LONG - 1)) : 0;
bool sys_only = false;
if (!transaction_mask && (flush_flag & FLUSH_SYSTEM)) {
2003-12-22 11:00:59 +01:00
sys_only = true;
}
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER_V2
BufferControl* bcb = dbb->dbb_bcb;
2009-08-23 13:43:25 +02:00
//if (!dbb->dbb_wal && A && B) becomes
//if (true && A && B) then finally (A && B)
if (!(dbb->dbb_flags & DBB_force_write) && transaction_mask)
{
2001-05-23 15:26:42 +02:00
dbb->dbb_flush_cycle |= transaction_mask;
if (!(bcb->bcb_flags & BCB_writer_active))
dbb->dbb_writer_sem.release();
2001-05-23 15:26:42 +02:00
}
else
#endif
flushDirty(tdbb, transaction_mask, sys_only, status);
2001-05-23 15:26:42 +02:00
}
else
{
flushAll(tdbb, flush_flag);
2001-05-23 15:26:42 +02:00
}
2008-12-05 02:20:14 +01:00
//
// Check if flush needed
//
const int max_unflushed_writes = dbb->dbb_config->getMaxUnflushedWrites();
const time_t max_unflushed_write_time = dbb->dbb_config->getMaxUnflushedWriteTime();
2003-02-16 14:25:44 +01:00
bool max_num = (max_unflushed_writes >= 0);
bool max_time = (max_unflushed_write_time >= 0);
bool doFlush = false;
2006-05-22 00:07:35 +02:00
PageSpace* pageSpaceID = dbb->dbb_page_manager.findPageSpace(DB_PAGE_SPACE);
jrd_file* main_file = pageSpaceID->file;
if (!(main_file->fil_flags & FIL_force_write) && (max_num || max_time))
{
2003-10-08 10:42:48 +02:00
const time_t now = time(0);
2003-02-16 14:25:44 +01:00
Database::CheckoutLockGuard guard(dbb, dbb->dbb_flush_count_mutex);
// If this is the first commit set last_flushed_write to now
if (!dbb->last_flushed_write)
{
dbb->last_flushed_write = now;
}
2003-02-16 14:25:44 +01:00
// test max_num condition and max_time condition
2008-12-18 11:47:25 +01:00
max_num = max_num && (dbb->unflushed_writes == max_unflushed_writes);
max_time = max_time && (now - dbb->last_flushed_write > max_unflushed_write_time);
2003-02-16 14:25:44 +01:00
if (max_num || max_time)
{
2003-02-16 14:25:44 +01:00
doFlush = true;
dbb->unflushed_writes = 0;
dbb->last_flushed_write = now;
}
2003-02-16 14:25:44 +01:00
else
{
dbb->unflushed_writes++;
}
}
2001-05-23 15:26:42 +02:00
if (doFlush)
{
2008-03-19 16:55:11 +01:00
PIO_flush(dbb, main_file);
if (dbb->dbb_shadow)
2003-02-16 14:25:44 +01:00
{
2008-03-19 16:55:11 +01:00
PIO_flush(dbb, dbb->dbb_shadow->sdw_file);
2003-02-16 14:25:44 +01:00
}
tdbb->bumpStats(RuntimeStatistics::FLUSHES);
}
2003-02-16 14:25:44 +01:00
2009-08-23 13:43:25 +02:00
// take the opportunity when we know there are no pages
// in cache to check that the shadow(s) have not been
// scheduled for shutdown or deletion
2001-05-23 15:26:42 +02:00
SDW_check(tdbb);
2001-05-23 15:26:42 +02:00
}
void CCH_flush_ast(thread_db* tdbb)
2007-02-06 09:03:43 +01:00
{
/**************************************
*
* C C H _ f l u s h _ a s t
2007-02-06 09:03:43 +01:00
*
**************************************
*
* Functional description
* Flush all buffers coming from database file.
* Should be called from AST
2007-02-06 09:03:43 +01:00
*
**************************************/
SET_TDBB(tdbb);
#ifdef SUPERSERVER
CCH_flush(tdbb, FLUSH_ALL, 0);
2008-12-05 02:20:14 +01:00
#else
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
2007-02-08 01:03:36 +01:00
// Do some fancy footwork to make sure that pages are
// not removed from the btc tree at AST level. Then
// restore the flag to whatever it was before.
2007-02-06 09:03:43 +01:00
const bool keep_pages = bcb->bcb_flags & BCB_keep_pages;
dbb->dbb_bcb->bcb_flags |= BCB_keep_pages;
2009-06-26 06:12:20 +02:00
for (ULONG i = 0; (bcb = dbb->dbb_bcb) && i < bcb->bcb_count; i++)
{
2007-04-25 04:26:33 +02:00
BufferDesc* bdb = bcb->bcb_rpt[i].bcb_bdb;
2008-06-05 13:02:42 +02:00
if (bdb->bdb_flags & (BDB_dirty | BDB_db_dirty))
down_grade(tdbb, bdb);
2007-02-06 09:03:43 +01:00
}
2007-02-06 09:03:43 +01:00
if (!keep_pages) {
bcb->bcb_flags &= ~BCB_keep_pages;
}
#endif
}
bool CCH_free_page(thread_db* tdbb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ f r e e _ p a g e
*
**************************************
*
* Functional description
* Check if the cache is below its free pages
* threshold and write a page on the LRU tail.
*
**************************************/
2009-08-23 13:43:25 +02:00
// Called by VIO/garbage_collector() when it is idle to
// help quench the thirst for free pages.
2001-05-23 15:26:42 +02:00
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
if (dbb->dbb_flags & DBB_read_only) {
return false;
}
2001-05-23 15:26:42 +02:00
BufferDesc* bdb;
2008-12-18 11:47:25 +01:00
if (bcb->bcb_flags & BCB_free_pending && (bdb = get_buffer(tdbb, FREE_PAGE, LATCH_none, 1)))
2003-12-22 11:00:59 +01:00
{
2008-12-18 11:47:25 +01:00
if (!write_buffer(tdbb, bdb, bdb->bdb_page, true, tdbb->tdbb_status_vector, true))
2003-12-22 11:00:59 +01:00
{
CCH_unwind(tdbb, false);
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
else
return true;
2001-05-23 15:26:42 +02:00
}
return false;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
SLONG CCH_get_incarnation(WIN* window)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ g e t _ i n c a r n a t i o n
*
**************************************
*
* Functional description
* Get page incarnation associated with buffer.
*
**************************************/
return window->win_bdb->bdb_incarnation;
}
void CCH_get_related(thread_db* tdbb, PageNumber page, PagesArray &lowPages)
{
/**************************************
*
* C C H _ g e t _ r e l a t e d
*
**************************************
*
* Functional description
* Collect all pages, dependent on given page (i.e. all pages which must be
* written after given page). To do it, walk low part of precedence graph
2009-10-15 04:15:31 +02:00
* starting from given page and put its numbers into array.
*
**************************************/
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
QUE mod_que = &bcb->bcb_rpt[page.getPageNum() % bcb->bcb_count].bcb_page_mod;
QUE que_inst;
for (que_inst = mod_que->que_forward; que_inst != mod_que; que_inst = que_inst->que_forward)
{
BufferDesc* bdb = BLOCK(que_inst, BufferDesc*, bdb_que);
2009-10-15 04:15:31 +02:00
if (bdb->bdb_page == page)
{
const ULONG mark = get_prec_walk_mark(bcb);
get_related(bdb, lowPages, PRE_SEARCH_LIMIT, mark);
return;
}
}
}
2008-12-18 11:47:25 +01:00
pag* CCH_handoff(thread_db* tdbb, WIN* window, SLONG page, SSHORT lock, SCHAR page_type,
SSHORT latch_wait, const bool release_tail)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ h a n d o f f
*
**************************************
*
* Functional description
* Follow a pointer handing off the lock. Fetch the new page
* before retiring the old page lock.
*
* input
* latch_wait: 1 => Wait as long as necessary to get the latch.
* This can cause deadlocks of course.
* 0 => If the latch can't be acquired immediately,
* give up and return 0.
* <negative number> => Latch timeout interval in seconds.
*
* return
* PAG if successful.
* 0 if a latch timeout occurred (only possible if latch_wait <> 1).
* The latch on the fetched page is downgraded to shared.
* The fetched page is unmarked.
*
**************************************/
2009-08-23 13:43:25 +02:00
// The update, if there was one, of the input page is complete.
// The cache buffer can be 'unmarked'. It is important to
// unmark before CCH_unwind is (might be) called.
2001-05-23 15:26:42 +02:00
SET_TDBB(tdbb);
2009-04-01 12:49:54 +02:00
CCH_TRACE(("H %d:%06d->%06d",
window->win_page.getPageSpaceID(), window->win_page.getPageNum(), page));
2001-05-23 15:26:42 +02:00
unmark(tdbb, window);
2009-08-23 13:43:25 +02:00
// If the 'from-page' and 'to-page' of the handoff are the
// same and the latch requested is shared then downgrade it.
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if ((window->win_page.getPageNum() == page) && (lock == LCK_read))
{
release_bdb(tdbb, window->win_bdb, false, true, false);
2001-05-23 15:26:42 +02:00
return window->win_buffer;
}
WIN temp = *window;
2006-05-22 00:07:35 +02:00
window->win_page = PageNumber(window->win_page.getPageSpaceID(), page);
2008-12-18 11:47:25 +01:00
const SSHORT must_read = CCH_FETCH_LOCK(tdbb, window, lock, latch_wait, page_type);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Latch or lock timeout, return failure.
2001-05-23 15:26:42 +02:00
if (must_read == -2 || must_read == -1)
{
2001-05-23 15:26:42 +02:00
*window = temp;
CCH_RELEASE(tdbb, window);
return NULL;
2001-05-23 15:26:42 +02:00
}
if (release_tail)
CCH_RELEASE_TAIL(tdbb, &temp);
else
CCH_RELEASE(tdbb, &temp);
if (must_read) {
CCH_FETCH_PAGE(tdbb, window, true, false);
}
2001-05-23 15:26:42 +02:00
BufferDesc* bdb = window->win_bdb;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If a page was read or prefetched on behalf of a large scan
// then load the window scan count into the buffer descriptor.
// This buffer scan count is decremented by releasing a buffer
// with CCH_RELEASE_TAIL.
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Otherwise zero the buffer scan count to prevent the buffer
// from being queued to the LRU tail.
2001-05-23 15:26:42 +02:00
if (window->win_flags & WIN_large_scan)
{
2008-12-18 11:47:25 +01:00
if (must_read == 1 || bdb->bdb_flags & BDB_prefetch || bdb->bdb_scan_count < 0)
{
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = window->win_scans;
}
2001-05-23 15:26:42 +02:00
}
else if (window->win_flags & WIN_garbage_collector)
{
if (must_read == 1) {
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = -1;
}
if (bdb->bdb_flags & BDB_garbage_collect) {
2001-05-23 15:26:42 +02:00
window->win_flags |= WIN_garbage_collect;
}
2001-05-23 15:26:42 +02:00
}
else if (window->win_flags & WIN_secondary)
{
if (must_read == 1) {
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = -1;
}
2001-05-23 15:26:42 +02:00
}
else
{
2001-05-23 15:26:42 +02:00
bdb->bdb_scan_count = 0;
2003-09-13 20:35:39 +02:00
if (bdb->bdb_flags & BDB_garbage_collect) {
2001-05-23 15:26:42 +02:00
bdb->bdb_flags &= ~BDB_garbage_collect;
2003-09-13 20:35:39 +02:00
}
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// Validate the fetched page matches the expected type
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if (bdb->bdb_buffer->pag_type != page_type && page_type != pag_undefined)
{
page_validation_error(tdbb, window, page_type);
}
2001-05-23 15:26:42 +02:00
return window->win_buffer;
}
void CCH_init(thread_db* tdbb, ULONG number)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ i n i t
*
**************************************
*
* Functional description
* Initialize the cache. Allocate buffers control block,
* buffer descriptors, and actual buffers.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2008-12-05 02:20:14 +01:00
2007-04-25 08:32:54 +02:00
CCH_TRACE(("INIT %s", dbb->dbb_filename.c_str()));
2007-04-25 04:26:33 +02:00
// Check for database-specific page buffers
2001-05-23 15:26:42 +02:00
if (dbb->dbb_page_buffers) {
2001-05-23 15:26:42 +02:00
number = dbb->dbb_page_buffers;
}
2001-05-23 15:26:42 +02:00
2007-04-25 04:26:33 +02:00
// Enforce page buffer cache constraints
2001-05-23 15:26:42 +02:00
if (number < MIN_PAGE_BUFFERS) {
2001-05-23 15:26:42 +02:00
number = MIN_PAGE_BUFFERS;
}
if (number > MAX_PAGE_BUFFERS) {
2001-05-23 15:26:42 +02:00
number = MAX_PAGE_BUFFERS;
}
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
const SLONG count = number;
2001-05-23 15:26:42 +02:00
2007-04-25 04:26:33 +02:00
// Allocate and initialize buffers control block
BufferControl* bcb = 0;
while (!bcb)
{
2001-12-24 03:51:06 +01:00
try {
bcb = FB_NEW_RPT(*dbb->dbb_bufferpool, number) BufferControl(*dbb->dbb_bufferpool);
2006-05-20 05:55:54 +02:00
}
catch (const Firebird::Exception& ex)
{
Firebird::stuff_exception(tdbb->tdbb_status_vector, ex);
2009-08-23 13:43:25 +02:00
// If the buffer control block can't be allocated, memory is
// very low. Recalculate the number of buffers to account for
// page buffer overhead and reduce that number by a 25% fudge factor.
2001-05-23 15:26:42 +02:00
2001-12-24 03:51:06 +01:00
number = (sizeof(bcb_repeat) * number) / PAGE_OVERHEAD;
number -= number >> 2;
2001-05-23 15:26:42 +02:00
if (number < MIN_PAGE_BUFFERS) {
ERR_post(Arg::Gds(isc_cache_too_small));
}
2001-12-24 03:51:06 +01:00
}
2001-05-23 15:26:42 +02:00
}
dbb->dbb_bcb = bcb;
QUE_INIT(bcb->bcb_in_use);
QUE_INIT(bcb->bcb_dirty);
bcb->bcb_dirty_count = 0;
QUE_INIT(bcb->bcb_empty);
QUE_INIT(bcb->bcb_free_lwt);
QUE_INIT(bcb->bcb_free_slt);
2001-05-23 15:26:42 +02:00
2007-04-25 04:26:33 +02:00
// initialization of memory is system-specific
2001-05-23 15:26:42 +02:00
2007-04-11 18:05:40 +02:00
bcb->bcb_count = memory_init(tdbb, bcb, static_cast<SLONG>(number));
bcb->bcb_free_minimum = (SSHORT) MIN(bcb->bcb_count / 4, 128);
2001-05-23 15:26:42 +02:00
if (bcb->bcb_count < MIN_PAGE_BUFFERS) {
ERR_post(Arg::Gds(isc_cache_too_small));
}
2001-05-23 15:26:42 +02:00
2007-04-25 04:26:33 +02:00
// Log if requested number of page buffers could not be allocated.
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (count != (SLONG) bcb->bcb_count)
{
2008-12-18 11:47:25 +01:00
gds__log("Database: %s\n\tAllocated %ld page buffers of %ld requested",
tdbb->getAttachment()->att_filename.c_str(), bcb->bcb_count, count);
}
2001-05-23 15:26:42 +02:00
if (dbb->dbb_lock->lck_logical != LCK_EX) {
2001-05-23 15:26:42 +02:00
dbb->dbb_ast_flags |= DBB_assert_locks;
}
2001-05-23 15:26:42 +02:00
#ifdef CACHE_READER
if (gds__thread_start(cache_reader, dbb, THREAD_high, 0, 0))
{
2001-05-23 15:26:42 +02:00
ERR_bugcheck_msg("cannot start thread");
}
2001-05-23 15:26:42 +02:00
{ // scope
Database::Checkout dcoHolder(dbb);
dbb->dbb_reader_init.enter();
}
2001-05-23 15:26:42 +02:00
#endif
#ifdef CACHE_WRITER
if (!(dbb->dbb_flags & DBB_read_only))
{
2007-01-18 16:50:18 +01:00
// writer startup in progress
bcb->bcb_flags |= BCB_writer_start;
2008-12-18 11:47:25 +01:00
if (gds__thread_start(cache_writer, dbb, THREAD_high, 0, 0))
{
2007-01-18 16:50:18 +01:00
bcb->bcb_flags &= ~BCB_writer_start;
2001-05-23 15:26:42 +02:00
ERR_bugcheck_msg("cannot start thread");
}
{ // scope
Database::Checkout dcoHolder(dbb);
dbb->dbb_writer_init.enter();
}
2001-05-23 15:26:42 +02:00
}
#endif
}
2009-08-23 13:43:25 +02:00
void CCH_mark(thread_db* tdbb, WIN* window, USHORT mark_system, USHORT must_write)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ m a r k
*
**************************************
*
* Functional description
* Mark a window as dirty.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
tdbb->bumpStats(RuntimeStatistics::PAGE_MARKS);
BufferControl* bcb = dbb->dbb_bcb;
BufferDesc* bdb = window->win_bdb;
2001-05-23 15:26:42 +02:00
BLKCHK(bdb, type_bdb);
if (!(bdb->bdb_flags & BDB_writer)) {
2009-08-23 13:43:25 +02:00
BUGCHECK(208); // msg 208 page not accessed for write
}
CCH_TRACE(("M %d:%06d", window->win_page.getPageSpaceID(), window->win_page.getPageNum()));
2009-08-23 13:43:25 +02:00
// A LATCH_mark is needed before the BufferDesc can be marked.
// This prevents a write while the page is being modified.
2001-05-23 15:26:42 +02:00
if (latch_bdb(tdbb, LATCH_mark, bdb, bdb->bdb_page, 1) == -1) {
2009-08-23 13:43:25 +02:00
BUGCHECK(302); // msg 302 unexpected page change
}
2001-05-23 15:26:42 +02:00
bdb->bdb_incarnation = ++dbb->dbb_page_incarnation;
2009-08-23 13:43:25 +02:00
// mark the dirty bit vector for this specific transaction,
// if it exists; otherwise mark that the system transaction
// has updated this page
2001-05-23 15:26:42 +02:00
SLONG number;
jrd_tra* transaction = tdbb->getTransaction();
if (transaction && (number = transaction->tra_number))
{
2009-06-26 06:12:20 +02:00
if (!(tdbb->tdbb_flags & TDBB_sweeper))
{
const ULONG trans_bucket = number & (BITS_PER_LONG - 1);
2001-05-23 15:26:42 +02:00
bdb->bdb_transactions |= (1L << trans_bucket);
if (number > bdb->bdb_mark_transaction) {
2001-05-23 15:26:42 +02:00
bdb->bdb_mark_transaction = number;
}
2001-05-23 15:26:42 +02:00
}
}
else {
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_system_dirty;
}
2001-05-23 15:26:42 +02:00
if (mark_system) {
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_system_dirty;
}
2001-05-23 15:26:42 +02:00
2008-06-05 13:02:42 +02:00
if (!(tdbb->tdbb_flags & TDBB_sweeper) || bdb->bdb_flags & BDB_system_dirty)
{
insertDirty(bcb, bdb);
2001-05-23 15:26:42 +02:00
}
#ifdef SUPERSERVER
bdb->bdb_flags |= BDB_db_dirty;
#endif
set_dirty_flag(tdbb, bdb);
2001-05-23 15:26:42 +02:00
if (must_write || dbb->dbb_backup_manager->databaseFlushInProgress())
bdb->bdb_flags |= BDB_must_write;
2001-05-23 15:26:42 +02:00
set_diff_page(tdbb, bdb);
bdb->bdb_flags |= BDB_marked;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
void CCH_must_write(WIN* window)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ m u s t _ w r i t e
*
**************************************
*
* Functional description
* Mark a window as "must write".
*
**************************************/
Jrd::thread_db* tdbb = NULL;
SET_TDBB(tdbb);
2009-04-28 15:08:04 +02:00
//Database* dbb = tdbb->getDatabase();
BufferDesc* bdb = window->win_bdb;
2001-05-23 15:26:42 +02:00
BLKCHK(bdb, type_bdb);
if (!(bdb->bdb_flags & BDB_marked) || !(bdb->bdb_flags & BDB_dirty)) {
2009-08-23 13:43:25 +02:00
BUGCHECK(208); // msg 208 page not accessed for write
}
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_must_write;
set_dirty_flag(tdbb, bdb);
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
void CCH_precedence(thread_db* tdbb, WIN* window, SLONG pageNum)
2006-05-22 00:07:35 +02:00
{
const USHORT pageSpaceID = pageNum > FIRST_PIP_PAGE ?
2006-05-22 00:07:35 +02:00
window->win_page.getPageSpaceID() : DB_PAGE_SPACE;
CCH_precedence(tdbb, window, PageNumber(pageSpaceID, pageNum));
}
2009-08-23 13:43:25 +02:00
void CCH_precedence(thread_db* tdbb, WIN* window, PageNumber page)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ p r e c e d e n c e
*
**************************************
*
* Functional description
* Given a window accessed for write and a page number,
* establish a precedence relationship such that the
* specified page will always be written before the page
* associated with the window.
*
* If the "page number" is negative, it is really a transaction
* id. In this case, the precedence relationship is to the
* database header page from which the transaction id was
* obtained. If the header page has been written since the
* transaction id was assigned, no precedence relationship
* is required.
*
**************************************/
2009-08-23 13:43:25 +02:00
// If the page is zero, the caller isn't really serious
2001-05-23 15:26:42 +02:00
2006-05-22 00:07:35 +02:00
if (page.getPageNum() == 0) {
2001-05-23 15:26:42 +02:00
return;
}
2001-05-23 15:26:42 +02:00
2008-12-05 02:20:14 +01:00
// no need to support precedence for temporary pages
if (page.isTemporary() || window->win_page.isTemporary()) {
return;
}
2001-05-23 15:26:42 +02:00
check_precedence(tdbb, window, page);
}
#ifdef CACHE_READER
2009-12-13 14:49:43 +01:00
void CCH_prefetch(thread_db* tdbb, SLONG* pages, SSHORT count)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ p r e f e t c h
*
**************************************
*
* Functional description
* Given a vector of pages, set corresponding bits
* in global prefetch bitmap. Initiate an asynchronous
* I/O and get the cache reader reading in our behalf
* as well.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (!count || !(bcb->bcb_flags & BCB_cache_reader))
{
2009-08-23 13:43:25 +02:00
// Caller isn't really serious.
2001-05-23 15:26:42 +02:00
return;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Switch default pool to permanent pool for setting bits in prefetch bitmap.
Jrd::ContextPoolHolder context(tdbb, dbb->dbb_bufferpool);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// The global prefetch bitmap is the key to the I/O coalescense mechanism which dovetails
// all thread prefetch requests to minimize sequential I/O requests.
// It also enables multipage I/O by implicitly sorting page vector requests.
2001-05-23 15:26:42 +02:00
SLONG first_page = 0;
for (const SLONG* const end = pages + count; pages < end;)
{
const SLONG page = *pages++;
2009-06-26 06:12:20 +02:00
if (page)
{
2001-05-23 15:26:42 +02:00
SBM_set(tdbb, &bcb->bcb_prefetch, page);
if (!first_page)
first_page = page;
}
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Not likely that the caller's page vector was empty but check anyway.
2001-05-23 15:26:42 +02:00
if (first_page)
{
2003-10-20 12:53:52 +02:00
prf prefetch;
2001-05-23 15:26:42 +02:00
prefetch_init(&prefetch, tdbb);
prefetch_prologue(&prefetch, &first_page);
prefetch_io(&prefetch, tdbb->tdbb_status_vector);
prefetch_epilogue(&prefetch, tdbb->tdbb_status_vector);
}
}
bool CCH_prefetch_pages(thread_db* tdbb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ p r e f e t c h _ p a g e s
*
**************************************
*
* Functional description
* Check the prefetch bitmap for a set
* of pages and read them into the cache.
2001-05-23 15:26:42 +02:00
*
**************************************/
2009-08-23 13:43:25 +02:00
// Placeholder to be implemented when predictive prefetch is
// enabled. This is called by VIO/garbage_collector() when it
// is idle to help satisfy the prefetch demand.
2001-05-23 15:26:42 +02:00
return false;
2001-05-23 15:26:42 +02:00
}
#endif // CACHE_READER
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
void set_diff_page(thread_db* tdbb, BufferDesc* bdb)
{
2009-06-06 11:05:20 +02:00
Database* const dbb = tdbb->getDatabase();
BackupManager* const bm = dbb->dbb_backup_manager;
// Determine location of the page in difference file and write destination
// so BufferDesc AST handlers and write_page routine can safely use this information
if (bdb->bdb_page != HEADER_PAGE_NUMBER)
{
// SCN of header page is adjusted in nbak.cpp
if (bdb->bdb_buffer->pag_scn != bm->getCurrentSCN())
{
bdb->bdb_buffer->pag_scn = bm->getCurrentSCN(); // Set SCN for the page
win window(bdb->bdb_page);
window.win_bdb = bdb;
window.win_buffer = bdb->bdb_buffer;
PAG_set_page_scn(tdbb, &window);
}
}
const int backup_state = bm->getState();
if (backup_state == nbak_state_normal)
return;
// Temporary pages don't write to delta
2008-12-18 11:47:25 +01:00
PageSpace* pageSpace = dbb->dbb_page_manager.findPageSpace(bdb->bdb_page.getPageSpaceID());
fb_assert(pageSpace);
if (pageSpace->isTemporary())
return;
2009-01-20 09:33:59 +01:00
switch (backup_state)
{
case nbak_state_stalled:
{ //scope
BackupManager::AllocReadGuard allocGuard(tdbb, bm);
bdb->bdb_difference_page = bm->getPageIndex(tdbb, bdb->bdb_page.getPageNum());
}
if (!bdb->bdb_difference_page)
{
{ //scope
BackupManager::AllocWriteGuard allocGuard(tdbb, bm);
bdb->bdb_difference_page = bm->allocateDifferencePage(tdbb, bdb->bdb_page.getPageNum());
}
2009-06-26 06:12:20 +02:00
if (!bdb->bdb_difference_page)
{
invalidate_and_release_buffer(tdbb, bdb);
CCH_unwind(tdbb, true);
}
2008-12-05 02:20:14 +01:00
NBAK_TRACE(("Allocate difference page %d for database page %d",
bdb->bdb_difference_page, bdb->bdb_page));
}
2009-06-26 06:12:20 +02:00
else
{
2008-12-05 02:20:14 +01:00
NBAK_TRACE(("Map existing difference page %d to database page %d",
bdb->bdb_difference_page, bdb->bdb_page));
}
break;
case nbak_state_merge:
{ //scope
BackupManager::AllocReadGuard allocGuard(tdbb, bm);
bdb->bdb_difference_page = bm->getPageIndex(tdbb, bdb->bdb_page.getPageNum());
}
2009-06-26 06:12:20 +02:00
if (bdb->bdb_difference_page)
{
2008-12-05 02:20:14 +01:00
NBAK_TRACE(("Map existing difference page %d to database page %d (write_both)",
bdb->bdb_difference_page, bdb->bdb_page));
}
break;
}
}
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
2009-08-23 13:43:25 +02:00
void CCH_release(thread_db* tdbb, WIN* window, const bool release_tail)
{
2007-02-06 09:03:43 +01:00
/**************************************
*
* C C H _ r e l e a s e
*
**************************************
*
* Functional description
* Release a window. If the release_tail
* flag is true then make the buffer
* least-recently-used.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2009-06-06 11:05:20 +02:00
BufferDesc* const bdb = window->win_bdb;
2007-02-06 09:03:43 +01:00
BLKCHK(bdb, type_bdb);
2003-09-13 20:35:39 +02:00
CCH_TRACE(("R %d:%06d", window->win_page.getPageSpaceID(), window->win_page.getPageNum()));
2009-08-23 13:43:25 +02:00
// A large sequential scan has requested that the garbage
// collector garbage collect. Mark the buffer so that the
// page isn't released to the LRU tail before the garbage
// collector can process the page.
2007-02-06 09:03:43 +01:00
2008-12-18 11:47:25 +01:00
if (window->win_flags & WIN_large_scan && window->win_flags & WIN_garbage_collect)
2007-02-06 09:03:43 +01:00
{
bdb->bdb_flags |= BDB_garbage_collect;
window->win_flags &= ~WIN_garbage_collect;
2006-05-22 00:07:35 +02:00
}
2007-02-06 09:03:43 +01:00
tdbb->getAttachment()->backupStateReadUnLock(tdbb);
2007-02-06 09:03:43 +01:00
if (bdb->bdb_use_count == 1)
2001-05-23 15:26:42 +02:00
{
2008-03-29 14:01:49 +01:00
const bool marked = bdb->bdb_flags & BDB_marked;
2008-12-05 02:20:14 +01:00
bdb->bdb_flags &= ~(BDB_writer | BDB_marked | BDB_faked);
2008-12-05 02:20:14 +01:00
if (marked)
{
release_bdb(tdbb, bdb, false, false, true);
2001-05-23 15:26:42 +02:00
}
2001-05-23 15:26:42 +02:00
if (bdb->bdb_flags & BDB_must_write)
{
2009-08-23 13:43:25 +02:00
// Downgrade exclusive latch to shared to allow concurrent share access
// to page during I/O.
2001-05-23 15:26:42 +02:00
release_bdb(tdbb, bdb, false, true, false);
2008-12-18 11:47:25 +01:00
if (!write_buffer(tdbb, bdb, bdb->bdb_page, false, tdbb->tdbb_status_vector, true))
2001-05-23 15:26:42 +02:00
{
insertDirty(dbb->dbb_bcb, bdb);
CCH_unwind(tdbb, true);
2001-05-23 15:26:42 +02:00
}
}
2001-05-23 15:26:42 +02:00
if (bdb->bdb_flags & BDB_no_blocking_ast)
{
if (bdb->bdb_flags & (BDB_db_dirty | BDB_dirty))
{
2008-12-18 11:47:25 +01:00
if (!write_buffer(tdbb, bdb, bdb->bdb_page, false, tdbb->tdbb_status_vector, true))
2001-05-23 15:26:42 +02:00
{
// Reassert blocking AST after write failure with dummy lock convert
// to same level. This will re-enable blocking AST notification.
2001-05-23 15:26:42 +02:00
LCK_convert_opt(tdbb, bdb->bdb_lock,
bdb->bdb_lock->lck_logical);
CCH_unwind(tdbb, true);
2001-05-23 15:26:42 +02:00
}
}
PAGE_LOCK_RELEASE(bdb->bdb_lock);
bdb->bdb_flags &= ~BDB_no_blocking_ast;
bdb->bdb_ast_flags &= ~BDB_blocking;
}
// Make buffer the least-recently-used by queueing it to the LRU tail
2001-05-23 15:26:42 +02:00
if (release_tail)
{
2008-12-18 11:47:25 +01:00
if ((window->win_flags & WIN_large_scan && bdb->bdb_scan_count > 0 &&
!(--bdb->bdb_scan_count) && !(bdb->bdb_flags & BDB_garbage_collect)) ||
(window->win_flags & WIN_garbage_collector && bdb->bdb_flags & BDB_garbage_collect &&
!bdb->bdb_scan_count))
2001-05-23 15:26:42 +02:00
{
if (window->win_flags & WIN_garbage_collector)
{
bdb->bdb_flags &= ~BDB_garbage_collect;
}
BufferControl* bcb = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
QUE_LEAST_RECENTLY_USED(bdb->bdb_in_use);
#ifdef CACHE_WRITER
if (bdb->bdb_flags & (BDB_dirty | BDB_db_dirty))
{
2008-12-05 02:20:14 +01:00
if (bdb->bdb_dirty.que_forward != &bdb->bdb_dirty)
{
QUE_DELETE(bdb->bdb_dirty);
QUE_APPEND(bcb->bcb_dirty, bdb->bdb_dirty);
}
2001-05-23 15:26:42 +02:00
bcb->bcb_flags |= BCB_free_pending;
2008-12-18 11:47:25 +01:00
if (bcb->bcb_flags & BCB_cache_writer && !(bcb->bcb_flags & BCB_writer_active))
2001-05-23 15:26:42 +02:00
{
dbb->dbb_writer_sem.release();
2001-05-23 15:26:42 +02:00
}
}
#endif
}
}
}
release_bdb(tdbb, bdb, false, false, false);
const SSHORT use_count = bdb->bdb_use_count;
2001-05-23 15:26:42 +02:00
if (use_count < 0) {
2009-08-23 13:43:25 +02:00
BUGCHECK(209); // msg 209 attempt to release page not acquired
}
2001-05-23 15:26:42 +02:00
if (!use_count && (bdb->bdb_ast_flags & BDB_blocking))
2003-08-13 13:11:12 +02:00
{
2001-05-23 15:26:42 +02:00
PAGE_LOCK_RE_POST(bdb->bdb_lock);
2003-08-13 13:11:12 +02:00
}
2001-05-23 15:26:42 +02:00
window->win_bdb = NULL;
fb_assert(bdb->bdb_use_count ? true : !(bdb->bdb_flags & BDB_marked))
2001-05-23 15:26:42 +02:00
}
void CCH_release_exclusive(thread_db* tdbb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ r e l e a s e _ e x c l u s i v e
*
**************************************
*
* Functional description
* Release exclusive access to database.
*
**************************************/
2008-12-05 02:20:14 +01:00
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
dbb->dbb_flags &= ~DBB_exclusive;
Jrd::Attachment* attachment = tdbb->getAttachment();
if (attachment) {
2001-05-23 15:26:42 +02:00
attachment->att_flags &= ~ATT_exclusive;
}
2001-05-23 15:26:42 +02:00
if (dbb->dbb_ast_flags & DBB_blocking) {
LCK_re_post(tdbb, dbb->dbb_lock);
}
2001-05-23 15:26:42 +02:00
}
bool CCH_rollover_to_shadow(thread_db* tdbb, Database* dbb, jrd_file* file, const bool inAst)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ r o l l o v e r _ t o _ s h a d o w
*
**************************************
*
* Functional description
* An I/O error has been detected on the
2001-05-23 15:26:42 +02:00
* main database file. Roll over to use
* the shadow file.
*
**************************************/
SET_TDBB(tdbb);
// Is the shadow subsystem yet initialized
if (!dbb->dbb_shadow_lock) {
2003-12-22 11:00:59 +01:00
return false;
}
// hvlad: if there are no shadows can't rollover
// this is a temporary solution to prevent 100% CPU load
// in write_page in case of PIO_write failure
if (!dbb->dbb_shadow) {
return false;
}
// notify other process immediately to ensure all read from sdw
// file instead of db file
return SDW_rollover_to_shadow(tdbb, file, inAst);
2001-05-23 15:26:42 +02:00
}
2004-03-07 08:58:55 +01:00
void CCH_shutdown_database(Database* dbb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ s h u t d o w n _ d a t a b a s e
*
**************************************
*
* Functional description
* Shutdown database physical page locks.
*
**************************************/
thread_db* tdbb = JRD_get_thread_data();
2001-05-23 15:26:42 +02:00
bcb_repeat* tail;
BufferControl* bcb = dbb->dbb_bcb;
if (bcb && (tail = bcb->bcb_rpt) && (tail->bcb_bdb))
{
2008-12-18 11:47:25 +01:00
for (const bcb_repeat* const end = tail + bcb->bcb_count; tail < end; tail++)
{
BufferDesc* bdb = tail->bcb_bdb;
bdb->bdb_flags &= ~BDB_db_dirty;
clear_dirty_flag(tdbb, bdb);
2001-05-23 15:26:42 +02:00
PAGE_LOCK_RELEASE(bdb->bdb_lock);
}
}
2001-05-23 15:26:42 +02:00
#ifndef SUPERSERVER
2006-05-22 00:07:35 +02:00
PageSpace* pageSpaceID = dbb->dbb_page_manager.findPageSpace(DB_PAGE_SPACE);
PIO_close(pageSpaceID->file);
2001-05-23 15:26:42 +02:00
SDW_close();
#endif
}
2008-03-29 14:01:49 +01:00
void CCH_unwind(thread_db* tdbb, const bool punt)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ u n w i n d
*
**************************************
*
* Functional description
* Synchronously unwind cache after I/O or lock error.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// CCH_unwind is called when any of the following occurs:
// - IO error
// - journaling error => obsolete
// - bad page checksum => obsolete
// - wrong page type
// - page locking (not latching) deadlock
2001-05-23 15:26:42 +02:00
BufferControl* bcb = dbb->dbb_bcb;
if (!bcb || (tdbb->tdbb_flags & TDBB_no_cache_unwind))
{
2001-12-24 03:51:06 +01:00
if (punt) {
2001-05-23 15:26:42 +02:00
ERR_punt();
}
else {
2001-05-23 15:26:42 +02:00
return;
2001-12-24 03:51:06 +01:00
}
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// A cache error has occurred. Scan the cache for buffers
// which may be in use and release them.
2001-05-23 15:26:42 +02:00
bcb_repeat* tail = bcb->bcb_rpt;
for (const bcb_repeat* const end = tail + bcb->bcb_count; tail < end; tail++)
2001-12-24 03:51:06 +01:00
{
BufferDesc* bdb = tail->bcb_bdb;
2001-12-24 03:51:06 +01:00
if (!bdb->bdb_use_count) {
2001-05-23 15:26:42 +02:00
continue;
2001-12-24 03:51:06 +01:00
}
if (bdb->bdb_io == tdbb) {
release_bdb(tdbb, bdb, true, false, false);
2001-12-24 03:51:06 +01:00
}
2009-06-26 06:12:20 +02:00
if (bdb->bdb_exclusive == tdbb)
{
2006-01-05 11:10:37 +01:00
if (bdb->bdb_flags & BDB_marked) {
2009-08-23 13:43:25 +02:00
BUGCHECK(268); // msg 268 buffer marked during cache unwind
}
2001-05-23 15:26:42 +02:00
bdb->bdb_flags &= ~(BDB_writer | BDB_faked | BDB_must_write);
release_bdb(tdbb, bdb, true, false, false);
2001-05-23 15:26:42 +02:00
}
2008-12-05 02:20:14 +01:00
// hvlad : as far as I understand thread can't hold more than two shared latches
// on the same bdb, so findSharedLatch below will not be called many times
2008-06-07 00:40:15 +02:00
SharedLatch* latch = findSharedLatch(tdbb, bdb);
while (latch)
{
release_bdb(tdbb, bdb, true, false, false);
latch = findSharedLatch(tdbb, bdb);
2001-12-24 03:51:06 +01:00
}
#ifndef SUPERSERVER
const pag* const page = bdb->bdb_buffer;
if (page->pag_type == pag_header || page->pag_type == pag_transactions)
{
++bdb->bdb_use_count;
clear_dirty_flag(tdbb, bdb);
bdb->bdb_flags &= ~(BDB_writer | BDB_marked | BDB_faked | BDB_db_dirty);
PAGE_LOCK_RELEASE(bdb->bdb_lock);
--bdb->bdb_use_count;
}
2001-05-23 15:26:42 +02:00
#endif
}
if (punt) {
2001-05-23 15:26:42 +02:00
ERR_punt();
}
2001-05-23 15:26:42 +02:00
}
2008-12-18 11:47:25 +01:00
bool CCH_validate(WIN* window)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ v a l i d a t e
*
**************************************
*
* Functional description
* Give a page a quick once over looking for unhealthyness.
*
**************************************/
BufferDesc* bdb = window->win_bdb;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If page is marked for write, checksum is questionable
2001-05-23 15:26:42 +02:00
if ((bdb->bdb_flags & (BDB_dirty | BDB_db_dirty))) {
return true;
}
2001-05-23 15:26:42 +02:00
return (bdb->bdb_buffer->pag_pageno == bdb->bdb_page.getPageNum());
2001-05-23 15:26:42 +02:00
}
2008-12-18 11:47:25 +01:00
bool CCH_write_all_shadows(thread_db* tdbb, Shadow* shadow, BufferDesc* bdb,
2009-12-14 12:33:13 +01:00
ISC_STATUS* status, const bool inAst)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* C C H _ w r i t e _ a l l _ s h a d o w s
*
**************************************
*
* Functional description
* Compute a checksum and write a page out to all shadows
* detecting failure on write.
* If shadow is null, write to all shadows, otherwise only to specified
* shadow.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
Shadow* sdw = shadow ? shadow : dbb->dbb_shadow;
2001-05-23 15:26:42 +02:00
2001-12-24 03:51:06 +01:00
if (!sdw) {
2003-12-22 11:00:59 +01:00
return true;
2001-12-24 03:51:06 +01:00
}
2003-12-22 11:00:59 +01:00
bool result = true;
2008-03-19 12:46:47 +01:00
Firebird::UCharBuffer spare_buffer;
2001-05-23 15:26:42 +02:00
pag* page;
2008-03-19 12:46:47 +01:00
pag* old_buffer = NULL;
if (bdb->bdb_page == HEADER_PAGE_NUMBER)
{
2008-03-19 12:46:47 +01:00
page = (pag*) spare_buffer.getBuffer(dbb->dbb_page_size);
2008-02-03 11:41:44 +01:00
memcpy(page, bdb->bdb_buffer, HDR_SIZE);
2001-05-23 15:26:42 +02:00
old_buffer = bdb->bdb_buffer;
bdb->bdb_buffer = page;
}
bdb->bdb_buffer->pag_pageno = bdb->bdb_page.getPageNum();
2001-05-23 15:26:42 +02:00
for (; sdw; sdw = sdw->sdw_next)
{
2009-08-23 13:43:25 +02:00
// don't bother to write to the shadow if it is no longer viable
2001-05-23 15:26:42 +02:00
/* Fix for bug 7925. drop_gdb fails to remove secondary file if
the shadow is conditional. Reason being the header page not
being correctly initialized.
2001-05-23 15:26:42 +02:00
The following block was not being performed for a conditional
shadow since SDW_INVALID expanded to include conditional shadow
-Sudesh 07/10/95
2001-05-23 15:26:42 +02:00
old code --> if (sdw->sdw_flags & SDW_INVALID)
*/
2008-06-05 13:02:42 +02:00
if ((sdw->sdw_flags & SDW_INVALID) && !(sdw->sdw_flags & SDW_conditional))
{
continue;
}
2001-05-23 15:26:42 +02:00
if (bdb->bdb_page == HEADER_PAGE_NUMBER)
{
2009-08-23 13:43:25 +02:00
// fixup header for shadow file
jrd_file* shadow_file = sdw->sdw_file;
header_page* header = (header_page*) page;
2006-05-22 00:07:35 +02:00
PageSpace* pageSpaceID = dbb->dbb_page_manager.findPageSpace(DB_PAGE_SPACE);
const UCHAR* q = (UCHAR *) pageSpaceID->file->fil_string;
2001-05-23 15:26:42 +02:00
header->hdr_data[0] = HDR_end;
header->hdr_end = HDR_SIZE;
header->hdr_next_page = 0;
PAG_add_header_entry(tdbb, header, HDR_root_file_name,
2008-12-20 20:57:43 +01:00
(USHORT) strlen((const char*) q), q);
2001-05-23 15:26:42 +02:00
jrd_file* next_file = shadow_file->fil_next;
if (next_file)
{
2001-05-23 15:26:42 +02:00
q = (UCHAR *) next_file->fil_string;
const SLONG last = next_file->fil_min_page - 1;
PAG_add_header_entry(tdbb, header, HDR_file, (USHORT) strlen((const char*) q), q);
2008-12-18 11:47:25 +01:00
PAG_add_header_entry(tdbb, header, HDR_last_page, sizeof(last), (const UCHAR*) &last);
2001-05-23 15:26:42 +02:00
}
header->hdr_flags |= hdr_active_shadow;
header->hdr_header.pag_pageno = bdb->bdb_page.getPageNum();
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// This condition makes sure that PIO_write is performed in case of
// conditional shadow only if the page is Header page
//
// -Sudesh 07/10/95
2001-05-23 15:26:42 +02:00
2008-12-20 20:57:43 +01:00
if ((sdw->sdw_flags & SDW_conditional) && bdb->bdb_page != HEADER_PAGE_NUMBER)
{
continue;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// if a write failure happens on an AUTO shadow, mark the
// shadow to be deleted at the next available opportunity when we
// know we don't have a page fetched
2001-05-23 15:26:42 +02:00
if (!PIO_write(sdw->sdw_file, bdb, page, status))
{
if (sdw->sdw_flags & SDW_manual) {
2003-12-22 11:00:59 +01:00
result = false;
}
else
{
2001-05-23 15:26:42 +02:00
sdw->sdw_flags |= SDW_delete;
2009-06-26 06:12:20 +02:00
if (!inAst && SDW_check_conditional(tdbb))
{
if (SDW_lck_update(tdbb, 0))
{
SDW_notify(tdbb);
CCH_unwind(tdbb, false);
SDW_dump_pages(tdbb);
ERR_post(Arg::Gds(isc_deadlock));
2001-05-23 15:26:42 +02:00
}
}
}
}
2009-08-23 13:43:25 +02:00
// If shadow was specified, break out of loop
2001-05-23 15:26:42 +02:00
if (shadow) {
2001-05-23 15:26:42 +02:00
break;
}
2001-05-23 15:26:42 +02:00
}
2006-05-22 00:07:35 +02:00
if (bdb->bdb_page == HEADER_PAGE_NUMBER) {
2001-05-23 15:26:42 +02:00
bdb->bdb_buffer = old_buffer;
}
2001-05-23 15:26:42 +02:00
return result;
}
static BufferDesc* alloc_bdb(thread_db* tdbb, BufferControl* bcb, UCHAR** memory)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* a l l o c _ b d b
*
**************************************
*
* Functional description
* Allocate buffer descriptor block.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
BufferDesc* bdb = FB_NEW(*dbb->dbb_bufferpool) BufferDesc;
bdb->bdb_dbb = dbb;
2001-05-23 15:26:42 +02:00
#ifndef SUPERSERVER
2001-12-24 03:51:06 +01:00
try {
bdb->bdb_lock = alloc_page_lock(tdbb, bdb);
2001-12-24 03:51:06 +01:00
}
2009-06-26 06:12:20 +02:00
catch (const Firebird::Exception&)
{
delete bdb;
2001-12-24 03:51:06 +01:00
throw;
2001-05-23 15:26:42 +02:00
}
#endif
bdb->bdb_buffer = (pag*) *memory;
2001-05-23 15:26:42 +02:00
*memory += dbb->dbb_page_size;
QUE_INIT(bdb->bdb_higher);
QUE_INIT(bdb->bdb_lower);
QUE_INIT(bdb->bdb_waiters);
QUE_INIT(bdb->bdb_shared);
QUE_INSERT(bcb->bcb_empty, bdb->bdb_que);
QUE_INIT(bdb->bdb_dirty);
2001-05-23 15:26:42 +02:00
return bdb;
2001-05-23 15:26:42 +02:00
}
#ifndef SUPERSERVER
static Lock* alloc_page_lock(thread_db* tdbb, BufferDesc* bdb)
{
/**************************************
*
* a l l o c _ p a g e _ l o c k
*
**************************************
*
* Functional description
* Allocate a page-type lock.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
const SSHORT lockLen = PageNumber::getLockLen();
Lock* lock = FB_NEW_RPT(*dbb->dbb_bufferpool, lockLen) Lock;
lock->lck_type = LCK_bdb;
lock->lck_owner_handle = LCK_get_owner_handle(tdbb, lock->lck_type);
lock->lck_length = lockLen;
lock->lck_dbb = dbb;
lock->lck_parent = dbb->dbb_lock;
lock->lck_ast = blocking_ast_bdb;
lock->lck_object = bdb;
return lock;
}
static int blocking_ast_bdb(void* ast_object)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* b l o c k i n g _ a s t _ b d b
*
**************************************
*
* Functional description
* Blocking AST for buffer control blocks. This is called at
* AST (signal) level to indicate that a lock is blocking another
* process. If the BufferDesc* is in use, set a flag indicating that the
* lock is blocking and return. When the BufferDesc is released at normal
* level the lock will be down graded. If the BufferDesc* is not in use,
2001-05-23 15:26:42 +02:00
* write the page if dirty then downgrade lock. Things would be
* much hairier if UNIX supported asynchronous IO, but it doesn't.
* WHEW!
*
**************************************/
BufferDesc* bdb = static_cast<BufferDesc*>(ast_object);
2001-05-23 15:26:42 +02:00
try
{
Database* dbb = bdb->bdb_dbb;
2001-05-23 15:26:42 +02:00
Database::SyncGuard dsGuard(dbb, true);
2001-05-23 15:26:42 +02:00
// Since this routine will be called asynchronously,
// we must establish a thread context
ThreadContextHolder tdbb;
tdbb->setDatabase(dbb);
2001-05-23 15:26:42 +02:00
// Do some fancy footwork to make sure that pages are
// not removed from the btc tree at AST level. Then
// restore the flag to whatever it was before.
2001-05-23 15:26:42 +02:00
const bool keep_pages = (dbb->dbb_bcb->bcb_flags & BCB_keep_pages) != 0;
dbb->dbb_bcb->bcb_flags |= BCB_keep_pages;
2001-05-23 15:26:42 +02:00
down_grade(tdbb, bdb);
2001-05-23 15:26:42 +02:00
if (!keep_pages) {
dbb->dbb_bcb->bcb_flags &= ~BCB_keep_pages;
}
2001-05-23 15:26:42 +02:00
if (tdbb->tdbb_status_vector[1]) {
gds__log_status(dbb->dbb_filename.c_str(), tdbb->tdbb_status_vector);
}
}
catch (const Firebird::Exception&)
{} // no-op
2001-05-23 15:26:42 +02:00
return 0;
2001-05-23 15:26:42 +02:00
}
#endif
// Used in qsort below
extern "C" {
2007-05-20 05:25:52 +02:00
static int cmpBdbs(const void* a, const void* b)
{
const BufferDesc* bdbA = *(BufferDesc**) a;
const BufferDesc* bdbB = *(BufferDesc**) b;
2007-05-20 05:25:52 +02:00
if (bdbA->bdb_page > bdbB->bdb_page)
return 1;
2007-05-18 08:15:26 +02:00
if (bdbA->bdb_page < bdbB->bdb_page)
return -1;
2007-05-18 08:15:26 +02:00
return 0;
}
2009-08-23 13:43:25 +02:00
} // extern C
2008-12-05 02:20:14 +01:00
// Remove cleared precedence blocks from high precedence queue
static void purgePrecedence(BufferControl* bcb, BufferDesc* bdb)
{
QUE que_prec = bdb->bdb_higher.que_forward, next_prec;
for (; que_prec != &bdb->bdb_higher; que_prec = next_prec)
{
next_prec = que_prec->que_forward;
Precedence* precedence = BLOCK(que_prec, Precedence*, pre_higher);
2008-12-05 02:20:14 +01:00
if (precedence->pre_flags & PRE_cleared)
{
QUE_DELETE(precedence->pre_higher);
QUE_DELETE(precedence->pre_lower);
precedence->pre_hi = (BufferDesc*) bcb->bcb_free;
bcb->bcb_free = precedence;
}
}
}
// Write pages modified by given or system transaction to disk. First sort all
2008-12-05 02:20:14 +01:00
// corresponding pages by their numbers to make writes physically ordered and
// thus faster. At every iteration of while loop write pages which have no high
2008-12-05 02:20:14 +01:00
// precedence pages to ensure order preserved. If after some iteration there are
// no such pages (i.e. all of not written yet pages have high precedence pages)
// then write them all at last iteration (of course write_buffer will also check
// for precedence before write)
2008-12-18 11:47:25 +01:00
static void flushDirty(thread_db* tdbb, SLONG transaction_mask, const bool sys_only,
ISC_STATUS* status)
{
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
Firebird::HalfStaticArray<BufferDesc*, 1024> flush;
QUE que_inst = bcb->bcb_dirty.que_forward, next;
for (; que_inst != &bcb->bcb_dirty; que_inst = next)
{
next = que_inst->que_forward;
BufferDesc* bdb = BLOCK(que_inst, BufferDesc*, bdb_dirty);
2009-06-26 06:12:20 +02:00
if (!(bdb->bdb_flags & BDB_dirty))
{
removeDirty(bcb, bdb);
continue;
}
2008-12-18 11:47:25 +01:00
if ((transaction_mask & bdb->bdb_transactions) || (bdb->bdb_flags & BDB_system_dirty) ||
(!transaction_mask && !sys_only) || (!bdb->bdb_transactions))
{
flush.add(bdb);
}
}
2008-12-05 02:20:14 +01:00
qsort(flush.begin(), flush.getCount(), sizeof(BufferDesc*), cmpBdbs);
2007-05-20 05:25:52 +02:00
bool writeAll = false;
while (flush.getCount())
{
BufferDesc** ptr = flush.begin();
const size_t cnt = flush.getCount();
while (ptr < flush.end())
{
BufferDesc* bdb = *ptr;
if (!writeAll) {
purgePrecedence(bcb, bdb);
}
if (writeAll || QUE_EMPTY(bdb->bdb_higher))
{
const PageNumber page = bdb->bdb_page;
if (!write_buffer(tdbb, bdb, page, false, status, true)) {
CCH_unwind(tdbb, true);
}
// re-post the lock only if it was really written
if ((bdb->bdb_ast_flags & BDB_blocking) && !(bdb->bdb_flags & BDB_dirty))
{
PAGE_LOCK_RE_POST(bdb->bdb_lock);
}
flush.remove(ptr);
}
else
ptr++;
}
if (cnt == flush.getCount())
writeAll = true;
}
}
// Write pages modified by garbage collector or all dirty pages or release page
// locks - depending of flush_flag. See also comments in flushDirty
static void flushAll(thread_db* tdbb, USHORT flush_flag)
{
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
ISC_STATUS* status = tdbb->tdbb_status_vector;
Firebird::HalfStaticArray<BufferDesc*, 1024> flush(bcb->bcb_dirty_count);
#ifdef SUPERSERVER
const bool all_flag = (flush_flag & FLUSH_ALL) != 0;
const bool sweep_flag = (flush_flag & FLUSH_SWEEP) != 0;
#endif
const bool release_flag = (flush_flag & FLUSH_RLSE) != 0;
const bool write_thru = release_flag;
const LATCH latch = release_flag ? LATCH_exclusive : LATCH_none;
for (ULONG i = 0; (bcb = dbb->dbb_bcb) && i < bcb->bcb_count; i++)
{
BufferDesc* bdb = bcb->bcb_rpt[i].bcb_bdb;
#ifdef SUPERSERVER
if (bdb->bdb_flags & BDB_db_dirty)
{
// pages modified by sweep\garbage collector are not in dirty list
const bool dirty_list = (bdb->bdb_dirty.que_forward != &bdb->bdb_dirty);
if (all_flag || (sweep_flag && !dirty_list)) {
flush.add(bdb);
}
}
#else
if (bdb->bdb_flags & BDB_dirty) {
flush.add(bdb);
}
#endif
else if (release_flag)
{
if (latch_bdb(tdbb, latch, bdb, bdb->bdb_page, 1) == -1) {
BUGCHECK(302); // msg 302 unexpected page change
}
if (bdb->bdb_use_count > 1) {
BUGCHECK(210); // msg 210 page in use during flush
}
PAGE_LOCK_RELEASE(bdb->bdb_lock);
release_bdb(tdbb, bdb, false, false, false);
}
}
qsort(flush.begin(), flush.getCount(), sizeof(BufferDesc*), cmpBdbs);
bool writeAll = false;
while (flush.getCount())
{
BufferDesc** ptr = flush.begin();
const size_t cnt = flush.getCount();
while (ptr < flush.end())
{
BufferDesc* bdb = *ptr;
if (!writeAll) {
purgePrecedence(bcb, bdb);
}
if (writeAll || QUE_EMPTY(bdb->bdb_higher))
{
if (release_flag)
{
if (latch_bdb(tdbb, latch, bdb, bdb->bdb_page, 1) == -1) {
BUGCHECK(302); // msg 302 unexpected page change
}
if (bdb->bdb_use_count > 1) {
BUGCHECK(210); // msg 210 page in use during flush
}
}
if (bdb->bdb_flags & (BDB_db_dirty | BDB_dirty))
{
if (!write_buffer(tdbb, bdb, bdb->bdb_page, write_thru, status, true))
{
CCH_unwind(tdbb, true);
}
}
if (release_flag)
{
PAGE_LOCK_RELEASE(bdb->bdb_lock);
release_bdb(tdbb, bdb, false, false, false);
}
flush.remove(ptr);
}
else
ptr++;
}
if (cnt == flush.getCount())
writeAll = true;
2001-05-23 15:26:42 +02:00
}
}
#ifdef CACHE_READER
static THREAD_ENTRY_DECLARE cache_reader(THREAD_ENTRY_PARAM arg)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* c a c h e _ r e a d e r
*
**************************************
*
* Functional description
* Prefetch pages into cache for sequential scans.
* Use asynchronous I/O to keep two prefetch requests
* busy at a time.
*
**************************************/
2008-01-29 02:36:41 +01:00
Database* dbb = (Database*) arg;
Database::SyncGuard dsGuard(dbb);
2001-05-23 15:26:42 +02:00
2008-01-16 09:31:31 +01:00
ISC_STATUS_ARRAY status_vector;
2009-08-23 13:43:25 +02:00
// Establish a thread context.
2008-01-16 09:31:31 +01:00
ThreadContextHolder tdbb(status_vector);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Dummy attachment needed for lock owner identification.
tdbb->setDatabase(dbb);
Jrd::Attachment* const attachment = Attachment::create(dbb);
tdbb->setAttachment(attachment);
attachment->att_filename = dbb->dbb_filename;
2008-01-16 09:31:31 +01:00
Jrd::ContextPoolHolder context(tdbb, dbb->dbb_bufferpool);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// This try block is specifically to protect the LCK_init call: if
// LCK_init fails we won't be able to accomplish anything anyway, so
// return, unlike the other try blocks further down the page.
2008-12-05 02:20:14 +01:00
BufferControl* bcb = 0;
2001-05-23 15:26:42 +02:00
2001-12-24 03:51:06 +01:00
try {
2001-05-23 15:26:42 +02:00
2001-12-24 03:51:06 +01:00
LCK_init(tdbb, LCK_OWNER_attachment);
2001-05-23 15:26:42 +02:00
bcb = dbb->dbb_bcb;
2001-12-24 03:51:06 +01:00
bcb->bcb_flags |= BCB_cache_reader;
2009-08-23 13:43:25 +02:00
dbb->dbb_reader_init.post(); // Notify our creator that we have started
2001-12-24 03:51:06 +01:00
}
2009-06-26 06:12:20 +02:00
catch (const Firebird::Exception& ex)
{
Firebird::stuff_exception(status_vector, ex);
2001-05-23 15:26:42 +02:00
gds__log_status(dbb->dbb_file->fil_string, status_vector);
return -1;
2001-05-23 15:26:42 +02:00
}
2001-12-24 03:51:06 +01:00
try {
2009-08-23 13:43:25 +02:00
// Set up dual prefetch control blocks to keep multiple prefetch
// requests active at a time. Also helps to prevent the cache reader
// from becoming dedicated or locked into a single request's prefetch demands.
prf prefetch1, prefetch2;
2001-05-23 15:26:42 +02:00
prefetch_init(&prefetch1, tdbb);
prefetch_init(&prefetch2, tdbb);
while (bcb->bcb_flags & BCB_cache_reader)
{
2001-05-23 15:26:42 +02:00
bcb->bcb_flags |= BCB_reader_active;
bool found = false;
SLONG starting_page = -1;
prf* next_prefetch = &prefetch1;
2001-05-23 15:26:42 +02:00
if (dbb->dbb_flags & DBB_suspend_bgio)
{
Database::Checkout dcoHolder(dbb);
dbb->dbb_reader_sem.tryEnter(10);
2001-05-23 15:26:42 +02:00
continue;
}
2009-08-23 13:43:25 +02:00
// Make a pass thru the global prefetch bitmap looking for something
// to read. When the entire bitmap has been scanned and found to be
// empty then wait for new requests.
2001-05-23 15:26:42 +02:00
do {
if (!(prefetch1.prf_flags & PRF_active) &&
2008-12-05 02:20:14 +01:00
SBM_next(bcb->bcb_prefetch, &starting_page, RSE_get_forward))
2003-12-31 06:36:12 +01:00
{
found = true;
2001-05-23 15:26:42 +02:00
prefetch_prologue(&prefetch1, &starting_page);
prefetch_io(&prefetch1, status_vector);
}
if (!(prefetch2.prf_flags & PRF_active) &&
2008-12-05 02:20:14 +01:00
SBM_next(bcb->bcb_prefetch, &starting_page, RSE_get_forward))
2003-12-31 06:36:12 +01:00
{
found = true;
2001-05-23 15:26:42 +02:00
prefetch_prologue(&prefetch2, &starting_page);
prefetch_io(&prefetch2, status_vector);
}
prf* post_prefetch = next_prefetch;
2008-12-18 11:47:25 +01:00
next_prefetch = (post_prefetch == &prefetch1) ? &prefetch2 : &prefetch1;
if (post_prefetch->prf_flags & PRF_active) {
2001-05-23 15:26:42 +02:00
prefetch_epilogue(post_prefetch, status_vector);
}
2001-05-23 15:26:42 +02:00
if (found)
{
2009-08-23 13:43:25 +02:00
// If the cache writer or garbage collector is idle, put
// them to work prefetching pages.
2001-05-23 15:26:42 +02:00
#ifdef CACHE_WRITER
2008-12-20 20:57:43 +01:00
if ((bcb->bcb_flags & BCB_cache_writer) && !(bcb->bcb_flags & BCB_writer_active))
2003-12-31 06:36:12 +01:00
{
dbb_writer_sem.release();
2003-12-31 06:36:12 +01:00
}
2001-05-23 15:26:42 +02:00
#endif
#ifdef GARBAGE_THREAD
2008-12-20 20:57:43 +01:00
if ((dbb->dbb_flags & DBB_garbage_collector) && !(dbb->dbb_flags & DBB_gc_active))
2003-12-31 06:36:12 +01:00
{
dbb->dbb_gc_sem.release();
2003-12-31 06:36:12 +01:00
}
2001-05-23 15:26:42 +02:00
#endif
}
2008-12-18 11:47:25 +01:00
} while (prefetch1.prf_flags & PRF_active || prefetch2.prf_flags & PRF_active);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If there's more work to do voluntarily ask to be rescheduled.
// Otherwise, wait for event notification.
BufferDesc* bdb;
if (found) {
2003-12-22 11:00:59 +01:00
JRD_reschedule(tdbb, 0, true);
}
2001-05-23 15:26:42 +02:00
else if (bcb->bcb_flags & BCB_free_pending &&
2008-12-18 11:47:25 +01:00
(bdb = get_buffer(tdbb, FREE_PAGE, LATCH_none, 1)))
2003-12-22 11:00:59 +01:00
{
2009-08-23 13:43:25 +02:00
// In our spare time, help writer clean the cache.
2001-05-23 15:26:42 +02:00
2003-12-22 11:00:59 +01:00
write_buffer(tdbb, bdb, bdb->bdb_page, true, status_vector, true);
2001-05-23 15:26:42 +02:00
}
2009-06-26 06:12:20 +02:00
else
{
2001-05-23 15:26:42 +02:00
bcb->bcb_flags &= ~BCB_reader_active;
Database::Checkout dcoHolder(dbb);
dbb->dbb_reader_sem.tryEnter(10);
2001-05-23 15:26:42 +02:00
}
bcb = dbb->dbb_bcb;
}
LCK_fini(tdbb, LCK_OWNER_attachment);
Jrd::Attachment::destroy(attachment); // no need saving warning error strings here
tdbb->setAttachment(NULL);
2001-05-23 15:26:42 +02:00
bcb->bcb_flags &= ~BCB_cache_reader;
dbb->dbb_reader_fini.post();
2001-12-24 03:51:06 +01:00
} // try
2009-06-26 06:12:20 +02:00
catch (const Firebird::Exception& ex)
{
Firebird::stuff_exception(status_vector, ex);
2001-12-24 03:51:06 +01:00
bcb = dbb->dbb_bcb;
gds__log_status(dbb->dbb_file->fil_string, status_vector);
}
return 0;
2001-05-23 15:26:42 +02:00
}
#endif
#ifdef CACHE_WRITER
static THREAD_ENTRY_DECLARE cache_writer(THREAD_ENTRY_PARAM arg)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* c a c h e _ w r i t e r
*
**************************************
*
* Functional description
* Write dirty pages to database to maintain an
* adequate supply of free pages. If WAL is enabled,
* perform database checkpoint when WAL subsystem
* deems it necessary.
*
**************************************/
Database* dbb = (Database*)arg;
Database::SyncGuard dsGuard(dbb);
2001-05-23 15:26:42 +02:00
2008-01-16 09:31:31 +01:00
ISC_STATUS_ARRAY status_vector;
2009-08-23 13:43:25 +02:00
// Establish a thread context.
2008-01-16 09:31:31 +01:00
ThreadContextHolder tdbb(status_vector);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Dummy attachment needed for lock owner identification.
2001-05-23 15:26:42 +02:00
tdbb->setDatabase(dbb);
Jrd::Attachment* const attachment = Jrd::Attachment::create(dbb, 0);
tdbb->setAttachment(attachment);
attachment->att_filename = dbb->dbb_filename;
2008-01-16 09:31:31 +01:00
Jrd::ContextPoolHolder context(tdbb, dbb->dbb_bufferpool);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// This try block is specifically to protect the LCK_init call: if
// LCK_init fails we won't be able to accomplish anything anyway, so
// return, unlike the other try blocks further down the page.
Semaphore& writer_sem = dbb->dbb_writer_sem;
2007-01-18 16:50:18 +01:00
BufferControl* bcb = dbb->dbb_bcb;
2001-12-24 03:51:06 +01:00
try {
LCK_init(tdbb, LCK_OWNER_attachment);
2001-12-24 03:51:06 +01:00
bcb->bcb_flags |= BCB_cache_writer;
2007-01-18 16:50:18 +01:00
bcb->bcb_flags &= ~BCB_writer_start;
2009-08-23 13:43:25 +02:00
// Notify our creator that we have started
dbb->dbb_writer_init.release();
2001-12-24 03:51:06 +01:00
}
2009-06-26 06:12:20 +02:00
catch (const Firebird::Exception& ex)
{
Firebird::stuff_exception(status_vector, ex);
2006-05-22 00:07:35 +02:00
gds__log_status(dbb->dbb_filename.c_str(), status_vector);
2007-01-18 16:50:18 +01:00
bcb->bcb_flags &= ~(BCB_cache_writer | BCB_writer_start);
return (THREAD_ENTRY_RETURN)(-1);
2001-05-23 15:26:42 +02:00
}
2001-12-24 03:51:06 +01:00
try {
while (bcb->bcb_flags & BCB_cache_writer)
{
bcb->bcb_flags |= BCB_writer_active;
#ifdef CACHE_READER
SLONG starting_page = -1;
#endif
if (dbb->dbb_flags & DBB_suspend_bgio)
{
{ //scope
Database::Checkout dcoHolder(dbb);
writer_sem.tryEnter(10);
}
2007-01-18 16:50:18 +01:00
bcb = dbb->dbb_bcb;
continue;
}
2008-12-05 02:20:14 +01:00
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER_V2
2009-08-23 13:43:25 +02:00
// Flush buffers for lazy commit
SLONG commit_mask;
2008-12-18 11:47:25 +01:00
if (!(dbb->dbb_flags & DBB_force_write) && (commit_mask = dbb->dbb_flush_cycle))
2003-12-22 11:00:59 +01:00
{
dbb->dbb_flush_cycle = 0;
2003-12-22 11:00:59 +01:00
btc_flush(tdbb, commit_mask, false, status_vector);
}
2001-05-23 15:26:42 +02:00
#endif
{ // scope
Database::Checkout dcoHolder(dbb);
THREAD_YIELD();
}
if (bcb->bcb_flags & BCB_free_pending)
{
BufferDesc* bdb = get_buffer(tdbb, FREE_PAGE, LATCH_none, 1);
2009-06-26 06:12:20 +02:00
if (bdb)
{
2003-12-22 11:00:59 +01:00
write_buffer(tdbb, bdb, bdb->bdb_page, true, status_vector, true);
bcb = dbb->dbb_bcb;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If the cache reader or garbage collector is idle, put
// them to work freeing pages.
2001-05-23 15:26:42 +02:00
#ifdef CACHE_READER
2008-12-20 20:57:43 +01:00
if ((bcb->bcb_flags & BCB_cache_reader) && !(bcb->bcb_flags & BCB_reader_active))
{
2008-12-18 11:47:25 +01:00
dbb->dbb_reader_sem.post();
}
2001-05-23 15:26:42 +02:00
#endif
#ifdef GARBAGE_THREAD
2008-12-20 20:57:43 +01:00
if ((dbb->dbb_flags & DBB_garbage_collector) && !(dbb->dbb_flags & DBB_gc_active))
{
2008-12-18 11:47:25 +01:00
dbb->dbb_gc_sem.release();
}
2001-05-23 15:26:42 +02:00
#endif
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If there's more work to do voluntarily ask to be rescheduled.
// Otherwise, wait for event notification.
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if ((bcb->bcb_flags & BCB_free_pending) || bcb->bcb_checkpoint || dbb->dbb_flush_cycle)
{
2003-12-22 11:00:59 +01:00
JRD_reschedule(tdbb, 0, true);
}
2001-05-23 15:26:42 +02:00
#ifdef CACHE_READER
else if (SBM_next(bcb->bcb_prefetch, &starting_page, RSE_get_forward))
{
2009-08-23 13:43:25 +02:00
// Prefetch some pages in our spare time and in the process
// garbage collect the prefetch bitmap.
2003-10-20 12:53:52 +02:00
prf prefetch;
prefetch_init(&prefetch, tdbb);
prefetch_prologue(&prefetch, &starting_page);
prefetch_io(&prefetch, status_vector);
prefetch_epilogue(&prefetch, status_vector);
}
2001-05-23 15:26:42 +02:00
#endif
else
{
bcb->bcb_flags &= ~BCB_writer_active;
Database::Checkout dcoHolder(dbb);
writer_sem.tryEnter(10);
}
bcb = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
}
LCK_fini(tdbb, LCK_OWNER_attachment);
Jrd::Attachment::destroy(attachment); // no need saving warning error strings here
tdbb->setAttachment(NULL);
bcb->bcb_flags &= ~BCB_cache_writer;
2009-08-23 13:43:25 +02:00
// Notify the finalization caller that we're finishing.
dbb->dbb_writer_fini.release();
2001-12-24 03:51:06 +01:00
} // try
2009-06-26 06:12:20 +02:00
catch (const Firebird::Exception& ex)
{
Firebird::stuff_exception(status_vector, ex);
2001-12-24 03:51:06 +01:00
bcb = dbb->dbb_bcb;
2006-05-22 00:07:35 +02:00
gds__log_status(dbb->dbb_filename.c_str(), status_vector);
2001-12-24 03:51:06 +01:00
}
return 0;
2001-05-23 15:26:42 +02:00
}
#endif
2009-08-23 13:43:25 +02:00
static void check_precedence(thread_db* tdbb, WIN* window, PageNumber page)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* c h e c k _ p r e c e d e n c e
*
**************************************
*
* Functional description
* Given a window accessed for write and a page number,
* establish a precedence relationship such that the
* specified page will always be written before the page
* associated with the window.
*
* If the "page number" is negative, it is really a transaction
* id. In this case, the precedence relationship is to the
* database header page from which the transaction id was
* obtained. If the header page has been written since the
* transaction id was assigned, no precedence relationship
* is required.
*
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If this is really a transaction id, sort things out
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if ((page.getPageSpaceID() == DB_PAGE_SPACE) && (page.getPageNum() < 0))
2006-05-22 00:07:35 +02:00
{
if (-page.getPageNum() <= dbb->dbb_last_header_write) {
2001-05-23 15:26:42 +02:00
return;
}
2008-01-16 09:31:31 +01:00
page = PageNumber(DB_PAGE_SPACE, 0);
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Start by finding the buffer containing the high priority page
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_ACQUIRE;
//PRE_MUTEX_ACQUIRE;
BufferControl* bcb = dbb->dbb_bcb;
2006-05-22 00:07:35 +02:00
QUE mod_que = &bcb->bcb_rpt[page.getPageNum() % bcb->bcb_count].bcb_page_mod;
2001-05-23 15:26:42 +02:00
BufferDesc* high = 0;
QUE que_inst;
2009-06-26 06:12:20 +02:00
for (que_inst = mod_que->que_forward; que_inst != mod_que; que_inst = que_inst->que_forward)
{
if ((high = BLOCK(que_inst, BufferDesc*, bdb_que))->bdb_page == page) {
2001-05-23 15:26:42 +02:00
break;
}
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
2009-06-26 06:12:20 +02:00
if (que_inst == mod_que)
{
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return;
}
2009-08-23 13:43:25 +02:00
// Found the higher precedence buffer. If it's not dirty, don't sweat it.
// If it's the same page, ditto.
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if (!(high->bdb_flags & BDB_dirty) || (high->bdb_page == window->win_page))
{
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return;
}
BufferDesc* low = window->win_bdb;
2001-05-23 15:26:42 +02:00
if ((low->bdb_flags & BDB_marked) && !(low->bdb_flags & BDB_faked))
2009-08-23 13:43:25 +02:00
BUGCHECK(212); // msg 212 CCH_precedence: block marked
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If already related, there's nothing more to do. If the precedence
// search was too complex to complete, just write the high page and
// forget about about establishing the relationship.
2001-05-23 15:26:42 +02:00
2008-01-16 09:31:31 +01:00
if (QUE_NOT_EMPTY(high->bdb_lower))
{
const ULONG mark = get_prec_walk_mark(bcb);
const SSHORT relationship = related(low, high, PRE_SEARCH_LIMIT, mark);
if (relationship == PRE_EXISTS)
{
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return;
}
2008-01-16 09:31:31 +01:00
if (relationship == PRE_UNKNOWN)
{
2006-05-22 00:07:35 +02:00
const PageNumber high_page = high->bdb_page;
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2008-12-18 11:47:25 +01:00
if (!write_buffer(tdbb, high, high_page, false, tdbb->tdbb_status_vector, true))
2003-12-22 11:00:59 +01:00
{
CCH_unwind(tdbb, true);
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
return;
}
}
2009-08-23 13:43:25 +02:00
// Check to see if we're going to create a cycle or the precedence search
// was too complex to complete. If so, force a write of the "after"
// (currently fetched) page. Assuming everyone obeys the rules and calls
// precedence before marking the buffer, everything should be ok
2001-05-23 15:26:42 +02:00
if (QUE_NOT_EMPTY(low->bdb_lower))
{
const ULONG mark = get_prec_walk_mark(bcb);
const SSHORT relationship = related(high, low, PRE_SEARCH_LIMIT, mark);
if (relationship == PRE_EXISTS || relationship == PRE_UNKNOWN)
{
2006-05-22 00:07:35 +02:00
const PageNumber low_page = low->bdb_page;
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2008-12-18 11:47:25 +01:00
if (!write_buffer(tdbb, low, low_page, false, tdbb->tdbb_status_vector, true))
2003-12-22 11:00:59 +01:00
{
CCH_unwind(tdbb, true);
2003-12-22 11:00:59 +01:00
}
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
}
}
2009-08-23 13:43:25 +02:00
// We're going to establish a new precedence relationship. Get a block,
// fill in the appropriate fields, and insert it into the various ques
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
bcb = dbb->dbb_bcb; // Re-initialize
2001-05-23 15:26:42 +02:00
Precedence* precedence = bcb->bcb_free;
if (precedence) {
bcb->bcb_free = (Precedence*) precedence->pre_hi;
}
else {
precedence = FB_NEW(*dbb->dbb_bufferpool) Precedence;
}
2001-05-23 15:26:42 +02:00
precedence->pre_low = low;
precedence->pre_hi = high;
precedence->pre_flags = 0;
QUE_INSERT(low->bdb_higher, precedence->pre_higher);
QUE_INSERT(high->bdb_lower, precedence->pre_lower);
// explicitly include high page in system transaction flush process
if (low->bdb_flags & BDB_system_dirty && high->bdb_flags & BDB_dirty)
high->bdb_flags |= BDB_system_dirty;
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
}
static void clear_precedence(thread_db* tdbb, BufferDesc* bdb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* c l e a r _ p r e c e d e n c e
*
**************************************
*
* Functional description
* Clear precedence relationships to lower precedence block.
*
**************************************/
SET_TDBB(tdbb);
2009-06-06 11:05:20 +02:00
Database* const dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_ACQUIRE;
2009-06-06 11:05:20 +02:00
BufferControl* const bcb = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Loop thru lower precedence buffers. If any can be downgraded,
// by all means down grade them.
2001-05-23 15:26:42 +02:00
while (QUE_NOT_EMPTY(bdb->bdb_lower))
{
QUE que_inst = bdb->bdb_lower.que_forward;
Precedence* precedence = BLOCK(que_inst, Precedence*, pre_lower);
BufferDesc* low_bdb = precedence->pre_low;
2001-05-23 15:26:42 +02:00
QUE_DELETE(precedence->pre_higher);
QUE_DELETE(precedence->pre_lower);
precedence->pre_hi = (BufferDesc*) bcb->bcb_free;
2001-05-23 15:26:42 +02:00
bcb->bcb_free = precedence;
2009-06-26 06:12:20 +02:00
if (!(precedence->pre_flags & PRE_cleared))
{
2001-05-23 15:26:42 +02:00
if (low_bdb->bdb_ast_flags & BDB_blocking)
2003-08-13 13:11:12 +02:00
{
2001-05-23 15:26:42 +02:00
PAGE_LOCK_RE_POST(low_bdb->bdb_lock);
2003-08-13 13:11:12 +02:00
}
2001-05-23 15:26:42 +02:00
}
}
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
}
static BufferDesc* dealloc_bdb(BufferDesc* bdb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* d e a l l o c _ b d b
*
**************************************
*
* Functional description
* Deallocate buffer descriptor block.
*
**************************************/
2009-06-26 06:12:20 +02:00
if (bdb)
{
#ifndef SUPERSERVER
delete bdb->bdb_lock;
2001-05-23 15:26:42 +02:00
#endif
QUE_DELETE(bdb->bdb_que);
2001-12-24 03:51:06 +01:00
delete bdb;
2001-05-23 15:26:42 +02:00
}
return NULL;
2001-05-23 15:26:42 +02:00
}
#ifndef SUPERSERVER
2003-12-22 11:00:59 +01:00
// CVC: Nobody was interested in the result from this function, so I made it
// void instead of bool, but preserved the returned values in comments.
static void down_grade(thread_db* tdbb, BufferDesc* bdb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* d o w n _ g r a d e
*
**************************************
*
* Functional description
* A lock on a page is blocking another process. If possible, downgrade
* the lock on the buffer. This may be called from either AST or
* regular level. Return true if the down grade was successful. If the
* down grade was deferred for any reason, return false.
2001-05-23 15:26:42 +02:00
*
**************************************/
SET_TDBB(tdbb);
bdb->bdb_ast_flags |= BDB_blocking;
Lock* lock = bdb->bdb_lock;
2004-03-07 08:58:55 +01:00
Database* dbb = bdb->bdb_dbb;
2001-05-23 15:26:42 +02:00
if (dbb->dbb_flags & DBB_bugcheck)
{
2001-05-23 15:26:42 +02:00
PAGE_LOCK_RELEASE(bdb->bdb_lock);
bdb->bdb_ast_flags &= ~BDB_blocking;
clear_dirty_flag(tdbb, bdb);
return; // true;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// If the BufferDesc is in use and, being written or already
// downgraded to read, mark it as blocking and exit.
2001-05-23 15:26:42 +02:00
if (bdb->bdb_use_count) {
return; // false;
}
2001-05-23 15:26:42 +02:00
latch_bdb(tdbb, LATCH_io, bdb, bdb->bdb_page, 1);
2009-08-23 13:43:25 +02:00
// If the page isn't dirty, the lock can be quietly downgraded.
2001-05-23 15:26:42 +02:00
if (!(bdb->bdb_flags & BDB_dirty))
{
2001-05-23 15:26:42 +02:00
bdb->bdb_ast_flags &= ~BDB_blocking;
LCK_downgrade(tdbb, lock);
release_bdb(tdbb, bdb, false, false, false);
return; // true;
2001-05-23 15:26:42 +02:00
}
bool in_use = false, invalid = false;
2001-05-23 15:26:42 +02:00
if (bdb->bdb_flags & BDB_not_valid) {
invalid = true;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If there are higher precedence guys, see if they can be written.
2009-06-06 11:05:20 +02:00
for (QUE que_inst = bdb->bdb_higher.que_forward; que_inst != &bdb->bdb_higher;
que_inst = que_inst->que_forward)
2003-12-22 11:00:59 +01:00
{
Precedence* precedence = BLOCK(que_inst, Precedence*, pre_higher);
2001-05-23 15:26:42 +02:00
if (precedence->pre_flags & PRE_cleared)
continue;
2009-06-26 06:12:20 +02:00
if (invalid)
{
2001-05-23 15:26:42 +02:00
precedence->pre_flags |= PRE_cleared;
continue;
}
BufferDesc* blocking_bdb = precedence->pre_hi;
if (blocking_bdb->bdb_flags & BDB_dirty)
{
2001-05-23 15:26:42 +02:00
down_grade(tdbb, blocking_bdb);
if (blocking_bdb->bdb_flags & BDB_dirty) {
in_use = true;
}
2009-06-26 06:12:20 +02:00
if (blocking_bdb->bdb_flags & BDB_not_valid)
{
invalid = true;
in_use = false;
que_inst = bdb->bdb_higher.que_forward;
2001-05-23 15:26:42 +02:00
}
}
}
2009-08-23 13:43:25 +02:00
// If any higher precedence buffer can't be written, mark this buffer as blocking and exit.
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (in_use)
{
release_bdb(tdbb, bdb, false, false, false);
return; // false;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// Everything is clear to write this buffer. Do so and reduce the lock
2001-05-23 15:26:42 +02:00
2009-12-13 14:49:43 +01:00
if (invalid || !write_page(tdbb, bdb, tdbb->tdbb_status_vector, true))
2003-12-22 11:00:59 +01:00
{
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_not_valid;
clear_dirty_flag(tdbb, bdb);
2001-05-23 15:26:42 +02:00
bdb->bdb_ast_flags &= ~BDB_blocking;
TRA_invalidate(dbb, bdb->bdb_transactions);
bdb->bdb_transactions = 0;
PAGE_LOCK_RELEASE(bdb->bdb_lock);
}
2009-06-26 06:12:20 +02:00
else
{
2001-05-23 15:26:42 +02:00
bdb->bdb_ast_flags &= ~BDB_blocking;
LCK_downgrade(tdbb, lock);
}
2009-08-23 13:43:25 +02:00
// Clear precedence relationships to lower precedence buffers. Since it
// isn't safe to tweak the que pointers from AST level, just mark the precedence
// links as cleared. Somebody else will clean up the precedence blocks.
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
for (QUE que_inst = bdb->bdb_lower.que_forward; que_inst != &bdb->bdb_lower;
2008-12-20 20:57:43 +01:00
que_inst = que_inst->que_forward)
2003-12-22 11:00:59 +01:00
{
Precedence* precedence = BLOCK(que_inst, Precedence*, pre_lower);
BufferDesc* blocking_bdb = precedence->pre_low;
2001-05-23 15:26:42 +02:00
if (bdb->bdb_flags & BDB_not_valid)
blocking_bdb->bdb_flags |= BDB_not_valid;
precedence->pre_flags |= PRE_cleared;
2008-12-20 20:57:43 +01:00
if ((blocking_bdb->bdb_flags & BDB_not_valid) || (blocking_bdb->bdb_ast_flags & BDB_blocking))
2003-12-22 11:00:59 +01:00
{
2001-05-23 15:26:42 +02:00
down_grade(tdbb, blocking_bdb);
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
}
bdb->bdb_flags &= ~BDB_not_valid;
release_bdb(tdbb, bdb, false, false, false);
2001-05-23 15:26:42 +02:00
return; // true;
2001-05-23 15:26:42 +02:00
}
#endif
static void expand_buffers(thread_db* tdbb, ULONG number)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* e x p a n d _ b u f f e r s
*
**************************************
*
* Functional description
* Expand the cache to at least a given number of buffers. If
* it's already that big, don't do anything.
*
* Nickolay Samofatov, 08-Mar-2004.
* This function does not handle exceptions correctly,
* it looks like good handling requires rewrite.
*
2001-05-23 15:26:42 +02:00
**************************************/
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
BufferControl* old = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
if (number <= old->bcb_count || number > MAX_PAGE_BUFFERS) {
2001-05-23 15:26:42 +02:00
return;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// for Win16 platform, we want to ensure that no cache buffer ever ends on a segment boundary
// CVC: Is this code obsolete or only the comment?
2001-05-23 15:26:42 +02:00
ULONG num_per_seg = number - old->bcb_count;
ULONG left_to_do = num_per_seg;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Allocate and initialize buffers control block
Jrd::ContextPoolHolder context(tdbb, dbb->dbb_bufferpool);
2001-05-23 15:26:42 +02:00
old = dbb->dbb_bcb;
const bcb_repeat* const old_end = old->bcb_rpt + old->bcb_count;
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
BufferControl* new_block = FB_NEW_RPT(*dbb->dbb_bufferpool, number)
BufferControl(*dbb->dbb_bufferpool);
2004-02-02 12:02:12 +01:00
new_block->bcb_count = number;
2009-08-23 13:43:25 +02:00
new_block->bcb_free_minimum = (SSHORT) MIN(number / 4, 128); // 25% clean page reserve
2004-02-02 12:02:12 +01:00
new_block->bcb_checkpoint = old->bcb_checkpoint;
new_block->bcb_flags = old->bcb_flags;
const bcb_repeat* const new_end = new_block->bcb_rpt + number;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// point at the dirty page binary tree
2001-05-23 15:26:42 +02:00
new_block->bcb_dirty_count = old->bcb_dirty_count;
QUE_INSERT(old->bcb_dirty, new_block->bcb_dirty);
QUE_DELETE(old->bcb_dirty);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// point at the free precedence blocks
2001-05-23 15:26:42 +02:00
2004-02-02 12:02:12 +01:00
new_block->bcb_free = old->bcb_free;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// position the new bcb in the in use, empty and latch queues
2001-05-23 15:26:42 +02:00
2004-02-02 12:02:12 +01:00
QUE_INSERT(old->bcb_in_use, new_block->bcb_in_use);
2001-05-23 15:26:42 +02:00
QUE_DELETE(old->bcb_in_use);
2004-02-02 12:02:12 +01:00
QUE_INSERT(old->bcb_empty, new_block->bcb_empty);
2001-05-23 15:26:42 +02:00
QUE_DELETE(old->bcb_empty);
2004-02-02 12:02:12 +01:00
QUE_INSERT(old->bcb_free_lwt, new_block->bcb_free_lwt);
2001-05-23 15:26:42 +02:00
QUE_DELETE(old->bcb_free_lwt);
QUE_INSERT(old->bcb_free_slt, new_block->bcb_free_slt);
QUE_DELETE(old->bcb_free_slt);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Copy addresses of previously allocated buffer space to new block
2001-05-23 15:26:42 +02:00
for (Jrd::UCharStack::iterator stack(old->bcb_memory); stack.hasData(); ++stack) {
new_block->bcb_memory.push(stack.object());
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Initialize tail of new buffer control block
bcb_repeat* new_tail;
2004-02-02 12:02:12 +01:00
for (new_tail = new_block->bcb_rpt; new_tail < new_end; new_tail++) {
2001-05-23 15:26:42 +02:00
QUE_INIT(new_tail->bcb_page_mod);
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Move any active buffers from old block to new
2001-05-23 15:26:42 +02:00
2004-02-02 12:02:12 +01:00
new_tail = new_block->bcb_rpt;
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
for (bcb_repeat* old_tail = old->bcb_rpt; old_tail < old_end; old_tail++, new_tail++)
{
2001-05-23 15:26:42 +02:00
new_tail->bcb_bdb = old_tail->bcb_bdb;
while (QUE_NOT_EMPTY(old_tail->bcb_page_mod))
{
QUE que_inst = old_tail->bcb_page_mod.que_forward;
BufferDesc* bdb = BLOCK(que_inst, BufferDesc*, bdb_que);
2008-05-11 14:27:51 +02:00
QUE_DELETE(*que_inst);
QUE mod_que =
2006-05-22 00:07:35 +02:00
&new_block->bcb_rpt[bdb->bdb_page.getPageNum() % new_block->bcb_count].bcb_page_mod;
2008-05-11 14:27:51 +02:00
QUE_INSERT(*mod_que, *que_inst);
2001-05-23 15:26:42 +02:00
}
}
2009-08-23 13:43:25 +02:00
// Allocate new buffer descriptor blocks
2001-05-23 15:26:42 +02:00
ULONG num_in_seg = 0;
2006-12-04 22:26:43 +01:00
UCHAR* memory = NULL;
for (; new_tail < new_end; new_tail++)
{
2009-08-23 13:43:25 +02:00
// if current segment is exhausted, allocate another
2001-05-23 15:26:42 +02:00
if (!num_in_seg)
{
2006-12-04 22:26:43 +01:00
const size_t alloc_size = dbb->dbb_page_size * (num_per_seg + 1);
memory = (UCHAR*) dbb->dbb_bufferpool->allocate_nothrow(alloc_size);
// NOMEM: crash!
new_block->bcb_memory.push(memory);
2006-12-04 22:26:43 +01:00
memory = (UCHAR *) FB_ALIGN((U_IPTR) memory, dbb->dbb_page_size);
2001-05-23 15:26:42 +02:00
num_in_seg = num_per_seg;
left_to_do -= num_per_seg;
if (num_per_seg > left_to_do) {
2001-05-23 15:26:42 +02:00
num_per_seg = left_to_do;
}
2001-05-23 15:26:42 +02:00
}
2004-02-02 12:02:12 +01:00
new_tail->bcb_bdb = alloc_bdb(tdbb, new_block, &memory);
2001-05-23 15:26:42 +02:00
num_in_seg--;
}
2009-08-23 13:43:25 +02:00
// Set up new buffer control, release old buffer control, and clean up
2001-05-23 15:26:42 +02:00
2004-02-02 12:02:12 +01:00
dbb->dbb_bcb = new_block;
2001-05-23 15:26:42 +02:00
2001-12-24 03:51:06 +01:00
delete old;
2001-05-23 15:26:42 +02:00
}
2006-05-22 00:07:35 +02:00
static BufferDesc* get_buffer(thread_db* tdbb, const PageNumber page, LATCH latch, SSHORT latch_wait)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* g e t _ b u f f e r
*
**************************************
*
* Functional description
* Get a buffer. If possible, get a buffer already assigned
* to the page. Otherwise get one from the free list or pick
* the least recently used buffer to be reused.
* Note the following special page numbers:
* -1 indicates that a buffer is required for journaling => obsolete
2001-05-23 15:26:42 +02:00
* -2 indicates a special scratch buffer for shadowing
*
* input
* page: page to get
* latch: type of latch to acquire on the page.
* latch_wait: 1 => Wait as long as necessary to get the latch.
* This can cause deadlocks of course.
* 0 => If the latch can't be acquired immediately,
* give up and return 0;
* <negative number> => Latch timeout interval in seconds.
*
* return
* BufferDesc pointer if successful.
2001-05-23 15:26:42 +02:00
* NULL pointer if timeout occurred (only possible is latch_wait <> 1).
* if cache manager doesn't have any pages to write anymore.
*
2001-05-23 15:26:42 +02:00
**************************************/
// CVC: Those two vars are tricky or nonsense to put in minimal scope.
QUE que_inst;
BufferControl* bcb;
2001-05-23 15:26:42 +02:00
SET_TDBB(tdbb);
Database* dbb = tdbb->getDatabase();
#ifdef CACHE_WRITER
SSHORT walk = dbb->dbb_bcb->bcb_free_minimum;
#endif
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
while (true)
{
2001-05-23 15:26:42 +02:00
find_page:
bcb = dbb->dbb_bcb;
2009-01-14 10:19:00 +01:00
if (page.getPageNum() >= 0)
{
2009-08-23 13:43:25 +02:00
// Check to see if buffer has already been assigned to page
2001-05-23 15:26:42 +02:00
2006-05-22 00:07:35 +02:00
QUE mod_que = &bcb->bcb_rpt[page.getPageNum() % bcb->bcb_count].bcb_page_mod;
for (que_inst = mod_que->que_forward; que_inst != mod_que;
2009-01-14 10:19:00 +01:00
que_inst = que_inst->que_forward)
{
BufferDesc* bdb = BLOCK(que_inst, BufferDesc*, bdb_que);
if (bdb->bdb_page == page)
{
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER_V2
2006-05-22 00:07:35 +02:00
if (page != HEADER_PAGE_NUMBER)
2001-05-23 15:26:42 +02:00
#endif
2009-04-01 12:49:54 +02:00
QUE_MOST_RECENTLY_USED(bdb->bdb_in_use);
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
2008-12-18 11:47:25 +01:00
const SSHORT latch_return = latch_bdb(tdbb, latch, bdb, page, latch_wait);
2008-01-16 09:31:31 +01:00
if (latch_return)
{
if (latch_return == 1) {
2009-08-23 13:43:25 +02:00
return NULL; // permitted timeout happened
}
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
goto find_page;
}
2008-01-16 09:31:31 +01:00
bdb->bdb_flags &= ~(BDB_faked | BDB_prefetch);
tdbb->bumpStats(RuntimeStatistics::PAGE_FETCHES);
return bdb;
2001-05-23 15:26:42 +02:00
}
}
2001-05-23 15:26:42 +02:00
}
#ifdef CACHE_WRITER
2009-01-14 10:19:00 +01:00
else if ((page == FREE_PAGE) || (page == CHECKPOINT_PAGE))
{
2009-08-23 13:43:25 +02:00
// This code is only used by the background I/O threads:
// cache writer, cache reader and garbage collector.
2001-05-23 15:26:42 +02:00
Database::Checkout dcoHolder(dbb);
for (que_inst = bcb->bcb_in_use.que_backward;
que_inst != &bcb->bcb_in_use; que_inst = que_inst->que_backward)
2003-12-22 11:00:59 +01:00
{
BufferDesc* bdb = BLOCK(que_inst, BufferDesc*, bdb_in_use);
2008-01-16 09:31:31 +01:00
if (page == FREE_PAGE)
{
2008-12-20 20:57:43 +01:00
if (bdb->bdb_use_count || (bdb->bdb_flags & BDB_free_pending))
{
continue;
}
2009-06-26 06:12:20 +02:00
if (bdb->bdb_flags & BDB_db_dirty)
{
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return bdb;
}
2009-06-26 06:12:20 +02:00
if (!--walk)
{
2001-05-23 15:26:42 +02:00
bcb->bcb_flags &= ~BCB_free_pending;
break;
}
}
2009-06-26 06:12:20 +02:00
else // if (page == CHECKPOINT_PAGE)
{
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (bdb->bdb_flags & BDB_checkpoint)
{
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return bdb;
}
}
}
if (page == FREE_PAGE) {
bcb->bcb_flags &= ~BCB_free_pending;
}
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
return NULL;
2001-05-23 15:26:42 +02:00
}
#endif
for (que_inst = bcb->bcb_in_use.que_backward;
que_inst != &bcb->bcb_in_use || QUE_NOT_EMPTY(bcb->bcb_empty);
que_inst = que_inst->que_backward)
{
2009-08-23 13:43:25 +02:00
bcb = dbb->dbb_bcb; // Re-initialize in the loop
2006-05-22 00:07:35 +02:00
QUE mod_que = &bcb->bcb_rpt[page.getPageNum() % bcb->bcb_count].bcb_page_mod;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If there is an empty buffer sitting around, allocate it
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (QUE_NOT_EMPTY(bcb->bcb_empty))
{
que_inst = bcb->bcb_empty.que_forward;
2008-05-11 14:27:51 +02:00
QUE_DELETE(*que_inst);
BufferDesc* bdb = BLOCK(que_inst, BufferDesc*, bdb_que);
2009-01-14 10:19:00 +01:00
if (page.getPageNum() >= 0)
{
2008-05-11 14:27:51 +02:00
QUE_INSERT(*mod_que, *que_inst);
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER_V2
2009-08-23 13:43:25 +02:00
// Reserve a buffer for header page with deferred header
// page write mechanism. Otherwise, a deadlock will occur
// if all dirty pages in the cache must force header page
// to disk before they can be written but there is no free
// buffer to read the header page into.
2001-05-23 15:26:42 +02:00
2006-05-22 00:07:35 +02:00
if (page != HEADER_PAGE_NUMBER)
2001-05-23 15:26:42 +02:00
#endif
2009-04-01 12:49:54 +02:00
QUE_INSERT(bcb->bcb_in_use, bdb->bdb_in_use);
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// This correction for bdb_use_count below is needed to
// avoid a deadlock situation in latching code. It's not
// clear though how the bdb_use_count can get < 0 for a bdb
// in bcb_empty queue
if (bdb->bdb_use_count < 0) {
2009-08-23 13:43:25 +02:00
BUGCHECK(301); // msg 301 Non-zero use_count of a buffer in the empty que_inst
}
2001-05-23 15:26:42 +02:00
bdb->bdb_page = page;
fb_assert((bdb->bdb_flags & (BDB_dirty | BDB_marked)) == 0)
2001-05-23 15:26:42 +02:00
bdb->bdb_flags = BDB_read_pending;
bdb->bdb_scan_count = 0;
2009-08-23 13:43:25 +02:00
// The following latch should never fail because the buffer is 'empty'
// and the page is not in cache.
if (latch_bdb(tdbb, latch, bdb, page, -100) == -1) {
2009-08-23 13:43:25 +02:00
BUGCHECK(302); // msg 302 unexpected page change
}
#ifndef SUPERSERVER
2009-06-26 06:12:20 +02:00
if (page.getPageNum() >= 0)
{
CCH_TRACE(("bdb->bdb_lock->lck_logical = LCK_none; page=%i", bdb->bdb_page));
2001-05-23 15:26:42 +02:00
bdb->bdb_lock->lck_logical = LCK_none;
}
else {
2001-05-23 15:26:42 +02:00
PAGE_LOCK_RELEASE(bdb->bdb_lock);
}
2001-05-23 15:26:42 +02:00
#endif
tdbb->bumpStats(RuntimeStatistics::PAGE_FETCHES);
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return bdb;
}
2009-08-23 13:43:25 +02:00
// get the oldest buffer as the least recently used -- note
// that since there are no empty buffers this queue cannot be empty
2001-05-23 15:26:42 +02:00
if (bcb->bcb_in_use.que_forward == &bcb->bcb_in_use) {
2009-08-23 13:43:25 +02:00
BUGCHECK(213); // msg 213 insufficient cache size
}
2001-05-23 15:26:42 +02:00
BufferDesc* oldest = BLOCK(que_inst, BufferDesc*, bdb_in_use);
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_ACQUIRE;
2008-12-18 11:47:25 +01:00
if (oldest->bdb_use_count || (oldest->bdb_flags & BDB_free_pending) ||
!writeable(oldest))
2003-12-22 11:00:59 +01:00
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
continue;
}
#ifdef SUPERSERVER_V2
2009-08-23 13:43:25 +02:00
// If page has been prefetched but not yet fetched, let
// it cycle once more thru LRU queue before re-using it.
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (oldest->bdb_flags & BDB_prefetch)
{
2001-05-23 15:26:42 +02:00
oldest->bdb_flags &= ~BDB_prefetch;
que_inst = que_inst->que_forward;
2001-05-23 15:26:42 +02:00
QUE_MOST_RECENTLY_USED(oldest->bdb_in_use);
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
continue;
}
#endif
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
#ifdef CACHE_WRITER
2009-01-14 10:19:00 +01:00
if (oldest->bdb_flags & (BDB_dirty | BDB_db_dirty))
{
2001-05-23 15:26:42 +02:00
bcb->bcb_flags |= BCB_free_pending;
2008-12-20 20:57:43 +01:00
if ((bcb->bcb_flags & BCB_cache_writer) && !(bcb->bcb_flags & BCB_writer_active))
{
dbb->dbb_writer_sem.release();
}
if (walk)
{
2008-01-16 09:31:31 +01:00
if (!--walk)
2001-05-23 15:26:42 +02:00
break;
2008-01-16 09:31:31 +01:00
continue;
2001-05-23 15:26:42 +02:00
}
}
#endif
BufferDesc* bdb = oldest;
if (latch_bdb(tdbb, LATCH_exclusive, bdb, bdb->bdb_page, 0)) {
2009-08-23 13:43:25 +02:00
continue; // BufferDesc changed, continue looking for a buffer
}
2001-05-23 15:26:42 +02:00
QUE_MOST_RECENTLY_USED(bdb->bdb_in_use);
bdb->bdb_flags |= BDB_free_pending;
2009-08-23 13:43:25 +02:00
// If the buffer selected is dirty, arrange to have it written.
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (bdb->bdb_flags & (BDB_dirty | BDB_db_dirty))
{
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER
2008-12-18 11:47:25 +01:00
if (!write_buffer(tdbb, bdb, bdb->bdb_page, true, tdbb->tdbb_status_vector, true))
2001-05-23 15:26:42 +02:00
#else
2008-12-18 11:47:25 +01:00
if (!write_buffer (tdbb, bdb, bdb->bdb_page, false, tdbb->tdbb_status_vector, true))
2001-05-23 15:26:42 +02:00
#endif
{
bdb->bdb_flags &= ~BDB_free_pending;
release_bdb(tdbb, bdb, false, false, false);
CCH_unwind(tdbb, true);
2001-05-23 15:26:42 +02:00
}
}
2009-08-23 13:43:25 +02:00
bcb = dbb->dbb_bcb; // Re-initialize
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If the buffer is still in the dirty tree, remove it.
// In any case, release any lock it may have.
2001-05-23 15:26:42 +02:00
removeDirty(bcb, bdb);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Cleanup any residual precedence blocks. Unless something is
// screwed up, the only precedence blocks that can still be hanging
// around are ones cleared at AST level.
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_ACQUIRE;
while (QUE_NOT_EMPTY(bdb->bdb_higher))
{
QUE que2 = bdb->bdb_higher.que_forward;
Precedence* precedence = BLOCK(que2, Precedence*, pre_higher);
2001-05-23 15:26:42 +02:00
QUE_DELETE(precedence->pre_higher);
QUE_DELETE(precedence->pre_lower);
precedence->pre_hi = (BufferDesc*) bcb->bcb_free;
2001-05-23 15:26:42 +02:00
bcb->bcb_free = precedence;
}
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
clear_precedence(tdbb, bdb);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// remove the buffer from the "mod" queue and place it
// in it's new spot, provided it's not a negative (scratch) page
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//BCB_MUTEX_ACQUIRE;
2006-05-22 00:07:35 +02:00
if (bdb->bdb_page.getPageNum() >= 0) {
2001-05-23 15:26:42 +02:00
QUE_DELETE(bdb->bdb_que);
}
2001-05-23 15:26:42 +02:00
QUE_INSERT(bcb->bcb_empty, bdb->bdb_que);
2008-05-11 14:27:51 +02:00
QUE_DELETE(bdb->bdb_in_use);
2001-05-23 15:26:42 +02:00
bdb->bdb_page = JOURNAL_PAGE;
release_bdb(tdbb, bdb, false, false, false);
2001-05-23 15:26:42 +02:00
break;
}
if (que_inst == &bcb->bcb_in_use)
{
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER
expand_buffers(tdbb, bcb->bcb_count + 75);
#else
2009-08-23 13:43:25 +02:00
BUGCHECK(214); // msg 214 no cache buffers available for reuse
2001-05-23 15:26:42 +02:00
#endif
}
2001-05-23 15:26:42 +02:00
}
}
static ULONG get_prec_walk_mark(BufferControl* bcb)
{
/**************************************
*
* g e t _ p r e c _ w a l k _ m a r k
*
**************************************
*
* Functional description
* Get next mark for walking precedence graph.
*
**************************************/
if (++bcb->bcb_prec_walk_mark == 0)
{
for (ULONG i = 0; i < bcb->bcb_count; i++) {
bcb->bcb_rpt[i].bcb_bdb->bdb_prec_walk_mark = 0;
}
bcb->bcb_prec_walk_mark = 1;
}
return bcb->bcb_prec_walk_mark;
}
static int get_related(BufferDesc* bdb, PagesArray &lowPages, int limit, const ULONG mark)
{
/**************************************
*
* g e t _ r e l a t e d
*
**************************************
*
* Functional description
2009-10-15 04:15:31 +02:00
* Recursively walk low part of precedence graph of given buffer and put
* low pages numbers into array.
*
**************************************/
const struct que* base = &bdb->bdb_lower;
2009-10-15 04:15:31 +02:00
for (const struct que* que_inst = base->que_forward; que_inst != base;
que_inst = que_inst->que_forward)
{
const Precedence* precedence = BLOCK(que_inst, Precedence*, pre_lower);
if (precedence->pre_flags & PRE_cleared)
continue;
2009-10-15 04:15:31 +02:00
BufferDesc* low = precedence->pre_low;
if (low->bdb_prec_walk_mark == mark)
continue;
if (!--limit)
return 0;
const SLONG lowPage = low->bdb_page.getPageNum();
size_t pos;
if (!lowPages.find(lowPage, pos))
lowPages.insert(pos, lowPage);
if (QUE_NOT_EMPTY(low->bdb_lower))
{
limit = get_related(low, lowPages, limit, mark);
if (!limit)
return 0;
}
else
low->bdb_prec_walk_mark = mark;
}
bdb->bdb_prec_walk_mark = mark;
return limit;
}
2007-02-06 09:03:43 +01:00
static void invalidate_and_release_buffer(thread_db* tdbb, BufferDesc* bdb)
{
/**************************************
*
* i n v a l i d a t e _ a n d _ r e l e a s e _ b u f f e r
*
**************************************
*
* Functional description
* Invalidate the page buffer.
2007-02-06 09:03:43 +01:00
*
**************************************/
Database* dbb = tdbb->getDatabase();
2007-02-06 09:03:43 +01:00
bdb->bdb_flags |= BDB_not_valid;
clear_dirty_flag(tdbb, bdb);
2007-02-06 09:03:43 +01:00
TRA_invalidate(dbb, bdb->bdb_transactions);
bdb->bdb_transactions = 0;
release_bdb(tdbb, bdb, false, false, false);
}
2009-01-14 10:19:00 +01:00
static SSHORT latch_bdb(thread_db* tdbb,
2006-05-22 00:07:35 +02:00
LATCH type, BufferDesc* bdb, const PageNumber page, SSHORT latch_wait)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* l a t c h _ b d b
*
**************************************
*
* Functional description
*
* input
* type: LATCH_none, LATCH_exclusive, LATCH_io, LATCH_shared, or LATCH_mark.
* bdb: object to acquire latch on.
* page: page of bdb, for verification.
* latch_wait: 1 => Wait as long as necessary to get the latch.
* This can cause deadlocks of course.
* 0 => If the latch can't be acquired immediately,
* give up and return 1.
* <negative number> => Latch timeout interval in seconds.
*
* return
* 0: latch successfully acquired.
* 1: latch not acquired due to a (permitted) timeout.
* -1: latch not acquired, bdb doesn't corresponds to page.
*
**************************************/
2009-08-23 13:43:25 +02:00
// If the buffer has been reassigned to another page make the caller deal with it.
2001-05-23 15:26:42 +02:00
if (bdb->bdb_page != page) {
2001-05-23 15:26:42 +02:00
return -1;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Handle the easy case first, no users of the buffer.
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (!bdb->bdb_use_count)
{
switch (type)
{
2001-05-23 15:26:42 +02:00
case LATCH_shared:
++bdb->bdb_use_count;
allocSharedLatch(tdbb, bdb);
2001-05-23 15:26:42 +02:00
break;
case LATCH_exclusive:
++bdb->bdb_use_count;
bdb->bdb_exclusive = tdbb;
break;
case LATCH_io:
++bdb->bdb_use_count;
bdb->bdb_io = tdbb;
break;
case LATCH_mark:
2009-08-23 13:43:25 +02:00
BUGCHECK(295); // inconsistent LATCH_mark call
2001-05-23 15:26:42 +02:00
break;
case LATCH_none:
break;
}
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 0;
}
2009-08-23 13:43:25 +02:00
/* Grant the latch request if it is compatible with existing
latch holders. Pending latches are queued in the order in
which they are requested except that io/mark latches are queued
ahead of all other latch requests (to avoid deadlocks and
this does not cause starvation). Also, shared latches are granted
immediately if a disk write is in progress.
Note that asking for a higher mode latch when already holding a
share latch results in deadlock. CCH_handoff routinely acquires a
shared latch while owning already a shared latch on the page
(the case of handing off to the same page). If the BDB_must_write
flag is set, then an exclusive latch request will be followed by
an io latch request. */
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
switch (type)
{
2001-05-23 15:26:42 +02:00
case LATCH_none:
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 0;
case LATCH_shared:
if (bdb->bdb_flags & BDB_read_pending) {
2001-05-23 15:26:42 +02:00
break;
}
2009-06-26 06:12:20 +02:00
if (bdb->bdb_exclusive)
{
if (bdb->bdb_exclusive != tdbb) {
2009-08-23 13:43:25 +02:00
break; // someone else owns exclusive latch
}
2001-05-23 15:26:42 +02:00
}
2009-01-14 10:19:00 +01:00
else
{
2009-08-23 13:43:25 +02:00
// Note that Firebird often 'hands-off' to the same page, for both
// shared and exlusive latches.
// Check if we own already an exclusive latch.
if (!findSharedLatch(tdbb, bdb))
2009-08-23 13:43:25 +02:00
{
// we don't own a shared latch yet
// If there are latch-waiters, and they are not waiting for an
// io_latch, then we have to wait also (there must be a exclusive
// latch waiter). If there is an IO in progress, then violate the
// fairness and sneak ahead of the exclusive (or io) waiters.
2001-05-23 15:26:42 +02:00
if ((QUE_NOT_EMPTY(bdb->bdb_waiters)) && !bdb->bdb_io) {
2009-08-23 13:43:25 +02:00
break; // be fair and wait behind exclusive latch requests
}
2001-05-23 15:26:42 +02:00
}
}
2009-08-23 13:43:25 +02:00
// Nobody owns an exlusive latch, or sneak ahead of exclusive latch
// waiters while an io is in progress.
2001-05-23 15:26:42 +02:00
++bdb->bdb_use_count;
allocSharedLatch(tdbb, bdb);
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 0;
case LATCH_io:
if (bdb->bdb_flags & BDB_read_pending) {
2001-05-23 15:26:42 +02:00
break;
}
if (bdb->bdb_io) {
2009-08-23 13:43:25 +02:00
break; // someone else owns the io latch
}
2001-05-23 15:26:42 +02:00
++bdb->bdb_use_count;
bdb->bdb_io = tdbb;
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 0;
case LATCH_exclusive:
2009-08-23 13:43:25 +02:00
// Exclusive latches wait for existing shared latches and
// (unfortunately) for existing io latches. This is not as
// bad as it sounds because an exclusive latch is typically followed
// by a mark latch, which then would wait behind the io latch.
// Obsolete: Note that the ail-code latches the same buffer multiple times
// in shared and exclusive
// Note that Firebird often 'hands-off' to the same page, for both
// shared and exlusive latches.
if (bdb->bdb_use_count && (bdb->bdb_exclusive != tdbb)) {
2001-05-23 15:26:42 +02:00
break;
}
2001-05-23 15:26:42 +02:00
++bdb->bdb_use_count;
bdb->bdb_exclusive = tdbb;
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 0;
case LATCH_mark:
if (bdb->bdb_exclusive != tdbb) {
2009-08-23 13:43:25 +02:00
BUGCHECK(295); // inconsistent LATCH_mark call
}
2009-08-23 13:43:25 +02:00
// Some Firebird code marks a buffer more than once.
if (bdb->bdb_io && (bdb->bdb_io != tdbb)) {
2001-05-23 15:26:42 +02:00
break;
}
2001-05-23 15:26:42 +02:00
bdb->bdb_io = tdbb;
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 0;
default:
break;
}
2009-08-23 13:43:25 +02:00
// If the caller doesn't want to wait for this latch, then return now.
2009-06-26 06:12:20 +02:00
if (latch_wait == 0)
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 1;
}
2009-08-23 13:43:25 +02:00
// Get or create a latch wait block and wait for someone to grant the latch.
2001-05-23 15:26:42 +02:00
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
LatchWait* lwt;
if (QUE_NOT_EMPTY(bcb->bcb_free_lwt))
{
QUE que_inst = bcb->bcb_free_lwt.que_forward;
2008-05-11 14:27:51 +02:00
QUE_DELETE(*que_inst);
lwt = (LatchWait*) BLOCK(que_inst, LatchWait*, lwt_waiters);
2001-05-23 15:26:42 +02:00
}
else
{
lwt = FB_NEW(*dbb->dbb_bufferpool) LatchWait;
QUE_INIT(lwt->lwt_waiters);
2001-05-23 15:26:42 +02:00
}
lwt->lwt_flags |= LWT_pending;
lwt->lwt_latch = type;
lwt->lwt_tdbb = tdbb;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Give priority to IO. This might prevent deadlocks while performing
// precedence writes. This does not cause starvation because an
// exclusive latch is needed to dirty the page again.
if ((type == LATCH_io) || (type == LATCH_mark)) {
2008-05-11 14:27:51 +02:00
QUE_INSERT(bdb->bdb_waiters, lwt->lwt_waiters);
}
else {
QUE_APPEND(bdb->bdb_waiters, lwt->lwt_waiters);
}
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
bool timeout_occurred = false;
2009-08-23 13:43:25 +02:00
// Loop until the latch is granted or until a timeout occurs.
while ((lwt->lwt_flags & LWT_pending) && !timeout_occurred)
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
Database::Checkout dcoHolder(dbb);
timeout_occurred = !(lwt->lwt_sem.tryEnter(latch_wait > 0 ? 120 : -latch_wait));
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
bcb = dbb->dbb_bcb; // Re-initialize
QUE_DELETE(lwt->lwt_waiters);
QUE_INSERT(bcb->bcb_free_lwt, lwt->lwt_waiters);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If the latch is not granted then a timeout must have occurred.
2009-01-14 10:19:00 +01:00
if ((lwt->lwt_flags & LWT_pending) && timeout_occurred)
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2009-06-26 06:12:20 +02:00
if (latch_wait == 1)
{
ERR_build_status(tdbb->tdbb_status_vector, Arg::Gds(isc_deadlock));
CCH_unwind(tdbb, true);
2001-05-23 15:26:42 +02:00
}
else {
2001-05-23 15:26:42 +02:00
return 1;
}
2001-05-23 15:26:42 +02:00
}
2009-06-26 06:12:20 +02:00
if (bdb->bdb_page != page)
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
release_bdb(tdbb, bdb, true, false, false);
2001-05-23 15:26:42 +02:00
return -1;
}
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return 0;
}
2009-06-06 11:05:20 +02:00
static SSHORT lock_buffer(thread_db* tdbb, BufferDesc* bdb, const SSHORT wait, const SCHAR page_type)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* l o c k _ b u f f e r
*
**************************************
*
* Functional description
* Get a lock on page for a buffer. If the lock ever slipped
* below READ, indicate that the page must be read.
*
* input:
* wait: LCK_WAIT = 1 => Wait as long a necessary to get the lock.
* LCK_NO_WAIT = 0 => If the lock can't be acquired immediately,
2001-05-23 15:26:42 +02:00
* give up and return -1.
* <negative number> => Lock timeout interval in seconds.
*
2007-05-16 08:53:47 +02:00
* return: 0 => buffer locked, page is already in memory.
2001-05-23 15:26:42 +02:00
* 1 => buffer locked, page needs to be read from disk.
* -1 => timeout on lock occurred, see input parameter 'wait'.
*
**************************************/
SET_TDBB(tdbb);
#ifdef SUPERSERVER
2001-05-23 15:26:42 +02:00
return ((bdb->bdb_flags & BDB_read_pending) ? 1 : 0);
#else
2008-12-18 11:47:25 +01:00
const USHORT lock_type = (bdb->bdb_flags & (BDB_dirty | BDB_writer)) ? LCK_write : LCK_read;
2009-06-06 11:05:20 +02:00
Lock* const lock = bdb->bdb_lock;
2001-05-23 15:26:42 +02:00
if (lock->lck_logical >= lock_type) {
2001-05-23 15:26:42 +02:00
return 0;
}
2001-05-23 15:26:42 +02:00
TEXT errmsg[MAX_ERRMSG_LEN + 1];
2009-06-06 11:05:20 +02:00
ISC_STATUS* const status = tdbb->tdbb_status_vector;
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (lock->lck_logical == LCK_none)
{
2009-08-23 13:43:25 +02:00
// Prevent header and TIP pages from generating blocking AST
// overhead. The promise is that the lock will unconditionally
// be released when the buffer use count indicates it is safe to do so.
2001-05-23 15:26:42 +02:00
if (page_type == pag_header || page_type == pag_transactions)
{
2003-11-04 00:59:24 +01:00
fb_assert(lock->lck_ast == blocking_ast_bdb);
fb_assert(lock->lck_object == bdb);
2001-05-23 15:26:42 +02:00
lock->lck_ast = 0;
lock->lck_object = NULL;
}
else {
2003-11-04 00:59:24 +01:00
fb_assert(lock->lck_ast != NULL);
}
2001-05-23 15:26:42 +02:00
2006-05-22 00:07:35 +02:00
//lock->lck_key.lck_long = bdb->bdb_page;
bdb->bdb_page.getLockStr(lock->lck_key.lck_string);
2009-01-14 10:19:00 +01:00
if (LCK_lock_opt(tdbb, lock, lock_type, wait))
{
if (!lock->lck_ast)
{
// Restore blocking AST to lock block if it was swapped out.
// Flag the BufferDesc so that the lock is released when the buffer is released.
2001-05-23 15:26:42 +02:00
fb_assert(page_type == pag_header || page_type == pag_transactions);
lock->lck_ast = blocking_ast_bdb;
lock->lck_object = bdb;
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_no_blocking_ast;
}
return 1;
}
2009-06-26 06:12:20 +02:00
if (!lock->lck_ast)
{
2003-11-04 00:59:24 +01:00
fb_assert(page_type == pag_header || page_type == pag_transactions);
lock->lck_ast = blocking_ast_bdb;
lock->lck_object = bdb;
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// Case: a timeout was specified, or the caller didn't want to wait, return the error.
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if ((wait == LCK_NO_WAIT) || ((wait < 0) && (status[1] == isc_lock_timeout)))
{
fb_utils::init_status(status);
release_bdb(tdbb, bdb, false, false, false);
2001-05-23 15:26:42 +02:00
return -1;
}
2009-08-23 13:43:25 +02:00
// Case: lock manager detected a deadlock, probably caused by locking the
// BufferDesc's in an unfortunate order. Nothing we can do about it, return the
// error, and log it to firebird.log.
2001-05-23 15:26:42 +02:00
fb_msg_format(0, JRD_BUGCHK, 215, sizeof(errmsg), errmsg,
MsgFormat::SafeArg() << bdb->bdb_page.getPageNum() << (int) page_type);
ERR_append_status(status, Arg::Gds(isc_random) << Arg::Str(errmsg));
2009-08-23 13:43:25 +02:00
ERR_log(JRD_BUGCHK, 215, errmsg); // msg 215 page %ld, page type %ld lock conversion denied
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// CCH_unwind releases all the BufferDesc's and calls ERR_punt()
// ERR_punt will longjump.
2001-05-23 15:26:42 +02:00
CCH_unwind(tdbb, true);
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
// Lock requires an upward conversion. Sigh. Try to get the conversion.
// If it fails, release the lock and re-seize. Save the contents of the
// status vector just in case
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
const SSHORT must_read = (lock->lck_logical < LCK_read) ? 1 : 0;
2001-05-23 15:26:42 +02:00
ISC_STATUS_ARRAY alt_status;
2001-05-23 15:26:42 +02:00
memcpy(alt_status, tdbb->tdbb_status_vector, sizeof(alt_status));
if (LCK_convert_opt(tdbb, lock, lock_type)) {
2001-05-23 15:26:42 +02:00
return must_read;
}
2009-06-06 11:05:20 +02:00
2009-06-26 06:12:20 +02:00
if (wait == LCK_NO_WAIT)
{
release_bdb(tdbb, bdb, true, false, false);
2001-05-23 15:26:42 +02:00
return -1;
}
memcpy(tdbb->tdbb_status_vector, alt_status, sizeof(alt_status));
if (LCK_lock(tdbb, lock, lock_type, wait)) {
2001-05-23 15:26:42 +02:00
return 1;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Case: a timeout was specified, or the caller didn't want to wait, return the error.
2001-05-23 15:26:42 +02:00
2008-12-05 02:20:14 +01:00
if ((wait < 0) && (status[1] == isc_lock_timeout))
{
fb_utils::init_status(status);
release_bdb(tdbb, bdb, false, false, false);
2001-05-23 15:26:42 +02:00
return -1;
}
2009-08-23 13:43:25 +02:00
// Case: lock manager detected a deadlock, probably caused by locking the
// BufferDesc's in an unfortunate order. Nothing we can do about it, return the
// error, and log it to firebird.log.
2001-05-23 15:26:42 +02:00
fb_msg_format(0, JRD_BUGCHK, 216, sizeof(errmsg), errmsg,
MsgFormat::SafeArg() << bdb->bdb_page.getPageNum() << (int) page_type);
ERR_append_status(status, Arg::Gds(isc_random) << Arg::Str(errmsg));
2009-08-23 13:43:25 +02:00
ERR_log(JRD_BUGCHK, 216, errmsg); // msg 216 page %ld, page type %ld lock denied
2001-05-23 15:26:42 +02:00
CCH_unwind(tdbb, true);
2009-08-23 13:43:25 +02:00
return 0; // Added to get rid of Compiler Warning
2001-05-23 15:26:42 +02:00
#endif
}
2007-04-11 18:05:40 +02:00
static ULONG memory_init(thread_db* tdbb, BufferControl* bcb, SLONG number)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* m e m o r y _ i n i t
*
**************************************
*
* Functional description
* Initialize memory for the cache.
* Return number of buffers allocated.
*
**************************************/
SET_TDBB(tdbb);
2009-06-06 11:05:20 +02:00
Database* const dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
2006-12-04 22:26:43 +01:00
UCHAR* memory = NULL;
SLONG buffers = 0;
const size_t page_size = dbb->dbb_page_size;
size_t memory_size = page_size * (number + 1);
2009-06-06 11:05:20 +02:00
fb_assert(memory_size > 0);
SLONG old_buffers = 0;
2006-12-04 22:26:43 +01:00
bcb_repeat* old_tail = NULL;
const UCHAR* memory_end = NULL;
bcb_repeat* tail = bcb->bcb_rpt;
// "end" is changed inside the loop
for (const bcb_repeat* end = tail + number; tail < end; tail++)
{
if (!memory)
{
2009-08-23 13:43:25 +02:00
// Allocate only what is required for remaining buffers.
2001-05-23 15:26:42 +02:00
2006-12-04 22:26:43 +01:00
if (memory_size > (page_size * (number + 1))) {
2001-05-23 15:26:42 +02:00
memory_size = page_size * (number + 1);
}
2001-05-23 15:26:42 +02:00
2008-12-05 02:20:14 +01:00
while (true)
2006-04-06 10:18:53 +02:00
{
2006-12-04 22:26:43 +01:00
try {
memory = (UCHAR*) dbb->dbb_bufferpool->allocate(memory_size);
break;
2006-12-04 22:26:43 +01:00
}
catch (Firebird::BadAlloc&)
{
2009-08-23 13:43:25 +02:00
// Either there's not enough virtual memory or there is
// but it's not virtually contiguous. Let's find out by
// cutting the size in half to see if the buffers can be
// scattered over the remaining virtual address space.
2006-12-04 22:26:43 +01:00
memory_size >>= 1;
2009-06-26 06:12:20 +02:00
if (memory_size < MIN_BUFFER_SEGMENT)
{
2009-08-23 13:43:25 +02:00
// Diminishing returns
2006-12-04 22:26:43 +01:00
return buffers;
}
}
2006-04-06 10:18:53 +02:00
}
2001-05-23 15:26:42 +02:00
bcb->bcb_memory.push(memory);
2001-05-23 15:26:42 +02:00
memory_end = memory + memory_size;
2009-08-23 13:43:25 +02:00
// Allocate buffers on an address that is an even multiple
// of the page size (rather the physical sector size.) This
// is a necessary condition to support raw I/O interfaces.
2006-12-04 22:26:43 +01:00
memory = (UCHAR *) FB_ALIGN((U_IPTR) memory, page_size);
2001-05-23 15:26:42 +02:00
old_tail = tail;
old_buffers = buffers;
}
QUE_INIT(tail->bcb_page_mod);
2009-01-14 10:19:00 +01:00
if (!(tail->bcb_bdb = alloc_bdb(tdbb, bcb, &memory)))
{
2009-08-23 13:43:25 +02:00
// Whoops! Time to reset our expectations. Release the buffer memory
// but use that memory size to calculate a new number that takes into account
// the page buffer overhead. Reduce this number by a 25% fudge factor to
// leave some memory for useful work.
2001-05-23 15:26:42 +02:00
2006-12-04 22:26:43 +01:00
dbb->dbb_bufferpool->deallocate(bcb->bcb_memory.pop());
memory = NULL;
for (bcb_repeat* tail2 = old_tail; tail2 < tail; tail2++)
{
2001-05-23 15:26:42 +02:00
tail2->bcb_bdb = dealloc_bdb(tail2->bcb_bdb);
}
2001-05-23 15:26:42 +02:00
number = memory_size / PAGE_OVERHEAD;
number -= number >> 2;
end = old_tail + number;
2009-08-23 13:43:25 +02:00
tail = --old_tail; // For loop continue pops tail above
2001-05-23 15:26:42 +02:00
buffers = old_buffers;
continue;
}
2009-08-23 13:43:25 +02:00
buffers++; // Allocated buffers
number--; // Remaining buffers
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Check if memory segment has been exhausted.
2001-05-23 15:26:42 +02:00
if (memory + page_size > memory_end) {
2001-05-23 15:26:42 +02:00
memory = 0;
}
2001-05-23 15:26:42 +02:00
}
return buffers;
}
2009-08-23 13:43:25 +02:00
static void page_validation_error(thread_db* tdbb, WIN* window, SSHORT type)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* p a g e _ v a l i d a t i o n _ e r r o r
*
**************************************
*
* Functional description
* We've detected a validation error on fetch. Generally
* we've detected that the type of page fetched didn't match the
* type of page we were expecting. Report an error and
* get out.
* This function will only be called rarely, as a page validation
* error is an indication of on-disk database corruption.
*
**************************************/
SET_TDBB(tdbb);
BufferDesc* bdb = window->win_bdb;
const pag* page = bdb->bdb_buffer;
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
PageSpace* pages =
tdbb->getDatabase()->dbb_page_manager.findPageSpace(bdb->bdb_page.getPageSpaceID());
2006-05-22 00:07:35 +02:00
ERR_build_status(tdbb->tdbb_status_vector,
Arg::Gds(isc_db_corrupt) << Arg::Str(pages->file->fil_string) <<
Arg::Gds(isc_page_type_err) <<
2008-12-05 02:20:14 +01:00
Arg::Gds(isc_badpagtyp) << Arg::Num(bdb->bdb_page.getPageNum()) <<
Arg::Num(type) <<
Arg::Num(page->pag_type));
2009-08-23 13:43:25 +02:00
// We should invalidate this bad buffer.
CCH_unwind(tdbb, true);
2001-05-23 15:26:42 +02:00
}
#ifdef CACHE_READER
static void prefetch_epilogue(Prefetch* prefetch, ISC_STATUS* status_vector)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* p r e f e t c h _ e p i l o g u e
*
**************************************
*
* Functional description
* Stall on asynchronous I/O completion.
* Move data from prefetch buffer to database
2001-05-23 15:26:42 +02:00
* buffers, compute the checksum, and release
* the latch.
*
**************************************/
if (!(prefetch->prf_flags & PRF_active)) {
2001-05-23 15:26:42 +02:00
return;
}
2001-05-23 15:26:42 +02:00
thread_db* tdbb = prefetch->prf_tdbb;
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
prefetch->prf_piob.piob_wait = TRUE;
const bool async_status = PIO_status(dbb, &prefetch->prf_piob, status_vector);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// If there was an I/O error release all buffer latches acquired for the prefetch request.
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (!async_status)
{
BufferDesc** next_bdb = prefetch->prf_bdbs;
for (USHORT i = 0; i < prefetch->prf_max_prefetch; i++)
{
if (*next_bdb) {
release_bdb(tdbb, *next_bdb, true, false, false);
}
2001-05-23 15:26:42 +02:00
next_bdb++;
}
prefetch->prf_flags &= ~PRF_active;
return;
}
const SCHAR* next_buffer = prefetch->prf_io_buffer;
BufferDesc** next_bdb = prefetch->prf_bdbs;
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
for (USHORT i = 0; i < prefetch->prf_max_prefetch; i++)
{
if (*next_bdb)
{
pag* page = (*next_bdb)->bdb_buffer;
if (next_buffer != reinterpret_cast<char*>(page)) {
2008-02-03 11:41:44 +01:00
memcpy(page, next_buffer, (ULONG) dbb->dbb_page_size);
}
2009-12-14 12:41:47 +01:00
if (page->pag_pageno == (*next_bdb)->bdb_page.getPageNum())
2009-06-26 06:12:20 +02:00
{
2001-05-23 15:26:42 +02:00
(*next_bdb)->bdb_flags &= ~(BDB_read_pending | BDB_not_valid);
(*next_bdb)->bdb_flags |= BDB_prefetch;
}
release_bdb(tdbb, *next_bdb, true, false, false);
2001-05-23 15:26:42 +02:00
}
next_buffer += dbb->dbb_page_size;
next_bdb++;
}
prefetch->prf_flags &= ~PRF_active;
}
static void prefetch_init(Prefetch* prefetch, thread_db* tdbb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* p r e f e t c h _ i n i t
*
**************************************
*
* Functional description
* Initialize prefetch data structure.
* Most systems that allow access to "raw" I/O
* interfaces want the buffer address aligned.
*
**************************************/
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
prefetch->prf_tdbb = tdbb;
prefetch->prf_flags = 0;
prefetch->prf_max_prefetch = PREFETCH_MAX_TRANSFER / dbb->dbb_page_size;
prefetch->prf_aligned_buffer =
2008-12-18 11:47:25 +01:00
(SCHAR*) (((U_IPTR) &prefetch->prf_unaligned_buffer + MIN_PAGE_SIZE - 1) &
~((U_IPTR) MIN_PAGE_SIZE - 1));
2001-05-23 15:26:42 +02:00
}
static void prefetch_io(Prefetch* prefetch, ISC_STATUS* status_vector)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* p r e f e t c h _ i o
*
**************************************
*
* Functional description
* Queue an asynchronous I/O to read
* multiple pages into prefetch buffer.
*
**************************************/
thread_db* tdbb = prefetch->prf_tdbb;
Database* dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
if (!prefetch->prf_page_count) {
2001-05-23 15:26:42 +02:00
prefetch->prf_flags &= ~PRF_active;
}
2009-01-14 10:19:00 +01:00
else
{
2009-08-23 13:43:25 +02:00
// Get the cache reader working on our behalf too
2001-05-23 15:26:42 +02:00
if (!(dbb->dbb_bcb->bcb_flags & BCB_reader_active)) {
dbb->dbb_reader_sem.post();
}
2001-05-23 15:26:42 +02:00
const bool async_status =
2008-12-18 11:47:25 +01:00
PIO_read_ahead(dbb, prefetch->prf_start_page, prefetch->prf_io_buffer,
prefetch->prf_page_count, &prefetch->prf_piob, status_vector);
if (!async_status)
{
BufferDesc** next_bdb = prefetch->prf_bdbs;
2009-06-26 06:12:20 +02:00
for (USHORT i = 0; i < prefetch->prf_max_prefetch; i++)
{
if (*next_bdb) {
release_bdb(tdbb, *next_bdb, true, false, false);
}
2001-05-23 15:26:42 +02:00
next_bdb++;
}
prefetch->prf_flags &= ~PRF_active;
}
}
}
static void prefetch_prologue(Prefetch* prefetch, SLONG* start_page)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* p r e f e t c h _ p r o l o g u e
*
**************************************
*
* Functional description
* Search for consecutive pages to be prefetched
* and latch them for I/O.
*
**************************************/
thread_db* tdbb = prefetch->prf_tdbb;
Database* dbb = tdbb->getDatabase();
BufferControl* bcb = dbb->dbb_bcb;
2001-05-23 15:26:42 +02:00
prefetch->prf_start_page = *start_page;
prefetch->prf_page_count = 0;
prefetch->prf_flags |= PRF_active;
BufferDesc** next_bdb = prefetch->prf_bdbs;
2009-01-14 10:19:00 +01:00
for (USHORT i = 0; i < prefetch->prf_max_prefetch; i++)
{
2001-05-23 15:26:42 +02:00
*next_bdb = 0;
if (SBM_clear(bcb->bcb_prefetch, *start_page) &&
(*next_bdb = get_buffer(tdbb, *start_page, LATCH_shared, 0)))
{
if ((*next_bdb)->bdb_flags & BDB_read_pending) {
2001-05-23 15:26:42 +02:00
prefetch->prf_page_count = i + 1;
}
2009-06-26 06:12:20 +02:00
else
{
release_bdb(tdbb, *next_bdb, true, false, false);
2001-05-23 15:26:42 +02:00
*next_bdb = 0;
}
}
next_bdb++;
(*start_page)++;
}
2009-08-23 13:43:25 +02:00
// Optimize non-sequential list prefetching to transfer directly to database buffers.
2001-05-23 15:26:42 +02:00
BufferDesc* bdb;
if (prefetch->prf_page_count == 1 && (bdb = prefetch->prf_bdbs[0])) {
2002-04-29 17:05:11 +02:00
prefetch->prf_io_buffer = reinterpret_cast<char*>(bdb->bdb_buffer);
}
else {
2001-05-23 15:26:42 +02:00
prefetch->prf_io_buffer = prefetch->prf_aligned_buffer;
}
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Reset starting page for next bitmap walk
2001-05-23 15:26:42 +02:00
--(*start_page);
}
#endif // CACHE_READER
2001-05-23 15:26:42 +02:00
static SSHORT related(BufferDesc* low, const BufferDesc* high, SSHORT limit, const ULONG mark)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* r e l a t e d
*
**************************************
*
* Functional description
* See if there are precedence relationships linking two buffers.
* Since precedence graphs can become very complex, limit search for
* precedence relationship by visiting a presribed limit of higher
* precedence blocks.
*
**************************************/
const struct que* base = &low->bdb_higher;
2001-05-23 15:26:42 +02:00
for (const struct que* que_inst = base->que_forward; que_inst != base; que_inst = que_inst->que_forward)
{
if (!--limit) {
2001-05-23 15:26:42 +02:00
return PRE_UNKNOWN;
}
const Precedence* precedence = BLOCK(que_inst, Precedence*, pre_higher);
2009-01-14 10:19:00 +01:00
if (!(precedence->pre_flags & PRE_cleared))
{
if (precedence->pre_hi->bdb_prec_walk_mark == mark)
continue;
if (precedence->pre_hi == high) {
2001-05-23 15:26:42 +02:00
return PRE_EXISTS;
}
if (QUE_NOT_EMPTY(precedence->pre_hi->bdb_higher))
{
limit = related(precedence->pre_hi, high, limit, mark);
if (limit == PRE_EXISTS || limit == PRE_UNKNOWN) {
return limit;
}
}
else
precedence->pre_hi->bdb_prec_walk_mark = mark;
2001-05-23 15:26:42 +02:00
}
}
low->bdb_prec_walk_mark = mark;
2001-05-23 15:26:42 +02:00
return limit;
}
static void release_bdb(thread_db* tdbb,
BufferDesc* bdb,
const bool repost,
const bool downgrade_latch,
const bool rel_mark_latch)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* r e l e a s e _ b d b
*
**************************************
*
* Functional description
* Decrement the use count of a BufferDesc, reposting
2001-05-23 15:26:42 +02:00
* blocking AST if required.
* If rel_mark_latch is true, the value of downgrade_latch is ignored.
2001-05-23 15:26:42 +02:00
*
**************************************/
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
2009-06-06 11:05:20 +02:00
que* const wait_que = &bdb->bdb_waiters;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Releasing a LATCH_mark.
2009-01-14 10:19:00 +01:00
if (rel_mark_latch)
{
if ((bdb->bdb_io != tdbb) || (bdb->bdb_exclusive != tdbb)) {
2009-08-23 13:43:25 +02:00
BUGCHECK(294); // inconsistent LATCH_mark release
}
2001-05-23 15:26:42 +02:00
bdb->bdb_io = 0;
}
2009-01-14 10:19:00 +01:00
else if (downgrade_latch)
{
2009-08-23 13:43:25 +02:00
// Downgrading from an exlusive to a shared latch.
// Only the transition from exclusive to shared is supported.
// If an actual state changed, then we need to check if waiters
// can be granted. Otherwise, there is nothing further to do.
if (bdb->bdb_io == tdbb) {
2009-08-23 13:43:25 +02:00
BUGCHECK(296); // inconsistent latch downgrade call
}
2009-06-26 06:12:20 +02:00
if (bdb->bdb_exclusive == tdbb)
{
2001-05-23 15:26:42 +02:00
bdb->bdb_exclusive = 0;
allocSharedLatch(tdbb, bdb);
2001-05-23 15:26:42 +02:00
}
2009-06-26 06:12:20 +02:00
else
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return;
}
}
2009-01-14 10:19:00 +01:00
else if (bdb->bdb_exclusive == tdbb)
{
2009-08-23 13:43:25 +02:00
// If the exclusive latch is held, then certain code does funny things:
// ail.c does: exclusive - mark - exclusive
// CVC: but this comment was related to our obsolete WAL facility.
2001-05-23 15:26:42 +02:00
--bdb->bdb_use_count;
if (!bdb->bdb_use_count)
2009-08-23 13:43:25 +02:00
{
// All latches are released
2001-05-23 15:26:42 +02:00
bdb->bdb_exclusive = bdb->bdb_io = 0;
2008-12-05 02:20:14 +01:00
while (QUE_NOT_EMPTY(bdb->bdb_shared))
{
SharedLatch* latch = BLOCK(bdb->bdb_shared.que_forward, SharedLatch*, slt_bdb_que);
freeSharedLatch(tdbb, bdb->bdb_dbb->dbb_bcb, latch);
}
2001-05-23 15:26:42 +02:00
}
2009-01-14 10:19:00 +01:00
else if (bdb->bdb_io)
2009-08-23 13:43:25 +02:00
{
// This is a release for an io or an exclusive latch
if (bdb->bdb_io == tdbb)
2009-08-23 13:43:25 +02:00
{
// We have an io latch
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// The BDB_must_write flag causes the system to latch for io, in addition
// to the already owned latches. Make sure not to disturb an already existing
// exclusive latch.
// ail.c does: EX => MARK => SHARED => release => EX => MARK => RELEASE => EX
// CVC: ail.c was related to our obsolete WAL facility.
if (!(bdb->bdb_flags & BDB_marked)) {
2001-05-23 15:26:42 +02:00
bdb->bdb_io = 0;
}
2001-05-23 15:26:42 +02:00
}
2009-06-26 06:12:20 +02:00
else if (bdb->bdb_use_count == 1)
{
2009-08-23 13:43:25 +02:00
// This must be a release for our exclusive latch
2001-05-23 15:26:42 +02:00
bdb->bdb_exclusive = 0;
}
2001-05-23 15:26:42 +02:00
}
2009-06-26 06:12:20 +02:00
else
2009-08-23 13:43:25 +02:00
{
// This is a release for a shared latch
SharedLatch* latch = findSharedLatch(tdbb, bdb);
if (latch) {
freeSharedLatch(tdbb, bdb->bdb_dbb->dbb_bcb, latch);
}
2001-05-23 15:26:42 +02:00
}
}
else
{
2009-08-23 13:43:25 +02:00
// If the exclusive latch is not held, then things have to behave much nicer.
if (bdb->bdb_flags & BDB_marked) {
2009-08-23 13:43:25 +02:00
BUGCHECK(297); // bdb is unexpectedly marked
}
2001-05-23 15:26:42 +02:00
--bdb->bdb_use_count;
if (bdb->bdb_io == tdbb) {
2001-05-23 15:26:42 +02:00
bdb->bdb_io = 0;
}
2009-06-26 06:12:20 +02:00
else
{
SharedLatch* latch = findSharedLatch(tdbb, bdb);
if (!latch) {
2009-08-23 13:43:25 +02:00
BUGCHECK(300); // can't find shared latch
}
freeSharedLatch(tdbb, bdb->bdb_dbb->dbb_bcb, latch);
2001-05-23 15:26:42 +02:00
}
}
bool granted = false;
2001-05-23 15:26:42 +02:00
for (QUE que_inst = wait_que->que_forward; que_inst != wait_que; que_inst = que_inst->que_forward)
{
2009-08-23 13:43:25 +02:00
// Note that this loop assumes that requests for LATCH_io and LATCH_mark
// are queued before LATCH_shared and LATCH_exclusive.
LatchWait* lwt = BLOCK(que_inst, LatchWait*, lwt_waiters);
if (lwt->lwt_flags & LWT_pending)
{
switch (lwt->lwt_latch)
{
case LATCH_exclusive:
2009-06-26 06:12:20 +02:00
if (bdb->bdb_use_count)
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return;
}
2008-01-16 09:31:31 +01:00
++bdb->bdb_use_count;
bdb->bdb_exclusive = lwt->lwt_tdbb;
lwt->lwt_flags &= ~LWT_pending;
lwt->lwt_sem.release();
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2008-01-16 09:31:31 +01:00
return;
2001-05-23 15:26:42 +02:00
case LATCH_io:
2008-01-16 09:31:31 +01:00
if (!bdb->bdb_io)
{
2001-05-23 15:26:42 +02:00
++bdb->bdb_use_count;
bdb->bdb_io = lwt->lwt_tdbb;
lwt->lwt_flags &= ~LWT_pending;
lwt->lwt_sem.release();
granted = true;
2001-05-23 15:26:42 +02:00
}
2008-01-16 09:31:31 +01:00
break;
2001-05-23 15:26:42 +02:00
case LATCH_mark:
if (bdb->bdb_exclusive != lwt->lwt_tdbb) {
2009-08-23 13:43:25 +02:00
BUGCHECK(298); // missing exclusive latch
}
2008-01-16 09:31:31 +01:00
if (!bdb->bdb_io)
{
bdb->bdb_io = lwt->lwt_tdbb;
lwt->lwt_flags &= ~LWT_pending;
lwt->lwt_sem.release();
granted = true;
2001-05-23 15:26:42 +02:00
}
2008-01-16 09:31:31 +01:00
break;
2001-05-23 15:26:42 +02:00
case LATCH_shared:
if (bdb->bdb_exclusive)
{
2009-08-23 13:43:25 +02:00
break; // defensive programming
2008-12-05 02:20:14 +01:00
2009-08-23 13:43:25 +02:00
// correct programming
/*
//LATCH_MUTEX_RELEASE;
return;
*/
2001-05-23 15:26:42 +02:00
}
++bdb->bdb_use_count;
allocSharedLatch(lwt->lwt_tdbb, bdb);
lwt->lwt_flags &= ~LWT_pending;
lwt->lwt_sem.release();
granted = true;
2001-05-23 15:26:42 +02:00
break;
}
2009-06-26 06:12:20 +02:00
if (granted && (bdb->bdb_flags & BDB_read_pending))
{
2009-08-23 13:43:25 +02:00
// Allow only one reader to proceed
2001-05-23 15:26:42 +02:00
break;
}
2001-05-23 15:26:42 +02:00
}
}
2001-05-23 15:26:42 +02:00
2009-06-26 06:12:20 +02:00
if (bdb->bdb_use_count || !repost)
{
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
return;
}
2009-08-23 13:43:25 +02:00
//LATCH_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
if (bdb->bdb_ast_flags & BDB_blocking)
2003-08-13 13:11:12 +02:00
{
2001-05-23 15:26:42 +02:00
PAGE_LOCK_RE_POST(bdb->bdb_lock);
2003-08-13 13:11:12 +02:00
}
2001-05-23 15:26:42 +02:00
}
2009-08-23 13:43:25 +02:00
static void unmark(thread_db* tdbb, WIN* window)
2007-02-06 09:03:43 +01:00
{
/**************************************
*
* u n m a r k
*
**************************************
*
* Functional description
* Unmark a BufferDesc. Called when the update of a page is
* complete and delaying the 'unmarking' could cause
* problems.
*
**************************************/
SET_TDBB(tdbb);
BufferDesc* bdb = window->win_bdb;
BLKCHK(bdb, type_bdb);
2009-01-14 10:19:00 +01:00
if (bdb->bdb_use_count == 1)
{
const bool marked = bdb->bdb_flags & BDB_marked;
2007-02-06 09:03:43 +01:00
bdb->bdb_flags &= ~BDB_marked;
if (marked) {
release_bdb(tdbb, bdb, false, false, true);
2007-02-06 09:03:43 +01:00
}
}
}
static inline bool writeable(BufferDesc* bdb)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* w r i t e a b l e
*
**************************************
*
* Functional description
* See if a buffer is writeable. A buffer is writeable if
* neither it nor any of it's higher precedence cousins are
* marked for write.
2008-12-05 02:20:14 +01:00
* This is the starting point of recursive walk of precedence
2008-02-13 13:57:04 +01:00
* graph. The writeable_mark member is used to mark already seen
* buffers to avoid repeated walk of the same sub-graph.
* Currently this function can't be called from more than one
* thread simultaneously. When SMP will be implemented we must
* take additional care about thread-safety.
2001-05-23 15:26:42 +02:00
*
**************************************/
if (bdb->bdb_flags & BDB_marked) {
2003-12-22 11:00:59 +01:00
return false;
}
2001-05-23 15:26:42 +02:00
2008-02-08 02:25:41 +01:00
BufferControl* bcb = bdb->bdb_dbb->dbb_bcb;
const ULONG mark = get_prec_walk_mark(bcb);
return is_writeable(bdb, mark);
}
2001-05-23 15:26:42 +02:00
static bool is_writeable(BufferDesc* bdb, const ULONG mark)
{
/**************************************
*
* i s _ w r i t e a b l e
*
**************************************
*
* Functional description
* See if a buffer is writeable. A buffer is writeable if
* neither it nor any of it's higher precedence cousins are
* marked for write.
*
**************************************/
2008-12-05 02:20:14 +01:00
// If there are buffers that must be written first, check them, too.
for (const que* queue = bdb->bdb_higher.que_forward;
queue != &bdb->bdb_higher; queue = queue->que_forward)
2003-12-22 11:00:59 +01:00
{
const Precedence* precedence = BLOCK(queue, Precedence*, pre_higher);
if (!(precedence->pre_flags & PRE_cleared))
2003-12-22 11:00:59 +01:00
{
2008-02-08 02:25:41 +01:00
BufferDesc* high = precedence->pre_hi;
2008-12-05 02:20:14 +01:00
if (high->bdb_flags & BDB_marked) {
return false;
}
if (high->bdb_prec_walk_mark != mark)
{
if (QUE_EMPTY(high->bdb_higher))
high->bdb_prec_walk_mark = mark;
else if (!is_writeable(high, mark))
return false;
}
2003-12-22 11:00:59 +01:00
}
2001-05-23 15:26:42 +02:00
}
bdb->bdb_prec_walk_mark = mark;
2003-12-22 11:00:59 +01:00
return true;
2001-05-23 15:26:42 +02:00
}
2008-12-18 11:47:25 +01:00
static int write_buffer(thread_db* tdbb,
BufferDesc* bdb,
2006-05-22 00:07:35 +02:00
const PageNumber page,
2003-12-22 11:00:59 +01:00
const bool write_thru,
2009-06-06 11:05:20 +02:00
ISC_STATUS* const status, const bool write_this_page)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* w r i t e _ b u f f e r
*
**************************************
*
* Functional description
* Write a dirty buffer. This may recurse due to
* precedence problems.
*
* input: write_this_page
2001-05-23 15:26:42 +02:00
* = true if the input page needs to be written
* before returning. (normal case)
* = false if the input page is being written
2001-05-23 15:26:42 +02:00
* because of precedence. Only write
* one page and return so that the caller
* can re-establish the need to write this
* page.
*
2001-05-23 15:26:42 +02:00
* return: 0 = Write failed.
* 1 = Page is written. Page was written by this
* call, or was written by someone else, or the
* cache buffer is already reassigned.
2003-12-22 11:00:59 +01:00
* 2 = Only possible if write_this_page is false.
* This input page is not written. One
2001-05-23 15:26:42 +02:00
* page higher in precedence is written
* though. Probable action: re-establich the
* need to write this page and retry write.
*
**************************************/
SET_TDBB(tdbb);
2009-06-06 11:05:20 +02:00
Database* const dbb = tdbb->getDatabase();
2001-05-23 15:26:42 +02:00
if (latch_bdb(tdbb, LATCH_io, bdb, page, 1) == -1) {
2001-05-23 15:26:42 +02:00
return 1;
}
2001-05-23 15:26:42 +02:00
if ((bdb->bdb_flags & BDB_marked) && !(bdb->bdb_flags & BDB_faked)) {
2009-08-23 13:43:25 +02:00
BUGCHECK(217); // msg 217 buffer marked for update
}
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if (!(bdb->bdb_flags & BDB_dirty) && !(write_thru && bdb->bdb_flags & BDB_db_dirty))
2003-12-22 11:00:59 +01:00
{
clear_precedence(tdbb, bdb);
release_bdb(tdbb, bdb, true, false, false);
2001-05-23 15:26:42 +02:00
return 1;
}
2009-08-23 13:43:25 +02:00
// If there are buffers that must be written first, write them now.
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
while (QUE_NOT_EMPTY(bdb->bdb_higher))
{
2009-08-23 13:43:25 +02:00
BufferControl* const bcb = dbb->dbb_bcb; // Re-initialize in the loop
QUE que_inst = bdb->bdb_higher.que_forward;
Precedence* precedence = BLOCK(que_inst, Precedence*, pre_higher);
if (precedence->pre_flags & PRE_cleared)
{
2001-05-23 15:26:42 +02:00
QUE_DELETE(precedence->pre_higher);
QUE_DELETE(precedence->pre_lower);
precedence->pre_hi = (BufferDesc*) bcb->bcb_free;
2001-05-23 15:26:42 +02:00
bcb->bcb_free = precedence;
}
2009-01-14 10:19:00 +01:00
else
{
BufferDesc* hi_bdb = precedence->pre_hi;
2006-05-22 00:07:35 +02:00
const PageNumber hi_page = hi_bdb->bdb_page;
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
release_bdb(tdbb, bdb, false, false, false);
2008-12-18 11:47:25 +01:00
const int write_status = write_buffer(tdbb, hi_bdb, hi_page, write_thru, status, false);
if (write_status == 0) {
2009-08-23 13:43:25 +02:00
return 0; // return IO error
}
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER
2009-06-26 06:12:20 +02:00
if (!write_this_page)
{
return 2;
2009-08-23 13:43:25 +02:00
// caller wants to re-establish the need for this write after one precedence write
}
2001-05-23 15:26:42 +02:00
#endif
if (latch_bdb(tdbb, LATCH_io, bdb, page, 1) == -1) {
2009-08-23 13:43:25 +02:00
return 1; // cache buffer reassigned, return 'write successful'
}
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_ACQUIRE;
2001-05-23 15:26:42 +02:00
}
}
2009-08-23 13:43:25 +02:00
//PRE_MUTEX_RELEASE;
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER_V2
2009-08-23 13:43:25 +02:00
// Header page I/O is deferred until a dirty page, which was modified by a
// transaction not updated on the header page, needs to be written. Note
// that the header page needs to be written with the target page latched to
// prevent younger transactions from modifying the target page.
2001-05-23 15:26:42 +02:00
2008-12-18 11:47:25 +01:00
if (page != HEADER_PAGE_NUMBER && bdb->bdb_mark_transaction > dbb->dbb_last_header_write)
2003-12-22 11:00:59 +01:00
{
TRA_header_write(tdbb, dbb, bdb->bdb_mark_transaction);
}
2001-05-23 15:26:42 +02:00
#endif
2009-08-23 13:43:25 +02:00
// Unless the buffer has been faked (recently re-allocated), write out the page
2001-05-23 15:26:42 +02:00
2003-12-22 11:00:59 +01:00
bool result = true;
2008-12-18 11:47:25 +01:00
if ((bdb->bdb_flags & BDB_dirty || (write_thru && bdb->bdb_flags & BDB_db_dirty)) &&
!(bdb->bdb_flags & BDB_marked))
2003-12-22 11:00:59 +01:00
{
2009-12-13 14:49:43 +01:00
if ( (result = write_page(tdbb, bdb, status, false)) ) {
clear_precedence(tdbb, bdb);
}
2001-05-23 15:26:42 +02:00
}
else {
clear_precedence(tdbb, bdb);
}
2001-05-23 15:26:42 +02:00
release_bdb(tdbb, bdb, true, false, false);
2001-05-23 15:26:42 +02:00
if (!result) {
2001-05-23 15:26:42 +02:00
return 0;
}
2008-01-16 09:31:31 +01:00
2001-05-23 15:26:42 +02:00
#ifdef SUPERSERVER
if (!write_this_page) {
2001-05-23 15:26:42 +02:00
return 2;
}
2001-05-23 15:26:42 +02:00
#endif
2008-01-16 09:31:31 +01:00
return 1;
2001-05-23 15:26:42 +02:00
}
2009-12-13 14:49:43 +01:00
static bool write_page(thread_db* tdbb, BufferDesc* bdb, ISC_STATUS* const status, const bool inAst)
2001-05-23 15:26:42 +02:00
{
/**************************************
*
* w r i t e _ p a g e
*
**************************************
*
* Functional description
* Do actions required when writing a database page,
* including journaling, shadowing.
*
**************************************/
2009-06-26 06:12:20 +02:00
if (bdb->bdb_flags & BDB_not_valid)
{
ERR_build_status(status, Arg::Gds(isc_buf_invalid) << Arg::Num(bdb->bdb_page.getPageNum()));
2003-12-22 11:00:59 +01:00
return false;
2001-05-23 15:26:42 +02:00
}
2009-06-07 12:16:41 +02:00
Database* const dbb = bdb->bdb_dbb;
2009-06-06 11:05:20 +02:00
pag* const page = bdb->bdb_buffer;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// Before writing db header page, make sure that
// the next_transaction > oldest_active transaction
2009-01-14 10:19:00 +01:00
if (bdb->bdb_page == HEADER_PAGE_NUMBER)
{
2009-06-06 11:05:20 +02:00
const header_page* header = (header_page*) page;
if (header->hdr_next_transaction)
{
if (header->hdr_oldest_active > header->hdr_next_transaction) {
2009-08-23 13:43:25 +02:00
BUGCHECK(266); // next transaction older than oldest active
}
2001-05-23 15:26:42 +02:00
if (header->hdr_oldest_transaction > header->hdr_next_transaction) {
2009-08-23 13:43:25 +02:00
BUGCHECK(267); // next transaction older than oldest transaction
}
2001-05-23 15:26:42 +02:00
}
}
page->pag_generation++;
2009-06-07 12:16:41 +02:00
bool result = true;
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
//if (!dbb->dbb_wal || write_thru) becomes
//if (true || write_thru) then finally if (true)
// I won't wipe out the if() itself to allow my changes be verified easily by others
2009-01-14 10:19:00 +01:00
if (true)
{
tdbb->bumpStats(RuntimeStatistics::PAGE_WRITES);
2001-05-23 15:26:42 +02:00
2009-08-23 13:43:25 +02:00
// write out page to main database file, and to any
// shadows, making a special case of the header page
BackupManager* bm = dbb->dbb_backup_manager;
const int backup_state = bm->getState();
2001-05-23 15:26:42 +02:00
2009-01-14 10:19:00 +01:00
if (bdb->bdb_page.getPageNum() >= 0)
{
fb_assert(backup_state != nbak_state_unknown);
page->pag_pageno = bdb->bdb_page.getPageNum();
2005-07-20 01:27:38 +02:00
#ifdef NBAK_DEBUG
// We cannot call normal trace functions here as they are signal-unsafe
// "Write page=%d, dir=%d, diff=%d, scn=%d"
char buffer[1000], *ptr = buffer;
2009-05-02 15:00:09 +02:00
strcpy(ptr, "NBAK, Write page ");
2005-07-20 01:27:38 +02:00
ptr += strlen(ptr);
2008-01-14 17:22:43 +01:00
gds__ulstr(ptr, bdb->bdb_page.getPageNum(), 0, 0);
2005-07-20 01:27:38 +02:00
ptr += strlen(ptr);
strcpy(ptr, ", backup_state=");
2005-07-20 01:27:38 +02:00
ptr += strlen(ptr);
gds__ulstr(ptr, backup_state, 0, 0);
2005-07-20 01:27:38 +02:00
ptr += strlen(ptr);
strcpy(ptr, ", diff=");
ptr += strlen(ptr);
gds__ulstr(ptr, bdb->bdb_difference_page, 0, 0);
ptr += strlen(ptr);
strcpy(ptr, ", scn=");
ptr += strlen(ptr);
gds__ulstr(ptr, bdb->bdb_buffer->pag_scn, 0, 0);
ptr += strlen(ptr);
gds__trace(buffer);
#endif
2008-12-05 02:20:14 +01:00
PageSpace* pageSpace =
dbb->dbb_page_manager.findPageSpace(bdb->bdb_page.getPageSpaceID());
fb_assert(pageSpace);
const bool isTempPage = pageSpace->isTemporary();
2005-07-20 01:27:38 +02:00
if (!isTempPage && (backup_state == nbak_state_stalled ||
2009-04-01 12:49:54 +02:00
(backup_state == nbak_state_merge &&
bdb->bdb_difference_page && !(bdb->bdb_flags & BDB_merge))))
{
2008-01-16 09:31:31 +01:00
const bool res = dbb->dbb_backup_manager->writeDifference(status,
2008-12-18 11:47:25 +01:00
bdb->bdb_difference_page, bdb->bdb_buffer);
2008-01-16 09:31:31 +01:00
2008-12-05 02:20:14 +01:00
if (!res)
{
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_io_error;
dbb->dbb_flags |= DBB_suspend_bgio;
2003-12-22 11:00:59 +01:00
return false;
2001-05-23 15:26:42 +02:00
}
}
2009-01-14 10:19:00 +01:00
if (!isTempPage && backup_state == nbak_state_stalled)
{
// We finished. Adjust transaction accounting and get ready for exit
2006-05-22 00:07:35 +02:00
if (bdb->bdb_page == HEADER_PAGE_NUMBER) {
dbb->dbb_last_header_write = ((header_page*) page)->hdr_next_transaction;
}
2003-12-22 11:00:59 +01:00
}
2009-01-14 10:19:00 +01:00
else
{
// We need to write our pages to main database files
2008-01-16 09:31:31 +01:00
2006-05-22 00:07:35 +02:00
jrd_file* file = pageSpace->file;
2009-01-14 10:19:00 +01:00
while (!PIO_write(file, bdb, page, status))
{
2008-01-16 09:31:31 +01:00
if (isTempPage || !CCH_rollover_to_shadow(tdbb, dbb, file, inAst))
2006-05-22 00:07:35 +02:00
{
bdb->bdb_flags |= BDB_io_error;
dbb->dbb_flags |= DBB_suspend_bgio;
2003-12-22 11:00:59 +01:00
return false;
}
2008-01-16 09:31:31 +01:00
2006-05-22 00:07:35 +02:00
file = pageSpace->file;
}
2001-05-23 15:26:42 +02:00
2006-05-22 00:07:35 +02:00
if (bdb->bdb_page == HEADER_PAGE_NUMBER) {
dbb->dbb_last_header_write = ((header_page*) page)->hdr_next_transaction;
}
2006-05-22 00:07:35 +02:00
if (dbb->dbb_shadow && !isTempPage) {
2009-12-14 12:33:13 +01:00
result = CCH_write_all_shadows(tdbb, 0, bdb, status, inAst);
2003-12-22 11:00:59 +01:00
}
}
2001-05-23 15:26:42 +02:00
}
#ifdef SUPERSERVER
2009-01-14 10:19:00 +01:00
if (result)
{
2001-05-23 15:26:42 +02:00
#ifdef CACHE_WRITER
if (bdb->bdb_flags & BDB_checkpoint) {
2001-05-23 15:26:42 +02:00
--dbb->dbb_bcb->bcb_checkpoint;
}
2001-05-23 15:26:42 +02:00
#endif
bdb->bdb_flags &= ~(BDB_db_dirty | BDB_checkpoint);
}
#endif
}
if (!result)
{
2009-08-23 13:43:25 +02:00
// If there was a write error then idle background threads
// so that they don't spin trying to write these pages. This
// usually results from device full errors which can be fixed
// by someone freeing disk space.
2001-05-23 15:26:42 +02:00
bdb->bdb_flags |= BDB_io_error;
dbb->dbb_flags |= DBB_suspend_bgio;
}
2009-01-14 10:19:00 +01:00
else
{
2009-08-23 13:43:25 +02:00
// clear the dirty bit vector, since the buffer is now
// clean regardless of which transactions have modified it
2001-05-23 15:26:42 +02:00
2009-04-01 12:49:54 +02:00
// Destination difference page number is only valid between MARK and
// write_page so clean it now to avoid confusion
bdb->bdb_difference_page = 0;
2001-05-23 15:26:42 +02:00
bdb->bdb_transactions = bdb->bdb_mark_transaction = 0;
if (!(dbb->dbb_bcb->bcb_flags & BCB_keep_pages)) {
removeDirty(dbb->dbb_bcb, bdb);
}
bdb->bdb_flags &= ~(BDB_must_write | BDB_system_dirty | BDB_merge);
clear_dirty_flag(tdbb, bdb);
if (bdb->bdb_flags & BDB_io_error)
{
2009-08-23 13:43:25 +02:00
// If a write error has cleared, signal background threads
// to resume their regular duties. If someone has freed up
// disk space these errors will spontaneously go away.
2001-05-23 15:26:42 +02:00
bdb->bdb_flags &= ~BDB_io_error;
dbb->dbb_flags &= ~DBB_suspend_bgio;
}
}
return result;
}
static void set_dirty_flag(thread_db* tdbb, BufferDesc* bdb)
{
if ( !(bdb->bdb_flags & BDB_dirty) )
{
2009-04-01 12:49:54 +02:00
NBAK_TRACE(("lock state for dirty page %d:%06d",
bdb->bdb_page.getPageSpaceID(), bdb->bdb_page.getPageNum()));
bdb->bdb_flags |= BDB_dirty;
tdbb->getDatabase()->dbb_backup_manager->lockDirtyPage(tdbb);
}
}
static void clear_dirty_flag(thread_db* tdbb, BufferDesc* bdb)
{
if (bdb->bdb_flags & BDB_dirty)
{
bdb->bdb_flags &= ~BDB_dirty;
2009-04-01 12:49:54 +02:00
NBAK_TRACE(("unlock state for dirty page %d:%06d",
bdb->bdb_page.getPageSpaceID(), bdb->bdb_page.getPageNum()));
tdbb->getDatabase()->dbb_backup_manager->unlockDirtyPage(tdbb);
}
}