Files
cpython-source-deps/txn/txn_region.c
2017-09-04 13:40:25 -05:00

475 lines
11 KiB
C

/*-
* See the file LICENSE for redistribution information.
*
* Copyright (c) 1996,2008 Oracle. All rights reserved.
*
* $Id: txn_region.c 63573 2008-05-23 21:43:21Z trent.nelson $
*/
#include "db_config.h"
#include "db_int.h"
#include "dbinc/log.h"
#include "dbinc/txn.h"
/* Forward declarations for the helpers that are private to this file. */
static int __txn_init __P((ENV *, DB_TXNMGR *));
static size_t __txn_region_size __P((ENV *));
/*
* __txn_open --
* Open a transaction region.
*
* PUBLIC: int __txn_open __P((ENV *, int));
*/
int
__txn_open(env, create_ok)
ENV *env;
int create_ok;
{
DB_TXNMGR *mgr;
int ret;
/* Create/initialize the transaction manager structure. */
if ((ret = __os_calloc(env, 1, sizeof(DB_TXNMGR), &mgr)) != 0)
return (ret);
TAILQ_INIT(&mgr->txn_chain);
mgr->env = env;
/* Join/create the txn region. */
mgr->reginfo.env = env;
mgr->reginfo.type = REGION_TYPE_TXN;
mgr->reginfo.id = INVALID_REGION_ID;
mgr->reginfo.flags = REGION_JOIN_OK;
if (create_ok)
F_SET(&mgr->reginfo, REGION_CREATE_OK);
if ((ret = __env_region_attach(env,
&mgr->reginfo, __txn_region_size(env))) != 0)
goto err;
/* If we created the region, initialize it. */
if (F_ISSET(&mgr->reginfo, REGION_CREATE))
if ((ret = __txn_init(env, mgr)) != 0)
goto err;
/* Set the local addresses. */
mgr->reginfo.primary =
R_ADDR(&mgr->reginfo, mgr->reginfo.rp->primary);
/* If threaded, acquire a mutex to protect the active TXN list. */
if ((ret = __mutex_alloc(
env, MTX_TXN_ACTIVE, DB_MUTEX_PROCESS_ONLY, &mgr->mutex)) != 0)
goto err;
env->tx_handle = mgr;
return (0);
err: env->tx_handle = NULL;
if (mgr->reginfo.addr != NULL)
(void)__env_region_detach(env, &mgr->reginfo, 0);
(void)__mutex_free(env, &mgr->mutex);
__os_free(env, mgr);
return (ret);
}
/*
* __txn_init --
* Initialize a transaction region in shared memory.
*/
static int
__txn_init(env, mgr)
ENV *env;
DB_TXNMGR *mgr;
{
DB_ENV *dbenv;
DB_LSN last_ckp;
DB_TXNREGION *region;
int ret;
dbenv = env->dbenv;
/*
* Find the last checkpoint in the log.
*/
ZERO_LSN(last_ckp);
if (LOGGING_ON(env)) {
/*
* The log system has already walked through the last
* file. Get the LSN of a checkpoint it may have found.
*/
if ((ret = __log_get_cached_ckp_lsn(env, &last_ckp)) != 0)
return (ret);
/*
* If that didn't work, look backwards from the beginning of
* the last log file until we find the last checkpoint.
*/
if (IS_ZERO_LSN(last_ckp) &&
(ret = __txn_findlastckp(env, &last_ckp, NULL)) != 0)
return (ret);
}
if ((ret = __env_alloc(&mgr->reginfo,
sizeof(DB_TXNREGION), &mgr->reginfo.primary)) != 0) {
__db_errx(env,
"Unable to allocate memory for the transaction region");
return (ret);
}
mgr->reginfo.rp->primary =
R_OFFSET(&mgr->reginfo, mgr->reginfo.primary);
region = mgr->reginfo.primary;
memset(region, 0, sizeof(*region));
if ((ret = __mutex_alloc(
env, MTX_TXN_REGION, 0, &region->mtx_region)) != 0)
return (ret);
region->maxtxns = dbenv->tx_max;
region->last_txnid = TXN_MINIMUM;
region->cur_maxid = TXN_MAXIMUM;
if ((ret = __mutex_alloc(
env, MTX_TXN_CHKPT, 0, &region->mtx_ckp)) != 0)
return (ret);
region->last_ckp = last_ckp;
region->time_ckp = time(NULL);
memset(&region->stat, 0, sizeof(region->stat));
#ifdef HAVE_STATISTICS
region->stat.st_maxtxns = region->maxtxns;
#endif
SH_TAILQ_INIT(&region->active_txn);
SH_TAILQ_INIT(&region->mvcc_txn);
return (ret);
}
/*
 * __txn_findlastckp --
 *	Find the last checkpoint in the log, walking backwards from the
 *	max_lsn given or the beginning of the last log file.  (The
 *	log system looked through the last log file when it started up.)
 *
 *	*lsnp is zeroed on entry and is only overwritten when a checkpoint
 *	record is found, so a zero LSN on a successful return means "no
 *	checkpoint".  Returns 0 on success (whether or not a checkpoint was
 *	found) or the error from the log cursor, including an error from
 *	closing it.
 *
 * PUBLIC: int __txn_findlastckp __P((ENV *, DB_LSN *, DB_LSN *));
 */
int
__txn_findlastckp(env, lsnp, max_lsn)
	ENV *env;
	DB_LSN *lsnp;
	DB_LSN *max_lsn;
{
	DBT dbt;
	DB_LOGC *logc;
	DB_LSN lsn;
	int ret, t_ret;
	u_int32_t rectype;

	ZERO_LSN(*lsnp);

	if ((ret = __log_cursor(env, &logc)) != 0)
		return (ret);

	/* Get the last LSN. */
	memset(&dbt, 0, sizeof(dbt));
	if (max_lsn != NULL) {
		lsn = *max_lsn;
		if ((ret = __logc_get(logc, &lsn, &dbt, DB_SET)) != 0)
			goto err;
	} else {
		if ((ret = __logc_get(logc, &lsn, &dbt, DB_LAST)) != 0)
			goto err;
		/*
		 * Twiddle the last LSN so it points to the beginning of the
		 * last file; we know there's no checkpoint after that, since
		 * the log system already looked there.
		 */
		lsn.offset = 0;
	}

	/* Read backwards, looking for checkpoints. */
	while ((ret = __logc_get(logc, &lsn, &dbt, DB_PREV)) == 0) {
		/* Too short to carry a record type; skip it. */
		if (dbt.size < sizeof(u_int32_t))
			continue;
		/* The record type is the leading u_int32_t of the record. */
		memcpy(&rectype, dbt.data, sizeof(u_int32_t));
		if (rectype == DB___txn_ckp) {
			*lsnp = lsn;
			break;
		}
	}

err:	/*
	 * Not finding a checkpoint is not an error; there may not exist
	 * one in the log.  Clear DB_NOTFOUND before closing the cursor so
	 * that a failure to close is still reported to the caller instead
	 * of being hidden behind the "not found" status.
	 */
	if (ret == DB_NOTFOUND)
		ret = 0;
	if ((t_ret = __logc_close(logc)) != 0 && ret == 0)
		ret = t_ret;

	return (ret);
}
/*
 * __txn_env_refresh --
 *	Tear down the transaction subsystem on a close or failed open:
 *	resolve any transactions still on the manager's chain, free the
 *	manager's mutex, detach from the region and free the manager.
 *
 *	Returns the first error encountered, EINVAL if unprepared
 *	transactions had to be aborted, or 0.
 *
 * PUBLIC: int __txn_env_refresh __P((ENV *));
 */
int
__txn_env_refresh(env)
	ENV *env;
{
	DB_TXN *txn;
	DB_TXNMGR *mgr;
	u_int32_t txnid;
	int aborted, ret, t_ret;

	mgr = env->tx_handle;
	ret = 0;
	aborted = 0;

	/*
	 * This function can only be called once per process (i.e., not
	 * once per thread), so no synchronization is required.
	 *
	 * Closing with active transactions most likely means the caller
	 * is doing something wrong.  Prepared transactions are simply
	 * discarded.  Anything else we try to abort, although the abort
	 * may well fail because recovery won't find open files; if an
	 * abort does fail we panic the environment, since recovery must
	 * be run to get back to a known state.
	 */
	while ((txn = TAILQ_FIRST(&mgr->txn_chain)) != NULL) {
		/* Remember the ID for error messages. */
		txnid = txn->txnid;

		if (((TXN_DETAIL *)txn->td)->status == TXN_PREPARED) {
			/* Prepared transactions are OK. */
			if ((ret = __txn_discard_int(txn, 0)) != 0) {
				__db_err(env, ret,
				    "unable to discard txn %#lx",
				    (u_long)txnid);
				break;
			}
		} else {
			aborted = 1;
			if ((t_ret = __txn_abort(txn)) != 0) {
				__db_err(env, t_ret,
				    "unable to abort transaction %#lx",
				    (u_long)txnid);
				ret = __env_panic(env, t_ret);
				break;
			}
		}
	}

	if (aborted) {
		__db_errx(env,
	"Error: closing the transaction region with active transactions");
		if (ret == 0)
			ret = EINVAL;
	}

	/* Discard the per-thread lock; keep the first error seen. */
	t_ret = __mutex_free(env, &mgr->mutex);
	if (t_ret != 0 && ret == 0)
		ret = t_ret;

	/* Detach from the region. */
	t_ret = __env_region_detach(env, &mgr->reginfo, 0);
	if (t_ret != 0 && ret == 0)
		ret = t_ret;

	__os_free(env, mgr);
	env->tx_handle = NULL;

	return (ret);
}
/*
 * __txn_region_mutex_count --
 *	Report how many mutexes the txn region will need.
 *
 * PUBLIC: u_int32_t __txn_region_mutex_count __P((ENV *));
 */
u_int32_t
__txn_region_mutex_count(env)
	ENV *env;
{
	u_int32_t fixed, per_txn;

	/* One MVCC mutex for each TXN_DETAIL structure. */
	per_txn = env->dbenv->tx_max;

	/* One for the DB_TXNMGR structure, two for the DB_TXNREGION. */
	fixed = 1 + 2;

	return (per_txn + fixed);
}
/*
 * __txn_region_size --
 *	Compute how many bytes the txn region should be given.
 */
static size_t
__txn_region_size(env)
	ENV *env;
{
	size_t per_txn, total;

	/*
	 * Each of the tx_max transactions needs a detail structure, one
	 * chunk of overhead from the underlying shared region allocator,
	 * and room for a name, at an average of 20 bytes each.
	 */
	per_txn = sizeof(TXN_DETAIL) + __env_alloc_overhead() + 20;

	/*
	 * The region holds the primary transaction region structure, the
	 * per-transaction space, and 10KB for safety.
	 */
	total = sizeof(DB_TXNREGION);
	total += env->dbenv->tx_max * per_txn;
	total += 10 * 1024;

	return (total);
}
/*
 * __txn_id_set --
 *	Set the current transaction ID and current maximum unused ID (for
 *	testing purposes only).
 *
 *	Both values must be at least TXN_MINIMUM.  Every offending value is
 *	reported and EINVAL is returned; in that case the region is left
 *	unmodified, so a rejected call cannot leave out-of-range IDs behind.
 *	Returns 0 after storing both values.
 *
 * PUBLIC: int __txn_id_set __P((ENV *, u_int32_t, u_int32_t));
 */
int
__txn_id_set(env, cur_txnid, max_txnid)
	ENV *env;
	u_int32_t cur_txnid, max_txnid;
{
	DB_TXNMGR *mgr;
	DB_TXNREGION *region;
	int ret;

	ENV_REQUIRES_CONFIG(env, env->tx_handle, "txn_id_set", DB_INIT_TXN);

	/* Validate both arguments before touching the shared region. */
	ret = 0;
	if (cur_txnid < TXN_MINIMUM) {
		__db_errx(env, "Current ID value %lu below minimum",
		    (u_long)cur_txnid);
		ret = EINVAL;
	}
	if (max_txnid < TXN_MINIMUM) {
		__db_errx(env, "Maximum ID value %lu below minimum",
		    (u_long)max_txnid);
		ret = EINVAL;
	}
	if (ret != 0)
		return (ret);

	mgr = env->tx_handle;
	region = mgr->reginfo.primary;
	region->last_txnid = cur_txnid;
	region->cur_maxid = max_txnid;

	return (0);
}
/*
* __txn_oldest_reader --
* Find the oldest "read LSN" of any active transaction'
* MVCC changes older than this can safely be discarded from the cache.
*
* PUBLIC: int __txn_oldest_reader __P((ENV *, DB_LSN *));
*/
int
__txn_oldest_reader(env, lsnp)
ENV *env;
DB_LSN *lsnp;
{
DB_LSN old_lsn;
DB_TXNMGR *mgr;
DB_TXNREGION *region;
TXN_DETAIL *td;
int ret;
if ((mgr = env->tx_handle) == NULL)
return (0);
region = mgr->reginfo.primary;
if ((ret = __log_current_lsn(env, &old_lsn, NULL, NULL)) != 0)
return (ret);
TXN_SYSTEM_LOCK(env);
SH_TAILQ_FOREACH(td, &region->active_txn, links, __txn_detail)
if (LOG_COMPARE(&td->read_lsn, &old_lsn) < 0)
old_lsn = td->read_lsn;
TXN_SYSTEM_UNLOCK(env);
DB_ASSERT(env, LOG_COMPARE(&old_lsn, lsnp) >= 0);
*lsnp = old_lsn;
return (0);
}
/*
 * __txn_add_buffer --
 *	Add to the count of buffers created by the given transaction.
 *
 *	Increments td->mvcc_ref by one while holding td->mvcc_mtx.  td must
 *	not be NULL.  Always returns 0.
 *
 * PUBLIC: int __txn_add_buffer __P((ENV *, TXN_DETAIL *));
 */
int
__txn_add_buffer(env, td)
ENV *env;
TXN_DETAIL *td;
{
DB_ASSERT(env, td != NULL);
/* The reference count is only changed under the detail's MVCC mutex. */
MUTEX_LOCK(env, td->mvcc_mtx);
/* Assert that the increment below cannot wrap the counter. */
DB_ASSERT(env, td->mvcc_ref < UINT32_MAX);
++td->mvcc_ref;
MUTEX_UNLOCK(env, td->mvcc_mtx);
/*
 * NOTE(review): presumably silences "unused parameter" warnings in
 * builds where the macros above expand to nothing.  Keep this after
 * the last real use of env -- TODO confirm against the definition of
 * COMPQUIET before moving it.
 */
COMPQUIET(env, NULL);
return (0);
}
/*
 * __txn_remove_buffer --
 *	Remove a buffer from a transaction -- free the transaction if necessary.
 *
 *	Drops one reference from td->mvcc_ref under td->mvcc_mtx.  If that
 *	was the last reference and the transaction's status is TXN_COMMITTED
 *	or TXN_ABORTED, the detail's MVCC mutex is freed, td is unlinked from
 *	the region's mvcc_txn list and its memory is returned to the region.
 *
 *	hash_mtx is unlocked before that cleanup and locked again afterwards;
 *	presumably the caller holds it on entry and expects to still hold it
 *	on return -- verify against callers.
 *
 *	Returns 0, or the result of __mutex_free() when the detail is freed.
 *
 * PUBLIC: int __txn_remove_buffer __P((ENV *, TXN_DETAIL *, db_mutex_t));
 */
int
__txn_remove_buffer(env, td, hash_mtx)
ENV *env;
TXN_DETAIL *td;
db_mutex_t hash_mtx;
{
DB_TXNMGR *mgr;
DB_TXNREGION *region;
int need_free, ret;
DB_ASSERT(env, td != NULL);
ret = 0;
mgr = env->tx_handle;
region = mgr->reginfo.primary;
/* Decrement the reference count under the detail's MVCC mutex. */
MUTEX_LOCK(env, td->mvcc_mtx);
DB_ASSERT(env, td->mvcc_ref > 0);
/* need_free is set only when this call dropped the last reference. */
need_free = (--td->mvcc_ref == 0);
MUTEX_UNLOCK(env, td->mvcc_mtx);
/*
 * Only a detail whose transaction has already committed or aborted is
 * torn down here; in any other state it is left in place.
 */
if (need_free &&
(td->status == TXN_COMMITTED || td->status == TXN_ABORTED)) {
/* Release hash_mtx for the duration of the cleanup below. */
MUTEX_UNLOCK(env, hash_mtx);
ret = __mutex_free(env, &td->mvcc_mtx);
td->mvcc_mtx = MUTEX_INVALID;
/* List removal and the free both happen under the txn system lock. */
TXN_SYSTEM_LOCK(env);
SH_TAILQ_REMOVE(&region->mvcc_txn, td, links, __txn_detail);
#ifdef HAVE_STATISTICS
--region->stat.st_nsnapshot;
#endif
__env_alloc_free(&mgr->reginfo, td);
TXN_SYSTEM_UNLOCK(env);
/* Re-acquire hash_mtx before returning to the caller. */
MUTEX_LOCK(env, hash_mtx);
}
return (ret);
}