db_join.c

来自「这是linux下运行的mysql软件包,可用于linux 下安装 php + m」· C语言代码 · 共 823 行 · 第 1/2 页
823 行
/* * See the file LICENSE for redistribution information. * * Copyright (c) 1998-2002 *	Sleepycat Software.  All rights reserved. */#include "db_config.h"#ifndef lintstatic const char revid[] = "$Id: db_join.c,v 11.55 2002/08/08 03:57:47 bostic Exp $";#endif /* not lint */#ifndef NO_SYSTEM_INCLUDES#include <sys/types.h>#include <stdlib.h>#include <string.h>#endif#include "db_int.h"#include "dbinc/db_page.h"#include "dbinc/db_join.h"#include "dbinc/btree.h"static int __db_join_close __P((DBC *));static int __db_join_cmp __P((const void *, const void *));static int __db_join_del __P((DBC *, u_int32_t));static int __db_join_get __P((DBC *, DBT *, DBT *, u_int32_t));static int __db_join_getnext __P((DBC *, DBT *, DBT *, u_int32_t, u_int32_t));static int __db_join_primget __P((DB *,    DB_TXN *, u_int32_t, DBT *, DBT *, u_int32_t));static int __db_join_put __P((DBC *, DBT *, DBT *, u_int32_t));/* * Check to see if the Nth secondary cursor of join cursor jc is pointing * to a sorted duplicate set. */#define	SORTED_SET(jc, n)   ((jc)->j_curslist[(n)]->dbp->dup_compare != NULL)/* * This is the duplicate-assisted join functionality.  Right now we're * going to write it such that we return one item at a time, although * I think we may need to optimize it to return them all at once. * It should be easier to get it working this way, and I believe that * changing it should be fairly straightforward. * * We optimize the join by sorting cursors from smallest to largest * cardinality.  In most cases, this is indeed optimal.  However, if * a cursor with large cardinality has very few data in common with the * first cursor, it is possible that the join will be made faster by * putting it earlier in the cursor list.  Since we have no way to detect * cases like this, we simply provide a flag, DB_JOIN_NOSORT, which retains * the sort order specified by the caller, who may know more about the * structure of the data. * * The first cursor moves sequentially through the duplicate set while * the others search explicitly for the duplicate in question. * *//* * __db_join -- *	This is the interface to the duplicate-assisted join functionality. * In the same way that cursors mark a position in a database, a cursor * can mark a position in a join.  While most cursors are created by the * cursor method of a DB, join cursors are created through an explicit * call to DB->join. * * The curslist is an array of existing, intialized cursors and primary * is the DB of the primary file.  The data item that joins all the * cursors in the curslist is used as the key into the primary and that * key and data are returned.  When no more items are left in the join * set, the  c_next operation off the join cursor will return DB_NOTFOUND. * * PUBLIC: int __db_join __P((DB *, DBC **, DBC **, u_int32_t)); */int__db_join(primary, curslist, dbcp, flags)	DB *primary;	DBC **curslist, **dbcp;	u_int32_t flags;{	DB_ENV *dbenv;	DBC *dbc;	JOIN_CURSOR *jc;	int ret;	u_int32_t i;	size_t ncurs, nslots;	COMPQUIET(nslots, 0);	PANIC_CHECK(primary->dbenv);	if ((ret = __db_joinchk(primary, curslist, flags)) != 0)		return (ret);	dbc = NULL;	jc = NULL;	dbenv = primary->dbenv;	if ((ret = __os_calloc(dbenv, 1, sizeof(DBC), &dbc)) != 0)		goto err;	if ((ret = __os_calloc(dbenv,	    1, sizeof(JOIN_CURSOR), &jc)) != 0)		goto err;	if ((ret = __os_malloc(dbenv, 256, &jc->j_key.data)) != 0)		goto err;	jc->j_key.ulen = 256;	F_SET(&jc->j_key, DB_DBT_USERMEM);	F_SET(&jc->j_rdata, DB_DBT_REALLOC);	for (jc->j_curslist = curslist;	    *jc->j_curslist != NULL; jc->j_curslist++)		;	/*	 * The number of cursor slots we allocate is one greater than	 * the number of cursors involved in the join, because the	 * list is NULL-terminated.	 */	ncurs = jc->j_curslist - curslist;	nslots = ncurs + 1;	/*	 * !!! -- A note on the various lists hanging off jc.	 *	 * j_curslist is the initial NULL-terminated list of cursors passed	 * into __db_join.  The original cursors are not modified; pristine	 * copies are required because, in databases with unsorted dups, we	 * must reset all of the secondary cursors after the first each	 * time the first one is incremented, or else we will lose data	 * which happen to be sorted differently in two different cursors.	 *	 * j_workcurs is where we put those copies that we're planning to	 * work with.  They're lazily c_dup'ed from j_curslist as we need	 * them, and closed when the join cursor is closed or when we need	 * to reset them to their original values (in which case we just	 * c_dup afresh).	 *	 * j_fdupcurs is an array of cursors which point to the first	 * duplicate in the duplicate set that contains the data value	 * we're currently interested in.  We need this to make	 * __db_join_get correctly return duplicate duplicates;  i.e., if a	 * given data value occurs twice in the set belonging to cursor #2,	 * and thrice in the set belonging to cursor #3, and once in all	 * the other cursors, successive calls to __db_join_get need to	 * return that data item six times.  To make this happen, each time	 * cursor N is allowed to advance to a new datum, all cursors M	 * such that M > N have to be reset to the first duplicate with	 * that datum, so __db_join_get will return all the dup-dups again.	 * We could just reset them to the original cursor from j_curslist,	 * but that would be a bit slower in the unsorted case and a LOT	 * slower in the sorted one.	 *	 * j_exhausted is a list of boolean values which represent	 * whether or not their corresponding cursors are "exhausted",	 * i.e. whether the datum under the corresponding cursor has	 * been found not to exist in any unreturned combinations of	 * later secondary cursors, in which case they are ready to be	 * incremented.	 */	/* We don't want to free regions whose callocs have failed. */	jc->j_curslist = NULL;	jc->j_workcurs = NULL;	jc->j_fdupcurs = NULL;	jc->j_exhausted = NULL;	if ((ret = __os_calloc(dbenv, nslots, sizeof(DBC *),	    &jc->j_curslist)) != 0)		goto err;	if ((ret = __os_calloc(dbenv, nslots, sizeof(DBC *),	    &jc->j_workcurs)) != 0)		goto err;	if ((ret = __os_calloc(dbenv, nslots, sizeof(DBC *),	    &jc->j_fdupcurs)) != 0)		goto err;	if ((ret = __os_calloc(dbenv, nslots, sizeof(u_int8_t),	    &jc->j_exhausted)) != 0)		goto err;	for (i = 0; curslist[i] != NULL; i++) {		jc->j_curslist[i] = curslist[i];		jc->j_workcurs[i] = NULL;		jc->j_fdupcurs[i] = NULL;		jc->j_exhausted[i] = 0;	}	jc->j_ncurs = (u_int32_t)ncurs;	/*	 * If DB_JOIN_NOSORT is not set, optimize secondary cursors by	 * sorting in order of increasing cardinality.	 */	if (!LF_ISSET(DB_JOIN_NOSORT))		qsort(jc->j_curslist, ncurs, sizeof(DBC *), __db_join_cmp);	/*	 * We never need to reset the 0th cursor, so there's no	 * solid reason to use workcurs[0] rather than curslist[0] in	 * join_get.  Nonetheless, it feels cleaner to do it for symmetry,	 * and this is the most logical place to copy it.	 *	 * !!!	 * There's no need to close the new cursor if we goto err only	 * because this is the last thing that can fail.  Modifier of this	 * function beware!	 */	if ((ret = jc->j_curslist[0]->c_dup(jc->j_curslist[0], jc->j_workcurs,	    DB_POSITIONI)) != 0)		goto err;	dbc->c_close = __db_join_close;	dbc->c_del = __db_join_del;	dbc->c_get = __db_join_get;	dbc->c_put = __db_join_put;	dbc->internal = (DBC_INTERNAL *) jc;	dbc->dbp = primary;	jc->j_primary = primary;	*dbcp = dbc;	MUTEX_THREAD_LOCK(dbenv, primary->mutexp);	TAILQ_INSERT_TAIL(&primary->join_queue, dbc, links);	MUTEX_THREAD_UNLOCK(dbenv, primary->mutexp);	return (0);err:	if (jc != NULL) {		if (jc->j_curslist != NULL)			__os_free(dbenv, jc->j_curslist);		if (jc->j_workcurs != NULL) {			if (jc->j_workcurs[0] != NULL)				__os_free(dbenv, jc->j_workcurs[0]);			__os_free(dbenv, jc->j_workcurs);		}		if (jc->j_fdupcurs != NULL)			__os_free(dbenv, jc->j_fdupcurs);		if (jc->j_exhausted != NULL)			__os_free(dbenv, jc->j_exhausted);		__os_free(dbenv, jc);	}	if (dbc != NULL)		__os_free(dbenv, dbc);	return (ret);}static int__db_join_put(dbc, key, data, flags)	DBC *dbc;	DBT *key;	DBT *data;	u_int32_t flags;{	PANIC_CHECK(dbc->dbp->dbenv);	COMPQUIET(key, NULL);	COMPQUIET(data, NULL);	COMPQUIET(flags, 0);	return (EINVAL);}static int__db_join_del(dbc, flags)	DBC *dbc;	u_int32_t flags;{	PANIC_CHECK(dbc->dbp->dbenv);	COMPQUIET(flags, 0);	return (EINVAL);}static int__db_join_get(dbc, key_arg, data_arg, flags)	DBC *dbc;	DBT *key_arg, *data_arg;	u_int32_t flags;{	DBT *key_n, key_n_mem;	DB *dbp;	DBC *cp;	JOIN_CURSOR *jc;	int db_manage_data, ret;	u_int32_t i, j, operation, opmods;	dbp = dbc->dbp;	jc = (JOIN_CURSOR *)dbc->internal;	PANIC_CHECK(dbp->dbenv);	operation = LF_ISSET(DB_OPFLAGS_MASK);	/* !!!	 * If the set of flags here changes, check that __db_join_primget	 * is updated to handle them properly.	 */	opmods = LF_ISSET(DB_RMW | DB_DIRTY_READ);	if ((ret = __db_joingetchk(dbp, key_arg, flags)) != 0)		return (ret);	/*	 * Since we are fetching the key as a datum in the secondary indices,	 * we must be careful of caller-specified DB_DBT_* memory	 * management flags.  If necessary, use a stack-allocated DBT;	 * we'll appropriately copy and/or allocate the data later.	 */	if (F_ISSET(key_arg, DB_DBT_USERMEM) ||	    F_ISSET(key_arg, DB_DBT_MALLOC)) {		/* We just use the default buffer;  no need to go malloc. */		key_n = &key_n_mem;		memset(key_n, 0, sizeof(DBT));	} else {		/*		 * Either DB_DBT_REALLOC or the default buffer will work		 * fine if we have to reuse it, as we do.		 */		key_n = key_arg;	}	/*	 * If our last attempt to do a get on the primary key failed,	 * short-circuit the join and try again with the same key.	 */	if (F_ISSET(jc, JOIN_RETRY))		goto samekey;	F_CLR(jc, JOIN_RETRY);retry:	ret = jc->j_workcurs[0]->c_real_get(jc->j_workcurs[0],	    &jc->j_key, key_n,	    opmods | (jc->j_exhausted[0] ? DB_NEXT_DUP : DB_CURRENT));	if (ret == ENOMEM) {		jc->j_key.ulen <<= 1;		if ((ret = __os_realloc(dbp->dbenv,		    jc->j_key.ulen, &jc->j_key.data)) != 0)			goto mem_err;		goto retry;	}	/*	 * If ret == DB_NOTFOUND, we're out of elements of the first	 * secondary cursor.  This is how we finally finish the join	 * if all goes well.	 */	if (ret != 0)		goto err;	/*	 * If jc->j_exhausted[0] == 1, we've just advanced the first cursor,	 * and we're going to want to advance all the cursors that point to	 * the first member of a duplicate duplicate set (j_fdupcurs[1..N]).	 * Close all the cursors in j_fdupcurs;  we'll reopen them the	 * first time through the upcoming loop.	 */	for (i = 1; i < jc->j_ncurs; i++) {		if (jc->j_fdupcurs[i] != NULL &&		    (ret = jc->j_fdupcurs[i]->c_close(jc->j_fdupcurs[i])) != 0)			goto err;		jc->j_fdupcurs[i] = NULL;	}	/*	 * If jc->j_curslist[1] == NULL, we have only one cursor in the join.	 * Thus, we can safely increment that one cursor on each call	 * to __db_join_get, and we signal this by setting jc->j_exhausted[0]	 * right away.	 *	 * Otherwise, reset jc->j_exhausted[0] to 0, so that we don't	 * increment it until we know we're ready to.	 */	if (jc->j_curslist[1] == NULL)		jc->j_exhausted[0] = 1;	else		jc->j_exhausted[0] = 0;	/* We have the first element; now look for it in the other cursors. */	for (i = 1; i < jc->j_ncurs; i++) {		DB_ASSERT(jc->j_curslist[i] != NULL);		if (jc->j_workcurs[i] == NULL)			/* If this is NULL, we need to dup curslist into it. */			if ((ret = jc->j_curslist[i]->c_dup(			    jc->j_curslist[i], jc->j_workcurs + i,			    DB_POSITIONI)) != 0)				goto err;retry2:		cp = jc->j_workcurs[i];		if ((ret = __db_join_getnext(cp, &jc->j_key, key_n,			    jc->j_exhausted[i], opmods)) == DB_NOTFOUND) {			/*			 * jc->j_workcurs[i] has no more of the datum we're			 * interested in.  Go back one cursor and get			 * a new dup.  We can't just move to a new			 * element of the outer relation, because that way			 * we might miss duplicate duplicates in cursor i-1.			 *			 * If this takes us back to the first cursor,			 * -then- we can move to a new element of the outer			 * relation.			 */			--i;			jc->j_exhausted[i] = 1;			if (i == 0) {				for (j = 1; jc->j_workcurs[j] != NULL; j++) {					/*					 * We're moving to a new element of					 * the first secondary cursor.  If
db_join.c - 源码说明

本页面展示了「这是linux下运行的mysql软件包,可用于linux 下安装 php + mysql + apach 的网络配置」中的 db_join.c 源码文件，采用 C语言编程语言编写，共 823 行代码。您可以在线阅读完整代码内容，也可以返回资源详情页下载完整源码包进行本地学习和开发。
虫虫下载站收录了大量与linux相关的技术资源，包括源代码、技术文档、电路图等，是电子工程师和嵌入式开发者的专业学习平台。
⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?