postgresql/src/include/executor/hashjoin.h

/*-------------------------------------------------------------------------
 *
 * hashjoin.h
 *	  internal structures for hash joins
 *
 *
 * Portions Copyright (c) 1996-2001, PostgreSQL Global Development Group
 * Portions Copyright (c) 1994, Regents of the University of California
 *
 * $Id: hashjoin.h,v 1.25 2001/11/05 17:46:33 momjian Exp $
 *
 *-------------------------------------------------------------------------
 */
#ifndef HASHJOIN_H
#define HASHJOIN_H

#include "access/htup.h"
#include "storage/buffile.h"

/* ----------------------------------------------------------------
 *				hash-join hash table structures
 *
 * Each active hashjoin has a HashJoinTable control block which is
 * palloc'd in the executor's per-query context.  All other storage needed
 * for the hashjoin is kept in private memory contexts, two for each hashjoin.
 * This makes it easy and fast to release the storage when we don't need it
 * anymore.
 *
 * The hashtable contexts are made children of the per-query context, ensuring
 * that they will be discarded at end of statement even if the join is
 * aborted early by an error.  (Likewise, any temporary files we make will
 * be cleaned up by the virtual file manager in event of an error.)
 *
 * Storage that should live through the entire join is allocated from the
 * "hashCxt", while storage that is only wanted for the current batch is
 * allocated in the "batchCxt".  By resetting the batchCxt at the end of
 * each batch, we free all the per-batch storage reliably and without tedium.
 * ----------------------------------------------------------------
 */

/*
 * HashJoinTupleData
 *
 * One entry in a hash bucket's list of tuples.  Entries that fall into the
 * same bucket are chained together through "next"; the head of each chain
 * is kept in the buckets[] array of HashTableData.  Like the buckets array
 * itself, the tuples are per-batch storage.
 */
typedef struct HashJoinTupleData
{
	struct HashJoinTupleData *next;		/* link to next tuple in same
										 * bucket */
	HeapTupleData htup;			/* tuple header */
} HashJoinTupleData;

/* Pointer to a hash table entry; this is the element type of buckets[]. */
typedef HashJoinTupleData *HashJoinTuple;

/*----------
 * HashTableData
 *
 * Control block for one active hash join.  The HashJoinTable typedef below
 * is a pointer to this struct.
 *
 * How a multi-batch join (nbatch > 0) proceeds:
 *
 * During the 1st scan of the inner relation, we get tuples from the
 * executor.  Tuples that don't belong in the first nbuckets logical buckets
 * get dumped into inner-batch temp files.  The same applies to the 1st scan
 * of the outer relation, except that we write tuples to outer-batch temp
 * files.  Then we do the following for each batch:
 *	1. Read tuples from the inner batch file and load them into the hash
 *	   buckets.
 *	2. Read tuples from the outer batch file, match them to the hash
 *	   buckets, and output.
 *----------
 */
typedef struct HashTableData
{
	int			nbuckets;		/* buckets in use during this batch */
	int			totalbuckets;	/* total number of (virtual) buckets */
	HashJoinTuple *buckets;		/* buckets[i] is head of list of tuples */
	/* buckets array is per-batch storage, as are all the tuples */

	int			nbatch;			/* number of batches; 0 means 1-pass join */
	int			curbatch;		/* current batch #, or 0 during 1st pass */

	/*
	 * All of these arrays are allocated for the life of the hash join, but
	 * only if nbatch > 0.  Each array has one entry per batch.
	 */
	BufFile   **innerBatchFile; /* buffered virtual temp file per batch,
								 * for inner-relation tuples */
	BufFile   **outerBatchFile; /* buffered virtual temp file per batch,
								 * for outer-relation tuples */
	long	   *outerBatchSize; /* count of tuples in each outer batch
								 * file */
	long	   *innerBatchSize; /* count of tuples in each inner batch
								 * file */

	/*
	 * Info about the datatype being hashed.  We assume that the inner and
	 * outer sides of the hash are the same type, or at least
	 * binary-compatible types.
	 *
	 * NOTE(review): typLen and typByVal presumably mirror the pg_type
	 * typlen/typbyval attributes of the hash key's type --- confirm against
	 * the code that fills them in.
	 */
	int16		typLen;
	bool		typByVal;

	/*
	 * Private memory contexts for this join.  Storage that should live
	 * through the entire join is allocated from hashCxt; storage that is
	 * only wanted for the current batch is allocated in batchCxt, which is
	 * reset at the end of each batch.
	 */
	MemoryContext hashCxt;		/* context for whole-hash-join storage */
	MemoryContext batchCxt;		/* context for this-batch-only storage */
} HashTableData;

/* Pointer to a hash join's control block. */
typedef HashTableData *HashJoinTable;

#endif   /* HASHJOIN_H */
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00			`/*-------------------------------------------------------------------------`
			`*`
Change my-function-name-- to my_function_name, and optimizer renames. 1999-02-14 00:22:53 +01:00			`* hashjoin.h`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`* internal structures for hash joins`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00			`*`
			`*`
Change Copyright from PostgreSQL, Inc to PostgreSQL Global Development Group. 2001-01-24 20:43:33 +01:00			`* Portions Copyright (c) 1996-2001, PostgreSQL Global Development Group`
Add: * Portions Copyright (c) 1996-2000, PostgreSQL, Inc to all files copyright Regents of Berkeley. Man, that's a lot of files. 2000-01-26 06:58:53 +01:00			`* Portions Copyright (c) 1994, Regents of the University of California`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00			`*`
New pgindent run with fixes suggested by Tom. Patch manually reviewed, initdb/regression tests pass. 2001-11-05 18:46:40 +01:00			`* $Id: hashjoin.h,v 1.25 2001/11/05 17:46:33 momjian Exp $`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00			`*`
			`*-------------------------------------------------------------------------`
			`*/`
Massive commit to run PGINDENT on all .c and .h files. 1997-09-07 07:04:48 +02:00			`#ifndef HASHJOIN_H`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00			`#define HASHJOIN_H`

Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`#include "access/htup.h"`
Split 'BufFile' routines out of fd.c into a new module, buffile.c. Extend BufFile so that it handles multi-segment temporary files transparently. This allows sorts and hashes to work with data exceeding 2Gig (or whatever the local limit on file size is). Change psort.c to use relative seeks instead of absolute seeks for backwards scanning, so that it won't fail when the data volume exceeds 2Gig. 1999-10-13 17:02:32 +02:00			`#include "storage/buffile.h"`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`/* ----------------------------------------------------------------`
			`* hash-join hash table structures`
			`*`
			`* Each active hashjoin has a HashJoinTable control block which is`
First stage of reclaiming memory in executor by resetting short-term memory contexts. Currently, only leaks in expressions executed as quals or projections are handled. Clean up some old dead cruft in executor while at it --- unused fields in state nodes, that sort of thing. 2000-07-12 04:37:39 +02:00			`* palloc'd in the executor's per-query context. All other storage needed`
			`* for the hashjoin is kept in private memory contexts, two for each hashjoin.`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`* This makes it easy and fast to release the storage when we don't need it`
			`* anymore.`
			`*`
Fix a many-legged critter reported by chifungfan@yahoo.com: under the right circumstances a hash join executed as a DECLARE CURSOR/FETCH query would crash the backend. Problem as seen in current sources was that the hash tables were stored in a context that was a child of TransactionCommandContext, which got zapped at completion of the FETCH command --- but cursor cleanup executed at COMMIT expected the tables to still be valid. I haven't chased down the details as seen in 7.0.* but I'm sure it's the same general problem. 2000-08-22 06:06:22 +02:00			`* The hashtable contexts are made children of the per-query context, ensuring`
First phase of memory management rewrite (see backend/utils/mmgr/README for details). It doesn't really do that much yet, since there are no short-term memory contexts in the executor, but the infrastructure is in place and long-term contexts are handled reasonably. A few long- standing bugs have been fixed, such as 'VACUUM; anything' in a single query string crashing. Also, out-of-memory is now considered a recoverable ERROR, not FATAL. Eliminate a large amount of crufty, now-dead code in and around memory management. Fix problem with holding off SIGTRAP, SIGSEGV, etc in postmaster and backend startup. 2000-06-28 05:33:33 +02:00			`* that they will be discarded at end of statement even if the join is`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`* aborted early by an error. (Likewise, any temporary files we make will`
			`* be cleaned up by the virtual file manager in event of an error.)`
Fix some nasty coredump bugs in hashjoin. This code was just about certain to fail anytime it decided the relation to be hashed was too big to fit in memory --- the code for 'batching' a series of hashjoins had multiple errors. I've fixed the easier problems. A remaining big problem is that you can get 'hashtable out of memory' if the code's guesstimate about how much overflow space it will need turns out wrong. That will require much more extensive revisions to fix, so I'm committing these fixes now before I start on that problem. 1999-05-06 02:30:47 +02:00			`*`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`* Storage that should live through the entire join is allocated from the`
First phase of memory management rewrite (see backend/utils/mmgr/README for details). It doesn't really do that much yet, since there are no short-term memory contexts in the executor, but the infrastructure is in place and long-term contexts are handled reasonably. A few long- standing bugs have been fixed, such as 'VACUUM; anything' in a single query string crashing. Also, out-of-memory is now considered a recoverable ERROR, not FATAL. Eliminate a large amount of crufty, now-dead code in and around memory management. Fix problem with holding off SIGTRAP, SIGSEGV, etc in postmaster and backend startup. 2000-06-28 05:33:33 +02:00			`* "hashCxt", while storage that is only wanted for the current batch is`
			`* allocated in the "batchCxt". By resetting the batchCxt at the end of`
			`* each batch, we free all the per-batch storage reliably and without tedium.`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`* ----------------------------------------------------------------`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00			`*/`

Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`typedef struct HashJoinTupleData`
			`{`
pgindent run over code. 1999-05-25 18:15:34 +02:00			`struct HashJoinTupleData *next; /* link to next tuple in same`
			`* bucket */`
			`HeapTupleData htup; /* tuple header */`
Another pgindent run. Sorry folks. 1999-05-26 00:43:53 +02:00			`} HashJoinTupleData;`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`typedef HashJoinTupleData *HashJoinTuple;`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
Massive commit to run PGINDENT on all .c and .h files. 1997-09-07 07:04:48 +02:00			`typedef struct HashTableData`
			`{`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`int nbuckets; /* buckets in use during this batch */`
			`int totalbuckets; /* total number of (virtual) buckets */`
pgindent run over code. 1999-05-25 18:15:34 +02:00			`HashJoinTuple *buckets; /* buckets[i] is head of list of tuples */`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`/* buckets array is per-batch storage, as are all the tuples */`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`int nbatch; /* number of batches; 0 means 1-pass join */`
			`int curbatch; /* current batch #, or 0 during 1st pass */`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
pgindent run over code. 1999-05-25 18:15:34 +02:00			`/*`
			`* all these arrays are allocated for the life of the hash join, but`
			`* only if nbatch > 0:`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`*/`
pgindent run over code. 1999-05-25 18:15:34 +02:00			`BufFile **innerBatchFile; /* buffered virtual temp file per batch */`
			`BufFile **outerBatchFile; /* buffered virtual temp file per batch */`
			`long *outerBatchSize; /* count of tuples in each outer batch`
			`* file */`
			`long *innerBatchSize; /* count of tuples in each inner batch`
			`* file */`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
First stage of reclaiming memory in executor by resetting short-term memory contexts. Currently, only leaks in expressions executed as quals or projections are handled. Clean up some old dead cruft in executor while at it --- unused fields in state nodes, that sort of thing. 2000-07-12 04:37:39 +02:00			`/*`
pgindent run. Make it all clean. 2001-03-22 05:01:46 +01:00			`* Info about the datatype being hashed. We assume that the inner and`
			`* outer sides of the hash are the same type, or at least`
First stage of reclaiming memory in executor by resetting short-term memory contexts. Currently, only leaks in expressions executed as quals or projections are handled. Clean up some old dead cruft in executor while at it --- unused fields in state nodes, that sort of thing. 2000-07-12 04:37:39 +02:00			`* binary-compatible types.`
			`*/`
Change SearchSysCache coding conventions so that a reference count is maintained for each cache entry. A cache entry will not be freed until the matching ReleaseSysCache call has been executed. This eliminates worries about cache entries getting dropped while still in use. See my posting to pg-hackers of even date for more info. 2000-11-16 23:30:52 +01:00			`int16 typLen;`
First stage of reclaiming memory in executor by resetting short-term memory contexts. Currently, only leaks in expressions executed as quals or projections are handled. Clean up some old dead cruft in executor while at it --- unused fields in state nodes, that sort of thing. 2000-07-12 04:37:39 +02:00			`bool typByVal;`

pgindent run over code. 1999-05-25 18:15:34 +02:00			`/*`
			`* During 1st scan of inner relation, we get tuples from executor. If`
			`* nbatch > 0 then tuples that don't belong in first nbuckets logical`
			`* buckets get dumped into inner-batch temp files. The same statements`
			`* apply for the 1st scan of the outer relation, except we write`
			`* tuples to outer-batch temp files. If nbatch > 0 then we do the`
			`* following for each batch: 1. Read tuples from inner batch file,`
			`* load into hash buckets. 2. Read tuples from outer batch file, match`
			`* to hash buckets and output.`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`*/`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
pgindent run over code. 1999-05-25 18:15:34 +02:00			`MemoryContext hashCxt; /* context for whole-hash-join storage */`
			`MemoryContext batchCxt; /* context for this-batch-only storage */`
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`} HashTableData;`
Postgres95 1.01 Distribution - Virgin Sources 1996-07-09 08:22:35 +02:00
Rewrite hash join to use simple linked lists instead of a fixed-size hashtable. This should prevent 'hashtable out of memory' errors, unless you really do run out of memory. Note: target size for hashtable is now taken from -S postmaster switch, not -B, since it is local memory in the backend rather than shared memory. 1999-05-18 23:33:06 +02:00			`typedef HashTableData *HashJoinTable;`
Another pgindent run. Fixes enum indenting, and improves #endif spacing. Also adds space for one-line comments. 2001-10-28 07:26:15 +01:00
New pgindent run with fixes suggested by Tom. Patch manually reviewed, initdb/regression tests pass. 2001-11-05 18:46:40 +01:00			`#endif /* HASHJOIN_H */`