postgresql/src/include/port/pg_lfind.h

/*-------------------------------------------------------------------------
 *
 * pg_lfind.h
 *	  Optimized linear search routines using SIMD intrinsics where
 *	  available.
 *
 * Copyright (c) 2022, PostgreSQL Global Development Group
 *
 * IDENTIFICATION
 *	  src/include/port/pg_lfind.h
 *
 *-------------------------------------------------------------------------
 */
#ifndef PG_LFIND_H
#define PG_LFIND_H

#include "port/simd.h"

/*
 * pg_lfind8
 *
 * Linear search of the 'nelem' bytes starting at 'base' for a byte equal to
 * 'key'.  Returns true as soon as a match is seen, or false if the whole
 * array was examined without finding one.
 */
static inline bool
pg_lfind8(uint8 key, uint8 *base, uint32 nelem)
{
	/* nelem rounded down to a multiple of the vector length */
	const uint32 vec_end = nelem & ~(sizeof(Vector8) - 1);
	uint32		pos = 0;
	Vector8		block;

	/* Check one whole vector's worth of bytes per step. */
	while (pos < vec_end)
	{
		vector8_load(&block, &base[pos]);
		if (vector8_has(block, key))
			return true;
		pos += sizeof(Vector8);
	}

	/* Less than a full vector is left; compare those bytes individually. */
	while (pos < nelem)
	{
		if (base[pos] == key)
			return true;
		pos++;
	}

	return false;
}

/*
 * pg_lfind8_le
 *
 * Linear search of the 'nelem' bytes starting at 'base' for a byte that is
 * less than or equal to 'key'.  Returns true as soon as such a byte is seen,
 * or false if the whole array was examined without finding one.
 */
static inline bool
pg_lfind8_le(uint8 key, uint8 *base, uint32 nelem)
{
	/* nelem rounded down to a multiple of the vector length */
	const uint32 vec_end = nelem & ~(sizeof(Vector8) - 1);
	uint32		pos = 0;
	Vector8		block;

	/* Check one whole vector's worth of bytes per step. */
	while (pos < vec_end)
	{
		vector8_load(&block, &base[pos]);
		if (vector8_has_le(block, key))
			return true;
		pos += sizeof(Vector8);
	}

	/* Less than a full vector is left; compare those bytes individually. */
	while (pos < nelem)
	{
		if (base[pos] <= key)
			return true;
		pos++;
	}

	return false;
}

/*
 * pg_lfind32
 *
 * Linear search of the 'nelem' 32-bit values starting at 'base' for one
 * equal to 'key'.  Returns true if a match exists, otherwise false.
 *
 * Unless USE_NO_SIMD is defined, the bulk of the array is searched with
 * vector operations and only the leftover elements are compared one by one.
 * With USE_NO_SIMD the function is just the element-by-element loop.
 */
static inline bool
pg_lfind32(uint32 key, uint32 *base, uint32 nelem)
{
	uint32		pos = 0;

#ifndef USE_NO_SIMD

	/*
	 * Every pass of the vectorized loop works on a group of four registers,
	 * which gives better instruction-level parallelism.  Testing for SSE2
	 * has shown this is ~40% faster than working on a group of two.
	 */
	const Vector32 key_vec = vector32_broadcast(key);	/* copies of key */
	const uint32 per_vector = sizeof(Vector32) / sizeof(uint32);
	const uint32 per_pass = 4 * per_vector;

	/* nelem rounded down to a multiple of the elements handled per pass */
	const uint32 vec_end = nelem & ~(per_pass - 1);

#if defined(USE_ASSERT_CHECKING)
	bool		assert_result = false;

	/*
	 * Work out the answer up front with a plain scan, so that the asserts
	 * below can cross-check whatever the optimized paths return.
	 */
	for (pos = 0; pos < nelem; pos++)
	{
		if (base[pos] == key)
		{
			assert_result = true;
			break;
		}
	}
#endif

	for (pos = 0; pos < vec_end; pos += per_pass)
	{
		Vector32	blk_a;
		Vector32	blk_b;
		Vector32	blk_c;
		Vector32	blk_d;
		Vector32	hit_a;
		Vector32	hit_b;
		Vector32	hit_c;
		Vector32	hit_d;
		Vector32	hits_ab;
		Vector32	hits_cd;
		Vector32	hits_all;

		/* fetch four consecutive vectors' worth of elements */
		vector32_load(&blk_a, &base[pos]);
		vector32_load(&blk_b, &base[pos + per_vector]);
		vector32_load(&blk_c, &base[pos + per_vector * 2]);
		vector32_load(&blk_d, &base[pos + per_vector * 3]);

		/* test every loaded element against the key */
		hit_a = vector32_eq(key_vec, blk_a);
		hit_b = vector32_eq(key_vec, blk_b);
		hit_c = vector32_eq(key_vec, blk_c);
		hit_d = vector32_eq(key_vec, blk_d);

		/* fold the four comparison results into one vector */
		hits_ab = vector32_or(hit_a, hit_b);
		hits_cd = vector32_or(hit_c, hit_d);
		hits_all = vector32_or(hits_ab, hits_cd);

		/*
		 * Any high bit set in the folded result is treated as a match.
		 * NOTE(review): presumably vector32_eq() sets all bits of a matching
		 * element -- confirm against port/simd.h.
		 */
		if (vector8_is_highbit_set((Vector8) hits_all))
		{
			Assert(assert_result == true);
			return true;
		}
	}
#endif							/* ! USE_NO_SIMD */

	/* Compare whatever the vectorized loop did not cover, one by one. */
	while (pos < nelem)
	{
		if (base[pos] == key)
		{
#ifndef USE_NO_SIMD
			Assert(assert_result == true);
#endif
			return true;
		}
		pos++;
	}

#ifndef USE_NO_SIMD
	Assert(assert_result == false);
#endif
	return false;
}

#endif							/* PG_LFIND_H */
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`/*-------------------------------------------------------------------------`
			`*`
			`* pg_lfind.h`
Add optimized functions for linear search within byte arrays In similar vein to b6ef167564, add pg_lfind8() and pg_lfind8_le() to search for bytes equal or less-than-or-equal to a given byte, respectively. To abstract away platform details, add helper functions and typedefs to simd.h. John Naylor and Nathan Bossart, per suggestion from Andres Freund Discussion: https://www.postgresql.org/message-id/CAFBsxsGzaaGLF%3DNuq61iRXTyspbO9rOjhSqFN%3DV6ozzmta5mXg%40mail.gmail.com 2022-08-21 06:14:01 +02:00			`* Optimized linear search routines using SIMD intrinsics where`
			`* available.`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`*`
			`* Copyright (c) 2022, PostgreSQL Global Development Group`
			`*`
			`* IDENTIFICATION`
			`* src/include/port/pg_lfind.h`
			`*`
			`*-------------------------------------------------------------------------`
			`*/`
			`#ifndef PG_LFIND_H`
			`#define PG_LFIND_H`

			`#include "port/simd.h"`

Add optimized functions for linear search within byte arrays In similar vein to b6ef167564, add pg_lfind8() and pg_lfind8_le() to search for bytes equal or less-than-or-equal to a given byte, respectively. To abstract away platform details, add helper functions and typedefs to simd.h. John Naylor and Nathan Bossart, per suggestion from Andres Freund Discussion: https://www.postgresql.org/message-id/CAFBsxsGzaaGLF%3DNuq61iRXTyspbO9rOjhSqFN%3DV6ozzmta5mXg%40mail.gmail.com 2022-08-21 06:14:01 +02:00			`/*`
			`* pg_lfind8`
			`*`
			`* Return true if there is an element in 'base' that equals 'key', otherwise`
			`* return false.`
			`*/`
			`static inline bool`
			`pg_lfind8(uint8 key, uint8 *base, uint32 nelem)`
			`{`
			`uint32 i;`

			`/* round down to multiple of vector length */`
			`uint32 tail_idx = nelem & ~(sizeof(Vector8) - 1);`
			`Vector8 chunk;`

			`for (i = 0; i < tail_idx; i += sizeof(Vector8))`
			`{`
			`vector8_load(&chunk, &base[i]);`
			`if (vector8_has(chunk, key))`
			`return true;`
			`}`

			`/* Process the remaining elements one at a time. */`
			`for (; i < nelem; i++)`
			`{`
			`if (key == base[i])`
			`return true;`
			`}`

			`return false;`
			`}`

			`/*`
			`* pg_lfind8_le`
			`*`
			`* Return true if there is an element in 'base' that is less than or equal to`
			`* 'key', otherwise return false.`
			`*/`
			`static inline bool`
			`pg_lfind8_le(uint8 key, uint8 *base, uint32 nelem)`
			`{`
			`uint32 i;`

			`/* round down to multiple of vector length */`
			`uint32 tail_idx = nelem & ~(sizeof(Vector8) - 1);`
			`Vector8 chunk;`

			`for (i = 0; i < tail_idx; i += sizeof(Vector8))`
			`{`
			`vector8_load(&chunk, &base[i]);`
			`if (vector8_has_le(chunk, key))`
			`return true;`
			`}`

			`/* Process the remaining elements one at a time. */`
			`for (; i < nelem; i++)`
			`{`
			`if (base[i] <= key)`
			`return true;`
			`}`

			`return false;`
			`}`

Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`/*`
			`* pg_lfind32`
			`*`
			`* Return true if there is an element in 'base' that equals 'key', otherwise`
			`* return false.`
			`*/`
			`static inline bool`
			`pg_lfind32(uint32 key, uint32 *base, uint32 nelem)`
			`{`
			`uint32 i = 0;`

Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`#ifndef USE_NO_SIMD`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00
			`/*`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`* For better instruction-level parallelism, each loop iteration operates`
			`* on a block of four registers. Testing for SSE2 has showed this is ~40%`
			`* faster than using a block of two registers.`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`*/`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`const Vector32 keys = vector32_broadcast(key); /* load copies of key */`
			`const uint32 nelem_per_vector = sizeof(Vector32) / sizeof(uint32);`
			`const uint32 nelem_per_iteration = 4 * nelem_per_vector;`

			`/* round down to multiple of elements per iteration */`
			`const uint32 tail_idx = nelem & ~(nelem_per_iteration - 1);`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00
			`#if defined(USE_ASSERT_CHECKING)`
			`bool assert_result = false;`

			`/* pre-compute the result for assert checking */`
			`for (i = 0; i < nelem; i++)`
			`{`
			`if (key == base[i])`
			`{`
			`assert_result = true;`
			`break;`
			`}`
			`}`
			`#endif`

Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`for (i = 0; i < tail_idx; i += nelem_per_iteration)`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`{`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`Vector32 vals1,`
			`vals2,`
			`vals3,`
			`vals4,`
			`result1,`
			`result2,`
			`result3,`
			`result4,`
			`tmp1,`
			`tmp2,`
			`result;`

			`/* load the next block into 4 registers */`
			`vector32_load(&vals1, &base[i]);`
			`vector32_load(&vals2, &base[i + nelem_per_vector]);`
			`vector32_load(&vals3, &base[i + nelem_per_vector * 2]);`
			`vector32_load(&vals4, &base[i + nelem_per_vector * 3]);`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00
			`/* compare each value to the key */`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`result1 = vector32_eq(keys, vals1);`
			`result2 = vector32_eq(keys, vals2);`
			`result3 = vector32_eq(keys, vals3);`
			`result4 = vector32_eq(keys, vals4);`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00
			`/* combine the results into a single variable */`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`tmp1 = vector32_or(result1, result2);`
			`tmp2 = vector32_or(result3, result4);`
			`result = vector32_or(tmp1, tmp2);`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00
			`/* see if there was a match */`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`if (vector8_is_highbit_set((Vector8) result))`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`{`
			`Assert(assert_result == true);`
			`return true;`
			`}`
			`}`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`#endif /* ! USE_NO_SIMD */`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00
			`/* Process the remaining elements one at a time. */`
			`for (; i < nelem; i++)`
			`{`
			`if (key == base[i])`
			`{`
Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`#ifndef USE_NO_SIMD`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`Assert(assert_result == true);`
			`#endif`
			`return true;`
			`}`
			`}`

Abstract some more architecture-specific details away from SIMD functionality Add a typedef to represent vectors containing four 32-bit integers, and add functions operating on them. Also separate out saturating subtraction into its own function. The motivation for this is to prepare for a future commit to add ARM NEON support. Nathan Bossart Reviewed by John Naylor and Tom Lane Discussion: https://www.postgresql.org/message-id/flat/CAFBsxsEyR9JkfbPcDXBRYEfdfC__OkwVGdwEAgY4Rv0cvw35EA%40mail.gmail.com#aba7a64b11503494ffd8dd27067626a9 2022-08-29 08:40:53 +02:00			`#ifndef USE_NO_SIMD`
Introduce optimized routine for linear searches of arrays Use SSE2 intrinsics to speed up the search, where available. Otherwise, use a simple 'for' loop. The motivation to add this now is to speed up XidInMVCCSnapshot(), which is the reason only unsigned 32-bit integer arrays are optimized. Other types are left for future work, as is the extension of this technique to non-x86 platforms. Nathan Bossart Reviewed by: Andres Freund, Bharath Rupireddy, Masahiko Sawada Discussion: https://postgr.es/m/20220713170950.GA3116318%40nathanxps13 2022-08-03 18:49:04 +02:00			`Assert(assert_result == false);`
			`#endif`
			`return false;`
			`}`

			`#endif /* PG_LFIND_H */`