Allow Incremental Sorts on GiST and SP-GiST indexes

Previously an "amcanorderbyop" index would only be used when the index
could provide sorted results which satisfied all query_pathkeys.  Here
we relax this so that we also allow these indexes to be considered by the
planner when they only provide partially sorted results.  This allows the
planner to later consider making use of an Incremental Sort to satisfy the
remaining pathkeys.  This change is particularly useful for KNN-type
queries which contain a LIMIT clause and an additional ORDER BY clause for
a non-indexed column.

Author: Miroslav Bendik
Reviewed-by: Richard Guo, David Rowley
Discussion: https://postgr.es/m/CAPoEpV0QYDtzjwamwWUBqyWpaCVbJV2d6qOD7Uy09bWn47PJtw%40mail.gmail.com
This commit is contained in:
David Rowley 2023-07-04 23:08:52 +12:00
parent 28b5726561
commit 625d5b3ca0
3 changed files with 76 additions and 24 deletions

View File

@ -974,14 +974,20 @@ build_index_paths(PlannerInfo *root, RelOptInfo *rel,
}
else if (index->amcanorderbyop && pathkeys_possibly_useful)
{
/* see if we can generate ordering operators for query_pathkeys */
/*
* See if we can generate ordering operators for query_pathkeys or at
* least some prefix thereof. Matching to just a prefix of the
* query_pathkeys will allow an incremental sort to be considered on
* the index's partially sorted results.
*/
match_pathkeys_to_index(index, root->query_pathkeys,
&orderbyclauses,
&orderbyclausecols);
if (orderbyclauses)
if (list_length(root->query_pathkeys) == list_length(orderbyclauses))
useful_pathkeys = root->query_pathkeys;
else
useful_pathkeys = NIL;
useful_pathkeys = list_copy_head(root->query_pathkeys,
list_length(orderbyclauses));
}
else
{
@ -3051,24 +3057,24 @@ expand_indexqual_rowcompare(PlannerInfo *root,
/*
* match_pathkeys_to_index
* Test whether an index can produce output ordered according to the
* given pathkeys using "ordering operators".
* For the given 'index' and 'pathkeys', output a list of suitable ORDER
* BY expressions, each of the form "indexedcol operator pseudoconstant",
* along with an integer list of the index column numbers (zero based)
* that each clause would be used with.
*
* If it can, return a list of suitable ORDER BY expressions, each of the form
* "indexedcol operator pseudoconstant", along with an integer list of the
* index column numbers (zero based) that each clause would be used with.
* NIL lists are returned if the ordering is not achievable this way.
*
* On success, the result list is ordered by pathkeys, and in fact is
* one-to-one with the requested pathkeys.
* This attempts to find an ORDER BY and index column number for all items in
* the pathkey list, however, if we're unable to match any given pathkey to an
* index column, we return just the ones matched by the function so far. This
* allows callers who are interested in partial matches to get them. Callers
* can determine a partial match vs a full match by checking the outputted
* list lengths. A full match will have one item in the output lists for each
* item in the given 'pathkeys' list.
*/
static void
match_pathkeys_to_index(IndexOptInfo *index, List *pathkeys,
List **orderby_clauses_p,
List **clause_columns_p)
{
List *orderby_clauses = NIL;
List *clause_columns = NIL;
ListCell *lc1;
*orderby_clauses_p = NIL; /* set default results */
@ -3084,10 +3090,6 @@ match_pathkeys_to_index(IndexOptInfo *index, List *pathkeys,
bool found = false;
ListCell *lc2;
/*
* Note: for any failure to match, we just return NIL immediately.
* There is no value in matching just some of the pathkeys.
*/
/* Pathkey must request default sort order for the target opfamily */
if (pathkey->pk_strategy != BTLessStrategyNumber ||
@ -3133,8 +3135,8 @@ match_pathkeys_to_index(IndexOptInfo *index, List *pathkeys,
pathkey->pk_opfamily);
if (expr)
{
orderby_clauses = lappend(orderby_clauses, expr);
clause_columns = lappend_int(clause_columns, indexcol);
*orderby_clauses_p = lappend(*orderby_clauses_p, expr);
*clause_columns_p = lappend_int(*clause_columns_p, indexcol);
found = true;
break;
}
@ -3144,12 +3146,13 @@ match_pathkeys_to_index(IndexOptInfo *index, List *pathkeys,
break;
}
if (!found) /* fail if no match for this pathkey */
/*
* Return the matches found so far when this pathkey couldn't be
* matched to the index.
*/
if (!found)
return;
}
*orderby_clauses_p = orderby_clauses; /* success! */
*clause_columns_p = clause_columns;
}
/*

View File

@ -1660,3 +1660,36 @@ order by 1, 2;
-> Function Scan on generate_series
(7 rows)
reset enable_hashagg;
reset enable_seqscan;
reset enable_incremental_sort;
reset parallel_tuple_cost;
reset parallel_setup_cost;
reset min_parallel_table_scan_size;
reset min_parallel_index_scan_size;
-- Ensure incremental sorts work for amcanorderbyop type indexes
create table point_table (a point, b int);
create index point_table_a_idx on point_table using gist(a);
-- Ensure we get an incremental sort plan for both of the following queries
explain (costs off) select a, b, a <-> point(5, 5) dist from point_table order by dist, b limit 1;
QUERY PLAN
---------------------------------------------------------------
Limit
-> Incremental Sort
Sort Key: ((a <-> '(5,5)'::point)), b
Presorted Key: ((a <-> '(5,5)'::point))
-> Index Scan using point_table_a_idx on point_table
Order By: (a <-> '(5,5)'::point)
(6 rows)
explain (costs off) select a, b, a <-> point(5, 5) dist from point_table order by dist, b desc limit 1;
QUERY PLAN
---------------------------------------------------------------
Limit
-> Incremental Sort
Sort Key: ((a <-> '(5,5)'::point)), b DESC
Presorted Key: ((a <-> '(5,5)'::point))
-> Index Scan using point_table_a_idx on point_table
Order By: (a <-> '(5,5)'::point)
(6 rows)

View File

@ -276,3 +276,19 @@ from tenk1, lateral (select tenk1.unique1 from generate_series(1, 1000)) as sub;
explain (costs off) select sub.unique1, stringu1 || random()::text
from tenk1, lateral (select tenk1.unique1 from generate_series(1, 1000)) as sub
order by 1, 2;
reset enable_hashagg;
reset enable_seqscan;
reset enable_incremental_sort;
reset parallel_tuple_cost;
reset parallel_setup_cost;
reset min_parallel_table_scan_size;
reset min_parallel_index_scan_size;
-- Ensure incremental sorts work for amcanorderbyop type indexes
create table point_table (a point, b int);
create index point_table_a_idx on point_table using gist(a);
-- Ensure we get an incremental sort plan for both of the following queries
explain (costs off) select a, b, a <-> point(5, 5) dist from point_table order by dist, b limit 1;
explain (costs off) select a, b, a <-> point(5, 5) dist from point_table order by dist, b desc limit 1;