/* * GiST support for ltree * Teodor Sigaev */ #include "ltree.h" #include "access/gist.h" #include "access/rtree.h" #include "access/nbtree.h" #include "crc32.h" PG_FUNCTION_INFO_V1(ltree_gist_in); Datum ltree_gist_in(PG_FUNCTION_ARGS); PG_FUNCTION_INFO_V1(ltree_gist_out); Datum ltree_gist_out(PG_FUNCTION_ARGS); Datum ltree_gist_in(PG_FUNCTION_ARGS) { elog(ERROR, "Unimplemented"); PG_RETURN_DATUM(0); } Datum ltree_gist_out(PG_FUNCTION_ARGS) { elog(ERROR, "Unimplemented"); PG_RETURN_DATUM(0); } PG_FUNCTION_INFO_V1(ltree_compress); Datum ltree_compress(PG_FUNCTION_ARGS); PG_FUNCTION_INFO_V1(ltree_decompress); Datum ltree_decompress(PG_FUNCTION_ARGS); PG_FUNCTION_INFO_V1(ltree_same); Datum ltree_same(PG_FUNCTION_ARGS); PG_FUNCTION_INFO_V1(ltree_union); Datum ltree_union(PG_FUNCTION_ARGS); PG_FUNCTION_INFO_V1(ltree_penalty); Datum ltree_penalty(PG_FUNCTION_ARGS); PG_FUNCTION_INFO_V1(ltree_picksplit); Datum ltree_picksplit(PG_FUNCTION_ARGS); PG_FUNCTION_INFO_V1(ltree_consistent); Datum ltree_consistent(PG_FUNCTION_ARGS); #define ISEQ(a,b) ( (a)->numlevel == (b)->numlevel && ltree_compare(a,b)==0 ) #define GETENTRY(vec,pos) ((ltree_gist *) DatumGetPointer(((GISTENTRY *) VARDATA(vec))[(pos)].key)) Datum ltree_compress(PG_FUNCTION_ARGS) { GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0); GISTENTRY *retval = entry; if (entry->leafkey) { /* ltree */ ltree_gist *key; ltree *val = (ltree *) DatumGetPointer(PG_DETOAST_DATUM(entry->key)); int4 len = LTG_HDRSIZE + val->len; key = (ltree_gist *) palloc(len); key->len = len; key->flag = LTG_ONENODE; memcpy((void *) LTG_NODE(key), (void *) val, val->len); if (PointerGetDatum(val) != entry->key) pfree(val); retval = (GISTENTRY *) palloc(sizeof(GISTENTRY)); gistentryinit(*retval, PointerGetDatum(key), entry->rel, entry->page, entry->offset, key->len, FALSE); } PG_RETURN_POINTER(retval); } Datum ltree_decompress(PG_FUNCTION_ARGS) { GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0); ltree_gist *key = (ltree_gist *) DatumGetPointer(PG_DETOAST_DATUM(entry->key)); if (PointerGetDatum(key) != entry->key) { GISTENTRY *retval = (GISTENTRY *) palloc(sizeof(GISTENTRY)); gistentryinit(*retval, PointerGetDatum(key), entry->rel, entry->page, entry->offset, key->len, FALSE); PG_RETURN_POINTER(retval); } PG_RETURN_POINTER(entry); } Datum ltree_same(PG_FUNCTION_ARGS) { ltree_gist *a = (ltree_gist *) PG_GETARG_POINTER(0); ltree_gist *b = (ltree_gist *) PG_GETARG_POINTER(1); bool *result = (bool *) PG_GETARG_POINTER(2); *result = false; if (LTG_ISONENODE(a) != LTG_ISONENODE(b)) PG_RETURN_POINTER(result); if (LTG_ISONENODE(a)) *result = (ISEQ(LTG_NODE(a), LTG_NODE(b))) ? true : false; else { int4 i; BITVECP sa = LTG_SIGN(a), sb = LTG_SIGN(b); if (LTG_ISALLTRUE(a) != LTG_ISALLTRUE(b)) PG_RETURN_POINTER(result); if (!ISEQ(LTG_LNODE(a), LTG_LNODE(b))) PG_RETURN_POINTER(result); if (!ISEQ(LTG_RNODE(a), LTG_RNODE(b))) PG_RETURN_POINTER(result); *result = true; if (!LTG_ISALLTRUE(a)) LOOPBYTE( if (sa[i] != sb[i]) { *result = false; break; } ); } PG_RETURN_POINTER(result); } static void hashing(BITVECP sign, ltree * t) { int tlen = t->numlevel; ltree_level *cur = LTREE_FIRST(t); int hash; while (tlen > 0) { hash = ltree_crc32_sz(cur->name, cur->len); HASH(sign, hash); cur = LEVEL_NEXT(cur); tlen--; } } Datum ltree_union(PG_FUNCTION_ARGS) { bytea *entryvec = (bytea *) PG_GETARG_POINTER(0); int *size = (int *) PG_GETARG_POINTER(1); BITVEC base; int4 len = (VARSIZE(entryvec) - VARHDRSZ) / sizeof(GISTENTRY); int4 i, j; ltree_gist *result, *cur; ltree *left = NULL, *right = NULL, *curtree; bool isalltrue = false; bool isleqr; MemSet((void *) base, 0, sizeof(BITVEC)); for (j = 0; j < len; j++) { cur = GETENTRY(entryvec, j); if (LTG_ISONENODE(cur)) { curtree = LTG_NODE(cur); hashing(base, curtree); if (!left || ltree_compare(left, curtree) > 0) left = curtree; if (!right || ltree_compare(right, curtree) < 0) right = curtree; } else { if (isalltrue || LTG_ISALLTRUE(cur)) isalltrue = true; else { BITVECP sc = LTG_SIGN(cur); LOOPBYTE( ((unsigned char *) base)[i] |= sc[i]; ); } curtree = LTG_LNODE(cur); if (!left || ltree_compare(left, curtree) > 0) left = curtree; curtree = LTG_RNODE(cur); if (!right || ltree_compare(right, curtree) < 0) right = curtree; } } if (isalltrue == false) { isalltrue = true; LOOPBYTE( if (((unsigned char *) base)[i] != 0xff) { isalltrue = false; break; } ); } isleqr = (left == right || ISEQ(left, right)) ? true : false; *size = LTG_HDRSIZE + ((isalltrue) ? 0 : SIGLEN) + left->len + ((isleqr) ? 0 : right->len); result = (ltree_gist *) palloc(*size); result->len = *size; result->flag = 0; if (isalltrue) result->flag |= LTG_ALLTRUE; else memcpy((void *) LTG_SIGN(result), base, SIGLEN); memcpy((void *) LTG_LNODE(result), (void *) left, left->len); if (isleqr) result->flag |= LTG_NORIGHT; else memcpy((void *) LTG_RNODE(result), (void *) right, right->len); PG_RETURN_POINTER(result); } Datum ltree_penalty(PG_FUNCTION_ARGS) { ltree_gist *origval = (ltree_gist *) DatumGetPointer(((GISTENTRY *) PG_GETARG_POINTER(0))->key); ltree_gist *newval = (ltree_gist *) DatumGetPointer(((GISTENTRY *) PG_GETARG_POINTER(1))->key); float *penalty = (float *) PG_GETARG_POINTER(2); int4 cmpr, cmpl; cmpl = ltree_compare(LTG_GETLNODE(origval), LTG_GETLNODE(newval)); cmpr = ltree_compare(LTG_GETRNODE(newval), LTG_GETRNODE(origval)); *penalty = max(cmpl, 0) + max(cmpr, 0); PG_RETURN_POINTER(penalty); } /* used for sorting */ typedef struct rix { int index; ltree *r; } RIX; static int treekey_cmp(const void *a, const void *b) { return ltree_compare( ((RIX *) a)->r, ((RIX *) b)->r ); } Datum ltree_picksplit(PG_FUNCTION_ARGS) { bytea *entryvec = (bytea *) PG_GETARG_POINTER(0); GIST_SPLITVEC *v = (GIST_SPLITVEC *) PG_GETARG_POINTER(1); OffsetNumber j; int4 i; RIX *array; OffsetNumber maxoff; int nbytes; int size; ltree *lu_l, *lu_r, *ru_l, *ru_r; ltree_gist *lu, *ru; BITVEC ls, rs; bool lisat = false, risat = false, isleqr; memset((void *) ls, 0, sizeof(BITVEC)); memset((void *) rs, 0, sizeof(BITVEC)); maxoff = ((VARSIZE(entryvec) - VARHDRSZ) / sizeof(GISTENTRY)) - 1; nbytes = (maxoff + 2) * sizeof(OffsetNumber); v->spl_left = (OffsetNumber *) palloc(nbytes); v->spl_right = (OffsetNumber *) palloc(nbytes); v->spl_nleft = 0; v->spl_nright = 0; array = (RIX *) palloc(sizeof(RIX) * (maxoff + 1)); /* copy the data into RIXes, and sort the RIXes */ for (j = FirstOffsetNumber; j <= maxoff; j = OffsetNumberNext(j)) { array[j].index = j; lu = GETENTRY(entryvec, j); /* use as tmp val */ array[j].r = LTG_GETLNODE(lu); } qsort((void *) &array[FirstOffsetNumber], maxoff - FirstOffsetNumber + 1, sizeof(RIX), treekey_cmp); lu_l = lu_r = ru_l = ru_r = NULL; for (j = FirstOffsetNumber; j <= maxoff; j = OffsetNumberNext(j)) { lu = GETENTRY(entryvec, array[j].index); /* use as tmp val */ if (j <= (maxoff - FirstOffsetNumber + 1) / 2) { v->spl_left[v->spl_nleft] = array[j].index; v->spl_nleft++; if (lu_r == NULL || ltree_compare(LTG_GETRNODE(lu), lu_r) > 0) lu_r = LTG_GETRNODE(lu); if (LTG_ISONENODE(lu)) hashing(ls, LTG_NODE(lu)); else { if (lisat || LTG_ISALLTRUE(lu)) lisat = true; else { BITVECP sc = LTG_SIGN(lu); LOOPBYTE( ((unsigned char *) ls)[i] |= sc[i]; ); } } } else { v->spl_right[v->spl_nright] = array[j].index; v->spl_nright++; if (ru_r == NULL || ltree_compare(LTG_GETRNODE(lu), ru_r) > 0) ru_r = LTG_GETRNODE(lu); if (LTG_ISONENODE(lu)) hashing(rs, LTG_NODE(lu)); else { if (risat || LTG_ISALLTRUE(lu)) risat = true; else { BITVECP sc = LTG_SIGN(lu); LOOPBYTE( ((unsigned char *) rs)[i] |= sc[i]; ); } } } } if (lisat == false) { lisat = true; LOOPBYTE( if (((unsigned char *) ls)[i] != 0xff) { lisat = false; break; } ); } if (risat == false) { risat = true; LOOPBYTE( if (((unsigned char *) rs)[i] != 0xff) { risat = false; break; } ); } lu_l = LTG_GETLNODE(GETENTRY(entryvec, array[FirstOffsetNumber].index)); isleqr = (lu_l == lu_r || ISEQ(lu_l, lu_r)) ? true : false; size = LTG_HDRSIZE + ((lisat) ? 0 : SIGLEN) + lu_l->len + ((isleqr) ? 0 : lu_r->len); lu = (ltree_gist *) palloc(size); lu->len = size; lu->flag = 0; if (lisat) lu->flag |= LTG_ALLTRUE; else memcpy((void *) LTG_SIGN(lu), ls, SIGLEN); memcpy((void *) LTG_LNODE(lu), (void *) lu_l, lu_l->len); if (isleqr) lu->flag |= LTG_NORIGHT; else memcpy((void *) LTG_RNODE(lu), (void *) lu_r, lu_r->len); ru_l = LTG_GETLNODE(GETENTRY(entryvec, array[1 + ((maxoff - FirstOffsetNumber + 1) / 2)].index)); isleqr = (ru_l == ru_r || ISEQ(ru_l, ru_r)) ? true : false; size = LTG_HDRSIZE + ((risat) ? 0 : SIGLEN) + ru_l->len + ((isleqr) ? 0 : ru_r->len); ru = (ltree_gist *) palloc(size); ru->len = size; ru->flag = 0; if (risat) ru->flag |= LTG_ALLTRUE; else memcpy((void *) LTG_SIGN(ru), rs, SIGLEN); memcpy((void *) LTG_LNODE(ru), (void *) ru_l, ru_l->len); if (isleqr) ru->flag |= LTG_NORIGHT; else memcpy((void *) LTG_RNODE(ru), (void *) ru_r, ru_r->len); pfree(array); v->spl_ldatum = PointerGetDatum(lu); v->spl_rdatum = PointerGetDatum(ru); PG_RETURN_POINTER(v); } static bool gist_isparent(ltree_gist * key, ltree * query) { int4 numlevel = query->numlevel; int i; for (i = query->numlevel; i >= 0; i--) { query->numlevel = i; if (ltree_compare(query, LTG_GETLNODE(key)) >= 0 && ltree_compare(query, LTG_GETRNODE(key)) <= 0) { query->numlevel = numlevel; return true; } } query->numlevel = numlevel; return false; } static bool gist_ischild(ltree_gist * key, ltree * query) { ltree *left = LTG_GETLNODE(key); ltree *right = LTG_GETRNODE(key); int4 numlevelL = left->numlevel; int4 numlevelR = right->numlevel; bool res = true; if (numlevelL > query->numlevel) left->numlevel = query->numlevel; if (ltree_compare(query, left) < 0) res = false; if (numlevelR > query->numlevel) right->numlevel = query->numlevel; if (res && ltree_compare(query, right) > 0) res = false; left->numlevel = numlevelL; right->numlevel = numlevelR; return res; } static bool gist_qe(ltree_gist * key, lquery * query) { lquery_level *curq = LQUERY_FIRST(query); BITVECP sign = LTG_SIGN(key); int qlen = query->numlevel; if (LTG_ISALLTRUE(key)) return true; while (qlen > 0) { if (curq->numvar && LQL_CANLOOKSIGN(curq)) { bool isexist = false; int vlen = curq->numvar; lquery_variant *curv = LQL_FIRST(curq); while (vlen > 0) { if (GETBIT(sign, HASHVAL(curv->val))) { isexist = true; break; } curv = LVAR_NEXT(curv); vlen--; } if (!isexist) return false; } curq = LQL_NEXT(curq); qlen--; } return true; } static int gist_tqcmp(ltree * t, lquery * q) { ltree_level *al = LTREE_FIRST(t); lquery_level *ql = LQUERY_FIRST(q); lquery_variant *bl; int an = t->numlevel; int bn = q->firstgood; int res = 0; while (an > 0 && bn > 0) { bl = LQL_FIRST(ql); if ((res = strncmp(al->name, bl->name, min(al->len, bl->len))) == 0) { if (al->len != bl->len) return al->len - bl->len; } else return res; an--; bn--; al = LEVEL_NEXT(al); ql = LQL_NEXT(ql); } return t->numlevel - q->firstgood; } static bool gist_between(ltree_gist * key, lquery * query) { ltree *left = LTG_GETLNODE(key); ltree *right = LTG_GETRNODE(key); int4 numlevelL = left->numlevel; int4 numlevelR = right->numlevel; bool res = true; if (query->firstgood == 0) return true; if (numlevelL > query->firstgood) left->numlevel = query->firstgood; if (gist_tqcmp(left, query) > 0) res = false; if (numlevelR > query->firstgood) right->numlevel = query->firstgood; if (res && gist_tqcmp(right, query) < 0) res = false; left->numlevel = numlevelL; right->numlevel = numlevelR; return res; } static bool checkcondition_bit(void *checkval, ITEM * val) { return (FLG_CANLOOKSIGN(val->flag)) ? GETBIT(checkval, HASHVAL(val->val)) : true; } static bool gist_qtxt(ltree_gist * key, ltxtquery * query) { if (LTG_ISALLTRUE(key)) return true; return ltree_execute( GETQUERY(query), (void *) LTG_SIGN(key), false, checkcondition_bit ); } Datum ltree_consistent(PG_FUNCTION_ARGS) { GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0); char *query = (char *) DatumGetPointer(PG_DETOAST_DATUM(PG_GETARG_DATUM(1))); ltree_gist *key = (ltree_gist *) DatumGetPointer(entry->key); StrategyNumber strategy = (StrategyNumber) PG_GETARG_UINT16(2); bool res = false; #ifndef assert_enabled #define assert_enabled 0 #endif switch (strategy) { case BTLessStrategyNumber: res = (GIST_LEAF(entry)) ? (ltree_compare((ltree *) query, LTG_NODE(key)) > 0) : (ltree_compare((ltree *) query, LTG_GETLNODE(key)) >= 0); break; case BTLessEqualStrategyNumber: res = (ltree_compare((ltree *) query, LTG_GETLNODE(key)) >= 0); break; case BTEqualStrategyNumber: if (GIST_LEAF(entry)) res = (ltree_compare((ltree *) query, LTG_NODE(key)) == 0); else res = ( ltree_compare((ltree *) query, LTG_GETLNODE(key)) >= 0 && ltree_compare((ltree *) query, LTG_GETRNODE(key)) <= 0 ); break; case BTGreaterEqualStrategyNumber: res = (ltree_compare((ltree *) query, LTG_GETRNODE(key)) <= 0); break; case BTGreaterStrategyNumber: res = (GIST_LEAF(entry)) ? (ltree_compare((ltree *) query, LTG_GETRNODE(key)) < 0) : (ltree_compare((ltree *) query, LTG_GETRNODE(key)) <= 0); break; case 10: res = (GIST_LEAF(entry)) ? inner_isparent((ltree *) query, LTG_NODE(key)) : gist_isparent(key, (ltree *) query); break; case 11: res = (GIST_LEAF(entry)) ? inner_isparent(LTG_NODE(key), (ltree *) query) : gist_ischild(key, (ltree *) query); break; case 12: case 13: if (GIST_LEAF(entry)) res = DatumGetBool(DirectFunctionCall2(ltq_regex, PointerGetDatum(LTG_NODE(key)), PointerGetDatum((lquery *) query) )); else res = (gist_qe(key, (lquery *) query) && gist_between(key, (lquery *) query)); break; case 14: case 15: if (GIST_LEAF(entry)) res = DatumGetBool(DirectFunctionCall2(ltxtq_exec, PointerGetDatum(LTG_NODE(key)), PointerGetDatum((lquery *) query) )); else res = gist_qtxt(key, (ltxtquery *) query); break; default: elog(ERROR, "Unknown StrategyNumber: %d", strategy); } PG_RETURN_BOOL(res); }