/* * contrib/btree_gist/btree_utils_var.c */ #include "postgres.h" #include #include #include #include "btree_gist.h" #include "btree_utils_var.h" #include "utils/builtins.h" #include "utils/pg_locale.h" #include "utils/rel.h" /* used for key sorting */ typedef struct { int i; GBT_VARKEY *t; } Vsrt; typedef struct { const gbtree_vinfo *tinfo; Oid collation; FmgrInfo *flinfo; } gbt_vsrt_arg; PG_FUNCTION_INFO_V1(gbt_var_decompress); PG_FUNCTION_INFO_V1(gbt_var_fetch); Datum gbt_var_decompress(PG_FUNCTION_ARGS) { GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0); GBT_VARKEY *key = (GBT_VARKEY *) PG_DETOAST_DATUM(entry->key); if (key != (GBT_VARKEY *) DatumGetPointer(entry->key)) { GISTENTRY *retval = (GISTENTRY *) palloc(sizeof(GISTENTRY)); gistentryinit(*retval, PointerGetDatum(key), entry->rel, entry->page, entry->offset, false); PG_RETURN_POINTER(retval); } PG_RETURN_POINTER(entry); } /* Returns a better readable representation of variable key ( sets pointer ) */ GBT_VARKEY_R gbt_var_key_readable(const GBT_VARKEY *k) { GBT_VARKEY_R r; r.lower = (bytea *) &(((char *) k)[VARHDRSZ]); if (VARSIZE(k) > (VARHDRSZ + (VARSIZE(r.lower)))) r.upper = (bytea *) &(((char *) k)[VARHDRSZ + INTALIGN(VARSIZE(r.lower))]); else r.upper = r.lower; return r; } /* * Create a leaf-entry to store in the index, from a single Datum. */ static GBT_VARKEY * gbt_var_key_from_datum(const struct varlena *u) { int32 lowersize = VARSIZE(u); GBT_VARKEY *r; r = (GBT_VARKEY *) palloc(lowersize + VARHDRSZ); memcpy(VARDATA(r), u, lowersize); SET_VARSIZE(r, lowersize + VARHDRSZ); return r; } /* * Create an entry to store in the index, from lower and upper bound. */ GBT_VARKEY * gbt_var_key_copy(const GBT_VARKEY_R *u) { int32 lowersize = VARSIZE(u->lower); int32 uppersize = VARSIZE(u->upper); GBT_VARKEY *r; r = (GBT_VARKEY *) palloc0(INTALIGN(lowersize) + uppersize + VARHDRSZ); memcpy(VARDATA(r), u->lower, lowersize); memcpy(VARDATA(r) + INTALIGN(lowersize), u->upper, uppersize); SET_VARSIZE(r, INTALIGN(lowersize) + uppersize + VARHDRSZ); return r; } static GBT_VARKEY * gbt_var_leaf2node(GBT_VARKEY *leaf, const gbtree_vinfo *tinfo, FmgrInfo *flinfo) { GBT_VARKEY *out = leaf; if (tinfo->f_l2n) out = tinfo->f_l2n(leaf, flinfo); return out; } /* * returns the common prefix length of a node key */ static int32 gbt_var_node_cp_len(const GBT_VARKEY *node, const gbtree_vinfo *tinfo) { GBT_VARKEY_R r = gbt_var_key_readable(node); int32 i = 0; int32 l = 0; int32 t1len = VARSIZE(r.lower) - VARHDRSZ; int32 t2len = VARSIZE(r.upper) - VARHDRSZ; int32 ml = Min(t1len, t2len); char *p1 = VARDATA(r.lower); char *p2 = VARDATA(r.upper); if (ml == 0) return 0; while (i < ml) { if (tinfo->eml > 1 && l == 0) { if ((l = pg_mblen(p1)) != pg_mblen(p2)) { return i; } } if (*p1 != *p2) { if (tinfo->eml > 1) { return (i - l + 1); } else { return i; } } p1++; p2++; l--; i++; } return ml; /* lower == upper */ } /* * returns true, if query matches prefix ( common prefix ) */ static bool gbt_bytea_pf_match(const bytea *pf, const bytea *query, const gbtree_vinfo *tinfo) { bool out = false; int32 qlen = VARSIZE(query) - VARHDRSZ; int32 nlen = VARSIZE(pf) - VARHDRSZ; if (nlen <= qlen) { char *q = VARDATA(query); char *n = VARDATA(pf); out = (memcmp(q, n, nlen) == 0); } return out; } /* * returns true, if query matches node using common prefix */ static bool gbt_var_node_pf_match(const GBT_VARKEY_R *node, const bytea *query, const gbtree_vinfo *tinfo) { return (tinfo->trnc && (gbt_bytea_pf_match(node->lower, query, tinfo) || gbt_bytea_pf_match(node->upper, query, tinfo))); } /* * truncates / compresses the node key * cpf_length .. common prefix length */ static GBT_VARKEY * gbt_var_node_truncate(const GBT_VARKEY *node, int32 cpf_length, const gbtree_vinfo *tinfo) { GBT_VARKEY *out = NULL; GBT_VARKEY_R r = gbt_var_key_readable(node); int32 len1 = VARSIZE(r.lower) - VARHDRSZ; int32 len2 = VARSIZE(r.upper) - VARHDRSZ; int32 si; char *out2; len1 = Min(len1, (cpf_length + 1)); len2 = Min(len2, (cpf_length + 1)); si = 2 * VARHDRSZ + INTALIGN(len1 + VARHDRSZ) + len2; out = (GBT_VARKEY *) palloc0(si); SET_VARSIZE(out, si); memcpy(VARDATA(out), r.lower, len1 + VARHDRSZ); SET_VARSIZE(VARDATA(out), len1 + VARHDRSZ); out2 = VARDATA(out) + INTALIGN(len1 + VARHDRSZ); memcpy(out2, r.upper, len2 + VARHDRSZ); SET_VARSIZE(out2, len2 + VARHDRSZ); return out; } void gbt_var_bin_union(Datum *u, GBT_VARKEY *e, Oid collation, const gbtree_vinfo *tinfo, FmgrInfo *flinfo) { GBT_VARKEY_R eo = gbt_var_key_readable(e); GBT_VARKEY_R nr; if (eo.lower == eo.upper) /* leaf */ { GBT_VARKEY *tmp; tmp = gbt_var_leaf2node(e, tinfo, flinfo); if (tmp != e) eo = gbt_var_key_readable(tmp); } if (DatumGetPointer(*u)) { GBT_VARKEY_R ro = gbt_var_key_readable((GBT_VARKEY *) DatumGetPointer(*u)); bool update = false; nr.lower = ro.lower; nr.upper = ro.upper; if (tinfo->f_cmp(ro.lower, eo.lower, collation, flinfo) > 0) { nr.lower = eo.lower; update = true; } if (tinfo->f_cmp(ro.upper, eo.upper, collation, flinfo) < 0) { nr.upper = eo.upper; update = true; } if (update) *u = PointerGetDatum(gbt_var_key_copy(&nr)); } else { nr.lower = eo.lower; nr.upper = eo.upper; *u = PointerGetDatum(gbt_var_key_copy(&nr)); } } GISTENTRY * gbt_var_compress(GISTENTRY *entry, const gbtree_vinfo *tinfo) { GISTENTRY *retval; if (entry->leafkey) { struct varlena *leaf = PG_DETOAST_DATUM(entry->key); GBT_VARKEY *r; r = gbt_var_key_from_datum(leaf); retval = palloc(sizeof(GISTENTRY)); gistentryinit(*retval, PointerGetDatum(r), entry->rel, entry->page, entry->offset, true); } else retval = entry; return retval; } Datum gbt_var_fetch(PG_FUNCTION_ARGS) { GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0); GBT_VARKEY *key = (GBT_VARKEY *) PG_DETOAST_DATUM(entry->key); GBT_VARKEY_R r = gbt_var_key_readable(key); GISTENTRY *retval; retval = palloc(sizeof(GISTENTRY)); gistentryinit(*retval, PointerGetDatum(r.lower), entry->rel, entry->page, entry->offset, true); PG_RETURN_POINTER(retval); } GBT_VARKEY * gbt_var_union(const GistEntryVector *entryvec, int32 *size, Oid collation, const gbtree_vinfo *tinfo, FmgrInfo *flinfo) { int i = 0, numranges = entryvec->n; GBT_VARKEY *cur; Datum out; GBT_VARKEY_R rk; *size = sizeof(GBT_VARKEY); cur = (GBT_VARKEY *) DatumGetPointer(entryvec->vector[0].key); rk = gbt_var_key_readable(cur); out = PointerGetDatum(gbt_var_key_copy(&rk)); for (i = 1; i < numranges; i++) { cur = (GBT_VARKEY *) DatumGetPointer(entryvec->vector[i].key); gbt_var_bin_union(&out, cur, collation, tinfo, flinfo); } /* Truncate (=compress) key */ if (tinfo->trnc) { int32 plen; GBT_VARKEY *trc = NULL; plen = gbt_var_node_cp_len((GBT_VARKEY *) DatumGetPointer(out), tinfo); trc = gbt_var_node_truncate((GBT_VARKEY *) DatumGetPointer(out), plen + 1, tinfo); out = PointerGetDatum(trc); } return ((GBT_VARKEY *) DatumGetPointer(out)); } bool gbt_var_same(Datum d1, Datum d2, Oid collation, const gbtree_vinfo *tinfo, FmgrInfo *flinfo) { GBT_VARKEY *t1 = (GBT_VARKEY *) DatumGetPointer(d1); GBT_VARKEY *t2 = (GBT_VARKEY *) DatumGetPointer(d2); GBT_VARKEY_R r1, r2; r1 = gbt_var_key_readable(t1); r2 = gbt_var_key_readable(t2); return (tinfo->f_cmp(r1.lower, r2.lower, collation, flinfo) == 0 && tinfo->f_cmp(r1.upper, r2.upper, collation, flinfo) == 0); } float * gbt_var_penalty(float *res, const GISTENTRY *o, const GISTENTRY *n, Oid collation, const gbtree_vinfo *tinfo, FmgrInfo *flinfo) { GBT_VARKEY *orge = (GBT_VARKEY *) DatumGetPointer(o->key); GBT_VARKEY *newe = (GBT_VARKEY *) DatumGetPointer(n->key); GBT_VARKEY_R ok, nk; *res = 0.0; nk = gbt_var_key_readable(newe); if (nk.lower == nk.upper) /* leaf */ { GBT_VARKEY *tmp; tmp = gbt_var_leaf2node(newe, tinfo, flinfo); if (tmp != newe) nk = gbt_var_key_readable(tmp); } ok = gbt_var_key_readable(orge); if ((VARSIZE(ok.lower) - VARHDRSZ) == 0 && (VARSIZE(ok.upper) - VARHDRSZ) == 0) *res = 0.0; else if (!((tinfo->f_cmp(nk.lower, ok.lower, collation, flinfo) >= 0 || gbt_bytea_pf_match(ok.lower, nk.lower, tinfo)) && (tinfo->f_cmp(nk.upper, ok.upper, collation, flinfo) <= 0 || gbt_bytea_pf_match(ok.upper, nk.upper, tinfo)))) { Datum d = PointerGetDatum(0); double dres; int32 ol, ul; gbt_var_bin_union(&d, orge, collation, tinfo, flinfo); ol = gbt_var_node_cp_len((GBT_VARKEY *) DatumGetPointer(d), tinfo); gbt_var_bin_union(&d, newe, collation, tinfo, flinfo); ul = gbt_var_node_cp_len((GBT_VARKEY *) DatumGetPointer(d), tinfo); if (ul < ol) { dres = (ol - ul); /* reduction of common prefix len */ } else { GBT_VARKEY_R uk = gbt_var_key_readable((GBT_VARKEY *) DatumGetPointer(d)); unsigned char tmp[4]; tmp[0] = (unsigned char) (((VARSIZE(ok.lower) - VARHDRSZ) <= ul) ? 0 : (VARDATA(ok.lower)[ul])); tmp[1] = (unsigned char) (((VARSIZE(uk.lower) - VARHDRSZ) <= ul) ? 0 : (VARDATA(uk.lower)[ul])); tmp[2] = (unsigned char) (((VARSIZE(ok.upper) - VARHDRSZ) <= ul) ? 0 : (VARDATA(ok.upper)[ul])); tmp[3] = (unsigned char) (((VARSIZE(uk.upper) - VARHDRSZ) <= ul) ? 0 : (VARDATA(uk.upper)[ul])); dres = abs(tmp[0] - tmp[1]) + abs(tmp[3] - tmp[2]); dres /= 256.0; } *res += FLT_MIN; *res += (float) (dres / ((double) (ol + 1))); *res *= (FLT_MAX / (o->rel->rd_att->natts + 1)); } return res; } static int gbt_vsrt_cmp(const void *a, const void *b, void *arg) { GBT_VARKEY_R ar = gbt_var_key_readable(((const Vsrt *) a)->t); GBT_VARKEY_R br = gbt_var_key_readable(((const Vsrt *) b)->t); const gbt_vsrt_arg *varg = (const gbt_vsrt_arg *) arg; int res; res = varg->tinfo->f_cmp(ar.lower, br.lower, varg->collation, varg->flinfo); if (res == 0) return varg->tinfo->f_cmp(ar.upper, br.upper, varg->collation, varg->flinfo); return res; } GIST_SPLITVEC * gbt_var_picksplit(const GistEntryVector *entryvec, GIST_SPLITVEC *v, Oid collation, const gbtree_vinfo *tinfo, FmgrInfo *flinfo) { OffsetNumber i, maxoff = entryvec->n - 1; Vsrt *arr; int svcntr = 0, nbytes; char *cur; GBT_VARKEY **sv = NULL; gbt_vsrt_arg varg; arr = (Vsrt *) palloc((maxoff + 1) * sizeof(Vsrt)); nbytes = (maxoff + 2) * sizeof(OffsetNumber); v->spl_left = (OffsetNumber *) palloc(nbytes); v->spl_right = (OffsetNumber *) palloc(nbytes); v->spl_ldatum = PointerGetDatum(0); v->spl_rdatum = PointerGetDatum(0); v->spl_nleft = 0; v->spl_nright = 0; sv = palloc(sizeof(bytea *) * (maxoff + 1)); /* Sort entries */ for (i = FirstOffsetNumber; i <= maxoff; i = OffsetNumberNext(i)) { GBT_VARKEY_R ro; cur = (char *) DatumGetPointer(entryvec->vector[i].key); ro = gbt_var_key_readable((GBT_VARKEY *) cur); if (ro.lower == ro.upper) /* leaf */ { sv[svcntr] = gbt_var_leaf2node((GBT_VARKEY *) cur, tinfo, flinfo); arr[i].t = sv[svcntr]; if (sv[svcntr] != (GBT_VARKEY *) cur) svcntr++; } else arr[i].t = (GBT_VARKEY *) cur; arr[i].i = i; } /* sort */ varg.tinfo = tinfo; varg.collation = collation; varg.flinfo = flinfo; qsort_arg(&arr[FirstOffsetNumber], maxoff - FirstOffsetNumber + 1, sizeof(Vsrt), gbt_vsrt_cmp, &varg); /* We do simply create two parts */ for (i = FirstOffsetNumber; i <= maxoff; i = OffsetNumberNext(i)) { if (i <= (maxoff - FirstOffsetNumber + 1) / 2) { gbt_var_bin_union(&v->spl_ldatum, arr[i].t, collation, tinfo, flinfo); v->spl_left[v->spl_nleft] = arr[i].i; v->spl_nleft++; } else { gbt_var_bin_union(&v->spl_rdatum, arr[i].t, collation, tinfo, flinfo); v->spl_right[v->spl_nright] = arr[i].i; v->spl_nright++; } } /* Truncate (=compress) key */ if (tinfo->trnc) { int32 ll = gbt_var_node_cp_len((GBT_VARKEY *) DatumGetPointer(v->spl_ldatum), tinfo); int32 lr = gbt_var_node_cp_len((GBT_VARKEY *) DatumGetPointer(v->spl_rdatum), tinfo); GBT_VARKEY *dl; GBT_VARKEY *dr; ll = Max(ll, lr); ll++; dl = gbt_var_node_truncate((GBT_VARKEY *) DatumGetPointer(v->spl_ldatum), ll, tinfo); dr = gbt_var_node_truncate((GBT_VARKEY *) DatumGetPointer(v->spl_rdatum), ll, tinfo); v->spl_ldatum = PointerGetDatum(dl); v->spl_rdatum = PointerGetDatum(dr); } return v; } /* * The GiST consistent method */ bool gbt_var_consistent(GBT_VARKEY_R *key, const void *query, StrategyNumber strategy, Oid collation, bool is_leaf, const gbtree_vinfo *tinfo, FmgrInfo *flinfo) { bool retval = false; switch (strategy) { case BTLessEqualStrategyNumber: if (is_leaf) retval = tinfo->f_ge(query, key->lower, collation, flinfo); else retval = tinfo->f_cmp(query, key->lower, collation, flinfo) >= 0 || gbt_var_node_pf_match(key, query, tinfo); break; case BTLessStrategyNumber: if (is_leaf) retval = tinfo->f_gt(query, key->lower, collation, flinfo); else retval = tinfo->f_cmp(query, key->lower, collation, flinfo) >= 0 || gbt_var_node_pf_match(key, query, tinfo); break; case BTEqualStrategyNumber: if (is_leaf) retval = tinfo->f_eq(query, key->lower, collation, flinfo); else retval = (tinfo->f_cmp(key->lower, query, collation, flinfo) <= 0 && tinfo->f_cmp(query, key->upper, collation, flinfo) <= 0) || gbt_var_node_pf_match(key, query, tinfo); break; case BTGreaterStrategyNumber: if (is_leaf) retval = tinfo->f_lt(query, key->upper, collation, flinfo); else retval = tinfo->f_cmp(query, key->upper, collation, flinfo) <= 0 || gbt_var_node_pf_match(key, query, tinfo); break; case BTGreaterEqualStrategyNumber: if (is_leaf) retval = tinfo->f_le(query, key->upper, collation, flinfo); else retval = tinfo->f_cmp(query, key->upper, collation, flinfo) <= 0 || gbt_var_node_pf_match(key, query, tinfo); break; case BtreeGistNotEqualStrategyNumber: retval = !(tinfo->f_eq(query, key->lower, collation, flinfo) && tinfo->f_eq(query, key->upper, collation, flinfo)); break; default: retval = false; } return retval; }