2 * contrib/ltree/_ltree_gist.c
5 * GiST support for ltree[]
6 * Teodor Sigaev <teodor@stack.net>
10 #include "access/gist.h"
11 #include "access/skey.h"
/*
 * Declare, via PG_FUNCTION_INFO_V1, the six GiST support functions that are
 * defined further down in this file: compress, same, union, penalty,
 * picksplit and consistent.
 */
16 PG_FUNCTION_INFO_V1(_ltree_compress);
17 PG_FUNCTION_INFO_V1(_ltree_same);
18 PG_FUNCTION_INFO_V1(_ltree_union);
19 PG_FUNCTION_INFO_V1(_ltree_penalty);
20 PG_FUNCTION_INFO_V1(_ltree_picksplit);
21 PG_FUNCTION_INFO_V1(_ltree_consistent);
/* Key of entry number `idx` in an entry vector, viewed as an ltree_gist. */
#define GETENTRY(entryvec, idx) \
	((ltree_gist *) DatumGetPointer((entryvec)->vector[(idx)].key))

/*
 * Address of the item that follows `item`: skip VARSIZE(item) bytes, rounded
 * up with INTALIGN.  Note that `item` is evaluated twice.
 */
#define NEXTVAL(item) \
	((ltree *) ((char *) (item) + INTALIGN(VARSIZE(item))))
/*
 * Bit-count lookup table: entry b holds how many bits are set in the byte
 * value b (0..255).  sizebitvec() indexes it with one signature byte at a
 * time, hemdistsign() with the XOR of two signature bytes.
 */
26 /* Number of one-bits in an unsigned byte */
27 static const uint8 number_of_ones[256] = {
28 0, 1, 1, 2, 1, 2, 2, 3, 1, 2, 2, 3, 2, 3, 3, 4,
29 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,
30 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,
31 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,
32 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,
33 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,
34 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,
35 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,
36 1, 2, 2, 3, 2, 3, 3, 4, 2, 3, 3, 4, 3, 4, 4, 5,
37 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,
38 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,
39 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,
40 2, 3, 3, 4, 3, 4, 4, 5, 3, 4, 4, 5, 4, 5, 5, 6,
41 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,
42 3, 4, 4, 5, 4, 5, 5, 6, 4, 5, 5, 6, 5, 6, 6, 7,
43 4, 5, 5, 6, 5, 6, 6, 7, 5, 6, 6, 7, 6, 7, 7, 8
/*
 * WISH_F(a, b, c): evaluates to -((a) - (b))^3 * (c) as a double.
 *
 * _ltree_picksplit() adds this term to one side of its left/right distance
 * comparison, passing the current left and right entry counts as a and b.
 *
 * The difference is converted to double before it is cubed, so the cube
 * cannot overflow the integer type of the arguments, and the whole expansion
 * is parenthesized so it is safe inside any surrounding expression.
 * Each argument is evaluated more than once: do not pass expressions with
 * side effects.
 */
#define WISH_F(a,b,c) \
	((double) (-((double) ((a) - (b)) * (double) ((a) - (b)) * (double) ((a) - (b))) * (c)))
/*
 * hashing: fold the level labels of ltree `t` into the signature `sign`.
 *
 * The walk starts at LTREE_FIRST(t) and advances with LEVEL_NEXT(); each
 * label is hashed with ltree_crc32_sz(name, len).
 *
 * NOTE(review): the loop construct and the statement that records `hash` in
 * `sign` are not visible in this excerpt -- confirm against the full file.
 */
50 hashing(BITVECP sign, ltree *t)
/* Level count read from the ltree header. */
52 int tlen = t->numlevel;
53 ltree_level *cur = LTREE_FIRST(t);
/* Hash the current level's label (name bytes, explicit length). */
58 hash = ltree_crc32_sz(cur->name, cur->len);
/* Step to the following level. */
60 cur = LEVEL_NEXT(cur);
/*
 * _ltree_compress: GiST compress support function.
 *
 * Argument 0 is the GISTENTRY to compress.  The function returns a GISTENTRY
 * pointer: the incoming entry itself, unless one of the two paths below
 * builds a new key.
 *
 *  - Array path: the entry's key is read as an ltree[] array and replaced by
 *    a signature key of LTG_HDRSIZE + ASIGLEN bytes whose signature starts
 *    zeroed and receives the hash bits produced by hashing().
 *  - Signature path (key not flagged ALLTRUE): a signature byte different
 *    from 0xff returns the entry unchanged; otherwise a key carrying the
 *    LTG_ALLTRUE flag is built in its place.
 *
 * NOTE(review): the condition that selects the array path, the loops around
 * hashing() and around the 0xff test, the ereport() heads, and the `len`
 * used on the signature path are elided in this excerpt.
 */
66 _ltree_compress(PG_FUNCTION_ARGS)
68 GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
/* Default result: hand the incoming entry back untouched. */
69 GISTENTRY *retval = entry;
/* ---- array path: build a signature key from the ltree[] value ---- */
74 ArrayType *val = DatumGetArrayTypeP(entry->key);
/* New key size: header plus a full signature. */
75 int32 len = LTG_HDRSIZE + ASIGLEN;
76 int num = ArrayGetNItems(ARR_NDIM(val), ARR_DIMS(val));
/* First array element; elements are stored back to back in the data area. */
77 ltree *item = (ltree *) ARR_DATA_PTR(val);
/* Arrays with more than one dimension are reported as an error. */
79 if (ARR_NDIM(val) > 1)
81 (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR),
82 errmsg("array must be one-dimensional")));
/* So are arrays that contain NULL elements. */
83 if (array_contains_nulls(val))
85 (errcode(ERRCODE_NULL_VALUE_NOT_ALLOWED),
86 errmsg("array must not contain nulls")));
88 key = (ltree_gist *) palloc(len);
89 SET_VARSIZE(key, len);
/* Start from an empty signature, then hash array items into it. */
92 MemSet(LTG_SIGN(key), 0, ASIGLEN);
95 hashing(LTG_SIGN(key), item);
/* Wrap the new key in a fresh GISTENTRY that keeps rel/page/offset. */
100 retval = (GISTENTRY *) palloc(sizeof(GISTENTRY));
101 gistentryinit(*retval, PointerGetDatum(key),
102 entry->rel, entry->page,
103 entry->offset, FALSE);
/* ---- signature path: key exists and is not already ALLTRUE ---- */
105 else if (!LTG_ISALLTRUE(entry->key))
111 BITVECP sign = LTG_SIGN(DatumGetPointer(entry->key));
/* A byte with a clear bit means the key stays as it is. */
115 if ((sign[i] & 0xff) != 0xff)
116 PG_RETURN_POINTER(retval);
/* No such byte was found: replace the key by an ALLTRUE-flagged one. */
119 key = (ltree_gist *) palloc(len);
120 SET_VARSIZE(key, len);
121 key->flag = LTG_ALLTRUE;
123 retval = (GISTENTRY *) palloc(sizeof(GISTENTRY));
124 gistentryinit(*retval, PointerGetDatum(key),
125 entry->rel, entry->page,
126 entry->offset, FALSE);
128 PG_RETURN_POINTER(retval);
/*
 * _ltree_same: GiST same support function.
 *
 * Arguments 0 and 1 are the two ltree_gist keys to compare; argument 2 is a
 * pointer to the bool that receives the verdict, and that same pointer is
 * returned.  The ALLTRUE flag of each key is examined first; only when
 * neither key is ALLTRUE are the signatures (LTG_SIGN) consulted.
 *
 * NOTE(review): the assignments to *result and the signature comparison are
 * elided in this excerpt.
 */
132 _ltree_same(PG_FUNCTION_ARGS)
134 ltree_gist *a = (ltree_gist *) PG_GETARG_POINTER(0);
135 ltree_gist *b = (ltree_gist *) PG_GETARG_POINTER(1);
136 bool *result = (bool *) PG_GETARG_POINTER(2);
/* Both keys ALLTRUE. */
138 if (LTG_ISALLTRUE(a) && LTG_ISALLTRUE(b))
/* Exactly one key ALLTRUE (either side). */
140 else if (LTG_ISALLTRUE(a))
142 else if (LTG_ISALLTRUE(b))
/* Neither is ALLTRUE: work on the signatures themselves. */
147 BITVECP sa = LTG_SIGN(a),
160 PG_RETURN_POINTER(result);
/*
 * unionkey: merge the key `add` into the accumulating signature `sbase`.
 *
 * An ALLTRUE `add` is special-cased before its signature is used.  The
 * return value is tested as a condition by _ltree_union().
 *
 * NOTE(review): the merge itself and the return statements are elided in
 * this excerpt.
 */
164 unionkey(BITVECP sbase, ltree_gist *add)
167 BITVECP sadd = LTG_SIGN(add);
169 if (LTG_ISALLTRUE(add))
/*
 * _ltree_union: GiST union support function.
 *
 * Argument 0 is the vector of entries to combine, argument 1 a pointer to an
 * int (`size`).  All entry keys are merged into a zero-initialised signature
 * `base` through unionkey(); the result is a newly palloc'd ltree_gist that
 * consists of the header only when the ALLTRUE flag is set, and of header
 * plus a copy of `base` otherwise.
 *
 * NOTE(review): the declarations of `base`, `flag`, `len`, `result`, the
 * handling of a true return from unionkey(), and the stores to result->flag
 * and *size are elided in this excerpt.
 */
178 _ltree_union(PG_FUNCTION_ARGS)
180 GistEntryVector *entryvec = (GistEntryVector *) PG_GETARG_POINTER(0);
181 int *size = (int *) PG_GETARG_POINTER(1);
/* Begin with an empty accumulator signature. */
188 MemSet((void *) base, 0, sizeof(ABITVEC));
189 for (i = 0; i < entryvec->n; i++)
191 if (unionkey(base, GETENTRY(entryvec, i)))
/* An ALLTRUE result carries no signature bytes at all. */
198 len = LTG_HDRSIZE + ((flag & LTG_ALLTRUE) ? 0 : ASIGLEN);
199 result = (ltree_gist *) palloc(len);
200 SET_VARSIZE(result, len);
/* Only a non-ALLTRUE key has room for the accumulated signature. */
202 if (!LTG_ISALLTRUE(result))
203 memcpy((void *) LTG_SIGN(result), (void *) base, sizeof(ABITVEC));
206 PG_RETURN_POINTER(result);
/*
 * sizebitvec: accumulate the number of set bits in signature `sign`, one
 * byte at a time, using the number_of_ones lookup table.
 *
 * NOTE(review): the loop over the signature bytes and the return statement
 * are elided in this excerpt.
 */
210 sizebitvec(BITVECP sign)
/* Cast to unsigned char so the byte is a valid 0..255 table index. */
216 size += number_of_ones[(unsigned char) sign[i]];
/*
 * hemdistsign: accumulate the number of differing bits between signatures
 * `a` and `b`: each pair of bytes is XORed and the set bits of the result
 * are counted through number_of_ones.
 *
 * NOTE(review): the loop over the signature bytes and the return statement
 * are elided in this excerpt.
 */
221 hemdistsign(BITVECP a, BITVECP b)
/* Bits set in the XOR are exactly the positions where a and b differ. */
229 diff = (unsigned char) (a[i] ^ b[i]);
230 dist += number_of_ones[diff];
/*
 * hemdist: distance between two ltree_gist keys, with ALLTRUE handling.
 *
 *  - exactly one key ALLTRUE: ASIGLENBIT minus the number of bits set in the
 *    other key's signature;
 *  - neither ALLTRUE: hemdistsign() of the two signatures.
 *
 * NOTE(review): the value returned when both keys are ALLTRUE is elided in
 * this excerpt.
 */
236 hemdist(ltree_gist *a, ltree_gist *b)
238 if (LTG_ISALLTRUE(a))
240 if (LTG_ISALLTRUE(b))
/* a is ALLTRUE, b is not: count the bits b is missing. */
243 return ASIGLENBIT - sizebitvec(LTG_SIGN(b));
245 else if (LTG_ISALLTRUE(b))
/* b is ALLTRUE, a is not: count the bits a is missing. */
246 return ASIGLENBIT - sizebitvec(LTG_SIGN(a));
/* Two real signatures: plain bitwise distance. */
248 return hemdistsign(LTG_SIGN(a), LTG_SIGN(b));
253 _ltree_penalty(PG_FUNCTION_ARGS)
255 ltree_gist *origval = (ltree_gist *) DatumGetPointer(((GISTENTRY *) PG_GETARG_POINTER(0))->key);
256 ltree_gist *newval = (ltree_gist *) DatumGetPointer(((GISTENTRY *) PG_GETARG_POINTER(1))->key);
257 float *penalty = (float *) PG_GETARG_POINTER(2);
259 *penalty = hemdist(origval, newval);
260 PG_RETURN_POINTER(penalty);
270 comparecost(const void *a, const void *b)
272 return ((const SPLITCOST *) a)->cost - ((const SPLITCOST *) b)->cost;
/*
 * _ltree_picksplit: GiST picksplit support function.
 *
 * Argument 0 is the vector of entries to split, argument 1 the GIST_SPLITVEC
 * to fill in; the GIST_SPLITVEC pointer is returned.
 *
 * Visible phases:
 *  1. allocate the spl_left / spl_right offset arrays;
 *  2. compare every pair of entries with hemdist() to pick two seeds;
 *  3. create the left/right union keys as copies of the seed keys;
 *  4. give every entry the cost |dist to left - dist to right| and sort the
 *     entries by that cost;
 *  5. walk the sorted entries, put each on the left or right side and merge
 *     its signature into that side's union key;
 *  6. publish the two union keys in spl_ldatum / spl_rdatum.
 *
 * NOTE(review): most local declarations, the seed bookkeeping inside the
 * pair loop, the fallback taken when no seed was chosen, the special
 * handling of the seed entries in the distribution loop and the updates of
 * left/right/spl_nleft/spl_nright are elided in this excerpt.
 */
276 _ltree_picksplit(PG_FUNCTION_ARGS)
278 GistEntryVector *entryvec = (GistEntryVector *) PG_GETARG_POINTER(0);
279 GIST_SPLITVEC *v = (GIST_SPLITVEC *) PG_GETARG_POINTER(1);
/* Seeds start at 0; step 2 below tests for that value afterwards. */
291 OffsetNumber seed_1 = 0,
298 SPLITCOST *costvector;
/* Both output arrays are sized for maxoff + 2 offsets. */
302 maxoff = entryvec->n - 2;
303 nbytes = (maxoff + 2) * sizeof(OffsetNumber);
304 v->spl_left = (OffsetNumber *) palloc(nbytes);
305 v->spl_right = (OffsetNumber *) palloc(nbytes);
/* Seed search: every pair (k, j) with k < j is measured with hemdist(). */
307 for (k = FirstOffsetNumber; k < maxoff; k = OffsetNumberNext(k))
309 _k = GETENTRY(entryvec, k);
310 for (j = OffsetNumberNext(k); j <= maxoff; j = OffsetNumberNext(j))
312 size_waste = hemdist(_k, GETENTRY(entryvec, j));
/* A distance above the best one so far (`waste`) is handled here. */
313 if (size_waste > waste)
324 right = v->spl_right;
/* A seed still equal to 0 means the pair search did not set it. */
327 if (seed_1 == 0 || seed_2 == 0)
333 /* form initial unions: each side's key starts as a copy of its seed's key */
/* Left side: an ALLTRUE seed yields a header-only ALLTRUE key ... */
334 if (LTG_ISALLTRUE(GETENTRY(entryvec, seed_1)))
336 datum_l = (ltree_gist *) palloc(LTG_HDRSIZE);
337 SET_VARSIZE(datum_l, LTG_HDRSIZE);
338 datum_l->flag = LTG_ALLTRUE;
/* ... any other seed yields header + a copy of the seed's signature. */
342 datum_l = (ltree_gist *) palloc(LTG_HDRSIZE + ASIGLEN);
343 SET_VARSIZE(datum_l, LTG_HDRSIZE + ASIGLEN);
345 memcpy((void *) LTG_SIGN(datum_l), (void *) LTG_SIGN(GETENTRY(entryvec, seed_1)), sizeof(ABITVEC));
/* Right side: same construction from seed_2. */
347 if (LTG_ISALLTRUE(GETENTRY(entryvec, seed_2)))
349 datum_r = (ltree_gist *) palloc(LTG_HDRSIZE);
350 SET_VARSIZE(datum_r, LTG_HDRSIZE);
351 datum_r->flag = LTG_ALLTRUE;
355 datum_r = (ltree_gist *) palloc(LTG_HDRSIZE + ASIGLEN);
356 SET_VARSIZE(datum_r, LTG_HDRSIZE + ASIGLEN);
358 memcpy((void *) LTG_SIGN(datum_r), (void *) LTG_SIGN(GETENTRY(entryvec, seed_2)), sizeof(ABITVEC));
/* From here on maxoff is one larger, so the loops below cover one more entry. */
361 maxoff = OffsetNumberNext(maxoff);
362 /* sort entries by |distance to left key - distance to right key| before distributing them */
363 costvector = (SPLITCOST *) palloc(sizeof(SPLITCOST) * maxoff);
364 for (j = FirstOffsetNumber; j <= maxoff; j = OffsetNumberNext(j))
/* Offsets start at FirstOffsetNumber while costvector is 0-based, hence j - 1. */
366 costvector[j - 1].pos = j;
367 _j = GETENTRY(entryvec, j);
368 size_alpha = hemdist(datum_l, _j);
369 size_beta = hemdist(datum_r, _j);
370 costvector[j - 1].cost = Abs(size_alpha - size_beta);
372 qsort((void *) costvector, maxoff, sizeof(SPLITCOST), comparecost);
/* union_l / union_r point into datum_l / datum_r: merges below update them in place. */
374 union_l = LTG_SIGN(datum_l);
375 union_r = LTG_SIGN(datum_r);
/* Distribute the entries in sorted-cost order. */
377 for (k = 0; k < maxoff; k++)
379 j = costvector[k].pos;
/* The seed entries get their own branches (bodies elided). */
386 else if (j == seed_2)
/* Re-measure against the current union keys, which change as entries are merged. */
392 _j = GETENTRY(entryvec, j);
393 size_alpha = hemdist(datum_l, _j);
394 size_beta = hemdist(datum_r, _j);
/*
 * Left is chosen when the entry is closer to the left key; the WISH_F term
 * shifts the threshold according to the current difference between
 * spl_nleft and spl_nright.
 */
396 if (size_alpha < size_beta + WISH_F(v->spl_nleft, v->spl_nright, 0.00001))
/* Merging with an ALLTRUE key: fill the left signature with 0xff unless datum_l is itself ALLTRUE. */
398 if (LTG_ISALLTRUE(datum_l) || LTG_ISALLTRUE(_j))
400 if (!LTG_ISALLTRUE(datum_l))
401 MemSet((void *) union_l, 0xff, sizeof(ABITVEC));
/* Otherwise OR the entry's signature bytes into the left union. */
407 union_l[i] |= ptr[i];
/* Right side: mirror image of the left-side merge. */
414 if (LTG_ISALLTRUE(datum_r) || LTG_ISALLTRUE(_j))
416 if (!LTG_ISALLTRUE(datum_r))
417 MemSet((void *) union_r, 0xff, sizeof(ABITVEC));
423 union_r[i] |= ptr[i];
/* NOTE(review): presumably writes a trailing FirstOffsetNumber after the last offset of each list -- confirm. */
430 *right = *left = FirstOffsetNumber;
/* Hand the two union keys back to the caller. */
432 v->spl_ldatum = PointerGetDatum(datum_l);
433 v->spl_rdatum = PointerGetDatum(datum_r);
435 PG_RETURN_POINTER(v);
/*
 * gist_te: test an ltree `query` against the signature key `key`.
 *
 * An ALLTRUE key is special-cased up front.  Otherwise the levels of the
 * query are visited from LTREE_FIRST(query) via LEVEL_NEXT(); each label is
 * hashed with ltree_crc32_sz() and the corresponding signature bit
 * (AHASHVAL of the hash) is tested with GETBIT().
 *
 * NOTE(review): the loop construct and all return statements are elided in
 * this excerpt.
 */
439 gist_te(ltree_gist *key, ltree *query)
441 ltree_level *curq = LTREE_FIRST(query);
442 BITVECP sign = LTG_SIGN(key);
443 int qlen = query->numlevel;
446 if (LTG_ISALLTRUE(key))
451 hv = ltree_crc32_sz(curq->name, curq->len);
/* The bit for this label is not set in the signature. */
452 if (!GETBIT(sign, AHASHVAL(hv)))
454 curq = LEVEL_NEXT(curq);
462 checkcondition_bit(void *checkval, ITEM *val)
464 return (FLG_CANLOOKSIGN(val->flag)) ? GETBIT(checkval, AHASHVAL(val->val)) : true;
/*
 * gist_qtxt: test an ltxtquery against the signature key `key`.
 *
 * An ALLTRUE key is special-cased up front; otherwise the answer is whatever
 * ltree_execute() returns when handed the key's signature as check value.
 *
 * NOTE(review): the first and last arguments of the ltree_execute() call and
 * the ALLTRUE return value are elided in this excerpt.
 */
468 gist_qtxt(ltree_gist *key, ltxtquery *query)
470 if (LTG_ISALLTRUE(key))
473 return ltree_execute(
475 (void *) LTG_SIGN(key), false,
/*
 * gist_qe: test an lquery against the signature key `key`.
 *
 * An ALLTRUE key is special-cased up front.  Otherwise the query levels are
 * visited from LQUERY_FIRST(query) via LQL_NEXT().  For a level that has
 * variants and satisfies LQL_CANLOOKSIGN, its variants are visited from
 * LQL_FIRST() via LVAR_NEXT() and the signature bit of each variant's hash
 * value (AHASHVAL(curv->val)) is tested.
 *
 * NOTE(review): the loop constructs, the use of `isexist` and all return
 * statements are elided in this excerpt.
 */
481 gist_qe(ltree_gist *key, lquery *query)
483 lquery_level *curq = LQUERY_FIRST(query);
484 BITVECP sign = LTG_SIGN(key);
485 int qlen = query->numlevel;
487 if (LTG_ISALLTRUE(key))
/* Only levels with at least one variant that may be checked against the signature. */
492 if (curq->numvar && LQL_CANLOOKSIGN(curq))
494 bool isexist = false;
495 int vlen = curq->numvar;
496 lquery_variant *curv = LQL_FIRST(curq);
/* This variant's bit is present in the signature. */
500 if (GETBIT(sign, AHASHVAL(curv->val)))
505 curv = LVAR_NEXT(curv);
512 curq = LQL_NEXT(curq);
/*
 * _arrq_cons: test an array of lquery values against the signature key.
 *
 * The array's element count is computed with ArrayGetNItems(); arrays with
 * more than one dimension or with NULL elements are reported as errors.
 * Elements are then tried with gist_qe(), stepping from one element to the
 * next with NEXTVAL().
 *
 * NOTE(review): the ereport() heads, the loop over the elements and the
 * return statements are elided in this excerpt.
 */
520 _arrq_cons(ltree_gist *key, ArrayType *_query)
/* First lquery element of the array's data area. */
522 lquery *query = (lquery *) ARR_DATA_PTR(_query);
523 int num = ArrayGetNItems(ARR_NDIM(_query), ARR_DIMS(_query));
525 if (ARR_NDIM(_query) > 1)
527 (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR),
528 errmsg("array must be one-dimensional")));
529 if (array_contains_nulls(_query))
531 (errcode(ERRCODE_NULL_VALUE_NOT_ALLOWED),
532 errmsg("array must not contain nulls")));
/* The current element matches the key. */
536 if (gist_qe(key, query))
/* Advance to the following element. */
539 query = (lquery *) NEXTVAL(query);
/*
 * _ltree_consistent: GiST consistent support function.
 *
 * Argument 0 is the index entry, argument 1 the (detoasted) query value,
 * argument 2 the strategy number and argument 4 a pointer to the recheck
 * flag.  Depending on the strategy the query is interpreted as an ltree, an
 * lquery, an ltxtquery or an array and handed to gist_te(), gist_qe(),
 * gist_qtxt() or _arrq_cons() respectively; an unknown strategy raises an
 * error through elog().
 *
 * NOTE(review): the case labels, the store to *recheck and the end of the
 * function are not visible in this excerpt.
 */
545 _ltree_consistent(PG_FUNCTION_ARGS)
547 GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
/* Detoast once; the same pointer is cast per strategy below. */
548 char *query = (char *) DatumGetPointer(PG_DETOAST_DATUM(PG_GETARG_DATUM(1)));
549 StrategyNumber strategy = (StrategyNumber) PG_GETARG_UINT16(2);
551 /* Oid subtype = PG_GETARG_OID(3); */
552 bool *recheck = (bool *) PG_GETARG_POINTER(4);
553 ltree_gist *key = (ltree_gist *) DatumGetPointer(entry->key);
556 /* All cases served by this function are inexact */
/* Query is an ltree. */
563 res = gist_te(key, (ltree *) query);
/* Query is an lquery. */
567 res = gist_qe(key, (lquery *) query);
/* Query is an ltxtquery. */
571 res = gist_qtxt(key, (ltxtquery *) query);
/* Query is an array. */
575 res = _arrq_cons(key, (ArrayType *) query);
579 elog(ERROR, "unrecognized StrategyNumber: %d", strategy);
/* Release the detoasted copy if PG_DETOAST_DATUM made one. */
581 PG_FREE_IF_COPY(query, 1);