2 * contrib/ltree/_ltree_gist.c
5 * GiST support for ltree[]
6 * Teodor Sigaev <teodor@stack.net>
12 #include "access/gist.h"
13 #include "access/reloptions.h"
14 #include "access/stratnum.h"
17 #include "port/pg_bitutils.h"
18 #include "utils/array.h"
20 PG_FUNCTION_INFO_V1(_ltree_compress
);
21 PG_FUNCTION_INFO_V1(_ltree_same
);
22 PG_FUNCTION_INFO_V1(_ltree_union
);
23 PG_FUNCTION_INFO_V1(_ltree_penalty
);
24 PG_FUNCTION_INFO_V1(_ltree_picksplit
);
25 PG_FUNCTION_INFO_V1(_ltree_consistent
);
26 PG_FUNCTION_INFO_V1(_ltree_gist_options
);
28 #define GETENTRY(vec,pos) ((ltree_gist *) DatumGetPointer((vec)->vector[(pos)].key))
29 #define NEXTVAL(x) ( (ltree*)( (char*)(x) + INTALIGN( VARSIZE(x) ) ) )
31 #define WISH_F(a,b,c) (double)( -(double)(((a)-(b))*((a)-(b))*((a)-(b)))*(c) )
35 hashing(BITVECP sign
, ltree
*t
, int siglen
)
37 int tlen
= t
->numlevel
;
38 ltree_level
*cur
= LTREE_FIRST(t
);
43 hash
= ltree_crc32_sz(cur
->name
, cur
->len
);
44 AHASH(sign
, hash
, siglen
);
45 cur
= LEVEL_NEXT(cur
);
51 _ltree_compress(PG_FUNCTION_ARGS
)
53 GISTENTRY
*entry
= (GISTENTRY
*) PG_GETARG_POINTER(0);
54 GISTENTRY
*retval
= entry
;
55 int siglen
= LTREE_GET_ASIGLEN();
60 ArrayType
*val
= DatumGetArrayTypeP(entry
->key
);
61 int num
= ArrayGetNItems(ARR_NDIM(val
), ARR_DIMS(val
));
62 ltree
*item
= (ltree
*) ARR_DATA_PTR(val
);
64 if (ARR_NDIM(val
) > 1)
66 (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR
),
67 errmsg("array must be one-dimensional")));
68 if (array_contains_nulls(val
))
70 (errcode(ERRCODE_NULL_VALUE_NOT_ALLOWED
),
71 errmsg("array must not contain nulls")));
73 key
= ltree_gist_alloc(false, NULL
, siglen
, NULL
, NULL
);
77 hashing(LTG_SIGN(key
), item
, siglen
);
82 retval
= (GISTENTRY
*) palloc(sizeof(GISTENTRY
));
83 gistentryinit(*retval
, PointerGetDatum(key
),
84 entry
->rel
, entry
->page
,
85 entry
->offset
, false);
87 else if (!LTG_ISALLTRUE(entry
->key
))
91 BITVECP sign
= LTG_SIGN(DatumGetPointer(entry
->key
));
95 if ((sign
[i
] & 0xff) != 0xff)
96 PG_RETURN_POINTER(retval
);
99 key
= ltree_gist_alloc(true, sign
, siglen
, NULL
, NULL
);
100 retval
= (GISTENTRY
*) palloc(sizeof(GISTENTRY
));
101 gistentryinit(*retval
, PointerGetDatum(key
),
102 entry
->rel
, entry
->page
,
103 entry
->offset
, false);
105 PG_RETURN_POINTER(retval
);
109 _ltree_same(PG_FUNCTION_ARGS
)
111 ltree_gist
*a
= (ltree_gist
*) PG_GETARG_POINTER(0);
112 ltree_gist
*b
= (ltree_gist
*) PG_GETARG_POINTER(1);
113 bool *result
= (bool *) PG_GETARG_POINTER(2);
114 int siglen
= LTREE_GET_ASIGLEN();
116 if (LTG_ISALLTRUE(a
) && LTG_ISALLTRUE(b
))
118 else if (LTG_ISALLTRUE(a
))
120 else if (LTG_ISALLTRUE(b
))
125 BITVECP sa
= LTG_SIGN(a
),
138 PG_RETURN_POINTER(result
);
142 unionkey(BITVECP sbase
, ltree_gist
*add
, int siglen
)
145 BITVECP sadd
= LTG_SIGN(add
);
147 if (LTG_ISALLTRUE(add
))
156 _ltree_union(PG_FUNCTION_ARGS
)
158 GistEntryVector
*entryvec
= (GistEntryVector
*) PG_GETARG_POINTER(0);
159 int *size
= (int *) PG_GETARG_POINTER(1);
160 int siglen
= LTREE_GET_ASIGLEN();
162 ltree_gist
*result
= ltree_gist_alloc(false, NULL
, siglen
, NULL
, NULL
);
163 BITVECP base
= LTG_SIGN(result
);
165 for (i
= 0; i
< entryvec
->n
; i
++)
167 if (unionkey(base
, GETENTRY(entryvec
, i
), siglen
))
169 result
->flag
|= LTG_ALLTRUE
;
170 SET_VARSIZE(result
, LTG_HDRSIZE
);
175 *size
= VARSIZE(result
);
177 PG_RETURN_POINTER(result
);
181 sizebitvec(BITVECP sign
, int siglen
)
183 return pg_popcount((const char *) sign
, siglen
);
187 hemdistsign(BITVECP a
, BITVECP b
, int siglen
)
195 diff
= (unsigned char) (a
[i
] ^ b
[i
]);
196 /* Using the popcount functions here isn't likely to win */
197 dist
+= pg_number_of_ones
[diff
];
203 hemdist(ltree_gist
*a
, ltree_gist
*b
, int siglen
)
205 if (LTG_ISALLTRUE(a
))
207 if (LTG_ISALLTRUE(b
))
210 return ASIGLENBIT(siglen
) - sizebitvec(LTG_SIGN(b
), siglen
);
212 else if (LTG_ISALLTRUE(b
))
213 return ASIGLENBIT(siglen
) - sizebitvec(LTG_SIGN(a
), siglen
);
215 return hemdistsign(LTG_SIGN(a
), LTG_SIGN(b
), siglen
);
220 _ltree_penalty(PG_FUNCTION_ARGS
)
222 ltree_gist
*origval
= (ltree_gist
*) DatumGetPointer(((GISTENTRY
*) PG_GETARG_POINTER(0))->key
);
223 ltree_gist
*newval
= (ltree_gist
*) DatumGetPointer(((GISTENTRY
*) PG_GETARG_POINTER(1))->key
);
224 float *penalty
= (float *) PG_GETARG_POINTER(2);
225 int siglen
= LTREE_GET_ASIGLEN();
227 *penalty
= hemdist(origval
, newval
, siglen
);
228 PG_RETURN_POINTER(penalty
);
238 comparecost(const void *a
, const void *b
)
240 return ((const SPLITCOST
*) a
)->cost
- ((const SPLITCOST
*) b
)->cost
;
244 _ltree_picksplit(PG_FUNCTION_ARGS
)
246 GistEntryVector
*entryvec
= (GistEntryVector
*) PG_GETARG_POINTER(0);
247 GIST_SPLITVEC
*v
= (GIST_SPLITVEC
*) PG_GETARG_POINTER(1);
248 int siglen
= LTREE_GET_ASIGLEN();
260 OffsetNumber seed_1
= 0,
267 SPLITCOST
*costvector
;
271 maxoff
= entryvec
->n
- 2;
272 nbytes
= (maxoff
+ 2) * sizeof(OffsetNumber
);
273 v
->spl_left
= (OffsetNumber
*) palloc(nbytes
);
274 v
->spl_right
= (OffsetNumber
*) palloc(nbytes
);
276 for (k
= FirstOffsetNumber
; k
< maxoff
; k
= OffsetNumberNext(k
))
278 _k
= GETENTRY(entryvec
, k
);
279 for (j
= OffsetNumberNext(k
); j
<= maxoff
; j
= OffsetNumberNext(j
))
281 size_waste
= hemdist(_k
, GETENTRY(entryvec
, j
), siglen
);
282 if (size_waste
> waste
)
293 right
= v
->spl_right
;
296 if (seed_1
== 0 || seed_2
== 0)
302 /* form initial .. */
303 datum_l
= ltree_gist_alloc(LTG_ISALLTRUE(GETENTRY(entryvec
, seed_1
)),
304 LTG_SIGN(GETENTRY(entryvec
, seed_1
)),
307 datum_r
= ltree_gist_alloc(LTG_ISALLTRUE(GETENTRY(entryvec
, seed_2
)),
308 LTG_SIGN(GETENTRY(entryvec
, seed_2
)),
311 maxoff
= OffsetNumberNext(maxoff
);
312 /* sort before ... */
313 costvector
= (SPLITCOST
*) palloc(sizeof(SPLITCOST
) * maxoff
);
314 for (j
= FirstOffsetNumber
; j
<= maxoff
; j
= OffsetNumberNext(j
))
316 costvector
[j
- 1].pos
= j
;
317 _j
= GETENTRY(entryvec
, j
);
318 size_alpha
= hemdist(datum_l
, _j
, siglen
);
319 size_beta
= hemdist(datum_r
, _j
, siglen
);
320 costvector
[j
- 1].cost
= abs(size_alpha
- size_beta
);
322 qsort(costvector
, maxoff
, sizeof(SPLITCOST
), comparecost
);
324 union_l
= LTG_SIGN(datum_l
);
325 union_r
= LTG_SIGN(datum_r
);
327 for (k
= 0; k
< maxoff
; k
++)
329 j
= costvector
[k
].pos
;
336 else if (j
== seed_2
)
342 _j
= GETENTRY(entryvec
, j
);
343 size_alpha
= hemdist(datum_l
, _j
, siglen
);
344 size_beta
= hemdist(datum_r
, _j
, siglen
);
346 if (size_alpha
< size_beta
+ WISH_F(v
->spl_nleft
, v
->spl_nright
, 0.00001))
348 if (LTG_ISALLTRUE(datum_l
) || LTG_ISALLTRUE(_j
))
350 if (!LTG_ISALLTRUE(datum_l
))
351 memset(union_l
, 0xff, siglen
);
357 union_l
[i
] |= ptr
[i
];
364 if (LTG_ISALLTRUE(datum_r
) || LTG_ISALLTRUE(_j
))
366 if (!LTG_ISALLTRUE(datum_r
))
367 memset(union_r
, 0xff, siglen
);
373 union_r
[i
] |= ptr
[i
];
380 *right
= *left
= FirstOffsetNumber
;
382 v
->spl_ldatum
= PointerGetDatum(datum_l
);
383 v
->spl_rdatum
= PointerGetDatum(datum_r
);
385 PG_RETURN_POINTER(v
);
389 gist_te(ltree_gist
*key
, ltree
*query
, int siglen
)
391 ltree_level
*curq
= LTREE_FIRST(query
);
392 BITVECP sign
= LTG_SIGN(key
);
393 int qlen
= query
->numlevel
;
396 if (LTG_ISALLTRUE(key
))
401 hv
= ltree_crc32_sz(curq
->name
, curq
->len
);
402 if (!GETBIT(sign
, AHASHVAL(hv
, siglen
)))
404 curq
= LEVEL_NEXT(curq
);
411 typedef struct LtreeSignature
418 checkcondition_bit(void *cxt
, ITEM
*val
)
420 LtreeSignature
*sig
= cxt
;
422 return (FLG_CANLOOKSIGN(val
->flag
)) ? GETBIT(sig
->sign
, AHASHVAL(val
->val
, sig
->siglen
)) : true;
426 gist_qtxt(ltree_gist
*key
, ltxtquery
*query
, int siglen
)
430 if (LTG_ISALLTRUE(key
))
433 sig
.sign
= LTG_SIGN(key
);
436 return ltree_execute(GETQUERY(query
),
442 gist_qe(ltree_gist
*key
, lquery
*query
, int siglen
)
444 lquery_level
*curq
= LQUERY_FIRST(query
);
445 BITVECP sign
= LTG_SIGN(key
);
446 int qlen
= query
->numlevel
;
448 if (LTG_ISALLTRUE(key
))
453 if (curq
->numvar
&& LQL_CANLOOKSIGN(curq
))
455 bool isexist
= false;
456 int vlen
= curq
->numvar
;
457 lquery_variant
*curv
= LQL_FIRST(curq
);
461 if (GETBIT(sign
, AHASHVAL(curv
->val
, siglen
)))
466 curv
= LVAR_NEXT(curv
);
473 curq
= LQL_NEXT(curq
);
481 _arrq_cons(ltree_gist
*key
, ArrayType
*_query
, int siglen
)
483 lquery
*query
= (lquery
*) ARR_DATA_PTR(_query
);
484 int num
= ArrayGetNItems(ARR_NDIM(_query
), ARR_DIMS(_query
));
486 if (ARR_NDIM(_query
) > 1)
488 (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR
),
489 errmsg("array must be one-dimensional")));
490 if (array_contains_nulls(_query
))
492 (errcode(ERRCODE_NULL_VALUE_NOT_ALLOWED
),
493 errmsg("array must not contain nulls")));
497 if (gist_qe(key
, query
, siglen
))
500 query
= (lquery
*) NEXTVAL(query
);
506 _ltree_consistent(PG_FUNCTION_ARGS
)
508 GISTENTRY
*entry
= (GISTENTRY
*) PG_GETARG_POINTER(0);
509 void *query
= (void *) PG_DETOAST_DATUM(PG_GETARG_DATUM(1));
510 StrategyNumber strategy
= (StrategyNumber
) PG_GETARG_UINT16(2);
512 /* Oid subtype = PG_GETARG_OID(3); */
513 bool *recheck
= (bool *) PG_GETARG_POINTER(4);
514 int siglen
= LTREE_GET_ASIGLEN();
515 ltree_gist
*key
= (ltree_gist
*) DatumGetPointer(entry
->key
);
518 /* All cases served by this function are inexact */
525 res
= gist_te(key
, (ltree
*) query
, siglen
);
529 res
= gist_qe(key
, (lquery
*) query
, siglen
);
533 res
= gist_qtxt(key
, (ltxtquery
*) query
, siglen
);
537 res
= _arrq_cons(key
, (ArrayType
*) query
, siglen
);
541 elog(ERROR
, "unrecognized StrategyNumber: %d", strategy
);
543 PG_FREE_IF_COPY(query
, 1);
548 _ltree_gist_options(PG_FUNCTION_ARGS
)
550 local_relopts
*relopts
= (local_relopts
*) PG_GETARG_POINTER(0);
552 init_local_reloptions(relopts
, sizeof(LtreeGistOptions
));
553 add_local_int_reloption(relopts
, "siglen", "signature length",
554 LTREE_ASIGLEN_DEFAULT
, 1, LTREE_ASIGLEN_MAX
,
555 offsetof(LtreeGistOptions
, siglen
));