2 * contrib/ltree/_ltree_gist.c
5 * GiST support for ltree[]
6 * Teodor Sigaev <teodor@stack.net>
10 #include "access/gist.h"
11 #include "access/reloptions.h"
12 #include "access/stratnum.h"
15 #include "port/pg_bitutils.h"
16 #include "utils/array.h"
18 PG_FUNCTION_INFO_V1(_ltree_compress
);
19 PG_FUNCTION_INFO_V1(_ltree_same
);
20 PG_FUNCTION_INFO_V1(_ltree_union
);
21 PG_FUNCTION_INFO_V1(_ltree_penalty
);
22 PG_FUNCTION_INFO_V1(_ltree_picksplit
);
23 PG_FUNCTION_INFO_V1(_ltree_consistent
);
24 PG_FUNCTION_INFO_V1(_ltree_gist_options
);
26 #define GETENTRY(vec,pos) ((ltree_gist *) DatumGetPointer((vec)->vector[(pos)].key))
27 #define NEXTVAL(x) ( (ltree*)( (char*)(x) + INTALIGN( VARSIZE(x) ) ) )
29 #define WISH_F(a,b,c) (double)( -(double)(((a)-(b))*((a)-(b))*((a)-(b)))*(c) )
33 hashing(BITVECP sign
, ltree
*t
, int siglen
)
35 int tlen
= t
->numlevel
;
36 ltree_level
*cur
= LTREE_FIRST(t
);
41 hash
= ltree_crc32_sz(cur
->name
, cur
->len
);
42 AHASH(sign
, hash
, siglen
);
43 cur
= LEVEL_NEXT(cur
);
49 _ltree_compress(PG_FUNCTION_ARGS
)
51 GISTENTRY
*entry
= (GISTENTRY
*) PG_GETARG_POINTER(0);
52 GISTENTRY
*retval
= entry
;
53 int siglen
= LTREE_GET_ASIGLEN();
58 ArrayType
*val
= DatumGetArrayTypeP(entry
->key
);
59 int num
= ArrayGetNItems(ARR_NDIM(val
), ARR_DIMS(val
));
60 ltree
*item
= (ltree
*) ARR_DATA_PTR(val
);
62 if (ARR_NDIM(val
) > 1)
64 (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR
),
65 errmsg("array must be one-dimensional")));
66 if (array_contains_nulls(val
))
68 (errcode(ERRCODE_NULL_VALUE_NOT_ALLOWED
),
69 errmsg("array must not contain nulls")));
71 key
= ltree_gist_alloc(false, NULL
, siglen
, NULL
, NULL
);
75 hashing(LTG_SIGN(key
), item
, siglen
);
80 retval
= (GISTENTRY
*) palloc(sizeof(GISTENTRY
));
81 gistentryinit(*retval
, PointerGetDatum(key
),
82 entry
->rel
, entry
->page
,
83 entry
->offset
, false);
85 else if (!LTG_ISALLTRUE(entry
->key
))
89 BITVECP sign
= LTG_SIGN(DatumGetPointer(entry
->key
));
93 if ((sign
[i
] & 0xff) != 0xff)
94 PG_RETURN_POINTER(retval
);
97 key
= ltree_gist_alloc(true, sign
, siglen
, NULL
, NULL
);
98 retval
= (GISTENTRY
*) palloc(sizeof(GISTENTRY
));
99 gistentryinit(*retval
, PointerGetDatum(key
),
100 entry
->rel
, entry
->page
,
101 entry
->offset
, false);
103 PG_RETURN_POINTER(retval
);
107 _ltree_same(PG_FUNCTION_ARGS
)
109 ltree_gist
*a
= (ltree_gist
*) PG_GETARG_POINTER(0);
110 ltree_gist
*b
= (ltree_gist
*) PG_GETARG_POINTER(1);
111 bool *result
= (bool *) PG_GETARG_POINTER(2);
112 int siglen
= LTREE_GET_ASIGLEN();
114 if (LTG_ISALLTRUE(a
) && LTG_ISALLTRUE(b
))
116 else if (LTG_ISALLTRUE(a
))
118 else if (LTG_ISALLTRUE(b
))
123 BITVECP sa
= LTG_SIGN(a
),
136 PG_RETURN_POINTER(result
);
140 unionkey(BITVECP sbase
, ltree_gist
*add
, int siglen
)
143 BITVECP sadd
= LTG_SIGN(add
);
145 if (LTG_ISALLTRUE(add
))
154 _ltree_union(PG_FUNCTION_ARGS
)
156 GistEntryVector
*entryvec
= (GistEntryVector
*) PG_GETARG_POINTER(0);
157 int *size
= (int *) PG_GETARG_POINTER(1);
158 int siglen
= LTREE_GET_ASIGLEN();
160 ltree_gist
*result
= ltree_gist_alloc(false, NULL
, siglen
, NULL
, NULL
);
161 BITVECP base
= LTG_SIGN(result
);
163 for (i
= 0; i
< entryvec
->n
; i
++)
165 if (unionkey(base
, GETENTRY(entryvec
, i
), siglen
))
167 result
->flag
|= LTG_ALLTRUE
;
168 SET_VARSIZE(result
, LTG_HDRSIZE
);
173 *size
= VARSIZE(result
);
175 PG_RETURN_POINTER(result
);
179 sizebitvec(BITVECP sign
, int siglen
)
181 return pg_popcount((const char *) sign
, siglen
);
185 hemdistsign(BITVECP a
, BITVECP b
, int siglen
)
193 diff
= (unsigned char) (a
[i
] ^ b
[i
]);
194 /* Using the popcount functions here isn't likely to win */
195 dist
+= pg_number_of_ones
[diff
];
201 hemdist(ltree_gist
*a
, ltree_gist
*b
, int siglen
)
203 if (LTG_ISALLTRUE(a
))
205 if (LTG_ISALLTRUE(b
))
208 return ASIGLENBIT(siglen
) - sizebitvec(LTG_SIGN(b
), siglen
);
210 else if (LTG_ISALLTRUE(b
))
211 return ASIGLENBIT(siglen
) - sizebitvec(LTG_SIGN(a
), siglen
);
213 return hemdistsign(LTG_SIGN(a
), LTG_SIGN(b
), siglen
);
218 _ltree_penalty(PG_FUNCTION_ARGS
)
220 ltree_gist
*origval
= (ltree_gist
*) DatumGetPointer(((GISTENTRY
*) PG_GETARG_POINTER(0))->key
);
221 ltree_gist
*newval
= (ltree_gist
*) DatumGetPointer(((GISTENTRY
*) PG_GETARG_POINTER(1))->key
);
222 float *penalty
= (float *) PG_GETARG_POINTER(2);
223 int siglen
= LTREE_GET_ASIGLEN();
225 *penalty
= hemdist(origval
, newval
, siglen
);
226 PG_RETURN_POINTER(penalty
);
236 comparecost(const void *a
, const void *b
)
238 return ((const SPLITCOST
*) a
)->cost
- ((const SPLITCOST
*) b
)->cost
;
242 _ltree_picksplit(PG_FUNCTION_ARGS
)
244 GistEntryVector
*entryvec
= (GistEntryVector
*) PG_GETARG_POINTER(0);
245 GIST_SPLITVEC
*v
= (GIST_SPLITVEC
*) PG_GETARG_POINTER(1);
246 int siglen
= LTREE_GET_ASIGLEN();
258 OffsetNumber seed_1
= 0,
265 SPLITCOST
*costvector
;
269 maxoff
= entryvec
->n
- 2;
270 nbytes
= (maxoff
+ 2) * sizeof(OffsetNumber
);
271 v
->spl_left
= (OffsetNumber
*) palloc(nbytes
);
272 v
->spl_right
= (OffsetNumber
*) palloc(nbytes
);
274 for (k
= FirstOffsetNumber
; k
< maxoff
; k
= OffsetNumberNext(k
))
276 _k
= GETENTRY(entryvec
, k
);
277 for (j
= OffsetNumberNext(k
); j
<= maxoff
; j
= OffsetNumberNext(j
))
279 size_waste
= hemdist(_k
, GETENTRY(entryvec
, j
), siglen
);
280 if (size_waste
> waste
)
291 right
= v
->spl_right
;
294 if (seed_1
== 0 || seed_2
== 0)
300 /* form initial .. */
301 datum_l
= ltree_gist_alloc(LTG_ISALLTRUE(GETENTRY(entryvec
, seed_1
)),
302 LTG_SIGN(GETENTRY(entryvec
, seed_1
)),
305 datum_r
= ltree_gist_alloc(LTG_ISALLTRUE(GETENTRY(entryvec
, seed_2
)),
306 LTG_SIGN(GETENTRY(entryvec
, seed_2
)),
309 maxoff
= OffsetNumberNext(maxoff
);
310 /* sort before ... */
311 costvector
= (SPLITCOST
*) palloc(sizeof(SPLITCOST
) * maxoff
);
312 for (j
= FirstOffsetNumber
; j
<= maxoff
; j
= OffsetNumberNext(j
))
314 costvector
[j
- 1].pos
= j
;
315 _j
= GETENTRY(entryvec
, j
);
316 size_alpha
= hemdist(datum_l
, _j
, siglen
);
317 size_beta
= hemdist(datum_r
, _j
, siglen
);
318 costvector
[j
- 1].cost
= Abs(size_alpha
- size_beta
);
320 qsort((void *) costvector
, maxoff
, sizeof(SPLITCOST
), comparecost
);
322 union_l
= LTG_SIGN(datum_l
);
323 union_r
= LTG_SIGN(datum_r
);
325 for (k
= 0; k
< maxoff
; k
++)
327 j
= costvector
[k
].pos
;
334 else if (j
== seed_2
)
340 _j
= GETENTRY(entryvec
, j
);
341 size_alpha
= hemdist(datum_l
, _j
, siglen
);
342 size_beta
= hemdist(datum_r
, _j
, siglen
);
344 if (size_alpha
< size_beta
+ WISH_F(v
->spl_nleft
, v
->spl_nright
, 0.00001))
346 if (LTG_ISALLTRUE(datum_l
) || LTG_ISALLTRUE(_j
))
348 if (!LTG_ISALLTRUE(datum_l
))
349 memset((void *) union_l
, 0xff, siglen
);
355 union_l
[i
] |= ptr
[i
];
362 if (LTG_ISALLTRUE(datum_r
) || LTG_ISALLTRUE(_j
))
364 if (!LTG_ISALLTRUE(datum_r
))
365 memset((void *) union_r
, 0xff, siglen
);
371 union_r
[i
] |= ptr
[i
];
378 *right
= *left
= FirstOffsetNumber
;
380 v
->spl_ldatum
= PointerGetDatum(datum_l
);
381 v
->spl_rdatum
= PointerGetDatum(datum_r
);
383 PG_RETURN_POINTER(v
);
387 gist_te(ltree_gist
*key
, ltree
*query
, int siglen
)
389 ltree_level
*curq
= LTREE_FIRST(query
);
390 BITVECP sign
= LTG_SIGN(key
);
391 int qlen
= query
->numlevel
;
394 if (LTG_ISALLTRUE(key
))
399 hv
= ltree_crc32_sz(curq
->name
, curq
->len
);
400 if (!GETBIT(sign
, AHASHVAL(hv
, siglen
)))
402 curq
= LEVEL_NEXT(curq
);
409 typedef struct LtreeSignature
416 checkcondition_bit(void *cxt
, ITEM
*val
)
418 LtreeSignature
*sig
= cxt
;
420 return (FLG_CANLOOKSIGN(val
->flag
)) ? GETBIT(sig
->sign
, AHASHVAL(val
->val
, sig
->siglen
)) : true;
424 gist_qtxt(ltree_gist
*key
, ltxtquery
*query
, int siglen
)
428 if (LTG_ISALLTRUE(key
))
431 sig
.sign
= LTG_SIGN(key
);
434 return ltree_execute(GETQUERY(query
),
440 gist_qe(ltree_gist
*key
, lquery
*query
, int siglen
)
442 lquery_level
*curq
= LQUERY_FIRST(query
);
443 BITVECP sign
= LTG_SIGN(key
);
444 int qlen
= query
->numlevel
;
446 if (LTG_ISALLTRUE(key
))
451 if (curq
->numvar
&& LQL_CANLOOKSIGN(curq
))
453 bool isexist
= false;
454 int vlen
= curq
->numvar
;
455 lquery_variant
*curv
= LQL_FIRST(curq
);
459 if (GETBIT(sign
, AHASHVAL(curv
->val
, siglen
)))
464 curv
= LVAR_NEXT(curv
);
471 curq
= LQL_NEXT(curq
);
479 _arrq_cons(ltree_gist
*key
, ArrayType
*_query
, int siglen
)
481 lquery
*query
= (lquery
*) ARR_DATA_PTR(_query
);
482 int num
= ArrayGetNItems(ARR_NDIM(_query
), ARR_DIMS(_query
));
484 if (ARR_NDIM(_query
) > 1)
486 (errcode(ERRCODE_ARRAY_SUBSCRIPT_ERROR
),
487 errmsg("array must be one-dimensional")));
488 if (array_contains_nulls(_query
))
490 (errcode(ERRCODE_NULL_VALUE_NOT_ALLOWED
),
491 errmsg("array must not contain nulls")));
495 if (gist_qe(key
, query
, siglen
))
498 query
= (lquery
*) NEXTVAL(query
);
504 _ltree_consistent(PG_FUNCTION_ARGS
)
506 GISTENTRY
*entry
= (GISTENTRY
*) PG_GETARG_POINTER(0);
507 void *query
= (void *) PG_DETOAST_DATUM(PG_GETARG_DATUM(1));
508 StrategyNumber strategy
= (StrategyNumber
) PG_GETARG_UINT16(2);
510 /* Oid subtype = PG_GETARG_OID(3); */
511 bool *recheck
= (bool *) PG_GETARG_POINTER(4);
512 int siglen
= LTREE_GET_ASIGLEN();
513 ltree_gist
*key
= (ltree_gist
*) DatumGetPointer(entry
->key
);
516 /* All cases served by this function are inexact */
523 res
= gist_te(key
, (ltree
*) query
, siglen
);
527 res
= gist_qe(key
, (lquery
*) query
, siglen
);
531 res
= gist_qtxt(key
, (ltxtquery
*) query
, siglen
);
535 res
= _arrq_cons(key
, (ArrayType
*) query
, siglen
);
539 elog(ERROR
, "unrecognized StrategyNumber: %d", strategy
);
541 PG_FREE_IF_COPY(query
, 1);
546 _ltree_gist_options(PG_FUNCTION_ARGS
)
548 local_relopts
*relopts
= (local_relopts
*) PG_GETARG_POINTER(0);
550 init_local_reloptions(relopts
, sizeof(LtreeGistOptions
));
551 add_local_int_reloption(relopts
, "siglen", "signature length",
552 LTREE_ASIGLEN_DEFAULT
, 1, LTREE_ASIGLEN_MAX
,
553 offsetof(LtreeGistOptions
, siglen
));