Commit a9289708 authored by Tom Lane's avatar Tom Lane

New contrib module for BTREE emulation in GiST.

From Oleg Bartunov and Teodor Sigaev.
parent a54075a6
# $Header: /cvsroot/pgsql/contrib/Makefile,v 1.23 2001/07/06 23:07:19 petere Exp $
# $Header: /cvsroot/pgsql/contrib/Makefile,v 1.24 2001/08/22 18:27:53 tgl Exp $
subdir = contrib
top_builddir = ..
......@@ -6,18 +6,19 @@ include $(top_builddir)/src/Makefile.global
WANTED_DIRS = \
array \
btree_gist \
cube \
dbase \
dblink \
earthdistance \
findoidjoins \
fulltextindex \
fuzzystrmatch \
intarray \
isbn_issn \
lo \
mSQL-interface \
mac \
metaphone \
miscutil \
noupdate \
oid2name \
......@@ -30,7 +31,6 @@ WANTED_DIRS = \
rserv \
rtree_gist \
seg \
soundex \
spi \
string \
tips \
......
......@@ -30,6 +30,14 @@ array -
Array iterator functions
by Massimo Dal Zotto <dz@cs.unitn.it>
btree_gist -
Support for emulating BTREE indexing in GiST
by Oleg Bartunov <oleg@sai.msu.su> and Teodor Sigaev <teodor@stack.net>
chkpass -
An auto-encrypted password datatype
by D'Arcy J.M. Cain <darcy@druid.net>
cube -
Multidimensional-cube datatype (GiST indexing example)
by Gene Selkov, Jr. <selkovjr@mcs.anl.gov>
......
subdir = contrib/btree_gist
top_builddir = ../..
include $(top_builddir)/src/Makefile.global
# override libdir to install shlib in contrib not main directory
libdir := $(libdir)/contrib
# shared library parameters
NAME= btree_gist
SO_MAJOR_VERSION= 1
SO_MINOR_VERSION= 0
override CPPFLAGS += -I$(srcdir)
OBJS= btree_gist.o
all: all-lib $(NAME).sql
# Shared library stuff
include $(top_srcdir)/src/Makefile.shlib
$(NAME).sql: $(NAME).sql.in
sed -e 's:MODULE_PATHNAME:$(libdir)/$(shlib):g' < $< > $@
.PHONY: submake
submake:
$(MAKE) -C $(top_builddir)/src/test/regress pg_regress
# against installed postmaster
installcheck: submake
$(top_builddir)/src/test/regress/pg_regress btree_gist
# in-tree test doesn't work yet (no way to install my shared library)
#check: all submake
# $(top_builddir)/src/test/regress/pg_regress --temp-install \
# --top-builddir=$(top_builddir) btree_gist
check:
@echo "'make check' is not supported."
@echo "Do 'make install', then 'make installcheck' instead."
install: all installdirs install-lib
#$(INSTALL_DATA) $(srcdir)/README.$(NAME) $(docdir)/contrib
$(INSTALL_DATA) $(NAME).sql $(datadir)/contrib
installdirs:
$(mkinstalldirs) $(docdir)/contrib $(datadir)/contrib $(libdir)
uninstall: uninstall-lib
rm -f $(docdir)/contrib/README.$(NAME) $(datadir)/contrib/$(NAME).sql
clean distclean maintainer-clean: clean-lib
rm -f *.so y.tab.c y.tab.h $(OBJS) $(NAME).sql
# things created by various check targets
rm -rf results tmp_check log
rm -f regression.diffs regression.out regress.out run_check.out
ifeq ($(PORTNAME), win)
rm -f regress.def
endif
depend dep:
$(CC) -MM $(CFLAGS) *.c >depend
ifeq (depend,$(wildcard depend))
include depend
endif
This is B-Tree implementation using GiST for int4 and
timestamp types.
All work was done by Teodor Sigaev (teodor@stack.net) and Oleg Bartunov
(oleg@sai.msu.su). See http://www.sai.msu.su/~megera/postgres/gist
for additional information.
NOTICE:
This version will works only with postgresql version 7.2 and above
because of changes in interface of function calling and in system
tables.
INSTALLATION:
gmake
gmake install
-- load functions
psql <database> < btree_gist.sql
REGRESSION TEST:
gmake installcheck
EXAMPLE USAGE:
create table test (a int4);
-- create index
create index testidx on test using gist (a);
-- query
select * from test where a < 10;
This diff is collapsed.
begin transaction;
-- create type of int4 key
CREATE FUNCTION int4key_in(opaque)
RETURNS opaque
AS 'MODULE_PATHNAME'
LANGUAGE 'c' with (isstrict);
CREATE FUNCTION int4key_out(opaque)
RETURNS opaque
AS 'MODULE_PATHNAME'
LANGUAGE 'c' with (isstrict);
CREATE TYPE int4key (
internallength = 8,
input = int4key_in,
output = int4key_out
);
--
--
--
-- int4 ops
--
--
--
-- define the GiST support methods
create function gint4_consistent(opaque,int4,int2) returns bool as 'MODULE_PATHNAME' language 'C';
create function gint4_compress(opaque) returns opaque as 'MODULE_PATHNAME' language 'C';
create function btree_decompress(opaque) returns opaque as 'MODULE_PATHNAME' language 'C';
create function gint4_penalty(opaque,opaque,opaque) returns opaque as 'MODULE_PATHNAME' language 'C' with(isstrict);
create function gint4_picksplit(opaque, opaque) returns opaque as 'MODULE_PATHNAME' language 'C';
create function gint4_union(bytea, opaque) returns int4 as 'MODULE_PATHNAME' language 'C';
create function gint4_same(opaque, opaque, opaque) returns opaque as 'MODULE_PATHNAME' language 'C';
-- add a new opclass
INSERT INTO pg_opclass (opcamid, opcname, opcintype, opckeytype, opcdefault)
SELECT pg_am.oid, 'gist_int4_ops', pg_type.oid, pg_key.oid, true
FROM pg_type, pg_am, pg_type pg_key
WHERE pg_type.typname = 'int4' and
pg_key.typname = 'int4key' and
pg_am.amname='gist';
SELECT o.oid AS opoid, o.oprname
INTO TABLE int_ops_tmp
FROM pg_operator o, pg_type t
WHERE o.oprleft = t.oid and o.oprright = t.oid
and t.typname = 'int4';
-- get the comparators for int4es and store them in a tmp table
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 1, 'f'
FROM pg_opclass opcl, int_ops_tmp c
WHERE opcname = 'gist_int4_ops'
and c.oprname = '<';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 2, 'f'
FROM pg_opclass opcl, int_ops_tmp c
WHERE opcname = 'gist_int4_ops'
and c.oprname = '<=';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 3, 'f'
FROM pg_opclass opcl, int_ops_tmp c
WHERE opcname = 'gist_int4_ops'
and c.oprname = '=';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 4, 'f'
FROM pg_opclass opcl, int_ops_tmp c
WHERE opcname = 'gist_int4_ops'
and c.oprname = '>=';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 5, 'f'
FROM pg_opclass opcl, int_ops_tmp c
WHERE opcname = 'gist_int4_ops'
and c.oprname = '>';
DROP table int_ops_tmp;
-- add the entries to amproc for the support methods
-- note the amprocnum numbers associated with each are specific!
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 1
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_int4_ops'
and proname = 'gint4_consistent';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 2
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_int4_ops'
and proname = 'gint4_union';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 3
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_int4_ops'
and proname = 'gint4_compress';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 4
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_int4_ops'
and proname = 'btree_decompress';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 5
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_int4_ops'
and proname = 'gint4_penalty';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 6
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_int4_ops'
and proname = 'gint4_picksplit';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 7
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_int4_ops'
and proname = 'gint4_same';
--
--
--
-- timestamp ops
--
--
--
-- create type of timestamp key
CREATE FUNCTION tskey_in(opaque)
RETURNS opaque
AS 'MODULE_PATHNAME'
LANGUAGE 'c' with (isstrict);
CREATE FUNCTION tskey_out(opaque)
RETURNS opaque
AS 'MODULE_PATHNAME'
LANGUAGE 'c' with (isstrict);
CREATE TYPE tskey (
internallength = 16,
input = tskey_in,
output = tskey_out
);
create function gts_consistent(opaque,timestamp,int2) returns bool as 'MODULE_PATHNAME' language 'C';
create function gts_compress(opaque) returns opaque as 'MODULE_PATHNAME' language 'C';
create function gts_penalty(opaque,opaque,opaque) returns opaque as 'MODULE_PATHNAME' language 'C' with(isstrict);
create function gts_picksplit(opaque, opaque) returns opaque as 'MODULE_PATHNAME' language 'C';
create function gts_union(bytea, opaque) returns int4 as 'MODULE_PATHNAME' language 'C';
create function gts_same(opaque, opaque, opaque) returns opaque as 'MODULE_PATHNAME' language 'C';
INSERT INTO pg_opclass (opcamid, opcname, opcintype, opckeytype, opcdefault)
SELECT pg_am.oid, 'gist_timestamp_ops', pg_type.oid, pg_key.oid, true
FROM pg_type, pg_am, pg_type pg_key
WHERE pg_type.typname = 'timestamp' and
pg_key.typname = 'tskey' and
pg_am.amname='gist';
SELECT o.oid AS opoid, o.oprname
INTO TABLE timestamp_ops_tmp
FROM pg_operator o, pg_type t
WHERE o.oprleft = t.oid and o.oprright = t.oid
and t.typname = 'timestamp';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 1, 'f'
FROM pg_opclass opcl, timestamp_ops_tmp c
WHERE opcname = 'gist_timestamp_ops'
and c.oprname = '<';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 2, 'f'
FROM pg_opclass opcl, timestamp_ops_tmp c
WHERE opcname = 'gist_timestamp_ops'
and c.oprname = '<=';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 3, 'f'
FROM pg_opclass opcl, timestamp_ops_tmp c
WHERE opcname = 'gist_timestamp_ops'
and c.oprname = '=';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 4, 'f'
FROM pg_opclass opcl, timestamp_ops_tmp c
WHERE opcname = 'gist_timestamp_ops'
and c.oprname = '>=';
INSERT INTO pg_amop (amopclaid, amopopr, amopstrategy, amopreqcheck)
SELECT opcl.oid, c.opoid, 5, 'f'
FROM pg_opclass opcl, timestamp_ops_tmp c
WHERE opcname = 'gist_timestamp_ops'
and c.oprname = '>';
DROP table timestamp_ops_tmp;
-- add the entries to amproc for the support methods
-- note the amprocnum numbers associated with each are specific!
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 1
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_timestamp_ops'
and proname = 'gts_consistent';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 2
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_timestamp_ops'
and proname = 'gts_union';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 3
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_timestamp_ops'
and proname = 'gts_compress';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 4
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_timestamp_ops'
and proname = 'btree_decompress';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 5
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_timestamp_ops'
and proname = 'gts_penalty';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 6
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_timestamp_ops'
and proname = 'gts_picksplit';
INSERT INTO pg_amproc (amopclaid, amproc, amprocnum)
SELECT opcl.oid, pro.oid, 7
FROM pg_opclass opcl, pg_proc pro
WHERE opcname = 'gist_timestamp_ops'
and proname = 'gts_same';
end transaction;
49
200
394
274
196
543
328
645
151
849
771
704
688
485
545
931
210
222
897
676
\N
201
533
703
410
301
633
319
329
13
942
737
533
407
876
622
430
264
785
938
680
91
179
147
108
510
336
781
3
16
\N
136
494
570
333
447
185
\N
\N
213
193
565
77
904
989
471
\N
566
117
102
515
105
\N
61
537
278
337
46
92
723
661
619
\N
293
\N
919
227
536
917
779
418
15
235
425
\N
362
587
590
103
563
369
775
404
408
142
133
566
727
413
382
42
32
548
540
\N
86
\N
58
685
11
907
274
94
987
971
383
757
327
38
854
257
318
159
224
39
\N
532
461
30
\N
790
\N
828
35
606
845
\N
313
391
869
592
821
73
\N
703
222
218
209
136
774
608
531
820
119
497
889
\N
592
899
\N
243
\N
400
\N
894
\N
\N
386
\N
550
840
606
160
386
723
16
693
601
338
368
74
436
734
806
433
679
857
679
319
85
\N
153
506
110
73
485
749
205
628
746
380
\N
573
146
314
439
102
606
\N
179
\N
921
236
509
714
353
97
\N
374
131
528
805
298
533
737
\N
135
119
294
725
826
393
740
487
932
\N
734
333
651
460
590
530
575
352
999
319
\N
277
692
939
580
\N
\N
568
92
182
885
839
303
709
891
538
58
271
577
827
459
852
812
823
\N
375
924
\N
799
297
795
853
751
\N
77
339
\N
\N
506
577
864
118
444
731
355
390
787
352
570
389
771
110
278
59
862
846
\N
362
590
719
442
525
329
945
739
857
897
835
787
657
558
455
\N
159
\N
672
795
\N
581
818
872
123
255
816
789
\N
124
\N
900
\N
240
819
386
841
282
269
259
893
570
505
769
959
\N
426
620
857
824
102
308
351
74
950
292
580
739
575
\N
594
\N
489
382
498
795
664
881
918
159
108
\N
679
724
964
8
664
267
101
869
676
433
469
657
78
381
43
959
695
545
780
390
697
733
693
387
864
613
301
374
222
564
450
307
\N
\N
912
518
593
283
529
983
379
244
819
377
225
811
69
\N
380
919
724
352
248
\N
416
788
663
395
394
707
352
658
759
825
881
563
271
\N
407
\N
157
931
233
769
78
737
525
221
216
824
353
977
757
976
843
795
603
\N
85
795
382
998
136
904
563
354
288
2
835
\N
714
915
471
\N
\N
676
556
119
490
909
\N
240
106
17
474
222
721
374
\N
262
913
234
797
\N
723
9
126
886
617
311
241
413
134
545
145
867
120
271
\N
\N
\N
177
\N
735
435
\N
855
612
803
964
417
771
359
670
682
236
492
597
220
1
585
193
837
938
389
527
423
627
\N
924
741
760
280
819
128
585
412
\N
816
710
359
318
478
803
771
642
\N
\N
842
490
462
727
214
629
276
\N
274
672
875
35
873
913
185
770
126
4
770
56
621
137
62
771
561
891
80
\N
45
996
722
940
823
\N
883
225
788
519
317
763
563
689
635
905
500
859
55
205
651
537
787
973
195
542
\N
\N
857
377
\N
\N
834
314
314
407
865
945
675
\N
\N
5
715
248
168
862
37
366
936
136
\N
324
845
854
831
225
\N
987
545
621
140
844
132
466
899
716
907
97
511
425
225
522
702
532
132
328
278
985
869
773
\N
633
624
114
879
142
762
729
890
430
241
267
616
9
457
168
\N
177
3
\N
675
558
2
\N
310
548
992
597
950
48
33
173
460
890
757
983
492
777
22
261
973
106
666
558
226
681
\N
347
92
14
96
641
495
585
458
217
386
284
719
694
\N
643
\N
928
976
44
941
396
\N
559
969
187
669
463
769
669
\N
70
861
501
\N
349
44
951
375
869
441
515
322
867
983
152
623
730
148
899
236
833
961
389
448
975
523
225
\N
698
314
19
935
269
178
349
685
702
523
165
453
756
266
997
499
880
402
40
487
261
506
886
193
237
631
630
570
90
558
348
203
\N
598
676
834
709
796
299
197
\N
94
997
458
871
964
808
321
\N
525
451
785
374
530
626
850
336
138
883
143
\N
299
\N
754
667
820
777
438
339
600
276
987
270
949
\N
474
321
325
138
620
345
\N
477
\N
690
714
897
36
469
965
259
715
580
\N
697
495
\N
284
820
992
708
638
216
181
\N
101
\N
730
902
703
176
561
945
915
246
632
441
849
\N
552
76
960
628
413
814
746
613
417
327
178
116
829
522
761
462
518
660
87
979
143
628
960
715
\N
288
\N
387
29
15
544
455
57
433
158
72
49
620
616
592
584
564
735
308
661
519
1
825
665
316
970
305
204
541
544
589
827
600
126
192
610
650
647
177
625
405
465
895
\N
152
594
492
385
693
442
173
\N
946
934
200
532
750
158
981
670
572
608
135
48
208
\N
971
594
429
655
This diff is collapsed.
--
-- first, define the datatype. Turn off echoing so that expected file
-- does not depend on contents of seg.sql.
--
\set ECHO none
create table inttmp (b int4);
\copy inttmp from 'data/test_btree.data'
create table tstmp ( t datetime );
\copy tstmp from 'data/test_btree_ts.data'
-- without idx
select count(*) from inttmp where b <=10;
count
-------
11
(1 row)
select count(*) from tstmp where t < '2001-05-29 08:33:09+04';
count
-------
7
(1 row)
-- create idx
create index aaaidx on inttmp using gist ( b );
create index tsidx on tstmp using gist ( t );
--with idx
set enable_seqscan=off;
select count(*) from inttmp where b <=10;
count
-------
11
(1 row)
select count(*) from tstmp where t < '2001-05-29 08:33:09+04';
count
-------
7
(1 row)
--
-- first, define the datatype. Turn off echoing so that expected file
-- does not depend on contents of seg.sql.
--
\set ECHO none
\i btree_gist.sql
\set ECHO all
create table inttmp (b int4);
\copy inttmp from 'data/test_btree.data'
create table tstmp ( t datetime );
\copy tstmp from 'data/test_btree_ts.data'
-- without idx
select count(*) from inttmp where b <=10;
select count(*) from tstmp where t < '2001-05-29 08:33:09+04';
-- create idx
create index aaaidx on inttmp using gist ( b );
create index tsidx on tstmp using gist ( t );
--with idx
set enable_seqscan=off;
select count(*) from inttmp where b <=10;
select count(*) from tstmp where t < '2001-05-29 08:33:09+04';
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment