Commit 5602265f authored by Tom Lane's avatar Tom Lane

Convert unused_oids and duplicate_oids to use Catalog.pm infrastructure.

unused_oids was previously a shell script, which of course didn't work at
all on Windows.  Also, commit 372728b0 introduced some other portability
problems, as complained of by Stas Kelvich.  We can improve matters by
converting it to Perl.

While we're at it, let's future-proof both this script and duplicate_oids
to use Catalog.pm rather than having a bunch of ad-hoc logic for parsing
catalog headers and .dat files.  These scripts are thereby a bit slower,
which doesn't seem like a problem for typical manual use.  It is a little
annoying for buildfarm purposes, but we should be able to fix that case
by having genbki.pl make the check instead of parsing the headers twice.
(That's not done in this commit, though.)

Stas Kelvich, adjusted a bit by me

Discussion: https://postgr.es/m/37D774E4-FE1F-437E-B3D2-593F314B7505@postgrespro.ru
parent 1eb3a09e
...@@ -384,4 +384,55 @@ sub FindDefinedSymbolFromData ...@@ -384,4 +384,55 @@ sub FindDefinedSymbolFromData
die "no definition found for $symbol\n"; die "no definition found for $symbol\n";
} }
# Extract an array of all the OIDs assigned in the specified catalog headers
# and their associated data files (if any).
sub FindAllOidsFromHeaders
{
my @input_files = @_;
my @oids = ();
foreach my $header (@input_files)
{
$header =~ /(.+)\.h$/
or die "Input files need to be header files.\n";
my $datfile = "$1.dat";
my $catalog = Catalog::ParseHeader($header);
# We ignore the pg_class OID and rowtype OID of bootstrap catalogs,
# as those are expected to appear in the initial data for pg_class
# and pg_type. For regular catalogs, include these OIDs.
if (!$catalog->{bootstrap})
{
push @oids, $catalog->{relation_oid}
if ($catalog->{relation_oid});
push @oids, $catalog->{rowtype_oid} if ($catalog->{rowtype_oid});
}
# Not all catalogs have a data file.
if (-e $datfile)
{
my $catdata =
Catalog::ParseData($datfile, $catalog->{columns}, 0);
foreach my $row (@$catdata)
{
push @oids, $row->{oid} if defined $row->{oid};
}
}
foreach my $toast (@{ $catalog->{toasting} })
{
push @oids, $toast->{toast_oid}, $toast->{toast_index_oid};
}
foreach my $index (@{ $catalog->{indexing} })
{
push @oids, $index->{index_oid};
}
}
return \@oids;
}
1; 1;
#!/usr/bin/perl #!/usr/bin/perl
use lib '../../backend/catalog/';
use Catalog;
use strict; use strict;
use warnings; use warnings;
BEGIN my @input_files = (glob("pg_*.h"), qw(indexing.h toasting.h));
{
@ARGV = (glob("pg_*.h"), glob("pg_*.dat"), qw(indexing.h toasting.h)); my $oids = Catalog::FindAllOidsFromHeaders(@input_files);
}
my %oidcounts; my %oidcounts;
while (<>) foreach my $oid (@{$oids})
{ {
next if /^CATALOG\(.*BKI_BOOTSTRAP/; $oidcounts{$oid}++;
next
unless /\boid *=> *'(\d+)'/
|| /^CATALOG\([^,]*, *(\d+).*BKI_ROWTYPE_OID\((\d+),/
|| /^CATALOG\([^,]*, *(\d+)/
|| /^DECLARE_INDEX\([^,]*, *(\d+)/
|| /^DECLARE_UNIQUE_INDEX\([^,]*, *(\d+)/
|| /^DECLARE_TOAST\([^,]*, *(\d+), *(\d+)/;
$oidcounts{$1}++;
$oidcounts{$2}++ if $2;
} }
my $found = 0; my $found = 0;
......
#!/bin/sh #!/usr/bin/perl
# #
# unused_oids # unused_oids
# #
...@@ -15,43 +15,40 @@ ...@@ -15,43 +15,40 @@
# #
# run this script in src/include/catalog. # run this script in src/include/catalog.
# #
use lib '../../backend/catalog/';
use Catalog;
use strict;
use warnings;
AWK="awk" my @input_files = (glob("pg_*.h"), qw(indexing.h toasting.h));
# Get FirstBootstrapObjectId from access/transam.h my $oids = Catalog::FindAllOidsFromHeaders(@input_files);
FIRSTOBJECTID=`grep '#define[ ]*FirstBootstrapObjectId' ../access/transam.h | $AWK '{ print $3 }'`
export FIRSTOBJECTID
# this part (down to the uniq step) should match the duplicate_oids script # Also push FirstBootstrapObjectId to serve as a terminator for the last gap.
# note: we exclude BKI_BOOTSTRAP relations since they are expected to have my $FirstBootstrapObjectId =
# matching data entries in pg_class.dat and pg_type.dat Catalog::FindDefinedSymbol('access/transam.h', [".."],
'FirstBootstrapObjectId');
push @{$oids}, $FirstBootstrapObjectId;
cat pg_*.h pg_*.dat toasting.h indexing.h | my $prev_oid = 0;
egrep -v -e '^CATALOG\(.*BKI_BOOTSTRAP' | \ foreach my $oid (sort { $a <=> $b } @{$oids})
sed -n -e 's/.*\boid *=> *'\''\([0-9][0-9]*\)'\''.*$/\1/p' \ {
-e 's/^CATALOG([^,]*, *\([0-9][0-9]*\).*BKI_ROWTYPE_OID(\([0-9][0-9]*\),.*$/\1,\2/p' \ if ($oid > $prev_oid + 1)
-e 's/^CATALOG([^,]*, *\([0-9][0-9]*\).*$/\1/p' \ {
-e 's/^DECLARE_INDEX([^,]*, *\([0-9][0-9]*\).*$/\1/p' \ if ($oid > $prev_oid + 2)
-e 's/^DECLARE_UNIQUE_INDEX([^,]*, *\([0-9][0-9]*\).*$/\1/p' \ {
-e 's/^DECLARE_TOAST([^,]*, *\([0-9][0-9]*\), *\([0-9][0-9]*\).*$/\1,\2/p' | \ printf "%d - %d\n", $prev_oid + 1, $oid - 1;
tr ',' '\n' | \ }
sort -n | \ else
uniq | \ {
$AWK ' printf "%d\n", $prev_oid + 1;
BEGIN { }
last = 0;
}
/^[0-9]/ {
if ($1 > last + 1) {
if ($1 > last + 2) {
print last + 1, "-", $1 - 1;
} else {
print last + 1;
} }
elsif ($oid == $prev_oid)
{
print "Duplicate oid detected: $oid\n";
exit 1;
} }
last = $1; $prev_oid = $oid;
} }
END {
print last + 1, "-", ENVIRON["FIRSTOBJECTID"]-1;
}'
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment