Commit 11da4c67 authored by Tom Lane

Adjust pgstat_initstats() to avoid repeated searches of the TabStat arrays
when a relation is opened multiple times in the same transaction.  This is
particularly useful for system catalogs, which we may heap_open or index_open
many times in a transaction, and it doesn't really cost anything extra even
if the rel is touched but once.  Motivated by study of an example from Greg
Stark, in which pgstat_initstats() accounted for an unreasonably large
fraction of the runtime.
parent ca3d14f2
...@@ -13,7 +13,7 @@ ...@@ -13,7 +13,7 @@
* *
* Copyright (c) 2001-2007, PostgreSQL Global Development Group * Copyright (c) 2001-2007, PostgreSQL Global Development Group
* *
* $PostgreSQL: pgsql/src/backend/postmaster/pgstat.c,v 1.152 2007/03/30 18:34:55 mha Exp $ * $PostgreSQL: pgsql/src/backend/postmaster/pgstat.c,v 1.153 2007/04/21 04:10:53 tgl Exp $
* ---------- * ----------
*/ */
#include "postgres.h" #include "postgres.h"
...@@ -114,6 +114,14 @@ static bool pgStatRunningInCollector = false; ...@@ -114,6 +114,14 @@ static bool pgStatRunningInCollector = false;
* Place where backends store per-table info to be sent to the collector. * Place where backends store per-table info to be sent to the collector.
* We store shared relations separately from non-shared ones, to be able to * We store shared relations separately from non-shared ones, to be able to
* send them in separate messages. * send them in separate messages.
*
* NOTE: once allocated, a PgStat_MsgTabstat struct belonging to a
* TabStatArray is never moved or deleted for the life of the backend.
* Also, we zero out the t_id fields of the contained PgStat_TableEntry
* structs whenever they are not actively in use. This allows PgStat_Info
* pointers to be treated as long-lived data, avoiding repeated searches in
* pgstat_initstats() when a relation is repeatedly heap_open'd or
* index_open'd during a transaction.
*/ */
typedef struct TabStatArray typedef struct TabStatArray
{ {
...@@ -169,6 +177,7 @@ static void pgstat_write_statsfile(void); ...@@ -169,6 +177,7 @@ static void pgstat_write_statsfile(void);
static HTAB *pgstat_read_statsfile(Oid onlydb); static HTAB *pgstat_read_statsfile(Oid onlydb);
static void backend_read_statsfile(void); static void backend_read_statsfile(void);
static void pgstat_read_current_status(void); static void pgstat_read_current_status(void);
static void pgstat_report_one_tabstat(TabStatArray *tsarr, Oid dbid);
static HTAB *pgstat_collect_oids(Oid catalogid); static HTAB *pgstat_collect_oids(Oid catalogid);
static void pgstat_setup_memcxt(void); static void pgstat_setup_memcxt(void);
...@@ -606,25 +615,22 @@ void allow_immediate_pgstat_restart(void) ...@@ -606,25 +615,22 @@ void allow_immediate_pgstat_restart(void)
void void
pgstat_report_tabstat(void) pgstat_report_tabstat(void)
{ {
int i;
if (pgStatSock < 0 ||
(!pgstat_collect_tuplelevel &&
!pgstat_collect_blocklevel))
{
/* Not reporting stats, so just flush whatever we have */
RegularTabStat.tsa_used = 0;
SharedTabStat.tsa_used = 0;
return;
}
/* /*
* For each message buffer used during the last query set the header * For each message buffer used during the last query set the header
* fields and send it out. * fields and send it out; then mark the entries unused.
*/ */
for (i = 0; i < RegularTabStat.tsa_used; i++) pgstat_report_one_tabstat(&RegularTabStat, MyDatabaseId);
pgstat_report_one_tabstat(&SharedTabStat, InvalidOid);
}
static void
pgstat_report_one_tabstat(TabStatArray *tsarr, Oid dbid)
{
int i;
for (i = 0; i < tsarr->tsa_used; i++)
{ {
PgStat_MsgTabstat *tsmsg = RegularTabStat.tsa_messages[i]; PgStat_MsgTabstat *tsmsg = tsarr->tsa_messages[i];
int n; int n;
int len; int len;
...@@ -637,32 +643,24 @@ pgstat_report_tabstat(void) ...@@ -637,32 +643,24 @@ pgstat_report_tabstat(void)
pgStatXactCommit = 0; pgStatXactCommit = 0;
pgStatXactRollback = 0; pgStatXactRollback = 0;
pgstat_setheader(&tsmsg->m_hdr, PGSTAT_MTYPE_TABSTAT); /*
tsmsg->m_databaseid = MyDatabaseId; * It's unlikely we'd get here with no socket, but maybe not
pgstat_send(tsmsg, len); * impossible
} */
RegularTabStat.tsa_used = 0; if (pgStatSock >= 0)
{
/* Ditto, for shared relations */ pgstat_setheader(&tsmsg->m_hdr, PGSTAT_MTYPE_TABSTAT);
for (i = 0; i < SharedTabStat.tsa_used; i++) tsmsg->m_databaseid = dbid;
{ pgstat_send(tsmsg, len);
PgStat_MsgTabstat *tsmsg = SharedTabStat.tsa_messages[i]; }
int n;
int len;
n = tsmsg->m_nentries;
len = offsetof(PgStat_MsgTabstat, m_entry[0]) +
n * sizeof(PgStat_TableEntry);
/* We don't report transaction commit/abort here */
tsmsg->m_xact_commit = 0;
tsmsg->m_xact_rollback = 0;
pgstat_setheader(&tsmsg->m_hdr, PGSTAT_MTYPE_TABSTAT); /*
tsmsg->m_databaseid = InvalidOid; * Zero out the entries, to mark them unused and prepare them
pgstat_send(tsmsg, len); * for next use.
*/
MemSet(tsmsg, 0, len);
} }
SharedTabStat.tsa_used = 0; tsarr->tsa_used = 0;
} }
...@@ -1013,7 +1011,7 @@ more_tabstat_space(TabStatArray *tsarr) ...@@ -1013,7 +1011,7 @@ more_tabstat_space(TabStatArray *tsarr)
newAlloc = tsarr->tsa_alloc + TABSTAT_QUANTUM; newAlloc = tsarr->tsa_alloc + TABSTAT_QUANTUM;
/* Create (another) quantum of message buffers */ /* Create (another) quantum of message buffers, and zero them */
newMessages = (PgStat_MsgTabstat *) newMessages = (PgStat_MsgTabstat *)
MemoryContextAllocZero(TopMemoryContext, MemoryContextAllocZero(TopMemoryContext,
sizeof(PgStat_MsgTabstat) * TABSTAT_QUANTUM); sizeof(PgStat_MsgTabstat) * TABSTAT_QUANTUM);
...@@ -1043,6 +1041,17 @@ more_tabstat_space(TabStatArray *tsarr) ...@@ -1043,6 +1041,17 @@ more_tabstat_space(TabStatArray *tsarr)
* of Relation or Scan structures. The data placed into these * of Relation or Scan structures. The data placed into these
* structures from here tell where later to count for buffer reads, * structures from here tell where later to count for buffer reads,
* scans and tuples fetched. * scans and tuples fetched.
*
* NOTE: PgStat_Info pointers in scan structures are really redundant
* with those in relcache entries. The passed stats pointer might point
* either to the Relation struct's own pgstat_info field, or to one in
* a scan structure; we'll set the Relation pgstat_info and copy it to
* the scan struct.
*
* We assume that a relcache entry's pgstat_info field is zeroed by
* relcache.c when the relcache entry is made; thereafter it is long-lived
* data. We can avoid repeated searches of the TabStat arrays when the
* same relation is touched repeatedly within a transaction.
* ---------- * ----------
*/ */
void void
...@@ -1055,21 +1064,31 @@ pgstat_initstats(PgStat_Info *stats, Relation rel) ...@@ -1055,21 +1064,31 @@ pgstat_initstats(PgStat_Info *stats, Relation rel)
int mb; int mb;
int i; int i;
/*
* Initialize data not to count at all.
*/
stats->tabentry = NULL;
if (pgStatSock < 0 || if (pgStatSock < 0 ||
!(pgstat_collect_tuplelevel || !(pgstat_collect_tuplelevel ||
pgstat_collect_blocklevel)) pgstat_collect_blocklevel))
{
/* We're not counting at all. */
stats->tabentry = NULL;
return; return;
}
tsarr = rel->rd_rel->relisshared ? &SharedTabStat : &RegularTabStat; /*
* If we already set up this relation in the current transaction,
* just copy the pointer.
*/
if (rel->pgstat_info.tabentry != NULL &&
((PgStat_TableEntry *) rel->pgstat_info.tabentry)->t_id == rel_id)
{
stats->tabentry = rel->pgstat_info.tabentry;
return;
}
/* /*
* Search the already-used message slots for this relation. * Search the already-used message slots for this relation.
*/ */
tsarr = rel->rd_rel->relisshared ? &SharedTabStat : &RegularTabStat;
for (mb = 0; mb < tsarr->tsa_used; mb++) for (mb = 0; mb < tsarr->tsa_used; mb++)
{ {
tsmsg = tsarr->tsa_messages[mb]; tsmsg = tsarr->tsa_messages[mb];
...@@ -1078,7 +1097,8 @@ pgstat_initstats(PgStat_Info *stats, Relation rel) ...@@ -1078,7 +1097,8 @@ pgstat_initstats(PgStat_Info *stats, Relation rel)
{ {
if (tsmsg->m_entry[i].t_id == rel_id) if (tsmsg->m_entry[i].t_id == rel_id)
{ {
stats->tabentry = (void *) &(tsmsg->m_entry[i]); rel->pgstat_info.tabentry = (void *) &(tsmsg->m_entry[i]);
stats->tabentry = rel->pgstat_info.tabentry;
return; return;
} }
} }
...@@ -1088,13 +1108,14 @@ pgstat_initstats(PgStat_Info *stats, Relation rel) ...@@ -1088,13 +1108,14 @@ pgstat_initstats(PgStat_Info *stats, Relation rel)
/* /*
* Not found, but found a message buffer with an empty slot instead. * Not found, but found a message buffer with an empty slot instead.
* Fine, let's use this one. * Fine, let's use this one. We assume the entry was already zeroed,
* either at creation or after last use.
*/ */
i = tsmsg->m_nentries++; i = tsmsg->m_nentries++;
useent = &tsmsg->m_entry[i]; useent = &tsmsg->m_entry[i];
MemSet(useent, 0, sizeof(PgStat_TableEntry));
useent->t_id = rel_id; useent->t_id = rel_id;
stats->tabentry = (void *) useent; rel->pgstat_info.tabentry = (void *) useent;
stats->tabentry = rel->pgstat_info.tabentry;
return; return;
} }
...@@ -1111,9 +1132,9 @@ pgstat_initstats(PgStat_Info *stats, Relation rel) ...@@ -1111,9 +1132,9 @@ pgstat_initstats(PgStat_Info *stats, Relation rel)
tsmsg = tsarr->tsa_messages[mb]; tsmsg = tsarr->tsa_messages[mb];
tsmsg->m_nentries = 1; tsmsg->m_nentries = 1;
useent = &tsmsg->m_entry[0]; useent = &tsmsg->m_entry[0];
MemSet(useent, 0, sizeof(PgStat_TableEntry));
useent->t_id = rel_id; useent->t_id = rel_id;
stats->tabentry = (void *) useent; rel->pgstat_info.tabentry = (void *) useent;
stats->tabentry = rel->pgstat_info.tabentry;
} }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment