different coding here.
I wrote:
What I think we need to do about this is
(1) fix pgstat_vacuum_tabstat to have non-O(N^2) behavior; I'm thinking
of using a hash table for the OIDs instead of a linear list. Should be
a pretty small change; I'll work on it today.
I've applied the attached patch to 8.2 to do the above. Please give it
a try and see how much it helps for you. Some limited testing here
confirms a noticeable improvement in VACUUM startup time at 10000
tables, and of course the unpatched O(N^2) behavior should be 100X
worse with 100000 tables.
I am still confused why you didn't see the problem in 8.1, though.
This code is just about exactly the same in 8.1. Maybe you changed
your stats collector settings when moving to 8.2?
regards, tom lane
Index: pgstat.c
===================================================================
RCS file: /cvsroot/pgsql/src/backend/postmaster/pgstat.c,v
retrieving revision 1.140
diff -c -r1.140 pgstat.c
*** pgstat.c 21 Nov 2006 20:59:52 -0000 1.140
--- pgstat.c 11 Jan 2007 22:32:30 -0000
***************
*** 159,164 ****
--- 159,165 ----
static void pgstat_read_statsfile(HTAB **dbhash, Oid onlydb);
static void backend_read_statsfile(void);
static void pgstat_read_current_status(void);
+ static HTAB *pgstat_collect_oids(Oid catalogid);
static void pgstat_setheader(PgStat_MsgHdr *hdr, StatMsgType mtype);
static void pgstat_send(void *msg, int len);
***************
*** 657,666 ****
void
pgstat_vacuum_tabstat(void)
{
! List *oidlist;
! Relation rel;
! HeapScanDesc scan;
! HeapTuple tup;
PgStat_MsgTabpurge msg;
HASH_SEQ_STATUS hstat;
PgStat_StatDBEntry *dbentry;
--- 658,664 ----
void
pgstat_vacuum_tabstat(void)
{
! HTAB *htab;
PgStat_MsgTabpurge msg;
HASH_SEQ_STATUS hstat;
PgStat_StatDBEntry *dbentry;
***************
*** 679,693 ****
/*
* Read pg_database and make a list of OIDs of all existing databases
*/
! oidlist = NIL;
! rel = heap_open(DatabaseRelationId, AccessShareLock);
! scan = heap_beginscan(rel, SnapshotNow, 0, NULL);
! while ((tup = heap_getnext(scan, ForwardScanDirection)) != NULL)
! {
! oidlist = lappend_oid(oidlist, HeapTupleGetOid(tup));
! }
! heap_endscan(scan);
! heap_close(rel, AccessShareLock);
/*
* Search the database hash table for dead databases and tell the
--- 677,683 ----
/*
* Read pg_database and make a list of OIDs of all existing databases
*/
! htab = pgstat_collect_oids(DatabaseRelationId);
/*
* Search the database hash table for dead databases and tell the
***************
*** 698,709 ****
{
Oid dbid = dbentry->databaseid;
! if (!list_member_oid(oidlist, dbid))
pgstat_drop_database(dbid);
}
/* Clean up */
! list_free(oidlist);
/*
* Lookup our own database entry; if not found, nothing more to do.
--- 688,701 ----
{
Oid dbid = dbentry->databaseid;
! CHECK_FOR_INTERRUPTS();
!
! if (hash_search(htab, (void *) &dbid, HASH_FIND, NULL) == NULL)
pgstat_drop_database(dbid);
}
/* Clean up */
! hash_destroy(htab);
/*
* Lookup our own database entry; if not found, nothing more to do.
***************
*** 717,731 ****
/*
* Similarly to above, make a list of all known relations in this DB.
*/
! oidlist = NIL;
! rel = heap_open(RelationRelationId, AccessShareLock);
! scan = heap_beginscan(rel, SnapshotNow, 0, NULL);
! while ((tup = heap_getnext(scan, ForwardScanDirection)) != NULL)
! {
! oidlist = lappend_oid(oidlist, HeapTupleGetOid(tup));
! }
! heap_endscan(scan);
! heap_close(rel, AccessShareLock);
/*
* Initialize our messages table counter to zero
--- 709,715 ----
/*
* Similarly to above, make a list of all known relations in this DB.
*/
! htab = pgstat_collect_oids(RelationRelationId);
/*
* Initialize our messages table counter to zero
***************
*** 738,750 ****
hash_seq_init(&hstat, dbentry->tables);
while ((tabentry = (PgStat_StatTabEntry *) hash_seq_search(&hstat)) != NULL)
{
! if (list_member_oid(oidlist, tabentry->tableid))
continue;
/*
* Not there, so add this table's Oid to the message
*/
! msg.m_tableid[msg.m_nentries++] = tabentry->tableid;
/*
* If the message is full, send it out and reinitialize to empty
--- 722,738 ----
hash_seq_init(&hstat, dbentry->tables);
while ((tabentry = (PgStat_StatTabEntry *) hash_seq_search(&hstat)) != NULL)
{
! Oid tabid = tabentry->tableid;
!
! CHECK_FOR_INTERRUPTS();
!
! if (hash_search(htab, (void *) &tabid, HASH_FIND, NULL) != NULL)
continue;
/*
* Not there, so add this table's Oid to the message
*/
! msg.m_tableid[msg.m_nentries++] = tabid;
/*
* If the message is full, send it out and reinitialize to empty
***************
*** 776,782 ****
}
/* Clean up */
! list_free(oidlist);
}
--- 764,813 ----
}
/* Clean up */
! hash_destroy(htab);
! }
!
!
! /* ----------
! * pgstat_collect_oids() -
! *
! * Collect the OIDs of either all databases or all tables, according to
! * the parameter, into a temporary hash table. Caller should hash_destroy
! * the result when done with it.
! * ----------
! */
! static HTAB *
! pgstat_collect_oids(Oid catalogid)
! {
! HTAB *htab;
! HASHCTL hash_ctl;
! Relation rel;
! HeapScanDesc scan;
! HeapTuple tup;
!
! memset(&hash_ctl, 0, sizeof(hash_ctl));
! hash_ctl.keysize = sizeof(Oid);
! hash_ctl.entrysize = sizeof(Oid);
! hash_ctl.hash = oid_hash;
! htab = hash_create("Temporary table of OIDs",
! PGSTAT_TAB_HASH_SIZE,
! &hash_ctl,
! HASH_ELEM | HASH_FUNCTION);
!
! rel = heap_open(catalogid, AccessShareLock);
! scan = heap_beginscan(rel, SnapshotNow, 0, NULL);
! while ((tup = heap_getnext(scan, ForwardScanDirection)) != NULL)
! {
! Oid thisoid = HeapTupleGetOid(tup);
!
! CHECK_FOR_INTERRUPTS();
!
! (void) hash_search(htab, (void *) &thisoid, HASH_ENTER, NULL);
! }
! heap_endscan(scan);
! heap_close(rel, AccessShareLock);
!
! return htab;
}