#include "catalog/indexing.h"
#include "catalog/namespace.h"
#include "catalog/pg_autovacuum.h"
+#include "catalog/pg_database.h"
#include "commands/vacuum.h"
#include "libpq/hba.h"
#include "libpq/pqsignal.h"
int autovacuum_anl_thresh;
double autovacuum_anl_scale;
+int autovacuum_vac_cost_delay;
+int autovacuum_vac_cost_limit;
+
/* Flag to tell if we are in the autovacuum daemon process */
static bool am_autovacuum = false;
static time_t last_autovac_start_time = 0;
static time_t last_autovac_stop_time = 0;
+/* Memory context for long-lived data */
+static MemoryContext AutovacMemCxt;
+
/* struct to keep list of candidate databases for vacuum */
typedef struct autovac_dbase
{
Oid oid;
char *name;
TransactionId frozenxid;
+ TransactionId vacuumxid;
PgStat_StatDBEntry *entry;
int32 age;
} autovac_dbase;
+/* struct to keep track of tables to vacuum and/or analyze */
+typedef struct autovac_table
+{
+ Oid relid;
+ bool dovacuum;
+ bool doanalyze;
+ int vacuum_cost_delay;
+ int vacuum_cost_limit;
+} autovac_table;
+
#ifdef EXEC_BACKEND
static pid_t autovac_forkexec(void);
#endif
NON_EXEC_STATIC void AutoVacMain(int argc, char *argv[]);
-static void do_autovacuum(bool whole_db, PgStat_StatDBEntry *dbentry);
+static void process_whole_db(void);
+static void do_autovacuum(PgStat_StatDBEntry *dbentry);
static List *autovac_get_database_list(void);
static void test_rel_for_autovac(Oid relid, PgStat_StatTabEntry *tabentry,
Form_pg_class classForm, Form_pg_autovacuum avForm,
- List **vacuum_tables, List **analyze_tables);
-static void autovacuum_do_vac_analyze(List *relids, bool dovacuum);
+ List **vacuum_tables);
+static void autovacuum_do_vac_analyze(List *relids, bool dovacuum,
+ bool doanalyze, bool freeze);
/*
/* Lose the postmaster's on-exit routines */
on_exit_reset();
+ /* Identify myself via ps */
+ init_ps_display("autovacuum process", "", "");
+ set_ps_display("");
+
+ SetProcessingMode(InitProcessing);
+
/*
* Set up signal handlers. We operate on databases much like a
* regular backend, so we use the same signal handling. See
pqsignal(SIGUSR1, CatchupInterruptHandler);
/* We don't listen for async notifies */
pqsignal(SIGUSR2, SIG_IGN);
+ pqsignal(SIGFPE, FloatExceptionHandler);
pqsignal(SIGCHLD, SIG_DFL);
- /* Identify myself via ps */
- init_ps_display("autovacuum process", "", "");
- set_ps_display("");
-
/* Early initialization */
BaseInit();
{
autovac_dbase *tmp = lfirst(cell);
bool this_whole_db;
+ int32 freeze_age,
+ vacuum_age;
/*
* We look for the database that most urgently needs a database-wide
* transactions sooner than vacuum.c's vac_truncate_clog() would
* decide to start giving warnings. If any such db is found, we
* ignore all other dbs.
+ *
+ * Unlike vacuum.c, we also look at vacuumxid. This is so that
+ * pg_clog can be kept trimmed to a reasonable size.
*/
- tmp->age = (int32) (nextXid - tmp->frozenxid);
- this_whole_db = (tmp->age > (int32) ((MaxTransactionId >> 3) * 3 - 100000));
+ freeze_age = (int32) (nextXid - tmp->frozenxid);
+ vacuum_age = (int32) (nextXid - tmp->vacuumxid);
+ tmp->age = Max(freeze_age, vacuum_age);
+
+ this_whole_db = (tmp->age >
+ (int32) ((MaxTransactionId >> 3) * 3 - 100000));
if (whole_db || this_whole_db)
{
if (!this_whole_db)
set_ps_display(db->name);
ereport(LOG,
(errmsg("autovacuum: processing database \"%s\"", db->name)));
+
+ /* Create the memory context where cross-transaction state is stored */
+ AutovacMemCxt = AllocSetContextCreate(TopMemoryContext,
+ "Autovacuum context",
+ ALLOCSET_DEFAULT_MINSIZE,
+ ALLOCSET_DEFAULT_INITSIZE,
+ ALLOCSET_DEFAULT_MAXSIZE);
+
/*
- * And do an appropriate amount of work on it
+ * And do an appropriate amount of work
*/
- do_autovacuum(whole_db, db->entry);
+ if (whole_db)
+ process_whole_db();
+ else
+ do_autovacuum(db->entry);
}
/* One iteration done, go away */
Oid db_id;
Oid db_tablespace;
TransactionId db_frozenxid;
+ TransactionId db_vacuumxid;
filename = database_getflatfilename();
db_file = AllocateFile(filename, "r");
errmsg("could not open file \"%s\": %m", filename)));
while (read_pg_database_line(db_file, thisname, &db_id,
- &db_tablespace, &db_frozenxid))
+ &db_tablespace, &db_frozenxid,
+ &db_vacuumxid))
{
autovac_dbase *db;
db->oid = db_id;
db->name = pstrdup(thisname);
db->frozenxid = db_frozenxid;
+ db->vacuumxid = db_vacuumxid;
/* these get set later: */
db->entry = NULL;
db->age = 0;
}
/*
- * Process a database.
- *
- * If whole_db is true, the database is processed as a whole, and the
- * dbentry parameter is ignored. If it's false, dbentry must be a valid
- * pointer to the database entry in the stats databases' hash table, and
- * it will be used to determine whether vacuum or analyze is needed on a
- * per-table basis.
+ * Process a whole database. If it's a template database or is disallowing
+ * connection by means of datallowconn=false, then issue a VACUUM FREEZE.
+ * Else use a plain VACUUM.
+ */
+static void
+process_whole_db(void)
+{
+ Relation dbRel;
+ ScanKeyData entry[1];
+ SysScanDesc scan;
+ HeapTuple tup;
+ Form_pg_database dbForm;
+ bool freeze;
+
+ /* Start a transaction so our commands have one to play into. */
+ StartTransactionCommand();
+
+ dbRel = heap_open(DatabaseRelationId, AccessShareLock);
+
+ /* Must use a table scan, since there's no syscache for pg_database */
+ ScanKeyInit(&entry[0],
+ ObjectIdAttributeNumber,
+ BTEqualStrategyNumber, F_OIDEQ,
+ ObjectIdGetDatum(MyDatabaseId));
+
+ scan = systable_beginscan(dbRel, DatabaseOidIndexId, true,
+ SnapshotNow, 1, entry);
+
+ tup = systable_getnext(scan);
+
+ if (!HeapTupleIsValid(tup))
+ elog(ERROR, "could not find tuple for database %u", MyDatabaseId);
+
+ dbForm = (Form_pg_database) GETSTRUCT(tup);
+
+ if (!dbForm->datallowconn || dbForm->datistemplate)
+ freeze = true;
+ else
+ freeze = false;
+
+ systable_endscan(scan);
+
+ heap_close(dbRel, AccessShareLock);
+
+ elog(DEBUG2, "autovacuum: VACUUM%s whole database",
+ (freeze) ? " FREEZE" : "");
+
+ autovacuum_do_vac_analyze(NIL, true, false, freeze);
+
+ /* Finally close out the last transaction. */
+ CommitTransactionCommand();
+}
+
+/*
+ * Process a database table-by-table
*
- * Note that test_rel_for_autovac generates two separate lists, one for
- * vacuum and other for analyze. This is to facilitate processing all
- * analyzes first, and then all vacuums.
+ * dbentry must be a valid pointer to the database entry in the stats
+ * databases' hash table, and it will be used to determine whether vacuum or
+ * analyze is needed on a per-table basis.
*
* Note that CHECK_FOR_INTERRUPTS is supposed to be used in certain spots in
* order not to ignore shutdown commands for too long.
*/
static void
-do_autovacuum(bool whole_db, PgStat_StatDBEntry *dbentry)
+do_autovacuum(PgStat_StatDBEntry *dbentry)
{
Relation classRel,
avRel;
HeapTuple tuple;
HeapScanDesc relScan;
- List *vacuum_tables = NIL,
- *analyze_tables = NIL;
- MemoryContext AutovacMemCxt;
-
- Assert(whole_db || PointerIsValid(dbentry));
-
- /* Memory context where cross-transaction state is stored */
- AutovacMemCxt = AllocSetContextCreate(TopMemoryContext,
- "Autovacuum context",
- ALLOCSET_DEFAULT_MINSIZE,
- ALLOCSET_DEFAULT_INITSIZE,
- ALLOCSET_DEFAULT_MAXSIZE);
+ List *vacuum_tables = NIL;
+ ListCell *cell;
+ PgStat_StatDBEntry *shared;
/* Start a transaction so our commands have one to play into. */
StartTransactionCommand();
*/
MemoryContextSwitchTo(AutovacMemCxt);
- if (whole_db)
- {
- elog(DEBUG2, "autovacuum: VACUUM ANALYZE whole database");
- autovacuum_do_vac_analyze(NIL, true);
- }
- else
- {
- /* the hash entry where pgstat stores shared relations */
- PgStat_StatDBEntry *shared = pgstat_fetch_stat_dbentry(InvalidOid);
-
- classRel = heap_open(RelationRelationId, AccessShareLock);
- avRel = heap_open(AutovacuumRelationId, AccessShareLock);
-
- relScan = heap_beginscan(classRel, SnapshotNow, 0, NULL);
+ /* The database hash where pgstat keeps shared relations */
+ shared = pgstat_fetch_stat_dbentry(InvalidOid);
- /* Scan pg_class looking for tables to vacuum */
- while ((tuple = heap_getnext(relScan, ForwardScanDirection)) != NULL)
- {
- Form_pg_class classForm = (Form_pg_class) GETSTRUCT(tuple);
- Form_pg_autovacuum avForm = NULL;
- PgStat_StatTabEntry *tabentry;
- SysScanDesc avScan;
- HeapTuple avTup;
- ScanKeyData entry[1];
- Oid relid;
-
- /* Skip non-table entries. */
- /* XXX possibly allow RELKIND_TOASTVALUE entries here too? */
- if (classForm->relkind != RELKIND_RELATION)
- continue;
+ classRel = heap_open(RelationRelationId, AccessShareLock);
+ avRel = heap_open(AutovacuumRelationId, AccessShareLock);
- /*
- * Skip temp tables (i.e. those in temp namespaces). We cannot
- * safely process other backends' temp tables.
- */
- if (isTempNamespace(classForm->relnamespace))
- continue;
+ relScan = heap_beginscan(classRel, SnapshotNow, 0, NULL);
- relid = HeapTupleGetOid(tuple);
+ /* Scan pg_class looking for tables to vacuum */
+ while ((tuple = heap_getnext(relScan, ForwardScanDirection)) != NULL)
+ {
+ Form_pg_class classForm = (Form_pg_class) GETSTRUCT(tuple);
+ Form_pg_autovacuum avForm = NULL;
+ PgStat_StatTabEntry *tabentry;
+ SysScanDesc avScan;
+ HeapTuple avTup;
+ ScanKeyData entry[1];
+ Oid relid;
+
+ /* Skip non-table entries. */
+ /* XXX possibly allow RELKIND_TOASTVALUE entries here too? */
+ if (classForm->relkind != RELKIND_RELATION)
+ continue;
- /* See if we have a pg_autovacuum entry for this relation. */
- ScanKeyInit(&entry[0],
- Anum_pg_autovacuum_vacrelid,
- BTEqualStrategyNumber, F_OIDEQ,
- ObjectIdGetDatum(relid));
+ /*
+ * Skip temp tables (i.e. those in temp namespaces). We cannot
+ * safely process other backends' temp tables.
+ */
+ if (isTempNamespace(classForm->relnamespace))
+ continue;
- avScan = systable_beginscan(avRel, AutovacuumRelidIndexId, true,
- SnapshotNow, 1, entry);
+ relid = HeapTupleGetOid(tuple);
- avTup = systable_getnext(avScan);
+ /* See if we have a pg_autovacuum entry for this relation. */
+ ScanKeyInit(&entry[0],
+ Anum_pg_autovacuum_vacrelid,
+ BTEqualStrategyNumber, F_OIDEQ,
+ ObjectIdGetDatum(relid));
- if (HeapTupleIsValid(avTup))
- avForm = (Form_pg_autovacuum) GETSTRUCT(avTup);
+ avScan = systable_beginscan(avRel, AutovacuumRelidIndexId, true,
+ SnapshotNow, 1, entry);
- if (classForm->relisshared && PointerIsValid(shared))
- tabentry = hash_search(shared->tables, &relid,
- HASH_FIND, NULL);
- else
- tabentry = hash_search(dbentry->tables, &relid,
- HASH_FIND, NULL);
+ avTup = systable_getnext(avScan);
- test_rel_for_autovac(relid, tabentry, classForm, avForm,
- &vacuum_tables, &analyze_tables);
+ if (HeapTupleIsValid(avTup))
+ avForm = (Form_pg_autovacuum) GETSTRUCT(avTup);
- systable_endscan(avScan);
- }
+ if (classForm->relisshared && PointerIsValid(shared))
+ tabentry = hash_search(shared->tables, &relid,
+ HASH_FIND, NULL);
+ else
+ tabentry = hash_search(dbentry->tables, &relid,
+ HASH_FIND, NULL);
- heap_endscan(relScan);
- heap_close(avRel, AccessShareLock);
- heap_close(classRel, AccessShareLock);
+ test_rel_for_autovac(relid, tabentry, classForm, avForm,
+ &vacuum_tables);
- CHECK_FOR_INTERRUPTS();
+ systable_endscan(avScan);
+ }
- /*
- * Perform operations on collected tables.
- */
+ heap_endscan(relScan);
+ heap_close(avRel, AccessShareLock);
+ heap_close(classRel, AccessShareLock);
- if (analyze_tables)
- autovacuum_do_vac_analyze(analyze_tables, false);
+ /*
+ * Perform operations on collected tables.
+ */
+ foreach(cell, vacuum_tables)
+ {
+ autovac_table *tab = lfirst(cell);
CHECK_FOR_INTERRUPTS();
- /* get back to proper context */
- MemoryContextSwitchTo(AutovacMemCxt);
+ /* Set the vacuum cost parameters for this table */
+ VacuumCostDelay = tab->vacuum_cost_delay;
+ VacuumCostLimit = tab->vacuum_cost_limit;
- if (vacuum_tables)
- autovacuum_do_vac_analyze(vacuum_tables, true);
+ autovacuum_do_vac_analyze(list_make1_oid(tab->relid),
+ tab->dovacuum,
+ tab->doanalyze,
+ false);
}
/* Finally close out the last transaction. */
* test_rel_for_autovac
*
* Check whether a table needs to be vacuumed or analyzed. Add it to the
- * respective list if so.
+ * output list if so.
*
* A table needs to be vacuumed if the number of dead tuples exceeds a
* threshold. This threshold is calculated as
test_rel_for_autovac(Oid relid, PgStat_StatTabEntry *tabentry,
Form_pg_class classForm,
Form_pg_autovacuum avForm,
- List **vacuum_tables, List **analyze_tables)
+ List **vacuum_tables)
{
Relation rel;
float4 reltuples; /* pg_class.reltuples */
/* number of vacuum (resp. analyze) tuples at this time */
float4 vactuples,
anltuples;
+ /* cost-based vacuum delay parameters */
+ int vac_cost_limit;
+ int vac_cost_delay;
+ bool dovacuum;
+ bool doanalyze;
/* User disabled it in pg_autovacuum? */
if (avForm && !avForm->enabled)
*/
if (avForm != NULL)
{
- vac_scale_factor = (avForm->vac_scale_factor < 0) ?
- autovacuum_vac_scale : avForm->vac_scale_factor;
- vac_base_thresh = (avForm->vac_base_thresh < 0) ?
- autovacuum_vac_thresh : avForm->vac_base_thresh;
-
- anl_scale_factor = (avForm->anl_scale_factor < 0) ?
- autovacuum_anl_scale : avForm->anl_scale_factor;
- anl_base_thresh = (avForm->anl_base_thresh < 0) ?
- autovacuum_anl_thresh : avForm->anl_base_thresh;
+ vac_scale_factor = (avForm->vac_scale_factor >= 0) ?
+ avForm->vac_scale_factor : autovacuum_vac_scale;
+ vac_base_thresh = (avForm->vac_base_thresh >= 0) ?
+ avForm->vac_base_thresh : autovacuum_vac_thresh;
+
+ anl_scale_factor = (avForm->anl_scale_factor >= 0) ?
+ avForm->anl_scale_factor : autovacuum_anl_scale;
+ anl_base_thresh = (avForm->anl_base_thresh >= 0) ?
+ avForm->anl_base_thresh : autovacuum_anl_thresh;
+
+ vac_cost_limit = (avForm->vac_cost_limit >= 0) ?
+ avForm->vac_cost_limit :
+ ((autovacuum_vac_cost_limit >= 0) ?
+ autovacuum_vac_cost_limit : VacuumCostLimit);
+
+ vac_cost_delay = (avForm->vac_cost_delay >= 0) ?
+ avForm->vac_cost_delay :
+ ((autovacuum_vac_cost_delay >= 0) ?
+ autovacuum_vac_cost_delay : VacuumCostDelay);
}
else
{
anl_scale_factor = autovacuum_anl_scale;
anl_base_thresh = autovacuum_anl_thresh;
+
+ vac_cost_limit = (autovacuum_vac_cost_limit >= 0) ?
+ autovacuum_vac_cost_limit : VacuumCostLimit;
+
+ vac_cost_delay = (autovacuum_vac_cost_delay >= 0) ?
+ autovacuum_vac_cost_delay : VacuumCostDelay;
}
vacthresh = (float4) vac_base_thresh + vac_scale_factor * reltuples;
RelationGetRelationName(rel),
vactuples, vacthresh, anltuples, anlthresh);
+ Assert(CurrentMemoryContext == AutovacMemCxt);
+
/* Determine if this table needs vacuum or analyze. */
- if (vactuples > vacthresh)
+ dovacuum = (vactuples > vacthresh);
+ doanalyze = (anltuples > anlthresh);
+
+ /* ANALYZE refuses to work with pg_statistics */
+ if (relid == StatisticRelationId)
+ doanalyze = false;
+
+ if (dovacuum || doanalyze)
{
- elog(DEBUG2, "will VACUUM ANALYZE %s",
+ autovac_table *tab;
+
+ elog(DEBUG2, "will%s%s %s",
+ (dovacuum ? " VACUUM" : ""),
+ (doanalyze ? " ANALYZE" : ""),
RelationGetRelationName(rel));
- *vacuum_tables = lappend_oid(*vacuum_tables, relid);
- }
- else if (anltuples > anlthresh)
- {
- /* ANALYZE refuses to work with pg_statistics */
- if (relid != StatisticRelationId)
- {
- elog(DEBUG2, "will ANALYZE %s",
- RelationGetRelationName(rel));
- *analyze_tables = lappend_oid(*analyze_tables, relid);
- }
+
+ tab = (autovac_table *) palloc(sizeof(autovac_table));
+ tab->relid = relid;
+ tab->dovacuum = dovacuum;
+ tab->doanalyze = doanalyze;
+ tab->vacuum_cost_limit = vac_cost_limit;
+ tab->vacuum_cost_delay = vac_cost_delay;
+
+ *vacuum_tables = lappend(*vacuum_tables, tab);
}
RelationClose(rel);
/*
* autovacuum_do_vac_analyze
- * Vacuum or analyze a list of tables; or all tables if relids = NIL
- *
- * We must be in AutovacMemCxt when this routine is called.
+ * Vacuum and/or analyze a list of tables; or all tables if relids = NIL
*/
static void
-autovacuum_do_vac_analyze(List *relids, bool dovacuum)
+autovacuum_do_vac_analyze(List *relids, bool dovacuum, bool doanalyze,
+ bool freeze)
{
- VacuumStmt *vacstmt = makeNode(VacuumStmt);
+ VacuumStmt *vacstmt;
+ MemoryContext old_cxt;
+
+ /*
+ * The node must survive transaction boundaries, so make sure we create it
+ * in a long-lived context
+ */
+ old_cxt = MemoryContextSwitchTo(AutovacMemCxt);
+
+ vacstmt = makeNode(VacuumStmt);
/*
* Point QueryContext to the autovac memory context to fake out the
/* Set up command parameters */
vacstmt->vacuum = dovacuum;
vacstmt->full = false;
- vacstmt->analyze = true;
- vacstmt->freeze = false;
+ vacstmt->analyze = doanalyze;
+ vacstmt->freeze = freeze;
vacstmt->verbose = false;
vacstmt->relation = NULL; /* all tables, or not used if relids != NIL */
vacstmt->va_cols = NIL;
vacuum(vacstmt, relids);
+
+ pfree(vacstmt);
+ MemoryContextSwitchTo(old_cxt);
}
/*
#include <math.h>
#include <unistd.h>
+#include "access/genam.h"
#include "access/heapam.h"
#include "catalog/catalog.h"
+#include "catalog/indexing.h"
#include "catalog/namespace.h"
#include "catalog/pg_authid.h"
#include "catalog/pg_database.h"
char *filename;
FILE *db_file;
char thisname[NAMEDATALEN];
- TransactionId frozenxid;
+ TransactionId dummyxid;
filename = database_getflatfilename();
db_file = AllocateFile(filename, "r");
errmsg("could not open file \"%s\": %m", filename)));
while (read_pg_database_line(db_file, thisname, db_id,
- db_tablespace, &frozenxid))
+ db_tablespace, &dummyxid,
+ &dummyxid))
{
if (strcmp(thisname, name) == 0)
{
ReverifyMyDatabase(const char *name)
{
Relation pgdbrel;
- HeapScanDesc pgdbscan;
+ SysScanDesc pgdbscan;
ScanKeyData key;
HeapTuple tup;
Form_pg_database dbform;
BTEqualStrategyNumber, F_NAMEEQ,
NameGetDatum(name));
- pgdbscan = heap_beginscan(pgdbrel, SnapshotNow, 1, &key);
+ pgdbscan = systable_beginscan(pgdbrel, DatabaseNameIndexId, true,
+ SnapshotNow, 1, &key);
- tup = heap_getnext(pgdbscan, ForwardScanDirection);
+ tup = systable_getnext(pgdbscan);
if (!HeapTupleIsValid(tup) ||
HeapTupleGetOid(tup) != MyDatabaseId)
{
}
}
- heap_endscan(pgdbscan);
+ systable_endscan(pgdbscan);
heap_close(pgdbrel, RowShareLock);
}
/* Initialize portal manager */
EnablePortalManager();
+ /*
+ * Set up process-exit callback to do pre-shutdown cleanup. This
+ * has to be after we've initialized all the low-level modules
+ * like the buffer manager, because during shutdown this has to
+ * run before the low-level modules start to close down. On the
+ * other hand, we want it in place before we begin our first
+ * transaction --- if we fail during the initialization transaction,
+ * as is entirely possible, we need the AbortTransaction call to
+ * clean up.
+ */
+ on_shmem_exit(ShutdownPostgres, 0);
+
/* start a new transaction here before access to db */
if (!bootstrap)
StartTransactionCommand();
/*
* Unless we are bootstrapping, double-check that InitMyDatabaseInfo()
* got a correct result. We can't do this until all the
- * database-access infrastructure is up.
+ * database-access infrastructure is up. (Also, it wants to know if
+ * the user is a superuser, so the above stuff has to happen first.)
*/
if (!bootstrap)
ReverifyMyDatabase(dbname);
/* initialize client encoding */
InitializeClientEncoding();
- /*
- * Initialize statistics collection for this backend. We do this
- * here because the shutdown hook it sets up needs to be invoked
- * at the corresponding phase of backend shutdown: after
- * ShutdownPostgres and before we drop access to shared memory.
- */
+ /* initialize statistics collection for this backend */
if (IsUnderPostmaster)
pgstat_bestart();
- /*
- * Set up process-exit callback to do pre-shutdown cleanup. This
- * should be last because we want shmem_exit to call this routine
- * before the exit callbacks that are registered by buffer manager,
- * lock manager, etc. We need to run this code before we close down
- * database access!
- */
- on_shmem_exit(ShutdownPostgres, 0);
-
/* close the transaction we started above */
if (!bootstrap)
CommitTransactionCommand();
/*
* Backend-shutdown callback. Do cleanup that we want to be sure happens
* before all the supporting modules begin to nail their doors shut via
- * their own callbacks. Note that because this has to be registered very
- * late in startup, it will not get called if we suffer a failure *during*
- * startup.
+ * their own callbacks.
*
* User-level cleanup, such as temp-relation removal and UNLISTEN, happens
* via separate callbacks that execute before this one. We don't combine the