PostgreSQL Source Code  git master
vacuum.h
Go to the documentation of this file.
1 /*-------------------------------------------------------------------------
2  *
3  * vacuum.h
4  * header file for postgres vacuum cleaner and statistics analyzer
5  *
6  *
7  * Portions Copyright (c) 1996-2024, PostgreSQL Global Development Group
8  * Portions Copyright (c) 1994, Regents of the University of California
9  *
10  * src/include/commands/vacuum.h
11  *
12  *-------------------------------------------------------------------------
13  */
14 #ifndef VACUUM_H
15 #define VACUUM_H
16 
17 #include "access/htup.h"
18 #include "access/genam.h"
19 #include "access/parallel.h"
20 #include "catalog/pg_class.h"
21 #include "catalog/pg_statistic.h"
22 #include "catalog/pg_type.h"
23 #include "parser/parse_node.h"
24 #include "storage/buf.h"
25 #include "storage/lock.h"
26 #include "utils/relcache.h"
27 
28 /*
29  * Flags for amparallelvacuumoptions to control the participation of bulkdelete
30  * and vacuumcleanup in parallel vacuum.
31  */
32 
33 /*
34  * Both bulkdelete and vacuumcleanup are disabled by default. This will be
35  * used by IndexAM's that don't want to or cannot participate in parallel
36  * vacuum. For example, if an index AM doesn't have a way to communicate the
37  * index statistics allocated by the first ambulkdelete call to the subsequent
38  * ones until amvacuumcleanup, the index AM cannot participate in parallel
39  * vacuum.
40  */
41 #define VACUUM_OPTION_NO_PARALLEL 0
42 
43 /*
44  * bulkdelete can be performed in parallel. This option can be used by
45  * index AMs that need to scan indexes to delete tuples.
46  */
47 #define VACUUM_OPTION_PARALLEL_BULKDEL (1 << 0)
48 
49 /*
50  * vacuumcleanup can be performed in parallel if bulkdelete is not performed
51  * yet. This will be used by IndexAM's that can scan the index if the
52  * bulkdelete is not performed.
53  */
54 #define VACUUM_OPTION_PARALLEL_COND_CLEANUP (1 << 1)
55 
56 /*
57  * vacuumcleanup can be performed in parallel even if bulkdelete has already
58  * processed the index. This will be used by IndexAM's that scan the index
59  * during the cleanup phase of index irrespective of whether the index is
60  * already scanned or not during bulkdelete phase.
61  */
62 #define VACUUM_OPTION_PARALLEL_CLEANUP (1 << 2)
63 
64 /* value for checking vacuum flags */
65 #define VACUUM_OPTION_MAX_VALID_VALUE ((1 << 3) - 1)
66 
67 /* Abstract type for parallel vacuum state */
69 
70 /*----------
71  * ANALYZE builds one of these structs for each attribute (column) that is
72  * to be analyzed. The struct and subsidiary data are in anl_context,
73  * so they live until the end of the ANALYZE operation.
74  *
75  * The type-specific typanalyze function is passed a pointer to this struct
76  * and must return true to continue analysis, false to skip analysis of this
77  * column. In the true case it must set the compute_stats and minrows fields,
78  * and can optionally set extra_data to pass additional info to compute_stats.
79  * minrows is its request for the minimum number of sample rows to be gathered
80  * (but note this request might not be honored, eg if there are fewer rows
81  * than that in the table).
82  *
83  * The compute_stats routine will be called after sample rows have been
84  * gathered. Aside from this struct, it is passed:
85  * fetchfunc: a function for accessing the column values from the
86  * sample rows
87  * samplerows: the number of sample tuples
88  * totalrows: estimated total number of rows in relation
89  * The fetchfunc may be called with rownum running from 0 to samplerows-1.
90  * It returns a Datum and an isNull flag.
91  *
92  * compute_stats should set stats_valid true if it is able to compute
93  * any useful statistics. If it does, the remainder of the struct holds
94  * the information to be stored in a pg_statistic row for the column. Be
95  * careful to allocate any pointed-to data in anl_context, which will NOT
96  * be CurrentMemoryContext when compute_stats is called.
97  *
98  * Note: all comparisons done for statistical purposes should use the
99  * underlying column's collation (attcollation), except in situations
100  * where a noncollatable container type contains a collatable type;
101  * in that case use the type's default collation. Be sure to record
102  * the appropriate collation in stacoll.
103  *----------
104  */
105 typedef struct VacAttrStats *VacAttrStatsP;
106 
107 typedef Datum (*AnalyzeAttrFetchFunc) (VacAttrStatsP stats, int rownum,
108  bool *isNull);
109 
111  AnalyzeAttrFetchFunc fetchfunc,
112  int samplerows,
113  double totalrows);
114 
115 typedef struct VacAttrStats
116 {
117  /*
118  * These fields are set up by the main ANALYZE code before invoking the
119  * type-specific typanalyze function. They don't necessarily match what
120  * is in pg_attribute, because some index opclasses store a different type
121  * than the underlying column/expression. Therefore, use these fields for
122  * information about the datatype being fed to the typanalyze function.
123  */
124  int attstattarget; /* -1 to use default */
125  Oid attrtypid; /* type of data being analyzed */
126  int32 attrtypmod; /* typmod of data being analyzed */
127  Form_pg_type attrtype; /* copy of pg_type row for attrtypid */
128  Oid attrcollid; /* collation of data being analyzed */
129  MemoryContext anl_context; /* where to save long-lived data */
130 
131  /*
132  * These fields must be filled in by the typanalyze routine, unless it
133  * returns false.
134  */
136  int minrows; /* Minimum # of rows wanted for stats */
137  void *extra_data; /* for extra type-specific data */
138 
139  /*
140  * These fields are to be filled in by the compute_stats routine. (They
141  * are initialized to zero when the struct is created.)
142  */
144  float4 stanullfrac; /* fraction of entries that are NULL */
145  int32 stawidth; /* average width of column values */
146  float4 stadistinct; /* # distinct values */
154 
155  /*
156  * These fields describe the stavalues[n] element types. They will be
157  * initialized to match attrtypid, but a custom typanalyze function might
158  * want to store an array of something other than the analyzed column's
159  * elements. It should then overwrite these fields.
160  */
165 
166  /*
167  * These fields are private to the main ANALYZE code and should not be
168  * looked at by type-specific functions.
169  */
170  int tupattnum; /* attribute number within tuples */
171  HeapTuple *rows; /* access info for std fetch function */
173  Datum *exprvals; /* access info for index fetch function */
174  bool *exprnulls;
177 
178 /* flag bits for VacuumParams->options */
179 #define VACOPT_VACUUM 0x01 /* do VACUUM */
180 #define VACOPT_ANALYZE 0x02 /* do ANALYZE */
181 #define VACOPT_VERBOSE 0x04 /* output INFO instrumentation messages */
182 #define VACOPT_FREEZE 0x08 /* FREEZE option */
183 #define VACOPT_FULL 0x10 /* FULL (non-concurrent) vacuum */
184 #define VACOPT_SKIP_LOCKED 0x20 /* skip if cannot get lock */
185 #define VACOPT_PROCESS_MAIN 0x40 /* process main relation */
186 #define VACOPT_PROCESS_TOAST 0x80 /* process the TOAST table, if any */
187 #define VACOPT_DISABLE_PAGE_SKIPPING 0x100 /* don't skip any pages */
188 #define VACOPT_SKIP_DATABASE_STATS 0x200 /* skip vac_update_datfrozenxid() */
189 #define VACOPT_ONLY_DATABASE_STATS 0x400 /* only vac_update_datfrozenxid() */
190 
191 /*
192  * Values used by index_cleanup and truncate params.
193  *
194  * VACOPTVALUE_UNSPECIFIED is used as an initial placeholder when VACUUM
195  * command has no explicit value. When that happens the final usable value
196  * comes from the corresponding reloption (though the reloption default is
197  * usually used).
198  */
199 typedef enum VacOptValue
200 {
206 
207 /*
208  * Parameters customizing behavior of VACUUM and ANALYZE.
209  *
210  * Note that at least one of VACOPT_VACUUM and VACOPT_ANALYZE must be set
211  * in options.
212  *
213  * When adding a new VacuumParam member, consider adding it to vacuumdb as
214  * well.
215  */
216 typedef struct VacuumParams
217 {
218  bits32 options; /* bitmask of VACOPT_* */
219  int freeze_min_age; /* min freeze age, -1 to use default */
220  int freeze_table_age; /* age at which to scan whole table */
221  int multixact_freeze_min_age; /* min multixact freeze age, -1 to
222  * use default */
223  int multixact_freeze_table_age; /* multixact age at which to scan
224  * whole table */
225  bool is_wraparound; /* force a for-wraparound vacuum */
226  int log_min_duration; /* minimum execution threshold in ms at
227  * which autovacuum is logged, -1 to use
228  * default */
229  VacOptValue index_cleanup; /* Do index vacuum and cleanup */
230  VacOptValue truncate; /* Truncate empty pages at the end */
231  Oid toast_parent; /* for privilege checks when recursing */
232 
233  /*
234  * The number of parallel vacuum workers. 0 by default which means choose
235  * based on the number of indexes. -1 indicates parallel vacuum is
236  * disabled.
237  */
238  int nworkers;
240 
241 /*
242  * VacuumCutoffs is immutable state that describes the cutoffs used by VACUUM.
243  * Established at the beginning of each VACUUM operation.
244  */
246 {
247  /*
248  * Existing pg_class fields at start of VACUUM
249  */
252 
253  /*
254  * OldestXmin is the Xid below which tuples deleted by any xact (that
255  * committed) should be considered DEAD, not just RECENTLY_DEAD.
256  *
257  * OldestMxact is the Mxid below which MultiXacts are definitely not seen
258  * as visible by any running transaction.
259  *
260  * OldestXmin and OldestMxact are also the most recent values that can
261  * ever be passed to vac_update_relstats() as frozenxid and minmulti
262  * arguments at the end of VACUUM. These same values should be passed
263  * when it turns out that VACUUM will leave no unfrozen XIDs/MXIDs behind
264  * in the table.
265  */
268 
269  /*
270  * FreezeLimit is the Xid below which all Xids are definitely frozen or
271  * removed in pages VACUUM scans and cleanup locks.
272  *
273  * MultiXactCutoff is the value below which all MultiXactIds are
274  * definitely removed from Xmax in pages VACUUM scans and cleanup locks.
275  */
278 };
279 
280 /*
281  * VacDeadItems stores TIDs whose index tuples are deleted by index vacuuming.
282  */
283 typedef struct VacDeadItems
284 {
285  int max_items; /* # slots allocated in array */
286  int num_items; /* current # of entries */
287 
288  /* Sorted array of TIDs to delete from indexes */
291 
292 #define MAXDEADITEMS(avail_mem) \
293  (((avail_mem) - offsetof(VacDeadItems, items)) / sizeof(ItemPointerData))
294 
295 /* GUC parameters */
296 extern PGDLLIMPORT int default_statistics_target; /* PGDLLIMPORT for PostGIS */
303 
304 /*
305  * Maximum value for default_statistics_target and per-column statistics
306  * targets. This is fairly arbitrary, mainly to prevent users from creating
307  * unreasonably large statistics that the system cannot handle well.
308  */
309 #define MAX_STATISTICS_TARGET 10000
310 
311 /* Variables for cost-based parallel vacuum */
315 
317 extern PGDLLIMPORT double vacuum_cost_delay;
318 extern PGDLLIMPORT int vacuum_cost_limit;
319 
320 /* in commands/vacuum.c */
321 extern void ExecVacuum(ParseState *pstate, VacuumStmt *vacstmt, bool isTopLevel);
322 extern void vacuum(List *relations, VacuumParams *params,
323  BufferAccessStrategy bstrategy, MemoryContext vac_context,
324  bool isTopLevel);
325 extern void vac_open_indexes(Relation relation, LOCKMODE lockmode,
326  int *nindexes, Relation **Irel);
327 extern void vac_close_indexes(int nindexes, Relation *Irel, LOCKMODE lockmode);
328 extern double vac_estimate_reltuples(Relation relation,
329  BlockNumber total_pages,
330  BlockNumber scanned_pages,
331  double scanned_tuples);
332 extern void vac_update_relstats(Relation relation,
333  BlockNumber num_pages,
334  double num_tuples,
335  BlockNumber num_all_visible_pages,
336  bool hasindex,
337  TransactionId frozenxid,
338  MultiXactId minmulti,
339  bool *frozenxid_updated,
340  bool *minmulti_updated,
341  bool in_outer_xact);
342 extern bool vacuum_get_cutoffs(Relation rel, const VacuumParams *params,
343  struct VacuumCutoffs *cutoffs);
344 extern bool vacuum_xid_failsafe_check(const struct VacuumCutoffs *cutoffs);
345 extern void vac_update_datfrozenxid(void);
346 extern void vacuum_delay_point(void);
347 extern bool vacuum_is_permitted_for_relation(Oid relid, Form_pg_class reltuple,
348  bits32 options);
349 extern Relation vacuum_open_relation(Oid relid, RangeVar *relation,
350  bits32 options, bool verbose,
351  LOCKMODE lmode);
353  IndexBulkDeleteResult *istat,
354  VacDeadItems *dead_items);
356  IndexBulkDeleteResult *istat);
357 extern Size vac_max_items_to_alloc_size(int max_items);
358 
359 /* In postmaster/autovacuum.c */
360 extern void AutoVacuumUpdateCostLimit(void);
361 extern void VacuumUpdateCosts(void);
362 
363 /* in commands/vacuumparallel.c */
365  int nindexes, int nrequested_workers,
366  int max_items, int elevel,
367  BufferAccessStrategy bstrategy);
371  long num_table_tuples,
372  int num_index_scans);
374  long num_table_tuples,
375  int num_index_scans,
376  bool estimated_count);
377 extern void parallel_vacuum_main(dsm_segment *seg, shm_toc *toc);
378 
379 /* in commands/analyze.c */
380 extern void analyze_rel(Oid relid, RangeVar *relation,
381  VacuumParams *params, List *va_cols, bool in_outer_xact,
382  BufferAccessStrategy bstrategy);
383 extern bool std_typanalyze(VacAttrStats *stats);
384 
385 /* in utils/misc/sampling.c --- duplicate of declarations in utils/sampling.h */
386 extern double anl_random_fract(void);
387 extern double anl_init_selection_state(int n);
388 extern double anl_get_next_S(double t, int n, double *stateptr);
389 
390 #endif /* VACUUM_H */
uint32 BlockNumber
Definition: block.h:31
#define PGDLLIMPORT
Definition: c.h:1303
signed short int16
Definition: c.h:480
signed int int32
Definition: c.h:481
TransactionId MultiXactId
Definition: c.h:649
#define FLEXIBLE_ARRAY_MEMBER
Definition: c.h:385
uint32 bits32
Definition: c.h:502
float float4
Definition: c.h:616
uint32 TransactionId
Definition: c.h:639
size_t Size
Definition: c.h:592
int verbose
int LOCKMODE
Definition: lockdefs.h:26
FormData_pg_class * Form_pg_class
Definition: pg_class.h:153
#define STATISTIC_NUM_SLOTS
Definition: pg_statistic.h:127
FormData_pg_type * Form_pg_type
Definition: pg_type.h:261
uintptr_t Datum
Definition: postgres.h:64
unsigned int Oid
Definition: postgres_ext.h:31
Definition: pg_list.h:54
int32 attrtypmod
Definition: vacuum.h:126
bool stats_valid
Definition: vacuum.h:143
float4 stanullfrac
Definition: vacuum.h:144
Form_pg_type attrtype
Definition: vacuum.h:127
int16 stakind[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:147
int tupattnum
Definition: vacuum.h:170
MemoryContext anl_context
Definition: vacuum.h:129
Oid statypid[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:161
Oid staop[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:148
Oid stacoll[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:149
char statypalign[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:164
float4 * stanumbers[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:151
int rowstride
Definition: vacuum.h:175
Oid attrtypid
Definition: vacuum.h:125
HeapTuple * rows
Definition: vacuum.h:171
int minrows
Definition: vacuum.h:136
int attstattarget
Definition: vacuum.h:124
int32 stawidth
Definition: vacuum.h:145
void * extra_data
Definition: vacuum.h:137
bool statypbyval[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:163
int16 statyplen[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:162
bool * exprnulls
Definition: vacuum.h:174
TupleDesc tupDesc
Definition: vacuum.h:172
Datum * exprvals
Definition: vacuum.h:173
int numvalues[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:152
Datum * stavalues[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:153
float4 stadistinct
Definition: vacuum.h:146
int numnumbers[STATISTIC_NUM_SLOTS]
Definition: vacuum.h:150
AnalyzeAttrComputeStatsFunc compute_stats
Definition: vacuum.h:135
Oid attrcollid
Definition: vacuum.h:128
ItemPointerData items[FLEXIBLE_ARRAY_MEMBER]
Definition: vacuum.h:289
int max_items
Definition: vacuum.h:285
int num_items
Definition: vacuum.h:286
TransactionId FreezeLimit
Definition: vacuum.h:276
TransactionId OldestXmin
Definition: vacuum.h:266
TransactionId relfrozenxid
Definition: vacuum.h:250
MultiXactId relminmxid
Definition: vacuum.h:251
MultiXactId MultiXactCutoff
Definition: vacuum.h:277
MultiXactId OldestMxact
Definition: vacuum.h:267
int nworkers
Definition: vacuum.h:238
int freeze_table_age
Definition: vacuum.h:220
VacOptValue truncate
Definition: vacuum.h:230
bits32 options
Definition: vacuum.h:218
int freeze_min_age
Definition: vacuum.h:219
bool is_wraparound
Definition: vacuum.h:225
int multixact_freeze_min_age
Definition: vacuum.h:221
int multixact_freeze_table_age
Definition: vacuum.h:223
int log_min_duration
Definition: vacuum.h:226
Oid toast_parent
Definition: vacuum.h:231
VacOptValue index_cleanup
Definition: vacuum.h:229
IndexBulkDeleteResult * vac_bulkdel_one_index(IndexVacuumInfo *ivinfo, IndexBulkDeleteResult *istat, VacDeadItems *dead_items)
Definition: vacuum.c:2491
void ExecVacuum(ParseState *pstate, VacuumStmt *vacstmt, bool isTopLevel)
Definition: vacuum.c:148
void VacuumUpdateCosts(void)
Definition: autovacuum.c:1632
PGDLLIMPORT int VacuumCostBalanceLocal
Definition: vacuum.c:104
Size vac_max_items_to_alloc_size(int max_items)
Definition: vacuum.c:2537
PGDLLIMPORT int vacuum_freeze_table_age
Definition: vacuum.c:68
struct VacDeadItems VacDeadItems
PGDLLIMPORT pg_atomic_uint32 * VacuumSharedCostBalance
Definition: vacuum.c:102
PGDLLIMPORT int vacuum_cost_limit
Definition: vacuum.c:81
bool std_typanalyze(VacAttrStats *stats)
Definition: analyze.c:1886
void vac_open_indexes(Relation relation, LOCKMODE lockmode, int *nindexes, Relation **Irel)
Definition: vacuum.c:2273
void vacuum(List *relations, VacuumParams *params, BufferAccessStrategy bstrategy, MemoryContext vac_context, bool isTopLevel)
Definition: vacuum.c:479
PGDLLIMPORT pg_atomic_uint32 * VacuumActiveNWorkers
Definition: vacuum.c:103
void vac_update_relstats(Relation relation, BlockNumber num_pages, double num_tuples, BlockNumber num_all_visible_pages, bool hasindex, TransactionId frozenxid, MultiXactId minmulti, bool *frozenxid_updated, bool *minmulti_updated, bool in_outer_xact)
Definition: vacuum.c:1399
PGDLLIMPORT double vacuum_cost_delay
Definition: vacuum.c:80
double anl_get_next_S(double t, int n, double *stateptr)
Definition: sampling.c:296
PGDLLIMPORT int vacuum_failsafe_age
Definition: vacuum.c:71
VacDeadItems * parallel_vacuum_get_dead_items(ParallelVacuumState *pvs)
struct VacAttrStats VacAttrStats
PGDLLIMPORT bool VacuumFailsafeActive
Definition: vacuum.c:96
PGDLLIMPORT int vacuum_freeze_min_age
Definition: vacuum.c:67
void parallel_vacuum_bulkdel_all_indexes(ParallelVacuumState *pvs, long num_table_tuples, int num_index_scans)
Relation vacuum_open_relation(Oid relid, RangeVar *relation, bits32 options, bool verbose, LOCKMODE lmode)
Definition: vacuum.c:759
void vac_close_indexes(int nindexes, Relation *Irel, LOCKMODE lockmode)
Definition: vacuum.c:2316
void vacuum_delay_point(void)
Definition: vacuum.c:2337
void parallel_vacuum_cleanup_all_indexes(ParallelVacuumState *pvs, long num_table_tuples, int num_index_scans, bool estimated_count)
Datum(* AnalyzeAttrFetchFunc)(VacAttrStatsP stats, int rownum, bool *isNull)
Definition: vacuum.h:107
void vac_update_datfrozenxid(void)
Definition: vacuum.c:1566
bool vacuum_get_cutoffs(Relation rel, const VacuumParams *params, struct VacuumCutoffs *cutoffs)
Definition: vacuum.c:1073
bool vacuum_xid_failsafe_check(const struct VacuumCutoffs *cutoffs)
Definition: vacuum.c:1241
VacOptValue
Definition: vacuum.h:200
@ VACOPTVALUE_AUTO
Definition: vacuum.h:202
@ VACOPTVALUE_ENABLED
Definition: vacuum.h:204
@ VACOPTVALUE_UNSPECIFIED
Definition: vacuum.h:201
@ VACOPTVALUE_DISABLED
Definition: vacuum.h:203
PGDLLIMPORT int default_statistics_target
Definition: analyze.c:73
void parallel_vacuum_main(dsm_segment *seg, shm_toc *toc)
struct VacAttrStats * VacAttrStatsP
Definition: vacuum.h:105
PGDLLIMPORT int vacuum_multixact_freeze_table_age
Definition: vacuum.c:70
PGDLLIMPORT int vacuum_multixact_freeze_min_age
Definition: vacuum.c:69
double vac_estimate_reltuples(Relation relation, BlockNumber total_pages, BlockNumber scanned_pages, double scanned_tuples)
Definition: vacuum.c:1303
double anl_init_selection_state(int n)
Definition: sampling.c:281
void(* AnalyzeAttrComputeStatsFunc)(VacAttrStatsP stats, AnalyzeAttrFetchFunc fetchfunc, int samplerows, double totalrows)
Definition: vacuum.h:110
void analyze_rel(Oid relid, RangeVar *relation, VacuumParams *params, List *va_cols, bool in_outer_xact, BufferAccessStrategy bstrategy)
Definition: analyze.c:111
void AutoVacuumUpdateCostLimit(void)
Definition: autovacuum.c:1701
IndexBulkDeleteResult * vac_cleanup_one_index(IndexVacuumInfo *ivinfo, IndexBulkDeleteResult *istat)
Definition: vacuum.c:2512
struct VacuumParams VacuumParams
void parallel_vacuum_end(ParallelVacuumState *pvs, IndexBulkDeleteResult **istats)
bool vacuum_is_permitted_for_relation(Oid relid, Form_pg_class reltuple, bits32 options)
Definition: vacuum.c:707
PGDLLIMPORT int vacuum_multixact_failsafe_age
Definition: vacuum.c:72
ParallelVacuumState * parallel_vacuum_init(Relation rel, Relation *indrels, int nindexes, int nrequested_workers, int max_items, int elevel, BufferAccessStrategy bstrategy)
double anl_random_fract(void)
Definition: sampling.c:266