PostgreSQL Source Code  git master
pgstatapprox.c
Go to the documentation of this file.
1 /*-------------------------------------------------------------------------
2  *
3  * pgstatapprox.c
4  * Bloat estimation functions
5  *
6  * Copyright (c) 2014-2024, PostgreSQL Global Development Group
7  *
8  * IDENTIFICATION
9  * contrib/pgstattuple/pgstatapprox.c
10  *
11  *-------------------------------------------------------------------------
12  */
13 #include "postgres.h"
14 
15 #include "access/heapam.h"
16 #include "access/htup_details.h"
17 #include "access/multixact.h"
18 #include "access/relation.h"
19 #include "access/transam.h"
20 #include "access/visibilitymap.h"
21 #include "access/xact.h"
22 #include "catalog/namespace.h"
23 #include "catalog/pg_am_d.h"
24 #include "commands/vacuum.h"
25 #include "funcapi.h"
26 #include "miscadmin.h"
27 #include "storage/bufmgr.h"
28 #include "storage/freespace.h"
29 #include "storage/lmgr.h"
30 #include "storage/procarray.h"
31 #include "utils/builtins.h"
32 
35 
37 
38 typedef struct output_type
39 {
40  uint64 table_len;
42  uint64 tuple_count;
43  uint64 tuple_len;
44  double tuple_percent;
48  uint64 free_space;
49  double free_percent;
51 
52 #define NUM_OUTPUT_COLUMNS 10
53 
54 /*
55  * This function takes an already open relation and scans its pages,
56  * skipping those that have the corresponding visibility map bit set.
57  * For pages we skip, we find the free space from the free space map
58  * and approximate tuple_len on that basis. For the others, we count
59  * the exact number of dead tuples etc.
60  *
61  * This scan is loosely based on vacuumlazy.c:lazy_scan_heap(), but
62  * we do not try to avoid skipping single pages.
63  */
64 static void
66 {
67  BlockNumber scanned,
68  nblocks,
69  blkno;
70  Buffer vmbuffer = InvalidBuffer;
71  BufferAccessStrategy bstrategy;
72  TransactionId OldestXmin;
73 
74  OldestXmin = GetOldestNonRemovableTransactionId(rel);
75  bstrategy = GetAccessStrategy(BAS_BULKREAD);
76 
77  nblocks = RelationGetNumberOfBlocks(rel);
78  scanned = 0;
79 
80  for (blkno = 0; blkno < nblocks; blkno++)
81  {
82  Buffer buf;
83  Page page;
84  OffsetNumber offnum,
85  maxoff;
86  Size freespace;
87 
89 
90  /*
91  * If the page has only visible tuples, then we can find out the free
92  * space from the FSM and move on.
93  */
94  if (VM_ALL_VISIBLE(rel, blkno, &vmbuffer))
95  {
96  freespace = GetRecordedFreeSpace(rel, blkno);
97  stat->tuple_len += BLCKSZ - freespace;
98  stat->free_space += freespace;
99  continue;
100  }
101 
102  buf = ReadBufferExtended(rel, MAIN_FORKNUM, blkno,
103  RBM_NORMAL, bstrategy);
104 
106 
107  page = BufferGetPage(buf);
108 
109  /*
110  * It's not safe to call PageGetHeapFreeSpace() on new pages, so we
111  * treat them as being free space for our purposes.
112  */
113  if (!PageIsNew(page))
114  stat->free_space += PageGetHeapFreeSpace(page);
115  else
116  stat->free_space += BLCKSZ - SizeOfPageHeaderData;
117 
118  /* We may count the page as scanned even if it's new/empty */
119  scanned++;
120 
121  if (PageIsNew(page) || PageIsEmpty(page))
122  {
124  continue;
125  }
126 
127  /*
128  * Look at each tuple on the page and decide whether it's live or
129  * dead, then count it and its size. Unlike lazy_scan_heap, we can
130  * afford to ignore problems and special cases.
131  */
132  maxoff = PageGetMaxOffsetNumber(page);
133 
134  for (offnum = FirstOffsetNumber;
135  offnum <= maxoff;
136  offnum = OffsetNumberNext(offnum))
137  {
138  ItemId itemid;
139  HeapTupleData tuple;
140 
141  itemid = PageGetItemId(page, offnum);
142 
143  if (!ItemIdIsUsed(itemid) || ItemIdIsRedirected(itemid) ||
144  ItemIdIsDead(itemid))
145  {
146  continue;
147  }
148 
149  Assert(ItemIdIsNormal(itemid));
150 
151  ItemPointerSet(&(tuple.t_self), blkno, offnum);
152 
153  tuple.t_data = (HeapTupleHeader) PageGetItem(page, itemid);
154  tuple.t_len = ItemIdGetLength(itemid);
155  tuple.t_tableOid = RelationGetRelid(rel);
156 
157  /*
158  * We follow VACUUM's lead in counting INSERT_IN_PROGRESS tuples
159  * as "dead" while DELETE_IN_PROGRESS tuples are "live". We don't
160  * bother distinguishing tuples inserted/deleted by our own
161  * transaction.
162  */
163  switch (HeapTupleSatisfiesVacuum(&tuple, OldestXmin, buf))
164  {
165  case HEAPTUPLE_LIVE:
167  stat->tuple_len += tuple.t_len;
168  stat->tuple_count++;
169  break;
170  case HEAPTUPLE_DEAD:
173  stat->dead_tuple_len += tuple.t_len;
174  stat->dead_tuple_count++;
175  break;
176  default:
177  elog(ERROR, "unexpected HeapTupleSatisfiesVacuum result");
178  break;
179  }
180  }
181 
183  }
184 
185  stat->table_len = (uint64) nblocks * BLCKSZ;
186 
187  /*
188  * We don't know how many tuples are in the pages we didn't scan, so
189  * extrapolate the live-tuple count to the whole table in the same way
190  * that VACUUM does. (Like VACUUM, we're not taking a random sample, so
191  * just extrapolating linearly seems unsafe.) There should be no dead
192  * tuples in all-visible pages, so no correction is needed for that, and
193  * we already accounted for the space in those pages, too.
194  */
195  stat->tuple_count = vac_estimate_reltuples(rel, nblocks, scanned,
196  stat->tuple_count);
197 
198  /* It's not clear if we could get -1 here, but be safe. */
199  stat->tuple_count = Max(stat->tuple_count, 0);
200 
201  /*
202  * Calculate percentages if the relation has one or more pages.
203  */
204  if (nblocks != 0)
205  {
206  stat->scanned_percent = 100.0 * scanned / nblocks;
207  stat->tuple_percent = 100.0 * stat->tuple_len / stat->table_len;
208  stat->dead_tuple_percent = 100.0 * stat->dead_tuple_len / stat->table_len;
209  stat->free_percent = 100.0 * stat->free_space / stat->table_len;
210  }
211 
212  if (BufferIsValid(vmbuffer))
213  {
214  ReleaseBuffer(vmbuffer);
215  vmbuffer = InvalidBuffer;
216  }
217 }
218 
219 /*
220  * Returns estimated live/dead tuple statistics for the given relid.
221  *
222  * The superuser() check here must be kept as the library might be upgraded
223  * without the extension being upgraded, meaning that in pre-1.5 installations
224  * these functions could be called by any user.
225  */
226 Datum
228 {
229  Oid relid = PG_GETARG_OID(0);
230 
231  if (!superuser())
232  ereport(ERROR,
233  (errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
234  errmsg("must be superuser to use pgstattuple functions")));
235 
237 }
238 
239 /*
240  * As of pgstattuple version 1.5, we no longer need to check if the user
241  * is a superuser because we REVOKE EXECUTE on the SQL function from PUBLIC.
242  * Users can then grant access to it based on their policies.
243  *
244  * Otherwise identical to pgstattuple_approx (above).
245  */
246 Datum
248 {
249  Oid relid = PG_GETARG_OID(0);
250 
252 }
253 
254 Datum
256 {
257  Relation rel;
258  output_type stat = {0};
259  TupleDesc tupdesc;
260  bool nulls[NUM_OUTPUT_COLUMNS];
262  HeapTuple ret;
263  int i = 0;
264 
265  if (get_call_result_type(fcinfo, NULL, &tupdesc) != TYPEFUNC_COMPOSITE)
266  elog(ERROR, "return type must be a row type");
267 
268  if (tupdesc->natts != NUM_OUTPUT_COLUMNS)
269  elog(ERROR, "incorrect number of output arguments");
270 
271  rel = relation_open(relid, AccessShareLock);
272 
273  /*
274  * Reject attempts to read non-local temporary relations; we would be
275  * likely to get wrong data since we have no visibility into the owning
276  * session's local buffers.
277  */
278  if (RELATION_IS_OTHER_TEMP(rel))
279  ereport(ERROR,
280  (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
281  errmsg("cannot access temporary tables of other sessions")));
282 
283  /*
284  * We support only relation kinds with a visibility map and a free space
285  * map.
286  */
287  if (!(rel->rd_rel->relkind == RELKIND_RELATION ||
288  rel->rd_rel->relkind == RELKIND_MATVIEW ||
289  rel->rd_rel->relkind == RELKIND_TOASTVALUE))
290  ereport(ERROR,
291  (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
292  errmsg("relation \"%s\" is of wrong relation kind",
294  errdetail_relkind_not_supported(rel->rd_rel->relkind)));
295 
296  if (rel->rd_rel->relam != HEAP_TABLE_AM_OID)
297  ereport(ERROR, (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
298  errmsg("only heap AM is supported")));
299 
300  statapprox_heap(rel, &stat);
301 
303 
304  memset(nulls, 0, sizeof(nulls));
305 
306  values[i++] = Int64GetDatum(stat.table_len);
307  values[i++] = Float8GetDatum(stat.scanned_percent);
308  values[i++] = Int64GetDatum(stat.tuple_count);
309  values[i++] = Int64GetDatum(stat.tuple_len);
310  values[i++] = Float8GetDatum(stat.tuple_percent);
311  values[i++] = Int64GetDatum(stat.dead_tuple_count);
312  values[i++] = Int64GetDatum(stat.dead_tuple_len);
313  values[i++] = Float8GetDatum(stat.dead_tuple_percent);
314  values[i++] = Int64GetDatum(stat.free_space);
315  values[i++] = Float8GetDatum(stat.free_percent);
316 
317  ret = heap_form_tuple(tupdesc, values, nulls);
318  return HeapTupleGetDatum(ret);
319 }
uint32 BlockNumber
Definition: block.h:31
static Datum values[MAXATTR]
Definition: bootstrap.c:152
int Buffer
Definition: buf.h:23
#define InvalidBuffer
Definition: buf.h:25
void ReleaseBuffer(Buffer buffer)
Definition: bufmgr.c:4850
void UnlockReleaseBuffer(Buffer buffer)
Definition: bufmgr.c:4867
void LockBuffer(Buffer buffer, int mode)
Definition: bufmgr.c:5085
Buffer ReadBufferExtended(Relation reln, ForkNumber forkNum, BlockNumber blockNum, ReadBufferMode mode, BufferAccessStrategy strategy)
Definition: bufmgr.c:792
@ BAS_BULKREAD
Definition: bufmgr.h:36
#define BUFFER_LOCK_SHARE
Definition: bufmgr.h:198
#define RelationGetNumberOfBlocks(reln)
Definition: bufmgr.h:281
static Page BufferGetPage(Buffer buffer)
Definition: bufmgr.h:408
@ RBM_NORMAL
Definition: bufmgr.h:45
static bool BufferIsValid(Buffer bufnum)
Definition: bufmgr.h:359
Size PageGetHeapFreeSpace(Page page)
Definition: bufpage.c:991
static bool PageIsEmpty(Page page)
Definition: bufpage.h:220
Pointer Page
Definition: bufpage.h:78
static Item PageGetItem(Page page, ItemId itemId)
Definition: bufpage.h:351
#define SizeOfPageHeaderData
Definition: bufpage.h:213
static ItemId PageGetItemId(Page page, OffsetNumber offsetNumber)
Definition: bufpage.h:240
static bool PageIsNew(Page page)
Definition: bufpage.h:230
static OffsetNumber PageGetMaxOffsetNumber(Page page)
Definition: bufpage.h:369
#define Max(x, y)
Definition: c.h:998
#define Assert(condition)
Definition: c.h:858
uint32 TransactionId
Definition: c.h:652
size_t Size
Definition: c.h:605
int errcode(int sqlerrcode)
Definition: elog.c:859
int errmsg(const char *fmt,...)
Definition: elog.c:1072
#define ERROR
Definition: elog.h:39
#define elog(elevel,...)
Definition: elog.h:224
#define ereport(elevel,...)
Definition: elog.h:149
Datum Int64GetDatum(int64 X)
Definition: fmgr.c:1807
Datum Float8GetDatum(float8 X)
Definition: fmgr.c:1816
#define PG_GETARG_OID(n)
Definition: fmgr.h:275
#define PG_RETURN_DATUM(x)
Definition: fmgr.h:353
#define PG_FUNCTION_ARGS
Definition: fmgr.h:193
BufferAccessStrategy GetAccessStrategy(BufferAccessStrategyType btype)
Definition: freelist.c:541
Size GetRecordedFreeSpace(Relation rel, BlockNumber heapBlk)
Definition: freespace.c:244
TypeFuncClass get_call_result_type(FunctionCallInfo fcinfo, Oid *resultTypeId, TupleDesc *resultTupleDesc)
Definition: funcapi.c:276
@ TYPEFUNC_COMPOSITE
Definition: funcapi.h:149
static Datum HeapTupleGetDatum(const HeapTupleData *tuple)
Definition: funcapi.h:230
@ HEAPTUPLE_RECENTLY_DEAD
Definition: heapam.h:127
@ HEAPTUPLE_INSERT_IN_PROGRESS
Definition: heapam.h:128
@ HEAPTUPLE_LIVE
Definition: heapam.h:126
@ HEAPTUPLE_DELETE_IN_PROGRESS
Definition: heapam.h:129
@ HEAPTUPLE_DEAD
Definition: heapam.h:125
HTSV_Result HeapTupleSatisfiesVacuum(HeapTuple htup, TransactionId OldestXmin, Buffer buffer)
HeapTuple heap_form_tuple(TupleDesc tupleDescriptor, const Datum *values, const bool *isnull)
Definition: heaptuple.c:1116
HeapTupleHeaderData * HeapTupleHeader
Definition: htup.h:23
int i
Definition: isn.c:73
#define ItemIdGetLength(itemId)
Definition: itemid.h:59
#define ItemIdIsNormal(itemId)
Definition: itemid.h:99
#define ItemIdIsDead(itemId)
Definition: itemid.h:113
#define ItemIdIsUsed(itemId)
Definition: itemid.h:92
#define ItemIdIsRedirected(itemId)
Definition: itemid.h:106
static void ItemPointerSet(ItemPointerData *pointer, BlockNumber blockNumber, OffsetNumber offNum)
Definition: itemptr.h:135
#define AccessShareLock
Definition: lockdefs.h:36
#define CHECK_FOR_INTERRUPTS()
Definition: miscadmin.h:122
#define OffsetNumberNext(offsetNumber)
Definition: off.h:52
uint16 OffsetNumber
Definition: off.h:24
#define FirstOffsetNumber
Definition: off.h:27
int errdetail_relkind_not_supported(char relkind)
Definition: pg_class.c:24
static char * buf
Definition: pg_test_fsync.c:73
static void statapprox_heap(Relation rel, output_type *stat)
Definition: pgstatapprox.c:65
Datum pgstattuple_approx(PG_FUNCTION_ARGS)
Definition: pgstatapprox.c:227
#define NUM_OUTPUT_COLUMNS
Definition: pgstatapprox.c:52
struct output_type output_type
Datum pgstattuple_approx_internal(Oid relid, FunctionCallInfo fcinfo)
Definition: pgstatapprox.c:255
PG_FUNCTION_INFO_V1(pgstattuple_approx)
Datum pgstattuple_approx_v1_5(PG_FUNCTION_ARGS)
Definition: pgstatapprox.c:247
uintptr_t Datum
Definition: postgres.h:64
unsigned int Oid
Definition: postgres_ext.h:31
TransactionId GetOldestNonRemovableTransactionId(Relation rel)
Definition: procarray.c:1993
#define RelationGetRelid(relation)
Definition: rel.h:505
#define RelationGetRelationName(relation)
Definition: rel.h:539
#define RELATION_IS_OTHER_TEMP(relation)
Definition: rel.h:658
@ MAIN_FORKNUM
Definition: relpath.h:50
void relation_close(Relation relation, LOCKMODE lockmode)
Definition: relation.c:205
Relation relation_open(Oid relationId, LOCKMODE lockmode)
Definition: relation.c:47
ItemPointerData t_self
Definition: htup.h:65
uint32 t_len
Definition: htup.h:64
HeapTupleHeader t_data
Definition: htup.h:68
Oid t_tableOid
Definition: htup.h:66
Form_pg_class rd_rel
Definition: rel.h:111
uint64 dead_tuple_count
Definition: pgstatapprox.c:45
double free_percent
Definition: pgstatapprox.c:49
double tuple_percent
Definition: pgstatapprox.c:44
double dead_tuple_percent
Definition: pgstatapprox.c:47
uint64 dead_tuple_len
Definition: pgstatapprox.c:46
uint64 tuple_count
Definition: pgstatapprox.c:42
uint64 free_space
Definition: pgstatapprox.c:48
uint64 table_len
Definition: pgstatapprox.c:40
uint64 tuple_len
Definition: pgstatapprox.c:43
double scanned_percent
Definition: pgstatapprox.c:41
bool superuser(void)
Definition: superuser.c:46
double vac_estimate_reltuples(Relation relation, BlockNumber total_pages, BlockNumber scanned_pages, double scanned_tuples)
Definition: vacuum.c:1302
#define VM_ALL_VISIBLE(r, b, v)
Definition: visibilitymap.h:24