PostgreSQL Source Code git master
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
slru.h File Reference
#include "access/xlogdefs.h"
#include "storage/lwlock.h"
#include "storage/sync.h"
Include dependency graph for slru.h:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Data Structures

struct  SlruSharedData
 
struct  SlruCtlData
 

Macros

#define SLRU_MAX_ALLOWED_BUFFERS   ((1024 * 1024 * 1024) / BLCKSZ)
 
#define SLRU_PAGES_PER_SEGMENT   32
 
#define SlruPagePrecedesUnitTests(ctl, per_page)   do {} while (0)
 

Typedefs

typedef struct SlruSharedData SlruSharedData
 
typedef SlruSharedData * SlruShared
 
typedef struct SlruCtlData SlruCtlData
 
typedef SlruCtlData * SlruCtl
 
typedef bool(* SlruScanCallback) (SlruCtl ctl, char *filename, int64 segpage, void *data)
 

Enumerations

enum  SlruPageStatus { SLRU_PAGE_EMPTY , SLRU_PAGE_READ_IN_PROGRESS , SLRU_PAGE_VALID , SLRU_PAGE_WRITE_IN_PROGRESS }
 

Functions

static LWLock * SimpleLruGetBankLock (SlruCtl ctl, int64 pageno)
 
Size SimpleLruShmemSize (int nslots, int nlsns)
 
int SimpleLruAutotuneBuffers (int divisor, int max)
 
void SimpleLruInit (SlruCtl ctl, const char *name, int nslots, int nlsns, const char *subdir, int buffer_tranche_id, int bank_tranche_id, SyncRequestHandler sync_handler, bool long_segment_names)
 
int SimpleLruZeroPage (SlruCtl ctl, int64 pageno)
 
int SimpleLruReadPage (SlruCtl ctl, int64 pageno, bool write_ok, TransactionId xid)
 
int SimpleLruReadPage_ReadOnly (SlruCtl ctl, int64 pageno, TransactionId xid)
 
void SimpleLruWritePage (SlruCtl ctl, int slotno)
 
void SimpleLruWriteAll (SlruCtl ctl, bool allow_redirtied)
 
void SimpleLruTruncate (SlruCtl ctl, int64 cutoffPage)
 
bool SimpleLruDoesPhysicalPageExist (SlruCtl ctl, int64 pageno)
 
bool SlruScanDirectory (SlruCtl ctl, SlruScanCallback callback, void *data)
 
void SlruDeleteSegment (SlruCtl ctl, int64 segno)
 
int SlruSyncFileTag (SlruCtl ctl, const FileTag *ftag, char *path)
 
bool SlruScanDirCbReportPresence (SlruCtl ctl, char *filename, int64 segpage, void *data)
 
bool SlruScanDirCbDeleteAll (SlruCtl ctl, char *filename, int64 segpage, void *data)
 
bool check_slru_buffers (const char *name, int *newval)
 

Macro Definition Documentation

◆ SLRU_MAX_ALLOWED_BUFFERS

#define SLRU_MAX_ALLOWED_BUFFERS   ((1024 * 1024 * 1024) / BLCKSZ)

Definition at line 24 of file slru.h.

◆ SLRU_PAGES_PER_SEGMENT

#define SLRU_PAGES_PER_SEGMENT   32

Definition at line 39 of file slru.h.

◆ SlruPagePrecedesUnitTests

#define SlruPagePrecedesUnitTests (   ctl,
  per_page 
)    do {} while (0)

Definition at line 199 of file slru.h.

Typedef Documentation

◆ SlruCtl

typedef SlruCtlData* SlruCtl

Definition at line 166 of file slru.h.

◆ SlruCtlData

typedef struct SlruCtlData SlruCtlData

◆ SlruScanCallback

typedef bool(* SlruScanCallback) (SlruCtl ctl, char *filename, int64 segpage, void *data)

Definition at line 204 of file slru.h.

◆ SlruShared

typedef SlruSharedData* SlruShared

Definition at line 121 of file slru.h.

◆ SlruSharedData

typedef struct SlruSharedData SlruSharedData

Enumeration Type Documentation

◆ SlruPageStatus

Enumerator
SLRU_PAGE_EMPTY 
SLRU_PAGE_READ_IN_PROGRESS 
SLRU_PAGE_VALID 
SLRU_PAGE_WRITE_IN_PROGRESS 

Definition at line 47 of file slru.h.

48{
49 SLRU_PAGE_EMPTY, /* buffer is not in use */
50 SLRU_PAGE_READ_IN_PROGRESS, /* page is being read in */
51 SLRU_PAGE_VALID, /* page is valid and not being written */
52 SLRU_PAGE_WRITE_IN_PROGRESS, /* page is being written out */
SlruPageStatus
Definition: slru.h:48
@ SLRU_PAGE_VALID
Definition: slru.h:51
@ SLRU_PAGE_WRITE_IN_PROGRESS
Definition: slru.h:52
@ SLRU_PAGE_READ_IN_PROGRESS
Definition: slru.h:50
@ SLRU_PAGE_EMPTY
Definition: slru.h:49

Function Documentation

◆ check_slru_buffers()

bool check_slru_buffers ( const char *  name,
int *  newval 
)

Definition at line 354 of file slru.c.

355{
356 /* Valid values are multiples of SLRU_BANK_SIZE */
357 if (*newval % SLRU_BANK_SIZE == 0)
358 return true;
359
360 GUC_check_errdetail("\"%s\" must be a multiple of %d.", name,
361 SLRU_BANK_SIZE);
362 return false;
363}
#define newval
#define GUC_check_errdetail
Definition: guc.h:481
#define SLRU_BANK_SIZE
Definition: slru.c:143
const char * name

References GUC_check_errdetail, name, newval, and SLRU_BANK_SIZE.

Referenced by check_commit_ts_buffers(), check_multixact_member_buffers(), check_multixact_offset_buffers(), check_notify_buffers(), check_serial_buffers(), check_subtrans_buffers(), and check_transaction_buffers().

◆ SimpleLruAutotuneBuffers()

int SimpleLruAutotuneBuffers ( int  divisor,
int  max 
)

Definition at line 231 of file slru.c.

232{
233 return Min(max - (max % SLRU_BANK_SIZE),
234 Max(SLRU_BANK_SIZE,
235 NBuffers / divisor - (NBuffers / divisor) % SLRU_BANK_SIZE));
236}
#define Min(x, y)
Definition: c.h:975
#define Max(x, y)
Definition: c.h:969
int NBuffers
Definition: globals.c:143

References Max, Min, NBuffers, and SLRU_BANK_SIZE.

Referenced by CLOGShmemBuffers(), CommitTsShmemBuffers(), and SUBTRANSShmemBuffers().

◆ SimpleLruDoesPhysicalPageExist()

bool SimpleLruDoesPhysicalPageExist ( SlruCtl  ctl,
int64  pageno 
)

Definition at line 745 of file slru.c.

746{
747 int64 segno = pageno / SLRU_PAGES_PER_SEGMENT;
748 int rpageno = pageno % SLRU_PAGES_PER_SEGMENT;
749 int offset = rpageno * BLCKSZ;
750 char path[MAXPGPATH];
751 int fd;
752 bool result;
753 off_t endpos;
754
755 /* update the stats counter of checked pages */
756 pgstat_count_slru_page_exists(ctl->shared->slru_stats_idx);
757
758 SlruFileName(ctl, path, segno);
759
760 fd = OpenTransientFile(path, O_RDONLY | PG_BINARY);
761 if (fd < 0)
762 {
763 /* expected: file doesn't exist */
764 if (errno == ENOENT)
765 return false;
766
767 /* report error normally */
768 slru_errcause = SLRU_OPEN_FAILED;
769 slru_errno = errno;
770 SlruReportIOError(ctl, pageno, 0);
771 }
772
773 if ((endpos = lseek(fd, 0, SEEK_END)) < 0)
774 {
775 slru_errcause = SLRU_SEEK_FAILED;
776 slru_errno = errno;
777 SlruReportIOError(ctl, pageno, 0);
778 }
779
780 result = endpos >= (off_t) (offset + BLCKSZ);
781
782 if (CloseTransientFile(fd) != 0)
783 {
784 slru_errcause = SLRU_CLOSE_FAILED;
785 slru_errno = errno;
786 return false;
787 }
788
789 return result;
790}
int64_t int64
Definition: c.h:499
#define PG_BINARY
Definition: c.h:1244
int CloseTransientFile(int fd)
Definition: fd.c:2871
int OpenTransientFile(const char *fileName, int fileFlags)
Definition: fd.c:2694
#define MAXPGPATH
static XLogRecPtr endpos
Definition: pg_receivewal.c:56
void pgstat_count_slru_page_exists(int slru_idx)
Definition: pgstat_slru.c:71
static int fd(const char *x, int i)
Definition: preproc-init.c:105
tree ctl
Definition: radixtree.h:1838
static int SlruFileName(SlruCtl ctl, char *path, int64 segno)
Definition: slru.c:91
static void SlruReportIOError(SlruCtl ctl, int64 pageno, TransactionId xid)
Definition: slru.c:1047
static SlruErrorCause slru_errcause
Definition: slru.c:174
static int slru_errno
Definition: slru.c:175
@ SLRU_SEEK_FAILED
Definition: slru.c:167
@ SLRU_OPEN_FAILED
Definition: slru.c:166
@ SLRU_CLOSE_FAILED
Definition: slru.c:171
#define SLRU_PAGES_PER_SEGMENT
Definition: slru.h:39

References CloseTransientFile(), ctl, endpos, fd(), MAXPGPATH, OpenTransientFile(), PG_BINARY, pgstat_count_slru_page_exists(), SlruWriteAllData::segno, SLRU_CLOSE_FAILED, slru_errcause, slru_errno, SLRU_OPEN_FAILED, SLRU_PAGES_PER_SEGMENT, SLRU_SEEK_FAILED, SlruFileName(), and SlruReportIOError().

Referenced by ActivateCommitTs(), find_multixact_start(), MaybeExtendOffsetSlru(), and test_slru_page_exists().

◆ SimpleLruGetBankLock()

◆ SimpleLruInit()

void SimpleLruInit ( SlruCtl  ctl,
const char *  name,
int  nslots,
int  nlsns,
const char *  subdir,
int  buffer_tranche_id,
int  bank_tranche_id,
SyncRequestHandler  sync_handler,
bool  long_segment_names 
)

Definition at line 251 of file slru.c.

254{
255 SlruShared shared;
256 bool found;
257 int nbanks = nslots / SLRU_BANK_SIZE;
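258
259 Assert(nslots <= SLRU_MAX_ALLOWED_BUFFERS);
260
261 shared = (SlruShared) ShmemInitStruct(name,
262 SimpleLruShmemSize(nslots, nlsns),
263 &found);
264
265 if (!IsUnderPostmaster)
266 {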
267 /* Initialize locks and shared memory area */
268 char *ptr;
269 Size offset;
270
271 Assert(!found);
272
273 memset(shared, 0, sizeof(SlruSharedData));
274
275 shared->num_slots = nslots;
276 shared->lsn_groups_per_page = nlsns;
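277
278 pg_atomic_init_u64(&shared->latest_page_number, 0);
279
280 shared->slru_stats_idx = pgstat_get_slru_index(name);
281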
282 ptr = (char *) shared;
283 offset = MAXALIGN(sizeof(SlruSharedData));
284 shared->page_buffer = (char **) (ptr + offset);
285 offset += MAXALIGN(nslots * sizeof(char *));
286 shared->page_status = (SlruPageStatus *) (ptr + offset);
287 offset += MAXALIGN(nslots * sizeof(SlruPageStatus));
288 shared->page_dirty = (bool *) (ptr + offset);
289 offset += MAXALIGN(nslots * sizeof(bool));
290 shared->page_number = (int64 *) (ptr + offset);
291 offset += MAXALIGN(nslots * sizeof(int64));
292 shared->page_lru_count = (int *) (ptr + offset);
293 offset += MAXALIGN(nslots * sizeof(int));
294
295 /* Initialize LWLocks */
296 shared->buffer_locks = (LWLockPadded *) (ptr + offset);
297 offset += MAXALIGN(nslots * sizeof(LWLockPadded));
298 shared->bank_locks = (LWLockPadded *) (ptr + offset);
299 offset += MAXALIGN(nbanks * sizeof(LWLockPadded));
300 shared->bank_cur_lru_count = (int *) (ptr + offset);
301 offset += MAXALIGN(nbanks * sizeof(int));
302
303 if (nlsns > 0)
304 {
305 shared->group_lsn = (XLogRecPtr *) (ptr + offset);
306 offset += MAXALIGN(nslots * nlsns * sizeof(XLogRecPtr));
307 }
308
309 ptr += BUFFERALIGN(offset);
310 for (int slotno = 0; slotno < nslots; slotno++)
311 {
312 LWLockInitialize(&shared->buffer_locks[slotno].lock,
313 buffer_tranche_id);
314
315 shared->page_buffer[slotno] = ptr;
316 shared->page_status[slotno] = SLRU_PAGE_EMPTY;
317 shared->page_dirty[slotno] = false;
318 shared->page_lru_count[slotno] = 0;
319 ptr += BLCKSZ;
320 }
321
322 /* Initialize the slot banks. */
323 for (int bankno = 0; bankno < nbanks; bankno++)
324 {
325 LWLockInitialize(&shared->bank_locks[bankno].lock, bank_tranche_id);
326 shared->bank_cur_lru_count[bankno] = 0;
327 }
328
329 /* Should fit to estimated shmem size */
330 Assert(ptr - (char *) shared <= SimpleLruShmemSize(nslots, nlsns));
331 }
332 else
333 {
334 Assert(found);
335 Assert(shared->num_slots == nslots);
336 }
337
338 /*
339 * Initialize the unshared control struct, including directory path. We
340 * assume caller set PagePrecedes.
341 */
342 ctl->shared = shared;
343 ctl->sync_handler = sync_handler;
344 ctl->long_segment_names = long_segment_names;
345 ctl->nbanks = nbanks;
346 strlcpy(ctl->Dir, subdir, sizeof(ctl->Dir));
347}
static void pg_atomic_init_u64(volatile pg_atomic_uint64 *ptr, uint64 val)
Definition: atomics.h:453
#define MAXALIGN(LEN)
Definition: c.h:782
#define BUFFERALIGN(LEN)
Definition: c.h:784
size_t Size
Definition: c.h:576
bool IsUnderPostmaster
Definition: globals.c:121
Assert(PointerIsAligned(start, uint64))
void LWLockInitialize(LWLock *lock, int tranche_id)
Definition: lwlock.c:721
int pgstat_get_slru_index(const char *name)
Definition: pgstat_slru.c:132
size_t strlcpy(char *dst, const char *src, size_t siz)
Definition: strlcpy.c:45
void * ShmemInitStruct(const char *name, Size size, bool *foundPtr)
Definition: shmem.c:387
Size SimpleLruShmemSize(int nslots, int nlsns)
Definition: slru.c:198
SlruSharedData * SlruShared
Definition: slru.h:121
#define SLRU_MAX_ALLOWED_BUFFERS
Definition: slru.h:24
int slru_stats_idx
Definition: slru.h:118
int64 * page_number
Definition: slru.h:73
int num_slots
Definition: slru.h:64
LWLockPadded * bank_locks
Definition: slru.h:80
int * page_lru_count
Definition: slru.h:74
pg_atomic_uint64 latest_page_number
Definition: slru.h:115
XLogRecPtr * group_lsn
Definition: slru.h:107
int * bank_cur_lru_count
Definition: slru.h:97
int lsn_groups_per_page
Definition: slru.h:108
SlruPageStatus * page_status
Definition: slru.h:71
bool * page_dirty
Definition: slru.h:72
LWLockPadded * buffer_locks
Definition: slru.h:77
char ** page_buffer
Definition: slru.h:70
LWLock lock
Definition: lwlock.h:70
uint64 XLogRecPtr
Definition: xlogdefs.h:21

References Assert(), SlruSharedData::bank_cur_lru_count, SlruSharedData::bank_locks, SlruSharedData::buffer_locks, BUFFERALIGN, ctl, SlruSharedData::group_lsn, IsUnderPostmaster, SlruSharedData::latest_page_number, LWLockPadded::lock, SlruSharedData::lsn_groups_per_page, LWLockInitialize(), MAXALIGN, name, SlruSharedData::num_slots, SlruSharedData::page_buffer, SlruSharedData::page_dirty, SlruSharedData::page_lru_count, SlruSharedData::page_number, SlruSharedData::page_status, pg_atomic_init_u64(), pgstat_get_slru_index(), ShmemInitStruct(), SimpleLruShmemSize(), SLRU_BANK_SIZE, SLRU_MAX_ALLOWED_BUFFERS, SLRU_PAGE_EMPTY, SlruSharedData::slru_stats_idx, and strlcpy().

Referenced by AsyncShmemInit(), CLOGShmemInit(), CommitTsShmemInit(), MultiXactShmemInit(), SerialInit(), SUBTRANSShmemInit(), and test_slru_shmem_startup().

◆ SimpleLruReadPage()

int SimpleLruReadPage ( SlruCtl  ctl,
int64  pageno,
bool  write_ok,
TransactionId  xid 
)

Definition at line 501 of file slru.c.

503{
504 SlruShared shared = ctl->shared;
505 LWLock *banklock = SimpleLruGetBankLock(ctl, pageno);
506
507 Assert(LWLockHeldByMeInMode(banklock, LW_EXCLUSIVE));
508
509 /* Outer loop handles restart if we must wait for someone else's I/O */
510 for (;;)
511 {
512 int slotno;
513 bool ok;
514
515 /* See if page already is in memory; if not, pick victim slot */
516 slotno = SlruSelectLRUPage(ctl, pageno);
517
518 /* Did we find the page in memory? */
519 if (shared->page_status[slotno] != SLRU_PAGE_EMPTY &&
520 shared->page_number[slotno] == pageno)
521 {
522 /*
523 * If page is still being read in, we must wait for I/O. Likewise
524 * if the page is being written and the caller said that's not OK.
525 */
526 if (shared->page_status[slotno] == SLRU_PAGE_READ_IN_PROGRESS ||
527 (shared->page_status[slotno] == SLRU_PAGE_WRITE_IN_PROGRESS &&
528 !write_ok))
529 {
530 SimpleLruWaitIO(ctl, slotno);
531 /* Now we must recheck state from the top */
532 continue;
533 }
534 /* Otherwise, it's ready to use */
535 SlruRecentlyUsed(shared, slotno);
536
537 /* update the stats counter of pages found in the SLRU */
538 pgstat_count_slru_page_hit(shared->slru_stats_idx);
539
540 return slotno;
541 }
542
543 /* We found no match; assert we selected a freeable slot */
544 Assert(shared->page_status[slotno] == SLRU_PAGE_EMPTY ||
545 (shared->page_status[slotno] == SLRU_PAGE_VALID &&
546 !shared->page_dirty[slotno]));
547
548 /* Mark the slot read-busy */
549 shared->page_number[slotno] = pageno;
550 shared->page_status[slotno] = SLRU_PAGE_READ_IN_PROGRESS;
551 shared->page_dirty[slotno] = false;
552
553 /* Acquire per-buffer lock (cannot deadlock, see notes at top) */
554 LWLockAcquire(&shared->buffer_locks[slotno].lock, LW_EXCLUSIVE);
555
556 /* Release bank lock while doing I/O */
557 LWLockRelease(banklock);
558
559 /* Do the read */
560 ok = SlruPhysicalReadPage(ctl, pageno, slotno);
561
562 /* Set the LSNs for this newly read-in page to zero */
563 SimpleLruZeroLSNs(ctl, slotno);
564
565 /* Re-acquire bank control lock and update page state */
566 LWLockAcquire(banklock, LW_EXCLUSIVE);
567
568 Assert(shared->page_number[slotno] == pageno &&
569 shared->page_status[slotno] == SLRU_PAGE_READ_IN_PROGRESS &&
570 !shared->page_dirty[slotno]);
571
572 shared->page_status[slotno] = ok ? SLRU_PAGE_VALID : SLRU_PAGE_EMPTY;
573
574 LWLockRelease(&shared->buffer_locks[slotno].lock);
575
576 /* Now it's okay to ereport if we failed */
577 if (!ok)
578 SlruReportIOError(ctl, pageno, xid);
579
580 SlruRecentlyUsed(shared, slotno);
581
582 /* update the stats counter of pages not found in SLRU */
583 pgstat_count_slru_page_read(shared->slru_stats_idx);
584
585 return slotno;
586 }
587}
bool LWLockAcquire(LWLock *lock, LWLockMode mode)
Definition: lwlock.c:1182
bool LWLockHeldByMeInMode(LWLock *lock, LWLockMode mode)
Definition: lwlock.c:2014
void LWLockRelease(LWLock *lock)
Definition: lwlock.c:1902
@ LW_EXCLUSIVE
Definition: lwlock.h:114
void pgstat_count_slru_page_read(int slru_idx)
Definition: pgstat_slru.c:77
void pgstat_count_slru_page_hit(int slru_idx)
Definition: pgstat_slru.c:65
static bool SlruPhysicalReadPage(SlruCtl ctl, int64 pageno, int slotno)
Definition: slru.c:803
static void SimpleLruZeroLSNs(SlruCtl ctl, int slotno)
Definition: slru.c:427
static void SimpleLruWaitIO(SlruCtl ctl, int slotno)
Definition: slru.c:444
static int SlruSelectLRUPage(SlruCtl ctl, int64 pageno)
Definition: slru.c:1168
static void SlruRecentlyUsed(SlruShared shared, int slotno)
Definition: slru.c:1122
static LWLock * SimpleLruGetBankLock(SlruCtl ctl, int64 pageno)
Definition: slru.h:175
Definition: lwlock.h:42

References Assert(), SlruSharedData::buffer_locks, ctl, LWLockPadded::lock, LW_EXCLUSIVE, LWLockAcquire(), LWLockHeldByMeInMode(), LWLockRelease(), SlruSharedData::page_dirty, SlruSharedData::page_number, SlruSharedData::page_status, pgstat_count_slru_page_hit(), pgstat_count_slru_page_read(), SimpleLruGetBankLock(), SimpleLruWaitIO(), SimpleLruZeroLSNs(), SLRU_PAGE_EMPTY, SLRU_PAGE_READ_IN_PROGRESS, SLRU_PAGE_VALID, SLRU_PAGE_WRITE_IN_PROGRESS, SlruSharedData::slru_stats_idx, SlruPhysicalReadPage(), SlruRecentlyUsed(), SlruReportIOError(), and SlruSelectLRUPage().

Referenced by asyncQueueAddEntries(), GetMultiXactIdMembers(), RecordNewMultiXact(), SerialAdd(), SetXidCommitTsInPage(), SimpleLruReadPage_ReadOnly(), SubTransSetParent(), test_slru_page_read(), TransactionIdSetPageStatusInternal(), TrimCLOG(), and TrimMultiXact().

◆ SimpleLruReadPage_ReadOnly()

int SimpleLruReadPage_ReadOnly ( SlruCtl  ctl,
int64  pageno,
TransactionId  xid 
)

Definition at line 604 of file slru.c.

605{
606 SlruShared shared = ctl->shared;
607 LWLock *banklock = SimpleLruGetBankLock(ctl, pageno);
608 int bankno = pageno % ctl->nbanks;
609 int bankstart = bankno * SLRU_BANK_SIZE;
610 int bankend = bankstart + SLRU_BANK_SIZE;
611
612 /* Try to find the page while holding only shared lock */
613 LWLockAcquire(banklock, LW_SHARED);
614
615 /* See if page is already in a buffer */
616 for (int slotno = bankstart; slotno < bankend; slotno++)
617 {
618 if (shared->page_status[slotno] != SLRU_PAGE_EMPTY &&
619 shared->page_number[slotno] == pageno &&
620 shared->page_status[slotno] != SLRU_PAGE_READ_IN_PROGRESS)
621 {
622 /* See comments for SlruRecentlyUsed macro */
623 SlruRecentlyUsed(shared, slotno);
624
625 /* update the stats counter of pages found in the SLRU */
626 pgstat_count_slru_page_hit(shared->slru_stats_idx);
627
628 return slotno;
629 }
630 }
631
632 /* No luck, so switch to normal exclusive lock and do regular read */
633 LWLockRelease(banklock);
634 LWLockAcquire(banklock, LW_EXCLUSIVE);
635
636 return SimpleLruReadPage(ctl, pageno, true, xid);
637}
@ LW_SHARED
Definition: lwlock.h:115
int SimpleLruReadPage(SlruCtl ctl, int64 pageno, bool write_ok, TransactionId xid)
Definition: slru.c:501

References ctl, LW_EXCLUSIVE, LW_SHARED, LWLockAcquire(), LWLockRelease(), SlruSharedData::page_number, SlruSharedData::page_status, pgstat_count_slru_page_hit(), SimpleLruGetBankLock(), SimpleLruReadPage(), SLRU_BANK_SIZE, SLRU_PAGE_EMPTY, SLRU_PAGE_READ_IN_PROGRESS, SlruSharedData::slru_stats_idx, and SlruRecentlyUsed().

Referenced by asyncQueueReadAllNotifications(), find_multixact_start(), SerialGetMinConflictCommitSeqNo(), SubTransGetParent(), test_slru_page_readonly(), TransactionIdGetCommitTsData(), and TransactionIdGetStatus().

◆ SimpleLruShmemSize()

Size SimpleLruShmemSize ( int  nslots,
int  nlsns 
)

Definition at line 198 of file slru.c.

199{
200 int nbanks = nslots / SLRU_BANK_SIZE;
201 Size sz;
202
203 Assert(nslots <= SLRU_MAX_ALLOWED_BUFFERS);
204 Assert(nslots % SLRU_BANK_SIZE == 0);
205
206 /* we assume nslots isn't so large as to risk overflow */
207 sz = MAXALIGN(sizeof(SlruSharedData));
208 sz += MAXALIGN(nslots * sizeof(char *)); /* page_buffer[] */
209 sz += MAXALIGN(nslots * sizeof(SlruPageStatus)); /* page_status[] */
210 sz += MAXALIGN(nslots * sizeof(bool)); /* page_dirty[] */
211 sz += MAXALIGN(nslots * sizeof(int64)); /* page_number[] */
212 sz += MAXALIGN(nslots * sizeof(int)); /* page_lru_count[] */
213 sz += MAXALIGN(nslots * sizeof(LWLockPadded)); /* buffer_locks[] */
214 sz += MAXALIGN(nbanks * sizeof(LWLockPadded)); /* bank_locks[] */
215 sz += MAXALIGN(nbanks * sizeof(int)); /* bank_cur_lru_count[] */
216
217 if (nlsns > 0)
218 sz += MAXALIGN(nslots * nlsns * sizeof(XLogRecPtr)); /* group_lsn[] */
219
220 return BUFFERALIGN(sz) + BLCKSZ * nslots;
221}

References Assert(), BUFFERALIGN, MAXALIGN, SLRU_BANK_SIZE, and SLRU_MAX_ALLOWED_BUFFERS.

Referenced by AsyncShmemSize(), CLOGShmemSize(), CommitTsShmemSize(), MultiXactShmemSize(), PredicateLockShmemSize(), SimpleLruInit(), SUBTRANSShmemSize(), and test_slru_shmem_request().

◆ SimpleLruTruncate()

void SimpleLruTruncate ( SlruCtl  ctl,
int64  cutoffPage 
)

Definition at line 1407 of file slru.c.

1408{
1409 SlruShared shared = ctl->shared;
1410 int prevbank;
1411
1412 /* update the stats counter of truncates */
1413 pgstat_count_slru_truncate(shared->slru_stats_idx);
1414
1415 /*
1416 * Scan shared memory and remove any pages preceding the cutoff page, to
1417 * ensure we won't rewrite them later. (Since this is normally called in
1418 * or just after a checkpoint, any dirty pages should have been flushed
1419 * already ... we're just being extra careful here.)
1420 */
1421restart:
1422
1423 /*
1424 * An important safety check: the current endpoint page must not be
1425 * eligible for removal. This check is just a backstop against wraparound
1426 * bugs elsewhere in SLRU handling, so we don't care if we read a slightly
1427 * outdated value; therefore we don't add a memory barrier.
1428 */
1429 if (ctl->PagePrecedes(pg_atomic_read_u64(&shared->latest_page_number),
1430 cutoffPage))
1431 {
1432 ereport(LOG,
1433 (errmsg("could not truncate directory \"%s\": apparent wraparound",
1434 ctl->Dir)));
1435 return;
1436 }
1437
1438 prevbank = SlotGetBankNumber(0);
1439 LWLockAcquire(&shared->bank_locks[prevbank].lock, LW_EXCLUSIVE);
1440 for (int slotno = 0; slotno < shared->num_slots; slotno++)
1441 {
1442 int curbank = SlotGetBankNumber(slotno);
1443
1444 /*
1445 * If the current bank lock is not same as the previous bank lock then
1446 * release the previous lock and acquire the new lock.
1447 */
1448 if (curbank != prevbank)
1449 {
1450 LWLockRelease(&shared->bank_locks[prevbank].lock);
1451 LWLockAcquire(&shared->bank_locks[curbank].lock, LW_EXCLUSIVE);
1452 prevbank = curbank;
1453 }
1454
1455 if (shared->page_status[slotno] == SLRU_PAGE_EMPTY)
1456 continue;
1457 if (!ctl->PagePrecedes(shared->page_number[slotno], cutoffPage))
1458 continue;
1459
1460 /*
1461 * If page is clean, just change state to EMPTY (expected case).
1462 */
1463 if (shared->page_status[slotno] == SLRU_PAGE_VALID &&
1464 !shared->page_dirty[slotno])
1465 {
1466 shared->page_status[slotno] = SLRU_PAGE_EMPTY;
1467 continue;
1468 }
1469
1470 /*
1471 * Hmm, we have (or may have) I/O operations acting on the page, so
1472 * we've got to wait for them to finish and then start again. This is
1473 * the same logic as in SlruSelectLRUPage. (XXX if page is dirty,
1474 * wouldn't it be OK to just discard it without writing it?
1475 * SlruMayDeleteSegment() uses a stricter qualification, so we might
1476 * not delete this page in the end; even if we don't delete it, we
1477 * won't have cause to read its data again. For now, keep the logic
1478 * the same as it was.)
1479 */
1480 if (shared->page_status[slotno] == SLRU_PAGE_VALID)
1481 SlruInternalWritePage(ctl, slotno, NULL);
1482 else
1483 SimpleLruWaitIO(ctl, slotno);
1484
1485 LWLockRelease(&shared->bank_locks[prevbank].lock);
1486 goto restart;
1487 }
1488
1489 LWLockRelease(&shared->bank_locks[prevbank].lock);
1490
1491 /* Now we can remove the old segment(s) */
1492 (void) SlruScanDirectory(ctl, SlruScanDirCbDeleteCutoff, &cutoffPage);
1493}
static uint64 pg_atomic_read_u64(volatile pg_atomic_uint64 *ptr)
Definition: atomics.h:467
int errmsg(const char *fmt,...)
Definition: elog.c:1071
#define LOG
Definition: elog.h:31
#define ereport(elevel,...)
Definition: elog.h:149
void pgstat_count_slru_truncate(int slru_idx)
Definition: pgstat_slru.c:95
static void SlruInternalWritePage(SlruCtl ctl, int slotno, SlruWriteAll fdata)
Definition: slru.c:651
bool SlruScanDirectory(SlruCtl ctl, SlruScanCallback callback, void *data)
Definition: slru.c:1790
#define SlotGetBankNumber(slotno)
Definition: slru.c:148
static bool SlruScanDirCbDeleteCutoff(SlruCtl ctl, char *filename, int64 segpage, void *data)
Definition: slru.c:1727

References SlruSharedData::bank_locks, ctl, ereport, errmsg(), SlruSharedData::latest_page_number, LWLockPadded::lock, LOG, LW_EXCLUSIVE, LWLockAcquire(), LWLockRelease(), SlruSharedData::num_slots, SlruSharedData::page_dirty, SlruSharedData::page_number, SlruSharedData::page_status, pg_atomic_read_u64(), pgstat_count_slru_truncate(), SimpleLruWaitIO(), SlotGetBankNumber, SLRU_PAGE_EMPTY, SLRU_PAGE_VALID, SlruSharedData::slru_stats_idx, SlruInternalWritePage(), SlruScanDirCbDeleteCutoff(), and SlruScanDirectory().

Referenced by asyncQueueAdvanceTail(), CheckPointPredicate(), clog_redo(), commit_ts_redo(), PerformOffsetsTruncation(), test_slru_page_truncate(), TruncateCLOG(), TruncateCommitTs(), and TruncateSUBTRANS().

◆ SimpleLruWriteAll()

void SimpleLruWriteAll ( SlruCtl  ctl,
bool  allow_redirtied 
)

Definition at line 1321 of file slru.c.

1322{
1323 SlruShared shared = ctl->shared;
1324 SlruWriteAllData fdata;
1325 int64 pageno = 0;
1326 int prevbank = SlotGetBankNumber(0);
1327 bool ok;
1328
1329 /* update the stats counter of flushes */
1330 pgstat_count_slru_flush(shared->slru_stats_idx);
1331
1332 /*
1333 * Find and write dirty pages
1334 */
1335 fdata.num_files = 0;
1336
1337 LWLockAcquire(&shared->bank_locks[prevbank].lock, LW_EXCLUSIVE);
1338
1339 for (int slotno = 0; slotno < shared->num_slots; slotno++)
1340 {
1341 int curbank = SlotGetBankNumber(slotno);
1342
1343 /*
1344 * If the current bank lock is not same as the previous bank lock then
1345 * release the previous lock and acquire the new lock.
1346 */
1347 if (curbank != prevbank)
1348 {
1349 LWLockRelease(&shared->bank_locks[prevbank].lock);
1350 LWLockAcquire(&shared->bank_locks[curbank].lock, LW_EXCLUSIVE);
1351 prevbank = curbank;
1352 }
1353
1354 /* Do nothing if slot is unused */
1355 if (shared->page_status[slotno] == SLRU_PAGE_EMPTY)
1356 continue;
1357
1358 SlruInternalWritePage(ctl, slotno, &fdata);
1359
1360 /*
1361 * In some places (e.g. checkpoints), we cannot assert that the slot
1362 * is clean now, since another process might have re-dirtied it
1363 * already. That's okay.
1364 */
1365 Assert(allow_redirtied ||
1366 shared->page_status[slotno] == SLRU_PAGE_EMPTY ||
1367 (shared->page_status[slotno] == SLRU_PAGE_VALID &&
1368 !shared->page_dirty[slotno]));
1369 }
1370
1371 LWLockRelease(&shared->bank_locks[prevbank].lock);
1372
1373 /*
1374 * Now close any files that were open
1375 */
1376 ok = true;
1377 for (int i = 0; i < fdata.num_files; i++)
1378 {
1379 if (CloseTransientFile(fdata.fd[i]) != 0)
1380 {
1381 slru_errcause = SLRU_CLOSE_FAILED;
1382 slru_errno = errno;
1383 pageno = fdata.segno[i] * SLRU_PAGES_PER_SEGMENT;
1384 ok = false;
1385 }
1386 }
1387 if (!ok)
1388 SlruReportIOError(ctl, pageno, InvalidTransactionId);
1389
1390 /* Ensure that directory entries for new files are on disk. */
1391 if (ctl->sync_handler != SYNC_HANDLER_NONE)
1392 fsync_fname(ctl->Dir, true);
1393}
void fsync_fname(const char *fname, bool isdir)
Definition: fd.c:756
int i
Definition: isn.c:77
void pgstat_count_slru_flush(int slru_idx)
Definition: pgstat_slru.c:89
int num_files
Definition: slru.c:127
int fd[MAX_WRITEALL_BUFFERS]
Definition: slru.c:128
int64 segno[MAX_WRITEALL_BUFFERS]
Definition: slru.c:129
@ SYNC_HANDLER_NONE
Definition: sync.h:42
#define InvalidTransactionId
Definition: transam.h:31

References Assert(), SlruSharedData::bank_locks, CloseTransientFile(), ctl, SlruWriteAllData::fd, fsync_fname(), i, InvalidTransactionId, LWLockPadded::lock, LW_EXCLUSIVE, LWLockAcquire(), LWLockRelease(), SlruWriteAllData::num_files, SlruSharedData::num_slots, SlruSharedData::page_dirty, SlruSharedData::page_status, pgstat_count_slru_flush(), SlruWriteAllData::segno, SlotGetBankNumber, SLRU_CLOSE_FAILED, slru_errcause, slru_errno, SLRU_PAGE_EMPTY, SLRU_PAGE_VALID, SLRU_PAGES_PER_SEGMENT, SlruSharedData::slru_stats_idx, SlruInternalWritePage(), SlruReportIOError(), and SYNC_HANDLER_NONE.

Referenced by CheckPointCLOG(), CheckPointCommitTs(), CheckPointMultiXact(), CheckPointPredicate(), CheckPointSUBTRANS(), find_multixact_start(), and test_slru_page_writeall().

◆ SimpleLruWritePage()

void SimpleLruWritePage ( SlruCtl  ctl,
int  slotno 
)

◆ SimpleLruZeroPage()

int SimpleLruZeroPage ( SlruCtl  ctl,
int64  pageno 
)

Definition at line 374 of file slru.c.

375{
376 SlruShared shared = ctl->shared;
377 int slotno;
378
379 Assert(LWLockHeldByMeInMode(SimpleLruGetBankLock(ctl, pageno), LW_EXCLUSIVE));
380
381 /* Find a suitable buffer slot for the page */
382 slotno = SlruSelectLRUPage(ctl, pageno);
383 Assert(shared->page_status[slotno] == SLRU_PAGE_EMPTY ||
384 (shared->page_status[slotno] == SLRU_PAGE_VALID &&
385 !shared->page_dirty[slotno]) ||
386 shared->page_number[slotno] == pageno);
387
388 /* Mark the slot as containing this page */
389 shared->page_number[slotno] = pageno;
390 shared->page_status[slotno] = SLRU_PAGE_VALID;
391 shared->page_dirty[slotno] = true;
392 SlruRecentlyUsed(shared, slotno);
393
394 /* Set the buffer to zeroes */
395 MemSet(shared->page_buffer[slotno], 0, BLCKSZ);
396
397 /* Set the LSNs for this new page to zero */
398 SimpleLruZeroLSNs(ctl, slotno);
399
400 /*
401 * Assume this page is now the latest active page.
402 *
403 * Note that because both this routine and SlruSelectLRUPage run with
404 * ControlLock held, it is not possible for this to be zeroing a page that
405 * SlruSelectLRUPage is going to evict simultaneously. Therefore, there's
406 * no memory barrier here.
407 */
408 pg_atomic_write_u64(&shared->latest_page_number, pageno);
409
410 /* update the stats counter of zeroed pages */
412
413 return slotno;
414}
static void pg_atomic_write_u64(volatile pg_atomic_uint64 *ptr, uint64 val)
Definition: atomics.h:485
#define MemSet(start, val, len)
Definition: c.h:991
void pgstat_count_slru_page_zeroed(int slru_idx)
Definition: pgstat_slru.c:59

References Assert(), ctl, SlruSharedData::latest_page_number, LW_EXCLUSIVE, LWLockHeldByMeInMode(), MemSet, SlruSharedData::page_buffer, SlruSharedData::page_dirty, SlruSharedData::page_number, SlruSharedData::page_status, pg_atomic_write_u64(), pgstat_count_slru_page_zeroed(), SimpleLruGetBankLock(), SimpleLruZeroLSNs(), SLRU_PAGE_EMPTY, SLRU_PAGE_VALID, SlruSharedData::slru_stats_idx, SlruRecentlyUsed(), and SlruSelectLRUPage().

Referenced by asyncQueueAddEntries(), SerialAdd(), test_slru_page_write(), ZeroCLOGPage(), ZeroCommitTsPage(), ZeroMultiXactMemberPage(), ZeroMultiXactOffsetPage(), and ZeroSUBTRANSPage().

◆ SlruDeleteSegment()

void SlruDeleteSegment ( SlruCtl  ctl,
int64  segno 
)

Definition at line 1525 of file slru.c.

1526{
1527 SlruShared shared = ctl->shared;
1528 int prevbank = SlotGetBankNumber(0);
1529 bool did_write;
1530
1531 /* Clean out any possibly existing references to the segment. */
1532 LWLockAcquire(&shared->bank_locks[prevbank].lock, LW_EXCLUSIVE);
1533restart:
1534 did_write = false;
1535 for (int slotno = 0; slotno < shared->num_slots; slotno++)
1536 {
1537 int64 pagesegno;
1538 int curbank = SlotGetBankNumber(slotno);
1539
1540 /*
1541 * If the current bank lock is not same as the previous bank lock then
1542 * release the previous lock and acquire the new lock.
1543 */
1544 if (curbank != prevbank)
1545 {
1546 LWLockRelease(&shared->bank_locks[prevbank].lock);
1547 LWLockAcquire(&shared->bank_locks[curbank].lock, LW_EXCLUSIVE);
1548 prevbank = curbank;
1549 }
1550
1551 if (shared->page_status[slotno] == SLRU_PAGE_EMPTY)
1552 continue;
1553
1554 pagesegno = shared->page_number[slotno] / SLRU_PAGES_PER_SEGMENT;
1555 /* not the segment we're looking for */
1556 if (pagesegno != segno)
1557 continue;
1558
1559 /* If page is clean, just change state to EMPTY (expected case). */
1560 if (shared->page_status[slotno] == SLRU_PAGE_VALID &&
1561 !shared->page_dirty[slotno])
1562 {
1563 shared->page_status[slotno] = SLRU_PAGE_EMPTY;
1564 continue;
1565 }
1566
1567 /* Same logic as SimpleLruTruncate() */
1568 if (shared->page_status[slotno] == SLRU_PAGE_VALID)
1569 SlruInternalWritePage(ctl, slotno, NULL);
1570 else
1571 SimpleLruWaitIO(ctl, slotno);
1572
1573 did_write = true;
1574 }
1575
1576 /*
1577 * Be extra careful and re-check. The IO functions release the control
1578 * lock, so new pages could have been read in.
1579 */
1580 if (did_write)
1581 goto restart;
1582
1583 SlruInternalDeleteSegment(ctl, segno);
1584
1585 LWLockRelease(&shared->bank_locks[prevbank].lock);
1586}
static void SlruInternalDeleteSegment(SlruCtl ctl, int64 segno)
Definition: slru.c:1502

References SlruSharedData::bank_locks, ctl, LWLockPadded::lock, LW_EXCLUSIVE, LWLockAcquire(), LWLockRelease(), SlruSharedData::num_slots, SlruSharedData::page_dirty, SlruSharedData::page_number, SlruSharedData::page_status, SlruWriteAllData::segno, SimpleLruWaitIO(), SlotGetBankNumber, SLRU_PAGE_EMPTY, SLRU_PAGE_VALID, SLRU_PAGES_PER_SEGMENT, SlruInternalDeleteSegment(), and SlruInternalWritePage().

Referenced by PerformMembersTruncation(), and test_slru_page_delete().

◆ SlruScanDirCbDeleteAll()

bool SlruScanDirCbDeleteAll ( SlruCtl  ctl,
char *  filename,
int64  segpage,
void *  data 
)

Definition at line 1743 of file slru.c.

1744{
1745 SlruInternalDeleteSegment(ctl, segpage / SLRU_PAGES_PER_SEGMENT);
1746
1747 return false; /* keep going */
1748}

References ctl, SLRU_PAGES_PER_SEGMENT, and SlruInternalDeleteSegment().

Referenced by AsyncShmemInit(), DeactivateCommitTs(), and test_slru_scan_cb().

◆ SlruScanDirCbReportPresence()

bool SlruScanDirCbReportPresence ( SlruCtl  ctl,
char *  filename,
int64  segpage,
void *  data 
)

Definition at line 1711 of file slru.c.

1713{
1714 int64 cutoffPage = *(int64 *) data;
1715
1716 if (SlruMayDeleteSegment(ctl, segpage, cutoffPage))
1717 return true; /* found one; don't iterate any more */
1718
1719 return false; /* keep going */
1720}
const void * data
static bool SlruMayDeleteSegment(SlruCtl ctl, int64 segpage, int64 cutoffPage)
Definition: slru.c:1602

References ctl, data, and SlruMayDeleteSegment().

Referenced by TruncateCLOG(), and TruncateCommitTs().

◆ SlruScanDirectory()

bool SlruScanDirectory ( SlruCtl  ctl,
SlruScanCallback  callback,
void *  data 
)

Definition at line 1790 of file slru.c.

1791{
1792 bool retval = false;
1793 DIR *cldir;
1794 struct dirent *clde;
1795 int64 segno;
1796 int64 segpage;
1797
1798 cldir = AllocateDir(ctl->Dir);
1799 while ((clde = ReadDir(cldir, ctl->Dir)) != NULL)
1800 {
1801 size_t len;
1802
1803 len = strlen(clde->d_name);
1804
1805 if (SlruCorrectSegmentFilenameLength(ctl, len) &&
1806 strspn(clde->d_name, "0123456789ABCDEF") == len)
1807 {
1808 segno = strtoi64(clde->d_name, NULL, 16);
1809 segpage = segno * SLRU_PAGES_PER_SEGMENT;
1810
1811 elog(DEBUG2, "SlruScanDirectory invoking callback on %s/%s",
1812 ctl->Dir, clde->d_name);
1813 retval = callback(ctl, clde->d_name, segpage, data);
1814 if (retval)
1815 break;
1816 }
1817 }
1818 FreeDir(cldir);
1819
1820 return retval;
1821}
#define DEBUG2
Definition: elog.h:29
#define elog(elevel,...)
Definition: elog.h:226
int FreeDir(DIR *dir)
Definition: fd.c:3025
DIR * AllocateDir(const char *dirname)
Definition: fd.c:2907
struct dirent * ReadDir(DIR *dir, const char *dirname)
Definition: fd.c:2973
const void size_t len
static bool SlruCorrectSegmentFilenameLength(SlruCtl ctl, size_t len)
Definition: slru.c:1757
DIR
Definition: dirent.c:26
dirent
Definition: dirent.h:10
char d_name[MAX_PATH]
Definition: dirent.h:15
static void callback(struct sockaddr *addr, struct sockaddr *mask, void *unused)
Definition: test_ifaddrs.c:46

References AllocateDir(), callback(), ctl, dirent::d_name, data, DEBUG2, elog, FreeDir(), len, ReadDir(), SLRU_PAGES_PER_SEGMENT, and SlruCorrectSegmentFilenameLength().

Referenced by AsyncShmemInit(), DeactivateCommitTs(), SimpleLruTruncate(), test_slru_delete_all(), TruncateCLOG(), TruncateCommitTs(), and TruncateMultiXact().

◆ SlruSyncFileTag()

int SlruSyncFileTag ( SlruCtl  ctl,
const FileTag *  ftag,
char *  path 
)

Definition at line 1830 of file slru.c.

1831{
1832 int fd;
1833 int save_errno;
1834 int result;
1835
1836 SlruFileName(ctl, path, ftag->segno);
1837
1838 fd = OpenTransientFile(path, O_RDWR | PG_BINARY);
1839 if (fd < 0)
1840 return -1;
1841
1842 pgstat_report_wait_start(WAIT_EVENT_SLRU_FLUSH_SYNC);
1843 result = pg_fsync(fd);
1844 pgstat_report_wait_end();
1845 save_errno = errno;
1846
1847 CloseTransientFile(fd);
1848
1849 errno = save_errno;
1850 return result;
1851}
int pg_fsync(int fd)
Definition: fd.c:386
uint64 segno
Definition: sync.h:55
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: wait_event.h:85
static void pgstat_report_wait_end(void)
Definition: wait_event.h:101

References CloseTransientFile(), ctl, fd(), OpenTransientFile(), PG_BINARY, pg_fsync(), pgstat_report_wait_end(), pgstat_report_wait_start(), FileTag::segno, and SlruFileName().

Referenced by clogsyncfiletag(), committssyncfiletag(), multixactmemberssyncfiletag(), multixactoffsetssyncfiletag(), and test_slru_page_sync().