PostgreSQL Source Code git master
Loading...
Searching...
No Matches
lwlock.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * lwlock.c
4 * Lightweight lock manager
5 *
6 * Lightweight locks are intended primarily to provide mutual exclusion of
7 * access to shared-memory data structures. Therefore, they offer both
8 * exclusive and shared lock modes (to support read/write and read-only
9 * access to a shared object). There are few other frammishes. User-level
10 * locking should be done with the full lock manager --- which depends on
11 * LWLocks to protect its shared state.
12 *
13 * In addition to exclusive and shared modes, lightweight locks can be used to
14 * wait until a variable changes value. The variable is initially not set
15 * when the lock is acquired with LWLockAcquire, i.e. it remains set to the
16 * value it was set to when the lock was released last, and can be updated
17 * without releasing the lock by calling LWLockUpdateVar. LWLockWaitForVar
18 * waits for the variable to be updated, or until the lock is free. When
19 * releasing the lock with LWLockReleaseClearVar() the value can be set to an
20 * appropriate value for a free lock. The meaning of the variable is up to
21 * the caller, the lightweight lock code just assigns and compares it.
22 *
23 * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
24 * Portions Copyright (c) 1994, Regents of the University of California
25 *
26 * IDENTIFICATION
27 * src/backend/storage/lmgr/lwlock.c
28 *
29 * NOTES:
30 *
31 * This used to be a pretty straight forward reader-writer lock
32 * implementation, in which the internal state was protected by a
33 * spinlock. Unfortunately the overhead of taking the spinlock proved to be
34 * too high for workloads/locks that were taken in shared mode very
35 * frequently. Often we were spinning in the (obviously exclusive) spinlock,
36 * while trying to acquire a shared lock that was actually free.
37 *
38 * Thus a new implementation was devised that provides wait-free shared lock
39 * acquisition for locks that aren't exclusively locked.
40 *
41 * The basic idea is to have a single atomic variable 'lockcount' instead of
42 * the formerly separate shared and exclusive counters and to use atomic
43 * operations to acquire the lock. That's fairly easy to do for plain
44 * rw-spinlocks, but a lot harder for something like LWLocks that want to wait
45 * in the OS.
46 *
47 * For lock acquisition we use an atomic compare-and-exchange on the lockcount
48 * variable. For exclusive lock we swap in a sentinel value
49 * (LW_VAL_EXCLUSIVE), for shared locks we count the number of holders.
50 *
51 * To release the lock we use an atomic decrement to release the lock. If the
52 * new value is zero (we get that atomically), we know we can/have to release
53 * waiters.
54 *
55 * Obviously it is important that the sentinel value for exclusive locks
56 * doesn't conflict with the maximum number of possible share lockers -
57 * luckily MAX_BACKENDS makes that easily possible.
58 *
59 *
60 * The attentive reader might have noticed that naively doing the above has a
61 * glaring race condition: We try to lock using the atomic operations and
62 * notice that we have to wait. Unfortunately by the time we have finished
63 * queuing, the former locker very well might have already finished its
64 * work. That's problematic because we're now stuck waiting inside the OS.
65
66 * To mitigate those races we use a two phased attempt at locking:
67 * Phase 1: Try to do it atomically, if we succeed, nice
68 * Phase 2: Add ourselves to the waitqueue of the lock
69 * Phase 3: Try to grab the lock again, if we succeed, remove ourselves from
70 * the queue
71 * Phase 4: Sleep till wake-up, goto Phase 1
72 *
73 * This protects us against the problem from above as nobody can release too
74 * quick, before we're queued, since after Phase 2 we're already queued.
75 * -------------------------------------------------------------------------
76 */
77#include "postgres.h"
78
79#include "miscadmin.h"
80#include "pg_trace.h"
81#include "pgstat.h"
82#include "port/pg_bitutils.h"
83#include "storage/proc.h"
84#include "storage/proclist.h"
85#include "storage/procnumber.h"
86#include "storage/spin.h"
87#include "utils/memutils.h"
88
89#ifdef LWLOCK_STATS
90#include "utils/hsearch.h"
91#endif
92
93
94#define LW_FLAG_HAS_WAITERS ((uint32) 1 << 31)
95#define LW_FLAG_WAKE_IN_PROGRESS ((uint32) 1 << 30)
96#define LW_FLAG_LOCKED ((uint32) 1 << 29)
97#define LW_FLAG_BITS 3
98#define LW_FLAG_MASK (((1<<LW_FLAG_BITS)-1)<<(32-LW_FLAG_BITS))
99
100/* assumes MAX_BACKENDS is a (power of 2) - 1, checked below */
101#define LW_VAL_EXCLUSIVE (MAX_BACKENDS + 1)
102#define LW_VAL_SHARED 1
103
104/* already (power of 2)-1, i.e. suitable for a mask */
105#define LW_SHARED_MASK MAX_BACKENDS
106#define LW_LOCK_MASK (MAX_BACKENDS | LW_VAL_EXCLUSIVE)
107
108
110 "MAX_BACKENDS + 1 needs to be a power of 2");
111
113 "MAX_BACKENDS and LW_FLAG_MASK overlap");
114
116 "LW_VAL_EXCLUSIVE and LW_FLAG_MASK overlap");
117
118/*
119 * There are three sorts of LWLock "tranches":
120 *
121 * 1. The individually-named locks defined in lwlocklist.h each have their
122 * own tranche. We absorb the names of these tranches from there into
123 * BuiltinTrancheNames here.
124 *
125 * 2. There are some predefined tranches for built-in groups of locks defined
126 * in lwlocklist.h. We absorb the names of these tranches, too.
127 *
128 * 3. Extensions can create new tranches, via either RequestNamedLWLockTranche
129 * or LWLockNewTrancheId. These names are stored in shared memory and can be
130 * accessed via LWLockTrancheNames.
131 *
132 * All these names are user-visible as wait event names, so choose with care
133 * ... and do not forget to update the documentation's list of wait events.
134 */
135static const char *const BuiltinTrancheNames[] = {
136#define PG_LWLOCK(id, lockname) [id] = CppAsString(lockname),
137#define PG_LWLOCKTRANCHE(id, lockname) [LWTRANCHE_##id] = CppAsString(lockname),
138#include "storage/lwlocklist.h"
139#undef PG_LWLOCK
140#undef PG_LWLOCKTRANCHE
141};
142
145 "missing entries in BuiltinTrancheNames[]");
146
147/*
148 * This is indexed by tranche ID minus LWTRANCHE_FIRST_USER_DEFINED, and
149 * points to the shared memory locations of the names of all
150 * dynamically-created tranches. Backends inherit the pointer by fork from the
151 * postmaster (except in the EXEC_BACKEND case, where we have special measures
152 * to pass it down).
153 */
155
156/*
157 * This points to the main array of LWLocks in shared memory. Backends inherit
158 * the pointer by fork from the postmaster (except in the EXEC_BACKEND case,
159 * where we have special measures to pass it down).
160 */
162
163/*
164 * We use this structure to keep track of locked LWLocks for release
165 * during error recovery. Normally, only a few will be held at once, but
166 * occasionally the number can be much higher.
167 */
168#define MAX_SIMUL_LWLOCKS 200
169
170/* struct representing the LWLocks we're holding */
176
177static int num_held_lwlocks = 0;
179
180/* struct representing the LWLock tranche request for named tranche */
186
187/*
188 * NamedLWLockTrancheRequests is the valid length of the request array. These
189 * variables are non-static so that launch_backend.c can copy them to child
190 * processes in EXEC_BACKEND builds.
191 */
194
195/* postmaster's local copy of the request array */
197
198/* shared memory counter of registered tranches */
200
201/* backend-local counter of registered tranches */
203
204#define MAX_NAMED_TRANCHES 256
205
206static void InitializeLWLocks(void);
207static inline void LWLockReportWaitStart(LWLock *lock);
208static inline void LWLockReportWaitEnd(void);
209static const char *GetLWTrancheName(uint16 trancheId);
210
211#define T_NAME(lock) \
212 GetLWTrancheName((lock)->tranche)
213
214#ifdef LWLOCK_STATS
215typedef struct lwlock_stats_key
216{
217 int tranche;
218 void *instance;
220
221typedef struct lwlock_stats
222{
226 int block_count;
230
231static HTAB *lwlock_stats_htab;
233#endif
234
235#ifdef LOCK_DEBUG
236bool Trace_lwlocks = false;
237
238inline static void
239PRINT_LWDEBUG(const char *where, LWLock *lock, LWLockMode mode)
240{
241 /* hide statement & context here, otherwise the log is just too verbose */
242 if (Trace_lwlocks)
243 {
245
246 ereport(LOG,
247 (errhidestmt(true),
248 errhidecontext(true),
249 errmsg_internal("%d: %s(%s %p): excl %u shared %u haswaiters %u waiters %u waking %d",
250 MyProcPid,
251 where, T_NAME(lock), lock,
252 (state & LW_VAL_EXCLUSIVE) != 0,
254 (state & LW_FLAG_HAS_WAITERS) != 0,
255 pg_atomic_read_u32(&lock->nwaiters),
257 }
258}
259
260inline static void
261LOG_LWDEBUG(const char *where, LWLock *lock, const char *msg)
262{
263 /* hide statement & context here, otherwise the log is just too verbose */
264 if (Trace_lwlocks)
265 {
266 ereport(LOG,
267 (errhidestmt(true),
268 errhidecontext(true),
269 errmsg_internal("%s(%s %p): %s", where,
270 T_NAME(lock), lock, msg)));
271 }
272}
273
274#else /* not LOCK_DEBUG */
275#define PRINT_LWDEBUG(a,b,c) ((void)0)
276#define LOG_LWDEBUG(a,b,c) ((void)0)
277#endif /* LOCK_DEBUG */
278
279#ifdef LWLOCK_STATS
280
281static void init_lwlock_stats(void);
282static void print_lwlock_stats(int code, Datum arg);
284
285static void
287{
288 HASHCTL ctl;
290 static bool exit_registered = false;
291
292 if (lwlock_stats_cxt != NULL)
294
295 /*
296 * The LWLock stats will be updated within a critical section, which
297 * requires allocating new hash entries. Allocations within a critical
298 * section are normally not allowed because running out of memory would
299 * lead to a PANIC, but LWLOCK_STATS is debugging code that's not normally
300 * turned on in production, so that's an acceptable risk. The hash entries
301 * are small, so the risk of running out of memory is minimal in practice.
302 */
304 "LWLock stats",
307
308 ctl.keysize = sizeof(lwlock_stats_key);
309 ctl.entrysize = sizeof(lwlock_stats);
310 ctl.hcxt = lwlock_stats_cxt;
311 lwlock_stats_htab = hash_create("lwlock stats", 16384, &ctl,
313 if (!exit_registered)
314 {
316 exit_registered = true;
317 }
318}
319
320static void
322{
323 HASH_SEQ_STATUS scan;
325
327
328 /* Grab an LWLock to keep different backends from mixing reports */
330
331 while ((lwstats = (lwlock_stats *) hash_seq_search(&scan)) != NULL)
332 {
334 "PID %d lwlock %s %p: shacq %u exacq %u blk %u spindelay %u dequeue self %u\n",
335 MyProcPid, GetLWTrancheName(lwstats->key.tranche),
336 lwstats->key.instance, lwstats->sh_acquire_count,
337 lwstats->ex_acquire_count, lwstats->block_count,
338 lwstats->spin_delay_count, lwstats->dequeue_self_count);
339 }
340
342}
343
344static lwlock_stats *
346{
349 bool found;
350
351 /*
352 * During shared memory initialization, the hash table doesn't exist yet.
353 * Stats of that phase aren't very interesting, so just collect operations
354 * on all locks in a single dummy entry.
355 */
356 if (lwlock_stats_htab == NULL)
357 return &lwlock_stats_dummy;
358
359 /* Fetch or create the entry. */
360 MemSet(&key, 0, sizeof(key));
361 key.tranche = lock->tranche;
362 key.instance = lock;
364 if (!found)
365 {
366 lwstats->sh_acquire_count = 0;
367 lwstats->ex_acquire_count = 0;
368 lwstats->block_count = 0;
369 lwstats->dequeue_self_count = 0;
370 lwstats->spin_delay_count = 0;
371 }
372 return lwstats;
373}
374#endif /* LWLOCK_STATS */
375
376
377/*
378 * Compute number of LWLocks required by named tranches. These will be
379 * allocated in the main array.
380 */
381static int
383{
384 int numLocks = 0;
385 int i;
386
387 for (i = 0; i < NamedLWLockTrancheRequests; i++)
388 numLocks += NamedLWLockTrancheRequestArray[i].num_lwlocks;
389
390 return numLocks;
391}
392
393/*
394 * Compute shmem space needed for LWLocks and named tranches.
395 */
396Size
398{
399 Size size;
400 int numLocks = NUM_FIXED_LWLOCKS;
401
402 /*
403 * If re-initializing shared memory, the request array will no longer be
404 * accessible, so switch to the copy in postmaster's local memory. We'll
405 * copy it back into shared memory later when CreateLWLocks() is called
406 * again.
407 */
410
411 /* Calculate total number of locks needed in the main array. */
412 numLocks += NumLWLocksForNamedTranches();
413
414 /* Space for dynamic allocation counter. */
415 size = MAXALIGN(sizeof(int));
416
417 /* Space for named tranches. */
418 size = add_size(size, mul_size(MAX_NAMED_TRANCHES, sizeof(char *)));
420
421 /*
422 * Make space for named tranche requests. This is done for the benefit of
423 * EXEC_BACKEND builds, which otherwise wouldn't be able to call
424 * GetNamedLWLockTranche() outside postmaster.
425 */
428
429 /* Space for the LWLock array, plus room for cache line alignment. */
430 size = add_size(size, LWLOCK_PADDED_SIZE);
431 size = add_size(size, mul_size(numLocks, sizeof(LWLockPadded)));
432
433 return size;
434}
435
436/*
437 * Allocate shmem space for the main LWLock array and all tranches and
438 * initialize it.
439 */
440void
442{
444 {
446 char *ptr;
447
448 /* Allocate space */
449 ptr = (char *) ShmemAlloc(spaceLocks);
450
451 /* Initialize the dynamic-allocation counter for tranches */
452 LWLockCounter = (int *) ptr;
454 ptr += MAXALIGN(sizeof(int));
455
456 /* Initialize tranche names */
457 LWLockTrancheNames = (char **) ptr;
458 ptr += MAX_NAMED_TRANCHES * sizeof(char *);
459 for (int i = 0; i < MAX_NAMED_TRANCHES; i++)
460 {
461 LWLockTrancheNames[i] = ptr;
462 ptr += NAMEDATALEN;
463 }
464
465 /*
466 * Move named tranche requests to shared memory. This is done for the
467 * benefit of EXEC_BACKEND builds, which otherwise wouldn't be able to
468 * call GetNamedLWLockTranche() outside postmaster.
469 */
471 {
472 /*
473 * Save the pointer to the request array in postmaster's local
474 * memory. We'll need it if we ever need to re-initialize shared
475 * memory after a crash.
476 */
478
483 }
484
485 /* Ensure desired alignment of LWLock array */
488
489 /* Initialize all LWLocks */
491 }
492}
493
494/*
495 * Initialize LWLocks that are fixed and those belonging to named tranches.
496 */
497static void
499{
500 int id;
501 int i;
502 int j;
503 LWLockPadded *lock;
504
505 /* Initialize all individual LWLocks in main array */
506 for (id = 0, lock = MainLWLockArray; id < NUM_INDIVIDUAL_LWLOCKS; id++, lock++)
507 LWLockInitialize(&lock->lock, id);
508
509 /* Initialize buffer mapping LWLocks in main array */
511 for (id = 0; id < NUM_BUFFER_PARTITIONS; id++, lock++)
513
514 /* Initialize lmgrs' LWLocks in main array */
516 for (id = 0; id < NUM_LOCK_PARTITIONS; id++, lock++)
518
519 /* Initialize predicate lmgrs' LWLocks in main array */
521 for (id = 0; id < NUM_PREDICATELOCK_PARTITIONS; id++, lock++)
523
524 /*
525 * Copy the info about any named tranches into shared memory (so that
526 * other processes can see it), and initialize the requested LWLocks.
527 */
529 {
531
532 for (i = 0; i < NamedLWLockTrancheRequests; i++)
533 {
535 int tranche;
536
538 tranche = LWLockNewTrancheId(request->tranche_name);
539
540 for (j = 0; j < request->num_lwlocks; j++, lock++)
541 LWLockInitialize(&lock->lock, tranche);
542 }
543 }
544}
545
546/*
547 * InitLWLockAccess - initialize backend-local state needed to hold LWLocks
548 */
549void
551{
552#ifdef LWLOCK_STATS
554#endif
555}
556
557/*
558 * GetNamedLWLockTranche - returns the base address of LWLock from the
559 * specified tranche.
560 *
561 * Caller needs to retrieve the requested number of LWLocks starting from
562 * the base lock address returned by this API. This can be used for
563 * tranches that are requested by using RequestNamedLWLockTranche() API.
564 */
566GetNamedLWLockTranche(const char *tranche_name)
567{
568 int lock_pos;
569 int i;
570
571 /*
572 * Obtain the position of base address of LWLock belonging to requested
573 * tranche_name in MainLWLockArray. LWLocks for named tranches are placed
574 * in MainLWLockArray after fixed locks.
575 */
577 for (i = 0; i < NamedLWLockTrancheRequests; i++)
578 {
579 if (strcmp(NamedLWLockTrancheRequestArray[i].tranche_name,
580 tranche_name) == 0)
581 return &MainLWLockArray[lock_pos];
582
584 }
585
586 elog(ERROR, "requested tranche is not registered");
587
588 /* just to keep compiler quiet */
589 return NULL;
590}
591
592/*
593 * Allocate a new tranche ID with the provided name.
594 */
595int
597{
598 int result;
599
600 if (!name)
603 errmsg("tranche name cannot be NULL")));
604
605 if (strlen(name) >= NAMEDATALEN)
608 errmsg("tranche name too long"),
609 errdetail("LWLock tranche names must be no longer than %d bytes.",
610 NAMEDATALEN - 1)));
611
612 /*
613 * We use the ShmemLock spinlock to protect LWLockCounter and
614 * LWLockTrancheNames.
615 */
617
619 {
622 (errmsg("maximum number of tranches already registered"),
623 errdetail("No more than %d tranches may be registered.",
625 }
626
627 result = (*LWLockCounter)++;
630
632
633 return result;
634}
635
636/*
637 * RequestNamedLWLockTranche
638 * Request that extra LWLocks be allocated during postmaster
639 * startup.
640 *
641 * This may only be called via the shmem_request_hook of a library that is
642 * loaded into the postmaster via shared_preload_libraries. Calls from
643 * elsewhere will fail.
644 *
645 * The tranche name will be user-visible as a wait event name, so try to
646 * use a name that fits the style for those.
647 */
648void
649RequestNamedLWLockTranche(const char *tranche_name, int num_lwlocks)
650{
653
655 elog(FATAL, "cannot request additional LWLocks outside shmem_request_hook");
656
657 if (!tranche_name)
660 errmsg("tranche name cannot be NULL")));
661
662 if (strlen(tranche_name) >= NAMEDATALEN)
665 errmsg("tranche name too long"),
666 errdetail("LWLock tranche names must be no longer than %d bytes.",
667 NAMEDATALEN - 1)));
668
670 {
675 * sizeof(NamedLWLockTrancheRequest));
676 }
677
679 {
681
684 i * sizeof(NamedLWLockTrancheRequest));
686 }
687
689 strlcpy(request->tranche_name, tranche_name, NAMEDATALEN);
690 request->num_lwlocks = num_lwlocks;
692}
693
694/*
695 * LWLockInitialize - initialize a new lwlock; it's initially unlocked
696 */
697void
698LWLockInitialize(LWLock *lock, int tranche_id)
699{
700 /* verify the tranche_id is valid */
701 (void) GetLWTrancheName(tranche_id);
702
703 pg_atomic_init_u32(&lock->state, 0);
704#ifdef LOCK_DEBUG
705 pg_atomic_init_u32(&lock->nwaiters, 0);
706#endif
707 lock->tranche = tranche_id;
708 proclist_init(&lock->waiters);
709}
710
711/*
712 * Report start of wait event for light-weight locks.
713 *
714 * This function will be used by all the light-weight lock calls which
715 * needs to wait to acquire the lock. This function distinguishes wait
716 * event based on tranche and lock id.
717 */
718static inline void
723
724/*
725 * Report end of wait event for light-weight locks.
726 */
727static inline void
732
733/*
734 * Return the name of an LWLock tranche.
735 */
736static const char *
738{
739 /* Built-in tranche or individual LWLock? */
742
743 /*
744 * We only ever add new entries to LWLockTrancheNames, so most lookups can
745 * avoid taking the spinlock as long as the backend-local counter
746 * (LocalLWLockCounter) is greater than the requested tranche ID. Else,
747 * we need to first update the backend-local counter with ShmemLock held
748 * before attempting the lookup again. In practice, the latter case is
749 * probably rare.
750 */
752 {
756
758 elog(ERROR, "tranche %d is not registered", trancheId);
759 }
760
761 /*
762 * It's an extension tranche, so look in LWLockTrancheNames.
763 */
765
767}
768
769/*
770 * Return an identifier for an LWLock based on the wait class and event.
771 */
772const char *
774{
775 Assert(classId == PG_WAIT_LWLOCK);
776 /* The event IDs are just tranche numbers. */
778}
779
780/*
781 * Internal function that tries to atomically acquire the lwlock in the passed
782 * in mode.
783 *
784 * This function will not block waiting for a lock to become free - that's the
785 * caller's job.
786 *
787 * Returns true if the lock isn't free and we need to wait.
788 */
789static bool
791{
793
795
796 /*
797 * Read once outside the loop, later iterations will get the newer value
798 * via compare & exchange.
799 */
801
802 /* loop until we've determined whether we could acquire the lock or not */
803 while (true)
804 {
806 bool lock_free;
807
809
810 if (mode == LW_EXCLUSIVE)
811 {
813 if (lock_free)
815 }
816 else
817 {
819 if (lock_free)
821 }
822
823 /*
824 * Attempt to swap in the state we are expecting. If we didn't see
825 * lock to be free, that's just the old value. If we saw it as free,
826 * we'll attempt to mark it acquired. The reason that we always swap
827 * in the value is that this doubles as a memory barrier. We could try
828 * to be smarter and only swap in values if we saw the lock as free,
829 * but benchmark haven't shown it as beneficial so far.
830 *
831 * Retry if the value changed since we last looked at it.
832 */
835 {
836 if (lock_free)
837 {
838 /* Great! Got the lock. */
839#ifdef LOCK_DEBUG
840 if (mode == LW_EXCLUSIVE)
841 lock->owner = MyProc;
842#endif
843 return false;
844 }
845 else
846 return true; /* somebody else has the lock */
847 }
848 }
850}
851
852/*
853 * Lock the LWLock's wait list against concurrent activity.
854 *
855 * NB: even though the wait list is locked, non-conflicting lock operations
856 * may still happen concurrently.
857 *
858 * Time spent holding mutex should be short!
859 */
860static void
862{
864#ifdef LWLOCK_STATS
866 uint32 delays = 0;
867
869#endif
870
871 while (true)
872 {
873 /*
874 * Always try once to acquire the lock directly, without setting up
875 * the spin-delay infrastructure. The work necessary for that shows up
876 * in profiles and is rarely necessary.
877 */
880 break; /* got lock */
881
882 /* and then spin without atomic operations until lock is released */
883 {
885
887
888 while (old_state & LW_FLAG_LOCKED)
889 {
892 }
893#ifdef LWLOCK_STATS
894 delays += delayStatus.delays;
895#endif
897 }
898
899 /*
900 * Retry. The lock might obviously already be re-acquired by the time
901 * we're attempting to get it again.
902 */
903 }
904
905#ifdef LWLOCK_STATS
906 lwstats->spin_delay_count += delays;
907#endif
908}
909
910/*
911 * Unlock the LWLock's wait list.
912 *
913 * Note that it can be more efficient to manipulate flags and release the
914 * locks in a single atomic operation.
915 */
916static void
925
926/*
927 * Wakeup all the lockers that currently have a chance to acquire the lock.
928 */
929static void
931{
932 bool new_wake_in_progress = false;
933 bool wokeup_somebody = false;
936
938
939 /* lock wait list while collecting backends to wake up */
940 LWLockWaitListLock(lock);
941
942 proclist_foreach_modify(iter, &lock->waiters, lwWaitLink)
943 {
944 PGPROC *waiter = GetPGProcByNumber(iter.cur);
945
946 if (wokeup_somebody && waiter->lwWaitMode == LW_EXCLUSIVE)
947 continue;
948
949 proclist_delete(&lock->waiters, iter.cur, lwWaitLink);
950 proclist_push_tail(&wakeup, iter.cur, lwWaitLink);
951
952 if (waiter->lwWaitMode != LW_WAIT_UNTIL_FREE)
953 {
954 /*
955 * Prevent additional wakeups until retryer gets to run. Backends
956 * that are just waiting for the lock to become free don't retry
957 * automatically.
958 */
960
961 /*
962 * Don't wakeup (further) exclusive locks.
963 */
964 wokeup_somebody = true;
965 }
966
967 /*
968 * Signal that the process isn't on the wait list anymore. This allows
969 * LWLockDequeueSelf() to remove itself of the waitlist with a
970 * proclist_delete(), rather than having to check if it has been
971 * removed from the list.
972 */
973 Assert(waiter->lwWaiting == LW_WS_WAITING);
975
976 /*
977 * Once we've woken up an exclusive lock, there's no point in waking
978 * up anybody else.
979 */
980 if (waiter->lwWaitMode == LW_EXCLUSIVE)
981 break;
982 }
983
985
986 /* unset required flags, and release lock, in one fell swoop */
987 {
990
992 while (true)
993 {
995
996 /* compute desired flags */
997
1000 else
1002
1003 if (proclist_is_empty(&lock->waiters))
1005
1006 desired_state &= ~LW_FLAG_LOCKED; /* release lock */
1007
1010 break;
1011 }
1012 }
1013
1014 /* Awaken any waiters I removed from the queue. */
1015 proclist_foreach_modify(iter, &wakeup, lwWaitLink)
1016 {
1017 PGPROC *waiter = GetPGProcByNumber(iter.cur);
1018
1019 LOG_LWDEBUG("LWLockRelease", lock, "release waiter");
1020 proclist_delete(&wakeup, iter.cur, lwWaitLink);
1021
1022 /*
1023 * Guarantee that lwWaiting being unset only becomes visible once the
1024 * unlink from the link has completed. Otherwise the target backend
1025 * could be woken up for other reason and enqueue for a new lock - if
1026 * that happens before the list unlink happens, the list would end up
1027 * being corrupted.
1028 *
1029 * The barrier pairs with the LWLockWaitListLock() when enqueuing for
1030 * another lock.
1031 */
1033 waiter->lwWaiting = LW_WS_NOT_WAITING;
1034 PGSemaphoreUnlock(waiter->sem);
1035 }
1036}
1037
1038/*
1039 * Add ourselves to the end of the queue.
1040 *
1041 * NB: Mode can be LW_WAIT_UNTIL_FREE here!
1042 */
1043static void
1045{
1046 /*
1047 * If we don't have a PGPROC structure, there's no way to wait. This
1048 * should never occur, since MyProc should only be null during shared
1049 * memory initialization.
1050 */
1051 if (MyProc == NULL)
1052 elog(PANIC, "cannot wait without a PGPROC structure");
1053
1055 elog(PANIC, "queueing for lock while waiting on another one");
1056
1057 LWLockWaitListLock(lock);
1058
1059 /* setting the flag is protected by the spinlock */
1061
1064
1065 /* LW_WAIT_UNTIL_FREE waiters are always at the front of the queue */
1066 if (mode == LW_WAIT_UNTIL_FREE)
1067 proclist_push_head(&lock->waiters, MyProcNumber, lwWaitLink);
1068 else
1069 proclist_push_tail(&lock->waiters, MyProcNumber, lwWaitLink);
1070
1071 /* Can release the mutex now */
1073
1074#ifdef LOCK_DEBUG
1075 pg_atomic_fetch_add_u32(&lock->nwaiters, 1);
1076#endif
1077}
1078
1079/*
1080 * Remove ourselves from the waitlist.
1081 *
1082 * This is used if we queued ourselves because we thought we needed to sleep
1083 * but, after further checking, we discovered that we don't actually need to
1084 * do so.
1085 */
1086static void
1088{
1089 bool on_waitlist;
1090
1091#ifdef LWLOCK_STATS
1093
1095
1096 lwstats->dequeue_self_count++;
1097#endif
1098
1099 LWLockWaitListLock(lock);
1100
1101 /*
1102 * Remove ourselves from the waitlist, unless we've already been removed.
1103 * The removal happens with the wait list lock held, so there's no race in
1104 * this check.
1105 */
1107 if (on_waitlist)
1108 proclist_delete(&lock->waiters, MyProcNumber, lwWaitLink);
1109
1110 if (proclist_is_empty(&lock->waiters) &&
1112 {
1114 }
1115
1116 /* XXX: combine with fetch_and above? */
1118
1119 /* clear waiting state again, nice for debugging */
1120 if (on_waitlist)
1122 else
1123 {
1124 int extraWaits = 0;
1125
1126 /*
1127 * Somebody else dequeued us and has or will wake us up. Deal with the
1128 * superfluous absorption of a wakeup.
1129 */
1130
1131 /*
1132 * Clear LW_FLAG_WAKE_IN_PROGRESS if somebody woke us before we
1133 * removed ourselves - they'll have set it.
1134 */
1136
1137 /*
1138 * Now wait for the scheduled wakeup, otherwise our ->lwWaiting would
1139 * get reset at some inconvenient point later. Most of the time this
1140 * will immediately return.
1141 */
1142 for (;;)
1143 {
1146 break;
1147 extraWaits++;
1148 }
1149
1150 /*
1151 * Fix the process wait semaphore's count for any absorbed wakeups.
1152 */
1153 while (extraWaits-- > 0)
1155 }
1156
1157#ifdef LOCK_DEBUG
1158 {
1159 /* not waiting anymore */
1161
1163 }
1164#endif
1165}
1166
1167/*
1168 * LWLockAcquire - acquire a lightweight lock in the specified mode
1169 *
1170 * If the lock is not available, sleep until it is. Returns true if the lock
1171 * was available immediately, false if we had to sleep.
1172 *
1173 * Side effect: cancel/die interrupts are held off until lock release.
1174 */
1175bool
1177{
1178 PGPROC *proc = MyProc;
1179 bool result = true;
1180 int extraWaits = 0;
1181#ifdef LWLOCK_STATS
1183
1185#endif
1186
1188
1189 PRINT_LWDEBUG("LWLockAcquire", lock, mode);
1190
1191#ifdef LWLOCK_STATS
1192 /* Count lock acquisition attempts */
1193 if (mode == LW_EXCLUSIVE)
1194 lwstats->ex_acquire_count++;
1195 else
1196 lwstats->sh_acquire_count++;
1197#endif /* LWLOCK_STATS */
1198
1199 /*
1200 * We can't wait if we haven't got a PGPROC. This should only occur
1201 * during bootstrap or shared memory initialization. Put an Assert here
1202 * to catch unsafe coding practices.
1203 */
1204 Assert(!(proc == NULL && IsUnderPostmaster));
1205
1206 /* Ensure we will have room to remember the lock */
1208 elog(ERROR, "too many LWLocks taken");
1209
1210 /*
1211 * Lock out cancel/die interrupts until we exit the code section protected
1212 * by the LWLock. This ensures that interrupts will not interfere with
1213 * manipulations of data structures in shared memory.
1214 */
1216
1217 /*
1218 * Loop here to try to acquire lock after each time we are signaled by
1219 * LWLockRelease.
1220 *
1221 * NOTE: it might seem better to have LWLockRelease actually grant us the
1222 * lock, rather than retrying and possibly having to go back to sleep. But
1223 * in practice that is no good because it means a process swap for every
1224 * lock acquisition when two or more processes are contending for the same
1225 * lock. Since LWLocks are normally used to protect not-very-long
1226 * sections of computation, a process needs to be able to acquire and
1227 * release the same lock many times during a single CPU time slice, even
1228 * in the presence of contention. The efficiency of being able to do that
1229 * outweighs the inefficiency of sometimes wasting a process dispatch
1230 * cycle because the lock is not free when a released waiter finally gets
1231 * to run. See pgsql-hackers archives for 29-Dec-01.
1232 */
1233 for (;;)
1234 {
1235 bool mustwait;
1236
1237 /*
1238 * Try to grab the lock the first time, we're not in the waitqueue
1239 * yet/anymore.
1240 */
1242
1243 if (!mustwait)
1244 {
1245 LOG_LWDEBUG("LWLockAcquire", lock, "immediately acquired lock");
1246 break; /* got the lock */
1247 }
1248
1249 /*
1250 * Ok, at this point we couldn't grab the lock on the first try. We
1251 * cannot simply queue ourselves to the end of the list and wait to be
1252 * woken up because by now the lock could long have been released.
1253 * Instead add us to the queue and try to grab the lock again. If we
1254 * succeed we need to revert the queuing and be happy, otherwise we
1255 * recheck the lock. If we still couldn't grab it, we know that the
1256 * other locker will see our queue entries when releasing since they
1257 * existed before we checked for the lock.
1258 */
1259
1260 /* add to the queue */
1261 LWLockQueueSelf(lock, mode);
1262
1263 /* we're now guaranteed to be woken up if necessary */
1265
1266 /* ok, grabbed the lock the second time round, need to undo queueing */
1267 if (!mustwait)
1268 {
1269 LOG_LWDEBUG("LWLockAcquire", lock, "acquired, undoing queue");
1270
1271 LWLockDequeueSelf(lock);
1272 break;
1273 }
1274
1275 /*
1276 * Wait until awakened.
1277 *
1278 * It is possible that we get awakened for a reason other than being
1279 * signaled by LWLockRelease. If so, loop back and wait again. Once
1280 * we've gotten the LWLock, re-increment the sema by the number of
1281 * additional signals received.
1282 */
1283 LOG_LWDEBUG("LWLockAcquire", lock, "waiting");
1284
1285#ifdef LWLOCK_STATS
1286 lwstats->block_count++;
1287#endif
1288
1292
1293 for (;;)
1294 {
1295 PGSemaphoreLock(proc->sem);
1296 if (proc->lwWaiting == LW_WS_NOT_WAITING)
1297 break;
1298 extraWaits++;
1299 }
1300
1301 /* Retrying, allow LWLockRelease to release waiters again. */
1303
1304#ifdef LOCK_DEBUG
1305 {
1306 /* not waiting anymore */
1308
1310 }
1311#endif
1312
1316
1317 LOG_LWDEBUG("LWLockAcquire", lock, "awakened");
1318
1319 /* Now loop back and try to acquire lock again. */
1320 result = false;
1321 }
1322
1325
1326 /* Add lock to list of locks held by this backend */
1329
1330 /*
1331 * Fix the process wait semaphore's count for any absorbed wakeups.
1332 */
1333 while (extraWaits-- > 0)
1334 PGSemaphoreUnlock(proc->sem);
1335
1336 return result;
1337}
1338
1339/*
1340 * LWLockConditionalAcquire - acquire a lightweight lock in the specified mode
1341 *
1342 * If the lock is not available, return false with no side-effects.
1343 *
1344 * If successful, cancel/die interrupts are held off until lock release.
1345 */
1346bool
1348{
1349 bool mustwait;
1350
1352
1353 PRINT_LWDEBUG("LWLockConditionalAcquire", lock, mode);
1354
1355 /* Ensure we will have room to remember the lock */
1357 elog(ERROR, "too many LWLocks taken");
1358
1359 /*
1360 * Lock out cancel/die interrupts until we exit the code section protected
1361 * by the LWLock. This ensures that interrupts will not interfere with
1362 * manipulations of data structures in shared memory.
1363 */
1365
1366 /* Check for the lock */
1368
1369 if (mustwait)
1370 {
1371 /* Failed to get lock, so release interrupt holdoff */
1373
1374 LOG_LWDEBUG("LWLockConditionalAcquire", lock, "failed");
1377 }
1378 else
1379 {
1380 /* Add lock to list of locks held by this backend */
1385 }
1386 return !mustwait;
1387}
1388
1389/*
1390 * LWLockAcquireOrWait - Acquire lock, or wait until it's free
1391 *
1392 * The semantics of this function are a bit funky. If the lock is currently
1393 * free, it is acquired in the given mode, and the function returns true. If
1394 * the lock isn't immediately free, the function waits until it is released
1395 * and returns false, but does not acquire the lock.
1396 *
1397 * This is currently used for WALWriteLock: when a backend flushes the WAL,
1398 * holding WALWriteLock, it can flush the commit records of many other
1399 * backends as a side-effect. Those other backends need to wait until the
1400 * flush finishes, but don't need to acquire the lock anymore. They can just
1401 * wake up, observe that their records have already been flushed, and return.
1402 */
1403bool
1405{
1406 PGPROC *proc = MyProc;
1407 bool mustwait;
1408 int extraWaits = 0;
1409#ifdef LWLOCK_STATS
1411
1413#endif
1414
1416
1417 PRINT_LWDEBUG("LWLockAcquireOrWait", lock, mode);
1418
1419 /* Ensure we will have room to remember the lock */
1421 elog(ERROR, "too many LWLocks taken");
1422
1423 /*
1424 * Lock out cancel/die interrupts until we exit the code section protected
1425 * by the LWLock. This ensures that interrupts will not interfere with
1426 * manipulations of data structures in shared memory.
1427 */
1429
1430 /*
1431 * NB: We're using nearly the same twice-in-a-row lock acquisition
1432 * protocol as LWLockAcquire(). Check its comments for details.
1433 */
1435
1436 if (mustwait)
1437 {
1439
1441
1442 if (mustwait)
1443 {
1444 /*
1445 * Wait until awakened. Like in LWLockAcquire, be prepared for
1446 * bogus wakeups.
1447 */
1448 LOG_LWDEBUG("LWLockAcquireOrWait", lock, "waiting");
1449
1450#ifdef LWLOCK_STATS
1451 lwstats->block_count++;
1452#endif
1453
1457
1458 for (;;)
1459 {
1460 PGSemaphoreLock(proc->sem);
1461 if (proc->lwWaiting == LW_WS_NOT_WAITING)
1462 break;
1463 extraWaits++;
1464 }
1465
1466#ifdef LOCK_DEBUG
1467 {
1468 /* not waiting anymore */
1470
1472 }
1473#endif
1477
1478 LOG_LWDEBUG("LWLockAcquireOrWait", lock, "awakened");
1479 }
1480 else
1481 {
1482 LOG_LWDEBUG("LWLockAcquireOrWait", lock, "acquired, undoing queue");
1483
1484 /*
1485 * Got lock in the second attempt, undo queueing. We need to treat
1486 * this as having successfully acquired the lock, otherwise we'd
1487 * not necessarily wake up people we've prevented from acquiring
1488 * the lock.
1489 */
1490 LWLockDequeueSelf(lock);
1491 }
1492 }
1493
1494 /*
1495 * Fix the process wait semaphore's count for any absorbed wakeups.
1496 */
1497 while (extraWaits-- > 0)
1498 PGSemaphoreUnlock(proc->sem);
1499
1500 if (mustwait)
1501 {
1502 /* Failed to get lock, so release interrupt holdoff */
1504 LOG_LWDEBUG("LWLockAcquireOrWait", lock, "failed");
1507 }
1508 else
1509 {
1510 LOG_LWDEBUG("LWLockAcquireOrWait", lock, "succeeded");
1511 /* Add lock to list of locks held by this backend */
1516 }
1517
1518 return !mustwait;
1519}
1520
1521/*
1522 * Does the lwlock in its current state need to wait for the variable value to
1523 * change?
1524 *
1525 * If we don't need to wait, and it's because the value of the variable has
1526 * changed, store the current value in newval.
1527 *
1528 * *result is set to true if the lock was free, and false otherwise.
1529 */
1530static bool
1532 uint64 *newval, bool *result)
1533{
1534 bool mustwait;
1535 uint64 value;
1536
1537 /*
1538 * Test first to see if it the slot is free right now.
1539 *
1540 * XXX: the unique caller of this routine, WaitXLogInsertionsToFinish()
1541 * via LWLockWaitForVar(), uses an implied barrier with a spinlock before
1542 * this, so we don't need a memory barrier here as far as the current
1543 * usage is concerned. But that might not be safe in general.
1544 */
1546
1547 if (!mustwait)
1548 {
1549 *result = true;
1550 return false;
1551 }
1552
1553 *result = false;
1554
1555 /*
1556 * Reading this value atomically is safe even on platforms where uint64
1557 * cannot be read without observing a torn value.
1558 */
1560
1561 if (value != oldval)
1562 {
1563 mustwait = false;
1564 *newval = value;
1565 }
1566 else
1567 {
1568 mustwait = true;
1569 }
1570
1571 return mustwait;
1572}
1573
1574/*
1575 * LWLockWaitForVar - Wait until lock is free, or a variable is updated.
1576 *
1577 * If the lock is held and *valptr equals oldval, waits until the lock is
1578 * either freed, or the lock holder updates *valptr by calling
1579 * LWLockUpdateVar. If the lock is free on exit (immediately or after
1580 * waiting), returns true. If the lock is still held, but *valptr no longer
1581 * matches oldval, returns false and sets *newval to the current value in
1582 * *valptr.
1583 *
1584 * Note: this function ignores shared lock holders; if the lock is held
1585 * in shared mode, returns 'true'.
1586 *
1587 * Be aware that LWLockConflictsWithVar() does not include a memory barrier,
1588 * hence the caller of this function may want to rely on an explicit barrier or
1589 * an implied barrier via spinlock or LWLock to avoid memory ordering issues.
1590 */
1591bool
1593 uint64 *newval)
1594{
1595 PGPROC *proc = MyProc;
1596 int extraWaits = 0;
1597 bool result = false;
1598#ifdef LWLOCK_STATS
1600
1602#endif
1603
1604 PRINT_LWDEBUG("LWLockWaitForVar", lock, LW_WAIT_UNTIL_FREE);
1605
1606 /*
1607 * Lock out cancel/die interrupts while we sleep on the lock. There is no
1608 * cleanup mechanism to remove us from the wait queue if we got
1609 * interrupted.
1610 */
1612
1613 /*
1614 * Loop here to check the lock's status after each time we are signaled.
1615 */
1616 for (;;)
1617 {
1618 bool mustwait;
1619
1621 &result);
1622
1623 if (!mustwait)
1624 break; /* the lock was free or value didn't match */
1625
1626 /*
1627 * Add myself to wait queue. Note that this is racy, somebody else
1628 * could wakeup before we're finished queuing. NB: We're using nearly
1629 * the same twice-in-a-row lock acquisition protocol as
1630 * LWLockAcquire(). Check its comments for details. The only
1631 * difference is that we also have to check the variable's values when
1632 * checking the state of the lock.
1633 */
1635
1636 /*
1637 * Clear LW_FLAG_WAKE_IN_PROGRESS flag, to make sure we get woken up
1638 * as soon as the lock is released.
1639 */
1641
1642 /*
1643 * We're now guaranteed to be woken up if necessary. Recheck the lock
1644 * and variables state.
1645 */
1647 &result);
1648
1649 /* Ok, no conflict after we queued ourselves. Undo queueing. */
1650 if (!mustwait)
1651 {
1652 LOG_LWDEBUG("LWLockWaitForVar", lock, "free, undoing queue");
1653
1654 LWLockDequeueSelf(lock);
1655 break;
1656 }
1657
1658 /*
1659 * Wait until awakened.
1660 *
1661 * It is possible that we get awakened for a reason other than being
1662 * signaled by LWLockRelease. If so, loop back and wait again. Once
1663 * we've gotten the LWLock, re-increment the sema by the number of
1664 * additional signals received.
1665 */
1666 LOG_LWDEBUG("LWLockWaitForVar", lock, "waiting");
1667
1668#ifdef LWLOCK_STATS
1669 lwstats->block_count++;
1670#endif
1671
1675
1676 for (;;)
1677 {
1678 PGSemaphoreLock(proc->sem);
1679 if (proc->lwWaiting == LW_WS_NOT_WAITING)
1680 break;
1681 extraWaits++;
1682 }
1683
1684#ifdef LOCK_DEBUG
1685 {
1686 /* not waiting anymore */
1688
1690 }
1691#endif
1692
1696
1697 LOG_LWDEBUG("LWLockWaitForVar", lock, "awakened");
1698
1699 /* Now loop back and check the status of the lock again. */
1700 }
1701
1702 /*
1703 * Fix the process wait semaphore's count for any absorbed wakeups.
1704 */
1705 while (extraWaits-- > 0)
1706 PGSemaphoreUnlock(proc->sem);
1707
1708 /*
1709 * Now okay to allow cancel/die interrupts.
1710 */
1712
1713 return result;
1714}
1715
1716
1717/*
1718 * LWLockUpdateVar - Update a variable and wake up waiters atomically
1719 *
1720 * Sets *valptr to 'val', and wakes up all processes waiting for us with
1721 * LWLockWaitForVar(). It first sets the value atomically and then wakes up
1722 * waiting processes so that any process calling LWLockWaitForVar() on the same
1723 * lock is guaranteed to see the new value, and act accordingly.
1724 *
1725 * The caller must be holding the lock in exclusive mode.
1726 */
1727void
1729{
1732
1733 PRINT_LWDEBUG("LWLockUpdateVar", lock, LW_EXCLUSIVE);
1734
1735 /*
1736 * Note that pg_atomic_exchange_u64 is a full barrier, so we're guaranteed
1737 * that the variable is updated before waking up waiters.
1738 */
1740
1742
1743 LWLockWaitListLock(lock);
1744
1746
1747 /*
1748 * See if there are any LW_WAIT_UNTIL_FREE waiters that need to be woken
1749 * up. They are always in the front of the queue.
1750 */
1751 proclist_foreach_modify(iter, &lock->waiters, lwWaitLink)
1752 {
1753 PGPROC *waiter = GetPGProcByNumber(iter.cur);
1754
1755 if (waiter->lwWaitMode != LW_WAIT_UNTIL_FREE)
1756 break;
1757
1758 proclist_delete(&lock->waiters, iter.cur, lwWaitLink);
1759 proclist_push_tail(&wakeup, iter.cur, lwWaitLink);
1760
1761 /* see LWLockWakeup() */
1762 Assert(waiter->lwWaiting == LW_WS_WAITING);
1764 }
1765
1766 /* We are done updating shared state of the lock itself. */
1768
1769 /*
1770 * Awaken any waiters I removed from the queue.
1771 */
1772 proclist_foreach_modify(iter, &wakeup, lwWaitLink)
1773 {
1774 PGPROC *waiter = GetPGProcByNumber(iter.cur);
1775
1776 proclist_delete(&wakeup, iter.cur, lwWaitLink);
1777 /* check comment in LWLockWakeup() about this barrier */
1779 waiter->lwWaiting = LW_WS_NOT_WAITING;
1780 PGSemaphoreUnlock(waiter->sem);
1781 }
1782}
1783
1784
1785/*
1786 * LWLockRelease - release a previously acquired lock
1787 *
1788 * NB: This will leave lock->owner pointing to the current backend (if
1789 * LOCK_DEBUG is set). This is somewhat intentional, as it makes it easier to
1790 * debug cases of missing wakeups during lock release.
1791 */
1792void
1794{
1797 bool check_waiters;
1798 int i;
1799
1800 /*
1801 * Remove lock from list of locks held. Usually, but not always, it will
1802 * be the latest-acquired lock; so search array backwards.
1803 */
1804 for (i = num_held_lwlocks; --i >= 0;)
1805 if (lock == held_lwlocks[i].lock)
1806 break;
1807
1808 if (i < 0)
1809 elog(ERROR, "lock %s is not held", T_NAME(lock));
1810
1812
1814 for (; i < num_held_lwlocks; i++)
1815 held_lwlocks[i] = held_lwlocks[i + 1];
1816
1817 PRINT_LWDEBUG("LWLockRelease", lock, mode);
1818
1819 /*
1820 * Release my hold on lock, after that it can immediately be acquired by
1821 * others, even if we still have to wakeup other waiters.
1822 */
1823 if (mode == LW_EXCLUSIVE)
1825 else
1827
1828 /* nobody else can have that kind of lock */
1830
1833
1834 /*
1835 * Check if we're still waiting for backends to get scheduled, if so,
1836 * don't wake them up again.
1837 */
1838 if ((oldstate & LW_FLAG_HAS_WAITERS) &&
1840 (oldstate & LW_LOCK_MASK) == 0)
1841 check_waiters = true;
1842 else
1843 check_waiters = false;
1844
1845 /*
1846 * As waking up waiters requires the spinlock to be acquired, only do so
1847 * if necessary.
1848 */
1849 if (check_waiters)
1850 {
1851 /* XXX: remove before commit? */
1852 LOG_LWDEBUG("LWLockRelease", lock, "releasing waiters");
1853 LWLockWakeup(lock);
1854 }
1855
1856 /*
1857 * Now okay to allow cancel/die interrupts.
1858 */
1860}
1861
1862/*
1863 * LWLockReleaseClearVar - release a previously acquired lock, reset variable
1864 */
1865void
1867{
1868 /*
1869 * Note that pg_atomic_exchange_u64 is a full barrier, so we're guaranteed
1870 * that the variable is updated before releasing the lock.
1871 */
1873
1874 LWLockRelease(lock);
1875}
1876
1877
1878/*
1879 * LWLockReleaseAll - release all currently-held locks
1880 *
1881 * Used to clean up after ereport(ERROR). An important difference between this
1882 * function and retail LWLockRelease calls is that InterruptHoldoffCount is
1883 * unchanged by this operation. This is necessary since InterruptHoldoffCount
1884 * has been set to an appropriate level earlier in error recovery. We could
1885 * decrement it below zero if we allow it to drop for each released lock!
1886 *
1887 * Note that this function must be safe to call even before the LWLock
1888 * subsystem has been initialized (e.g., during early startup failures).
1889 * In that case, num_held_lwlocks will be 0 and we do nothing.
1890 */
1891void
1893{
1894 while (num_held_lwlocks > 0)
1895 {
1896 HOLD_INTERRUPTS(); /* match the upcoming RESUME_INTERRUPTS */
1897
1899 }
1900
1902}
1903
1904
1905/*
1906 * LWLockHeldByMe - test whether my process holds a lock in any mode
1907 *
1908 * This is meant as debug support only.
1909 */
1910bool
1912{
1913 int i;
1914
1915 for (i = 0; i < num_held_lwlocks; i++)
1916 {
1917 if (held_lwlocks[i].lock == lock)
1918 return true;
1919 }
1920 return false;
1921}
1922
1923/*
1924 * LWLockAnyHeldByMe - test whether my process holds any of an array of locks
1925 *
1926 * This is meant as debug support only.
1927 */
1928bool
1929LWLockAnyHeldByMe(LWLock *lock, int nlocks, size_t stride)
1930{
1931 char *held_lock_addr;
1932 char *begin;
1933 char *end;
1934 int i;
1935
1936 begin = (char *) lock;
1937 end = begin + nlocks * stride;
1938 for (i = 0; i < num_held_lwlocks; i++)
1939 {
1940 held_lock_addr = (char *) held_lwlocks[i].lock;
1941 if (held_lock_addr >= begin &&
1942 held_lock_addr < end &&
1943 (held_lock_addr - begin) % stride == 0)
1944 return true;
1945 }
1946 return false;
1947}
1948
1949/*
1950 * LWLockHeldByMeInMode - test whether my process holds a lock in given mode
1951 *
1952 * This is meant as debug support only.
1953 */
1954bool
1956{
1957 int i;
1958
1959 for (i = 0; i < num_held_lwlocks; i++)
1960 {
1961 if (held_lwlocks[i].lock == lock && held_lwlocks[i].mode == mode)
1962 return true;
1963 }
1964 return false;
1965}
static uint32 pg_atomic_fetch_and_u32(volatile pg_atomic_uint32 *ptr, uint32 and_)
Definition atomics.h:396
static bool pg_atomic_compare_exchange_u32(volatile pg_atomic_uint32 *ptr, uint32 *expected, uint32 newval)
Definition atomics.h:349
static uint32 pg_atomic_fetch_or_u32(volatile pg_atomic_uint32 *ptr, uint32 or_)
Definition atomics.h:410
static uint32 pg_atomic_sub_fetch_u32(volatile pg_atomic_uint32 *ptr, int32 sub_)
Definition atomics.h:439
static uint32 pg_atomic_fetch_sub_u32(volatile pg_atomic_uint32 *ptr, int32 sub_)
Definition atomics.h:381
static void pg_atomic_init_u32(volatile pg_atomic_uint32 *ptr, uint32 val)
Definition atomics.h:219
#define pg_write_barrier()
Definition atomics.h:155
static uint32 pg_atomic_fetch_add_u32(volatile pg_atomic_uint32 *ptr, int32 add_)
Definition atomics.h:366
static uint32 pg_atomic_read_u32(volatile pg_atomic_uint32 *ptr)
Definition atomics.h:237
static uint64 pg_atomic_read_u64(volatile pg_atomic_uint64 *ptr)
Definition atomics.h:467
static uint64 pg_atomic_exchange_u64(volatile pg_atomic_uint64 *ptr, uint64 newval)
Definition atomics.h:513
#define likely(x)
Definition c.h:411
#define MAXALIGN(LEN)
Definition c.h:826
#define PG_USED_FOR_ASSERTS_ONLY
Definition c.h:223
#define Assert(condition)
Definition c.h:873
uint64_t uint64
Definition c.h:547
uint16_t uint16
Definition c.h:545
#define pg_unreachable()
Definition c.h:341
uint32_t uint32
Definition c.h:546
#define lengthof(array)
Definition c.h:803
#define MemSet(start, val, len)
Definition c.h:1013
#define StaticAssertDecl(condition, errmessage)
Definition c.h:942
size_t Size
Definition c.h:619
#define fprintf(file, fmt, msg)
Definition cubescan.l:21
void * hash_search(HTAB *hashp, const void *keyPtr, HASHACTION action, bool *foundPtr)
Definition dynahash.c:952
HTAB * hash_create(const char *tabname, int64 nelem, const HASHCTL *info, int flags)
Definition dynahash.c:358
void * hash_seq_search(HASH_SEQ_STATUS *status)
Definition dynahash.c:1415
void hash_seq_init(HASH_SEQ_STATUS *status, HTAB *hashp)
Definition dynahash.c:1380
int errmsg_internal(const char *fmt,...)
Definition elog.c:1170
int errhidestmt(bool hide_stmt)
Definition elog.c:1445
int errdetail(const char *fmt,...)
Definition elog.c:1216
int errhidecontext(bool hide_ctx)
Definition elog.c:1464
int errcode(int sqlerrcode)
Definition elog.c:863
int errmsg(const char *fmt,...)
Definition elog.c:1080
#define LOG
Definition elog.h:31
#define FATAL
Definition elog.h:41
#define PANIC
Definition elog.h:42
#define ERROR
Definition elog.h:39
#define elog(elevel,...)
Definition elog.h:226
#define ereport(elevel,...)
Definition elog.h:150
int MyProcPid
Definition globals.c:47
ProcNumber MyProcNumber
Definition globals.c:90
bool IsUnderPostmaster
Definition globals.c:120
#define newval
@ HASH_ENTER
Definition hsearch.h:114
#define HASH_CONTEXT
Definition hsearch.h:102
#define HASH_ELEM
Definition hsearch.h:95
#define HASH_BLOBS
Definition hsearch.h:97
long val
Definition informix.c:689
static struct @172 value
void on_shmem_exit(pg_on_exit_callback function, Datum arg)
Definition ipc.c:372
int j
Definition isn.c:78
int i
Definition isn.c:77
#define LW_VAL_EXCLUSIVE
Definition lwlock.c:101
void LWLockUpdateVar(LWLock *lock, pg_atomic_uint64 *valptr, uint64 val)
Definition lwlock.c:1728
static void LWLockWakeup(LWLock *lock)
Definition lwlock.c:930
#define LW_FLAG_LOCKED
Definition lwlock.c:96
bool LWLockHeldByMe(LWLock *lock)
Definition lwlock.c:1911
static int LocalLWLockCounter
Definition lwlock.c:202
static LWLockHandle held_lwlocks[MAX_SIMUL_LWLOCKS]
Definition lwlock.c:178
void LWLockReleaseClearVar(LWLock *lock, pg_atomic_uint64 *valptr, uint64 val)
Definition lwlock.c:1866
bool LWLockAcquire(LWLock *lock, LWLockMode mode)
Definition lwlock.c:1176
void CreateLWLocks(void)
Definition lwlock.c:441
int LWLockNewTrancheId(const char *name)
Definition lwlock.c:596
#define LW_VAL_SHARED
Definition lwlock.c:102
static bool LWLockAttemptLock(LWLock *lock, LWLockMode mode)
Definition lwlock.c:790
static void LWLockWaitListLock(LWLock *lock)
Definition lwlock.c:861
LWLockPadded * GetNamedLWLockTranche(const char *tranche_name)
Definition lwlock.c:566
bool LWLockHeldByMeInMode(LWLock *lock, LWLockMode mode)
Definition lwlock.c:1955
static void LWLockReportWaitEnd(void)
Definition lwlock.c:728
char ** LWLockTrancheNames
Definition lwlock.c:154
bool LWLockWaitForVar(LWLock *lock, pg_atomic_uint64 *valptr, uint64 oldval, uint64 *newval)
Definition lwlock.c:1592
static const char * GetLWTrancheName(uint16 trancheId)
Definition lwlock.c:737
#define LW_LOCK_MASK
Definition lwlock.c:106
int NamedLWLockTrancheRequests
Definition lwlock.c:192
void RequestNamedLWLockTranche(const char *tranche_name, int num_lwlocks)
Definition lwlock.c:649
#define LW_FLAG_MASK
Definition lwlock.c:98
#define LW_FLAG_HAS_WAITERS
Definition lwlock.c:94
#define MAX_SIMUL_LWLOCKS
Definition lwlock.c:168
static int NumLWLocksForNamedTranches(void)
Definition lwlock.c:382
void LWLockRelease(LWLock *lock)
Definition lwlock.c:1793
static NamedLWLockTrancheRequest * LocalNamedLWLockTrancheRequestArray
Definition lwlock.c:196
#define T_NAME(lock)
Definition lwlock.c:211
static int num_held_lwlocks
Definition lwlock.c:177
void LWLockReleaseAll(void)
Definition lwlock.c:1892
static void InitializeLWLocks(void)
Definition lwlock.c:498
void LWLockInitialize(LWLock *lock, int tranche_id)
Definition lwlock.c:698
static const char *const BuiltinTrancheNames[]
Definition lwlock.c:135
NamedLWLockTrancheRequest * NamedLWLockTrancheRequestArray
Definition lwlock.c:193
static void LWLockWaitListUnlock(LWLock *lock)
Definition lwlock.c:917
#define LOG_LWDEBUG(a, b, c)
Definition lwlock.c:276
bool LWLockConditionalAcquire(LWLock *lock, LWLockMode mode)
Definition lwlock.c:1347
bool LWLockAcquireOrWait(LWLock *lock, LWLockMode mode)
Definition lwlock.c:1404
static void LWLockQueueSelf(LWLock *lock, LWLockMode mode)
Definition lwlock.c:1044
#define PRINT_LWDEBUG(a, b, c)
Definition lwlock.c:275
static void LWLockReportWaitStart(LWLock *lock)
Definition lwlock.c:719
LWLockPadded * MainLWLockArray
Definition lwlock.c:161
#define LW_FLAG_WAKE_IN_PROGRESS
Definition lwlock.c:95
const char * GetLWLockIdentifier(uint32 classId, uint16 eventId)
Definition lwlock.c:773
static void LWLockDequeueSelf(LWLock *lock)
Definition lwlock.c:1087
int * LWLockCounter
Definition lwlock.c:199
Size LWLockShmemSize(void)
Definition lwlock.c:397
bool LWLockAnyHeldByMe(LWLock *lock, int nlocks, size_t stride)
Definition lwlock.c:1929
#define MAX_NAMED_TRANCHES
Definition lwlock.c:204
#define LW_SHARED_MASK
Definition lwlock.c:105
static bool LWLockConflictsWithVar(LWLock *lock, pg_atomic_uint64 *valptr, uint64 oldval, uint64 *newval, bool *result)
Definition lwlock.c:1531
void InitLWLockAccess(void)
Definition lwlock.c:550
@ LW_WS_NOT_WAITING
Definition lwlock.h:30
@ LW_WS_WAITING
Definition lwlock.h:31
@ LW_WS_PENDING_WAKEUP
Definition lwlock.h:32
#define LWLOCK_PADDED_SIZE
Definition lwlock.h:62
#define BUFFER_MAPPING_LWLOCK_OFFSET
Definition lwlock.h:102
#define NUM_LOCK_PARTITIONS
Definition lwlock.h:95
@ LWTRANCHE_FIRST_USER_DEFINED
Definition lwlock.h:182
#define LOCK_MANAGER_LWLOCK_OFFSET
Definition lwlock.h:103
#define NUM_BUFFER_PARTITIONS
Definition lwlock.h:91
#define PREDICATELOCK_MANAGER_LWLOCK_OFFSET
Definition lwlock.h:105
#define NUM_FIXED_LWLOCKS
Definition lwlock.h:107
LWLockMode
Definition lwlock.h:111
@ LW_SHARED
Definition lwlock.h:113
@ LW_WAIT_UNTIL_FREE
Definition lwlock.h:114
@ LW_EXCLUSIVE
Definition lwlock.h:112
#define NUM_PREDICATELOCK_PARTITIONS
Definition lwlock.h:99
void * MemoryContextAlloc(MemoryContext context, Size size)
Definition mcxt.c:1232
void * repalloc(void *pointer, Size size)
Definition mcxt.c:1632
MemoryContext TopMemoryContext
Definition mcxt.c:166
void MemoryContextDelete(MemoryContext context)
Definition mcxt.c:472
void MemoryContextAllowInCriticalSection(MemoryContext context, bool allow)
Definition mcxt.c:743
#define AllocSetContextCreate
Definition memutils.h:129
#define ALLOCSET_DEFAULT_SIZES
Definition memutils.h:160
#define RESUME_INTERRUPTS()
Definition miscadmin.h:136
#define HOLD_INTERRUPTS()
Definition miscadmin.h:134
bool process_shmem_requests_in_progress
Definition miscinit.c:1790
void * arg
static uint32 pg_nextpower2_32(uint32 num)
static PgChecksumMode mode
#define NAMEDATALEN
size_t strlcpy(char *dst, const char *src, size_t siz)
Definition strlcpy.c:45
void PGSemaphoreUnlock(PGSemaphore sema)
Definition posix_sema.c:335
void PGSemaphoreLock(PGSemaphore sema)
Definition posix_sema.c:315
uint64_t Datum
Definition postgres.h:70
static int fb(int x)
#define GetPGProcByNumber(n)
Definition proc.h:446
#define proclist_delete(list, procno, link_member)
Definition proclist.h:187
static void proclist_init(proclist_head *list)
Definition proclist.h:29
#define proclist_push_tail(list, procno, link_member)
Definition proclist.h:191
#define proclist_push_head(list, procno, link_member)
Definition proclist.h:189
#define proclist_foreach_modify(iter, lhead, link_member)
Definition proclist.h:206
static bool proclist_is_empty(const proclist_head *list)
Definition proclist.h:38
#define MAX_BACKENDS
Definition procnumber.h:39
tree ctl
Definition radixtree.h:1838
void perform_spin_delay(SpinDelayStatus *status)
Definition s_lock.c:126
void finish_spin_delay(SpinDelayStatus *status)
Definition s_lock.c:186
#define init_local_spin_delay(status)
Definition s_lock.h:753
Size add_size(Size s1, Size s2)
Definition shmem.c:495
Size mul_size(Size s1, Size s2)
Definition shmem.c:510
void * ShmemAlloc(Size size)
Definition shmem.c:154
slock_t * ShmemLock
Definition shmem.c:90
#define SpinLockRelease(lock)
Definition spin.h:61
#define SpinLockAcquire(lock)
Definition spin.h:59
PGPROC * MyProc
Definition proc.c:67
LWLockMode mode
Definition lwlock.c:174
LWLock * lock
Definition lwlock.c:173
pg_atomic_uint32 state
Definition lwlock.h:44
uint16 tranche
Definition lwlock.h:43
proclist_head waiters
Definition lwlock.h:45
char tranche_name[NAMEDATALEN]
Definition lwlock.c:183
Definition proc.h:179
uint8 lwWaitMode
Definition proc.h:247
PGSemaphore sem
Definition proc.h:183
uint8 lwWaiting
Definition proc.h:246
LWLock lock
Definition lwlock.h:70
#define PG_WAIT_LWLOCK
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition wait_event.h:69
static void pgstat_report_wait_end(void)
Definition wait_event.h:85
const char * name
static TimestampTz wakeup[NUM_WALRCV_WAKEUPS]