PostgreSQL Source Code git master
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
waiteventset.c File Reference
#include "postgres.h"
#include <fcntl.h>
#include <limits.h>
#include <signal.h>
#include <unistd.h>
#include <poll.h>
#include "libpq/pqsignal.h"
#include "miscadmin.h"
#include "pgstat.h"
#include "portability/instr_time.h"
#include "postmaster/postmaster.h"
#include "storage/fd.h"
#include "storage/ipc.h"
#include "storage/pmsignal.h"
#include "storage/latch.h"
#include "storage/waiteventset.h"
#include "utils/memutils.h"
#include "utils/resowner.h"
Include dependency graph for waiteventset.c:

Go to the source code of this file.

Data Structures

struct  WaitEventSet
 

Macros

#define WAIT_USE_POLL
 
#define WAIT_USE_SELF_PIPE
 

Functions

static void latch_sigurg_handler (SIGNAL_ARGS)
 
static void sendSelfPipeByte (void)
 
static void drain (void)
 
static void WaitEventAdjustPoll (WaitEventSet *set, WaitEvent *event)
 
static int WaitEventSetWaitBlock (WaitEventSet *set, int cur_timeout, WaitEvent *occurred_events, int nevents)
 
static void ResOwnerReleaseWaitEventSet (Datum res)
 
static void ResourceOwnerRememberWaitEventSet (ResourceOwner owner, WaitEventSet *set)
 
static void ResourceOwnerForgetWaitEventSet (ResourceOwner owner, WaitEventSet *set)
 
void InitializeWaitEventSupport (void)
 
WaitEventSet * CreateWaitEventSet (ResourceOwner resowner, int nevents)
 
void FreeWaitEventSet (WaitEventSet *set)
 
void FreeWaitEventSetAfterFork (WaitEventSet *set)
 
int AddWaitEventToSet (WaitEventSet *set, uint32 events, pgsocket fd, Latch *latch, void *user_data)
 
void ModifyWaitEvent (WaitEventSet *set, int pos, uint32 events, Latch *latch)
 
int WaitEventSetWait (WaitEventSet *set, long timeout, WaitEvent *occurred_events, int nevents, uint32 wait_event_info)
 
bool WaitEventSetCanReportClosed (void)
 
int GetNumRegisteredWaitEvents (WaitEventSet *set)
 
void WakeupMyProc (void)
 
void WakeupOtherProc (int pid)
 

Variables

static volatile sig_atomic_t waiting = false
 
static int selfpipe_readfd = -1
 
static int selfpipe_writefd = -1
 
static int selfpipe_owner_pid = 0
 
static const ResourceOwnerDesc wait_event_set_resowner_desc
 

Macro Definition Documentation

◆ WAIT_USE_POLL

#define WAIT_USE_POLL

Definition at line 94 of file waiteventset.c.

◆ WAIT_USE_SELF_PIPE

#define WAIT_USE_SELF_PIPE

Definition at line 111 of file waiteventset.c.

Function Documentation

◆ AddWaitEventToSet()

int AddWaitEventToSet ( WaitEventSet * set,
uint32  events,
pgsocket  fd,
Latch * latch,
void *  user_data 
)

Definition at line 569 of file waiteventset.c.

571{
572 WaitEvent *event;
573
574 /* not enough space */
575 Assert(set->nevents < set->nevents_space);
576
577 if (events == WL_EXIT_ON_PM_DEATH)
578 {
579 events = WL_POSTMASTER_DEATH;
580 set->exit_on_postmaster_death = true;
581 }
582
583 if (latch)
584 {
585 if (latch->owner_pid != MyProcPid)
586 elog(ERROR, "cannot wait on a latch owned by another process");
587 if (set->latch)
588 elog(ERROR, "cannot wait on more than one latch");
589 if ((events & WL_LATCH_SET) != WL_LATCH_SET)
590 elog(ERROR, "latch events only support being set");
591 }
592 else
593 {
594 if (events & WL_LATCH_SET)
595 elog(ERROR, "cannot wait on latch without a specified latch");
596 }
597
598 /* waiting for socket readiness without a socket indicates a bug */
599 if (fd == PGINVALID_SOCKET && (events & WL_SOCKET_MASK))
600 elog(ERROR, "cannot wait on socket event without a socket");
601
602 event = &set->events[set->nevents];
603 event->pos = set->nevents++;
604 event->fd = fd;
605 event->events = events;
606 event->user_data = user_data;
607#ifdef WIN32
608 event->reset = false;
609#endif
610
611 if (events == WL_LATCH_SET)
612 {
613 set->latch = latch;
614 set->latch_pos = event->pos;
615#if defined(WAIT_USE_SELF_PIPE)
616 event->fd = selfpipe_readfd;
617#elif defined(WAIT_USE_SIGNALFD)
618 event->fd = signal_fd;
619#else
620 event->fd = PGINVALID_SOCKET;
621#ifdef WAIT_USE_EPOLL
622 return event->pos;
623#endif
624#endif
625 }
626 else if (events == WL_POSTMASTER_DEATH)
627 {
628#ifndef WIN32
629 event->fd = postmaster_alive_fds[POSTMASTER_FD_WATCH];
630#endif
631 }
632
633 /* perform wait primitive specific initialization, if needed */
634#if defined(WAIT_USE_EPOLL)
635 WaitEventAdjustEpoll(set, event, EPOLL_CTL_ADD);
636#elif defined(WAIT_USE_KQUEUE)
637 WaitEventAdjustKqueue(set, event, 0);
638#elif defined(WAIT_USE_POLL)
639 WaitEventAdjustPoll(set, event);
640#elif defined(WAIT_USE_WIN32)
641 WaitEventAdjustWin32(set, event);
642#endif
643
644 return event->pos;
645}
#define ERROR
Definition: elog.h:39
#define elog(elevel,...)
Definition: elog.h:225
int MyProcPid
Definition: globals.c:46
Assert(PointerIsAligned(start, uint64))
#define PGINVALID_SOCKET
Definition: port.h:31
int postmaster_alive_fds[2]
Definition: postmaster.c:482
#define POSTMASTER_FD_WATCH
Definition: postmaster.h:83
static int fd(const char *x, int i)
Definition: preproc-init.c:105
int owner_pid
Definition: latch.h:118
Latch * latch
Definition: waiteventset.c:135
bool exit_on_postmaster_death
Definition: waiteventset.c:143
WaitEvent * events
Definition: waiteventset.c:127
static int selfpipe_readfd
Definition: waiteventset.c:180
static void WaitEventAdjustPoll(WaitEventSet *set, WaitEvent *event)
Definition: waiteventset.c:789
#define WL_EXIT_ON_PM_DEATH
Definition: waiteventset.h:39
#define WL_LATCH_SET
Definition: waiteventset.h:34
#define WL_POSTMASTER_DEATH
Definition: waiteventset.h:38
#define WL_SOCKET_MASK
Definition: waiteventset.h:53

References Assert(), elog, ERROR, WaitEventSet::events, WaitEventSet::exit_on_postmaster_death, fd(), WaitEventSet::latch, WaitEventSet::latch_pos, MyProcPid, WaitEventSet::nevents, WaitEventSet::nevents_space, Latch::owner_pid, PGINVALID_SOCKET, WaitEvent::pos, postmaster_alive_fds, POSTMASTER_FD_WATCH, selfpipe_readfd, WaitEventAdjustPoll(), WL_EXIT_ON_PM_DEATH, WL_LATCH_SET, WL_POSTMASTER_DEATH, and WL_SOCKET_MASK.

Referenced by ConfigurePostmasterWaitSet(), ExecAppendAsyncEventWait(), InitializeLatchWaitSet(), postgresForeignAsyncConfigureWait(), pq_init(), SysLoggerMain(), and WaitLatchOrSocket().

◆ CreateWaitEventSet()

WaitEventSet * CreateWaitEventSet ( ResourceOwner  resowner,
int  nevents 
)

Definition at line 363 of file waiteventset.c.

364{
365 WaitEventSet *set;
366 char *data;
367 Size sz = 0;
368
369 /*
370 * Use MAXALIGN size/alignment to guarantee that later uses of memory are
371 * aligned correctly. E.g. epoll_event might need 8 byte alignment on some
372 * platforms, but earlier allocations like WaitEventSet and WaitEvent
373 * might not be sized to guarantee that when purely using sizeof().
374 */
375 sz += MAXALIGN(sizeof(WaitEventSet));
376 sz += MAXALIGN(sizeof(WaitEvent) * nevents);
377
378#if defined(WAIT_USE_EPOLL)
379 sz += MAXALIGN(sizeof(struct epoll_event) * nevents);
380#elif defined(WAIT_USE_KQUEUE)
381 sz += MAXALIGN(sizeof(struct kevent) * nevents);
382#elif defined(WAIT_USE_POLL)
383 sz += MAXALIGN(sizeof(struct pollfd) * nevents);
384#elif defined(WAIT_USE_WIN32)
385 /* need space for the pgwin32_signal_event */
386 sz += MAXALIGN(sizeof(HANDLE) * (nevents + 1));
387#endif
388
389 if (resowner != NULL)
390 ResourceOwnerEnlarge(resowner);
391
392 data = (char *) MemoryContextAllocZero(TopMemoryContext, sz);
393
394 set = (WaitEventSet *) data;
395 data += MAXALIGN(sizeof(WaitEventSet));
396
397 set->events = (WaitEvent *) data;
398 data += MAXALIGN(sizeof(WaitEvent) * nevents);
399
400#if defined(WAIT_USE_EPOLL)
401 set->epoll_ret_events = (struct epoll_event *) data;
402 data += MAXALIGN(sizeof(struct epoll_event) * nevents);
403#elif defined(WAIT_USE_KQUEUE)
404 set->kqueue_ret_events = (struct kevent *) data;
405 data += MAXALIGN(sizeof(struct kevent) * nevents);
406#elif defined(WAIT_USE_POLL)
407 set->pollfds = (struct pollfd *) data;
408 data += MAXALIGN(sizeof(struct pollfd) * nevents);
409#elif defined(WAIT_USE_WIN32)
410 set->handles = (HANDLE) data;
411 data += MAXALIGN(sizeof(HANDLE) * nevents);
412#endif
413
414 set->latch = NULL;
415 set->nevents_space = nevents;
416 set->exit_on_postmaster_death = false;
417
418 if (resowner != NULL)
419 {
420 ResourceOwnerRememberWaitEventSet(resowner, set);
421 set->owner = resowner;
422 }
423
424#if defined(WAIT_USE_EPOLL)
425 if (!AcquireExternalFD())
426 elog(ERROR, "AcquireExternalFD, for epoll_create1, failed: %m");
427 set->epoll_fd = epoll_create1(EPOLL_CLOEXEC);
428 if (set->epoll_fd < 0)
429 {
430 ReleaseExternalFD();
431 elog(ERROR, "epoll_create1 failed: %m");
432 }
433#elif defined(WAIT_USE_KQUEUE)
434 if (!AcquireExternalFD())
435 elog(ERROR, "AcquireExternalFD, for kqueue, failed: %m");
436 set->kqueue_fd = kqueue();
437 if (set->kqueue_fd < 0)
438 {
439 ReleaseExternalFD();
440 elog(ERROR, "kqueue failed: %m");
441 }
442 if (fcntl(set->kqueue_fd, F_SETFD, FD_CLOEXEC) == -1)
443 {
444 int save_errno = errno;
445
446 close(set->kqueue_fd);
447 ReleaseExternalFD();
448 errno = save_errno;
449 elog(ERROR, "fcntl(F_SETFD) failed on kqueue descriptor: %m");
450 }
451 set->report_postmaster_not_running = false;
452#elif defined(WAIT_USE_WIN32)
453
454 /*
455 * To handle signals while waiting, we need to add a win32 specific event.
456 * We accounted for the additional event at the top of this routine. See
457 * port/win32/signal.c for more details.
458 *
459 * Note: pgwin32_signal_event should be first to ensure that it will be
460 * reported when multiple events are set. We want to guarantee that
461 * pending signals are serviced.
462 */
463 set->handles[0] = pgwin32_signal_event;
464 StaticAssertStmt(WSA_INVALID_EVENT == NULL, "");
465#endif
466
467 return set;
468}
#define MAXALIGN(LEN)
Definition: c.h:782
#define StaticAssertStmt(condition, errmessage)
Definition: c.h:909
size_t Size
Definition: c.h:576
void ReleaseExternalFD(void)
Definition: fd.c:1240
bool AcquireExternalFD(void)
Definition: fd.c:1187
#define close(a)
Definition: win32.h:12
void * MemoryContextAllocZero(MemoryContext context, Size size)
Definition: mcxt.c:1215
MemoryContext TopMemoryContext
Definition: mcxt.c:149
const void * data
void ResourceOwnerEnlarge(ResourceOwner owner)
Definition: resowner.c:452
HANDLE pgwin32_signal_event
Definition: signal.c:27
ResourceOwner owner
Definition: waiteventset.c:118
struct pollfd * pollfds
Definition: waiteventset.c:156
static void ResourceOwnerRememberWaitEventSet(ResourceOwner owner, WaitEventSet *set)
Definition: waiteventset.c:222

References AcquireExternalFD(), close, data, elog, ERROR, WaitEventSet::events, WaitEventSet::exit_on_postmaster_death, WaitEventSet::latch, MAXALIGN, MemoryContextAllocZero(), WaitEventSet::nevents_space, WaitEventSet::owner, pgwin32_signal_event, WaitEventSet::pollfds, ReleaseExternalFD(), ResourceOwnerEnlarge(), ResourceOwnerRememberWaitEventSet(), StaticAssertStmt, and TopMemoryContext.

Referenced by ConfigurePostmasterWaitSet(), ExecAppendAsyncEventWait(), InitializeLatchWaitSet(), pq_init(), SysLoggerMain(), and WaitLatchOrSocket().

◆ drain()

static void drain ( void  )
static

Definition at line 1944 of file waiteventset.c.

1945{
1946 char buf[1024];
1947 int rc;
1948 int fd;
1949
1950#ifdef WAIT_USE_SELF_PIPE
1951 fd = selfpipe_readfd;
1952#else
1953 fd = signal_fd;
1954#endif
1955
1956 for (;;)
1957 {
1958 rc = read(fd, buf, sizeof(buf));
1959 if (rc < 0)
1960 {
1961 if (errno == EAGAIN || errno == EWOULDBLOCK)
1962 break; /* the descriptor is empty */
1963 else if (errno == EINTR)
1964 continue; /* retry */
1965 else
1966 {
1967 waiting = false;
1968#ifdef WAIT_USE_SELF_PIPE
1969 elog(ERROR, "read() on self-pipe failed: %m");
1970#else
1971 elog(ERROR, "read() on signalfd failed: %m");
1972#endif
1973 }
1974 }
1975 else if (rc == 0)
1976 {
1977 waiting = false;
1978#ifdef WAIT_USE_SELF_PIPE
1979 elog(ERROR, "unexpected EOF on self-pipe");
1980#else
1981 elog(ERROR, "unexpected EOF on signalfd");
1982#endif
1983 }
1984 else if (rc < sizeof(buf))
1985 {
1986 /* we successfully drained the pipe; no need to read() again */
1987 break;
1988 }
1989 /* else buffer wasn't big enough, so read again */
1990 }
1991}
#define read(a, b, c)
Definition: win32.h:13
static char * buf
Definition: pg_test_fsync.c:72
static volatile sig_atomic_t waiting
Definition: waiteventset.c:170
#define EINTR
Definition: win32_port.h:364
#define EWOULDBLOCK
Definition: win32_port.h:370
#define EAGAIN
Definition: win32_port.h:362

References buf, EAGAIN, EINTR, elog, ERROR, EWOULDBLOCK, fd(), read, selfpipe_readfd, and waiting.

Referenced by WaitEventSetWaitBlock().

◆ FreeWaitEventSet()

void FreeWaitEventSet ( WaitEventSet * set)

Definition at line 480 of file waiteventset.c.

481{
482 if (set->owner)
483 {
484 ResourceOwnerForgetWaitEventSet(set->owner, set);
485 set->owner = NULL;
486 }
487
488#if defined(WAIT_USE_EPOLL)
489 close(set->epoll_fd);
490 ReleaseExternalFD();
491#elif defined(WAIT_USE_KQUEUE)
492 close(set->kqueue_fd);
493 ReleaseExternalFD();
494#elif defined(WAIT_USE_WIN32)
495 for (WaitEvent *cur_event = set->events;
496 cur_event < (set->events + set->nevents);
497 cur_event++)
498 {
499 if (cur_event->events & WL_LATCH_SET)
500 {
501 /* uses the latch's HANDLE */
502 }
503 else if (cur_event->events & WL_POSTMASTER_DEATH)
504 {
505 /* uses PostmasterHandle */
506 }
507 else
508 {
509 /* Clean up the event object we created for the socket */
510 WSAEventSelect(cur_event->fd, NULL, 0);
511 WSACloseEvent(set->handles[cur_event->pos + 1]);
512 }
513 }
514#endif
515
516 pfree(set);
517}
void pfree(void *pointer)
Definition: mcxt.c:1524
static void ResourceOwnerForgetWaitEventSet(ResourceOwner owner, WaitEventSet *set)
Definition: waiteventset.c:227

References close, WaitEventSet::events, WaitEventSet::nevents, WaitEventSet::owner, pfree(), ReleaseExternalFD(), ResourceOwnerForgetWaitEventSet(), WL_LATCH_SET, and WL_POSTMASTER_DEATH.

Referenced by ConfigurePostmasterWaitSet(), ExecAppendAsyncEventWait(), ResOwnerReleaseWaitEventSet(), and WaitLatchOrSocket().

◆ FreeWaitEventSetAfterFork()

void FreeWaitEventSetAfterFork ( WaitEventSet * set)

Definition at line 523 of file waiteventset.c.

524{
525#if defined(WAIT_USE_EPOLL)
526 close(set->epoll_fd);
527 ReleaseExternalFD();
528#elif defined(WAIT_USE_KQUEUE)
529 /* kqueues are not normally inherited by child processes */
530 ReleaseExternalFD();
531#endif
532
533 pfree(set);
534}

References close, pfree(), and ReleaseExternalFD().

Referenced by ClosePostmasterPorts().

◆ GetNumRegisteredWaitEvents()

int GetNumRegisteredWaitEvents ( WaitEventSet * set)

Definition at line 1882 of file waiteventset.c.

1883{
1884 return set->nevents;
1885}

References WaitEventSet::nevents.

Referenced by ExecAppendAsyncEventWait(), and postgresForeignAsyncConfigureWait().

◆ InitializeWaitEventSupport()

void InitializeWaitEventSupport ( void  )

Definition at line 240 of file waiteventset.c.

241{
242#if defined(WAIT_USE_SELF_PIPE)
243 int pipefd[2];
244
245 if (IsUnderPostmaster)
246 {
247 /*
248 * We might have inherited connections to a self-pipe created by the
249 * postmaster. It's critical that child processes create their own
250 * self-pipes, of course, and we really want them to close the
251 * inherited FDs for safety's sake.
252 */
253 if (selfpipe_owner_pid != 0)
254 {
255 /* Assert we go through here but once in a child process */
256 Assert(selfpipe_owner_pid != MyProcPid);
257 /* Release postmaster's pipe FDs; ignore any error */
258 (void) close(selfpipe_readfd);
259 (void) close(selfpipe_writefd);
260 /* Clean up, just for safety's sake; we'll set these below */
261 selfpipe_readfd = selfpipe_writefd = -1;
262 selfpipe_owner_pid = 0;
263 /* Keep fd.c's accounting straight */
264 ReleaseExternalFD();
265 ReleaseExternalFD();
266 }
267 else
268 {
269 /*
270 * Postmaster didn't create a self-pipe ... or else we're in an
271 * EXEC_BACKEND build, in which case it doesn't matter since the
272 * postmaster's pipe FDs were closed by the action of FD_CLOEXEC.
273 * fd.c won't have state to clean up, either.
274 */
275 Assert(selfpipe_readfd == -1);
276 }
277 }
278 else
279 {
280 /* In postmaster or standalone backend, assert we do this but once */
281 Assert(selfpipe_readfd == -1);
282 Assert(selfpipe_owner_pid == 0);
283 }
284
285 /*
286 * Set up the self-pipe that allows a signal handler to wake up the
287 * poll()/epoll_wait() in WaitLatch. Make the write-end non-blocking, so
288 * that SetLatch won't block if the event has already been set many times
289 * filling the kernel buffer. Make the read-end non-blocking too, so that
290 * we can easily clear the pipe by reading until EAGAIN or EWOULDBLOCK.
291 * Also, make both FDs close-on-exec, since we surely do not want any
292 * child processes messing with them.
293 */
294 if (pipe(pipefd) < 0)
295 elog(FATAL, "pipe() failed: %m");
296 if (fcntl(pipefd[0], F_SETFL, O_NONBLOCK) == -1)
297 elog(FATAL, "fcntl(F_SETFL) failed on read-end of self-pipe: %m");
298 if (fcntl(pipefd[1], F_SETFL, O_NONBLOCK) == -1)
299 elog(FATAL, "fcntl(F_SETFL) failed on write-end of self-pipe: %m");
300 if (fcntl(pipefd[0], F_SETFD, FD_CLOEXEC) == -1)
301 elog(FATAL, "fcntl(F_SETFD) failed on read-end of self-pipe: %m");
302 if (fcntl(pipefd[1], F_SETFD, FD_CLOEXEC) == -1)
303 elog(FATAL, "fcntl(F_SETFD) failed on write-end of self-pipe: %m");
304
305 selfpipe_readfd = pipefd[0];
306 selfpipe_writefd = pipefd[1];
307 selfpipe_owner_pid = MyProcPid;
308
309 /* Tell fd.c about these two long-lived FDs */
310 ReserveExternalFD();
311 ReserveExternalFD();
312
313 pqsignal(SIGURG, latch_sigurg_handler);
314#endif
315
316#ifdef WAIT_USE_SIGNALFD
317 sigset_t signalfd_mask;
318
319 if (IsUnderPostmaster)
320 {
321 /*
322 * It would probably be safe to re-use the inherited signalfd since
323 * signalfds only see the current process's pending signals, but it
324 * seems less surprising to close it and create our own.
325 */
326 if (signal_fd != -1)
327 {
328 /* Release postmaster's signal FD; ignore any error */
329 (void) close(signal_fd);
330 signal_fd = -1;
331 ReleaseExternalFD();
332 }
333 }
334
335 /* Block SIGURG, because we'll receive it through a signalfd. */
336 sigaddset(&UnBlockSig, SIGURG);
337
338 /* Set up the signalfd to receive SIGURG notifications. */
339 sigemptyset(&signalfd_mask);
340 sigaddset(&signalfd_mask, SIGURG);
341 signal_fd = signalfd(-1, &signalfd_mask, SFD_NONBLOCK | SFD_CLOEXEC);
342 if (signal_fd < 0)
343 elog(FATAL, "signalfd() failed");
344 ReserveExternalFD();
345#endif
346
347#ifdef WAIT_USE_KQUEUE
348 /* Ignore SIGURG, because we'll receive it via kqueue. */
349 pqsignal(SIGURG, SIG_IGN);
350#endif
351}
sigset_t UnBlockSig
Definition: pqsignal.c:22
#define FATAL
Definition: elog.h:41
void ReserveExternalFD(void)
Definition: fd.c:1222
bool IsUnderPostmaster
Definition: globals.c:119
#define pqsignal
Definition: port.h:521
static void latch_sigurg_handler(SIGNAL_ARGS)
static int selfpipe_owner_pid
Definition: waiteventset.c:184
static int selfpipe_writefd
Definition: waiteventset.c:181

References Assert(), close, elog, FATAL, IsUnderPostmaster, latch_sigurg_handler(), MyProcPid, pqsignal, ReleaseExternalFD(), ReserveExternalFD(), selfpipe_owner_pid, selfpipe_readfd, selfpipe_writefd, and UnBlockSig.

Referenced by InitPostmasterChild(), InitStandaloneProcess(), and PostmasterMain().

◆ latch_sigurg_handler()

static void latch_sigurg_handler ( SIGNAL_ARGS  )
static

Definition at line 1895 of file waiteventset.c.

1896{
1897 if (waiting)
1898 sendSelfPipeByte();
1899}
static void sendSelfPipeByte(void)

References sendSelfPipeByte(), and waiting.

Referenced by InitializeWaitEventSupport().

◆ ModifyWaitEvent()

void ModifyWaitEvent ( WaitEventSet * set,
int  pos,
uint32  events,
Latch * latch 
)

Definition at line 655 of file waiteventset.c.

656{
657 WaitEvent *event;
658#if defined(WAIT_USE_KQUEUE)
659 int old_events;
660#endif
661
662 Assert(pos < set->nevents);
663
664 event = &set->events[pos];
665#if defined(WAIT_USE_KQUEUE)
666 old_events = event->events;
667#endif
668
669 /*
670 * Allow switching between WL_POSTMASTER_DEATH and WL_EXIT_ON_PM_DEATH.
671 *
672 * Note that because WL_EXIT_ON_PM_DEATH is mapped to WL_POSTMASTER_DEATH
673 * in AddWaitEventToSet(), this needs to be checked before the fast-path
674 * below that checks if 'events' has changed.
675 */
676 if (event->events == WL_POSTMASTER_DEATH)
677 {
678 if (events != WL_POSTMASTER_DEATH && events != WL_EXIT_ON_PM_DEATH)
679 elog(ERROR, "cannot remove postmaster death event");
680 set->exit_on_postmaster_death = ((events & WL_EXIT_ON_PM_DEATH) != 0);
681 return;
682 }
683
684 /*
685 * If neither the event mask nor the associated latch changes, return
686 * early. That's an important optimization for some sockets, where
687 * ModifyWaitEvent is frequently used to switch from waiting for reads to
688 * waiting on writes.
689 */
690 if (events == event->events &&
691 (!(event->events & WL_LATCH_SET) || set->latch == latch))
692 return;
693
694 if (event->events & WL_LATCH_SET && events != event->events)
695 elog(ERROR, "cannot modify latch event");
696
697 /* FIXME: validate event mask */
698 event->events = events;
699
700 if (events == WL_LATCH_SET)
701 {
702 if (latch && latch->owner_pid != MyProcPid)
703 elog(ERROR, "cannot wait on a latch owned by another process");
704 set->latch = latch;
705
706 /*
707 * On Unix, we don't need to modify the kernel object because the
708 * underlying pipe (if there is one) is the same for all latches so we
709 * can return immediately. On Windows, we need to update our array of
710 * handles, but we leave the old one in place and tolerate spurious
711 * wakeups if the latch is disabled.
712 */
713#if defined(WAIT_USE_WIN32)
714 if (!latch)
715 return;
716#else
717 return;
718#endif
719 }
720
721#if defined(WAIT_USE_EPOLL)
722 WaitEventAdjustEpoll(set, event, EPOLL_CTL_MOD);
723#elif defined(WAIT_USE_KQUEUE)
724 WaitEventAdjustKqueue(set, event, old_events);
725#elif defined(WAIT_USE_POLL)
726 WaitEventAdjustPoll(set, event);
727#elif defined(WAIT_USE_WIN32)
728 WaitEventAdjustWin32(set, event);
729#endif
730}
uint32 events
Definition: waiteventset.h:62

References Assert(), elog, ERROR, WaitEventSet::events, WaitEvent::events, WaitEventSet::exit_on_postmaster_death, WaitEventSet::latch, MyProcPid, Latch::owner_pid, WaitEventAdjustPoll(), WL_EXIT_ON_PM_DEATH, WL_LATCH_SET, and WL_POSTMASTER_DEATH.

Referenced by pq_check_connection(), secure_read(), secure_write(), SwitchBackToLocalLatch(), SwitchToSharedLatch(), WaitLatch(), and WalSndWait().

◆ ResourceOwnerForgetWaitEventSet()

static void ResourceOwnerForgetWaitEventSet ( ResourceOwner  owner,
WaitEventSet * set 
)
inlinestatic

Definition at line 227 of file waiteventset.c.

228{
229 ResourceOwnerForget(owner, PointerGetDatum(set), &wait_event_set_resowner_desc);
230}
static Datum PointerGetDatum(const void *X)
Definition: postgres.h:327
void ResourceOwnerForget(ResourceOwner owner, Datum value, const ResourceOwnerDesc *kind)
Definition: resowner.c:564
static const ResourceOwnerDesc wait_event_set_resowner_desc
Definition: waiteventset.c:211

References PointerGetDatum(), ResourceOwnerForget(), and wait_event_set_resowner_desc.

Referenced by FreeWaitEventSet().

◆ ResourceOwnerRememberWaitEventSet()

static void ResourceOwnerRememberWaitEventSet ( ResourceOwner  owner,
WaitEventSet * set 
)
inlinestatic

Definition at line 222 of file waiteventset.c.

223{
224 ResourceOwnerRemember(owner, PointerGetDatum(set), &wait_event_set_resowner_desc);
225}
void ResourceOwnerRemember(ResourceOwner owner, Datum value, const ResourceOwnerDesc *kind)
Definition: resowner.c:524

References PointerGetDatum(), ResourceOwnerRemember(), and wait_event_set_resowner_desc.

Referenced by CreateWaitEventSet().

◆ ResOwnerReleaseWaitEventSet()

static void ResOwnerReleaseWaitEventSet ( Datum  res)
static

Definition at line 1996 of file waiteventset.c.

1997{
1998 WaitEventSet *set = (WaitEventSet *) DatumGetPointer(res);
1999
2000 Assert(set->owner != NULL);
2001 set->owner = NULL;
2002 FreeWaitEventSet(set);
2003}
static Pointer DatumGetPointer(Datum X)
Definition: postgres.h:317
void FreeWaitEventSet(WaitEventSet *set)
Definition: waiteventset.c:480

References Assert(), DatumGetPointer(), FreeWaitEventSet(), and WaitEventSet::owner.

◆ sendSelfPipeByte()

static void sendSelfPipeByte ( void  )
static

Definition at line 1903 of file waiteventset.c.

1904{
1905 int rc;
1906 char dummy = 0;
1907
1908retry:
1909 rc = write(selfpipe_writefd, &dummy, 1);
1910 if (rc < 0)
1911 {
1912 /* If interrupted by signal, just retry */
1913 if (errno == EINTR)
1914 goto retry;
1915
1916 /*
1917 * If the pipe is full, we don't need to retry, the data that's there
1918 * already is enough to wake up WaitLatch.
1919 */
1920 if (errno == EAGAIN || errno == EWOULDBLOCK)
1921 return;
1922
1923 /*
1924 * Oops, the write() failed for some other reason. We might be in a
1925 * signal handler, so it's not safe to elog(). We have no choice but
1926 * silently ignore the error.
1927 */
1928 return;
1929 }
1930}
#define write(a, b, c)
Definition: win32.h:14

References EAGAIN, EINTR, EWOULDBLOCK, selfpipe_writefd, and write.

Referenced by latch_sigurg_handler(), and WakeupMyProc().

◆ WaitEventAdjustPoll()

static void WaitEventAdjustPoll ( WaitEventSet * set,
WaitEvent * event 
)
static

Definition at line 789 of file waiteventset.c.

790{
791 struct pollfd *pollfd = &set->pollfds[event->pos];
792
793 pollfd->revents = 0;
794 pollfd->fd = event->fd;
795
796 /* prepare pollfd entry once */
797 if (event->events == WL_LATCH_SET)
798 {
799 Assert(set->latch != NULL);
800 pollfd->events = POLLIN;
801 }
802 else if (event->events == WL_POSTMASTER_DEATH)
803 {
804 pollfd->events = POLLIN;
805 }
806 else
807 {
808 Assert(event->events & (WL_SOCKET_READABLE |
809 WL_SOCKET_WRITEABLE |
810 WL_SOCKET_CLOSED));
811 pollfd->events = 0;
812 if (event->events & WL_SOCKET_READABLE)
813 pollfd->events |= POLLIN;
814 if (event->events & WL_SOCKET_WRITEABLE)
815 pollfd->events |= POLLOUT;
816#ifdef POLLRDHUP
817 if (event->events & WL_SOCKET_CLOSED)
818 pollfd->events |= POLLRDHUP;
819#endif
820 }
821
822 Assert(event->fd != PGINVALID_SOCKET);
823}
pgsocket fd
Definition: waiteventset.h:63
#define WL_SOCKET_READABLE
Definition: waiteventset.h:35
#define WL_SOCKET_CLOSED
Definition: waiteventset.h:46
#define WL_SOCKET_WRITEABLE
Definition: waiteventset.h:36

References Assert(), WaitEvent::events, WaitEvent::fd, WaitEventSet::latch, PGINVALID_SOCKET, WaitEventSet::pollfds, WL_LATCH_SET, WL_POSTMASTER_DEATH, WL_SOCKET_CLOSED, WL_SOCKET_READABLE, and WL_SOCKET_WRITEABLE.

Referenced by AddWaitEventToSet(), and ModifyWaitEvent().

◆ WaitEventSetCanReportClosed()

bool WaitEventSetCanReportClosed ( void  )

Definition at line 1867 of file waiteventset.c.

1868{
1869#if (defined(WAIT_USE_POLL) && defined(POLLRDHUP)) || \
1870 defined(WAIT_USE_EPOLL) || \
1871 defined(WAIT_USE_KQUEUE)
1872 return true;
1873#else
1874 return false;
1875#endif
1876}

Referenced by check_client_connection_check_interval().

◆ WaitEventSetWait()

int WaitEventSetWait ( WaitEventSet * set,
long  timeout,
WaitEvent * occurred_events,
int  nevents,
uint32  wait_event_info 
)

Definition at line 1037 of file waiteventset.c.

1040{
1041 int returned_events = 0;
1042 instr_time start_time;
1043 instr_time cur_time;
1044 long cur_timeout = -1;
1045
1046 Assert(nevents > 0);
1047
1048 /*
1049 * Initialize timeout if requested. We must record the current time so
1050 * that we can determine the remaining timeout if interrupted.
1051 */
1052 if (timeout >= 0)
1053 {
1054 INSTR_TIME_SET_CURRENT(start_time);
1055 Assert(timeout >= 0 && timeout <= INT_MAX);
1056 cur_timeout = timeout;
1057 }
1058 else
1059 INSTR_TIME_SET_ZERO(start_time);
1060
1061 pgstat_report_wait_start(wait_event_info);
1062
1063#ifndef WIN32
1064 waiting = true;
1065#else
1066 /* Ensure that signals are serviced even if latch is already set */
1067 pgwin32_dispatch_queued_signals();
1068#endif
1069 while (returned_events == 0)
1070 {
1071 int rc;
1072
1073 /*
1074 * Check if the latch is set already first. If so, we either exit
1075 * immediately or ask the kernel for further events available right
1076 * now without waiting, depending on how many events the caller wants.
1077 *
1078 * If someone sets the latch between this and the
1079 * WaitEventSetWaitBlock() below, the setter will write a byte to the
1080 * pipe (or signal us and the signal handler will do that), and the
1081 * readiness routine will return immediately.
1082 *
1083 * On unix, If there's a pending byte in the self pipe, we'll notice
1084 * whenever blocking. Only clearing the pipe in that case avoids
1085 * having to drain it every time WaitLatchOrSocket() is used. Should
1086 * the pipe-buffer fill up we're still ok, because the pipe is in
1087 * nonblocking mode. It's unlikely for that to happen, because the
1088 * self pipe isn't filled unless we're blocking (waiting = true), or
1089 * from inside a signal handler in latch_sigurg_handler().
1090 *
1091 * On windows, we'll also notice if there's a pending event for the
1092 * latch when blocking, but there's no danger of anything filling up,
1093 * as "Setting an event that is already set has no effect.".
1094 *
1095 * Note: we assume that the kernel calls involved in latch management
1096 * will provide adequate synchronization on machines with weak memory
1097 * ordering, so that we cannot miss seeing is_set if a notification
1098 * has already been queued.
1099 */
1100 if (set->latch && !set->latch->is_set)
1101 {
1102 /* about to sleep on a latch */
1103 set->latch->maybe_sleeping = true;
1104 pg_memory_barrier();
1105 /* and recheck */
1106 }
1107
1108 if (set->latch && set->latch->is_set)
1109 {
1110 occurred_events->fd = PGINVALID_SOCKET;
1111 occurred_events->pos = set->latch_pos;
1112 occurred_events->user_data =
1113 set->events[set->latch_pos].user_data;
1114 occurred_events->events = WL_LATCH_SET;
1115 occurred_events++;
1116 returned_events++;
1117
1118 /* could have been set above */
1119 set->latch->maybe_sleeping = false;
1120
1121 if (returned_events == nevents)
1122 break; /* output buffer full already */
1123
1124 /*
1125 * Even though we already have an event, we'll poll just once with
1126 * zero timeout to see what non-latch events we can fit into the
1127 * output buffer at the same time.
1128 */
1129 cur_timeout = 0;
1130 timeout = 0;
1131 }
1132
1133 /*
1134 * Wait for events using the readiness primitive chosen at the top of
1135 * this file. If -1 is returned, a timeout has occurred, if 0 we have
1136 * to retry, everything >= 1 is the number of returned events.
1137 */
1138 rc = WaitEventSetWaitBlock(set, cur_timeout,
1139 occurred_events, nevents - returned_events);
1140
1141 if (set->latch &&
1142 set->latch->maybe_sleeping)
1143 set->latch->maybe_sleeping = false;
1144
1145 if (rc == -1)
1146 break; /* timeout occurred */
1147 else
1148 returned_events += rc;
1149
1150 /* If we're not done, update cur_timeout for next iteration */
1151 if (returned_events == 0 && timeout >= 0)
1152 {
1153 INSTR_TIME_SET_CURRENT(cur_time);
1154 INSTR_TIME_SUBTRACT(cur_time, start_time);
1155 cur_timeout = timeout - (long) INSTR_TIME_GET_MILLISEC(cur_time);
1156 if (cur_timeout <= 0)
1157 break;
1158 }
1159 }
1160#ifndef WIN32
1161 waiting = false;
1162#endif
1163
1164 pgstat_report_wait_end();
1165
1166 return returned_events;
1167}
#define pg_memory_barrier()
Definition: atomics.h:143
#define INSTR_TIME_SET_CURRENT(t)
Definition: instr_time.h:122
#define INSTR_TIME_SUBTRACT(x, y)
Definition: instr_time.h:181
#define INSTR_TIME_GET_MILLISEC(t)
Definition: instr_time.h:191
#define INSTR_TIME_SET_ZERO(t)
Definition: instr_time.h:172
static time_t start_time
Definition: pg_ctl.c:95
void pgwin32_dispatch_queued_signals(void)
Definition: signal.c:120
sig_atomic_t is_set
Definition: latch.h:115
sig_atomic_t maybe_sleeping
Definition: latch.h:116
void * user_data
Definition: waiteventset.h:64
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: wait_event.h:85
static void pgstat_report_wait_end(void)
Definition: wait_event.h:101
static int WaitEventSetWaitBlock(WaitEventSet *set, int cur_timeout, WaitEvent *occurred_events, int nevents)

References Assert(), WaitEventSet::events, WaitEvent::events, WaitEvent::fd, INSTR_TIME_GET_MILLISEC, INSTR_TIME_SET_CURRENT, INSTR_TIME_SET_ZERO, INSTR_TIME_SUBTRACT, Latch::is_set, WaitEventSet::latch, WaitEventSet::latch_pos, Latch::maybe_sleeping, pg_memory_barrier, PGINVALID_SOCKET, pgstat_report_wait_end(), pgstat_report_wait_start(), pgwin32_dispatch_queued_signals(), WaitEvent::pos, start_time, WaitEvent::user_data, WaitEventSetWaitBlock(), waiting, and WL_LATCH_SET.

Referenced by ExecAppendAsyncEventWait(), pq_check_connection(), secure_read(), secure_write(), ServerLoop(), SysLoggerMain(), WaitLatch(), WaitLatchOrSocket(), and WalSndWait().

◆ WaitEventSetWaitBlock()

static int WaitEventSetWaitBlock ( WaitEventSet * set,
int  cur_timeout,
WaitEvent * occurred_events,
int  nevents 
)
inline static

Definition at line 1470 of file waiteventset.c.

1472{
1473 int returned_events = 0;
1474 int rc;
1475 WaitEvent *cur_event;
1476 struct pollfd *cur_pollfd;
1477
1478 /* Sleep */
1479 rc = poll(set->pollfds, set->nevents, (int) cur_timeout);
1480
1481 /* Check return code */
1482 if (rc < 0)
1483 {
1484 /* EINTR is okay, otherwise complain */
1485 if (errno != EINTR)
1486 {
1487 waiting = false;
1488 ereport(ERROR,
1490 errmsg("%s() failed: %m",
1491 "poll")));
1492 }
1493 return 0;
1494 }
1495 else if (rc == 0)
1496 {
1497 /* timeout exceeded */
1498 return -1;
1499 }
1500
1501 for (cur_event = set->events, cur_pollfd = set->pollfds;
1502 cur_event < (set->events + set->nevents) &&
1503 returned_events < nevents;
1504 cur_event++, cur_pollfd++)
1505 {
1506 /* no activity on this FD, skip */
1507 if (cur_pollfd->revents == 0)
1508 continue;
1509
1510 occurred_events->pos = cur_event->pos;
1511 occurred_events->user_data = cur_event->user_data;
1512 occurred_events->events = 0;
1513
1514 if (cur_event->events == WL_LATCH_SET &&
1515 (cur_pollfd->revents & (POLLIN | POLLHUP | POLLERR | POLLNVAL)))
1516 {
1517 /* There's data in the self-pipe, clear it. */
1518 drain();
1519
1520 if (set->latch && set->latch->maybe_sleeping && set->latch->is_set)
1521 {
1522 occurred_events->fd = PGINVALID_SOCKET;
1523 occurred_events->events = WL_LATCH_SET;
1524 occurred_events++;
1525 returned_events++;
1526 }
1527 }
1528 else if (cur_event->events == WL_POSTMASTER_DEATH &&
1529 (cur_pollfd->revents & (POLLIN | POLLHUP | POLLERR | POLLNVAL)))
1530 {
1531 /*
1532 * We expect an POLLHUP when the remote end is closed, but because
1533 * we don't expect the pipe to become readable or to have any
1534 * errors either, treat those cases as postmaster death, too.
1535 *
1536 * Be paranoid about a spurious event signaling the postmaster as
1537 * being dead. There have been reports about that happening with
1538 * older primitives (select(2) to be specific), and a spurious
1539 * WL_POSTMASTER_DEATH event would be painful. Re-checking doesn't
1540 * cost much.
1541 */
1543 {
1544 if (set->exit_on_postmaster_death)
1545 proc_exit(1);
1546 occurred_events->fd = PGINVALID_SOCKET;
1547 occurred_events->events = WL_POSTMASTER_DEATH;
1548 occurred_events++;
1549 returned_events++;
1550 }
1551 }
1552 else if (cur_event->events & (WL_SOCKET_READABLE |
1555 {
1556 int errflags = POLLHUP | POLLERR | POLLNVAL;
1557
1558 Assert(cur_event->fd >= PGINVALID_SOCKET);
1559
1560 if ((cur_event->events & WL_SOCKET_READABLE) &&
1561 (cur_pollfd->revents & (POLLIN | errflags)))
1562 {
1563 /* data available in socket, or EOF */
1564 occurred_events->events |= WL_SOCKET_READABLE;
1565 }
1566
1567 if ((cur_event->events & WL_SOCKET_WRITEABLE) &&
1568 (cur_pollfd->revents & (POLLOUT | errflags)))
1569 {
1570 /* writeable, or EOF */
1571 occurred_events->events |= WL_SOCKET_WRITEABLE;
1572 }
1573
1574#ifdef POLLRDHUP
1575 if ((cur_event->events & WL_SOCKET_CLOSED) &&
1576 (cur_pollfd->revents & (POLLRDHUP | errflags)))
1577 {
1578 /* remote peer closed, or error */
1579 occurred_events->events |= WL_SOCKET_CLOSED;
1580 }
1581#endif
1582
1583 if (occurred_events->events != 0)
1584 {
1585 occurred_events->fd = cur_event->fd;
1586 occurred_events++;
1587 returned_events++;
1588 }
1589 }
1590 }
1591 return returned_events;
1592}
int errcode_for_socket_access(void)
Definition: elog.c:953
int errmsg(const char *fmt,...)
Definition: elog.c:1070
#define ereport(elevel,...)
Definition: elog.h:149
void proc_exit(int code)
Definition: ipc.c:104
bool PostmasterIsAliveInternal(void)
Definition: pmsignal.c:346
static void drain(void)

References Assert(), drain(), EINTR, ereport, errcode_for_socket_access(), errmsg(), ERROR, WaitEventSet::events, WaitEvent::events, WaitEventSet::exit_on_postmaster_death, WaitEvent::fd, Latch::is_set, WaitEventSet::latch, Latch::maybe_sleeping, WaitEventSet::nevents, PGINVALID_SOCKET, WaitEventSet::pollfds, WaitEvent::pos, PostmasterIsAliveInternal(), proc_exit(), WaitEvent::user_data, waiting, WL_LATCH_SET, WL_POSTMASTER_DEATH, WL_SOCKET_CLOSED, WL_SOCKET_READABLE, and WL_SOCKET_WRITEABLE.

Referenced by WaitEventSetWait().

◆ WakeupMyProc()

void WakeupMyProc ( void  )

Definition at line 2019 of file waiteventset.c.

2020{
2021#if defined(WAIT_USE_SELF_PIPE)
2022 if (waiting)
2024#else
2025 if (waiting)
2026 kill(MyProcPid, SIGURG);
2027#endif
2028}
#define kill(pid, sig)
Definition: win32_port.h:493

References kill, MyProcPid, sendSelfPipeByte(), and waiting.

Referenced by SetLatch().

◆ WakeupOtherProc()

void WakeupOtherProc ( int  pid)

Definition at line 2032 of file waiteventset.c.

/*
 * WakeupOtherProc -- send SIGURG to the process identified by pid.
 *
 * The result of kill() is deliberately not examined.  Called from
 * SetLatch().
 */
void
WakeupOtherProc(int pid)
{
	(void) kill(pid, SIGURG);
}

References kill.

Referenced by SetLatch().

Variable Documentation

◆ selfpipe_owner_pid

int selfpipe_owner_pid = 0
static

Definition at line 184 of file waiteventset.c.

Referenced by InitializeWaitEventSupport().

◆ selfpipe_readfd

int selfpipe_readfd = -1
static

Definition at line 180 of file waiteventset.c.

Referenced by AddWaitEventToSet(), drain(), and InitializeWaitEventSupport().

◆ selfpipe_writefd

int selfpipe_writefd = -1
static

Definition at line 181 of file waiteventset.c.

Referenced by InitializeWaitEventSupport(), and sendSelfPipeByte().

◆ wait_event_set_resowner_desc

const ResourceOwnerDesc wait_event_set_resowner_desc
static
Initial value:
=
{
/* Name string for this kind of resource */
.name = "WaitEventSet",
/* Release phase, and priority within that phase */
.release_phase = RESOURCE_RELEASE_AFTER_LOCKS,
.release_priority = RELEASE_PRIO_WAITEVENTSETS,
/* Callback invoked to release a remembered WaitEventSet */
.ReleaseResource = ResOwnerReleaseWaitEventSet,
/* No debug-print callback is supplied */
.DebugPrint = NULL
}
#define RELEASE_PRIO_WAITEVENTSETS
Definition: resowner.h:77
@ RESOURCE_RELEASE_AFTER_LOCKS
Definition: resowner.h:56
static void ResOwnerReleaseWaitEventSet(Datum res)

Definition at line 211 of file waiteventset.c.

Referenced by ResourceOwnerForgetWaitEventSet(), and ResourceOwnerRememberWaitEventSet().

◆ waiting