54#ifdef HAVE_SYS_EPOLL_H
57#ifdef HAVE_SYS_EVENT_H
60#ifdef HAVE_SYS_SIGNALFD_H
61#include <sys/signalfd.h>
86#if defined(WAIT_USE_EPOLL) || defined(WAIT_USE_POLL) || \
87 defined(WAIT_USE_KQUEUE) || defined(WAIT_USE_WIN32)
89#elif defined(HAVE_SYS_EPOLL_H)
91#elif defined(HAVE_KQUEUE)
92#define WAIT_USE_KQUEUE
93#elif defined(HAVE_POLL)
98#error "no wait set implementation available"
105#if defined(WAIT_USE_POLL) || defined(WAIT_USE_EPOLL)
106#if defined(WAIT_USE_SELF_PIPE) || defined(WAIT_USE_SIGNALFD)
108#elif defined(WAIT_USE_EPOLL) && defined(HAVE_SYS_SIGNALFD_H)
109#define WAIT_USE_SIGNALFD
111#define WAIT_USE_SELF_PIPE
145#if defined(WAIT_USE_EPOLL)
148 struct epoll_event *epoll_ret_events;
149#elif defined(WAIT_USE_KQUEUE)
152 struct kevent *kqueue_ret_events;
153 bool report_postmaster_not_running;
154#elif defined(WAIT_USE_POLL)
157#elif defined(WAIT_USE_WIN32)
173#ifdef WAIT_USE_SIGNALFD
175static int signal_fd = -1;
178#ifdef WAIT_USE_SELF_PIPE
191#if defined(WAIT_USE_SELF_PIPE) || defined(WAIT_USE_SIGNALFD)
192static void drain(
void);
195#if defined(WAIT_USE_EPOLL)
197#elif defined(WAIT_USE_KQUEUE)
199#elif defined(WAIT_USE_POLL)
201#elif defined(WAIT_USE_WIN32)
206 WaitEvent *occurred_events,
int nevents);
213 .
name =
"WaitEventSet",
242#if defined(WAIT_USE_SELF_PIPE)
294 if (pipe(pipefd) < 0)
296 if (fcntl(pipefd[0], F_SETFL, O_NONBLOCK) == -1)
297 elog(
FATAL,
"fcntl(F_SETFL) failed on read-end of self-pipe: %m");
298 if (fcntl(pipefd[1], F_SETFL, O_NONBLOCK) == -1)
299 elog(
FATAL,
"fcntl(F_SETFL) failed on write-end of self-pipe: %m");
300 if (fcntl(pipefd[0], F_SETFD, FD_CLOEXEC) == -1)
301 elog(
FATAL,
"fcntl(F_SETFD) failed on read-end of self-pipe: %m");
302 if (fcntl(pipefd[1], F_SETFD, FD_CLOEXEC) == -1)
303 elog(
FATAL,
"fcntl(F_SETFD) failed on write-end of self-pipe: %m");
316#ifdef WAIT_USE_SIGNALFD
317 sigset_t signalfd_mask;
329 (void)
close(signal_fd);
339 sigemptyset(&signalfd_mask);
340 sigaddset(&signalfd_mask, SIGURG);
341 signal_fd = signalfd(-1, &signalfd_mask, SFD_NONBLOCK | SFD_CLOEXEC);
347#ifdef WAIT_USE_KQUEUE
378#if defined(WAIT_USE_EPOLL)
379 sz +=
MAXALIGN(
sizeof(
struct epoll_event) * nevents);
380#elif defined(WAIT_USE_KQUEUE)
381 sz +=
MAXALIGN(
sizeof(
struct kevent) * nevents);
382#elif defined(WAIT_USE_POLL)
383 sz +=
MAXALIGN(
sizeof(
struct pollfd) * nevents);
384#elif defined(WAIT_USE_WIN32)
386 sz +=
MAXALIGN(
sizeof(HANDLE) * (nevents + 1));
389 if (resowner != NULL)
400#if defined(WAIT_USE_EPOLL)
401 set->epoll_ret_events = (
struct epoll_event *)
data;
403#elif defined(WAIT_USE_KQUEUE)
404 set->kqueue_ret_events = (
struct kevent *)
data;
406#elif defined(WAIT_USE_POLL)
409#elif defined(WAIT_USE_WIN32)
410 set->handles = (HANDLE)
data;
418 if (resowner != NULL)
421 set->
owner = resowner;
424#if defined(WAIT_USE_EPOLL)
426 elog(
ERROR,
"AcquireExternalFD, for epoll_create1, failed: %m");
427 set->epoll_fd = epoll_create1(EPOLL_CLOEXEC);
428 if (set->epoll_fd < 0)
433#elif defined(WAIT_USE_KQUEUE)
435 elog(
ERROR,
"AcquireExternalFD, for kqueue, failed: %m");
436 set->kqueue_fd = kqueue();
437 if (set->kqueue_fd < 0)
442 if (fcntl(set->kqueue_fd, F_SETFD, FD_CLOEXEC) == -1)
444 int save_errno = errno;
446 close(set->kqueue_fd);
449 elog(
ERROR,
"fcntl(F_SETFD) failed on kqueue descriptor: %m");
451 set->report_postmaster_not_running =
false;
452#elif defined(WAIT_USE_WIN32)
488#if defined(WAIT_USE_EPOLL)
489 close(set->epoll_fd);
491#elif defined(WAIT_USE_KQUEUE)
492 close(set->kqueue_fd);
494#elif defined(WAIT_USE_WIN32)
510 WSAEventSelect(cur_event->fd, NULL, 0);
511 WSACloseEvent(set->handles[cur_event->pos + 1]);
525#if defined(WAIT_USE_EPOLL)
526 close(set->epoll_fd);
528#elif defined(WAIT_USE_KQUEUE)
586 elog(
ERROR,
"cannot wait on a latch owned by another process");
588 elog(
ERROR,
"cannot wait on more than one latch");
590 elog(
ERROR,
"latch events only support being set");
595 elog(
ERROR,
"cannot wait on latch without a specified latch");
600 elog(
ERROR,
"cannot wait on socket event without a socket");
605 event->events = events;
606 event->user_data = user_data;
608 event->reset =
false;
615#if defined(WAIT_USE_SELF_PIPE)
617#elif defined(WAIT_USE_SIGNALFD)
618 event->fd = signal_fd;
634#if defined(WAIT_USE_EPOLL)
635 WaitEventAdjustEpoll(set, event, EPOLL_CTL_ADD);
636#elif defined(WAIT_USE_KQUEUE)
637 WaitEventAdjustKqueue(set, event, 0);
638#elif defined(WAIT_USE_POLL)
640#elif defined(WAIT_USE_WIN32)
641 WaitEventAdjustWin32(set, event);
658#if defined(WAIT_USE_KQUEUE)
662 Assert(pos < set->nevents);
664 event = &set->
events[pos];
665#if defined(WAIT_USE_KQUEUE)
666 old_events =
event->
events;
679 elog(
ERROR,
"cannot remove postmaster death event");
690 if (events == event->
events &&
695 elog(
ERROR,
"cannot modify latch event");
698 event->events = events;
703 elog(
ERROR,
"cannot wait on a latch owned by another process");
713#if defined(WAIT_USE_WIN32)
721#if defined(WAIT_USE_EPOLL)
722 WaitEventAdjustEpoll(set, event, EPOLL_CTL_MOD);
723#elif defined(WAIT_USE_KQUEUE)
724 WaitEventAdjustKqueue(set, event, old_events);
725#elif defined(WAIT_USE_POLL)
727#elif defined(WAIT_USE_WIN32)
728 WaitEventAdjustWin32(set, event);
732#if defined(WAIT_USE_EPOLL)
739 struct epoll_event epoll_ev;
743 epoll_ev.data.ptr = event;
745 epoll_ev.
events = EPOLLERR | EPOLLHUP;
751 epoll_ev.events |= EPOLLIN;
755 epoll_ev.events |= EPOLLIN;
765 epoll_ev.events |= EPOLLIN;
767 epoll_ev.events |= EPOLLOUT;
769 epoll_ev.events |= EPOLLRDHUP;
777 rc = epoll_ctl(set->epoll_fd,
action, event->
fd, &epoll_ev);
787#if defined(WAIT_USE_POLL)
791 struct pollfd *pollfd = &set->
pollfds[
event->pos];
794 pollfd->fd =
event->fd;
800 pollfd->events = POLLIN;
804 pollfd->events = POLLIN;
813 pollfd->events |= POLLIN;
815 pollfd->events |= POLLOUT;
818 pollfd->events |= POLLRDHUP;
826#if defined(WAIT_USE_KQUEUE)
834#define AccessWaitEvent(k_ev) (*((WaitEvent **)(&(k_ev)->udata)))
837WaitEventAdjustKqueueAdd(
struct kevent *k_ev,
int filter,
int action,
840 k_ev->ident =
event->fd;
841 k_ev->filter = filter;
845 AccessWaitEvent(k_ev) = event;
849WaitEventAdjustKqueueAddPostmaster(
struct kevent *k_ev,
WaitEvent *event)
853 k_ev->filter = EVFILT_PROC;
854 k_ev->flags = EV_ADD;
855 k_ev->fflags = NOTE_EXIT;
857 AccessWaitEvent(k_ev) = event;
861WaitEventAdjustKqueueAddLatch(
struct kevent *k_ev,
WaitEvent *event)
864 k_ev->ident = SIGURG;
865 k_ev->filter = EVFILT_SIGNAL;
866 k_ev->flags = EV_ADD;
869 AccessWaitEvent(k_ev) = event;
879 struct kevent k_ev[2];
881 bool new_filt_read =
false;
882 bool old_filt_read =
false;
883 bool new_filt_write =
false;
884 bool old_filt_write =
false;
886 if (old_events == event->
events)
903 WaitEventAdjustKqueueAddPostmaster(&k_ev[count++], event);
908 WaitEventAdjustKqueueAddLatch(&k_ev[count++], event);
918 old_filt_read =
true;
920 new_filt_read =
true;
922 old_filt_write =
true;
924 new_filt_write =
true;
925 if (old_filt_read && !new_filt_read)
926 WaitEventAdjustKqueueAdd(&k_ev[count++], EVFILT_READ, EV_DELETE,
928 else if (!old_filt_read && new_filt_read)
929 WaitEventAdjustKqueueAdd(&k_ev[count++], EVFILT_READ, EV_ADD,
931 if (old_filt_write && !new_filt_write)
932 WaitEventAdjustKqueueAdd(&k_ev[count++], EVFILT_WRITE, EV_DELETE,
934 else if (!old_filt_write && new_filt_write)
935 WaitEventAdjustKqueueAdd(&k_ev[count++], EVFILT_WRITE, EV_ADD,
945 rc = kevent(set->kqueue_fd, &k_ev[0], count, NULL, 0, NULL);
957 (errno == ESRCH || errno == EACCES))
958 set->report_postmaster_not_running =
true;
974 set->report_postmaster_not_running =
true;
980#if defined(WAIT_USE_WIN32)
984 HANDLE *handle = &set->handles[
event->pos + 1];
989 *handle = set->
latch->event;
993 *handle = PostmasterHandle;
997 int flags = FD_CLOSE;
1004 flags |= FD_CONNECT;
1008 if (*handle == WSA_INVALID_EVENT)
1010 *handle = WSACreateEvent();
1011 if (*handle == WSA_INVALID_EVENT)
1012 elog(
ERROR,
"failed to create event for socket: error code %d",
1015 if (WSAEventSelect(event->
fd, *handle, flags) != 0)
1016 elog(
ERROR,
"failed to set up event for socket: error code %d",
1038 WaitEvent *occurred_events,
int nevents,
1041 int returned_events = 0;
1044 long cur_timeout = -1;
1055 Assert(timeout >= 0 && timeout <= INT_MAX);
1056 cur_timeout = timeout;
1069 while (returned_events == 0)
1121 if (returned_events == nevents)
1139 occurred_events, nevents - returned_events);
1148 returned_events += rc;
1151 if (returned_events == 0 && timeout >= 0)
1156 if (cur_timeout <= 0)
1166 return returned_events;
1170#if defined(WAIT_USE_EPOLL)
1182 WaitEvent *occurred_events,
int nevents)
1184 int returned_events = 0;
1187 struct epoll_event *cur_epoll_event;
1190 rc = epoll_wait(set->epoll_fd, set->epoll_ret_events,
1202 errmsg(
"%s() failed: %m",
1218 for (cur_epoll_event = set->epoll_ret_events;
1219 cur_epoll_event < (set->epoll_ret_events + rc) &&
1220 returned_events < nevents;
1224 cur_event = (
WaitEvent *) cur_epoll_event->data.ptr;
1226 occurred_events->
pos = cur_event->
pos;
1228 occurred_events->
events = 0;
1231 cur_epoll_event->events & (EPOLLIN | EPOLLERR | EPOLLHUP))
1245 cur_epoll_event->events & (EPOLLIN | EPOLLERR | EPOLLHUP))
1275 (cur_epoll_event->events & (EPOLLIN | EPOLLERR | EPOLLHUP)))
1282 (cur_epoll_event->events & (EPOLLOUT | EPOLLERR | EPOLLHUP)))
1289 (cur_epoll_event->events & (EPOLLRDHUP | EPOLLERR | EPOLLHUP)))
1295 if (occurred_events->
events != 0)
1297 occurred_events->
fd = cur_event->
fd;
1304 return returned_events;
1307#elif defined(WAIT_USE_KQUEUE)
1318 WaitEvent *occurred_events,
int nevents)
1320 int returned_events = 0;
1323 struct kevent *cur_kqueue_event;
1324 struct timespec timeout;
1325 struct timespec *timeout_p;
1327 if (cur_timeout < 0)
1331 timeout.tv_sec = cur_timeout / 1000;
1332 timeout.tv_nsec = (cur_timeout % 1000) * 1000000;
1333 timeout_p = &timeout;
1340 if (
unlikely(set->report_postmaster_not_running))
1350 rc = kevent(set->kqueue_fd, NULL, 0,
1351 set->kqueue_ret_events,
1364 errmsg(
"%s() failed: %m",
1380 for (cur_kqueue_event = set->kqueue_ret_events;
1381 cur_kqueue_event < (set->kqueue_ret_events + rc) &&
1382 returned_events < nevents;
1386 cur_event = AccessWaitEvent(cur_kqueue_event);
1388 occurred_events->
pos = cur_event->
pos;
1390 occurred_events->
events = 0;
1393 cur_kqueue_event->filter == EVFILT_SIGNAL)
1404 cur_kqueue_event->filter == EVFILT_PROC &&
1405 (cur_kqueue_event->fflags & NOTE_EXIT) != 0)
1412 set->report_postmaster_not_running =
true;
1428 (cur_kqueue_event->filter == EVFILT_READ))
1435 (cur_kqueue_event->filter == EVFILT_READ) &&
1436 (cur_kqueue_event->flags & EV_EOF))
1443 (cur_kqueue_event->filter == EVFILT_WRITE))
1449 if (occurred_events->
events != 0)
1451 occurred_events->
fd = cur_event->
fd;
1458 return returned_events;
1461#elif defined(WAIT_USE_POLL)
1471 WaitEvent *occurred_events,
int nevents)
1473 int returned_events = 0;
1476 struct pollfd *cur_pollfd;
1490 errmsg(
"%s() failed: %m",
1503 returned_events < nevents;
1504 cur_event++, cur_pollfd++)
1507 if (cur_pollfd->revents == 0)
1510 occurred_events->
pos = cur_event->
pos;
1512 occurred_events->
events = 0;
1515 (cur_pollfd->revents & (POLLIN | POLLHUP | POLLERR | POLLNVAL)))
1529 (cur_pollfd->revents & (POLLIN | POLLHUP | POLLERR | POLLNVAL)))
1556 int errflags = POLLHUP | POLLERR | POLLNVAL;
1561 (cur_pollfd->revents & (POLLIN | errflags)))
1568 (cur_pollfd->revents & (POLLOUT | errflags)))
1576 (cur_pollfd->revents & (POLLRDHUP | errflags)))
1583 if (occurred_events->
events != 0)
1585 occurred_events->
fd = cur_event->
fd;
1591 return returned_events;
1594#elif defined(WAIT_USE_WIN32)
1605 WaitEvent *occurred_events,
int nevents)
1607 int returned_events = 0;
1612 for (cur_event = set->
events;
1616 if (cur_event->reset)
1618 WaitEventAdjustWin32(set, cur_event);
1619 cur_event->reset =
false;
1644 if (WSARecv(cur_event->
fd, &
buf, 1, &received, &flags, NULL, NULL) == 0)
1646 occurred_events->
pos = cur_event->
pos;
1649 occurred_events->
fd = cur_event->
fd;
1675 r = WSASend(cur_event->
fd, &
buf, 1, &sent, 0, NULL, NULL);
1676 if (r == 0 || WSAGetLastError() != WSAEWOULDBLOCK)
1678 occurred_events->
pos = cur_event->
pos;
1681 occurred_events->
fd = cur_event->
fd;
1692 rc = WaitForMultipleObjects(set->
nevents + 1, set->handles, FALSE,
1696 if (rc == WAIT_FAILED)
1697 elog(
ERROR,
"WaitForMultipleObjects() failed: error code %lu",
1699 else if (rc == WAIT_TIMEOUT)
1705 if (rc == WAIT_OBJECT_0)
1723 occurred_events->
pos = cur_event->
pos;
1725 occurred_events->
events = 0;
1733 if (!ResetEvent(set->handles[cur_event->
pos + 1]))
1734 elog(
ERROR,
"ResetEvent failed: error code %lu", GetLastError());
1765 WSANETWORKEVENTS resEvents;
1766 HANDLE handle = set->handles[cur_event->
pos + 1];
1770 occurred_events->
fd = cur_event->
fd;
1772 ZeroMemory(&resEvents,
sizeof(resEvents));
1773 if (WSAEnumNetworkEvents(cur_event->
fd, handle, &resEvents) != 0)
1774 elog(
ERROR,
"failed to enumerate network events: error code %d",
1777 (resEvents.lNetworkEvents & FD_READ))
1795 cur_event->reset =
true;
1798 (resEvents.lNetworkEvents & FD_WRITE))
1804 (resEvents.lNetworkEvents & FD_CONNECT))
1810 (resEvents.lNetworkEvents & FD_ACCEPT))
1815 if (resEvents.lNetworkEvents & FD_CLOSE)
1821 if (occurred_events->
events != 0)
1829 if (returned_events == nevents)
1833 next_pos = cur_event->
pos + 1;
1842 count = set->
nevents - next_pos;
1843 rc = WaitForMultipleObjects(count,
1844 set->handles + 1 + next_pos,
1852 if (rc < WAIT_OBJECT_0 || rc >= WAIT_OBJECT_0 + count)
1856 cur_event = &set->
events[next_pos + (rc - WAIT_OBJECT_0)];
1859 return returned_events;
1869#if (defined(WAIT_USE_POLL) && defined(POLLRDHUP)) || \
1870 defined(WAIT_USE_EPOLL) || \
1871 defined(WAIT_USE_KQUEUE)
1887#if defined(WAIT_USE_SELF_PIPE)
1934#if defined(WAIT_USE_SELF_PIPE) || defined(WAIT_USE_SIGNALFD)
1950#ifdef WAIT_USE_SELF_PIPE
1963 else if (errno ==
EINTR)
1968#ifdef WAIT_USE_SELF_PIPE
1969 elog(
ERROR,
"read() on self-pipe failed: %m");
1971 elog(
ERROR,
"read() on signalfd failed: %m");
1978#ifdef WAIT_USE_SELF_PIPE
1979 elog(
ERROR,
"unexpected EOF on self-pipe");
1981 elog(
ERROR,
"unexpected EOF on signalfd");
1984 else if (rc <
sizeof(
buf))
2021#if defined(WAIT_USE_SELF_PIPE)
#define pg_memory_barrier()
#define StaticAssertStmt(condition, errmessage)
int errcode_for_socket_access(void)
int errmsg(const char *fmt,...)
#define ereport(elevel,...)
void ReleaseExternalFD(void)
bool AcquireExternalFD(void)
void ReserveExternalFD(void)
Assert(PointerIsAligned(start, uint64))
#define INSTR_TIME_SET_CURRENT(t)
#define INSTR_TIME_SUBTRACT(x, y)
#define INSTR_TIME_GET_MILLISEC(t)
#define INSTR_TIME_SET_ZERO(t)
if(TABLE==NULL||TABLE_index==NULL)
void * MemoryContextAllocZero(MemoryContext context, Size size)
void pfree(void *pointer)
MemoryContext TopMemoryContext
bool PostmasterIsAliveInternal(void)
#define PostmasterIsAlive()
static Datum PointerGetDatum(const void *X)
static Pointer DatumGetPointer(Datum X)
int postmaster_alive_fds[2]
#define POSTMASTER_FD_WATCH
static int fd(const char *x, int i)
void ResourceOwnerForget(ResourceOwner owner, Datum value, const ResourceOwnerDesc *kind)
void ResourceOwnerRemember(ResourceOwner owner, Datum value, const ResourceOwnerDesc *kind)
void ResourceOwnerEnlarge(ResourceOwner owner)
#define RELEASE_PRIO_WAITEVENTSETS
@ RESOURCE_RELEASE_AFTER_LOCKS
void pgwin32_dispatch_queued_signals(void)
HANDLE pgwin32_signal_event
sig_atomic_t maybe_sleeping
bool exit_on_postmaster_death
static void pgstat_report_wait_start(uint32 wait_event_info)
static void pgstat_report_wait_end(void)
static void latch_sigurg_handler(SIGNAL_ARGS)
static void sendSelfPipeByte(void)
static void ResourceOwnerForgetWaitEventSet(ResourceOwner owner, WaitEventSet *set)
static int selfpipe_readfd
static const ResourceOwnerDesc wait_event_set_resowner_desc
void FreeWaitEventSetAfterFork(WaitEventSet *set)
static void WaitEventAdjustPoll(WaitEventSet *set, WaitEvent *event)
static int selfpipe_owner_pid
static int selfpipe_writefd
int GetNumRegisteredWaitEvents(WaitEventSet *set)
void WakeupOtherProc(int pid)
static void ResourceOwnerRememberWaitEventSet(ResourceOwner owner, WaitEventSet *set)
void ModifyWaitEvent(WaitEventSet *set, int pos, uint32 events, Latch *latch)
static int WaitEventSetWaitBlock(WaitEventSet *set, int cur_timeout, WaitEvent *occurred_events, int nevents)
static void ResOwnerReleaseWaitEventSet(Datum res)
void InitializeWaitEventSupport(void)
bool WaitEventSetCanReportClosed(void)
int AddWaitEventToSet(WaitEventSet *set, uint32 events, pgsocket fd, Latch *latch, void *user_data)
int WaitEventSetWait(WaitEventSet *set, long timeout, WaitEvent *occurred_events, int nevents, uint32 wait_event_info)
static volatile sig_atomic_t waiting
void FreeWaitEventSet(WaitEventSet *set)
WaitEventSet * CreateWaitEventSet(ResourceOwner resowner, int nevents)
#define WL_SOCKET_READABLE
#define WL_EXIT_ON_PM_DEATH
#define WL_SOCKET_CONNECTED
#define WL_POSTMASTER_DEATH
#define WL_SOCKET_WRITEABLE