PostgreSQL Source Code git master
Loading...
Searching...
No Matches
bgworker.c
Go to the documentation of this file.
1/*--------------------------------------------------------------------
2 * bgworker.c
3 * POSTGRES pluggable background workers implementation
4 *
5 * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
6 *
7 * IDENTIFICATION
8 * src/backend/postmaster/bgworker.c
9 *
10 *-------------------------------------------------------------------------
11 */
12
13#include "postgres.h"
14
15#include "access/parallel.h"
16#include "libpq/pqsignal.h"
17#include "miscadmin.h"
18#include "pgstat.h"
19#include "port/atomics.h"
24#include "storage/ipc.h"
25#include "storage/latch.h"
26#include "storage/lwlock.h"
27#include "storage/pmsignal.h"
28#include "storage/proc.h"
29#include "storage/procarray.h"
30#include "storage/procsignal.h"
31#include "storage/shmem.h"
32#include "tcop/tcopprot.h"
33#include "utils/ascii.h"
34#include "utils/memutils.h"
35#include "utils/ps_status.h"
36#include "utils/timeout.h"
37#include "utils/wait_event.h"
38
39/*
40 * The postmaster's list of registered background workers, in private memory.
41 */
43
44/*
45 * BackgroundWorkerSlots exist in shared memory and can be accessed (via
46 * the BackgroundWorkerArray) by both the postmaster and by regular backends.
47 * However, the postmaster cannot take locks, even spinlocks, because this
48 * might allow it to crash or become wedged if shared memory gets corrupted.
49 * Such an outcome is intolerable. Therefore, we need a lockless protocol
50 * for coordinating access to this data.
51 *
52 * The 'in_use' flag is used to hand off responsibility for the slot between
53 * the postmaster and the rest of the system. When 'in_use' is false,
54 * the postmaster will ignore the slot entirely, except for the 'in_use' flag
55 * itself, which it may read. In this state, regular backends may modify the
56 * slot. Once a backend sets 'in_use' to true, the slot becomes the
57 * responsibility of the postmaster. Regular backends may no longer modify it,
58 * but the postmaster may examine it. Thus, a backend initializing a slot
59 * must fully initialize the slot - and insert a write memory barrier - before
60 * marking it as in use.
61 *
62 * As an exception, however, even when the slot is in use, regular backends
63 * may set the 'terminate' flag for a slot, telling the postmaster not
64 * to restart it. Once the background worker is no longer running, the slot
65 * will be released for reuse.
66 *
67 * In addition to coordinating with the postmaster, backends modifying this
68 * data structure must coordinate with each other. Since they can take locks,
69 * this is straightforward: any backend wishing to manipulate a slot must
70 * take BackgroundWorkerLock in exclusive mode. Backends wishing to read
71 * data that might get concurrently modified by other backends should take
72 * this lock in shared mode. No matter what, backends reading this data
73 * structure must be able to tolerate concurrent modifications by the
74 * postmaster.
75 */
77{
78 bool in_use;
80 pid_t pid; /* InvalidPid = not started yet; 0 = dead */
81 uint64 generation; /* incremented when slot is recycled */
84
85/*
86 * In order to limit the total number of parallel workers (according to
87 * max_parallel_workers GUC), we maintain the number of active parallel
88 * workers. Since the postmaster cannot take locks, two variables are used for
89 * this purpose: the number of registered parallel workers (modified by the
90 * backends, protected by BackgroundWorkerLock) and the number of terminated
91 * parallel workers (modified only by the postmaster, lockless). The active
92 * number of parallel workers is the number of registered workers minus the
93 * terminated ones. These counters can of course overflow, but it's not
94 * important here since the subtraction will still give the right number.
95 */
103
109
111
112/*
113 * List of internal background worker entry points. We need this for
114 * reasons explained in LookupBackgroundWorkerFunction(), below.
115 */
116static const struct
117{
118 const char *fn_name;
121
122{
123 {
124 .fn_name = "ParallelWorkerMain",
125 .fn_addr = ParallelWorkerMain
126 },
127 {
128 .fn_name = "ApplyLauncherMain",
129 .fn_addr = ApplyLauncherMain
130 },
131 {
132 .fn_name = "ApplyWorkerMain",
133 .fn_addr = ApplyWorkerMain
134 },
135 {
136 .fn_name = "ParallelApplyWorkerMain",
137 .fn_addr = ParallelApplyWorkerMain
138 },
139 {
140 .fn_name = "TableSyncWorkerMain",
141 .fn_addr = TableSyncWorkerMain
142 },
143 {
144 .fn_name = "SequenceSyncWorkerMain",
145 .fn_addr = SequenceSyncWorkerMain
146 }
148
149/* Private functions. */
151
152
153/*
154 * Calculate shared memory needed.
155 */
156Size
158{
159 Size size;
160
161 /* Array of workers is variably sized. */
162 size = offsetof(BackgroundWorkerArray, slot);
164 sizeof(BackgroundWorkerSlot)));
165
166 return size;
167}
168
169/*
170 * Initialize shared memory.
171 */
172void
174{
175 bool found;
176
177 BackgroundWorkerData = ShmemInitStruct("Background Worker Data",
179 &found);
181 {
182 dlist_iter iter;
183 int slotno = 0;
184
188
189 /*
190 * Copy contents of worker list into shared memory. Record the shared
191 * memory slot assigned to each worker. This ensures a 1-to-1
192 * correspondence between the postmaster's private list and the array
193 * in shared memory.
194 */
196 {
199
200 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
202 slot->in_use = true;
203 slot->terminate = false;
204 slot->pid = InvalidPid;
205 slot->generation = 0;
206 rw->rw_shmem_slot = slotno;
207 rw->rw_worker.bgw_notify_pid = 0; /* might be reinit after crash */
208 memcpy(&slot->worker, &rw->rw_worker, sizeof(BackgroundWorker));
209 ++slotno;
210 }
211
212 /*
213 * Mark any remaining slots as not in use.
214 */
216 {
218
219 slot->in_use = false;
220 ++slotno;
221 }
222 }
223 else
224 Assert(found);
225}
226
227/*
228 * Search the postmaster's backend-private list of RegisteredBgWorker objects
229 * for the one that maps to the given slot number.
230 */
231static RegisteredBgWorker *
233{
234 dlist_iter iter;
235
237 {
239
240 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
241 if (rw->rw_shmem_slot == slotno)
242 return rw;
243 }
244
245 return NULL;
246}
247
248/*
249 * Notice changes to shared memory made by other backends.
250 * Accept new worker requests only if allow_new_workers is true.
251 *
252 * This code runs in the postmaster, so we must be very careful not to assume
253 * that shared memory contents are sane. Otherwise, a rogue backend could
254 * take out the postmaster.
255 */
256void
258{
259 int slotno;
260
261 /*
262 * The total number of slots stored in shared memory should match our
263 * notion of max_worker_processes. If it does not, something is very
264 * wrong. Further down, we always refer to this value as
265 * max_worker_processes, in case shared memory gets corrupted while we're
266 * looping.
267 */
269 {
270 ereport(LOG,
271 (errmsg("inconsistent background worker state (\"max_worker_processes\"=%d, total slots=%d)",
274 return;
275 }
276
277 /*
278 * Iterate through slots, looking for newly-registered workers or workers
279 * who must die.
280 */
282 {
285
286 if (!slot->in_use)
287 continue;
288
289 /*
290 * Make sure we don't see the in_use flag before the updated slot
291 * contents.
292 */
294
295 /* See whether we already know about this worker. */
297 if (rw != NULL)
298 {
299 /*
300 * In general, the worker data can't change after it's initially
301 * registered. However, someone can set the terminate flag.
302 */
303 if (slot->terminate && !rw->rw_terminate)
304 {
305 rw->rw_terminate = true;
306 if (rw->rw_pid != 0)
307 kill(rw->rw_pid, SIGTERM);
308 else
309 {
310 /* Report never-started, now-terminated worker as dead. */
312 }
313 }
314 continue;
315 }
316
317 /*
318 * If we aren't allowing new workers, then immediately mark it for
319 * termination; the next stanza will take care of cleaning it up.
320 * Doing this ensures that any process waiting for the worker will get
321 * awoken, even though the worker will never be allowed to run.
322 */
324 slot->terminate = true;
325
326 /*
327 * If the worker is marked for termination, we don't need to add it to
328 * the registered workers list; we can just free the slot. However, if
329 * bgw_notify_pid is set, the process that registered the worker may
330 * need to know that we've processed the terminate request, so be sure
331 * to signal it.
332 */
333 if (slot->terminate)
334 {
335 int notify_pid;
336
337 /*
338 * We need a memory barrier here to make sure that the load of
339 * bgw_notify_pid and the update of parallel_terminate_count
340 * complete before the store to in_use.
341 */
343 if ((slot->worker.bgw_flags & BGWORKER_CLASS_PARALLEL) != 0)
345 slot->pid = 0;
346
348 slot->in_use = false;
349
350 if (notify_pid != 0)
352
353 continue;
354 }
355
356 /*
357 * Copy the registration data into the registered workers list.
358 */
360 sizeof(RegisteredBgWorker),
362 if (rw == NULL)
363 {
364 ereport(LOG,
366 errmsg("out of memory")));
367 return;
368 }
369
370 /*
371 * Copy strings in a paranoid way. If shared memory is corrupted, the
372 * source data might not even be NUL-terminated.
373 */
375 slot->worker.bgw_name, BGW_MAXLEN);
377 slot->worker.bgw_type, BGW_MAXLEN);
382
383 /*
384 * Copy various fixed-size fields.
385 *
386 * flags, start_time, and restart_time are examined by the postmaster,
387 * but nothing too bad will happen if they are corrupted. The
388 * remaining fields will only be examined by the child process. It
389 * might crash, but we won't.
390 */
396
397 /*
398 * Copy the PID to be notified about state changes, but only if the
399 * postmaster knows about a backend with that PID. It isn't an error
400 * if the postmaster doesn't know about the PID, because the backend
401 * that requested the worker could have died (or been killed) just
402 * after doing so. Nonetheless, at least until we get some experience
403 * with how this plays out in the wild, log a message at a relative
404 * high debug level.
405 */
408 {
409 elog(DEBUG1, "worker notification PID %d is not valid",
410 (int) rw->rw_worker.bgw_notify_pid);
412 }
413
414 /* Initialize postmaster bookkeeping. */
415 rw->rw_pid = 0;
416 rw->rw_crashed_at = 0;
417 rw->rw_shmem_slot = slotno;
418 rw->rw_terminate = false;
419
420 /* Log it! */
422 (errmsg_internal("registering background worker \"%s\"",
423 rw->rw_worker.bgw_name)));
424
426 }
427}
428
429/*
430 * Forget about a background worker that's no longer needed.
431 *
432 * NOTE: The entry is unlinked from BackgroundWorkerList. If the caller is
433 * iterating through it, better use a mutable iterator!
434 *
435 * Caller is responsible for notifying bgw_notify_pid, if appropriate.
436 *
437 * This function must be invoked only in the postmaster.
438 */
439void
441{
443
446 Assert(slot->in_use);
447
448 /*
449 * We need a memory barrier here to make sure that the update of
450 * parallel_terminate_count completes before the store to in_use.
451 */
454
456 slot->in_use = false;
457
459 (errmsg_internal("unregistering background worker \"%s\"",
460 rw->rw_worker.bgw_name)));
461
463 pfree(rw);
464}
465
466/*
467 * Report the PID of a newly-launched background worker in shared memory.
468 *
469 * This function should only be called from the postmaster.
470 */
471void
483
484/*
485 * Report that the PID of a background worker is now zero because a
486 * previously-running background worker has exited.
487 *
488 * NOTE: The entry may be unlinked from BackgroundWorkerList. If the caller
489 * is iterating through it, better use a mutable iterator!
490 *
491 * This function should only be called from the postmaster.
492 */
493void
495{
497 int notify_pid;
498
501 slot->pid = rw->rw_pid;
503
504 /*
505 * If this worker is slated for deregistration, do that before notifying
506 * the process which started it. Otherwise, if that process tries to
507 * reuse the slot immediately, it might not be available yet. In theory
508 * that could happen anyway if the process checks slot->pid at just the
509 * wrong moment, but this makes the window narrower.
510 */
511 if (rw->rw_terminate ||
514
515 if (notify_pid != 0)
517}
518
519/*
520 * Cancel SIGUSR1 notifications for a PID belonging to an exiting backend.
521 *
522 * This function should only be called from the postmaster.
523 */
524void
526{
527 dlist_iter iter;
528
530 {
532
533 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
534 if (rw->rw_worker.bgw_notify_pid == pid)
536 }
537}
538
539/*
540 * Cancel any not-yet-started worker requests that have waiting processes.
541 *
542 * This is called during a normal ("smart" or "fast") database shutdown.
543 * After this point, no new background workers will be started, so anything
544 * that might be waiting for them needs to be kicked off its wait. We do
545 * that by canceling the bgworker registration entirely, which is perhaps
546 * overkill, but since we're shutting down it does not matter whether the
547 * registration record sticks around.
548 *
549 * This function should only be called from the postmaster.
550 */
551void
553{
555
557 {
560
561 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
564
565 /* If it's not yet started, and there's someone waiting ... */
566 if (slot->pid == InvalidPid &&
567 rw->rw_worker.bgw_notify_pid != 0)
568 {
569 /* ... then zap it, and notify the waiter */
571
573 if (notify_pid != 0)
575 }
576 }
577}
578
579/*
580 * Reset background worker crash state.
581 *
582 * We assume that, after a crash-and-restart cycle, background workers without
583 * the never-restart flag should be restarted immediately, instead of waiting
584 * for bgw_restart_time to elapse. On the other hand, workers with that flag
585 * should be forgotten immediately, since we won't ever restart them.
586 *
587 * This function should only be called from the postmaster.
588 */
589void
591{
593
595 {
597
598 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
599
601 {
602 /*
603 * Workers marked BGW_NEVER_RESTART shouldn't get relaunched after
604 * the crash, so forget about them. (If we wait until after the
605 * crash to forget about them, and they are parallel workers,
606 * parallel_terminate_count will get incremented after we've
607 * already zeroed parallel_register_count, which would be bad.)
608 */
610 }
611 else
612 {
613 /*
614 * The accounting which we do via parallel_register_count and
615 * parallel_terminate_count would get messed up if a worker marked
616 * parallel could survive a crash and restart cycle. All such
617 * workers should be marked BGW_NEVER_RESTART, and thus control
618 * should never reach this branch.
619 */
621
622 /*
623 * Allow this worker to be restarted immediately after we finish
624 * resetting.
625 */
626 rw->rw_crashed_at = 0;
627 rw->rw_pid = 0;
628
629 /*
630 * If there was anyone waiting for it, they're history.
631 */
633 }
634 }
635}
636
637/*
638 * Complain about the BackgroundWorker definition using error level elevel.
639 * Return true if it looks ok, false if not (unless elevel >= ERROR, in
640 * which case we won't return at all in the not-OK case).
641 */
642static bool
644{
645 /* sanity check for flags */
646
647 /*
648 * We used to support workers not connected to shared memory, but don't
649 * anymore. Thus this is a required flag now. We're not removing the flag
650 * for compatibility reasons and because the flag still provides some
651 * signal when reading code.
652 */
653 if (!(worker->bgw_flags & BGWORKER_SHMEM_ACCESS))
654 {
655 ereport(elevel,
657 errmsg("background worker \"%s\": background workers without shared memory access are not supported",
658 worker->bgw_name)));
659 return false;
660 }
661
663 {
665 {
666 ereport(elevel,
668 errmsg("background worker \"%s\": cannot request database access if starting at postmaster start",
669 worker->bgw_name)));
670 return false;
671 }
672
673 /* XXX other checks? */
674 }
675
676 /* Interruptible workers require a database connection */
677 if ((worker->bgw_flags & BGWORKER_INTERRUPTIBLE) &&
679 {
680 ereport(elevel,
682 errmsg("background worker \"%s\": cannot make background workers interruptible without database access",
683 worker->bgw_name)));
684 return false;
685 }
686
687 if ((worker->bgw_restart_time < 0 &&
689 (worker->bgw_restart_time > USECS_PER_DAY / 1000))
690 {
691 ereport(elevel,
693 errmsg("background worker \"%s\": invalid restart interval",
694 worker->bgw_name)));
695 return false;
696 }
697
698 /*
699 * Parallel workers may not be configured for restart, because the
700 * parallel_register_count/parallel_terminate_count accounting can't
701 * handle parallel workers lasting through a crash-and-restart cycle.
702 */
703 if (worker->bgw_restart_time != BGW_NEVER_RESTART &&
704 (worker->bgw_flags & BGWORKER_CLASS_PARALLEL) != 0)
705 {
706 ereport(elevel,
708 errmsg("background worker \"%s\": parallel workers may not be configured for restart",
709 worker->bgw_name)));
710 return false;
711 }
712
713 /*
714 * If bgw_type is not filled in, use bgw_name.
715 */
716 if (strcmp(worker->bgw_type, "") == 0)
717 strcpy(worker->bgw_type, worker->bgw_name);
718
719 return true;
720}
721
722/*
723 * Main entry point for background worker processes.
724 */
725void
727{
729 BackgroundWorker *worker;
731
732 if (startup_data == NULL)
733 elog(FATAL, "unable to find bgworker entry");
736 memcpy(worker, startup_data, sizeof(BackgroundWorker));
737
738 /*
739 * Now that we're done reading the startup data, release postmaster's
740 * working memory context.
741 */
743 {
746 }
747
748 MyBgworkerEntry = worker;
749 init_ps_display(worker->bgw_name);
750
752
753 /* Apply PostAuthDelay */
754 if (PostAuthDelay > 0)
755 pg_usleep(PostAuthDelay * 1000000L);
756
757 /*
758 * Set up signal handlers.
759 */
761 {
762 /*
763 * SIGINT is used to signal canceling the current action
764 */
768
769 /* XXX Any other handlers needed here? */
770 }
771 else
772 {
776 }
778 /* SIGQUIT handler was already set up by InitPostmasterChild */
780
781 InitializeTimeouts(); /* establishes SIGALRM handler */
782
786
787 /*
788 * If an exception is encountered, processing resumes here.
789 *
790 * We just need to clean up, report the error, and go away.
791 */
792 if (sigsetjmp(local_sigjmp_buf, 1) != 0)
793 {
794 /* Since not using PG_TRY, must reset error stack by hand */
796
797 /* Prevent interrupts while cleaning up */
799
800 /*
801 * sigsetjmp will have blocked all signals, but we may need to accept
802 * signals while communicating with our parallel leader. Once we've
803 * done HOLD_INTERRUPTS() it should be safe to unblock signals.
804 */
806
807 /* Report the error to the parallel leader and the server log */
809
810 /*
811 * Do we need more cleanup here? For shmem-connected bgworkers, we
812 * will call InitProcess below, which will install ProcKill as exit
813 * callback. That will take care of releasing locks, etc.
814 */
815
816 /* and go away */
817 proc_exit(1);
818 }
819
820 /* We can now handle ereport(ERROR) */
822
823 /*
824 * Create a per-backend PGPROC struct in shared memory. We must do this
825 * before we can use LWLocks or access any shared memory.
826 */
827 InitProcess();
828
829 /*
830 * Early initialization.
831 */
832 BaseInit();
833
834 /*
835 * Look up the entry point function, loading its library if necessary.
836 */
838 worker->bgw_function_name);
839
840 /*
841 * Note that in normal processes, we would call InitPostgres here. For a
842 * worker, however, we don't know what database to connect to, yet; so we
843 * need to wait until the user code does it via
844 * BackgroundWorkerInitializeConnection().
845 */
846
847 /*
848 * Now invoke the user-defined worker code
849 */
850 entrypt(worker->bgw_main_arg);
851
852 /* ... and if it returns, we're done */
853 proc_exit(0);
854}
855
856/*
857 * Connect background worker to a database.
858 */
859void
861{
863 bits32 init_flags = 0; /* never honor session_preload_libraries */
864
865 /* ignore datallowconn and ACL_CONNECT? */
866 if (flags & BGWORKER_BYPASS_ALLOWCONN)
868 /* ignore rolcanlogin? */
871
872 /* XXX is this the right errcode? */
876 errmsg("database connection requirement not indicated during registration")));
877
878 InitPostgres(dbname, InvalidOid, /* database to connect to */
879 username, InvalidOid, /* role to connect as */
881 NULL); /* no out_dbname */
882
883 /* it had better not gotten out of "init" mode yet */
886 (errmsg("invalid processing mode in background worker")));
888}
889
890/*
891 * Connect background worker to a database using OIDs.
892 */
893void
895{
897 bits32 init_flags = 0; /* never honor session_preload_libraries */
898
899 /* ignore datallowconn and ACL_CONNECT? */
900 if (flags & BGWORKER_BYPASS_ALLOWCONN)
902 /* ignore rolcanlogin? */
905
906 /* XXX is this the right errcode? */
910 errmsg("database connection requirement not indicated during registration")));
911
912 InitPostgres(NULL, dboid, /* database to connect to */
913 NULL, useroid, /* role to connect as */
915 NULL); /* no out_dbname */
916
917 /* it had better not gotten out of "init" mode yet */
920 (errmsg("invalid processing mode in background worker")));
922}
923
924/*
925 * Block/unblock signals in a background worker
926 */
927void
932
933void
938
939/*
940 * Register a new static background worker.
941 *
942 * This can only be called directly from postmaster or in the _PG_init
943 * function of a module library that's loaded by shared_preload_libraries;
944 * otherwise it will have no effect.
945 */
946void
948{
950 static int numworkers = 0;
951
952 /*
953 * Static background workers can only be registered in the postmaster
954 * process.
955 */
957 {
958 /*
959 * In EXEC_BACKEND or single-user mode, we process
960 * shared_preload_libraries in backend processes too. We cannot
961 * register static background workers at that stage, but many
962 * libraries' _PG_init() functions don't distinguish whether they're
963 * being loaded in the postmaster or in a backend, they just check
964 * process_shared_preload_libraries_in_progress. It's a bit sloppy,
965 * but for historical reasons we tolerate it. In EXEC_BACKEND mode,
966 * the background workers should already have been registered when the
967 * library was loaded in postmaster.
968 */
970 return;
971 ereport(LOG,
973 errmsg("background worker \"%s\": must be registered in \"shared_preload_libraries\"",
974 worker->bgw_name)));
975 return;
976 }
977
978 /*
979 * Cannot register static background workers after calling
980 * BackgroundWorkerShmemInit().
981 */
983 elog(ERROR, "cannot register background worker \"%s\" after shmem init",
984 worker->bgw_name);
985
987 (errmsg_internal("registering background worker \"%s\"", worker->bgw_name)));
988
989 if (!SanityCheckBackgroundWorker(worker, LOG))
990 return;
991
992 if (worker->bgw_notify_pid != 0)
993 {
994 ereport(LOG,
996 errmsg("background worker \"%s\": only dynamic background workers can request notification",
997 worker->bgw_name)));
998 return;
999 }
1000
1001 /*
1002 * Enforce maximum number of workers. Note this is overly restrictive: we
1003 * could allow more non-shmem-connected workers, because these don't count
1004 * towards the MAX_BACKENDS limit elsewhere. For now, it doesn't seem
1005 * important to relax this restriction.
1006 */
1008 {
1009 ereport(LOG,
1011 errmsg("too many background workers"),
1012 errdetail_plural("Up to %d background worker can be registered with the current settings.",
1013 "Up to %d background workers can be registered with the current settings.",
1016 errhint("Consider increasing the configuration parameter \"%s\".", "max_worker_processes")));
1017 return;
1018 }
1019
1020 /*
1021 * Copy the registration data into the registered workers list.
1022 */
1024 sizeof(RegisteredBgWorker),
1026 if (rw == NULL)
1027 {
1028 ereport(LOG,
1030 errmsg("out of memory")));
1031 return;
1032 }
1033
1034 rw->rw_worker = *worker;
1035 rw->rw_pid = 0;
1036 rw->rw_crashed_at = 0;
1037 rw->rw_terminate = false;
1038
1040}
1041
1042/*
1043 * Register a new background worker from a regular backend.
1044 *
1045 * Returns true on success and false on failure. Failure typically indicates
1046 * that no background worker slots are currently available.
1047 *
1048 * If handle != NULL, we'll set *handle to a pointer that can subsequently
1049 * be used as an argument to GetBackgroundWorkerPid(). The caller can
1050 * free this pointer using pfree(), if desired.
1051 */
1052bool
1054 BackgroundWorkerHandle **handle)
1055{
1056 int slotno;
1057 bool success = false;
1058 bool parallel;
1059 uint64 generation = 0;
1060
1061 /*
1062 * We can't register dynamic background workers from the postmaster. If
1063 * this is a standalone backend, we're the only process and can't start
1064 * any more. In a multi-process environment, it might be theoretically
1065 * possible, but we don't currently support it due to locking
1066 * considerations; see comments on the BackgroundWorkerSlot data
1067 * structure.
1068 */
1069 if (!IsUnderPostmaster)
1070 return false;
1071
1072 if (!SanityCheckBackgroundWorker(worker, ERROR))
1073 return false;
1074
1075 parallel = (worker->bgw_flags & BGWORKER_CLASS_PARALLEL) != 0;
1076
1078
1079 /*
1080 * If this is a parallel worker, check whether there are already too many
1081 * parallel workers; if so, don't register another one. Our view of
1082 * parallel_terminate_count may be slightly stale, but that doesn't really
1083 * matter: we would have gotten the same result if we'd arrived here
1084 * slightly earlier anyway. There's no help for it, either, since the
1085 * postmaster must not take locks; a memory barrier wouldn't guarantee
1086 * anything useful.
1087 */
1091 {
1096 return false;
1097 }
1098
1099 /*
1100 * Look for an unused slot. If we find one, grab it.
1101 */
1103 {
1105
1106 if (!slot->in_use)
1107 {
1108 memcpy(&slot->worker, worker, sizeof(BackgroundWorker));
1109 slot->pid = InvalidPid; /* indicates not started yet */
1110 slot->generation++;
1111 slot->terminate = false;
1112 generation = slot->generation;
1113 if (parallel)
1115
1116 /*
1117 * Make sure postmaster doesn't see the slot as in use before it
1118 * sees the new contents.
1119 */
1121
1122 slot->in_use = true;
1123 success = true;
1124 break;
1125 }
1126 }
1127
1129
1130 /* If we found a slot, tell the postmaster to notice the change. */
1131 if (success)
1133
1134 /*
1135 * If we found a slot and the user has provided a handle, initialize it.
1136 */
1137 if (success && handle)
1138 {
1140 (*handle)->slot = slotno;
1141 (*handle)->generation = generation;
1142 }
1143
1144 return success;
1145}
1146
1147/*
1148 * Get the PID of a dynamically-registered background worker.
1149 *
1150 * If the worker is determined to be running, the return value will be
1151 * BGWH_STARTED and *pidp will get the PID of the worker process. If the
1152 * postmaster has not yet attempted to start the worker, the return value will
1153 * be BGWH_NOT_YET_STARTED. Otherwise, the return value is BGWH_STOPPED.
1154 *
1155 * BGWH_STOPPED can indicate either that the worker is temporarily stopped
1156 * (because it is configured for automatic restart and exited non-zero),
1157 * or that the worker is permanently stopped (because it exited with exit
1158 * code 0, or was not configured for automatic restart), or even that the
1159 * worker was unregistered without ever starting (either because startup
1160 * failed and the worker is not configured for automatic restart, or because
1161 * TerminateBackgroundWorker was used before the worker was successfully
1162 * started).
1163 */
1166{
1168 pid_t pid;
1169
1170 Assert(handle->slot < max_worker_processes);
1171 slot = &BackgroundWorkerData->slot[handle->slot];
1172
1173 /*
1174 * We could probably arrange to synchronize access to data using memory
1175 * barriers only, but for now, let's just keep it simple and grab the
1176 * lock. It seems unlikely that there will be enough traffic here to
1177 * result in meaningful contention.
1178 */
1180
1181 /*
1182 * The generation number can't be concurrently changed while we hold the
1183 * lock. The pid, which is updated by the postmaster, can change at any
1184 * time, but we assume such changes are atomic. So the value we read
1185 * won't be garbage, but it might be out of date by the time the caller
1186 * examines it (but that's unavoidable anyway).
1187 *
1188 * The in_use flag could be in the process of changing from true to false,
1189 * but if it is already false then it can't change further.
1190 */
1191 if (handle->generation != slot->generation || !slot->in_use)
1192 pid = 0;
1193 else
1194 pid = slot->pid;
1195
1196 /* All done. */
1198
1199 if (pid == 0)
1200 return BGWH_STOPPED;
1201 else if (pid == InvalidPid)
1202 return BGWH_NOT_YET_STARTED;
1203 *pidp = pid;
1204 return BGWH_STARTED;
1205}
1206
1207/*
1208 * Wait for a background worker to start up.
1209 *
1210 * This is like GetBackgroundWorkerPid(), except that if the worker has not
1211 * yet started, we wait for it to do so; thus, BGWH_NOT_YET_STARTED is never
1212 * returned. However, if the postmaster has died, we give up and return
1213 * BGWH_POSTMASTER_DIED, since it that case we know that startup will not
1214 * take place.
1215 *
1216 * The caller *must* have set our PID as the worker's bgw_notify_pid,
1217 * else we will not be awoken promptly when the worker's state changes.
1218 */
1221{
1222 BgwHandleStatus status;
1223 int rc;
1224
1225 for (;;)
1226 {
1227 pid_t pid;
1228
1230
1231 status = GetBackgroundWorkerPid(handle, &pid);
1232 if (status == BGWH_STARTED)
1233 *pidp = pid;
1234 if (status != BGWH_NOT_YET_STARTED)
1235 break;
1236
1237 rc = WaitLatch(MyLatch,
1240
1241 if (rc & WL_POSTMASTER_DEATH)
1242 {
1243 status = BGWH_POSTMASTER_DIED;
1244 break;
1245 }
1246
1248 }
1249
1250 return status;
1251}
1252
1253/*
1254 * Wait for a background worker to stop.
1255 *
1256 * If the worker hasn't yet started, or is running, we wait for it to stop
1257 * and then return BGWH_STOPPED. However, if the postmaster has died, we give
1258 * up and return BGWH_POSTMASTER_DIED, because it's the postmaster that
1259 * notifies us when a worker's state changes.
1260 *
1261 * The caller *must* have set our PID as the worker's bgw_notify_pid,
1262 * else we will not be awoken promptly when the worker's state changes.
1263 */
1266{
1267 BgwHandleStatus status;
1268 int rc;
1269
1270 for (;;)
1271 {
1272 pid_t pid;
1273
1275
1276 status = GetBackgroundWorkerPid(handle, &pid);
1277 if (status == BGWH_STOPPED)
1278 break;
1279
1280 rc = WaitLatch(MyLatch,
1283
1284 if (rc & WL_POSTMASTER_DEATH)
1285 {
1286 status = BGWH_POSTMASTER_DIED;
1287 break;
1288 }
1289
1291 }
1292
1293 return status;
1294}
1295
1296/*
1297 * Instruct the postmaster to terminate a background worker.
1298 *
1299 * Note that it's safe to do this without regard to whether the worker is
1300 * still running, or even if the worker may already have exited and been
1301 * unregistered.
1302 */
1303void
1305{
1307 bool signal_postmaster = false;
1308
1309 Assert(handle->slot < max_worker_processes);
1310 slot = &BackgroundWorkerData->slot[handle->slot];
1311
1312 /* Set terminate flag in shared memory, unless slot has been reused. */
1314 if (handle->generation == slot->generation)
1315 {
1316 slot->terminate = true;
1317 signal_postmaster = true;
1318 }
1320
1321 /* Make sure the postmaster notices the change to shared memory. */
1324}
1325
1326/*
1327 * Look up (and possibly load) a bgworker entry point function.
1328 *
1329 * For functions contained in the core code, we use library name "postgres"
1330 * and consult the InternalBGWorkers array. External functions are
1331 * looked up, and loaded if necessary, using load_external_function().
1332 *
1333 * The point of this is to pass function names as strings across process
1334 * boundaries. We can't pass actual function addresses because of the
1335 * possibility that the function has been loaded at a different address
1336 * in a different process. This is obviously a hazard for functions in
1337 * loadable libraries, but it can happen even for functions in the core code
1338 * on platforms using EXEC_BACKEND (e.g., Windows).
1339 *
1340 * At some point it might be worthwhile to get rid of InternalBGWorkers[]
1341 * in favor of applying load_external_function() for core functions too;
1342 * but that raises portability issues that are not worth addressing now.
1343 */
1344static bgworker_main_type
1346{
1347 /*
1348 * If the function is to be loaded from postgres itself, search the
1349 * InternalBGWorkers array.
1350 */
1351 if (strcmp(libraryname, "postgres") == 0)
1352 {
1353 int i;
1354
1355 for (i = 0; i < lengthof(InternalBGWorkers); i++)
1356 {
1358 return InternalBGWorkers[i].fn_addr;
1359 }
1360
1361 /* We can only reach this by programming error. */
1362 elog(ERROR, "internal function \"%s\" not found", funcname);
1363 }
1364
1365 /* Otherwise load from external library. */
1366 return (bgworker_main_type)
1368}
1369
1370/*
1371 * Given a PID, get the bgw_type of the background worker. Returns NULL if
1372 * not a valid background worker.
1373 *
1374 * The return value is in static memory belonging to this function, so it has
1375 * to be used before calling this function again. This is so that the caller
1376 * doesn't have to worry about the background worker locking protocol.
1377 */
1378const char *
1380{
1381 int slotno;
1382 bool found = false;
1383 static char result[BGW_MAXLEN];
1384
1386
1388 {
1390
1391 if (slot->pid > 0 && slot->pid == pid)
1392 {
1393 strcpy(result, slot->worker.bgw_type);
1394 found = true;
1395 break;
1396 }
1397 }
1398
1400
1401 if (!found)
1402 return NULL;
1403
1404 return result;
1405}
1406
1407/*
1408 * Terminate all background workers connected to the given database, if the
1409 * workers can be interrupted.
1410 */
1411void
1413{
1414 bool signal_postmaster = false;
1415
1416 elog(DEBUG1, "attempting worker termination for database %u",
1417 databaseId);
1418
1420
1421 /*
1422 * Iterate through slots, looking for workers connected to the given
1423 * database.
1424 */
1426 {
1428
1429 if (slot->in_use &&
1431 {
1432 PGPROC *proc = BackendPidGetProc(slot->pid);
1433
1434 if (proc && proc->databaseId == databaseId)
1435 {
1436 slot->terminate = true;
1437 signal_postmaster = true;
1438
1439 elog(DEBUG1, "termination requested for worker (PID %d) on database %u",
1440 (int) slot->pid, databaseId);
1441 }
1442 }
1443 }
1444
1446
1447 /* Make sure the postmaster notices the change to shared memory. */
1450}
void ParallelApplyWorkerMain(Datum main_arg)
void ascii_safe_strlcpy(char *dest, const char *src, size_t destsiz)
Definition ascii.c:174
#define pg_memory_barrier()
Definition atomics.h:141
#define pg_read_barrier()
Definition atomics.h:154
#define pg_write_barrier()
Definition atomics.h:155
void ParallelWorkerMain(Datum main_arg)
Definition parallel.c:1301
sigset_t UnBlockSig
Definition pqsignal.c:22
sigset_t BlockSig
Definition pqsignal.c:23
void ApplyWorkerMain(Datum main_arg)
Definition worker.c:5986
void RegisterBackgroundWorker(BackgroundWorker *worker)
Definition bgworker.c:947
BgwHandleStatus WaitForBackgroundWorkerStartup(BackgroundWorkerHandle *handle, pid_t *pidp)
Definition bgworker.c:1220
void BackgroundWorkerInitializeConnection(const char *dbname, const char *username, uint32 flags)
Definition bgworker.c:860
static bool SanityCheckBackgroundWorker(BackgroundWorker *worker, int elevel)
Definition bgworker.c:643
void ReportBackgroundWorkerPID(RegisteredBgWorker *rw)
Definition bgworker.c:472
void TerminateBackgroundWorker(BackgroundWorkerHandle *handle)
Definition bgworker.c:1304
static const struct @18 InternalBGWorkers[]
void TerminateBackgroundWorkersForDatabase(Oid databaseId)
Definition bgworker.c:1412
void ReportBackgroundWorkerExit(RegisteredBgWorker *rw)
Definition bgworker.c:494
BgwHandleStatus WaitForBackgroundWorkerShutdown(BackgroundWorkerHandle *handle)
Definition bgworker.c:1265
void ResetBackgroundWorkerCrashTimes(void)
Definition bgworker.c:590
void BackgroundWorkerShmemInit(void)
Definition bgworker.c:173
void BackgroundWorkerUnblockSignals(void)
Definition bgworker.c:934
void BackgroundWorkerInitializeConnectionByOid(Oid dboid, Oid useroid, uint32 flags)
Definition bgworker.c:894
void BackgroundWorkerBlockSignals(void)
Definition bgworker.c:928
dlist_head BackgroundWorkerList
Definition bgworker.c:42
void ForgetBackgroundWorker(RegisteredBgWorker *rw)
Definition bgworker.c:440
const char * fn_name
Definition bgworker.c:118
BgwHandleStatus GetBackgroundWorkerPid(BackgroundWorkerHandle *handle, pid_t *pidp)
Definition bgworker.c:1165
static BackgroundWorkerArray * BackgroundWorkerData
Definition bgworker.c:110
static RegisteredBgWorker * FindRegisteredWorkerBySlotNumber(int slotno)
Definition bgworker.c:232
static bgworker_main_type LookupBackgroundWorkerFunction(const char *libraryname, const char *funcname)
Definition bgworker.c:1345
void BackgroundWorkerStopNotifications(pid_t pid)
Definition bgworker.c:525
Size BackgroundWorkerShmemSize(void)
Definition bgworker.c:157
void BackgroundWorkerStateChange(bool allow_new_workers)
Definition bgworker.c:257
const char * GetBackgroundWorkerTypeByPid(pid_t pid)
Definition bgworker.c:1379
bool RegisterDynamicBackgroundWorker(BackgroundWorker *worker, BackgroundWorkerHandle **handle)
Definition bgworker.c:1053
void BackgroundWorkerMain(const void *startup_data, size_t startup_data_len)
Definition bgworker.c:726
bgworker_main_type fn_addr
Definition bgworker.c:119
void ForgetUnstartedBackgroundWorkers(void)
Definition bgworker.c:552
#define BGW_NEVER_RESTART
Definition bgworker.h:92
#define BGWORKER_BYPASS_ROLELOGINCHECK
Definition bgworker.h:167
#define BGW_EXTRALEN
Definition bgworker.h:94
#define BGWORKER_CLASS_PARALLEL
Definition bgworker.h:75
#define BGWORKER_INTERRUPTIBLE
Definition bgworker.h:67
BgwHandleStatus
Definition bgworker.h:111
@ BGWH_POSTMASTER_DIED
Definition bgworker.h:115
@ BGWH_STARTED
Definition bgworker.h:112
@ BGWH_NOT_YET_STARTED
Definition bgworker.h:113
@ BGWH_STOPPED
Definition bgworker.h:114
@ BgWorkerStart_PostmasterStart
Definition bgworker.h:86
#define BGWORKER_BACKEND_DATABASE_CONNECTION
Definition bgworker.h:60
#define BGWORKER_BYPASS_ALLOWCONN
Definition bgworker.h:166
#define BGWORKER_SHMEM_ACCESS
Definition bgworker.h:53
void(* bgworker_main_type)(Datum main_arg)
Definition bgworker.h:79
#define BGW_MAXLEN
Definition bgworker.h:93
#define MAX_PARALLEL_WORKER_LIMIT
#define Assert(condition)
Definition c.h:945
#define FLEXIBLE_ARRAY_MEMBER
Definition c.h:552
uint32 bits32
Definition c.h:627
uint64_t uint64
Definition c.h:619
uint32_t uint32
Definition c.h:618
#define lengthof(array)
Definition c.h:875
size_t Size
Definition c.h:691
#define USECS_PER_DAY
Definition timestamp.h:131
void * load_external_function(const char *filename, const char *funcname, bool signalNotFound, void **filehandle)
Definition dfmgr.c:95
void EmitErrorReport(void)
Definition elog.c:1882
ErrorContextCallback * error_context_stack
Definition elog.c:99
int errcode(int sqlerrcode)
Definition elog.c:874
sigjmp_buf * PG_exception_stack
Definition elog.c:101
#define LOG
Definition elog.h:31
int errhint(const char *fmt,...) pg_attribute_printf(1
#define FATAL
Definition elog.h:41
int int errmsg_internal(const char *fmt,...) pg_attribute_printf(1
#define DEBUG1
Definition elog.h:30
#define ERROR
Definition elog.h:39
#define elog(elevel,...)
Definition elog.h:226
#define ereport(elevel,...)
Definition elog.h:150
int errdetail_plural(const char *fmt_singular, const char *fmt_plural, unsigned long n,...) pg_attribute_printf(1
#define MCXT_ALLOC_ZERO
Definition fe_memutils.h:30
#define palloc_object(type)
Definition fe_memutils.h:74
#define MCXT_ALLOC_NO_OOM
Definition fe_memutils.h:29
bool IsUnderPostmaster
Definition globals.c:120
int max_parallel_workers
Definition globals.c:145
bool IsPostmasterEnvironment
Definition globals.c:119
struct Latch * MyLatch
Definition globals.c:63
int max_worker_processes
Definition globals.c:144
#define dlist_foreach(iter, lhead)
Definition ilist.h:623
static void dlist_delete(dlist_node *node)
Definition ilist.h:405
static void dlist_push_head(dlist_head *head, dlist_node *node)
Definition ilist.h:347
#define dlist_foreach_modify(iter, lhead)
Definition ilist.h:640
#define DLIST_STATIC_INIT(name)
Definition ilist.h:281
#define dlist_container(type, membername, ptr)
Definition ilist.h:593
#define funcname
static bool success
Definition initdb.c:188
static char * username
Definition initdb.c:153
void proc_exit(int code)
Definition ipc.c:105
int i
Definition isn.c:77
void ResetLatch(Latch *latch)
Definition latch.c:374
int WaitLatch(Latch *latch, int wakeEvents, long timeout, uint32 wait_event_info)
Definition latch.c:172
void ApplyLauncherMain(Datum main_arg)
Definition launcher.c:1205
bool LWLockAcquire(LWLock *lock, LWLockMode mode)
Definition lwlock.c:1177
void LWLockRelease(LWLock *lock)
Definition lwlock.c:1794
@ LW_SHARED
Definition lwlock.h:113
@ LW_EXCLUSIVE
Definition lwlock.h:112
void * MemoryContextAlloc(MemoryContext context, Size size)
Definition mcxt.c:1232
void pfree(void *pointer)
Definition mcxt.c:1616
MemoryContext TopMemoryContext
Definition mcxt.c:166
void * MemoryContextAllocExtended(MemoryContext context, Size size, int flags)
Definition mcxt.c:1289
MemoryContext PostmasterContext
Definition mcxt.c:168
void MemoryContextDelete(MemoryContext context)
Definition mcxt.c:472
@ NormalProcessing
Definition miscadmin.h:472
@ InitProcessing
Definition miscadmin.h:471
#define GetProcessingMode()
Definition miscadmin.h:481
#define CHECK_FOR_INTERRUPTS()
Definition miscadmin.h:123
#define HOLD_INTERRUPTS()
Definition miscadmin.h:134
#define IsInitProcessingMode()
Definition miscadmin.h:478
#define SetProcessingMode(mode)
Definition miscadmin.h:483
#define INIT_PG_OVERRIDE_ROLE_LOGIN
Definition miscadmin.h:501
#define INIT_PG_OVERRIDE_ALLOW_CONNS
Definition miscadmin.h:500
#define InvalidPid
Definition miscadmin.h:32
bool process_shared_preload_libraries_in_progress
Definition miscinit.c:1787
static char * errmsg
#define MAXPGPATH
#define die(msg)
void SendPostmasterSignal(PMSignalReason reason)
Definition pmsignal.c:165
@ PMSIGNAL_BACKGROUND_WORKER_CHANGE
Definition pmsignal.h:41
#define pqsignal
Definition port.h:547
int PostAuthDelay
Definition postgres.c:102
void FloatExceptionHandler(SIGNAL_ARGS)
Definition postgres.c:3059
void StatementCancelHandler(SIGNAL_ARGS)
Definition postgres.c:3042
#define InvalidOid
unsigned int Oid
void BaseInit(void)
Definition postinit.c:616
void InitPostgres(const char *in_dbname, Oid dboid, const char *username, Oid useroid, bits32 flags, char *out_dbname)
Definition postinit.c:719
BackgroundWorker * MyBgworkerEntry
Definition postmaster.c:200
bool PostmasterMarkPIDForWorkerNotify(int pid)
static int fb(int x)
PGPROC * BackendPidGetProc(int pid)
Definition procarray.c:3156
void procsignal_sigusr1_handler(SIGNAL_ARGS)
Definition procsignal.c:680
void init_ps_display(const char *fixed_part)
Definition ps_status.c:285
void SequenceSyncWorkerMain(Datum main_arg)
Size add_size(Size s1, Size s2)
Definition shmem.c:485
Size mul_size(Size s1, Size s2)
Definition shmem.c:500
void * ShmemInitStruct(const char *name, Size size, bool *foundPtr)
Definition shmem.c:381
void pg_usleep(long microsec)
Definition signal.c:53
void InitProcess(void)
Definition proc.c:380
char * dbname
Definition streamutil.c:49
uint32 parallel_terminate_count
Definition bgworker.c:100
uint32 parallel_register_count
Definition bgworker.c:99
BackgroundWorkerSlot slot[FLEXIBLE_ARRAY_MEMBER]
Definition bgworker.c:101
BackgroundWorker worker
Definition bgworker.c:82
char bgw_function_name[BGW_MAXLEN]
Definition bgworker.h:104
char bgw_name[BGW_MAXLEN]
Definition bgworker.h:98
char bgw_type[BGW_MAXLEN]
Definition bgworker.h:99
BgWorkerStartTime bgw_start_time
Definition bgworker.h:101
char bgw_extra[BGW_EXTRALEN]
Definition bgworker.h:106
pid_t bgw_notify_pid
Definition bgworker.h:107
char bgw_library_name[MAXPGPATH]
Definition bgworker.h:103
Definition proc.h:176
Oid databaseId
Definition proc.h:198
BackgroundWorker rw_worker
dlist_node * cur
Definition ilist.h:179
dlist_node * cur
Definition ilist.h:200
void TableSyncWorkerMain(Datum main_arg)
Definition tablesync.c:1577
void InitializeTimeouts(void)
Definition timeout.c:470
#define WL_LATCH_SET
#define WL_POSTMASTER_DEATH
#define SIGCHLD
Definition win32_port.h:168
#define SIGHUP
Definition win32_port.h:158
#define SIGPIPE
Definition win32_port.h:163
#define kill(pid, sig)
Definition win32_port.h:490
#define SIGUSR1
Definition win32_port.h:170
#define SIGUSR2
Definition win32_port.h:171