PostgreSQL Source Code git master
Loading...
Searching...
No Matches
bgworker.c
Go to the documentation of this file.
1/*--------------------------------------------------------------------
2 * bgworker.c
3 * POSTGRES pluggable background workers implementation
4 *
5 * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
6 *
7 * IDENTIFICATION
8 * src/backend/postmaster/bgworker.c
9 *
10 *-------------------------------------------------------------------------
11 */
12
13#include "postgres.h"
14
15#include "access/parallel.h"
16#include "commands/repack.h"
17#include "libpq/pqsignal.h"
18#include "miscadmin.h"
19#include "pgstat.h"
20#include "port/atomics.h"
26#include "storage/ipc.h"
27#include "storage/latch.h"
28#include "storage/lwlock.h"
29#include "storage/pmsignal.h"
30#include "storage/proc.h"
31#include "storage/procarray.h"
32#include "storage/procsignal.h"
33#include "storage/shmem.h"
34#include "storage/subsystems.h"
35#include "tcop/tcopprot.h"
36#include "utils/ascii.h"
37#include "utils/memutils.h"
38#include "utils/ps_status.h"
39#include "utils/timeout.h"
40#include "utils/wait_event.h"
41
42/*
43 * The postmaster's list of registered background workers, in private memory.
44 */
46
47/*
48 * BackgroundWorkerSlots exist in shared memory and can be accessed (via
49 * the BackgroundWorkerArray) by both the postmaster and by regular backends.
50 * However, the postmaster cannot take locks, even spinlocks, because this
51 * might allow it to crash or become wedged if shared memory gets corrupted.
52 * Such an outcome is intolerable. Therefore, we need a lockless protocol
53 * for coordinating access to this data.
54 *
55 * The 'in_use' flag is used to hand off responsibility for the slot between
56 * the postmaster and the rest of the system. When 'in_use' is false,
57 * the postmaster will ignore the slot entirely, except for the 'in_use' flag
58 * itself, which it may read. In this state, regular backends may modify the
59 * slot. Once a backend sets 'in_use' to true, the slot becomes the
60 * responsibility of the postmaster. Regular backends may no longer modify it,
61 * but the postmaster may examine it. Thus, a backend initializing a slot
62 * must fully initialize the slot - and insert a write memory barrier - before
63 * marking it as in use.
64 *
65 * As an exception, however, even when the slot is in use, regular backends
66 * may set the 'terminate' flag for a slot, telling the postmaster not
67 * to restart it. Once the background worker is no longer running, the slot
68 * will be released for reuse.
69 *
70 * In addition to coordinating with the postmaster, backends modifying this
71 * data structure must coordinate with each other. Since they can take locks,
72 * this is straightforward: any backend wishing to manipulate a slot must
73 * take BackgroundWorkerLock in exclusive mode. Backends wishing to read
74 * data that might get concurrently modified by other backends should take
75 * this lock in shared mode. No matter what, backends reading this data
76 * structure must be able to tolerate concurrent modifications by the
77 * postmaster.
78 */
80{
81 bool in_use;
83 pid_t pid; /* InvalidPid = not started yet; 0 = dead */
84 uint64 generation; /* incremented when slot is recycled */
87
88/*
89 * In order to limit the total number of parallel workers (according to
90 * max_parallel_workers GUC), we maintain the number of active parallel
91 * workers. Since the postmaster cannot take locks, two variables are used for
92 * this purpose: the number of registered parallel workers (modified by the
93 * backends, protected by BackgroundWorkerLock) and the number of terminated
94 * parallel workers (modified only by the postmaster, lockless). The active
95 * number of parallel workers is the number of registered workers minus the
96 * terminated ones. These counters can of course overflow, but it's not
97 * important here since the subtraction will still give the right number.
98 */
106
112
114
115static void BackgroundWorkerShmemRequest(void *arg);
116static void BackgroundWorkerShmemInit(void *arg);
117
122
123/*
124 * List of internal background worker entry points. We need this for
125 * reasons explained in LookupBackgroundWorkerFunction(), below.
126 */
127static const struct
128{
129 const char *fn_name;
132
133{
134 {
135 .fn_name = "ApplyLauncherMain",
136 .fn_addr = ApplyLauncherMain
137 },
138 {
139 .fn_name = "ApplyWorkerMain",
140 .fn_addr = ApplyWorkerMain
141 },
142 {
143 .fn_name = "ParallelApplyWorkerMain",
144 .fn_addr = ParallelApplyWorkerMain
145 },
146 {
147 .fn_name = "ParallelWorkerMain",
148 .fn_addr = ParallelWorkerMain
149 },
150 {
151 .fn_name = "RepackWorkerMain",
152 .fn_addr = RepackWorkerMain
153 },
154 {
155 .fn_name = "SequenceSyncWorkerMain",
156 .fn_addr = SequenceSyncWorkerMain
157 },
158 {
159 .fn_name = "TableSyncWorkerMain",
160 .fn_addr = TableSyncWorkerMain
161 },
162 {
163 .fn_name = "DataChecksumsWorkerLauncherMain",
165 },
166 {
167 .fn_name = "DataChecksumsWorkerMain",
168 .fn_addr = DataChecksumsWorkerMain
169 }
171
172/* Private functions. */
174
175
176/*
177 * Register shared memory needed for background workers.
178 */
179static void
181{
182 Size size;
183
184 /* Array of workers is variably sized. */
185 size = offsetof(BackgroundWorkerArray, slot);
187 sizeof(BackgroundWorkerSlot)));
188 ShmemRequestStruct(.name = "Background Worker Data",
189 .size = size,
190 .ptr = (void **) &BackgroundWorkerData,
191 );
192}
193
194/*
195 * Initialize shared memory for background workers.
196 */
197static void
199{
200 dlist_iter iter;
201 int slotno = 0;
202
206
207 /*
208 * Copy contents of worker list into shared memory. Record the shared
209 * memory slot assigned to each worker. This ensures a 1-to-1
210 * correspondence between the postmaster's private list and the array in
211 * shared memory.
212 */
214 {
217
218 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
220 slot->in_use = true;
221 slot->terminate = false;
222 slot->pid = InvalidPid;
223 slot->generation = 0;
224 rw->rw_shmem_slot = slotno;
225 rw->rw_worker.bgw_notify_pid = 0; /* might be reinit after crash */
226 memcpy(&slot->worker, &rw->rw_worker, sizeof(BackgroundWorker));
227 ++slotno;
228 }
229
230 /*
231 * Mark any remaining slots as not in use.
232 */
234 {
236
237 slot->in_use = false;
238 ++slotno;
239 }
240}
241
242/*
243 * Search the postmaster's backend-private list of RegisteredBgWorker objects
244 * for the one that maps to the given slot number.
245 */
246static RegisteredBgWorker *
248{
249 dlist_iter iter;
250
252 {
254
255 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
256 if (rw->rw_shmem_slot == slotno)
257 return rw;
258 }
259
260 return NULL;
261}
262
263/*
264 * Notice changes to shared memory made by other backends.
265 * Accept new worker requests only if allow_new_workers is true.
266 *
267 * This code runs in the postmaster, so we must be very careful not to assume
268 * that shared memory contents are sane. Otherwise, a rogue backend could
269 * take out the postmaster.
270 */
271void
273{
274 int slotno;
275
276 /*
277 * The total number of slots stored in shared memory should match our
278 * notion of max_worker_processes. If it does not, something is very
279 * wrong. Further down, we always refer to this value as
280 * max_worker_processes, in case shared memory gets corrupted while we're
281 * looping.
282 */
284 {
285 ereport(LOG,
286 (errmsg("inconsistent background worker state (\"max_worker_processes\"=%d, total slots=%d)",
289 return;
290 }
291
292 /*
293 * Iterate through slots, looking for newly-registered workers or workers
294 * who must die.
295 */
297 {
300
301 if (!slot->in_use)
302 continue;
303
304 /*
305 * Make sure we don't see the in_use flag before the updated slot
306 * contents.
307 */
309
310 /* See whether we already know about this worker. */
312 if (rw != NULL)
313 {
314 /*
315 * In general, the worker data can't change after it's initially
316 * registered. However, someone can set the terminate flag.
317 */
318 if (slot->terminate && !rw->rw_terminate)
319 {
320 rw->rw_terminate = true;
321 if (rw->rw_pid != 0)
322 kill(rw->rw_pid, SIGTERM);
323 else
324 {
325 /* Report never-started, now-terminated worker as dead. */
327 }
328 }
329 continue;
330 }
331
332 /*
333 * If we aren't allowing new workers, then immediately mark it for
334 * termination; the next stanza will take care of cleaning it up.
335 * Doing this ensures that any process waiting for the worker will get
336 * awoken, even though the worker will never be allowed to run.
337 */
339 slot->terminate = true;
340
341 /*
342 * If the worker is marked for termination, we don't need to add it to
343 * the registered workers list; we can just free the slot. However, if
344 * bgw_notify_pid is set, the process that registered the worker may
345 * need to know that we've processed the terminate request, so be sure
346 * to signal it.
347 */
348 if (slot->terminate)
349 {
350 int notify_pid;
351
352 /*
353 * We need a memory barrier here to make sure that the load of
354 * bgw_notify_pid and the update of parallel_terminate_count
355 * complete before the store to in_use.
356 */
358 if ((slot->worker.bgw_flags & BGWORKER_CLASS_PARALLEL) != 0)
360 slot->pid = 0;
361
363 slot->in_use = false;
364
365 if (notify_pid != 0)
367
368 continue;
369 }
370
371 /*
372 * Copy the registration data into the registered workers list.
373 */
375 sizeof(RegisteredBgWorker),
377 if (rw == NULL)
378 {
379 ereport(LOG,
381 errmsg("out of memory")));
382 return;
383 }
384
385 /*
386 * Copy strings in a paranoid way. If shared memory is corrupted, the
387 * source data might not even be NUL-terminated.
388 */
390 slot->worker.bgw_name, BGW_MAXLEN);
392 slot->worker.bgw_type, BGW_MAXLEN);
397
398 /*
399 * Copy various fixed-size fields.
400 *
401 * flags, start_time, and restart_time are examined by the postmaster,
402 * but nothing too bad will happen if they are corrupted. The
403 * remaining fields will only be examined by the child process. It
404 * might crash, but we won't.
405 */
411
412 /*
413 * Copy the PID to be notified about state changes, but only if the
414 * postmaster knows about a backend with that PID. It isn't an error
415 * if the postmaster doesn't know about the PID, because the backend
416 * that requested the worker could have died (or been killed) just
417 * after doing so. Nonetheless, at least until we get some experience
418 * with how this plays out in the wild, log a message at a relative
419 * high debug level.
420 */
423 {
424 elog(DEBUG1, "worker notification PID %d is not valid",
425 (int) rw->rw_worker.bgw_notify_pid);
427 }
428
429 /* Initialize postmaster bookkeeping. */
430 rw->rw_pid = 0;
431 rw->rw_crashed_at = 0;
432 rw->rw_shmem_slot = slotno;
433 rw->rw_terminate = false;
434
435 /* Log it! */
437 (errmsg_internal("registering background worker \"%s\"",
438 rw->rw_worker.bgw_name)));
439
441 }
442}
443
444/*
445 * Forget about a background worker that's no longer needed.
446 *
447 * NOTE: The entry is unlinked from BackgroundWorkerList. If the caller is
448 * iterating through it, better use a mutable iterator!
449 *
450 * Caller is responsible for notifying bgw_notify_pid, if appropriate.
451 *
452 * This function must be invoked only in the postmaster.
453 */
454void
456{
458
461 Assert(slot->in_use);
462
463 /*
464 * We need a memory barrier here to make sure that the update of
465 * parallel_terminate_count completes before the store to in_use.
466 */
469
471 slot->in_use = false;
472
474 (errmsg_internal("unregistering background worker \"%s\"",
475 rw->rw_worker.bgw_name)));
476
478 pfree(rw);
479}
480
481/*
482 * Report the PID of a newly-launched background worker in shared memory.
483 *
484 * This function should only be called from the postmaster.
485 */
486void
498
499/*
500 * Report that the PID of a background worker is now zero because a
501 * previously-running background worker has exited.
502 *
503 * NOTE: The entry may be unlinked from BackgroundWorkerList. If the caller
504 * is iterating through it, better use a mutable iterator!
505 *
506 * This function should only be called from the postmaster.
507 */
508void
510{
512 int notify_pid;
513
516 slot->pid = rw->rw_pid;
518
519 /*
520 * If this worker is slated for deregistration, do that before notifying
521 * the process which started it. Otherwise, if that process tries to
522 * reuse the slot immediately, it might not be available yet. In theory
523 * that could happen anyway if the process checks slot->pid at just the
524 * wrong moment, but this makes the window narrower.
525 */
526 if (rw->rw_terminate ||
529
530 if (notify_pid != 0)
532}
533
534/*
535 * Cancel SIGUSR1 notifications for a PID belonging to an exiting backend.
536 *
537 * This function should only be called from the postmaster.
538 */
539void
541{
542 dlist_iter iter;
543
545 {
547
548 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
549 if (rw->rw_worker.bgw_notify_pid == pid)
551 }
552}
553
554/*
555 * Cancel any not-yet-started worker requests that have waiting processes.
556 *
557 * This is called during a normal ("smart" or "fast") database shutdown.
558 * After this point, no new background workers will be started, so anything
559 * that might be waiting for them needs to be kicked off its wait. We do
560 * that by canceling the bgworker registration entirely, which is perhaps
561 * overkill, but since we're shutting down it does not matter whether the
562 * registration record sticks around.
563 *
564 * This function should only be called from the postmaster.
565 */
566void
568{
570
572 {
575
576 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
579
580 /* If it's not yet started, and there's someone waiting ... */
581 if (slot->pid == InvalidPid &&
582 rw->rw_worker.bgw_notify_pid != 0)
583 {
584 /* ... then zap it, and notify the waiter */
586
588 if (notify_pid != 0)
590 }
591 }
592}
593
594/*
595 * Reset background worker crash state.
596 *
597 * We assume that, after a crash-and-restart cycle, background workers without
598 * the never-restart flag should be restarted immediately, instead of waiting
599 * for bgw_restart_time to elapse. On the other hand, workers with that flag
600 * should be forgotten immediately, since we won't ever restart them.
601 *
602 * This function should only be called from the postmaster.
603 */
604void
606{
608
610 {
612
613 rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
614
616 {
617 /*
618 * Workers marked BGW_NEVER_RESTART shouldn't get relaunched after
619 * the crash, so forget about them. (If we wait until after the
620 * crash to forget about them, and they are parallel workers,
621 * parallel_terminate_count will get incremented after we've
622 * already zeroed parallel_register_count, which would be bad.)
623 */
625 }
626 else
627 {
628 /*
629 * The accounting which we do via parallel_register_count and
630 * parallel_terminate_count would get messed up if a worker marked
631 * parallel could survive a crash and restart cycle. All such
632 * workers should be marked BGW_NEVER_RESTART, and thus control
633 * should never reach this branch.
634 */
636
637 /*
638 * Allow this worker to be restarted immediately after we finish
639 * resetting.
640 */
641 rw->rw_crashed_at = 0;
642 rw->rw_pid = 0;
643
644 /*
645 * If there was anyone waiting for it, they're history.
646 */
648 }
649 }
650}
651
652/*
653 * Complain about the BackgroundWorker definition using error level elevel.
654 * Return true if it looks ok, false if not (unless elevel >= ERROR, in
655 * which case we won't return at all in the not-OK case).
656 */
657static bool
659{
660 /* sanity check for flags */
661
662 /*
663 * We used to support workers not connected to shared memory, but don't
664 * anymore. Thus this is a required flag now. We're not removing the flag
665 * for compatibility reasons and because the flag still provides some
666 * signal when reading code.
667 */
668 if (!(worker->bgw_flags & BGWORKER_SHMEM_ACCESS))
669 {
670 ereport(elevel,
672 errmsg("background worker \"%s\": background workers without shared memory access are not supported",
673 worker->bgw_name)));
674 return false;
675 }
676
678 {
680 {
681 ereport(elevel,
683 errmsg("background worker \"%s\": cannot request database access if starting at postmaster start",
684 worker->bgw_name)));
685 return false;
686 }
687
688 /* XXX other checks? */
689 }
690
691 /* Interruptible workers require a database connection */
692 if ((worker->bgw_flags & BGWORKER_INTERRUPTIBLE) &&
694 {
695 ereport(elevel,
697 errmsg("background worker \"%s\": cannot make background workers interruptible without database access",
698 worker->bgw_name)));
699 return false;
700 }
701
702 if ((worker->bgw_restart_time < 0 &&
704 (worker->bgw_restart_time > USECS_PER_DAY / 1000))
705 {
706 ereport(elevel,
708 errmsg("background worker \"%s\": invalid restart interval",
709 worker->bgw_name)));
710 return false;
711 }
712
713 /*
714 * Parallel workers may not be configured for restart, because the
715 * parallel_register_count/parallel_terminate_count accounting can't
716 * handle parallel workers lasting through a crash-and-restart cycle.
717 */
718 if (worker->bgw_restart_time != BGW_NEVER_RESTART &&
719 (worker->bgw_flags & BGWORKER_CLASS_PARALLEL) != 0)
720 {
721 ereport(elevel,
723 errmsg("background worker \"%s\": parallel workers may not be configured for restart",
724 worker->bgw_name)));
725 return false;
726 }
727
728 /*
729 * If bgw_type is not filled in, use bgw_name.
730 */
731 if (strcmp(worker->bgw_type, "") == 0)
732 strcpy(worker->bgw_type, worker->bgw_name);
733
734 return true;
735}
736
737/*
738 * Main entry point for background worker processes.
739 */
740void
742{
744 BackgroundWorker *worker;
746
747 if (startup_data == NULL)
748 elog(FATAL, "unable to find bgworker entry");
751 memcpy(worker, startup_data, sizeof(BackgroundWorker));
752
753 /*
754 * Now that we're done reading the startup data, release postmaster's
755 * working memory context.
756 */
758 {
761 }
762
763 MyBgworkerEntry = worker;
764 init_ps_display(worker->bgw_name);
765
767
768 /* Apply PostAuthDelay */
769 if (PostAuthDelay > 0)
770 pg_usleep(PostAuthDelay * 1000000L);
771
772 /*
773 * Set up signal handlers.
774 */
776 {
777 /*
778 * SIGINT is used to signal canceling the current action
779 */
783
784 /* XXX Any other handlers needed here? */
785 }
786 else
787 {
791 }
793 /* SIGQUIT handler was already set up by InitPostmasterChild */
795
796 InitializeTimeouts(); /* establishes SIGALRM handler */
797
801
802 /*
803 * If an exception is encountered, processing resumes here.
804 *
805 * We just need to clean up, report the error, and go away.
806 */
807 if (sigsetjmp(local_sigjmp_buf, 1) != 0)
808 {
809 /* Since not using PG_TRY, must reset error stack by hand */
811
812 /* Prevent interrupts while cleaning up */
814
815 /*
816 * sigsetjmp will have blocked all signals, but we may need to accept
817 * signals while communicating with our parallel leader. Once we've
818 * done HOLD_INTERRUPTS() it should be safe to unblock signals.
819 */
821
822 /* Report the error to the parallel leader and the server log */
824
825 /*
826 * Do we need more cleanup here? For shmem-connected bgworkers, we
827 * will call InitProcess below, which will install ProcKill as exit
828 * callback. That will take care of releasing locks, etc.
829 */
830
831 /* and go away */
832 proc_exit(1);
833 }
834
835 /* We can now handle ereport(ERROR) */
837
838 /*
839 * Create a per-backend PGPROC struct in shared memory. We must do this
840 * before we can use LWLocks or access any shared memory.
841 */
842 InitProcess();
843
844 /*
845 * Early initialization.
846 */
847 BaseInit();
848
849 /*
850 * Look up the entry point function, loading its library if necessary.
851 */
853 worker->bgw_function_name);
854
855 /*
856 * Note that in normal processes, we would call InitPostgres here. For a
857 * worker, however, we don't know what database to connect to, yet; so we
858 * need to wait until the user code does it via
859 * BackgroundWorkerInitializeConnection().
860 */
861
862 /*
863 * Now invoke the user-defined worker code
864 */
865 entrypt(worker->bgw_main_arg);
866
867 /* ... and if it returns, we're done */
868 proc_exit(0);
869}
870
871/*
872 * Connect background worker to a database.
873 */
874void
876{
878 uint32 init_flags = 0; /* never honor session_preload_libraries */
879
880 /* ignore datallowconn and ACL_CONNECT? */
881 if (flags & BGWORKER_BYPASS_ALLOWCONN)
883 /* ignore rolcanlogin? */
886
887 /* XXX is this the right errcode? */
891 errmsg("database connection requirement not indicated during registration")));
892
893 InitPostgres(dbname, InvalidOid, /* database to connect to */
894 username, InvalidOid, /* role to connect as */
896 NULL); /* no out_dbname */
897
898 /* it had better not gotten out of "init" mode yet */
901 (errmsg("invalid processing mode in background worker")));
903}
904
905/*
906 * Connect background worker to a database using OIDs.
907 */
908void
910{
912 uint32 init_flags = 0; /* never honor session_preload_libraries */
913
914 /* ignore datallowconn and ACL_CONNECT? */
915 if (flags & BGWORKER_BYPASS_ALLOWCONN)
917 /* ignore rolcanlogin? */
920
921 /* XXX is this the right errcode? */
925 errmsg("database connection requirement not indicated during registration")));
926
927 InitPostgres(NULL, dboid, /* database to connect to */
928 NULL, useroid, /* role to connect as */
930 NULL); /* no out_dbname */
931
932 /* it had better not gotten out of "init" mode yet */
935 (errmsg("invalid processing mode in background worker")));
937}
938
939/*
940 * Block/unblock signals in a background worker
941 */
942void
947
948void
953
954/*
955 * Register a new static background worker.
956 *
957 * This can only be called directly from postmaster or in the _PG_init
958 * function of a module library that's loaded by shared_preload_libraries;
959 * otherwise it will have no effect.
960 */
961void
963{
965 static int numworkers = 0;
966
967 /*
968 * Static background workers can only be registered in the postmaster
969 * process.
970 */
972 {
973 /*
974 * In EXEC_BACKEND or single-user mode, we process
975 * shared_preload_libraries in backend processes too. We cannot
976 * register static background workers at that stage, but many
977 * libraries' _PG_init() functions don't distinguish whether they're
978 * being loaded in the postmaster or in a backend, they just check
979 * process_shared_preload_libraries_in_progress. It's a bit sloppy,
980 * but for historical reasons we tolerate it. In EXEC_BACKEND mode,
981 * the background workers should already have been registered when the
982 * library was loaded in postmaster.
983 */
985 return;
986 ereport(LOG,
988 errmsg("background worker \"%s\": must be registered in \"shared_preload_libraries\"",
989 worker->bgw_name)));
990 return;
991 }
992
993 /*
994 * Cannot register static background workers after calling
995 * BackgroundWorkerShmemInit().
996 */
998 elog(ERROR, "cannot register background worker \"%s\" after shmem init",
999 worker->bgw_name);
1000
1002 (errmsg_internal("registering background worker \"%s\"", worker->bgw_name)));
1003
1004 if (!SanityCheckBackgroundWorker(worker, LOG))
1005 return;
1006
1007 if (worker->bgw_notify_pid != 0)
1008 {
1009 ereport(LOG,
1011 errmsg("background worker \"%s\": only dynamic background workers can request notification",
1012 worker->bgw_name)));
1013 return;
1014 }
1015
1016 /*
1017 * Enforce maximum number of workers. Note this is overly restrictive: we
1018 * could allow more non-shmem-connected workers, because these don't count
1019 * towards the MAX_BACKENDS limit elsewhere. For now, it doesn't seem
1020 * important to relax this restriction.
1021 */
1023 {
1024 ereport(LOG,
1026 errmsg("too many background workers"),
1027 errdetail_plural("Up to %d background worker can be registered with the current settings.",
1028 "Up to %d background workers can be registered with the current settings.",
1031 errhint("Consider increasing the configuration parameter \"%s\".", "max_worker_processes")));
1032 return;
1033 }
1034
1035 /*
1036 * Copy the registration data into the registered workers list.
1037 */
1039 sizeof(RegisteredBgWorker),
1041 if (rw == NULL)
1042 {
1043 ereport(LOG,
1045 errmsg("out of memory")));
1046 return;
1047 }
1048
1049 rw->rw_worker = *worker;
1050 rw->rw_pid = 0;
1051 rw->rw_crashed_at = 0;
1052 rw->rw_terminate = false;
1053
1055}
1056
1057/*
1058 * Register a new background worker from a regular backend.
1059 *
1060 * Returns true on success and false on failure. Failure typically indicates
1061 * that no background worker slots are currently available.
1062 *
1063 * If handle != NULL, we'll set *handle to a pointer that can subsequently
1064 * be used as an argument to GetBackgroundWorkerPid(). The caller can
1065 * free this pointer using pfree(), if desired.
1066 */
1067bool
1069 BackgroundWorkerHandle **handle)
1070{
1071 int slotno;
1072 bool success = false;
1073 bool parallel;
1074 uint64 generation = 0;
1075
1076 /*
1077 * We can't register dynamic background workers from the postmaster. If
1078 * this is a standalone backend, we're the only process and can't start
1079 * any more. In a multi-process environment, it might be theoretically
1080 * possible, but we don't currently support it due to locking
1081 * considerations; see comments on the BackgroundWorkerSlot data
1082 * structure.
1083 */
1084 if (!IsUnderPostmaster)
1085 return false;
1086
1087 if (!SanityCheckBackgroundWorker(worker, ERROR))
1088 return false;
1089
1090 parallel = (worker->bgw_flags & BGWORKER_CLASS_PARALLEL) != 0;
1091
1093
1094 /*
1095 * If this is a parallel worker, check whether there are already too many
1096 * parallel workers; if so, don't register another one. Our view of
1097 * parallel_terminate_count may be slightly stale, but that doesn't really
1098 * matter: we would have gotten the same result if we'd arrived here
1099 * slightly earlier anyway. There's no help for it, either, since the
1100 * postmaster must not take locks; a memory barrier wouldn't guarantee
1101 * anything useful.
1102 */
1106 {
1111 return false;
1112 }
1113
1114 /*
1115 * Look for an unused slot. If we find one, grab it.
1116 */
1118 {
1120
1121 if (!slot->in_use)
1122 {
1123 memcpy(&slot->worker, worker, sizeof(BackgroundWorker));
1124 slot->pid = InvalidPid; /* indicates not started yet */
1125 slot->generation++;
1126 slot->terminate = false;
1127 generation = slot->generation;
1128 if (parallel)
1130
1131 /*
1132 * Make sure postmaster doesn't see the slot as in use before it
1133 * sees the new contents.
1134 */
1136
1137 slot->in_use = true;
1138 success = true;
1139 break;
1140 }
1141 }
1142
1144
1145 /* If we found a slot, tell the postmaster to notice the change. */
1146 if (success)
1148
1149 /*
1150 * If we found a slot and the user has provided a handle, initialize it.
1151 */
1152 if (success && handle)
1153 {
1155 (*handle)->slot = slotno;
1156 (*handle)->generation = generation;
1157 }
1158
1159 return success;
1160}
1161
1162/*
1163 * Get the PID of a dynamically-registered background worker.
1164 *
1165 * If the worker is determined to be running, the return value will be
1166 * BGWH_STARTED and *pidp will get the PID of the worker process. If the
1167 * postmaster has not yet attempted to start the worker, the return value will
1168 * be BGWH_NOT_YET_STARTED. Otherwise, the return value is BGWH_STOPPED.
1169 *
1170 * BGWH_STOPPED can indicate either that the worker is temporarily stopped
1171 * (because it is configured for automatic restart and exited non-zero),
1172 * or that the worker is permanently stopped (because it exited with exit
1173 * code 0, or was not configured for automatic restart), or even that the
1174 * worker was unregistered without ever starting (either because startup
1175 * failed and the worker is not configured for automatic restart, or because
1176 * TerminateBackgroundWorker was used before the worker was successfully
1177 * started).
1178 */
1181{
1183 pid_t pid;
1184
1185 Assert(handle->slot < max_worker_processes);
1186 slot = &BackgroundWorkerData->slot[handle->slot];
1187
1188 /*
1189 * We could probably arrange to synchronize access to data using memory
1190 * barriers only, but for now, let's just keep it simple and grab the
1191 * lock. It seems unlikely that there will be enough traffic here to
1192 * result in meaningful contention.
1193 */
1195
1196 /*
1197 * The generation number can't be concurrently changed while we hold the
1198 * lock. The pid, which is updated by the postmaster, can change at any
1199 * time, but we assume such changes are atomic. So the value we read
1200 * won't be garbage, but it might be out of date by the time the caller
1201 * examines it (but that's unavoidable anyway).
1202 *
1203 * The in_use flag could be in the process of changing from true to false,
1204 * but if it is already false then it can't change further.
1205 */
1206 if (handle->generation != slot->generation || !slot->in_use)
1207 pid = 0;
1208 else
1209 pid = slot->pid;
1210
1211 /* All done. */
1213
1214 if (pid == 0)
1215 return BGWH_STOPPED;
1216 else if (pid == InvalidPid)
1217 return BGWH_NOT_YET_STARTED;
1218 *pidp = pid;
1219 return BGWH_STARTED;
1220}
1221
1222/*
1223 * Wait for a background worker to start up.
1224 *
1225 * This is like GetBackgroundWorkerPid(), except that if the worker has not
1226 * yet started, we wait for it to do so; thus, BGWH_NOT_YET_STARTED is never
1227 * returned. However, if the postmaster has died, we give up and return
1228 * BGWH_POSTMASTER_DIED, since it that case we know that startup will not
1229 * take place.
1230 *
1231 * The caller *must* have set our PID as the worker's bgw_notify_pid,
1232 * else we will not be awoken promptly when the worker's state changes.
1233 */
1236{
1237 BgwHandleStatus status;
1238 int rc;
1239
1240 for (;;)
1241 {
1242 pid_t pid;
1243
1245
1246 status = GetBackgroundWorkerPid(handle, &pid);
1247 if (status == BGWH_STARTED)
1248 *pidp = pid;
1249 if (status != BGWH_NOT_YET_STARTED)
1250 break;
1251
1252 rc = WaitLatch(MyLatch,
1255
1256 if (rc & WL_POSTMASTER_DEATH)
1257 {
1258 status = BGWH_POSTMASTER_DIED;
1259 break;
1260 }
1261
1263 }
1264
1265 return status;
1266}
1267
1268/*
1269 * Wait for a background worker to stop.
1270 *
1271 * If the worker hasn't yet started, or is running, we wait for it to stop
1272 * and then return BGWH_STOPPED. However, if the postmaster has died, we give
1273 * up and return BGWH_POSTMASTER_DIED, because it's the postmaster that
1274 * notifies us when a worker's state changes.
1275 *
1276 * The caller *must* have set our PID as the worker's bgw_notify_pid,
1277 * else we will not be awoken promptly when the worker's state changes.
1278 */
1281{
1282 BgwHandleStatus status;
1283 int rc;
1284
1285 for (;;)
1286 {
1287 pid_t pid;
1288
1290
1291 status = GetBackgroundWorkerPid(handle, &pid);
1292 if (status == BGWH_STOPPED)
1293 break;
1294
1295 rc = WaitLatch(MyLatch,
1298
1299 if (rc & WL_POSTMASTER_DEATH)
1300 {
1301 status = BGWH_POSTMASTER_DIED;
1302 break;
1303 }
1304
1306 }
1307
1308 return status;
1309}
1310
1311/*
1312 * Instruct the postmaster to terminate a background worker.
1313 *
1314 * Note that it's safe to do this without regard to whether the worker is
1315 * still running, or even if the worker may already have exited and been
1316 * unregistered.
1317 */
1318void
1320{
1322 bool signal_postmaster = false;
1323
1324 Assert(handle->slot < max_worker_processes);
1325 slot = &BackgroundWorkerData->slot[handle->slot];
1326
1327 /* Set terminate flag in shared memory, unless slot has been reused. */
1329 if (handle->generation == slot->generation)
1330 {
1331 slot->terminate = true;
1332 signal_postmaster = true;
1333 }
1335
1336 /* Make sure the postmaster notices the change to shared memory. */
1339}
1340
1341/*
1342 * Look up (and possibly load) a bgworker entry point function.
1343 *
1344 * For functions contained in the core code, we use library name "postgres"
1345 * and consult the InternalBGWorkers array. External functions are
1346 * looked up, and loaded if necessary, using load_external_function().
1347 *
1348 * The point of this is to pass function names as strings across process
1349 * boundaries. We can't pass actual function addresses because of the
1350 * possibility that the function has been loaded at a different address
1351 * in a different process. This is obviously a hazard for functions in
1352 * loadable libraries, but it can happen even for functions in the core code
1353 * on platforms using EXEC_BACKEND (e.g., Windows).
1354 *
1355 * At some point it might be worthwhile to get rid of InternalBGWorkers[]
1356 * in favor of applying load_external_function() for core functions too;
1357 * but that raises portability issues that are not worth addressing now.
1358 */
1359static bgworker_main_type
1361{
1362 /*
1363 * If the function is to be loaded from postgres itself, search the
1364 * InternalBGWorkers array.
1365 */
1366 if (strcmp(libraryname, "postgres") == 0)
1367 {
1368 int i;
1369
1370 for (i = 0; i < lengthof(InternalBGWorkers); i++)
1371 {
1373 return InternalBGWorkers[i].fn_addr;
1374 }
1375
1376 /* We can only reach this by programming error. */
1377 elog(ERROR, "internal function \"%s\" not found", funcname);
1378 }
1379
1380 /* Otherwise load from external library. */
1381 return (bgworker_main_type)
1383}
1384
1385/*
1386 * Given a PID, get the bgw_type of the background worker. Returns NULL if
1387 * not a valid background worker.
1388 *
1389 * The return value is in static memory belonging to this function, so it has
1390 * to be used before calling this function again. This is so that the caller
1391 * doesn't have to worry about the background worker locking protocol.
1392 */
1393const char *
1395{
1396 int slotno;
1397 bool found = false;
1398 static char result[BGW_MAXLEN];
1399
1401
1403 {
1405
1406 if (slot->pid > 0 && slot->pid == pid)
1407 {
1408 strcpy(result, slot->worker.bgw_type);
1409 found = true;
1410 break;
1411 }
1412 }
1413
1415
1416 if (!found)
1417 return NULL;
1418
1419 return result;
1420}
1421
1422/*
1423 * Terminate all background workers connected to the given database, if the
1424 * workers can be interrupted.
1425 */
1426void
1428{
1429 bool signal_postmaster = false;
1430
1431 elog(DEBUG1, "attempting worker termination for database %u",
1432 databaseId);
1433
1435
1436 /*
1437 * Iterate through slots, looking for workers connected to the given
1438 * database.
1439 */
1441 {
1443
1444 if (slot->in_use &&
1446 {
1447 PGPROC *proc = BackendPidGetProc(slot->pid);
1448
1449 if (proc && proc->databaseId == databaseId)
1450 {
1451 slot->terminate = true;
1452 signal_postmaster = true;
1453
1454 elog(DEBUG1, "termination requested for worker (PID %d) on database %u",
1455 (int) slot->pid, databaseId);
1456 }
1457 }
1458 }
1459
1461
1462 /* Make sure the postmaster notices the change to shared memory. */
1465}
void ParallelApplyWorkerMain(Datum main_arg)
void ascii_safe_strlcpy(char *dest, const char *src, size_t destsiz)
Definition ascii.c:174
#define pg_memory_barrier()
Definition atomics.h:141
#define pg_read_barrier()
Definition atomics.h:154
#define pg_write_barrier()
Definition atomics.h:155
void ParallelWorkerMain(Datum main_arg)
Definition parallel.c:1301
sigset_t UnBlockSig
Definition pqsignal.c:22
sigset_t BlockSig
Definition pqsignal.c:23
void ApplyWorkerMain(Datum main_arg)
Definition worker.c:5987
void RegisterBackgroundWorker(BackgroundWorker *worker)
Definition bgworker.c:962
BgwHandleStatus WaitForBackgroundWorkerStartup(BackgroundWorkerHandle *handle, pid_t *pidp)
Definition bgworker.c:1235
void BackgroundWorkerInitializeConnection(const char *dbname, const char *username, uint32 flags)
Definition bgworker.c:875
static bool SanityCheckBackgroundWorker(BackgroundWorker *worker, int elevel)
Definition bgworker.c:658
void ReportBackgroundWorkerPID(RegisteredBgWorker *rw)
Definition bgworker.c:487
void TerminateBackgroundWorker(BackgroundWorkerHandle *handle)
Definition bgworker.c:1319
static const struct @18 InternalBGWorkers[]
void TerminateBackgroundWorkersForDatabase(Oid databaseId)
Definition bgworker.c:1427
void ReportBackgroundWorkerExit(RegisteredBgWorker *rw)
Definition bgworker.c:509
BgwHandleStatus WaitForBackgroundWorkerShutdown(BackgroundWorkerHandle *handle)
Definition bgworker.c:1280
void ResetBackgroundWorkerCrashTimes(void)
Definition bgworker.c:605
void BackgroundWorkerUnblockSignals(void)
Definition bgworker.c:949
void BackgroundWorkerInitializeConnectionByOid(Oid dboid, Oid useroid, uint32 flags)
Definition bgworker.c:909
static void BackgroundWorkerShmemRequest(void *arg)
Definition bgworker.c:180
void BackgroundWorkerBlockSignals(void)
Definition bgworker.c:943
dlist_head BackgroundWorkerList
Definition bgworker.c:45
void ForgetBackgroundWorker(RegisteredBgWorker *rw)
Definition bgworker.c:455
const char * fn_name
Definition bgworker.c:129
BgwHandleStatus GetBackgroundWorkerPid(BackgroundWorkerHandle *handle, pid_t *pidp)
Definition bgworker.c:1180
static BackgroundWorkerArray * BackgroundWorkerData
Definition bgworker.c:113
static RegisteredBgWorker * FindRegisteredWorkerBySlotNumber(int slotno)
Definition bgworker.c:247
static bgworker_main_type LookupBackgroundWorkerFunction(const char *libraryname, const char *funcname)
Definition bgworker.c:1360
const ShmemCallbacks BackgroundWorkerShmemCallbacks
Definition bgworker.c:118
void BackgroundWorkerStopNotifications(pid_t pid)
Definition bgworker.c:540
void BackgroundWorkerStateChange(bool allow_new_workers)
Definition bgworker.c:272
const char * GetBackgroundWorkerTypeByPid(pid_t pid)
Definition bgworker.c:1394
static void BackgroundWorkerShmemInit(void *arg)
Definition bgworker.c:198
bool RegisterDynamicBackgroundWorker(BackgroundWorker *worker, BackgroundWorkerHandle **handle)
Definition bgworker.c:1068
void BackgroundWorkerMain(const void *startup_data, size_t startup_data_len)
Definition bgworker.c:741
bgworker_main_type fn_addr
Definition bgworker.c:130
void ForgetUnstartedBackgroundWorkers(void)
Definition bgworker.c:567
#define BGW_NEVER_RESTART
Definition bgworker.h:92
#define BGWORKER_BYPASS_ROLELOGINCHECK
Definition bgworker.h:167
#define BGW_EXTRALEN
Definition bgworker.h:94
#define BGWORKER_CLASS_PARALLEL
Definition bgworker.h:75
#define BGWORKER_INTERRUPTIBLE
Definition bgworker.h:67
BgwHandleStatus
Definition bgworker.h:111
@ BGWH_POSTMASTER_DIED
Definition bgworker.h:115
@ BGWH_STARTED
Definition bgworker.h:112
@ BGWH_NOT_YET_STARTED
Definition bgworker.h:113
@ BGWH_STOPPED
Definition bgworker.h:114
@ BgWorkerStart_PostmasterStart
Definition bgworker.h:86
#define BGWORKER_BACKEND_DATABASE_CONNECTION
Definition bgworker.h:60
#define BGWORKER_BYPASS_ALLOWCONN
Definition bgworker.h:166
#define BGWORKER_SHMEM_ACCESS
Definition bgworker.h:53
void(* bgworker_main_type)(Datum main_arg)
Definition bgworker.h:79
#define BGW_MAXLEN
Definition bgworker.h:93
#define MAX_PARALLEL_WORKER_LIMIT
#define Assert(condition)
Definition c.h:943
#define FLEXIBLE_ARRAY_MEMBER
Definition c.h:558
uint64_t uint64
Definition c.h:625
uint32_t uint32
Definition c.h:624
#define lengthof(array)
Definition c.h:873
size_t Size
Definition c.h:689
uint32 result
memcpy(sums, checksumBaseOffsets, sizeof(checksumBaseOffsets))
void DataChecksumsWorkerMain(Datum arg)
void DataChecksumsWorkerLauncherMain(Datum arg)
#define USECS_PER_DAY
Definition timestamp.h:131
void * load_external_function(const char *filename, const char *funcname, bool signalNotFound, void **filehandle)
Definition dfmgr.c:95
Datum arg
Definition elog.c:1322
void EmitErrorReport(void)
Definition elog.c:1882
ErrorContextCallback * error_context_stack
Definition elog.c:99
int errcode(int sqlerrcode)
Definition elog.c:874
sigjmp_buf * PG_exception_stack
Definition elog.c:101
#define LOG
Definition elog.h:32
int errhint(const char *fmt,...) pg_attribute_printf(1
#define FATAL
Definition elog.h:42
int int errmsg_internal(const char *fmt,...) pg_attribute_printf(1
#define DEBUG1
Definition elog.h:31
#define ERROR
Definition elog.h:40
#define elog(elevel,...)
Definition elog.h:228
#define ereport(elevel,...)
Definition elog.h:152
int errdetail_plural(const char *fmt_singular, const char *fmt_plural, unsigned long n,...) pg_attribute_printf(1
#define MCXT_ALLOC_ZERO
Definition fe_memutils.h:30
#define palloc_object(type)
Definition fe_memutils.h:74
#define MCXT_ALLOC_NO_OOM
Definition fe_memutils.h:29
bool IsUnderPostmaster
Definition globals.c:122
int max_parallel_workers
Definition globals.c:147
bool IsPostmasterEnvironment
Definition globals.c:121
struct Latch * MyLatch
Definition globals.c:65
int max_worker_processes
Definition globals.c:146
#define dlist_foreach(iter, lhead)
Definition ilist.h:623
static void dlist_delete(dlist_node *node)
Definition ilist.h:405
static void dlist_push_head(dlist_head *head, dlist_node *node)
Definition ilist.h:347
#define dlist_foreach_modify(iter, lhead)
Definition ilist.h:640
#define DLIST_STATIC_INIT(name)
Definition ilist.h:281
#define dlist_container(type, membername, ptr)
Definition ilist.h:593
#define funcname
static bool success
Definition initdb.c:188
static char * username
Definition initdb.c:153
void proc_exit(int code)
Definition ipc.c:105
int i
Definition isn.c:77
void ResetLatch(Latch *latch)
Definition latch.c:374
int WaitLatch(Latch *latch, int wakeEvents, long timeout, uint32 wait_event_info)
Definition latch.c:172
void ApplyLauncherMain(Datum main_arg)
Definition launcher.c:1205
bool LWLockAcquire(LWLock *lock, LWLockMode mode)
Definition lwlock.c:1150
void LWLockRelease(LWLock *lock)
Definition lwlock.c:1767
@ LW_SHARED
Definition lwlock.h:105
@ LW_EXCLUSIVE
Definition lwlock.h:104
void * MemoryContextAlloc(MemoryContext context, Size size)
Definition mcxt.c:1232
void pfree(void *pointer)
Definition mcxt.c:1616
MemoryContext TopMemoryContext
Definition mcxt.c:166
void * MemoryContextAllocExtended(MemoryContext context, Size size, int flags)
Definition mcxt.c:1289
MemoryContext PostmasterContext
Definition mcxt.c:168
void MemoryContextDelete(MemoryContext context)
Definition mcxt.c:472
@ NormalProcessing
Definition miscadmin.h:490
@ InitProcessing
Definition miscadmin.h:489
#define GetProcessingMode()
Definition miscadmin.h:499
#define CHECK_FOR_INTERRUPTS()
Definition miscadmin.h:125
#define HOLD_INTERRUPTS()
Definition miscadmin.h:136
#define IsInitProcessingMode()
Definition miscadmin.h:496
#define SetProcessingMode(mode)
Definition miscadmin.h:501
#define INIT_PG_OVERRIDE_ROLE_LOGIN
Definition miscadmin.h:519
#define INIT_PG_OVERRIDE_ALLOW_CONNS
Definition miscadmin.h:518
#define InvalidPid
Definition miscadmin.h:32
bool process_shared_preload_libraries_in_progress
Definition miscinit.c:1788
static char * errmsg
#define MAXPGPATH
#define die(msg)
void SendPostmasterSignal(PMSignalReason reason)
Definition pmsignal.c:164
@ PMSIGNAL_BACKGROUND_WORKER_CHANGE
Definition pmsignal.h:42
#define pqsignal
Definition port.h:547
int PostAuthDelay
Definition postgres.c:105
void FloatExceptionHandler(SIGNAL_ARGS)
Definition postgres.c:3070
void StatementCancelHandler(SIGNAL_ARGS)
Definition postgres.c:3053
#define InvalidOid
unsigned int Oid
void BaseInit(void)
Definition postinit.c:616
void InitPostgres(const char *in_dbname, Oid dboid, const char *username, Oid useroid, uint32 flags, char *out_dbname)
Definition postinit.c:719
BackgroundWorker * MyBgworkerEntry
Definition postmaster.c:201
bool PostmasterMarkPIDForWorkerNotify(int pid)
static int fb(int x)
PGPROC * BackendPidGetProc(int pid)
Definition procarray.c:3169
void procsignal_sigusr1_handler(SIGNAL_ARGS)
Definition procsignal.c:688
void init_ps_display(const char *fixed_part)
Definition ps_status.c:286
void RepackWorkerMain(Datum main_arg)
void SequenceSyncWorkerMain(Datum main_arg)
Size add_size(Size s1, Size s2)
Definition shmem.c:1048
Size mul_size(Size s1, Size s2)
Definition shmem.c:1063
#define ShmemRequestStruct(...)
Definition shmem.h:176
void pg_usleep(long microsec)
Definition signal.c:53
void InitProcess(void)
Definition proc.c:392
char * dbname
Definition streamutil.c:49
uint32 parallel_terminate_count
Definition bgworker.c:103
uint32 parallel_register_count
Definition bgworker.c:102
BackgroundWorkerSlot slot[FLEXIBLE_ARRAY_MEMBER]
Definition bgworker.c:104
BackgroundWorker worker
Definition bgworker.c:85
char bgw_function_name[BGW_MAXLEN]
Definition bgworker.h:104
char bgw_name[BGW_MAXLEN]
Definition bgworker.h:98
char bgw_type[BGW_MAXLEN]
Definition bgworker.h:99
BgWorkerStartTime bgw_start_time
Definition bgworker.h:101
char bgw_extra[BGW_EXTRALEN]
Definition bgworker.h:106
pid_t bgw_notify_pid
Definition bgworker.h:107
char bgw_library_name[MAXPGPATH]
Definition bgworker.h:103
Definition proc.h:179
Oid databaseId
Definition proc.h:201
BackgroundWorker rw_worker
ShmemRequestCallback request_fn
Definition shmem.h:133
dlist_node * cur
Definition ilist.h:179
dlist_node * cur
Definition ilist.h:200
void TableSyncWorkerMain(Datum main_arg)
Definition tablesync.c:1609
void InitializeTimeouts(void)
Definition timeout.c:470
const char * name
#define WL_LATCH_SET
#define WL_POSTMASTER_DEATH
#define SIGCHLD
Definition win32_port.h:168
#define SIGHUP
Definition win32_port.h:158
#define SIGPIPE
Definition win32_port.h:163
#define kill(pid, sig)
Definition win32_port.h:490
#define SIGUSR1
Definition win32_port.h:170
#define SIGUSR2
Definition win32_port.h:171