Age Owner Branch data TLA Line data Source code
1 : : /*--------------------------------------------------------------------
2 : : * bgworker.c
3 : : * POSTGRES pluggable background workers implementation
4 : : *
5 : : * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
6 : : *
7 : : * IDENTIFICATION
8 : : * src/backend/postmaster/bgworker.c
9 : : *
10 : : *-------------------------------------------------------------------------
11 : : */
12 : :
13 : : #include "postgres.h"
14 : :
15 : : #include "access/parallel.h"
16 : : #include "commands/repack.h"
17 : : #include "libpq/pqsignal.h"
18 : : #include "miscadmin.h"
19 : : #include "pgstat.h"
20 : : #include "port/atomics.h"
21 : : #include "postmaster/bgworker_internals.h"
22 : : #include "postmaster/datachecksum_state.h"
23 : : #include "postmaster/postmaster.h"
24 : : #include "replication/logicallauncher.h"
25 : : #include "replication/logicalworker.h"
26 : : #include "storage/ipc.h"
27 : : #include "storage/latch.h"
28 : : #include "storage/lwlock.h"
29 : : #include "storage/pmsignal.h"
30 : : #include "storage/proc.h"
31 : : #include "storage/procarray.h"
32 : : #include "storage/procsignal.h"
33 : : #include "storage/shmem.h"
34 : : #include "storage/subsystems.h"
35 : : #include "tcop/tcopprot.h"
36 : : #include "utils/ascii.h"
37 : : #include "utils/memutils.h"
38 : : #include "utils/ps_status.h"
39 : : #include "utils/timeout.h"
40 : : #include "utils/wait_event.h"
41 : :
42 : : /*
43 : : * The postmaster's list of registered background workers, in private memory.
44 : : */
45 : : dlist_head BackgroundWorkerList = DLIST_STATIC_INIT(BackgroundWorkerList);
46 : :
47 : : /*
48 : : * BackgroundWorkerSlots exist in shared memory and can be accessed (via
49 : : * the BackgroundWorkerArray) by both the postmaster and by regular backends.
50 : : * However, the postmaster cannot take locks, even spinlocks, because this
51 : : * might allow it to crash or become wedged if shared memory gets corrupted.
52 : : * Such an outcome is intolerable. Therefore, we need a lockless protocol
53 : : * for coordinating access to this data.
54 : : *
55 : : * The 'in_use' flag is used to hand off responsibility for the slot between
56 : : * the postmaster and the rest of the system. When 'in_use' is false,
57 : : * the postmaster will ignore the slot entirely, except for the 'in_use' flag
58 : : * itself, which it may read. In this state, regular backends may modify the
59 : : * slot. Once a backend sets 'in_use' to true, the slot becomes the
60 : : * responsibility of the postmaster. Regular backends may no longer modify it,
61 : : * but the postmaster may examine it. Thus, a backend initializing a slot
62 : : * must fully initialize the slot - and insert a write memory barrier - before
63 : : * marking it as in use.
64 : : *
65 : : * As an exception, however, even when the slot is in use, regular backends
66 : : * may set the 'terminate' flag for a slot, telling the postmaster not
67 : : * to restart it. Once the background worker is no longer running, the slot
68 : : * will be released for reuse.
69 : : *
70 : : * In addition to coordinating with the postmaster, backends modifying this
71 : : * data structure must coordinate with each other. Since they can take locks,
72 : : * this is straightforward: any backend wishing to manipulate a slot must
73 : : * take BackgroundWorkerLock in exclusive mode. Backends wishing to read
74 : : * data that might get concurrently modified by other backends should take
75 : : * this lock in shared mode. No matter what, backends reading this data
76 : : * structure must be able to tolerate concurrent modifications by the
77 : : * postmaster.
78 : : */
79 : : typedef struct BackgroundWorkerSlot
80 : : {
81 : : bool in_use;
82 : : bool terminate;
83 : : pid_t pid; /* InvalidPid = not started yet; 0 = dead */
84 : : uint64 generation; /* incremented when slot is recycled */
85 : : BackgroundWorker worker;
86 : : } BackgroundWorkerSlot;
87 : :
88 : : /*
89 : : * In order to limit the total number of parallel workers (according to
90 : : * max_parallel_workers GUC), we maintain the number of active parallel
91 : : * workers. Since the postmaster cannot take locks, two variables are used for
92 : : * this purpose: the number of registered parallel workers (modified by the
93 : : * backends, protected by BackgroundWorkerLock) and the number of terminated
94 : : * parallel workers (modified only by the postmaster, lockless). The active
95 : : * number of parallel workers is the number of registered workers minus the
96 : : * terminated ones. These counters can of course overflow, but it's not
97 : : * important here since the subtraction will still give the right number.
98 : : */
99 : : typedef struct BackgroundWorkerArray
100 : : {
101 : : int total_slots;
102 : : uint32 parallel_register_count;
103 : : uint32 parallel_terminate_count;
104 : : BackgroundWorkerSlot slot[FLEXIBLE_ARRAY_MEMBER];
105 : : } BackgroundWorkerArray;
106 : :
107 : : struct BackgroundWorkerHandle
108 : : {
109 : : int slot;
110 : : uint64 generation;
111 : : };
112 : :
113 : : static BackgroundWorkerArray *BackgroundWorkerData;
114 : :
115 : : static void BackgroundWorkerShmemRequest(void *arg);
116 : : static void BackgroundWorkerShmemInit(void *arg);
117 : :
118 : : const ShmemCallbacks BackgroundWorkerShmemCallbacks = {
119 : : .request_fn = BackgroundWorkerShmemRequest,
120 : : .init_fn = BackgroundWorkerShmemInit,
121 : : };
122 : :
123 : : /*
124 : : * List of internal background worker entry points. We need this for
125 : : * reasons explained in LookupBackgroundWorkerFunction(), below.
126 : : */
127 : : static const struct
128 : : {
129 : : const char *fn_name;
130 : : bgworker_main_type fn_addr;
131 : : } InternalBGWorkers[] =
132 : :
133 : : {
134 : : {
135 : : .fn_name = "ApplyLauncherMain",
136 : : .fn_addr = ApplyLauncherMain
137 : : },
138 : : {
139 : : .fn_name = "ApplyWorkerMain",
140 : : .fn_addr = ApplyWorkerMain
141 : : },
142 : : {
143 : : .fn_name = "ParallelApplyWorkerMain",
144 : : .fn_addr = ParallelApplyWorkerMain
145 : : },
146 : : {
147 : : .fn_name = "ParallelWorkerMain",
148 : : .fn_addr = ParallelWorkerMain
149 : : },
150 : : {
151 : : .fn_name = "RepackWorkerMain",
152 : : .fn_addr = RepackWorkerMain
153 : : },
154 : : {
155 : : .fn_name = "SequenceSyncWorkerMain",
156 : : .fn_addr = SequenceSyncWorkerMain
157 : : },
158 : : {
159 : : .fn_name = "TableSyncWorkerMain",
160 : : .fn_addr = TableSyncWorkerMain
161 : : },
162 : : {
163 : : .fn_name = "DataChecksumsWorkerLauncherMain",
164 : : .fn_addr = DataChecksumsWorkerLauncherMain
165 : : },
166 : : {
167 : : .fn_name = "DataChecksumsWorkerMain",
168 : : .fn_addr = DataChecksumsWorkerMain
169 : : }
170 : : };
171 : :
172 : : /* Private functions. */
173 : : static bgworker_main_type LookupBackgroundWorkerFunction(const char *libraryname, const char *funcname);
174 : :
175 : :
176 : : /*
177 : : * Register shared memory needed for background workers.
178 : : */
179 : : static void
29 heikki.linnakangas@i 180 :GNC 1244 : BackgroundWorkerShmemRequest(void *arg)
181 : : {
182 : : Size size;
183 : :
184 : : /* Array of workers is variably sized. */
4676 rhaas@postgresql.org 185 :CBC 1244 : size = offsetof(BackgroundWorkerArray, slot);
186 : 1244 : size = add_size(size, mul_size(max_worker_processes,
187 : : sizeof(BackgroundWorkerSlot)));
29 heikki.linnakangas@i 188 :GNC 1244 : ShmemRequestStruct(.name = "Background Worker Data",
189 : : .size = size,
190 : : .ptr = (void **) &BackgroundWorkerData,
191 : : );
4676 rhaas@postgresql.org 192 :GIC 1244 : }
193 : :
194 : : /*
195 : : * Initialize shared memory for background workers.
196 : : */
197 : : static void
29 heikki.linnakangas@i 198 :GNC 1241 : BackgroundWorkerShmemInit(void *arg)
199 : : {
200 : : dlist_iter iter;
201 : 1241 : int slotno = 0;
202 : :
203 : 1241 : BackgroundWorkerData->total_slots = max_worker_processes;
204 : 1241 : BackgroundWorkerData->parallel_register_count = 0;
205 : 1241 : BackgroundWorkerData->parallel_terminate_count = 0;
206 : :
207 : : /*
208 : : * Copy contents of worker list into shared memory. Record the shared
209 : : * memory slot assigned to each worker. This ensures a 1-to-1
210 : : * correspondence between the postmaster's private list and the array in
211 : : * shared memory.
212 : : */
213 [ + - + + ]: 2183 : dlist_foreach(iter, &BackgroundWorkerList)
214 : : {
215 : 942 : BackgroundWorkerSlot *slot = &BackgroundWorkerData->slot[slotno];
216 : : RegisteredBgWorker *rw;
217 : :
218 : 942 : rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
219 [ - + ]: 942 : Assert(slotno < max_worker_processes);
220 : 942 : slot->in_use = true;
221 : 942 : slot->terminate = false;
222 : 942 : slot->pid = InvalidPid;
223 : 942 : slot->generation = 0;
224 : 942 : rw->rw_shmem_slot = slotno;
225 : 942 : rw->rw_worker.bgw_notify_pid = 0; /* might be reinit after crash */
226 : 942 : memcpy(&slot->worker, &rw->rw_worker, sizeof(BackgroundWorker));
227 : 942 : ++slotno;
228 : : }
229 : :
230 : : /*
231 : : * Mark any remaining slots as not in use.
232 : : */
233 [ + + ]: 10220 : while (slotno < max_worker_processes)
234 : : {
235 : 8979 : BackgroundWorkerSlot *slot = &BackgroundWorkerData->slot[slotno];
236 : :
237 : 8979 : slot->in_use = false;
238 : 8979 : ++slotno;
239 : : }
4676 rhaas@postgresql.org 240 :CBC 1241 : }
241 : :
242 : : /*
243 : : * Search the postmaster's backend-private list of RegisteredBgWorker objects
244 : : * for the one that maps to the given slot number.
245 : : */
246 : : static RegisteredBgWorker *
247 : 5560 : FindRegisteredWorkerBySlotNumber(int slotno)
248 : : {
249 : : dlist_iter iter;
250 : :
634 heikki.linnakangas@i 251 [ + - + + ]: 13627 : dlist_foreach(iter, &BackgroundWorkerList)
252 : : {
253 : : RegisteredBgWorker *rw;
254 : :
255 : 10960 : rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
4676 rhaas@postgresql.org 256 [ + + ]: 10960 : if (rw->rw_shmem_slot == slotno)
257 : 2893 : return rw;
258 : : }
259 : :
260 : 2667 : return NULL;
261 : : }
262 : :
263 : : /*
264 : : * Notice changes to shared memory made by other backends.
265 : : * Accept new worker requests only if allow_new_workers is true.
266 : : *
267 : : * This code runs in the postmaster, so we must be very careful not to assume
268 : : * that shared memory contents are sane. Otherwise, a rogue backend could
269 : : * take out the postmaster.
270 : : */
271 : : void
1958 tgl@sss.pgh.pa.us 272 : 1680 : BackgroundWorkerStateChange(bool allow_new_workers)
273 : : {
274 : : int slotno;
275 : :
276 : : /*
277 : : * The total number of slots stored in shared memory should match our
278 : : * notion of max_worker_processes. If it does not, something is very
279 : : * wrong. Further down, we always refer to this value as
280 : : * max_worker_processes, in case shared memory gets corrupted while we're
281 : : * looping.
282 : : */
4676 rhaas@postgresql.org 283 [ - + ]: 1680 : if (max_worker_processes != BackgroundWorkerData->total_slots)
284 : : {
1978 peter@eisentraut.org 285 [ # # ]:UBC 0 : ereport(LOG,
286 : : (errmsg("inconsistent background worker state (\"max_worker_processes\"=%d, total slots=%d)",
287 : : max_worker_processes,
288 : : BackgroundWorkerData->total_slots)));
4676 rhaas@postgresql.org 289 : 0 : return;
290 : : }
291 : :
292 : : /*
293 : : * Iterate through slots, looking for newly-registered workers or workers
294 : : * who must die.
295 : : */
4676 rhaas@postgresql.org 296 [ + + ]:CBC 15270 : for (slotno = 0; slotno < max_worker_processes; ++slotno)
297 : : {
298 : 13590 : BackgroundWorkerSlot *slot = &BackgroundWorkerData->slot[slotno];
299 : : RegisteredBgWorker *rw;
300 : :
301 [ + + ]: 13590 : if (!slot->in_use)
302 : 8030 : continue;
303 : :
304 : : /*
305 : : * Make sure we don't see the in_use flag before the updated slot
306 : : * contents.
307 : : */
308 : 5560 : pg_read_barrier();
309 : :
310 : : /* See whether we already know about this worker. */
311 : 5560 : rw = FindRegisteredWorkerBySlotNumber(slotno);
312 [ + + ]: 5560 : if (rw != NULL)
313 : : {
314 : : /*
315 : : * In general, the worker data can't change after it's initially
316 : : * registered. However, someone can set the terminate flag.
317 : : */
4582 318 [ + + + - ]: 2893 : if (slot->terminate && !rw->rw_terminate)
319 : : {
320 : 15 : rw->rw_terminate = true;
321 [ + - ]: 15 : if (rw->rw_pid != 0)
322 : 15 : kill(rw->rw_pid, SIGTERM);
323 : : else
324 : : {
325 : : /* Report never-started, now-terminated worker as dead. */
4065 rhaas@postgresql.org 326 :UBC 0 : ReportBackgroundWorkerPID(rw);
327 : : }
328 : : }
4676 rhaas@postgresql.org 329 :CBC 2893 : continue;
330 : : }
331 : :
332 : : /*
333 : : * If we aren't allowing new workers, then immediately mark it for
334 : : * termination; the next stanza will take care of cleaning it up.
335 : : * Doing this ensures that any process waiting for the worker will get
336 : : * awoken, even though the worker will never be allowed to run.
337 : : */
1958 tgl@sss.pgh.pa.us 338 [ + + ]: 2667 : if (!allow_new_workers)
339 : 1 : slot->terminate = true;
340 : :
341 : : /*
342 : : * If the worker is marked for termination, we don't need to add it to
343 : : * the registered workers list; we can just free the slot. However, if
344 : : * bgw_notify_pid is set, the process that registered the worker may
345 : : * need to know that we've processed the terminate request, so be sure
346 : : * to signal it.
347 : : */
4582 rhaas@postgresql.org 348 [ + + ]: 2667 : if (slot->terminate)
349 : 1 : {
350 : : int notify_pid;
351 : :
352 : : /*
353 : : * We need a memory barrier here to make sure that the load of
354 : : * bgw_notify_pid and the update of parallel_terminate_count
355 : : * complete before the store to in_use.
356 : : */
4065 357 : 1 : notify_pid = slot->worker.bgw_notify_pid;
3441 358 [ - + ]: 1 : if ((slot->worker.bgw_flags & BGWORKER_CLASS_PARALLEL) != 0)
3441 rhaas@postgresql.org 359 :UBC 0 : BackgroundWorkerData->parallel_terminate_count++;
4065 rhaas@postgresql.org 360 :CBC 1 : slot->pid = 0;
361 : :
1816 tgl@sss.pgh.pa.us 362 : 1 : pg_memory_barrier();
4582 rhaas@postgresql.org 363 : 1 : slot->in_use = false;
364 : :
4065 365 [ + - ]: 1 : if (notify_pid != 0)
366 : 1 : kill(notify_pid, SIGUSR1);
367 : :
4582 368 : 1 : continue;
369 : : }
370 : :
371 : : /*
372 : : * Copy the registration data into the registered workers list.
373 : : */
939 heikki.linnakangas@i 374 : 2666 : rw = MemoryContextAllocExtended(PostmasterContext,
375 : : sizeof(RegisteredBgWorker),
376 : : MCXT_ALLOC_NO_OOM | MCXT_ALLOC_ZERO);
4676 rhaas@postgresql.org 377 [ - + ]: 2666 : if (rw == NULL)
378 : : {
4676 rhaas@postgresql.org 379 [ # # ]:UBC 0 : ereport(LOG,
380 : : (errcode(ERRCODE_OUT_OF_MEMORY),
381 : : errmsg("out of memory")));
382 : 0 : return;
383 : : }
384 : :
385 : : /*
386 : : * Copy strings in a paranoid way. If shared memory is corrupted, the
387 : : * source data might not even be NUL-terminated.
388 : : */
4676 rhaas@postgresql.org 389 :CBC 2666 : ascii_safe_strlcpy(rw->rw_worker.bgw_name,
390 : 2666 : slot->worker.bgw_name, BGW_MAXLEN);
3169 peter_e@gmx.net 391 : 2666 : ascii_safe_strlcpy(rw->rw_worker.bgw_type,
392 : 2666 : slot->worker.bgw_type, BGW_MAXLEN);
4676 rhaas@postgresql.org 393 : 2666 : ascii_safe_strlcpy(rw->rw_worker.bgw_library_name,
1037 nathan@postgresql.or 394 : 2666 : slot->worker.bgw_library_name, MAXPGPATH);
4676 rhaas@postgresql.org 395 : 2666 : ascii_safe_strlcpy(rw->rw_worker.bgw_function_name,
396 : 2666 : slot->worker.bgw_function_name, BGW_MAXLEN);
397 : :
398 : : /*
399 : : * Copy various fixed-size fields.
400 : : *
401 : : * flags, start_time, and restart_time are examined by the postmaster,
402 : : * but nothing too bad will happen if they are corrupted. The
403 : : * remaining fields will only be examined by the child process. It
404 : : * might crash, but we won't.
405 : : */
406 : 2666 : rw->rw_worker.bgw_flags = slot->worker.bgw_flags;
407 : 2666 : rw->rw_worker.bgw_start_time = slot->worker.bgw_start_time;
408 : 2666 : rw->rw_worker.bgw_restart_time = slot->worker.bgw_restart_time;
409 : 2666 : rw->rw_worker.bgw_main_arg = slot->worker.bgw_main_arg;
3834 410 : 2666 : memcpy(rw->rw_worker.bgw_extra, slot->worker.bgw_extra, BGW_EXTRALEN);
411 : :
412 : : /*
413 : : * Copy the PID to be notified about state changes, but only if the
414 : : * postmaster knows about a backend with that PID. It isn't an error
415 : : * if the postmaster doesn't know about the PID, because the backend
416 : : * that requested the worker could have died (or been killed) just
417 : : * after doing so. Nonetheless, at least until we get some experience
418 : : * with how this plays out in the wild, log a message at a relative
419 : : * high debug level.
420 : : */
4633 421 : 2666 : rw->rw_worker.bgw_notify_pid = slot->worker.bgw_notify_pid;
422 [ - + ]: 2666 : if (!PostmasterMarkPIDForWorkerNotify(rw->rw_worker.bgw_notify_pid))
423 : : {
1299 peter@eisentraut.org 424 [ # # ]:UBC 0 : elog(DEBUG1, "worker notification PID %d is not valid",
425 : : (int) rw->rw_worker.bgw_notify_pid);
4633 rhaas@postgresql.org 426 : 0 : rw->rw_worker.bgw_notify_pid = 0;
427 : : }
428 : :
429 : : /* Initialize postmaster bookkeeping. */
4676 rhaas@postgresql.org 430 :CBC 2666 : rw->rw_pid = 0;
431 : 2666 : rw->rw_crashed_at = 0;
432 : 2666 : rw->rw_shmem_slot = slotno;
4582 433 : 2666 : rw->rw_terminate = false;
434 : :
435 : : /* Log it! */
3966 436 [ + + ]: 2666 : ereport(DEBUG1,
437 : : (errmsg_internal("registering background worker \"%s\"",
438 : : rw->rw_worker.bgw_name)));
439 : :
634 heikki.linnakangas@i 440 : 2666 : dlist_push_head(&BackgroundWorkerList, &rw->rw_lnode);
441 : : }
442 : : }
443 : :
444 : : /*
445 : : * Forget about a background worker that's no longer needed.
446 : : *
447 : : * NOTE: The entry is unlinked from BackgroundWorkerList. If the caller is
448 : : * iterating through it, better use a mutable iterator!
449 : : *
450 : : * Caller is responsible for notifying bgw_notify_pid, if appropriate.
451 : : *
452 : : * This function must be invoked only in the postmaster.
453 : : */
454 : : void
455 : 2641 : ForgetBackgroundWorker(RegisteredBgWorker *rw)
456 : : {
457 : : BackgroundWorkerSlot *slot;
458 : :
4676 rhaas@postgresql.org 459 [ - + ]: 2641 : Assert(rw->rw_shmem_slot < max_worker_processes);
460 : 2641 : slot = &BackgroundWorkerData->slot[rw->rw_shmem_slot];
1816 tgl@sss.pgh.pa.us 461 [ - + ]: 2641 : Assert(slot->in_use);
462 : :
463 : : /*
464 : : * We need a memory barrier here to make sure that the update of
465 : : * parallel_terminate_count completes before the store to in_use.
466 : : */
3441 rhaas@postgresql.org 467 [ + + ]: 2641 : if ((rw->rw_worker.bgw_flags & BGWORKER_CLASS_PARALLEL) != 0)
468 : 2008 : BackgroundWorkerData->parallel_terminate_count++;
469 : :
1816 tgl@sss.pgh.pa.us 470 : 2641 : pg_memory_barrier();
4676 rhaas@postgresql.org 471 : 2641 : slot->in_use = false;
472 : :
3966 473 [ + + ]: 2641 : ereport(DEBUG1,
474 : : (errmsg_internal("unregistering background worker \"%s\"",
475 : : rw->rw_worker.bgw_name)));
476 : :
634 heikki.linnakangas@i 477 : 2641 : dlist_delete(&rw->rw_lnode);
939 478 : 2641 : pfree(rw);
4676 rhaas@postgresql.org 479 : 2641 : }
480 : :
481 : : /*
482 : : * Report the PID of a newly-launched background worker in shared memory.
483 : : *
484 : : * This function should only be called from the postmaster.
485 : : */
486 : : void
4633 487 : 3488 : ReportBackgroundWorkerPID(RegisteredBgWorker *rw)
488 : : {
489 : : BackgroundWorkerSlot *slot;
490 : :
491 [ - + ]: 3488 : Assert(rw->rw_shmem_slot < max_worker_processes);
492 : 3488 : slot = &BackgroundWorkerData->slot[rw->rw_shmem_slot];
493 : 3488 : slot->pid = rw->rw_pid;
494 : :
495 [ + + ]: 3488 : if (rw->rw_worker.bgw_notify_pid != 0)
496 : 2666 : kill(rw->rw_worker.bgw_notify_pid, SIGUSR1);
497 : 3488 : }
498 : :
499 : : /*
500 : : * Report that the PID of a background worker is now zero because a
501 : : * previously-running background worker has exited.
502 : : *
503 : : * NOTE: The entry may be unlinked from BackgroundWorkerList. If the caller
504 : : * is iterating through it, better use a mutable iterator!
505 : : *
506 : : * This function should only be called from the postmaster.
507 : : */
508 : : void
634 heikki.linnakangas@i 509 : 3151 : ReportBackgroundWorkerExit(RegisteredBgWorker *rw)
510 : : {
511 : : BackgroundWorkerSlot *slot;
512 : : int notify_pid;
513 : :
3350 rhaas@postgresql.org 514 [ - + ]: 3151 : Assert(rw->rw_shmem_slot < max_worker_processes);
515 : 3151 : slot = &BackgroundWorkerData->slot[rw->rw_shmem_slot];
516 : 3151 : slot->pid = rw->rw_pid;
3347 517 : 3151 : notify_pid = rw->rw_worker.bgw_notify_pid;
518 : :
519 : : /*
520 : : * If this worker is slated for deregistration, do that before notifying
521 : : * the process which started it. Otherwise, if that process tries to
522 : : * reuse the slot immediately, it might not be available yet. In theory
523 : : * that could happen anyway if the process checks slot->pid at just the
524 : : * wrong moment, but this makes the window narrower.
525 : : */
3350 526 [ + + ]: 3151 : if (rw->rw_terminate ||
527 [ + + ]: 769 : rw->rw_worker.bgw_restart_time == BGW_NEVER_RESTART)
634 heikki.linnakangas@i 528 : 2641 : ForgetBackgroundWorker(rw);
529 : :
3347 rhaas@postgresql.org 530 [ + + ]: 3151 : if (notify_pid != 0)
531 : 2590 : kill(notify_pid, SIGUSR1);
3350 532 : 3151 : }
533 : :
534 : : /*
535 : : * Cancel SIGUSR1 notifications for a PID belonging to an exiting backend.
536 : : *
537 : : * This function should only be called from the postmaster.
538 : : */
539 : : void
4633 540 : 336 : BackgroundWorkerStopNotifications(pid_t pid)
541 : : {
542 : : dlist_iter iter;
543 : :
634 heikki.linnakangas@i 544 [ + - + + ]: 1055 : dlist_foreach(iter, &BackgroundWorkerList)
545 : : {
546 : : RegisteredBgWorker *rw;
547 : :
548 : 719 : rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
4633 rhaas@postgresql.org 549 [ + + ]: 719 : if (rw->rw_worker.bgw_notify_pid == pid)
550 : 48 : rw->rw_worker.bgw_notify_pid = 0;
551 : : }
552 : 336 : }
553 : :
554 : : /*
555 : : * Cancel any not-yet-started worker requests that have waiting processes.
556 : : *
557 : : * This is called during a normal ("smart" or "fast") database shutdown.
558 : : * After this point, no new background workers will be started, so anything
559 : : * that might be waiting for them needs to be kicked off its wait. We do
560 : : * that by canceling the bgworker registration entirely, which is perhaps
561 : : * overkill, but since we're shutting down it does not matter whether the
562 : : * registration record sticks around.
563 : : *
564 : : * This function should only be called from the postmaster.
565 : : */
566 : : void
1958 tgl@sss.pgh.pa.us 567 : 635 : ForgetUnstartedBackgroundWorkers(void)
568 : : {
569 : : dlist_mutable_iter iter;
570 : :
634 heikki.linnakangas@i 571 [ + - + + ]: 1269 : dlist_foreach_modify(iter, &BackgroundWorkerList)
572 : : {
573 : : RegisteredBgWorker *rw;
574 : : BackgroundWorkerSlot *slot;
575 : :
576 : 634 : rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
1958 tgl@sss.pgh.pa.us 577 [ - + ]: 634 : Assert(rw->rw_shmem_slot < max_worker_processes);
578 : 634 : slot = &BackgroundWorkerData->slot[rw->rw_shmem_slot];
579 : :
580 : : /* If it's not yet started, and there's someone waiting ... */
581 [ + + ]: 634 : if (slot->pid == InvalidPid &&
582 [ - + ]: 64 : rw->rw_worker.bgw_notify_pid != 0)
583 : : {
584 : : /* ... then zap it, and notify the waiter */
1958 tgl@sss.pgh.pa.us 585 :UBC 0 : int notify_pid = rw->rw_worker.bgw_notify_pid;
586 : :
634 heikki.linnakangas@i 587 : 0 : ForgetBackgroundWorker(rw);
1958 tgl@sss.pgh.pa.us 588 [ # # ]: 0 : if (notify_pid != 0)
589 : 0 : kill(notify_pid, SIGUSR1);
590 : : }
591 : : }
1958 tgl@sss.pgh.pa.us 592 :CBC 635 : }
593 : :
594 : : /*
595 : : * Reset background worker crash state.
596 : : *
597 : : * We assume that, after a crash-and-restart cycle, background workers without
598 : : * the never-restart flag should be restarted immediately, instead of waiting
599 : : * for bgw_restart_time to elapse. On the other hand, workers with that flag
600 : : * should be forgotten immediately, since we won't ever restart them.
601 : : *
602 : : * This function should only be called from the postmaster.
603 : : */
604 : : void
4381 rhaas@postgresql.org 605 : 5 : ResetBackgroundWorkerCrashTimes(void)
606 : : {
607 : : dlist_mutable_iter iter;
608 : :
634 heikki.linnakangas@i 609 [ + - + + ]: 10 : dlist_foreach_modify(iter, &BackgroundWorkerList)
610 : : {
611 : : RegisteredBgWorker *rw;
612 : :
613 : 5 : rw = dlist_container(RegisteredBgWorker, rw_lnode, iter.cur);
614 : :
3311 rhaas@postgresql.org 615 [ - + ]: 5 : if (rw->rw_worker.bgw_restart_time == BGW_NEVER_RESTART)
616 : : {
617 : : /*
618 : : * Workers marked BGW_NEVER_RESTART shouldn't get relaunched after
619 : : * the crash, so forget about them. (If we wait until after the
620 : : * crash to forget about them, and they are parallel workers,
621 : : * parallel_terminate_count will get incremented after we've
622 : : * already zeroed parallel_register_count, which would be bad.)
623 : : */
634 heikki.linnakangas@i 624 :UBC 0 : ForgetBackgroundWorker(rw);
625 : : }
626 : : else
627 : : {
628 : : /*
629 : : * The accounting which we do via parallel_register_count and
630 : : * parallel_terminate_count would get messed up if a worker marked
631 : : * parallel could survive a crash and restart cycle. All such
632 : : * workers should be marked BGW_NEVER_RESTART, and thus control
633 : : * should never reach this branch.
634 : : */
3311 rhaas@postgresql.org 635 [ - + ]:CBC 5 : Assert((rw->rw_worker.bgw_flags & BGWORKER_CLASS_PARALLEL) == 0);
636 : :
637 : : /*
638 : : * Allow this worker to be restarted immediately after we finish
639 : : * resetting.
640 : : */
4051 641 : 5 : rw->rw_crashed_at = 0;
284 fujii@postgresql.org 642 : 5 : rw->rw_pid = 0;
643 : :
644 : : /*
645 : : * If there was anyone waiting for it, they're history.
646 : : */
1958 tgl@sss.pgh.pa.us 647 : 5 : rw->rw_worker.bgw_notify_pid = 0;
648 : : }
649 : : }
4381 rhaas@postgresql.org 650 : 5 : }
651 : :
652 : : /*
653 : : * Complain about the BackgroundWorker definition using error level elevel.
654 : : * Return true if it looks ok, false if not (unless elevel >= ERROR, in
655 : : * which case we won't return at all in the not-OK case).
656 : : */
657 : : static bool
4676 658 : 3491 : SanityCheckBackgroundWorker(BackgroundWorker *worker, int elevel)
659 : : {
660 : : /* sanity check for flags */
661 : :
662 : : /*
663 : : * We used to support workers not connected to shared memory, but don't
664 : : * anymore. Thus this is a required flag now. We're not removing the flag
665 : : * for compatibility reasons and because the flag still provides some
666 : : * signal when reading code.
667 : : */
1726 andres@anarazel.de 668 [ - + ]: 3491 : if (!(worker->bgw_flags & BGWORKER_SHMEM_ACCESS))
669 : : {
1726 andres@anarazel.de 670 [ # # ]:UBC 0 : ereport(elevel,
671 : : (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
672 : : errmsg("background worker \"%s\": background workers without shared memory access are not supported",
673 : : worker->bgw_name)));
674 : 0 : return false;
675 : : }
676 : :
1726 andres@anarazel.de 677 [ + + ]:CBC 3491 : if (worker->bgw_flags & BGWORKER_BACKEND_DATABASE_CONNECTION)
678 : : {
4676 rhaas@postgresql.org 679 [ - + ]: 3478 : if (worker->bgw_start_time == BgWorkerStart_PostmasterStart)
680 : : {
4676 rhaas@postgresql.org 681 [ # # ]:UBC 0 : ereport(elevel,
682 : : (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
683 : : errmsg("background worker \"%s\": cannot request database access if starting at postmaster start",
684 : : worker->bgw_name)));
685 : 0 : return false;
686 : : }
687 : :
688 : : /* XXX other checks? */
689 : : }
690 : :
691 : : /* Interruptible workers require a database connection */
119 michael@paquier.xyz 692 [ + + ]:GNC 3491 : if ((worker->bgw_flags & BGWORKER_INTERRUPTIBLE) &&
693 [ - + ]: 4 : !(worker->bgw_flags & BGWORKER_BACKEND_DATABASE_CONNECTION))
694 : : {
119 michael@paquier.xyz 695 [ # # ]:UNC 0 : ereport(elevel,
696 : : (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
697 : : errmsg("background worker \"%s\": cannot make background workers interruptible without database access",
698 : : worker->bgw_name)));
699 : 0 : return false;
700 : : }
701 : :
4676 rhaas@postgresql.org 702 [ + + ]:CBC 3491 : if ((worker->bgw_restart_time < 0 &&
703 [ + - ]: 2542 : worker->bgw_restart_time != BGW_NEVER_RESTART) ||
704 [ - + ]: 3491 : (worker->bgw_restart_time > USECS_PER_DAY / 1000))
705 : : {
4676 rhaas@postgresql.org 706 [ # # ]:UBC 0 : ereport(elevel,
707 : : (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
708 : : errmsg("background worker \"%s\": invalid restart interval",
709 : : worker->bgw_name)));
710 : 0 : return false;
711 : : }
712 : :
713 : : /*
714 : : * Parallel workers may not be configured for restart, because the
715 : : * parallel_register_count/parallel_terminate_count accounting can't
716 : : * handle parallel workers lasting through a crash-and-restart cycle.
717 : : */
3311 rhaas@postgresql.org 718 [ + + ]:CBC 3491 : if (worker->bgw_restart_time != BGW_NEVER_RESTART &&
719 [ - + ]: 949 : (worker->bgw_flags & BGWORKER_CLASS_PARALLEL) != 0)
720 : : {
3311 rhaas@postgresql.org 721 [ # # ]:UBC 0 : ereport(elevel,
722 : : (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
723 : : errmsg("background worker \"%s\": parallel workers may not be configured for restart",
724 : : worker->bgw_name)));
725 : 0 : return false;
726 : : }
727 : :
728 : : /*
729 : : * If bgw_type is not filled in, use bgw_name.
730 : : */
3169 peter_e@gmx.net 731 [ - + ]:CBC 3491 : if (strcmp(worker->bgw_type, "") == 0)
3169 peter_e@gmx.net 732 :UBC 0 : strcpy(worker->bgw_type, worker->bgw_name);
733 : :
4676 rhaas@postgresql.org 734 :CBC 3491 : return true;
735 : : }
736 : :
737 : : /*
738 : : * Main entry point for background worker processes.
739 : : */
740 : : void
438 peter@eisentraut.org 741 : 3169 : BackgroundWorkerMain(const void *startup_data, size_t startup_data_len)
742 : : {
743 : : sigjmp_buf local_sigjmp_buf;
744 : : BackgroundWorker *worker;
745 : : bgworker_main_type entrypt;
746 : :
778 heikki.linnakangas@i 747 [ - + ]: 3169 : if (startup_data == NULL)
4645 rhaas@postgresql.org 748 [ # # ]:UBC 0 : elog(FATAL, "unable to find bgworker entry");
778 heikki.linnakangas@i 749 [ - + ]:CBC 3169 : Assert(startup_data_len == sizeof(BackgroundWorker));
750 : 3169 : worker = MemoryContextAlloc(TopMemoryContext, sizeof(BackgroundWorker));
751 : 3169 : memcpy(worker, startup_data, sizeof(BackgroundWorker));
752 : :
753 : : /*
754 : : * Now that we're done reading the startup data, release postmaster's
755 : : * working memory context.
756 : : */
757 [ + - ]: 3169 : if (PostmasterContext)
758 : : {
759 : 3169 : MemoryContextDelete(PostmasterContext);
760 : 3169 : PostmasterContext = NULL;
761 : : }
762 : :
763 : 3169 : MyBgworkerEntry = worker;
2246 peter@eisentraut.org 764 : 3169 : init_ps_display(worker->bgw_name);
765 : :
672 heikki.linnakangas@i 766 [ - + ]: 3169 : Assert(GetProcessingMode() == InitProcessing);
767 : :
768 : : /* Apply PostAuthDelay */
4645 rhaas@postgresql.org 769 [ - + ]: 3169 : if (PostAuthDelay > 0)
4645 rhaas@postgresql.org 770 :UBC 0 : pg_usleep(PostAuthDelay * 1000000L);
771 : :
772 : : /*
773 : : * Set up signal handlers.
774 : : */
4645 rhaas@postgresql.org 775 [ + + ]:CBC 3169 : if (worker->bgw_flags & BGWORKER_BACKEND_DATABASE_CONNECTION)
776 : : {
777 : : /*
778 : : * SIGINT is used to signal canceling the current action
779 : : */
780 : 3156 : pqsignal(SIGINT, StatementCancelHandler);
781 : 3156 : pqsignal(SIGUSR1, procsignal_sigusr1_handler);
782 : 3156 : pqsignal(SIGFPE, FloatExceptionHandler);
783 : :
784 : : /* XXX Any other handlers needed here? */
785 : : }
786 : : else
787 : : {
21 andrew@dunslane.net 788 :GNC 13 : pqsignal(SIGINT, PG_SIG_IGN);
789 : 13 : pqsignal(SIGUSR1, PG_SIG_IGN);
790 : 13 : pqsignal(SIGFPE, PG_SIG_IGN);
791 : : }
76 heikki.linnakangas@i 792 : 3169 : pqsignal(SIGTERM, die);
793 : : /* SIGQUIT handler was already set up by InitPostmasterChild */
21 andrew@dunslane.net 794 : 3169 : pqsignal(SIGHUP, PG_SIG_IGN);
795 : :
4382 bruce@momjian.us 796 :CBC 3169 : InitializeTimeouts(); /* establishes SIGALRM handler */
797 : :
21 andrew@dunslane.net 798 :GNC 3169 : pqsignal(SIGPIPE, PG_SIG_IGN);
799 : 3169 : pqsignal(SIGUSR2, PG_SIG_IGN);
800 : 3169 : pqsignal(SIGCHLD, PG_SIG_DFL);
801 : :
802 : : /*
803 : : * If an exception is encountered, processing resumes here.
804 : : *
805 : : * We just need to clean up, report the error, and go away.
806 : : */
4645 rhaas@postgresql.org 807 [ + + ]:CBC 3169 : if (sigsetjmp(local_sigjmp_buf, 1) != 0)
808 : : {
809 : : /* Since not using PG_TRY, must reset error stack by hand */
810 : 154 : error_context_stack = NULL;
811 : :
812 : : /* Prevent interrupts while cleaning up */
813 : 154 : HOLD_INTERRUPTS();
814 : :
815 : : /*
816 : : * sigsetjmp will have blocked all signals, but we may need to accept
817 : : * signals while communicating with our parallel leader. Once we've
818 : : * done HOLD_INTERRUPTS() it should be safe to unblock signals.
819 : : */
2070 tgl@sss.pgh.pa.us 820 : 154 : BackgroundWorkerUnblockSignals();
821 : :
822 : : /* Report the error to the parallel leader and the server log */
4645 rhaas@postgresql.org 823 : 154 : EmitErrorReport();
824 : :
825 : : /*
826 : : * Do we need more cleanup here? For shmem-connected bgworkers, we
827 : : * will call InitProcess below, which will install ProcKill as exit
828 : : * callback. That will take care of releasing locks, etc.
829 : : */
830 : :
831 : : /* and go away */
832 : 154 : proc_exit(1);
833 : : }
834 : :
835 : : /* We can now handle ereport(ERROR) */
836 : 3169 : PG_exception_stack = &local_sigjmp_buf;
837 : :
838 : : /*
839 : : * Create a per-backend PGPROC struct in shared memory. We must do this
840 : : * before we can use LWLocks or access any shared memory.
841 : : */
1726 andres@anarazel.de 842 : 3169 : InitProcess();
843 : :
844 : : /*
845 : : * Early initialization.
846 : : */
847 : 3169 : BaseInit();
848 : :
849 : : /*
850 : : * Look up the entry point function, loading its library if necessary.
851 : : */
3308 tgl@sss.pgh.pa.us 852 : 6338 : entrypt = LookupBackgroundWorkerFunction(worker->bgw_library_name,
853 : 3169 : worker->bgw_function_name);
854 : :
855 : : /*
856 : : * Note that in normal processes, we would call InitPostgres here. For a
857 : : * worker, however, we don't know what database to connect to, yet; so we
858 : : * need to wait until the user code does it via
859 : : * BackgroundWorkerInitializeConnection().
860 : : */
861 : :
862 : : /*
863 : : * Now invoke the user-defined worker code
864 : : */
4645 rhaas@postgresql.org 865 : 3169 : entrypt(worker->bgw_main_arg);
866 : :
867 : : /* ... and if it returns, we're done */
868 : 2039 : proc_exit(0);
869 : : }
870 : :
871 : : /*
872 : : * Connect background worker to a database.
873 : : */
874 : : void
672 heikki.linnakangas@i 875 : 513 : BackgroundWorkerInitializeConnection(const char *dbname, const char *username, uint32 flags)
876 : : {
877 : 513 : BackgroundWorker *worker = MyBgworkerEntry;
36 nathan@postgresql.or 878 :GNC 513 : uint32 init_flags = 0; /* never honor session_preload_libraries */
879 : :
880 : : /* ignore datallowconn and ACL_CONNECT? */
672 heikki.linnakangas@i 881 [ - + ]:CBC 513 : if (flags & BGWORKER_BYPASS_ALLOWCONN)
672 heikki.linnakangas@i 882 :UBC 0 : init_flags |= INIT_PG_OVERRIDE_ALLOW_CONNS;
883 : : /* ignore rolcanlogin? */
672 heikki.linnakangas@i 884 [ - + ]:CBC 513 : if (flags & BGWORKER_BYPASS_ROLELOGINCHECK)
672 heikki.linnakangas@i 885 :UBC 0 : init_flags |= INIT_PG_OVERRIDE_ROLE_LOGIN;
886 : :
887 : : /* XXX is this the right errcode? */
672 heikki.linnakangas@i 888 [ - + ]:CBC 513 : if (!(worker->bgw_flags & BGWORKER_BACKEND_DATABASE_CONNECTION))
672 heikki.linnakangas@i 889 [ # # ]:UBC 0 : ereport(FATAL,
890 : : (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED),
891 : : errmsg("database connection requirement not indicated during registration")));
892 : :
672 heikki.linnakangas@i 893 :CBC 513 : InitPostgres(dbname, InvalidOid, /* database to connect to */
894 : : username, InvalidOid, /* role to connect as */
895 : : init_flags,
896 : : NULL); /* no out_dbname */
897 : :
898 : : /* it had better not gotten out of "init" mode yet */
899 [ - + ]: 513 : if (!IsInitProcessingMode())
672 heikki.linnakangas@i 900 [ # # ]:UBC 0 : ereport(ERROR,
901 : : (errmsg("invalid processing mode in background worker")));
672 heikki.linnakangas@i 902 :CBC 513 : SetProcessingMode(NormalProcessing);
903 : 513 : }
904 : :
905 : : /*
906 : : * Connect background worker to a database using OIDs.
907 : : */
908 : : void
909 : 2643 : BackgroundWorkerInitializeConnectionByOid(Oid dboid, Oid useroid, uint32 flags)
910 : : {
911 : 2643 : BackgroundWorker *worker = MyBgworkerEntry;
36 nathan@postgresql.or 912 :GNC 2643 : uint32 init_flags = 0; /* never honor session_preload_libraries */
913 : :
914 : : /* ignore datallowconn and ACL_CONNECT? */
672 heikki.linnakangas@i 915 [ + + ]:CBC 2643 : if (flags & BGWORKER_BYPASS_ALLOWCONN)
916 : 2028 : init_flags |= INIT_PG_OVERRIDE_ALLOW_CONNS;
917 : : /* ignore rolcanlogin? */
918 [ + + ]: 2643 : if (flags & BGWORKER_BYPASS_ROLELOGINCHECK)
919 : 2011 : init_flags |= INIT_PG_OVERRIDE_ROLE_LOGIN;
920 : :
921 : : /* XXX is this the right errcode? */
922 [ - + ]: 2643 : if (!(worker->bgw_flags & BGWORKER_BACKEND_DATABASE_CONNECTION))
672 heikki.linnakangas@i 923 [ # # ]:UBC 0 : ereport(FATAL,
924 : : (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED),
925 : : errmsg("database connection requirement not indicated during registration")));
926 : :
672 heikki.linnakangas@i 927 :CBC 2643 : InitPostgres(NULL, dboid, /* database to connect to */
928 : : NULL, useroid, /* role to connect as */
929 : : init_flags,
930 : : NULL); /* no out_dbname */
931 : :
932 : : /* it had better not gotten out of "init" mode yet */
933 [ - + ]: 2636 : if (!IsInitProcessingMode())
672 heikki.linnakangas@i 934 [ # # ]:UBC 0 : ereport(ERROR,
935 : : (errmsg("invalid processing mode in background worker")));
672 heikki.linnakangas@i 936 :CBC 2636 : SetProcessingMode(NormalProcessing);
937 : 2636 : }
938 : :
939 : : /*
940 : : * Block/unblock signals in a background worker
941 : : */
942 : : void
672 heikki.linnakangas@i 943 :UBC 0 : BackgroundWorkerBlockSignals(void)
944 : : {
945 : 0 : sigprocmask(SIG_SETMASK, &BlockSig, NULL);
946 : 0 : }
947 : :
948 : : void
672 heikki.linnakangas@i 949 :CBC 3323 : BackgroundWorkerUnblockSignals(void)
950 : : {
951 : 3323 : sigprocmask(SIG_SETMASK, &UnBlockSig, NULL);
952 : 3323 : }
953 : :
954 : : /*
955 : : * Register a new static background worker.
956 : : *
957 : : * This can only be called directly from postmaster or in the _PG_init
958 : : * function of a module library that's loaded by shared_preload_libraries;
959 : : * otherwise it will have no effect.
960 : : */
961 : : void
4676 rhaas@postgresql.org 962 : 952 : RegisterBackgroundWorker(BackgroundWorker *worker)
963 : : {
964 : : RegisteredBgWorker *rw;
965 : : static int numworkers = 0;
966 : :
967 : : /*
968 : : * Static background workers can only be registered in the postmaster
969 : : * process.
970 : : */
939 heikki.linnakangas@i 971 [ + - - + ]: 952 : if (IsUnderPostmaster || !IsPostmasterEnvironment)
972 : : {
973 : : /*
974 : : * In EXEC_BACKEND or single-user mode, we process
975 : : * shared_preload_libraries in backend processes too. We cannot
976 : : * register static background workers at that stage, but many
977 : : * libraries' _PG_init() functions don't distinguish whether they're
978 : : * being loaded in the postmaster or in a backend, they just check
979 : : * process_shared_preload_libraries_in_progress. It's a bit sloppy,
980 : : * but for historical reasons we tolerate it. In EXEC_BACKEND mode,
981 : : * the background workers should already have been registered when the
982 : : * library was loaded in postmaster.
983 : : */
939 heikki.linnakangas@i 984 [ # # ]:UBC 0 : if (process_shared_preload_libraries_in_progress)
985 : 0 : return;
986 [ # # ]: 0 : ereport(LOG,
987 : : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
988 : : errmsg("background worker \"%s\": must be registered in \"shared_preload_libraries\"",
989 : : worker->bgw_name)));
4676 rhaas@postgresql.org 990 : 0 : return;
991 : : }
992 : :
993 : : /*
994 : : * Cannot register static background workers after calling
995 : : * BackgroundWorkerShmemInit().
996 : : */
939 heikki.linnakangas@i 997 [ - + ]:CBC 952 : if (BackgroundWorkerData != NULL)
939 heikki.linnakangas@i 998 [ # # ]:UBC 0 : elog(ERROR, "cannot register background worker \"%s\" after shmem init",
999 : : worker->bgw_name);
1000 : :
939 heikki.linnakangas@i 1001 [ + + ]:CBC 952 : ereport(DEBUG1,
1002 : : (errmsg_internal("registering background worker \"%s\"", worker->bgw_name)));
1003 : :
4676 rhaas@postgresql.org 1004 [ - + ]: 952 : if (!SanityCheckBackgroundWorker(worker, LOG))
4676 rhaas@postgresql.org 1005 :UBC 0 : return;
1006 : :
4633 rhaas@postgresql.org 1007 [ - + ]:CBC 952 : if (worker->bgw_notify_pid != 0)
1008 : : {
4633 rhaas@postgresql.org 1009 [ # # ]:UBC 0 : ereport(LOG,
1010 : : (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
1011 : : errmsg("background worker \"%s\": only dynamic background workers can request notification",
1012 : : worker->bgw_name)));
1013 : 0 : return;
1014 : : }
1015 : :
1016 : : /*
1017 : : * Enforce maximum number of workers. Note this is overly restrictive: we
1018 : : * could allow more non-shmem-connected workers, because these don't count
1019 : : * towards the MAX_BACKENDS limit elsewhere. For now, it doesn't seem
1020 : : * important to relax this restriction.
1021 : : */
4676 rhaas@postgresql.org 1022 [ - + ]:CBC 952 : if (++numworkers > max_worker_processes)
1023 : : {
4676 rhaas@postgresql.org 1024 [ # # ]:UBC 0 : ereport(LOG,
1025 : : (errcode(ERRCODE_CONFIGURATION_LIMIT_EXCEEDED),
1026 : : errmsg("too many background workers"),
1027 : : errdetail_plural("Up to %d background worker can be registered with the current settings.",
1028 : : "Up to %d background workers can be registered with the current settings.",
1029 : : max_worker_processes,
1030 : : max_worker_processes),
1031 : : errhint("Consider increasing the configuration parameter \"%s\".", "max_worker_processes")));
1032 : 0 : return;
1033 : : }
1034 : :
1035 : : /*
1036 : : * Copy the registration data into the registered workers list.
1037 : : */
939 heikki.linnakangas@i 1038 :CBC 952 : rw = MemoryContextAllocExtended(PostmasterContext,
1039 : : sizeof(RegisteredBgWorker),
1040 : : MCXT_ALLOC_NO_OOM);
4676 rhaas@postgresql.org 1041 [ - + ]: 952 : if (rw == NULL)
1042 : : {
4676 rhaas@postgresql.org 1043 [ # # ]:UBC 0 : ereport(LOG,
1044 : : (errcode(ERRCODE_OUT_OF_MEMORY),
1045 : : errmsg("out of memory")));
1046 : 0 : return;
1047 : : }
1048 : :
4676 rhaas@postgresql.org 1049 :CBC 952 : rw->rw_worker = *worker;
1050 : 952 : rw->rw_pid = 0;
1051 : 952 : rw->rw_crashed_at = 0;
4582 1052 : 952 : rw->rw_terminate = false;
1053 : :
634 heikki.linnakangas@i 1054 : 952 : dlist_push_head(&BackgroundWorkerList, &rw->rw_lnode);
1055 : : }
1056 : :
1057 : : /*
1058 : : * Register a new background worker from a regular backend.
1059 : : *
1060 : : * Returns true on success and false on failure. Failure typically indicates
1061 : : * that no background worker slots are currently available.
1062 : : *
1063 : : * If handle != NULL, we'll set *handle to a pointer that can subsequently
1064 : : * be used as an argument to GetBackgroundWorkerPid(). The caller can
1065 : : * free this pointer using pfree(), if desired.
1066 : : */
1067 : : bool
4633 rhaas@postgresql.org 1068 : 2539 : RegisterDynamicBackgroundWorker(BackgroundWorker *worker,
1069 : : BackgroundWorkerHandle **handle)
1070 : : {
1071 : : int slotno;
4382 bruce@momjian.us 1072 : 2539 : bool success = false;
1073 : : bool parallel;
1074 : 2539 : uint64 generation = 0;
1075 : :
1076 : : /*
1077 : : * We can't register dynamic background workers from the postmaster. If
1078 : : * this is a standalone backend, we're the only process and can't start
1079 : : * any more. In a multi-process environment, it might be theoretically
1080 : : * possible, but we don't currently support it due to locking
1081 : : * considerations; see comments on the BackgroundWorkerSlot data
1082 : : * structure.
1083 : : */
4676 rhaas@postgresql.org 1084 [ - + ]: 2539 : if (!IsUnderPostmaster)
4676 rhaas@postgresql.org 1085 :UBC 0 : return false;
1086 : :
4676 rhaas@postgresql.org 1087 [ - + ]:CBC 2539 : if (!SanityCheckBackgroundWorker(worker, ERROR))
4676 rhaas@postgresql.org 1088 :UBC 0 : return false;
1089 : :
3441 rhaas@postgresql.org 1090 :CBC 2539 : parallel = (worker->bgw_flags & BGWORKER_CLASS_PARALLEL) != 0;
1091 : :
4676 1092 : 2539 : LWLockAcquire(BackgroundWorkerLock, LW_EXCLUSIVE);
1093 : :
1094 : : /*
1095 : : * If this is a parallel worker, check whether there are already too many
1096 : : * parallel workers; if so, don't register another one. Our view of
1097 : : * parallel_terminate_count may be slightly stale, but that doesn't really
1098 : : * matter: we would have gotten the same result if we'd arrived here
1099 : : * slightly earlier anyway. There's no help for it, either, since the
1100 : : * postmaster must not take locks; a memory barrier wouldn't guarantee
1101 : : * anything useful.
1102 : : */
3441 1103 [ + + ]: 2539 : if (parallel && (BackgroundWorkerData->parallel_register_count -
1104 [ + + ]: 2027 : BackgroundWorkerData->parallel_terminate_count) >=
1105 : : max_parallel_workers)
1106 : : {
3311 1107 [ - + ]: 13 : Assert(BackgroundWorkerData->parallel_register_count -
1108 : : BackgroundWorkerData->parallel_terminate_count <=
1109 : : MAX_PARALLEL_WORKER_LIMIT);
3441 1110 : 13 : LWLockRelease(BackgroundWorkerLock);
1111 : 13 : return false;
1112 : : }
1113 : :
1114 : : /*
1115 : : * Look for an unused slot. If we find one, grab it.
1116 : : */
4676 1117 [ + + ]: 7976 : for (slotno = 0; slotno < BackgroundWorkerData->total_slots; ++slotno)
1118 : : {
1119 : 7970 : BackgroundWorkerSlot *slot = &BackgroundWorkerData->slot[slotno];
1120 : :
1121 [ + + ]: 7970 : if (!slot->in_use)
1122 : : {
1123 : 2520 : memcpy(&slot->worker, worker, sizeof(BackgroundWorker));
3240 tgl@sss.pgh.pa.us 1124 : 2520 : slot->pid = InvalidPid; /* indicates not started yet */
4633 rhaas@postgresql.org 1125 : 2520 : slot->generation++;
4582 1126 : 2520 : slot->terminate = false;
4633 1127 : 2520 : generation = slot->generation;
3441 1128 [ + + ]: 2520 : if (parallel)
1129 : 2008 : BackgroundWorkerData->parallel_register_count++;
1130 : :
1131 : : /*
1132 : : * Make sure postmaster doesn't see the slot as in use before it
1133 : : * sees the new contents.
1134 : : */
4676 1135 : 2520 : pg_write_barrier();
1136 : :
1137 : 2520 : slot->in_use = true;
1138 : 2520 : success = true;
1139 : 2520 : break;
1140 : : }
1141 : : }
1142 : :
1143 : 2526 : LWLockRelease(BackgroundWorkerLock);
1144 : :
1145 : : /* If we found a slot, tell the postmaster to notice the change. */
1146 [ + + ]: 2526 : if (success)
1147 : 2520 : SendPostmasterSignal(PMSIGNAL_BACKGROUND_WORKER_CHANGE);
1148 : :
1149 : : /*
1150 : : * If we found a slot and the user has provided a handle, initialize it.
1151 : : */
4633 1152 [ + + + - ]: 2526 : if (success && handle)
1153 : : {
146 michael@paquier.xyz 1154 :GNC 2520 : *handle = palloc_object(BackgroundWorkerHandle);
4633 rhaas@postgresql.org 1155 :CBC 2520 : (*handle)->slot = slotno;
1156 : 2520 : (*handle)->generation = generation;
1157 : : }
1158 : :
4676 1159 : 2526 : return success;
1160 : : }
1161 : :
1162 : : /*
1163 : : * Get the PID of a dynamically-registered background worker.
1164 : : *
1165 : : * If the worker is determined to be running, the return value will be
1166 : : * BGWH_STARTED and *pidp will get the PID of the worker process. If the
1167 : : * postmaster has not yet attempted to start the worker, the return value will
1168 : : * be BGWH_NOT_YET_STARTED. Otherwise, the return value is BGWH_STOPPED.
1169 : : *
1170 : : * BGWH_STOPPED can indicate either that the worker is temporarily stopped
1171 : : * (because it is configured for automatic restart and exited non-zero),
1172 : : * or that the worker is permanently stopped (because it exited with exit
1173 : : * code 0, or was not configured for automatic restart), or even that the
1174 : : * worker was unregistered without ever starting (either because startup
1175 : : * failed and the worker is not configured for automatic restart, or because
1176 : : * TerminateBackgroundWorker was used before the worker was successfully
1177 : : * started).
1178 : : */
1179 : : BgwHandleStatus
4633 1180 : 4261523 : GetBackgroundWorkerPid(BackgroundWorkerHandle *handle, pid_t *pidp)
1181 : : {
1182 : : BackgroundWorkerSlot *slot;
1183 : : pid_t pid;
1184 : :
1185 [ - + ]: 4261523 : Assert(handle->slot < max_worker_processes);
1186 : 4261523 : slot = &BackgroundWorkerData->slot[handle->slot];
1187 : :
1188 : : /*
1189 : : * We could probably arrange to synchronize access to data using memory
1190 : : * barriers only, but for now, let's just keep it simple and grab the
1191 : : * lock. It seems unlikely that there will be enough traffic here to
1192 : : * result in meaningful contention.
1193 : : */
1194 : 4261523 : LWLockAcquire(BackgroundWorkerLock, LW_SHARED);
1195 : :
1196 : : /*
1197 : : * The generation number can't be concurrently changed while we hold the
1198 : : * lock. The pid, which is updated by the postmaster, can change at any
1199 : : * time, but we assume such changes are atomic. So the value we read
1200 : : * won't be garbage, but it might be out of date by the time the caller
1201 : : * examines it (but that's unavoidable anyway).
1202 : : *
1203 : : * The in_use flag could be in the process of changing from true to false,
1204 : : * but if it is already false then it can't change further.
1205 : : */
3072 1206 [ + + + + ]: 4261523 : if (handle->generation != slot->generation || !slot->in_use)
4633 1207 : 2031 : pid = 0;
1208 : : else
1209 : 4259492 : pid = slot->pid;
1210 : :
1211 : : /* All done. */
1212 : 4261523 : LWLockRelease(BackgroundWorkerLock);
1213 : :
1214 [ + + ]: 4261523 : if (pid == 0)
1215 : 2031 : return BGWH_STOPPED;
1216 [ + + ]: 4259492 : else if (pid == InvalidPid)
1217 : 191968 : return BGWH_NOT_YET_STARTED;
1218 : 4067524 : *pidp = pid;
1219 : 4067524 : return BGWH_STARTED;
1220 : : }
1221 : :
1222 : : /*
1223 : : * Wait for a background worker to start up.
1224 : : *
1225 : : * This is like GetBackgroundWorkerPid(), except that if the worker has not
1226 : : * yet started, we wait for it to do so; thus, BGWH_NOT_YET_STARTED is never
1227 : : * returned. However, if the postmaster has died, we give up and return
1228 : : * BGWH_POSTMASTER_DIED, since it that case we know that startup will not
1229 : : * take place.
1230 : : *
1231 : : * The caller *must* have set our PID as the worker's bgw_notify_pid,
1232 : : * else we will not be awoken promptly when the worker's state changes.
1233 : : */
1234 : : BgwHandleStatus
1235 : 32 : WaitForBackgroundWorkerStartup(BackgroundWorkerHandle *handle, pid_t *pidp)
1236 : : {
1237 : : BgwHandleStatus status;
1238 : : int rc;
1239 : :
1240 : : for (;;)
1241 : 31 : {
1242 : : pid_t pid;
1243 : :
3861 1244 [ - + ]: 63 : CHECK_FOR_INTERRUPTS();
1245 : :
1246 : 63 : status = GetBackgroundWorkerPid(handle, &pid);
1247 [ + + ]: 63 : if (status == BGWH_STARTED)
1248 : 32 : *pidp = pid;
1249 [ + + ]: 63 : if (status != BGWH_NOT_YET_STARTED)
1250 : 32 : break;
1251 : :
1252 : 31 : rc = WaitLatch(MyLatch,
1253 : : WL_LATCH_SET | WL_POSTMASTER_DEATH, 0,
1254 : : WAIT_EVENT_BGWORKER_STARTUP);
1255 : :
1256 [ - + ]: 31 : if (rc & WL_POSTMASTER_DEATH)
1257 : : {
3861 rhaas@postgresql.org 1258 :UBC 0 : status = BGWH_POSTMASTER_DIED;
1259 : 0 : break;
1260 : : }
1261 : :
3861 rhaas@postgresql.org 1262 :CBC 31 : ResetLatch(MyLatch);
1263 : : }
1264 : :
4023 1265 : 32 : return status;
1266 : : }
1267 : :
1268 : : /*
1269 : : * Wait for a background worker to stop.
1270 : : *
1271 : : * If the worker hasn't yet started, or is running, we wait for it to stop
1272 : : * and then return BGWH_STOPPED. However, if the postmaster has died, we give
1273 : : * up and return BGWH_POSTMASTER_DIED, because it's the postmaster that
1274 : : * notifies us when a worker's state changes.
1275 : : *
1276 : : * The caller *must* have set our PID as the worker's bgw_notify_pid,
1277 : : * else we will not be awoken promptly when the worker's state changes.
1278 : : */
1279 : : BgwHandleStatus
1280 : 2032 : WaitForBackgroundWorkerShutdown(BackgroundWorkerHandle *handle)
1281 : : {
1282 : : BgwHandleStatus status;
1283 : : int rc;
1284 : :
1285 : : for (;;)
1286 : 2321 : {
1287 : : pid_t pid;
1288 : :
3861 1289 [ + + ]: 4353 : CHECK_FOR_INTERRUPTS();
1290 : :
1291 : 4352 : status = GetBackgroundWorkerPid(handle, &pid);
1292 [ + + ]: 4352 : if (status == BGWH_STOPPED)
3561 tgl@sss.pgh.pa.us 1293 : 2031 : break;
1294 : :
3255 andres@anarazel.de 1295 : 2321 : rc = WaitLatch(MyLatch,
1296 : : WL_LATCH_SET | WL_POSTMASTER_DEATH, 0,
1297 : : WAIT_EVENT_BGWORKER_SHUTDOWN);
1298 : :
3861 rhaas@postgresql.org 1299 [ - + ]: 2321 : if (rc & WL_POSTMASTER_DEATH)
1300 : : {
3561 tgl@sss.pgh.pa.us 1301 :UBC 0 : status = BGWH_POSTMASTER_DIED;
1302 : 0 : break;
1303 : : }
1304 : :
3255 andres@anarazel.de 1305 :CBC 2321 : ResetLatch(MyLatch);
1306 : : }
1307 : :
4633 rhaas@postgresql.org 1308 : 2031 : return status;
1309 : : }
1310 : :
1311 : : /*
1312 : : * Instruct the postmaster to terminate a background worker.
1313 : : *
1314 : : * Note that it's safe to do this without regard to whether the worker is
1315 : : * still running, or even if the worker may already have exited and been
1316 : : * unregistered.
1317 : : */
1318 : : void
4582 1319 : 11 : TerminateBackgroundWorker(BackgroundWorkerHandle *handle)
1320 : : {
1321 : : BackgroundWorkerSlot *slot;
4382 bruce@momjian.us 1322 : 11 : bool signal_postmaster = false;
1323 : :
4582 rhaas@postgresql.org 1324 [ - + ]: 11 : Assert(handle->slot < max_worker_processes);
1325 : 11 : slot = &BackgroundWorkerData->slot[handle->slot];
1326 : :
1327 : : /* Set terminate flag in shared memory, unless slot has been reused. */
1328 : 11 : LWLockAcquire(BackgroundWorkerLock, LW_EXCLUSIVE);
1329 [ + - ]: 11 : if (handle->generation == slot->generation)
1330 : : {
1331 : 11 : slot->terminate = true;
1332 : 11 : signal_postmaster = true;
1333 : : }
1334 : 11 : LWLockRelease(BackgroundWorkerLock);
1335 : :
1336 : : /* Make sure the postmaster notices the change to shared memory. */
1337 [ + - ]: 11 : if (signal_postmaster)
1338 : 11 : SendPostmasterSignal(PMSIGNAL_BACKGROUND_WORKER_CHANGE);
1339 : 11 : }
1340 : :
1341 : : /*
1342 : : * Look up (and possibly load) a bgworker entry point function.
1343 : : *
1344 : : * For functions contained in the core code, we use library name "postgres"
1345 : : * and consult the InternalBGWorkers array. External functions are
1346 : : * looked up, and loaded if necessary, using load_external_function().
1347 : : *
1348 : : * The point of this is to pass function names as strings across process
1349 : : * boundaries. We can't pass actual function addresses because of the
1350 : : * possibility that the function has been loaded at a different address
1351 : : * in a different process. This is obviously a hazard for functions in
1352 : : * loadable libraries, but it can happen even for functions in the core code
1353 : : * on platforms using EXEC_BACKEND (e.g., Windows).
1354 : : *
1355 : : * At some point it might be worthwhile to get rid of InternalBGWorkers[]
1356 : : * in favor of applying load_external_function() for core functions too;
1357 : : * but that raises portability issues that are not worth addressing now.
1358 : : */
1359 : : static bgworker_main_type
3308 tgl@sss.pgh.pa.us 1360 : 3169 : LookupBackgroundWorkerFunction(const char *libraryname, const char *funcname)
1361 : : {
1362 : : /*
1363 : : * If the function is to be loaded from postgres itself, search the
1364 : : * InternalBGWorkers array.
1365 : : */
1366 [ + + ]: 3169 : if (strcmp(libraryname, "postgres") == 0)
1367 : : {
1368 : : int i;
1369 : :
1370 [ + - ]: 11140 : for (i = 0; i < lengthof(InternalBGWorkers); i++)
1371 : : {
1372 [ + + ]: 11140 : if (strcmp(InternalBGWorkers[i].fn_name, funcname) == 0)
1373 : 3147 : return InternalBGWorkers[i].fn_addr;
1374 : : }
1375 : :
1376 : : /* We can only reach this by programming error. */
3308 tgl@sss.pgh.pa.us 1377 [ # # ]:UBC 0 : elog(ERROR, "internal function \"%s\" not found", funcname);
1378 : : }
1379 : :
1380 : : /* Otherwise load from external library. */
3308 tgl@sss.pgh.pa.us 1381 :CBC 22 : return (bgworker_main_type)
1382 : 22 : load_external_function(libraryname, funcname, true, NULL);
1383 : : }
1384 : :
1385 : : /*
1386 : : * Given a PID, get the bgw_type of the background worker. Returns NULL if
1387 : : * not a valid background worker.
1388 : : *
1389 : : * The return value is in static memory belonging to this function, so it has
1390 : : * to be used before calling this function again. This is so that the caller
1391 : : * doesn't have to worry about the background worker locking protocol.
1392 : : */
1393 : : const char *
3169 peter_e@gmx.net 1394 : 864 : GetBackgroundWorkerTypeByPid(pid_t pid)
1395 : : {
1396 : : int slotno;
1397 : 864 : bool found = false;
1398 : : static char result[BGW_MAXLEN];
1399 : :
1400 : 864 : LWLockAcquire(BackgroundWorkerLock, LW_SHARED);
1401 : :
1402 [ + - ]: 997 : for (slotno = 0; slotno < BackgroundWorkerData->total_slots; slotno++)
1403 : : {
1404 : 997 : BackgroundWorkerSlot *slot = &BackgroundWorkerData->slot[slotno];
1405 : :
1406 [ + + + + ]: 997 : if (slot->pid > 0 && slot->pid == pid)
1407 : : {
1408 : 864 : strcpy(result, slot->worker.bgw_type);
1409 : 864 : found = true;
1410 : 864 : break;
1411 : : }
1412 : : }
1413 : :
1414 : 864 : LWLockRelease(BackgroundWorkerLock);
1415 : :
1416 [ - + ]: 864 : if (!found)
3169 peter_e@gmx.net 1417 :UBC 0 : return NULL;
1418 : :
3169 peter_e@gmx.net 1419 :CBC 864 : return result;
1420 : : }
1421 : :
1422 : : /*
1423 : : * Terminate all background workers connected to the given database, if the
1424 : : * workers can be interrupted.
1425 : : */
1426 : : void
119 michael@paquier.xyz 1427 :GNC 7 : TerminateBackgroundWorkersForDatabase(Oid databaseId)
1428 : : {
1429 : 7 : bool signal_postmaster = false;
1430 : :
47 1431 [ + - ]: 7 : elog(DEBUG1, "attempting worker termination for database %u",
1432 : : databaseId);
1433 : :
119 1434 : 7 : LWLockAcquire(BackgroundWorkerLock, LW_EXCLUSIVE);
1435 : :
1436 : : /*
1437 : : * Iterate through slots, looking for workers connected to the given
1438 : : * database.
1439 : : */
1440 [ + + ]: 63 : for (int slotno = 0; slotno < BackgroundWorkerData->total_slots; slotno++)
1441 : : {
1442 : 56 : BackgroundWorkerSlot *slot = &BackgroundWorkerData->slot[slotno];
1443 : :
1444 [ + + ]: 56 : if (slot->in_use &&
1445 [ + + ]: 14 : (slot->worker.bgw_flags & BGWORKER_INTERRUPTIBLE))
1446 : : {
1447 : 4 : PGPROC *proc = BackendPidGetProc(slot->pid);
1448 : :
1449 [ + - + - ]: 4 : if (proc && proc->databaseId == databaseId)
1450 : : {
1451 : 4 : slot->terminate = true;
1452 : 4 : signal_postmaster = true;
1453 : :
47 1454 [ + - ]: 4 : elog(DEBUG1, "termination requested for worker (PID %d) on database %u",
1455 : : (int) slot->pid, databaseId);
1456 : : }
1457 : : }
1458 : : }
1459 : :
119 1460 : 7 : LWLockRelease(BackgroundWorkerLock);
1461 : :
1462 : : /* Make sure the postmaster notices the change to shared memory. */
1463 [ + + ]: 7 : if (signal_postmaster)
1464 : 4 : SendPostmasterSignal(PMSIGNAL_BACKGROUND_WORKER_CHANGE);
1465 : 7 : }
|