| 1 | /*------------------------------------------------------------------------- |
| 2 | * |
| 3 | * ipc.c |
| 4 | * POSTGRES inter-process communication definitions. |
| 5 | * |
| 6 | * This file is misnamed, as it no longer has much of anything directly |
| 7 | * to do with IPC. The functionality here is concerned with managing |
| 8 | * exit-time cleanup for either a postmaster or a backend. |
| 9 | * |
| 10 | * |
| 11 | * Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group |
| 12 | * Portions Copyright (c) 1994, Regents of the University of California |
| 13 | * |
| 14 | * |
| 15 | * IDENTIFICATION |
| 16 | * src/backend/storage/ipc/ipc.c |
| 17 | * |
| 18 | *------------------------------------------------------------------------- |
| 19 | */ |
| 20 | #include "postgres.h" |
| 21 | |
| 22 | #include <signal.h> |
| 23 | #include <unistd.h> |
| 24 | #include <sys/stat.h> |
| 25 | |
| 26 | #include "miscadmin.h" |
| 27 | #ifdef PROFILE_PID_DIR |
| 28 | #include "postmaster/autovacuum.h" |
| 29 | #endif |
| 30 | #include "storage/dsm.h" |
| 31 | #include "storage/ipc.h" |
| 32 | #include "tcop/tcopprot.h" |
| 33 | |
| 34 | |
| 35 | /* |
| 36 | * This flag is set during proc_exit() to change ereport()'s behavior, |
| 37 | * so that an ereport() from an on_proc_exit routine cannot get us out |
| 38 | * of the exit procedure. We do NOT want to go back to the idle loop... |
| 39 | */ |
| 40 | bool proc_exit_inprogress = false; |
| 41 | |
| 42 | /* |
| 43 | * Set when shmem_exit() is in progress. |
| 44 | */ |
| 45 | bool shmem_exit_inprogress = false; |
| 46 | |
| 47 | /* |
| 48 | * This flag tracks whether we've called atexit() in the current process |
| 49 | * (or in the parent postmaster). |
| 50 | */ |
| 51 | static bool atexit_callback_setup = false; |
| 52 | |
| 53 | /* local functions */ |
| 54 | static void proc_exit_prepare(int code); |
| 55 | |
| 56 | |
| 57 | /* ---------------------------------------------------------------- |
| 58 | * exit() handling stuff |
| 59 | * |
| 60 | * These functions are in generally the same spirit as atexit(), |
| 61 | * but provide some additional features we need --- in particular, |
| 62 | * we want to register callbacks to invoke when we are disconnecting |
| 63 | * from a broken shared-memory context but not exiting the postmaster. |
| 64 | * |
| 65 | * Callback functions can take zero, one, or two args: the first passed |
| 66 | * arg is the integer exitcode, the second is the Datum supplied when |
| 67 | * the callback was registered. |
| 68 | * ---------------------------------------------------------------- |
| 69 | */ |
| 70 | |
| 71 | #define MAX_ON_EXITS 20 |
| 72 | |
| 73 | struct ONEXIT |
| 74 | { |
| 75 | pg_on_exit_callback function; |
| 76 | Datum arg; |
| 77 | }; |
| 78 | |
| 79 | static struct ONEXIT on_proc_exit_list[MAX_ON_EXITS]; |
| 80 | static struct ONEXIT on_shmem_exit_list[MAX_ON_EXITS]; |
| 81 | static struct ONEXIT before_shmem_exit_list[MAX_ON_EXITS]; |
| 82 | |
| 83 | static int on_proc_exit_index, |
| 84 | on_shmem_exit_index, |
| 85 | before_shmem_exit_index; |
| 86 | |
| 87 | |
| 88 | /* ---------------------------------------------------------------- |
| 89 | * proc_exit |
| 90 | * |
| 91 | * this function calls all the callbacks registered |
| 92 | * for it (to free resources) and then calls exit. |
| 93 | * |
| 94 | * This should be the only function to call exit(). |
| 95 | * -cim 2/6/90 |
| 96 | * |
| 97 | * Unfortunately, we can't really guarantee that add-on code |
| 98 | * obeys the rule of not calling exit() directly. So, while |
| 99 | * this is the preferred way out of the system, we also register |
| 100 | * an atexit callback that will make sure cleanup happens. |
| 101 | * ---------------------------------------------------------------- |
| 102 | */ |
| 103 | void |
| 104 | proc_exit(int code) |
| 105 | { |
| 106 | /* Clean up everything that must be cleaned up */ |
| 107 | proc_exit_prepare(code); |
| 108 | |
| 109 | #ifdef PROFILE_PID_DIR |
| 110 | { |
| 111 | /* |
| 112 | * If we are profiling ourself then gprof's mcleanup() is about to |
| 113 | * write out a profile to ./gmon.out. Since mcleanup() always uses a |
| 114 | * fixed file name, each backend will overwrite earlier profiles. To |
| 115 | * fix that, we create a separate subdirectory for each backend |
| 116 | * (./gprof/pid) and 'cd' to that subdirectory before we exit() - that |
| 117 | * forces mcleanup() to write each profile into its own directory. We |
| 118 | * end up with something like: $PGDATA/gprof/8829/gmon.out |
| 119 | * $PGDATA/gprof/8845/gmon.out ... |
| 120 | * |
| 121 | * To avoid undesirable disk space bloat, autovacuum workers are |
| 122 | * discriminated against: all their gmon.out files go into the same |
| 123 | * subdirectory. Without this, an installation that is "just sitting |
| 124 | * there" nonetheless eats megabytes of disk space every few seconds. |
| 125 | * |
| 126 | * Note that we do this here instead of in an on_proc_exit() callback |
| 127 | * because we want to ensure that this code executes last - we don't |
| 128 | * want to interfere with any other on_proc_exit() callback. For the |
| 129 | * same reason, we do not include it in proc_exit_prepare ... so if |
| 130 | * you are exiting in the "wrong way" you won't drop your profile in a |
| 131 | * nice place. |
| 132 | */ |
| 133 | char gprofDirName[32]; |
| 134 | |
| 135 | if (IsAutoVacuumWorkerProcess()) |
| 136 | snprintf(gprofDirName, 32, "gprof/avworker" ); |
| 137 | else |
| 138 | snprintf(gprofDirName, 32, "gprof/%d" , (int) getpid()); |
| 139 | |
| 140 | /* |
| 141 | * Use mkdir() instead of MakePGDirectory() since we aren't making a |
| 142 | * PG directory here. |
| 143 | */ |
| 144 | mkdir("gprof" , S_IRWXU | S_IRWXG | S_IRWXO); |
| 145 | mkdir(gprofDirName, S_IRWXU | S_IRWXG | S_IRWXO); |
| 146 | chdir(gprofDirName); |
| 147 | } |
| 148 | #endif |
| 149 | |
| 150 | elog(DEBUG3, "exit(%d)" , code); |
| 151 | |
| 152 | exit(code); |
| 153 | } |
| 154 | |
| 155 | /* |
| 156 | * Code shared between proc_exit and the atexit handler. Note that in |
| 157 | * normal exit through proc_exit, this will actually be called twice ... |
| 158 | * but the second call will have nothing to do. |
| 159 | */ |
| 160 | static void |
| 161 | proc_exit_prepare(int code) |
| 162 | { |
| 163 | /* |
| 164 | * Once we set this flag, we are committed to exit. Any ereport() will |
| 165 | * NOT send control back to the main loop, but right back here. |
| 166 | */ |
| 167 | proc_exit_inprogress = true; |
| 168 | |
| 169 | /* |
| 170 | * Forget any pending cancel or die requests; we're doing our best to |
| 171 | * close up shop already. Note that the signal handlers will not set |
| 172 | * these flags again, now that proc_exit_inprogress is set. |
| 173 | */ |
| 174 | InterruptPending = false; |
| 175 | ProcDiePending = false; |
| 176 | QueryCancelPending = false; |
| 177 | InterruptHoldoffCount = 1; |
| 178 | CritSectionCount = 0; |
| 179 | |
| 180 | /* |
| 181 | * Also clear the error context stack, to prevent error callbacks from |
| 182 | * being invoked by any elog/ereport calls made during proc_exit. Whatever |
| 183 | * context they might want to offer is probably not relevant, and in any |
| 184 | * case they are likely to fail outright after we've done things like |
| 185 | * aborting any open transaction. (In normal exit scenarios the context |
| 186 | * stack should be empty anyway, but it might not be in the case of |
| 187 | * elog(FATAL) for example.) |
| 188 | */ |
| 189 | error_context_stack = NULL; |
| 190 | /* For the same reason, reset debug_query_string before it's clobbered */ |
| 191 | debug_query_string = NULL; |
| 192 | |
| 193 | /* do our shared memory exits first */ |
| 194 | shmem_exit(code); |
| 195 | |
| 196 | elog(DEBUG3, "proc_exit(%d): %d callbacks to make" , |
| 197 | code, on_proc_exit_index); |
| 198 | |
| 199 | /* |
| 200 | * call all the registered callbacks. |
| 201 | * |
| 202 | * Note that since we decrement on_proc_exit_index each time, if a |
| 203 | * callback calls ereport(ERROR) or ereport(FATAL) then it won't be |
| 204 | * invoked again when control comes back here (nor will the |
| 205 | * previously-completed callbacks). So, an infinite loop should not be |
| 206 | * possible. |
| 207 | */ |
| 208 | while (--on_proc_exit_index >= 0) |
| 209 | on_proc_exit_list[on_proc_exit_index].function(code, |
| 210 | on_proc_exit_list[on_proc_exit_index].arg); |
| 211 | |
| 212 | on_proc_exit_index = 0; |
| 213 | } |
| 214 | |
| 215 | /* ------------------ |
| 216 | * Run all of the on_shmem_exit routines --- but don't actually exit. |
| 217 | * This is used by the postmaster to re-initialize shared memory and |
| 218 | * semaphores after a backend dies horribly. As with proc_exit(), we |
| 219 | * remove each callback from the list before calling it, to avoid |
| 220 | * infinite loop in case of error. |
| 221 | * ------------------ |
| 222 | */ |
| 223 | void |
| 224 | shmem_exit(int code) |
| 225 | { |
| 226 | shmem_exit_inprogress = true; |
| 227 | |
| 228 | /* |
| 229 | * Call before_shmem_exit callbacks. |
| 230 | * |
| 231 | * These should be things that need most of the system to still be up and |
| 232 | * working, such as cleanup of temp relations, which requires catalog |
| 233 | * access; or things that need to be completed because later cleanup steps |
| 234 | * depend on them, such as releasing lwlocks. |
| 235 | */ |
| 236 | elog(DEBUG3, "shmem_exit(%d): %d before_shmem_exit callbacks to make" , |
| 237 | code, before_shmem_exit_index); |
| 238 | while (--before_shmem_exit_index >= 0) |
| 239 | before_shmem_exit_list[before_shmem_exit_index].function(code, |
| 240 | before_shmem_exit_list[before_shmem_exit_index].arg); |
| 241 | before_shmem_exit_index = 0; |
| 242 | |
| 243 | /* |
| 244 | * Call dynamic shared memory callbacks. |
| 245 | * |
| 246 | * These serve the same purpose as late callbacks, but for dynamic shared |
| 247 | * memory segments rather than the main shared memory segment. |
| 248 | * dsm_backend_shutdown() has the same kind of progressive logic we use |
| 249 | * for the main shared memory segment; namely, it unregisters each |
| 250 | * callback before invoking it, so that we don't get stuck in an infinite |
| 251 | * loop if one of those callbacks itself throws an ERROR or FATAL. |
| 252 | * |
| 253 | * Note that explicitly calling this function here is quite different from |
| 254 | * registering it as an on_shmem_exit callback for precisely this reason: |
| 255 | * if one dynamic shared memory callback errors out, the remaining |
| 256 | * callbacks will still be invoked. Thus, hard-coding this call puts it |
| 257 | * equal footing with callbacks for the main shared memory segment. |
| 258 | */ |
| 259 | dsm_backend_shutdown(); |
| 260 | |
| 261 | /* |
| 262 | * Call on_shmem_exit callbacks. |
| 263 | * |
| 264 | * These are generally releasing low-level shared memory resources. In |
| 265 | * some cases, this is a backstop against the possibility that the early |
| 266 | * callbacks might themselves fail, leading to re-entry to this routine; |
| 267 | * in other cases, it's cleanup that only happens at process exit. |
| 268 | */ |
| 269 | elog(DEBUG3, "shmem_exit(%d): %d on_shmem_exit callbacks to make" , |
| 270 | code, on_shmem_exit_index); |
| 271 | while (--on_shmem_exit_index >= 0) |
| 272 | on_shmem_exit_list[on_shmem_exit_index].function(code, |
| 273 | on_shmem_exit_list[on_shmem_exit_index].arg); |
| 274 | on_shmem_exit_index = 0; |
| 275 | |
| 276 | shmem_exit_inprogress = false; |
| 277 | } |
| 278 | |
| 279 | /* ---------------------------------------------------------------- |
| 280 | * atexit_callback |
| 281 | * |
| 282 | * Backstop to ensure that direct calls of exit() don't mess us up. |
| 283 | * |
| 284 | * Somebody who was being really uncooperative could call _exit(), |
| 285 | * but for that case we have a "dead man switch" that will make the |
| 286 | * postmaster treat it as a crash --- see pmsignal.c. |
| 287 | * ---------------------------------------------------------------- |
| 288 | */ |
| 289 | static void |
| 290 | atexit_callback(void) |
| 291 | { |
| 292 | /* Clean up everything that must be cleaned up */ |
| 293 | /* ... too bad we don't know the real exit code ... */ |
| 294 | proc_exit_prepare(-1); |
| 295 | } |
| 296 | |
| 297 | /* ---------------------------------------------------------------- |
| 298 | * on_proc_exit |
| 299 | * |
| 300 | * this function adds a callback function to the list of |
| 301 | * functions invoked by proc_exit(). -cim 2/6/90 |
| 302 | * ---------------------------------------------------------------- |
| 303 | */ |
| 304 | void |
| 305 | on_proc_exit(pg_on_exit_callback function, Datum arg) |
| 306 | { |
| 307 | if (on_proc_exit_index >= MAX_ON_EXITS) |
| 308 | ereport(FATAL, |
| 309 | (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED), |
| 310 | errmsg_internal("out of on_proc_exit slots" ))); |
| 311 | |
| 312 | on_proc_exit_list[on_proc_exit_index].function = function; |
| 313 | on_proc_exit_list[on_proc_exit_index].arg = arg; |
| 314 | |
| 315 | ++on_proc_exit_index; |
| 316 | |
| 317 | if (!atexit_callback_setup) |
| 318 | { |
| 319 | atexit(atexit_callback); |
| 320 | atexit_callback_setup = true; |
| 321 | } |
| 322 | } |
| 323 | |
| 324 | /* ---------------------------------------------------------------- |
| 325 | * before_shmem_exit |
| 326 | * |
| 327 | * Register early callback to perform user-level cleanup, |
| 328 | * e.g. transaction abort, before we begin shutting down |
| 329 | * low-level subsystems. |
| 330 | * ---------------------------------------------------------------- |
| 331 | */ |
| 332 | void |
| 333 | before_shmem_exit(pg_on_exit_callback function, Datum arg) |
| 334 | { |
| 335 | if (before_shmem_exit_index >= MAX_ON_EXITS) |
| 336 | ereport(FATAL, |
| 337 | (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED), |
| 338 | errmsg_internal("out of before_shmem_exit slots" ))); |
| 339 | |
| 340 | before_shmem_exit_list[before_shmem_exit_index].function = function; |
| 341 | before_shmem_exit_list[before_shmem_exit_index].arg = arg; |
| 342 | |
| 343 | ++before_shmem_exit_index; |
| 344 | |
| 345 | if (!atexit_callback_setup) |
| 346 | { |
| 347 | atexit(atexit_callback); |
| 348 | atexit_callback_setup = true; |
| 349 | } |
| 350 | } |
| 351 | |
| 352 | /* ---------------------------------------------------------------- |
| 353 | * on_shmem_exit |
| 354 | * |
| 355 | * Register ordinary callback to perform low-level shutdown |
| 356 | * (e.g. releasing our PGPROC); run after before_shmem_exit |
| 357 | * callbacks and before on_proc_exit callbacks. |
| 358 | * ---------------------------------------------------------------- |
| 359 | */ |
| 360 | void |
| 361 | on_shmem_exit(pg_on_exit_callback function, Datum arg) |
| 362 | { |
| 363 | if (on_shmem_exit_index >= MAX_ON_EXITS) |
| 364 | ereport(FATAL, |
| 365 | (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED), |
| 366 | errmsg_internal("out of on_shmem_exit slots" ))); |
| 367 | |
| 368 | on_shmem_exit_list[on_shmem_exit_index].function = function; |
| 369 | on_shmem_exit_list[on_shmem_exit_index].arg = arg; |
| 370 | |
| 371 | ++on_shmem_exit_index; |
| 372 | |
| 373 | if (!atexit_callback_setup) |
| 374 | { |
| 375 | atexit(atexit_callback); |
| 376 | atexit_callback_setup = true; |
| 377 | } |
| 378 | } |
| 379 | |
| 380 | /* ---------------------------------------------------------------- |
| 381 | * cancel_before_shmem_exit |
| 382 | * |
| 383 | * this function removes a previously-registered before_shmem_exit |
| 384 | * callback. For simplicity, only the latest entry can be |
| 385 | * removed. (We could work harder but there is no need for |
| 386 | * current uses.) |
| 387 | * ---------------------------------------------------------------- |
| 388 | */ |
| 389 | void |
| 390 | cancel_before_shmem_exit(pg_on_exit_callback function, Datum arg) |
| 391 | { |
| 392 | if (before_shmem_exit_index > 0 && |
| 393 | before_shmem_exit_list[before_shmem_exit_index - 1].function |
| 394 | == function && |
| 395 | before_shmem_exit_list[before_shmem_exit_index - 1].arg == arg) |
| 396 | --before_shmem_exit_index; |
| 397 | } |
| 398 | |
| 399 | /* ---------------------------------------------------------------- |
| 400 | * on_exit_reset |
| 401 | * |
| 402 | * this function clears all on_proc_exit() and on_shmem_exit() |
| 403 | * registered functions. This is used just after forking a backend, |
| 404 | * so that the backend doesn't believe it should call the postmaster's |
| 405 | * on-exit routines when it exits... |
| 406 | * ---------------------------------------------------------------- |
| 407 | */ |
| 408 | void |
| 409 | on_exit_reset(void) |
| 410 | { |
| 411 | before_shmem_exit_index = 0; |
| 412 | on_shmem_exit_index = 0; |
| 413 | on_proc_exit_index = 0; |
| 414 | reset_on_dsm_detach(); |
| 415 | } |
| 416 | |