1/*-------------------------------------------------------------------------
2 *
3 * walwriter.c
4 *
5 * The WAL writer background process is new as of Postgres 8.3. It attempts
6 * to keep regular backends from having to write out (and fsync) WAL pages.
7 * Also, it guarantees that transaction commit records that weren't synced
8 * to disk immediately upon commit (ie, were "asynchronously committed")
9 * will reach disk within a knowable time --- which, as it happens, is at
10 * most three times the wal_writer_delay cycle time.
11 *
12 * Note that as with the bgwriter for shared buffers, regular backends are
13 * still empowered to issue WAL writes and fsyncs when the walwriter doesn't
14 * keep up. This means that the WALWriter is not an essential process and
15 * can shutdown quickly when requested.
16 *
17 * Because the walwriter's cycle is directly linked to the maximum delay
18 * before async-commit transactions are guaranteed committed, it's probably
19 * unwise to load additional functionality onto it. For instance, if you've
20 * got a yen to create xlog segments further in advance, that'd be better done
21 * in bgwriter than in walwriter.
22 *
23 * The walwriter is started by the postmaster as soon as the startup subprocess
24 * finishes. It remains alive until the postmaster commands it to terminate.
25 * Normal termination is by SIGTERM, which instructs the walwriter to exit(0).
26 * Emergency termination is by SIGQUIT; like any backend, the walwriter will
27 * simply abort and exit on SIGQUIT.
28 *
29 * If the walwriter exits unexpectedly, the postmaster treats that the same
30 * as a backend crash: shared memory may be corrupted, so remaining backends
31 * should be killed by SIGQUIT and then a recovery cycle started.
32 *
33 *
34 * Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group
35 *
36 *
37 * IDENTIFICATION
38 * src/backend/postmaster/walwriter.c
39 *
40 *-------------------------------------------------------------------------
41 */
42#include "postgres.h"
43
44#include <signal.h>
45#include <unistd.h>
46
47#include "access/xlog.h"
48#include "libpq/pqsignal.h"
49#include "miscadmin.h"
50#include "pgstat.h"
51#include "postmaster/walwriter.h"
52#include "storage/bufmgr.h"
53#include "storage/condition_variable.h"
54#include "storage/fd.h"
55#include "storage/ipc.h"
56#include "storage/lwlock.h"
57#include "storage/proc.h"
58#include "storage/smgr.h"
59#include "utils/guc.h"
60#include "utils/hsearch.h"
61#include "utils/memutils.h"
62#include "utils/resowner.h"
63
64
65/*
66 * GUC parameters
67 */
68int WalWriterDelay = 200;
69int WalWriterFlushAfter = 128;
70
71/*
72 * Number of do-nothing loops before lengthening the delay time, and the
73 * multiplier to apply to WalWriterDelay when we do decide to hibernate.
74 * (Perhaps these need to be configurable?)
75 */
76#define LOOPS_UNTIL_HIBERNATE 50
77#define HIBERNATE_FACTOR 25
78
79/*
80 * Flags set by interrupt handlers for later service in the main loop.
81 */
82static volatile sig_atomic_t got_SIGHUP = false;
83static volatile sig_atomic_t shutdown_requested = false;
84
85/* Signal handlers */
86static void wal_quickdie(SIGNAL_ARGS);
87static void WalSigHupHandler(SIGNAL_ARGS);
88static void WalShutdownHandler(SIGNAL_ARGS);
89static void walwriter_sigusr1_handler(SIGNAL_ARGS);
90
91/*
92 * Main entry point for walwriter process
93 *
94 * This is invoked from AuxiliaryProcessMain, which has already created the
95 * basic execution environment, but not enabled signals yet.
96 */
97void
98WalWriterMain(void)
99{
100 sigjmp_buf local_sigjmp_buf;
101 MemoryContext walwriter_context;
102 int left_till_hibernate;
103 bool hibernating;
104
105 /*
106 * Properly accept or ignore signals the postmaster might send us
107 *
108 * We have no particular use for SIGINT at the moment, but seems
109 * reasonable to treat like SIGTERM.
110 */
111 pqsignal(SIGHUP, WalSigHupHandler); /* set flag to read config file */
112 pqsignal(SIGINT, WalShutdownHandler); /* request shutdown */
113 pqsignal(SIGTERM, WalShutdownHandler); /* request shutdown */
114 pqsignal(SIGQUIT, wal_quickdie); /* hard crash time */
115 pqsignal(SIGALRM, SIG_IGN);
116 pqsignal(SIGPIPE, SIG_IGN);
117 pqsignal(SIGUSR1, walwriter_sigusr1_handler);
118 pqsignal(SIGUSR2, SIG_IGN); /* not used */
119
120 /*
121 * Reset some signals that are accepted by postmaster but not here
122 */
123 pqsignal(SIGCHLD, SIG_DFL);
124
125 /* We allow SIGQUIT (quickdie) at all times */
126 sigdelset(&BlockSig, SIGQUIT);
127
128 /*
129 * Create a memory context that we will do all our work in. We do this so
130 * that we can reset the context during error recovery and thereby avoid
131 * possible memory leaks. Formerly this code just ran in
132 * TopMemoryContext, but resetting that would be a really bad idea.
133 */
134 walwriter_context = AllocSetContextCreate(TopMemoryContext,
135 "Wal Writer",
136 ALLOCSET_DEFAULT_SIZES);
137 MemoryContextSwitchTo(walwriter_context);
138
139 /*
140 * If an exception is encountered, processing resumes here.
141 *
142 * This code is heavily based on bgwriter.c, q.v.
143 */
144 if (sigsetjmp(local_sigjmp_buf, 1) != 0)
145 {
146 /* Since not using PG_TRY, must reset error stack by hand */
147 error_context_stack = NULL;
148
149 /* Prevent interrupts while cleaning up */
150 HOLD_INTERRUPTS();
151
152 /* Report the error to the server log */
153 EmitErrorReport();
154
155 /*
156 * These operations are really just a minimal subset of
157 * AbortTransaction(). We don't have very many resources to worry
158 * about in walwriter, but we do have LWLocks, and perhaps buffers?
159 */
160 LWLockReleaseAll();
161 ConditionVariableCancelSleep();
162 pgstat_report_wait_end();
163 AbortBufferIO();
164 UnlockBuffers();
165 ReleaseAuxProcessResources(false);
166 AtEOXact_Buffers(false);
167 AtEOXact_SMgr();
168 AtEOXact_Files(false);
169 AtEOXact_HashTables(false);
170
171 /*
172 * Now return to normal top-level context and clear ErrorContext for
173 * next time.
174 */
175 MemoryContextSwitchTo(walwriter_context);
176 FlushErrorState();
177
178 /* Flush any leaked data in the top-level context */
179 MemoryContextResetAndDeleteChildren(walwriter_context);
180
181 /* Now we can allow interrupts again */
182 RESUME_INTERRUPTS();
183
184 /*
185 * Sleep at least 1 second after any error. A write error is likely
186 * to be repeated, and we don't want to be filling the error logs as
187 * fast as we can.
188 */
189 pg_usleep(1000000L);
190
191 /*
192 * Close all open files after any error. This is helpful on Windows,
193 * where holding deleted files open causes various strange errors.
194 * It's not clear we need it elsewhere, but shouldn't hurt.
195 */
196 smgrcloseall();
197 }
198
199 /* We can now handle ereport(ERROR) */
200 PG_exception_stack = &local_sigjmp_buf;
201
202 /*
203 * Unblock signals (they were blocked when the postmaster forked us)
204 */
205 PG_SETMASK(&UnBlockSig);
206
207 /*
208 * Reset hibernation state after any error.
209 */
210 left_till_hibernate = LOOPS_UNTIL_HIBERNATE;
211 hibernating = false;
212 SetWalWriterSleeping(false);
213
214 /*
215 * Advertise our latch that backends can use to wake us up while we're
216 * sleeping.
217 */
218 ProcGlobal->walwriterLatch = &MyProc->procLatch;
219
220 /*
221 * Loop forever
222 */
223 for (;;)
224 {
225 long cur_timeout;
226
227 /*
228 * Advertise whether we might hibernate in this cycle. We do this
229 * before resetting the latch to ensure that any async commits will
230 * see the flag set if they might possibly need to wake us up, and
231 * that we won't miss any signal they send us. (If we discover work
232 * to do in the last cycle before we would hibernate, the global flag
233 * will be set unnecessarily, but little harm is done.) But avoid
234 * touching the global flag if it doesn't need to change.
235 */
236 if (hibernating != (left_till_hibernate <= 1))
237 {
238 hibernating = (left_till_hibernate <= 1);
239 SetWalWriterSleeping(hibernating);
240 }
241
242 /* Clear any already-pending wakeups */
243 ResetLatch(MyLatch);
244
245 /*
246 * Process any requests or signals received recently.
247 */
248 if (got_SIGHUP)
249 {
250 got_SIGHUP = false;
251 ProcessConfigFile(PGC_SIGHUP);
252 }
253 if (shutdown_requested)
254 {
255 /* Normal exit from the walwriter is here */
256 proc_exit(0); /* done */
257 }
258
259 /*
260 * Do what we're here for; then, if XLogBackgroundFlush() found useful
261 * work to do, reset hibernation counter.
262 */
263 if (XLogBackgroundFlush())
264 left_till_hibernate = LOOPS_UNTIL_HIBERNATE;
265 else if (left_till_hibernate > 0)
266 left_till_hibernate--;
267
268 /*
269 * Sleep until we are signaled or WalWriterDelay has elapsed. If we
270 * haven't done anything useful for quite some time, lengthen the
271 * sleep time so as to reduce the server's idle power consumption.
272 */
273 if (left_till_hibernate > 0)
274 cur_timeout = WalWriterDelay; /* in ms */
275 else
276 cur_timeout = WalWriterDelay * HIBERNATE_FACTOR;
277
278 (void) WaitLatch(MyLatch,
279 WL_LATCH_SET | WL_TIMEOUT | WL_EXIT_ON_PM_DEATH,
280 cur_timeout,
281 WAIT_EVENT_WAL_WRITER_MAIN);
282 }
283}
284
285
286/* --------------------------------
287 * signal handler routines
288 * --------------------------------
289 */
290
291/*
292 * wal_quickdie() occurs when signalled SIGQUIT by the postmaster.
293 *
294 * Some backend has bought the farm,
295 * so we need to stop what we're doing and exit.
296 */
297static void
298wal_quickdie(SIGNAL_ARGS)
299{
300 /*
301 * We DO NOT want to run proc_exit() or atexit() callbacks -- we're here
302 * because shared memory may be corrupted, so we don't want to try to
303 * clean up our transaction. Just nail the windows shut and get out of
304 * town. The callbacks wouldn't be safe to run from a signal handler,
305 * anyway.
306 *
307 * Note we do _exit(2) not _exit(0). This is to force the postmaster into
308 * a system reset cycle if someone sends a manual SIGQUIT to a random
309 * backend. This is necessary precisely because we don't clean up our
310 * shared memory state. (The "dead man switch" mechanism in pmsignal.c
311 * should ensure the postmaster sees this as a crash, too, but no harm in
312 * being doubly sure.)
313 */
314 _exit(2);
315}
316
317/* SIGHUP: set flag to re-read config file at next convenient time */
318static void
319WalSigHupHandler(SIGNAL_ARGS)
320{
321 int save_errno = errno;
322
323 got_SIGHUP = true;
324 SetLatch(MyLatch);
325
326 errno = save_errno;
327}
328
329/* SIGTERM: set flag to exit normally */
330static void
331WalShutdownHandler(SIGNAL_ARGS)
332{
333 int save_errno = errno;
334
335 shutdown_requested = true;
336 SetLatch(MyLatch);
337
338 errno = save_errno;
339}
340
341/* SIGUSR1: used for latch wakeups */
342static void
343walwriter_sigusr1_handler(SIGNAL_ARGS)
344{
345 int save_errno = errno;
346
347 latch_sigusr1_handler();
348
349 errno = save_errno;
350}
351