1 | /* |
2 | * parallel.c |
3 | * |
4 | * multi-process support |
5 | * |
6 | * Copyright (c) 2010-2019, PostgreSQL Global Development Group |
7 | * src/bin/pg_upgrade/parallel.c |
8 | */ |
9 | |
10 | #include "postgres_fe.h" |
11 | |
12 | #include <sys/wait.h> |
13 | #ifdef WIN32 |
14 | #include <io.h> |
15 | #endif |
16 | |
17 | #include "pg_upgrade.h" |
18 | |
19 | |
20 | static int parallel_jobs; |
21 | |
22 | #ifdef WIN32 |
23 | /* |
24 | * Array holding all active threads. There can't be any gaps/zeros so |
25 | * it can be passed to WaitForMultipleObjects(). We use two arrays |
26 | * so the thread_handles array can be passed to WaitForMultipleObjects(). |
27 | */ |
28 | HANDLE *thread_handles; |
29 | |
30 | typedef struct |
31 | { |
32 | char *log_file; |
33 | char *opt_log_file; |
34 | char *cmd; |
35 | } exec_thread_arg; |
36 | |
37 | typedef struct |
38 | { |
39 | DbInfoArr *old_db_arr; |
40 | DbInfoArr *new_db_arr; |
41 | char *old_pgdata; |
42 | char *new_pgdata; |
43 | char *old_tablespace; |
44 | } transfer_thread_arg; |
45 | |
46 | exec_thread_arg **exec_thread_args; |
47 | transfer_thread_arg **transfer_thread_args; |
48 | |
49 | /* track current thread_args struct so reap_child() can be used for all cases */ |
50 | void **cur_thread_args; |
51 | |
52 | DWORD win32_exec_prog(exec_thread_arg *args); |
53 | DWORD win32_transfer_all_new_dbs(transfer_thread_arg *args); |
54 | #endif |
55 | |
56 | /* |
57 | * parallel_exec_prog |
58 | * |
59 | * This has the same API as exec_prog, except it does parallel execution, |
60 | * and therefore must throw errors and doesn't return an error status. |
61 | */ |
62 | void |
63 | parallel_exec_prog(const char *log_file, const char *opt_log_file, |
64 | const char *fmt,...) |
65 | { |
66 | va_list args; |
67 | char cmd[MAX_STRING]; |
68 | |
69 | #ifndef WIN32 |
70 | pid_t child; |
71 | #else |
72 | HANDLE child; |
73 | exec_thread_arg *new_arg; |
74 | #endif |
75 | |
76 | va_start(args, fmt); |
77 | vsnprintf(cmd, sizeof(cmd), fmt, args); |
78 | va_end(args); |
79 | |
80 | if (user_opts.jobs <= 1) |
81 | /* exit_on_error must be true to allow jobs */ |
82 | exec_prog(log_file, opt_log_file, true, true, "%s" , cmd); |
83 | else |
84 | { |
85 | /* parallel */ |
86 | #ifdef WIN32 |
87 | if (thread_handles == NULL) |
88 | thread_handles = pg_malloc(user_opts.jobs * sizeof(HANDLE)); |
89 | |
90 | if (exec_thread_args == NULL) |
91 | { |
92 | int i; |
93 | |
94 | exec_thread_args = pg_malloc(user_opts.jobs * sizeof(exec_thread_arg *)); |
95 | |
96 | /* |
97 | * For safety and performance, we keep the args allocated during |
98 | * the entire life of the process, and we don't free the args in a |
99 | * thread different from the one that allocated it. |
100 | */ |
101 | for (i = 0; i < user_opts.jobs; i++) |
102 | exec_thread_args[i] = pg_malloc0(sizeof(exec_thread_arg)); |
103 | } |
104 | |
105 | cur_thread_args = (void **) exec_thread_args; |
106 | #endif |
107 | /* harvest any dead children */ |
108 | while (reap_child(false) == true) |
109 | ; |
110 | |
111 | /* must we wait for a dead child? */ |
112 | if (parallel_jobs >= user_opts.jobs) |
113 | reap_child(true); |
114 | |
115 | /* set this before we start the job */ |
116 | parallel_jobs++; |
117 | |
118 | /* Ensure stdio state is quiesced before forking */ |
119 | fflush(NULL); |
120 | |
121 | #ifndef WIN32 |
122 | child = fork(); |
123 | if (child == 0) |
124 | /* use _exit to skip atexit() functions */ |
125 | _exit(!exec_prog(log_file, opt_log_file, true, true, "%s" , cmd)); |
126 | else if (child < 0) |
127 | /* fork failed */ |
128 | pg_fatal("could not create worker process: %s\n" , strerror(errno)); |
129 | #else |
130 | /* empty array element are always at the end */ |
131 | new_arg = exec_thread_args[parallel_jobs - 1]; |
132 | |
133 | /* Can only pass one pointer into the function, so use a struct */ |
134 | if (new_arg->log_file) |
135 | pg_free(new_arg->log_file); |
136 | new_arg->log_file = pg_strdup(log_file); |
137 | if (new_arg->opt_log_file) |
138 | pg_free(new_arg->opt_log_file); |
139 | new_arg->opt_log_file = opt_log_file ? pg_strdup(opt_log_file) : NULL; |
140 | if (new_arg->cmd) |
141 | pg_free(new_arg->cmd); |
142 | new_arg->cmd = pg_strdup(cmd); |
143 | |
144 | child = (HANDLE) _beginthreadex(NULL, 0, (void *) win32_exec_prog, |
145 | new_arg, 0, NULL); |
146 | if (child == 0) |
147 | pg_fatal("could not create worker thread: %s\n" , strerror(errno)); |
148 | |
149 | thread_handles[parallel_jobs - 1] = child; |
150 | #endif |
151 | } |
152 | |
153 | return; |
154 | } |
155 | |
156 | |
157 | #ifdef WIN32 |
158 | DWORD |
159 | win32_exec_prog(exec_thread_arg *args) |
160 | { |
161 | int ret; |
162 | |
163 | ret = !exec_prog(args->log_file, args->opt_log_file, true, true, "%s" , args->cmd); |
164 | |
165 | /* terminates thread */ |
166 | return ret; |
167 | } |
168 | #endif |
169 | |
170 | |
171 | /* |
172 | * parallel_transfer_all_new_dbs |
173 | * |
174 | * This has the same API as transfer_all_new_dbs, except it does parallel execution |
175 | * by transferring multiple tablespaces in parallel |
176 | */ |
177 | void |
178 | parallel_transfer_all_new_dbs(DbInfoArr *old_db_arr, DbInfoArr *new_db_arr, |
179 | char *old_pgdata, char *new_pgdata, |
180 | char *old_tablespace) |
181 | { |
182 | #ifndef WIN32 |
183 | pid_t child; |
184 | #else |
185 | HANDLE child; |
186 | transfer_thread_arg *new_arg; |
187 | #endif |
188 | |
189 | if (user_opts.jobs <= 1) |
190 | transfer_all_new_dbs(old_db_arr, new_db_arr, old_pgdata, new_pgdata, NULL); |
191 | else |
192 | { |
193 | /* parallel */ |
194 | #ifdef WIN32 |
195 | if (thread_handles == NULL) |
196 | thread_handles = pg_malloc(user_opts.jobs * sizeof(HANDLE)); |
197 | |
198 | if (transfer_thread_args == NULL) |
199 | { |
200 | int i; |
201 | |
202 | transfer_thread_args = pg_malloc(user_opts.jobs * sizeof(transfer_thread_arg *)); |
203 | |
204 | /* |
205 | * For safety and performance, we keep the args allocated during |
206 | * the entire life of the process, and we don't free the args in a |
207 | * thread different from the one that allocated it. |
208 | */ |
209 | for (i = 0; i < user_opts.jobs; i++) |
210 | transfer_thread_args[i] = pg_malloc0(sizeof(transfer_thread_arg)); |
211 | } |
212 | |
213 | cur_thread_args = (void **) transfer_thread_args; |
214 | #endif |
215 | /* harvest any dead children */ |
216 | while (reap_child(false) == true) |
217 | ; |
218 | |
219 | /* must we wait for a dead child? */ |
220 | if (parallel_jobs >= user_opts.jobs) |
221 | reap_child(true); |
222 | |
223 | /* set this before we start the job */ |
224 | parallel_jobs++; |
225 | |
226 | /* Ensure stdio state is quiesced before forking */ |
227 | fflush(NULL); |
228 | |
229 | #ifndef WIN32 |
230 | child = fork(); |
231 | if (child == 0) |
232 | { |
233 | transfer_all_new_dbs(old_db_arr, new_db_arr, old_pgdata, new_pgdata, |
234 | old_tablespace); |
235 | /* if we take another exit path, it will be non-zero */ |
236 | /* use _exit to skip atexit() functions */ |
237 | _exit(0); |
238 | } |
239 | else if (child < 0) |
240 | /* fork failed */ |
241 | pg_fatal("could not create worker process: %s\n" , strerror(errno)); |
242 | #else |
243 | /* empty array element are always at the end */ |
244 | new_arg = transfer_thread_args[parallel_jobs - 1]; |
245 | |
246 | /* Can only pass one pointer into the function, so use a struct */ |
247 | new_arg->old_db_arr = old_db_arr; |
248 | new_arg->new_db_arr = new_db_arr; |
249 | if (new_arg->old_pgdata) |
250 | pg_free(new_arg->old_pgdata); |
251 | new_arg->old_pgdata = pg_strdup(old_pgdata); |
252 | if (new_arg->new_pgdata) |
253 | pg_free(new_arg->new_pgdata); |
254 | new_arg->new_pgdata = pg_strdup(new_pgdata); |
255 | if (new_arg->old_tablespace) |
256 | pg_free(new_arg->old_tablespace); |
257 | new_arg->old_tablespace = old_tablespace ? pg_strdup(old_tablespace) : NULL; |
258 | |
259 | child = (HANDLE) _beginthreadex(NULL, 0, (void *) win32_transfer_all_new_dbs, |
260 | new_arg, 0, NULL); |
261 | if (child == 0) |
262 | pg_fatal("could not create worker thread: %s\n" , strerror(errno)); |
263 | |
264 | thread_handles[parallel_jobs - 1] = child; |
265 | #endif |
266 | } |
267 | |
268 | return; |
269 | } |
270 | |
271 | |
272 | #ifdef WIN32 |
273 | DWORD |
274 | win32_transfer_all_new_dbs(transfer_thread_arg *args) |
275 | { |
276 | transfer_all_new_dbs(args->old_db_arr, args->new_db_arr, args->old_pgdata, |
277 | args->new_pgdata, args->old_tablespace); |
278 | |
279 | /* terminates thread */ |
280 | return 0; |
281 | } |
282 | #endif |
283 | |
284 | |
285 | /* |
286 | * collect status from a completed worker child |
287 | */ |
288 | bool |
289 | reap_child(bool wait_for_child) |
290 | { |
291 | #ifndef WIN32 |
292 | int work_status; |
293 | pid_t child; |
294 | #else |
295 | int thread_num; |
296 | DWORD res; |
297 | #endif |
298 | |
299 | if (user_opts.jobs <= 1 || parallel_jobs == 0) |
300 | return false; |
301 | |
302 | #ifndef WIN32 |
303 | child = waitpid(-1, &work_status, wait_for_child ? 0 : WNOHANG); |
304 | if (child == (pid_t) -1) |
305 | pg_fatal("waitpid() failed: %s\n" , strerror(errno)); |
306 | if (child == 0) |
307 | return false; /* no children, or no dead children */ |
308 | if (work_status != 0) |
309 | pg_fatal("child process exited abnormally: status %d\n" , work_status); |
310 | #else |
311 | /* wait for one to finish */ |
312 | thread_num = WaitForMultipleObjects(parallel_jobs, thread_handles, |
313 | false, wait_for_child ? INFINITE : 0); |
314 | |
315 | if (thread_num == WAIT_TIMEOUT || thread_num == WAIT_FAILED) |
316 | return false; |
317 | |
318 | /* compute thread index in active_threads */ |
319 | thread_num -= WAIT_OBJECT_0; |
320 | |
321 | /* get the result */ |
322 | GetExitCodeThread(thread_handles[thread_num], &res); |
323 | if (res != 0) |
324 | pg_fatal("child worker exited abnormally: %s\n" , strerror(errno)); |
325 | |
326 | /* dispose of handle to stop leaks */ |
327 | CloseHandle(thread_handles[thread_num]); |
328 | |
329 | /* Move last slot into dead child's position */ |
330 | if (thread_num != parallel_jobs - 1) |
331 | { |
332 | void *tmp_args; |
333 | |
334 | thread_handles[thread_num] = thread_handles[parallel_jobs - 1]; |
335 | |
336 | /* |
337 | * Move last active thead arg struct into the now-dead slot, and the |
338 | * now-dead slot to the end for reuse by the next thread. Though the |
339 | * thread struct is in use by another thread, we can safely swap the |
340 | * struct pointers within the array. |
341 | */ |
342 | tmp_args = cur_thread_args[thread_num]; |
343 | cur_thread_args[thread_num] = cur_thread_args[parallel_jobs - 1]; |
344 | cur_thread_args[parallel_jobs - 1] = tmp_args; |
345 | } |
346 | #endif |
347 | |
348 | /* do this after job has been removed */ |
349 | parallel_jobs--; |
350 | |
351 | return true; |
352 | } |
353 | |