| 1 | /* |
| 2 | * parallel.c |
| 3 | * |
| 4 | * multi-process support |
| 5 | * |
| 6 | * Copyright (c) 2010-2019, PostgreSQL Global Development Group |
| 7 | * src/bin/pg_upgrade/parallel.c |
| 8 | */ |
| 9 | |
| 10 | #include "postgres_fe.h" |
| 11 | |
| 12 | #include <sys/wait.h> |
| 13 | #ifdef WIN32 |
| 14 | #include <io.h> |
| 15 | #endif |
| 16 | |
| 17 | #include "pg_upgrade.h" |
| 18 | |
| 19 | |
| 20 | static int parallel_jobs; |
| 21 | |
| 22 | #ifdef WIN32 |
| 23 | /* |
| 24 | * Array holding all active threads. There can't be any gaps/zeros so |
| 25 | * it can be passed to WaitForMultipleObjects(). We use two arrays |
| 26 | * so the thread_handles array can be passed to WaitForMultipleObjects(). |
| 27 | */ |
| 28 | HANDLE *thread_handles; |
| 29 | |
| 30 | typedef struct |
| 31 | { |
| 32 | char *log_file; |
| 33 | char *opt_log_file; |
| 34 | char *cmd; |
| 35 | } exec_thread_arg; |
| 36 | |
| 37 | typedef struct |
| 38 | { |
| 39 | DbInfoArr *old_db_arr; |
| 40 | DbInfoArr *new_db_arr; |
| 41 | char *old_pgdata; |
| 42 | char *new_pgdata; |
| 43 | char *old_tablespace; |
| 44 | } transfer_thread_arg; |
| 45 | |
| 46 | exec_thread_arg **exec_thread_args; |
| 47 | transfer_thread_arg **transfer_thread_args; |
| 48 | |
| 49 | /* track current thread_args struct so reap_child() can be used for all cases */ |
| 50 | void **cur_thread_args; |
| 51 | |
| 52 | DWORD win32_exec_prog(exec_thread_arg *args); |
| 53 | DWORD win32_transfer_all_new_dbs(transfer_thread_arg *args); |
| 54 | #endif |
| 55 | |
| 56 | /* |
| 57 | * parallel_exec_prog |
| 58 | * |
| 59 | * This has the same API as exec_prog, except it does parallel execution, |
| 60 | * and therefore must throw errors and doesn't return an error status. |
| 61 | */ |
| 62 | void |
| 63 | parallel_exec_prog(const char *log_file, const char *opt_log_file, |
| 64 | const char *fmt,...) |
| 65 | { |
| 66 | va_list args; |
| 67 | char cmd[MAX_STRING]; |
| 68 | |
| 69 | #ifndef WIN32 |
| 70 | pid_t child; |
| 71 | #else |
| 72 | HANDLE child; |
| 73 | exec_thread_arg *new_arg; |
| 74 | #endif |
| 75 | |
| 76 | va_start(args, fmt); |
| 77 | vsnprintf(cmd, sizeof(cmd), fmt, args); |
| 78 | va_end(args); |
| 79 | |
| 80 | if (user_opts.jobs <= 1) |
| 81 | /* exit_on_error must be true to allow jobs */ |
| 82 | exec_prog(log_file, opt_log_file, true, true, "%s" , cmd); |
| 83 | else |
| 84 | { |
| 85 | /* parallel */ |
| 86 | #ifdef WIN32 |
| 87 | if (thread_handles == NULL) |
| 88 | thread_handles = pg_malloc(user_opts.jobs * sizeof(HANDLE)); |
| 89 | |
| 90 | if (exec_thread_args == NULL) |
| 91 | { |
| 92 | int i; |
| 93 | |
| 94 | exec_thread_args = pg_malloc(user_opts.jobs * sizeof(exec_thread_arg *)); |
| 95 | |
| 96 | /* |
| 97 | * For safety and performance, we keep the args allocated during |
| 98 | * the entire life of the process, and we don't free the args in a |
| 99 | * thread different from the one that allocated it. |
| 100 | */ |
| 101 | for (i = 0; i < user_opts.jobs; i++) |
| 102 | exec_thread_args[i] = pg_malloc0(sizeof(exec_thread_arg)); |
| 103 | } |
| 104 | |
| 105 | cur_thread_args = (void **) exec_thread_args; |
| 106 | #endif |
| 107 | /* harvest any dead children */ |
| 108 | while (reap_child(false) == true) |
| 109 | ; |
| 110 | |
| 111 | /* must we wait for a dead child? */ |
| 112 | if (parallel_jobs >= user_opts.jobs) |
| 113 | reap_child(true); |
| 114 | |
| 115 | /* set this before we start the job */ |
| 116 | parallel_jobs++; |
| 117 | |
| 118 | /* Ensure stdio state is quiesced before forking */ |
| 119 | fflush(NULL); |
| 120 | |
| 121 | #ifndef WIN32 |
| 122 | child = fork(); |
| 123 | if (child == 0) |
| 124 | /* use _exit to skip atexit() functions */ |
| 125 | _exit(!exec_prog(log_file, opt_log_file, true, true, "%s" , cmd)); |
| 126 | else if (child < 0) |
| 127 | /* fork failed */ |
| 128 | pg_fatal("could not create worker process: %s\n" , strerror(errno)); |
| 129 | #else |
| 130 | /* empty array element are always at the end */ |
| 131 | new_arg = exec_thread_args[parallel_jobs - 1]; |
| 132 | |
| 133 | /* Can only pass one pointer into the function, so use a struct */ |
| 134 | if (new_arg->log_file) |
| 135 | pg_free(new_arg->log_file); |
| 136 | new_arg->log_file = pg_strdup(log_file); |
| 137 | if (new_arg->opt_log_file) |
| 138 | pg_free(new_arg->opt_log_file); |
| 139 | new_arg->opt_log_file = opt_log_file ? pg_strdup(opt_log_file) : NULL; |
| 140 | if (new_arg->cmd) |
| 141 | pg_free(new_arg->cmd); |
| 142 | new_arg->cmd = pg_strdup(cmd); |
| 143 | |
| 144 | child = (HANDLE) _beginthreadex(NULL, 0, (void *) win32_exec_prog, |
| 145 | new_arg, 0, NULL); |
| 146 | if (child == 0) |
| 147 | pg_fatal("could not create worker thread: %s\n" , strerror(errno)); |
| 148 | |
| 149 | thread_handles[parallel_jobs - 1] = child; |
| 150 | #endif |
| 151 | } |
| 152 | |
| 153 | return; |
| 154 | } |
| 155 | |
| 156 | |
| 157 | #ifdef WIN32 |
| 158 | DWORD |
| 159 | win32_exec_prog(exec_thread_arg *args) |
| 160 | { |
| 161 | int ret; |
| 162 | |
| 163 | ret = !exec_prog(args->log_file, args->opt_log_file, true, true, "%s" , args->cmd); |
| 164 | |
| 165 | /* terminates thread */ |
| 166 | return ret; |
| 167 | } |
| 168 | #endif |
| 169 | |
| 170 | |
| 171 | /* |
| 172 | * parallel_transfer_all_new_dbs |
| 173 | * |
| 174 | * This has the same API as transfer_all_new_dbs, except it does parallel execution |
| 175 | * by transferring multiple tablespaces in parallel |
| 176 | */ |
| 177 | void |
| 178 | parallel_transfer_all_new_dbs(DbInfoArr *old_db_arr, DbInfoArr *new_db_arr, |
| 179 | char *old_pgdata, char *new_pgdata, |
| 180 | char *old_tablespace) |
| 181 | { |
| 182 | #ifndef WIN32 |
| 183 | pid_t child; |
| 184 | #else |
| 185 | HANDLE child; |
| 186 | transfer_thread_arg *new_arg; |
| 187 | #endif |
| 188 | |
| 189 | if (user_opts.jobs <= 1) |
| 190 | transfer_all_new_dbs(old_db_arr, new_db_arr, old_pgdata, new_pgdata, NULL); |
| 191 | else |
| 192 | { |
| 193 | /* parallel */ |
| 194 | #ifdef WIN32 |
| 195 | if (thread_handles == NULL) |
| 196 | thread_handles = pg_malloc(user_opts.jobs * sizeof(HANDLE)); |
| 197 | |
| 198 | if (transfer_thread_args == NULL) |
| 199 | { |
| 200 | int i; |
| 201 | |
| 202 | transfer_thread_args = pg_malloc(user_opts.jobs * sizeof(transfer_thread_arg *)); |
| 203 | |
| 204 | /* |
| 205 | * For safety and performance, we keep the args allocated during |
| 206 | * the entire life of the process, and we don't free the args in a |
| 207 | * thread different from the one that allocated it. |
| 208 | */ |
| 209 | for (i = 0; i < user_opts.jobs; i++) |
| 210 | transfer_thread_args[i] = pg_malloc0(sizeof(transfer_thread_arg)); |
| 211 | } |
| 212 | |
| 213 | cur_thread_args = (void **) transfer_thread_args; |
| 214 | #endif |
| 215 | /* harvest any dead children */ |
| 216 | while (reap_child(false) == true) |
| 217 | ; |
| 218 | |
| 219 | /* must we wait for a dead child? */ |
| 220 | if (parallel_jobs >= user_opts.jobs) |
| 221 | reap_child(true); |
| 222 | |
| 223 | /* set this before we start the job */ |
| 224 | parallel_jobs++; |
| 225 | |
| 226 | /* Ensure stdio state is quiesced before forking */ |
| 227 | fflush(NULL); |
| 228 | |
| 229 | #ifndef WIN32 |
| 230 | child = fork(); |
| 231 | if (child == 0) |
| 232 | { |
| 233 | transfer_all_new_dbs(old_db_arr, new_db_arr, old_pgdata, new_pgdata, |
| 234 | old_tablespace); |
| 235 | /* if we take another exit path, it will be non-zero */ |
| 236 | /* use _exit to skip atexit() functions */ |
| 237 | _exit(0); |
| 238 | } |
| 239 | else if (child < 0) |
| 240 | /* fork failed */ |
| 241 | pg_fatal("could not create worker process: %s\n" , strerror(errno)); |
| 242 | #else |
| 243 | /* empty array element are always at the end */ |
| 244 | new_arg = transfer_thread_args[parallel_jobs - 1]; |
| 245 | |
| 246 | /* Can only pass one pointer into the function, so use a struct */ |
| 247 | new_arg->old_db_arr = old_db_arr; |
| 248 | new_arg->new_db_arr = new_db_arr; |
| 249 | if (new_arg->old_pgdata) |
| 250 | pg_free(new_arg->old_pgdata); |
| 251 | new_arg->old_pgdata = pg_strdup(old_pgdata); |
| 252 | if (new_arg->new_pgdata) |
| 253 | pg_free(new_arg->new_pgdata); |
| 254 | new_arg->new_pgdata = pg_strdup(new_pgdata); |
| 255 | if (new_arg->old_tablespace) |
| 256 | pg_free(new_arg->old_tablespace); |
| 257 | new_arg->old_tablespace = old_tablespace ? pg_strdup(old_tablespace) : NULL; |
| 258 | |
| 259 | child = (HANDLE) _beginthreadex(NULL, 0, (void *) win32_transfer_all_new_dbs, |
| 260 | new_arg, 0, NULL); |
| 261 | if (child == 0) |
| 262 | pg_fatal("could not create worker thread: %s\n" , strerror(errno)); |
| 263 | |
| 264 | thread_handles[parallel_jobs - 1] = child; |
| 265 | #endif |
| 266 | } |
| 267 | |
| 268 | return; |
| 269 | } |
| 270 | |
| 271 | |
| 272 | #ifdef WIN32 |
| 273 | DWORD |
| 274 | win32_transfer_all_new_dbs(transfer_thread_arg *args) |
| 275 | { |
| 276 | transfer_all_new_dbs(args->old_db_arr, args->new_db_arr, args->old_pgdata, |
| 277 | args->new_pgdata, args->old_tablespace); |
| 278 | |
| 279 | /* terminates thread */ |
| 280 | return 0; |
| 281 | } |
| 282 | #endif |
| 283 | |
| 284 | |
| 285 | /* |
| 286 | * collect status from a completed worker child |
| 287 | */ |
| 288 | bool |
| 289 | reap_child(bool wait_for_child) |
| 290 | { |
| 291 | #ifndef WIN32 |
| 292 | int work_status; |
| 293 | pid_t child; |
| 294 | #else |
| 295 | int thread_num; |
| 296 | DWORD res; |
| 297 | #endif |
| 298 | |
| 299 | if (user_opts.jobs <= 1 || parallel_jobs == 0) |
| 300 | return false; |
| 301 | |
| 302 | #ifndef WIN32 |
| 303 | child = waitpid(-1, &work_status, wait_for_child ? 0 : WNOHANG); |
| 304 | if (child == (pid_t) -1) |
| 305 | pg_fatal("waitpid() failed: %s\n" , strerror(errno)); |
| 306 | if (child == 0) |
| 307 | return false; /* no children, or no dead children */ |
| 308 | if (work_status != 0) |
| 309 | pg_fatal("child process exited abnormally: status %d\n" , work_status); |
| 310 | #else |
| 311 | /* wait for one to finish */ |
| 312 | thread_num = WaitForMultipleObjects(parallel_jobs, thread_handles, |
| 313 | false, wait_for_child ? INFINITE : 0); |
| 314 | |
| 315 | if (thread_num == WAIT_TIMEOUT || thread_num == WAIT_FAILED) |
| 316 | return false; |
| 317 | |
| 318 | /* compute thread index in active_threads */ |
| 319 | thread_num -= WAIT_OBJECT_0; |
| 320 | |
| 321 | /* get the result */ |
| 322 | GetExitCodeThread(thread_handles[thread_num], &res); |
| 323 | if (res != 0) |
| 324 | pg_fatal("child worker exited abnormally: %s\n" , strerror(errno)); |
| 325 | |
| 326 | /* dispose of handle to stop leaks */ |
| 327 | CloseHandle(thread_handles[thread_num]); |
| 328 | |
| 329 | /* Move last slot into dead child's position */ |
| 330 | if (thread_num != parallel_jobs - 1) |
| 331 | { |
| 332 | void *tmp_args; |
| 333 | |
| 334 | thread_handles[thread_num] = thread_handles[parallel_jobs - 1]; |
| 335 | |
| 336 | /* |
| 337 | * Move last active thead arg struct into the now-dead slot, and the |
| 338 | * now-dead slot to the end for reuse by the next thread. Though the |
| 339 | * thread struct is in use by another thread, we can safely swap the |
| 340 | * struct pointers within the array. |
| 341 | */ |
| 342 | tmp_args = cur_thread_args[thread_num]; |
| 343 | cur_thread_args[thread_num] = cur_thread_args[parallel_jobs - 1]; |
| 344 | cur_thread_args[parallel_jobs - 1] = tmp_args; |
| 345 | } |
| 346 | #endif |
| 347 | |
| 348 | /* do this after job has been removed */ |
| 349 | parallel_jobs--; |
| 350 | |
| 351 | return true; |
| 352 | } |
| 353 | |