| 1 | /****************************************************** |
| 2 | MariaBackup: hot backup tool for InnoDB |
| 3 | (c) 2009-2013 Percona LLC and/or its affiliates. |
| 4 | Originally Created 3/3/2009 Yasufumi Kinoshita |
| 5 | Written by Alexey Kopytov, Aleksandr Kuzminsky, Stewart Smith, Vadim Tkachenko, |
| 6 | Yasufumi Kinoshita, Ignacio Nin and Baron Schwartz. |
| 7 | |
| 8 | This program is free software; you can redistribute it and/or modify |
| 9 | it under the terms of the GNU General Public License as published by |
| 10 | the Free Software Foundation; version 2 of the License. |
| 11 | |
| 12 | This program is distributed in the hope that it will be useful, |
| 13 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 15 | GNU General Public License for more details. |
| 16 | |
| 17 | You should have received a copy of the GNU General Public License |
| 18 | along with this program; if not, write to the Free Software |
| 19 | Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA |
| 20 | |
| 21 | *******************************************************/ |
| 22 | |
| 23 | /* Source file cursor implementation */ |
| 24 | |
| 25 | #include <my_global.h> |
| 26 | #include <my_base.h> |
| 27 | #include <fil0fil.h> |
| 28 | #include <fsp0fsp.h> |
| 29 | #include <srv0start.h> |
| 30 | #include <trx0sys.h> |
| 31 | |
| 32 | #include "fil_cur.h" |
| 33 | #include "common.h" |
| 34 | #include "read_filt.h" |
| 35 | #include "xtrabackup.h" |
| 36 | |
| 37 | /* Size of read buffer in pages (640 pages = 10M for 16K sized pages) */ |
| 38 | #define XB_FIL_CUR_PAGES 640 |
| 39 | |
| 40 | /*********************************************************************** |
| 41 | Extracts the relative path ("database/table.ibd") of a tablespace from a |
| 42 | specified possibly absolute path. |
| 43 | |
| 44 | For user tablespaces both "./database/table.ibd" and |
| 45 | "/remote/dir/database/table.ibd" result in "database/table.ibd". |
| 46 | |
| 47 | For system tablepsaces (i.e. When is_system is TRUE) both "/remote/dir/ibdata1" |
| 48 | and "./ibdata1" yield "ibdata1" in the output. */ |
| 49 | const char * |
| 50 | xb_get_relative_path( |
| 51 | /*=================*/ |
| 52 | const char* path, /*!< in: tablespace path (either |
| 53 | relative or absolute) */ |
| 54 | ibool is_system) /*!< in: TRUE for system tablespaces, |
| 55 | i.e. when only the filename must be |
| 56 | returned. */ |
| 57 | { |
| 58 | const char *next; |
| 59 | const char *cur; |
| 60 | const char *prev; |
| 61 | |
| 62 | prev = NULL; |
| 63 | cur = path; |
| 64 | |
| 65 | while ((next = strchr(cur, OS_PATH_SEPARATOR)) != NULL) { |
| 66 | |
| 67 | prev = cur; |
| 68 | cur = next + 1; |
| 69 | } |
| 70 | |
| 71 | if (is_system) { |
| 72 | |
| 73 | return(cur); |
| 74 | } else { |
| 75 | |
| 76 | return((prev == NULL) ? cur : prev); |
| 77 | } |
| 78 | |
| 79 | } |
| 80 | |
| 81 | /**********************************************************************//** |
| 82 | Closes a file. */ |
| 83 | static |
| 84 | void |
| 85 | xb_fil_node_close_file( |
| 86 | /*===================*/ |
| 87 | fil_node_t* node) /*!< in: file node */ |
| 88 | { |
| 89 | ibool ret; |
| 90 | |
| 91 | mutex_enter(&fil_system.mutex); |
| 92 | |
| 93 | ut_ad(node); |
| 94 | ut_a(node->n_pending == 0); |
| 95 | ut_a(node->n_pending_flushes == 0); |
| 96 | ut_a(!node->being_extended); |
| 97 | |
| 98 | if (!node->is_open()) { |
| 99 | |
| 100 | mutex_exit(&fil_system.mutex); |
| 101 | |
| 102 | return; |
| 103 | } |
| 104 | |
| 105 | ret = os_file_close(node->handle); |
| 106 | ut_a(ret); |
| 107 | |
| 108 | node->handle = OS_FILE_CLOSED; |
| 109 | |
| 110 | ut_a(fil_system.n_open > 0); |
| 111 | fil_system.n_open--; |
| 112 | fil_n_file_opened--; |
| 113 | |
| 114 | if (node->space->purpose == FIL_TYPE_TABLESPACE && |
| 115 | fil_is_user_tablespace_id(node->space->id)) { |
| 116 | |
| 117 | ut_a(UT_LIST_GET_LEN(fil_system.LRU) > 0); |
| 118 | |
| 119 | /* The node is in the LRU list, remove it */ |
| 120 | UT_LIST_REMOVE(fil_system.LRU, node); |
| 121 | } |
| 122 | |
| 123 | mutex_exit(&fil_system.mutex); |
| 124 | } |
| 125 | |
| 126 | /************************************************************************ |
| 127 | Open a source file cursor and initialize the associated read filter. |
| 128 | |
| 129 | @return XB_FIL_CUR_SUCCESS on success, XB_FIL_CUR_SKIP if the source file must |
| 130 | be skipped and XB_FIL_CUR_ERROR on error. */ |
| 131 | xb_fil_cur_result_t |
| 132 | xb_fil_cur_open( |
| 133 | /*============*/ |
| 134 | xb_fil_cur_t* cursor, /*!< out: source file cursor */ |
| 135 | xb_read_filt_t* read_filter, /*!< in/out: the read filter */ |
| 136 | fil_node_t* node, /*!< in: source tablespace node */ |
| 137 | uint thread_n) /*!< thread number for diagnostics */ |
| 138 | { |
| 139 | bool success; |
| 140 | |
| 141 | /* Initialize these first so xb_fil_cur_close() handles them correctly |
| 142 | in case of error */ |
| 143 | cursor->orig_buf = NULL; |
| 144 | cursor->node = NULL; |
| 145 | |
| 146 | cursor->space_id = node->space->id; |
| 147 | |
| 148 | strncpy(cursor->abs_path, node->name, sizeof(cursor->abs_path)); |
| 149 | |
| 150 | /* Get the relative path for the destination tablespace name, i.e. the |
| 151 | one that can be appended to the backup root directory. Non-system |
| 152 | tablespaces may have absolute paths for DATA DIRECTORY. |
| 153 | We want to make "local" copies for the backup. */ |
| 154 | strncpy(cursor->rel_path, |
| 155 | xb_get_relative_path(cursor->abs_path, cursor->is_system()), |
| 156 | sizeof(cursor->rel_path)); |
| 157 | |
| 158 | /* In the backup mode we should already have a tablespace handle created |
| 159 | by fil_ibd_load() unless it is a system |
| 160 | tablespace. Otherwise we open the file here. */ |
| 161 | if (cursor->is_system() || srv_operation == SRV_OPERATION_RESTORE_DELTA |
| 162 | || xb_close_files) { |
| 163 | node->handle = os_file_create_simple_no_error_handling( |
| 164 | 0, node->name, |
| 165 | OS_FILE_OPEN, |
| 166 | OS_FILE_READ_ALLOW_DELETE, true, &success); |
| 167 | if (!success) { |
| 168 | /* The following call prints an error message */ |
| 169 | os_file_get_last_error(TRUE); |
| 170 | |
| 171 | msg("[%02u] mariabackup: error: cannot open " |
| 172 | "tablespace %s\n" , |
| 173 | thread_n, cursor->abs_path); |
| 174 | |
| 175 | return(XB_FIL_CUR_ERROR); |
| 176 | } |
| 177 | mutex_enter(&fil_system.mutex); |
| 178 | |
| 179 | fil_system.n_open++; |
| 180 | fil_n_file_opened++; |
| 181 | |
| 182 | if (node->space->purpose == FIL_TYPE_TABLESPACE && |
| 183 | fil_is_user_tablespace_id(node->space->id)) { |
| 184 | |
| 185 | /* Put the node to the LRU list */ |
| 186 | UT_LIST_ADD_FIRST(fil_system.LRU, node); |
| 187 | } |
| 188 | |
| 189 | mutex_exit(&fil_system.mutex); |
| 190 | } |
| 191 | |
| 192 | ut_ad(node->is_open()); |
| 193 | |
| 194 | cursor->node = node; |
| 195 | cursor->file = node->handle; |
| 196 | |
| 197 | if (stat(cursor->abs_path, &cursor->statinfo)) { |
| 198 | msg("[%02u] mariabackup: error: cannot stat %s\n" , |
| 199 | thread_n, cursor->abs_path); |
| 200 | |
| 201 | xb_fil_cur_close(cursor); |
| 202 | |
| 203 | return(XB_FIL_CUR_ERROR); |
| 204 | } |
| 205 | |
| 206 | if (srv_file_flush_method == SRV_O_DIRECT |
| 207 | || srv_file_flush_method == SRV_O_DIRECT_NO_FSYNC) { |
| 208 | |
| 209 | os_file_set_nocache(cursor->file, node->name, "OPEN" ); |
| 210 | } |
| 211 | |
| 212 | posix_fadvise(cursor->file, 0, 0, POSIX_FADV_SEQUENTIAL); |
| 213 | |
| 214 | const page_size_t page_size(cursor->node->space->flags); |
| 215 | cursor->page_size = page_size; |
| 216 | |
| 217 | /* Allocate read buffer */ |
| 218 | cursor->buf_size = XB_FIL_CUR_PAGES * page_size.physical(); |
| 219 | cursor->orig_buf = static_cast<byte *> |
| 220 | (malloc(cursor->buf_size + srv_page_size)); |
| 221 | cursor->buf = static_cast<byte *> |
| 222 | (ut_align(cursor->orig_buf, srv_page_size)); |
| 223 | |
| 224 | cursor->buf_read = 0; |
| 225 | cursor->buf_npages = 0; |
| 226 | cursor->buf_offset = 0; |
| 227 | cursor->buf_page_no = 0; |
| 228 | cursor->thread_n = thread_n; |
| 229 | |
| 230 | cursor->space_size = (ulint)(cursor->statinfo.st_size |
| 231 | / page_size.physical()); |
| 232 | |
| 233 | cursor->read_filter = read_filter; |
| 234 | cursor->read_filter->init(&cursor->read_filter_ctxt, cursor, |
| 235 | node->space->id); |
| 236 | |
| 237 | return(XB_FIL_CUR_SUCCESS); |
| 238 | } |
| 239 | |
| 240 | /************************************************************************ |
| 241 | Reads and verifies the next block of pages from the source |
| 242 | file. Positions the cursor after the last read non-corrupted page. |
| 243 | |
| 244 | @return XB_FIL_CUR_SUCCESS if some have been read successfully, XB_FIL_CUR_EOF |
| 245 | if there are no more pages to read and XB_FIL_CUR_ERROR on error. */ |
| 246 | xb_fil_cur_result_t |
| 247 | xb_fil_cur_read( |
| 248 | /*============*/ |
| 249 | xb_fil_cur_t* cursor) /*!< in/out: source file cursor */ |
| 250 | { |
| 251 | ibool success; |
| 252 | byte* page; |
| 253 | ulint i; |
| 254 | ulint npages; |
| 255 | ulint retry_count; |
| 256 | xb_fil_cur_result_t ret; |
| 257 | ib_int64_t offset; |
| 258 | ib_int64_t to_read; |
| 259 | const ulint page_size = cursor->page_size.physical(); |
| 260 | xb_ad(!cursor->is_system() || page_size == srv_page_size); |
| 261 | |
| 262 | cursor->read_filter->get_next_batch(&cursor->read_filter_ctxt, |
| 263 | &offset, &to_read); |
| 264 | |
| 265 | if (to_read == 0LL) { |
| 266 | return(XB_FIL_CUR_EOF); |
| 267 | } |
| 268 | |
| 269 | if (to_read > (ib_int64_t) cursor->buf_size) { |
| 270 | to_read = (ib_int64_t) cursor->buf_size; |
| 271 | } |
| 272 | |
| 273 | xb_a(to_read > 0 && to_read <= 0xFFFFFFFFLL); |
| 274 | |
| 275 | if ((to_read & ~(page_size - 1)) |
| 276 | && offset + to_read == cursor->statinfo.st_size) { |
| 277 | |
| 278 | if (to_read < (ib_int64_t) page_size) { |
| 279 | msg("[%02u] mariabackup: Warning: junk at the end of " |
| 280 | "%s:\n" , cursor->thread_n, cursor->abs_path); |
| 281 | msg("[%02u] mariabackup: Warning: offset = %llu, " |
| 282 | "to_read = %llu\n" , |
| 283 | cursor->thread_n, |
| 284 | (unsigned long long) offset, |
| 285 | (unsigned long long) to_read); |
| 286 | |
| 287 | return(XB_FIL_CUR_EOF); |
| 288 | } |
| 289 | |
| 290 | to_read = (ib_int64_t) (((ulint) to_read) & |
| 291 | ~(page_size - 1)); |
| 292 | } |
| 293 | |
| 294 | xb_a((to_read & (page_size - 1)) == 0); |
| 295 | |
| 296 | npages = (ulint) (to_read / cursor->page_size.physical()); |
| 297 | |
| 298 | retry_count = 10; |
| 299 | ret = XB_FIL_CUR_SUCCESS; |
| 300 | |
| 301 | read_retry: |
| 302 | xtrabackup_io_throttling(); |
| 303 | |
| 304 | cursor->buf_read = 0; |
| 305 | cursor->buf_npages = 0; |
| 306 | cursor->buf_offset = offset; |
| 307 | cursor->buf_page_no = (ulint)(offset / cursor->page_size.physical()); |
| 308 | |
| 309 | fil_space_t* space = fil_space_get(cursor->space_id); |
| 310 | |
| 311 | if (!space) { |
| 312 | return(XB_FIL_CUR_ERROR); |
| 313 | } |
| 314 | |
| 315 | success = os_file_read(IORequestRead, |
| 316 | cursor->file, cursor->buf, offset, |
| 317 | (ulint) to_read); |
| 318 | if (!success) { |
| 319 | return(XB_FIL_CUR_ERROR); |
| 320 | } |
| 321 | |
| 322 | /* check pages for corruption and re-read if necessary. i.e. in case of |
| 323 | partially written pages */ |
| 324 | for (page = cursor->buf, i = 0; i < npages; |
| 325 | page += page_size, i++) { |
| 326 | ulint page_no = cursor->buf_page_no + i; |
| 327 | |
| 328 | if (cursor->space_id == TRX_SYS_SPACE && |
| 329 | page_no >= FSP_EXTENT_SIZE && |
| 330 | page_no < FSP_EXTENT_SIZE * 3) { |
| 331 | /* We ignore the doublewrite buffer pages */ |
| 332 | } else if (!fil_space_verify_crypt_checksum( |
| 333 | page, cursor->page_size, space->id, page_no) |
| 334 | && buf_page_is_corrupted(true, page, |
| 335 | cursor->page_size, |
| 336 | space)) { |
| 337 | retry_count--; |
| 338 | if (retry_count == 0) { |
| 339 | msg("[%02u] mariabackup: " |
| 340 | "Error: failed to read page after " |
| 341 | "10 retries. File %s seems to be " |
| 342 | "corrupted.\n" , cursor->thread_n, |
| 343 | cursor->abs_path); |
| 344 | ret = XB_FIL_CUR_ERROR; |
| 345 | break; |
| 346 | } |
| 347 | |
| 348 | if (retry_count == 9) { |
| 349 | msg("[%02u] mariabackup: " |
| 350 | "Database page corruption detected at page " |
| 351 | ULINTPF ", retrying...\n" , |
| 352 | cursor->thread_n, page_no); |
| 353 | } |
| 354 | |
| 355 | os_thread_sleep(100000); |
| 356 | |
| 357 | goto read_retry; |
| 358 | } |
| 359 | cursor->buf_read += page_size; |
| 360 | cursor->buf_npages++; |
| 361 | } |
| 362 | |
| 363 | posix_fadvise(cursor->file, offset, to_read, POSIX_FADV_DONTNEED); |
| 364 | |
| 365 | return(ret); |
| 366 | } |
| 367 | |
| 368 | /************************************************************************ |
| 369 | Close the source file cursor opened with xb_fil_cur_open() and its |
| 370 | associated read filter. */ |
| 371 | void |
| 372 | xb_fil_cur_close( |
| 373 | /*=============*/ |
| 374 | xb_fil_cur_t *cursor) /*!< in/out: source file cursor */ |
| 375 | { |
| 376 | cursor->read_filter->deinit(&cursor->read_filter_ctxt); |
| 377 | |
| 378 | free(cursor->orig_buf); |
| 379 | |
| 380 | if (cursor->node != NULL) { |
| 381 | xb_fil_node_close_file(cursor->node); |
| 382 | cursor->file = OS_FILE_CLOSED; |
| 383 | } |
| 384 | } |
| 385 | |