| rjw | 1f88458 | 2022-01-06 17:20:42 +0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2007 Oracle. All rights reserved. |
| 3 | * |
| 4 | * This program is free software; you can redistribute it and/or |
| 5 | * modify it under the terms of the GNU General Public |
| 6 | * License v2 as published by the Free Software Foundation. |
| 7 | * |
| 8 | * This program is distributed in the hope that it will be useful, |
| 9 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 11 | * General Public License for more details. |
| 12 | * |
| 13 | * You should have received a copy of the GNU General Public |
| 14 | * License along with this program; if not, write to the |
| 15 | * Free Software Foundation, Inc., 59 Temple Place - Suite 330, |
| 16 | * Boston, MA 021110-1307, USA. |
| 17 | */ |
| 18 | |
| 19 | #include <linux/err.h> |
| 20 | #include <linux/uuid.h> |
| 21 | #include "ctree.h" |
| 22 | #include "transaction.h" |
| 23 | #include "disk-io.h" |
| 24 | #include "print-tree.h" |
| 25 | |
| 26 | /* |
| 27 | * Read a root item from the tree. In case we detect a root item smaller then |
| 28 | * sizeof(root_item), we know it's an old version of the root structure and |
| 29 | * initialize all new fields to zero. The same happens if we detect mismatching |
| 30 | * generation numbers as then we know the root was once mounted with an older |
| 31 | * kernel that was not aware of the root item structure change. |
| 32 | */ |
| 33 | static void btrfs_read_root_item(struct extent_buffer *eb, int slot, |
| 34 | struct btrfs_root_item *item) |
| 35 | { |
| 36 | uuid_le uuid; |
| 37 | int len; |
| 38 | int need_reset = 0; |
| 39 | |
| 40 | len = btrfs_item_size_nr(eb, slot); |
| 41 | read_extent_buffer(eb, item, btrfs_item_ptr_offset(eb, slot), |
| 42 | min_t(int, len, (int)sizeof(*item))); |
| 43 | if (len < sizeof(*item)) |
| 44 | need_reset = 1; |
| 45 | if (!need_reset && btrfs_root_generation(item) |
| 46 | != btrfs_root_generation_v2(item)) { |
| 47 | if (btrfs_root_generation_v2(item) != 0) { |
| 48 | btrfs_warn(eb->fs_info, |
| 49 | "mismatching generation and generation_v2 found in root item. This root was probably mounted with an older kernel. Resetting all new fields."); |
| 50 | } |
| 51 | need_reset = 1; |
| 52 | } |
| 53 | if (need_reset) { |
| 54 | memset(&item->generation_v2, 0, |
| 55 | sizeof(*item) - offsetof(struct btrfs_root_item, |
| 56 | generation_v2)); |
| 57 | |
| 58 | uuid_le_gen(&uuid); |
| 59 | memcpy(item->uuid, uuid.b, BTRFS_UUID_SIZE); |
| 60 | } |
| 61 | } |
| 62 | |
| 63 | /* |
| 64 | * btrfs_find_root - lookup the root by the key. |
| 65 | * root: the root of the root tree |
| 66 | * search_key: the key to search |
| 67 | * path: the path we search |
| 68 | * root_item: the root item of the tree we look for |
| 69 | * root_key: the root key of the tree we look for |
| 70 | * |
| 71 | * If ->offset of 'search_key' is -1ULL, it means we are not sure the offset |
| 72 | * of the search key, just lookup the root with the highest offset for a |
| 73 | * given objectid. |
| 74 | * |
| 75 | * If we find something return 0, otherwise > 0, < 0 on error. |
| 76 | */ |
| 77 | int btrfs_find_root(struct btrfs_root *root, const struct btrfs_key *search_key, |
| 78 | struct btrfs_path *path, struct btrfs_root_item *root_item, |
| 79 | struct btrfs_key *root_key) |
| 80 | { |
| 81 | struct btrfs_key found_key; |
| 82 | struct extent_buffer *l; |
| 83 | int ret; |
| 84 | int slot; |
| 85 | |
| 86 | ret = btrfs_search_slot(NULL, root, search_key, path, 0, 0); |
| 87 | if (ret < 0) |
| 88 | return ret; |
| 89 | |
| 90 | if (search_key->offset != -1ULL) { /* the search key is exact */ |
| 91 | if (ret > 0) |
| 92 | goto out; |
| 93 | } else { |
| 94 | BUG_ON(ret == 0); /* Logical error */ |
| 95 | if (path->slots[0] == 0) |
| 96 | goto out; |
| 97 | path->slots[0]--; |
| 98 | ret = 0; |
| 99 | } |
| 100 | |
| 101 | l = path->nodes[0]; |
| 102 | slot = path->slots[0]; |
| 103 | |
| 104 | btrfs_item_key_to_cpu(l, &found_key, slot); |
| 105 | if (found_key.objectid != search_key->objectid || |
| 106 | found_key.type != BTRFS_ROOT_ITEM_KEY) { |
| 107 | ret = 1; |
| 108 | goto out; |
| 109 | } |
| 110 | |
| 111 | if (root_item) |
| 112 | btrfs_read_root_item(l, slot, root_item); |
| 113 | if (root_key) |
| 114 | memcpy(root_key, &found_key, sizeof(found_key)); |
| 115 | out: |
| 116 | btrfs_release_path(path); |
| 117 | return ret; |
| 118 | } |
| 119 | |
| 120 | void btrfs_set_root_node(struct btrfs_root_item *item, |
| 121 | struct extent_buffer *node) |
| 122 | { |
| 123 | btrfs_set_root_bytenr(item, node->start); |
| 124 | btrfs_set_root_level(item, btrfs_header_level(node)); |
| 125 | btrfs_set_root_generation(item, btrfs_header_generation(node)); |
| 126 | } |
| 127 | |
| 128 | /* |
| 129 | * copy the data in 'item' into the btree |
| 130 | */ |
| 131 | int btrfs_update_root(struct btrfs_trans_handle *trans, struct btrfs_root |
| 132 | *root, struct btrfs_key *key, struct btrfs_root_item |
| 133 | *item) |
| 134 | { |
| 135 | struct btrfs_fs_info *fs_info = root->fs_info; |
| 136 | struct btrfs_path *path; |
| 137 | struct extent_buffer *l; |
| 138 | int ret; |
| 139 | int slot; |
| 140 | unsigned long ptr; |
| 141 | u32 old_len; |
| 142 | |
| 143 | path = btrfs_alloc_path(); |
| 144 | if (!path) |
| 145 | return -ENOMEM; |
| 146 | |
| 147 | ret = btrfs_search_slot(trans, root, key, path, 0, 1); |
| 148 | if (ret < 0) |
| 149 | goto out; |
| 150 | |
| 151 | if (ret > 0) { |
| 152 | btrfs_crit(fs_info, |
| 153 | "unable to find root key (%llu %u %llu) in tree %llu", |
| 154 | key->objectid, key->type, key->offset, |
| 155 | root->root_key.objectid); |
| 156 | ret = -EUCLEAN; |
| 157 | btrfs_abort_transaction(trans, ret); |
| 158 | goto out; |
| 159 | } |
| 160 | |
| 161 | l = path->nodes[0]; |
| 162 | slot = path->slots[0]; |
| 163 | ptr = btrfs_item_ptr_offset(l, slot); |
| 164 | old_len = btrfs_item_size_nr(l, slot); |
| 165 | |
| 166 | /* |
| 167 | * If this is the first time we update the root item which originated |
| 168 | * from an older kernel, we need to enlarge the item size to make room |
| 169 | * for the added fields. |
| 170 | */ |
| 171 | if (old_len < sizeof(*item)) { |
| 172 | btrfs_release_path(path); |
| 173 | ret = btrfs_search_slot(trans, root, key, path, |
| 174 | -1, 1); |
| 175 | if (ret < 0) { |
| 176 | btrfs_abort_transaction(trans, ret); |
| 177 | goto out; |
| 178 | } |
| 179 | |
| 180 | ret = btrfs_del_item(trans, root, path); |
| 181 | if (ret < 0) { |
| 182 | btrfs_abort_transaction(trans, ret); |
| 183 | goto out; |
| 184 | } |
| 185 | btrfs_release_path(path); |
| 186 | ret = btrfs_insert_empty_item(trans, root, path, |
| 187 | key, sizeof(*item)); |
| 188 | if (ret < 0) { |
| 189 | btrfs_abort_transaction(trans, ret); |
| 190 | goto out; |
| 191 | } |
| 192 | l = path->nodes[0]; |
| 193 | slot = path->slots[0]; |
| 194 | ptr = btrfs_item_ptr_offset(l, slot); |
| 195 | } |
| 196 | |
| 197 | /* |
| 198 | * Update generation_v2 so at the next mount we know the new root |
| 199 | * fields are valid. |
| 200 | */ |
| 201 | btrfs_set_root_generation_v2(item, btrfs_root_generation(item)); |
| 202 | |
| 203 | write_extent_buffer(l, item, ptr, sizeof(*item)); |
| 204 | btrfs_mark_buffer_dirty(path->nodes[0]); |
| 205 | out: |
| 206 | btrfs_free_path(path); |
| 207 | return ret; |
| 208 | } |
| 209 | |
| 210 | int btrfs_insert_root(struct btrfs_trans_handle *trans, struct btrfs_root *root, |
| 211 | const struct btrfs_key *key, struct btrfs_root_item *item) |
| 212 | { |
| 213 | /* |
| 214 | * Make sure generation v1 and v2 match. See update_root for details. |
| 215 | */ |
| 216 | btrfs_set_root_generation_v2(item, btrfs_root_generation(item)); |
| 217 | return btrfs_insert_item(trans, root, key, item, sizeof(*item)); |
| 218 | } |
| 219 | |
| 220 | int btrfs_find_orphan_roots(struct btrfs_fs_info *fs_info) |
| 221 | { |
| 222 | struct btrfs_root *tree_root = fs_info->tree_root; |
| 223 | struct extent_buffer *leaf; |
| 224 | struct btrfs_path *path; |
| 225 | struct btrfs_key key; |
| 226 | struct btrfs_key root_key; |
| 227 | struct btrfs_root *root; |
| 228 | int err = 0; |
| 229 | int ret; |
| 230 | bool can_recover = true; |
| 231 | |
| 232 | if (sb_rdonly(fs_info->sb)) |
| 233 | can_recover = false; |
| 234 | |
| 235 | path = btrfs_alloc_path(); |
| 236 | if (!path) |
| 237 | return -ENOMEM; |
| 238 | |
| 239 | key.objectid = BTRFS_ORPHAN_OBJECTID; |
| 240 | key.type = BTRFS_ORPHAN_ITEM_KEY; |
| 241 | key.offset = 0; |
| 242 | |
| 243 | root_key.type = BTRFS_ROOT_ITEM_KEY; |
| 244 | root_key.offset = (u64)-1; |
| 245 | |
| 246 | while (1) { |
| 247 | ret = btrfs_search_slot(NULL, tree_root, &key, path, 0, 0); |
| 248 | if (ret < 0) { |
| 249 | err = ret; |
| 250 | break; |
| 251 | } |
| 252 | |
| 253 | leaf = path->nodes[0]; |
| 254 | if (path->slots[0] >= btrfs_header_nritems(leaf)) { |
| 255 | ret = btrfs_next_leaf(tree_root, path); |
| 256 | if (ret < 0) |
| 257 | err = ret; |
| 258 | if (ret != 0) |
| 259 | break; |
| 260 | leaf = path->nodes[0]; |
| 261 | } |
| 262 | |
| 263 | btrfs_item_key_to_cpu(leaf, &key, path->slots[0]); |
| 264 | btrfs_release_path(path); |
| 265 | |
| 266 | if (key.objectid != BTRFS_ORPHAN_OBJECTID || |
| 267 | key.type != BTRFS_ORPHAN_ITEM_KEY) |
| 268 | break; |
| 269 | |
| 270 | root_key.objectid = key.offset; |
| 271 | key.offset++; |
| 272 | |
| 273 | /* |
| 274 | * The root might have been inserted already, as before we look |
| 275 | * for orphan roots, log replay might have happened, which |
| 276 | * triggers a transaction commit and qgroup accounting, which |
| 277 | * in turn reads and inserts fs roots while doing backref |
| 278 | * walking. |
| 279 | */ |
| 280 | root = btrfs_lookup_fs_root(fs_info, root_key.objectid); |
| 281 | if (root) { |
| 282 | WARN_ON(!test_bit(BTRFS_ROOT_ORPHAN_ITEM_INSERTED, |
| 283 | &root->state)); |
| 284 | if (btrfs_root_refs(&root->root_item) == 0) |
| 285 | btrfs_add_dead_root(root); |
| 286 | continue; |
| 287 | } |
| 288 | |
| 289 | root = btrfs_read_fs_root(tree_root, &root_key); |
| 290 | err = PTR_ERR_OR_ZERO(root); |
| 291 | if (err && err != -ENOENT) { |
| 292 | break; |
| 293 | } else if (err == -ENOENT) { |
| 294 | struct btrfs_trans_handle *trans; |
| 295 | |
| 296 | btrfs_release_path(path); |
| 297 | |
| 298 | trans = btrfs_join_transaction(tree_root); |
| 299 | if (IS_ERR(trans)) { |
| 300 | err = PTR_ERR(trans); |
| 301 | btrfs_handle_fs_error(fs_info, err, |
| 302 | "Failed to start trans to delete orphan item"); |
| 303 | break; |
| 304 | } |
| 305 | err = btrfs_del_orphan_item(trans, tree_root, |
| 306 | root_key.objectid); |
| 307 | btrfs_end_transaction(trans); |
| 308 | if (err) { |
| 309 | btrfs_handle_fs_error(fs_info, err, |
| 310 | "Failed to delete root orphan item"); |
| 311 | break; |
| 312 | } |
| 313 | continue; |
| 314 | } |
| 315 | |
| 316 | err = btrfs_init_fs_root(root); |
| 317 | if (err) { |
| 318 | btrfs_free_fs_root(root); |
| 319 | break; |
| 320 | } |
| 321 | |
| 322 | set_bit(BTRFS_ROOT_ORPHAN_ITEM_INSERTED, &root->state); |
| 323 | |
| 324 | err = btrfs_insert_fs_root(fs_info, root); |
| 325 | if (err) { |
| 326 | BUG_ON(err == -EEXIST); |
| 327 | btrfs_free_fs_root(root); |
| 328 | break; |
| 329 | } |
| 330 | |
| 331 | if (btrfs_root_refs(&root->root_item) == 0) |
| 332 | btrfs_add_dead_root(root); |
| 333 | } |
| 334 | |
| 335 | btrfs_free_path(path); |
| 336 | return err; |
| 337 | } |
| 338 | |
| 339 | /* drop the root item for 'key' from the tree root */ |
| 340 | int btrfs_del_root(struct btrfs_trans_handle *trans, |
| 341 | struct btrfs_fs_info *fs_info, const struct btrfs_key *key) |
| 342 | { |
| 343 | struct btrfs_root *root = fs_info->tree_root; |
| 344 | struct btrfs_path *path; |
| 345 | int ret; |
| 346 | |
| 347 | path = btrfs_alloc_path(); |
| 348 | if (!path) |
| 349 | return -ENOMEM; |
| 350 | ret = btrfs_search_slot(trans, root, key, path, -1, 1); |
| 351 | if (ret < 0) |
| 352 | goto out; |
| 353 | |
| 354 | BUG_ON(ret != 0); |
| 355 | |
| 356 | ret = btrfs_del_item(trans, root, path); |
| 357 | out: |
| 358 | btrfs_free_path(path); |
| 359 | return ret; |
| 360 | } |
| 361 | |
| 362 | int btrfs_del_root_ref(struct btrfs_trans_handle *trans, |
| 363 | struct btrfs_fs_info *fs_info, |
| 364 | u64 root_id, u64 ref_id, u64 dirid, u64 *sequence, |
| 365 | const char *name, int name_len) |
| 366 | |
| 367 | { |
| 368 | struct btrfs_root *tree_root = fs_info->tree_root; |
| 369 | struct btrfs_path *path; |
| 370 | struct btrfs_root_ref *ref; |
| 371 | struct extent_buffer *leaf; |
| 372 | struct btrfs_key key; |
| 373 | unsigned long ptr; |
| 374 | int err = 0; |
| 375 | int ret; |
| 376 | |
| 377 | path = btrfs_alloc_path(); |
| 378 | if (!path) |
| 379 | return -ENOMEM; |
| 380 | |
| 381 | key.objectid = root_id; |
| 382 | key.type = BTRFS_ROOT_BACKREF_KEY; |
| 383 | key.offset = ref_id; |
| 384 | again: |
| 385 | ret = btrfs_search_slot(trans, tree_root, &key, path, -1, 1); |
| 386 | BUG_ON(ret < 0); |
| 387 | if (ret == 0) { |
| 388 | leaf = path->nodes[0]; |
| 389 | ref = btrfs_item_ptr(leaf, path->slots[0], |
| 390 | struct btrfs_root_ref); |
| 391 | |
| 392 | WARN_ON(btrfs_root_ref_dirid(leaf, ref) != dirid); |
| 393 | WARN_ON(btrfs_root_ref_name_len(leaf, ref) != name_len); |
| 394 | ptr = (unsigned long)(ref + 1); |
| 395 | ret = btrfs_is_name_len_valid(leaf, path->slots[0], ptr, |
| 396 | name_len); |
| 397 | if (!ret) { |
| 398 | err = -EIO; |
| 399 | goto out; |
| 400 | } |
| 401 | |
| 402 | WARN_ON(memcmp_extent_buffer(leaf, name, ptr, name_len)); |
| 403 | *sequence = btrfs_root_ref_sequence(leaf, ref); |
| 404 | |
| 405 | ret = btrfs_del_item(trans, tree_root, path); |
| 406 | if (ret) { |
| 407 | err = ret; |
| 408 | goto out; |
| 409 | } |
| 410 | } else |
| 411 | err = -ENOENT; |
| 412 | |
| 413 | if (key.type == BTRFS_ROOT_BACKREF_KEY) { |
| 414 | btrfs_release_path(path); |
| 415 | key.objectid = ref_id; |
| 416 | key.type = BTRFS_ROOT_REF_KEY; |
| 417 | key.offset = root_id; |
| 418 | goto again; |
| 419 | } |
| 420 | |
| 421 | out: |
| 422 | btrfs_free_path(path); |
| 423 | return err; |
| 424 | } |
| 425 | |
| 426 | /* |
| 427 | * add a btrfs_root_ref item. type is either BTRFS_ROOT_REF_KEY |
| 428 | * or BTRFS_ROOT_BACKREF_KEY. |
| 429 | * |
| 430 | * The dirid, sequence, name and name_len refer to the directory entry |
| 431 | * that is referencing the root. |
| 432 | * |
| 433 | * For a forward ref, the root_id is the id of the tree referencing |
| 434 | * the root and ref_id is the id of the subvol or snapshot. |
| 435 | * |
| 436 | * For a back ref the root_id is the id of the subvol or snapshot and |
| 437 | * ref_id is the id of the tree referencing it. |
| 438 | * |
| 439 | * Will return 0, -ENOMEM, or anything from the CoW path |
| 440 | */ |
| 441 | int btrfs_add_root_ref(struct btrfs_trans_handle *trans, |
| 442 | struct btrfs_fs_info *fs_info, |
| 443 | u64 root_id, u64 ref_id, u64 dirid, u64 sequence, |
| 444 | const char *name, int name_len) |
| 445 | { |
| 446 | struct btrfs_root *tree_root = fs_info->tree_root; |
| 447 | struct btrfs_key key; |
| 448 | int ret; |
| 449 | struct btrfs_path *path; |
| 450 | struct btrfs_root_ref *ref; |
| 451 | struct extent_buffer *leaf; |
| 452 | unsigned long ptr; |
| 453 | |
| 454 | path = btrfs_alloc_path(); |
| 455 | if (!path) |
| 456 | return -ENOMEM; |
| 457 | |
| 458 | key.objectid = root_id; |
| 459 | key.type = BTRFS_ROOT_BACKREF_KEY; |
| 460 | key.offset = ref_id; |
| 461 | again: |
| 462 | ret = btrfs_insert_empty_item(trans, tree_root, path, &key, |
| 463 | sizeof(*ref) + name_len); |
| 464 | if (ret) { |
| 465 | btrfs_abort_transaction(trans, ret); |
| 466 | btrfs_free_path(path); |
| 467 | return ret; |
| 468 | } |
| 469 | |
| 470 | leaf = path->nodes[0]; |
| 471 | ref = btrfs_item_ptr(leaf, path->slots[0], struct btrfs_root_ref); |
| 472 | btrfs_set_root_ref_dirid(leaf, ref, dirid); |
| 473 | btrfs_set_root_ref_sequence(leaf, ref, sequence); |
| 474 | btrfs_set_root_ref_name_len(leaf, ref, name_len); |
| 475 | ptr = (unsigned long)(ref + 1); |
| 476 | write_extent_buffer(leaf, name, ptr, name_len); |
| 477 | btrfs_mark_buffer_dirty(leaf); |
| 478 | |
| 479 | if (key.type == BTRFS_ROOT_BACKREF_KEY) { |
| 480 | btrfs_release_path(path); |
| 481 | key.objectid = ref_id; |
| 482 | key.type = BTRFS_ROOT_REF_KEY; |
| 483 | key.offset = root_id; |
| 484 | goto again; |
| 485 | } |
| 486 | |
| 487 | btrfs_free_path(path); |
| 488 | return 0; |
| 489 | } |
| 490 | |
| 491 | /* |
| 492 | * Old btrfs forgets to init root_item->flags and root_item->byte_limit |
| 493 | * for subvolumes. To work around this problem, we steal a bit from |
| 494 | * root_item->inode_item->flags, and use it to indicate if those fields |
| 495 | * have been properly initialized. |
| 496 | */ |
| 497 | void btrfs_check_and_init_root_item(struct btrfs_root_item *root_item) |
| 498 | { |
| 499 | u64 inode_flags = btrfs_stack_inode_flags(&root_item->inode); |
| 500 | |
| 501 | if (!(inode_flags & BTRFS_INODE_ROOT_ITEM_INIT)) { |
| 502 | inode_flags |= BTRFS_INODE_ROOT_ITEM_INIT; |
| 503 | btrfs_set_stack_inode_flags(&root_item->inode, inode_flags); |
| 504 | btrfs_set_root_flags(root_item, 0); |
| 505 | btrfs_set_root_limit(root_item, 0); |
| 506 | } |
| 507 | } |
| 508 | |
| 509 | void btrfs_update_root_times(struct btrfs_trans_handle *trans, |
| 510 | struct btrfs_root *root) |
| 511 | { |
| 512 | struct btrfs_root_item *item = &root->root_item; |
| 513 | struct timespec ct; |
| 514 | |
| 515 | ktime_get_real_ts(&ct); |
| 516 | spin_lock(&root->root_item_lock); |
| 517 | btrfs_set_root_ctransid(item, trans->transid); |
| 518 | btrfs_set_stack_timespec_sec(&item->ctime, ct.tv_sec); |
| 519 | btrfs_set_stack_timespec_nsec(&item->ctime, ct.tv_nsec); |
| 520 | spin_unlock(&root->root_item_lock); |
| 521 | } |