tree-checker.c 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584
  1. /*
  2. * Copyright (C) Qu Wenruo 2017. All rights reserved.
  3. *
  4. * This program is free software; you can redistribute it and/or
  5. * modify it under the terms of the GNU General Public
  6. * License v2 as published by the Free Software Foundation.
  7. *
  8. * This program is distributed in the hope that it will be useful,
  9. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  11. * General Public License for more details.
  12. *
  13. * You should have received a copy of the GNU General Public
  14. * License along with this program.
  15. */
  16. /*
  17. * The module is used to catch unexpected/corrupted tree block data.
  18. * Such behavior can be caused either by a fuzzed image or bugs.
  19. *
  20. * The objective is to do leaf/node validation checks when tree block is read
  21. * from disk, and check *every* possible member, so other code won't
  22. * need to checking them again.
  23. *
  24. * Due to the potential and unwanted damage, every checker needs to be
  25. * carefully reviewed otherwise so it does not prevent mount of valid images.
  26. */
  27. #include "ctree.h"
  28. #include "tree-checker.h"
  29. #include "disk-io.h"
  30. #include "compression.h"
  31. #include "hash.h"
  32. /*
  33. * Error message should follow the following format:
  34. * corrupt <type>: <identifier>, <reason>[, <bad_value>]
  35. *
  36. * @type: leaf or node
  37. * @identifier: the necessary info to locate the leaf/node.
  38. * It's recommened to decode key.objecitd/offset if it's
  39. * meaningful.
  40. * @reason: describe the error
  41. * @bad_value: optional, it's recommened to output bad value and its
  42. * expected value (range).
  43. *
  44. * Since comma is used to separate the components, only space is allowed
  45. * inside each component.
  46. */
  47. /*
  48. * Append generic "corrupt leaf/node root=%llu block=%llu slot=%d: " to @fmt.
  49. * Allows callers to customize the output.
  50. */
  51. __printf(4, 5)
  52. static void generic_err(const struct btrfs_root *root,
  53. const struct extent_buffer *eb, int slot,
  54. const char *fmt, ...)
  55. {
  56. struct va_format vaf;
  57. va_list args;
  58. va_start(args, fmt);
  59. vaf.fmt = fmt;
  60. vaf.va = &args;
  61. btrfs_crit(root->fs_info,
  62. "corrupt %s: root=%llu block=%llu slot=%d, %pV",
  63. btrfs_header_level(eb) == 0 ? "leaf" : "node",
  64. root->objectid, btrfs_header_bytenr(eb), slot, &vaf);
  65. va_end(args);
  66. }
  67. /*
  68. * Customized reporter for extent data item, since its key objectid and
  69. * offset has its own meaning.
  70. */
  71. __printf(4, 5)
  72. static void file_extent_err(const struct btrfs_root *root,
  73. const struct extent_buffer *eb, int slot,
  74. const char *fmt, ...)
  75. {
  76. struct btrfs_key key;
  77. struct va_format vaf;
  78. va_list args;
  79. btrfs_item_key_to_cpu(eb, &key, slot);
  80. va_start(args, fmt);
  81. vaf.fmt = fmt;
  82. vaf.va = &args;
  83. btrfs_crit(root->fs_info,
  84. "corrupt %s: root=%llu block=%llu slot=%d ino=%llu file_offset=%llu, %pV",
  85. btrfs_header_level(eb) == 0 ? "leaf" : "node", root->objectid,
  86. btrfs_header_bytenr(eb), slot, key.objectid, key.offset, &vaf);
  87. va_end(args);
  88. }
  89. /*
  90. * Return 0 if the btrfs_file_extent_##name is aligned to @alignment
  91. * Else return 1
  92. */
  93. #define CHECK_FE_ALIGNED(root, leaf, slot, fi, name, alignment) \
  94. ({ \
  95. if (!IS_ALIGNED(btrfs_file_extent_##name((leaf), (fi)), (alignment))) \
  96. file_extent_err((root), (leaf), (slot), \
  97. "invalid %s for file extent, have %llu, should be aligned to %u", \
  98. (#name), btrfs_file_extent_##name((leaf), (fi)), \
  99. (alignment)); \
  100. (!IS_ALIGNED(btrfs_file_extent_##name((leaf), (fi)), (alignment))); \
  101. })
  102. static int check_extent_data_item(struct btrfs_root *root,
  103. struct extent_buffer *leaf,
  104. struct btrfs_key *key, int slot)
  105. {
  106. struct btrfs_file_extent_item *fi;
  107. u32 sectorsize = root->fs_info->sectorsize;
  108. u32 item_size = btrfs_item_size_nr(leaf, slot);
  109. if (!IS_ALIGNED(key->offset, sectorsize)) {
  110. file_extent_err(root, leaf, slot,
  111. "unaligned file_offset for file extent, have %llu should be aligned to %u",
  112. key->offset, sectorsize);
  113. return -EUCLEAN;
  114. }
  115. fi = btrfs_item_ptr(leaf, slot, struct btrfs_file_extent_item);
  116. if (btrfs_file_extent_type(leaf, fi) > BTRFS_FILE_EXTENT_TYPES) {
  117. file_extent_err(root, leaf, slot,
  118. "invalid type for file extent, have %u expect range [0, %u]",
  119. btrfs_file_extent_type(leaf, fi),
  120. BTRFS_FILE_EXTENT_TYPES);
  121. return -EUCLEAN;
  122. }
  123. /*
  124. * Support for new compression/encrption must introduce incompat flag,
  125. * and must be caught in open_ctree().
  126. */
  127. if (btrfs_file_extent_compression(leaf, fi) > BTRFS_COMPRESS_TYPES) {
  128. file_extent_err(root, leaf, slot,
  129. "invalid compression for file extent, have %u expect range [0, %u]",
  130. btrfs_file_extent_compression(leaf, fi),
  131. BTRFS_COMPRESS_TYPES);
  132. return -EUCLEAN;
  133. }
  134. if (btrfs_file_extent_encryption(leaf, fi)) {
  135. file_extent_err(root, leaf, slot,
  136. "invalid encryption for file extent, have %u expect 0",
  137. btrfs_file_extent_encryption(leaf, fi));
  138. return -EUCLEAN;
  139. }
  140. if (btrfs_file_extent_type(leaf, fi) == BTRFS_FILE_EXTENT_INLINE) {
  141. /* Inline extent must have 0 as key offset */
  142. if (key->offset) {
  143. file_extent_err(root, leaf, slot,
  144. "invalid file_offset for inline file extent, have %llu expect 0",
  145. key->offset);
  146. return -EUCLEAN;
  147. }
  148. /* Compressed inline extent has no on-disk size, skip it */
  149. if (btrfs_file_extent_compression(leaf, fi) !=
  150. BTRFS_COMPRESS_NONE)
  151. return 0;
  152. /* Uncompressed inline extent size must match item size */
  153. if (item_size != BTRFS_FILE_EXTENT_INLINE_DATA_START +
  154. btrfs_file_extent_ram_bytes(leaf, fi)) {
  155. file_extent_err(root, leaf, slot,
  156. "invalid ram_bytes for uncompressed inline extent, have %u expect %llu",
  157. item_size, BTRFS_FILE_EXTENT_INLINE_DATA_START +
  158. btrfs_file_extent_ram_bytes(leaf, fi));
  159. return -EUCLEAN;
  160. }
  161. return 0;
  162. }
  163. /* Regular or preallocated extent has fixed item size */
  164. if (item_size != sizeof(*fi)) {
  165. file_extent_err(root, leaf, slot,
  166. "invalid item size for reg/prealloc file extent, have %u expect %zu",
  167. item_size, sizeof(*fi));
  168. return -EUCLEAN;
  169. }
  170. if (CHECK_FE_ALIGNED(root, leaf, slot, fi, ram_bytes, sectorsize) ||
  171. CHECK_FE_ALIGNED(root, leaf, slot, fi, disk_bytenr, sectorsize) ||
  172. CHECK_FE_ALIGNED(root, leaf, slot, fi, disk_num_bytes, sectorsize) ||
  173. CHECK_FE_ALIGNED(root, leaf, slot, fi, offset, sectorsize) ||
  174. CHECK_FE_ALIGNED(root, leaf, slot, fi, num_bytes, sectorsize))
  175. return -EUCLEAN;
  176. return 0;
  177. }
  178. static int check_csum_item(struct btrfs_root *root, struct extent_buffer *leaf,
  179. struct btrfs_key *key, int slot)
  180. {
  181. u32 sectorsize = root->fs_info->sectorsize;
  182. u32 csumsize = btrfs_super_csum_size(root->fs_info->super_copy);
  183. if (key->objectid != BTRFS_EXTENT_CSUM_OBJECTID) {
  184. generic_err(root, leaf, slot,
  185. "invalid key objectid for csum item, have %llu expect %llu",
  186. key->objectid, BTRFS_EXTENT_CSUM_OBJECTID);
  187. return -EUCLEAN;
  188. }
  189. if (!IS_ALIGNED(key->offset, sectorsize)) {
  190. generic_err(root, leaf, slot,
  191. "unaligned key offset for csum item, have %llu should be aligned to %u",
  192. key->offset, sectorsize);
  193. return -EUCLEAN;
  194. }
  195. if (!IS_ALIGNED(btrfs_item_size_nr(leaf, slot), csumsize)) {
  196. generic_err(root, leaf, slot,
  197. "unaligned item size for csum item, have %u should be aligned to %u",
  198. btrfs_item_size_nr(leaf, slot), csumsize);
  199. return -EUCLEAN;
  200. }
  201. return 0;
  202. }
  203. /*
  204. * Customized reported for dir_item, only important new info is key->objectid,
  205. * which represents inode number
  206. */
  207. __printf(4, 5)
  208. static void dir_item_err(const struct btrfs_root *root,
  209. const struct extent_buffer *eb, int slot,
  210. const char *fmt, ...)
  211. {
  212. struct btrfs_key key;
  213. struct va_format vaf;
  214. va_list args;
  215. btrfs_item_key_to_cpu(eb, &key, slot);
  216. va_start(args, fmt);
  217. vaf.fmt = fmt;
  218. vaf.va = &args;
  219. btrfs_crit(root->fs_info,
  220. "corrupt %s: root=%llu block=%llu slot=%d ino=%llu, %pV",
  221. btrfs_header_level(eb) == 0 ? "leaf" : "node", root->objectid,
  222. btrfs_header_bytenr(eb), slot, key.objectid, &vaf);
  223. va_end(args);
  224. }
  225. static int check_dir_item(struct btrfs_root *root,
  226. struct extent_buffer *leaf,
  227. struct btrfs_key *key, int slot)
  228. {
  229. struct btrfs_dir_item *di;
  230. u32 item_size = btrfs_item_size_nr(leaf, slot);
  231. u32 cur = 0;
  232. di = btrfs_item_ptr(leaf, slot, struct btrfs_dir_item);
  233. while (cur < item_size) {
  234. u32 name_len;
  235. u32 data_len;
  236. u32 max_name_len;
  237. u32 total_size;
  238. u32 name_hash;
  239. u8 dir_type;
  240. /* header itself should not cross item boundary */
  241. if (cur + sizeof(*di) > item_size) {
  242. dir_item_err(root, leaf, slot,
  243. "dir item header crosses item boundary, have %zu boundary %u",
  244. cur + sizeof(*di), item_size);
  245. return -EUCLEAN;
  246. }
  247. /* dir type check */
  248. dir_type = btrfs_dir_type(leaf, di);
  249. if (dir_type >= BTRFS_FT_MAX) {
  250. dir_item_err(root, leaf, slot,
  251. "invalid dir item type, have %u expect [0, %u)",
  252. dir_type, BTRFS_FT_MAX);
  253. return -EUCLEAN;
  254. }
  255. if (key->type == BTRFS_XATTR_ITEM_KEY &&
  256. dir_type != BTRFS_FT_XATTR) {
  257. dir_item_err(root, leaf, slot,
  258. "invalid dir item type for XATTR key, have %u expect %u",
  259. dir_type, BTRFS_FT_XATTR);
  260. return -EUCLEAN;
  261. }
  262. if (dir_type == BTRFS_FT_XATTR &&
  263. key->type != BTRFS_XATTR_ITEM_KEY) {
  264. dir_item_err(root, leaf, slot,
  265. "xattr dir type found for non-XATTR key");
  266. return -EUCLEAN;
  267. }
  268. if (dir_type == BTRFS_FT_XATTR)
  269. max_name_len = XATTR_NAME_MAX;
  270. else
  271. max_name_len = BTRFS_NAME_LEN;
  272. /* Name/data length check */
  273. name_len = btrfs_dir_name_len(leaf, di);
  274. data_len = btrfs_dir_data_len(leaf, di);
  275. if (name_len > max_name_len) {
  276. dir_item_err(root, leaf, slot,
  277. "dir item name len too long, have %u max %u",
  278. name_len, max_name_len);
  279. return -EUCLEAN;
  280. }
  281. if (name_len + data_len > BTRFS_MAX_XATTR_SIZE(root->fs_info)) {
  282. dir_item_err(root, leaf, slot,
  283. "dir item name and data len too long, have %u max %u",
  284. name_len + data_len,
  285. BTRFS_MAX_XATTR_SIZE(root->fs_info));
  286. return -EUCLEAN;
  287. }
  288. if (data_len && dir_type != BTRFS_FT_XATTR) {
  289. dir_item_err(root, leaf, slot,
  290. "dir item with invalid data len, have %u expect 0",
  291. data_len);
  292. return -EUCLEAN;
  293. }
  294. total_size = sizeof(*di) + name_len + data_len;
  295. /* header and name/data should not cross item boundary */
  296. if (cur + total_size > item_size) {
  297. dir_item_err(root, leaf, slot,
  298. "dir item data crosses item boundary, have %u boundary %u",
  299. cur + total_size, item_size);
  300. return -EUCLEAN;
  301. }
  302. /*
  303. * Special check for XATTR/DIR_ITEM, as key->offset is name
  304. * hash, should match its name
  305. */
  306. if (key->type == BTRFS_DIR_ITEM_KEY ||
  307. key->type == BTRFS_XATTR_ITEM_KEY) {
  308. char namebuf[max(BTRFS_NAME_LEN, XATTR_NAME_MAX)];
  309. read_extent_buffer(leaf, namebuf,
  310. (unsigned long)(di + 1), name_len);
  311. name_hash = btrfs_name_hash(namebuf, name_len);
  312. if (key->offset != name_hash) {
  313. dir_item_err(root, leaf, slot,
  314. "name hash mismatch with key, have 0x%016x expect 0x%016llx",
  315. name_hash, key->offset);
  316. return -EUCLEAN;
  317. }
  318. }
  319. cur += total_size;
  320. di = (struct btrfs_dir_item *)((void *)di + total_size);
  321. }
  322. return 0;
  323. }
  324. /*
  325. * Common point to switch the item-specific validation.
  326. */
  327. static int check_leaf_item(struct btrfs_root *root,
  328. struct extent_buffer *leaf,
  329. struct btrfs_key *key, int slot)
  330. {
  331. int ret = 0;
  332. switch (key->type) {
  333. case BTRFS_EXTENT_DATA_KEY:
  334. ret = check_extent_data_item(root, leaf, key, slot);
  335. break;
  336. case BTRFS_EXTENT_CSUM_KEY:
  337. ret = check_csum_item(root, leaf, key, slot);
  338. break;
  339. case BTRFS_DIR_ITEM_KEY:
  340. case BTRFS_DIR_INDEX_KEY:
  341. case BTRFS_XATTR_ITEM_KEY:
  342. ret = check_dir_item(root, leaf, key, slot);
  343. break;
  344. }
  345. return ret;
  346. }
  347. static int check_leaf(struct btrfs_root *root, struct extent_buffer *leaf,
  348. bool check_item_data)
  349. {
  350. struct btrfs_fs_info *fs_info = root->fs_info;
  351. /* No valid key type is 0, so all key should be larger than this key */
  352. struct btrfs_key prev_key = {0, 0, 0};
  353. struct btrfs_key key;
  354. u32 nritems = btrfs_header_nritems(leaf);
  355. int slot;
  356. /*
  357. * Extent buffers from a relocation tree have a owner field that
  358. * corresponds to the subvolume tree they are based on. So just from an
  359. * extent buffer alone we can not find out what is the id of the
  360. * corresponding subvolume tree, so we can not figure out if the extent
  361. * buffer corresponds to the root of the relocation tree or not. So
  362. * skip this check for relocation trees.
  363. */
  364. if (nritems == 0 && !btrfs_header_flag(leaf, BTRFS_HEADER_FLAG_RELOC)) {
  365. struct btrfs_root *check_root;
  366. key.objectid = btrfs_header_owner(leaf);
  367. key.type = BTRFS_ROOT_ITEM_KEY;
  368. key.offset = (u64)-1;
  369. check_root = btrfs_get_fs_root(fs_info, &key, false);
  370. /*
  371. * The only reason we also check NULL here is that during
  372. * open_ctree() some roots has not yet been set up.
  373. */
  374. if (!IS_ERR_OR_NULL(check_root)) {
  375. struct extent_buffer *eb;
  376. eb = btrfs_root_node(check_root);
  377. /* if leaf is the root, then it's fine */
  378. if (leaf != eb) {
  379. generic_err(check_root, leaf, 0,
  380. "invalid nritems, have %u should not be 0 for non-root leaf",
  381. nritems);
  382. free_extent_buffer(eb);
  383. return -EUCLEAN;
  384. }
  385. free_extent_buffer(eb);
  386. }
  387. return 0;
  388. }
  389. if (nritems == 0)
  390. return 0;
  391. /*
  392. * Check the following things to make sure this is a good leaf, and
  393. * leaf users won't need to bother with similar sanity checks:
  394. *
  395. * 1) key ordering
  396. * 2) item offset and size
  397. * No overlap, no hole, all inside the leaf.
  398. * 3) item content
  399. * If possible, do comprehensive sanity check.
  400. * NOTE: All checks must only rely on the item data itself.
  401. */
  402. for (slot = 0; slot < nritems; slot++) {
  403. u32 item_end_expected;
  404. int ret;
  405. btrfs_item_key_to_cpu(leaf, &key, slot);
  406. /* Make sure the keys are in the right order */
  407. if (btrfs_comp_cpu_keys(&prev_key, &key) >= 0) {
  408. generic_err(root, leaf, slot,
  409. "bad key order, prev (%llu %u %llu) current (%llu %u %llu)",
  410. prev_key.objectid, prev_key.type,
  411. prev_key.offset, key.objectid, key.type,
  412. key.offset);
  413. return -EUCLEAN;
  414. }
  415. /*
  416. * Make sure the offset and ends are right, remember that the
  417. * item data starts at the end of the leaf and grows towards the
  418. * front.
  419. */
  420. if (slot == 0)
  421. item_end_expected = BTRFS_LEAF_DATA_SIZE(fs_info);
  422. else
  423. item_end_expected = btrfs_item_offset_nr(leaf,
  424. slot - 1);
  425. if (btrfs_item_end_nr(leaf, slot) != item_end_expected) {
  426. generic_err(root, leaf, slot,
  427. "unexpected item end, have %u expect %u",
  428. btrfs_item_end_nr(leaf, slot),
  429. item_end_expected);
  430. return -EUCLEAN;
  431. }
  432. /*
  433. * Check to make sure that we don't point outside of the leaf,
  434. * just in case all the items are consistent to each other, but
  435. * all point outside of the leaf.
  436. */
  437. if (btrfs_item_end_nr(leaf, slot) >
  438. BTRFS_LEAF_DATA_SIZE(fs_info)) {
  439. generic_err(root, leaf, slot,
  440. "slot end outside of leaf, have %u expect range [0, %u]",
  441. btrfs_item_end_nr(leaf, slot),
  442. BTRFS_LEAF_DATA_SIZE(fs_info));
  443. return -EUCLEAN;
  444. }
  445. /* Also check if the item pointer overlaps with btrfs item. */
  446. if (btrfs_item_nr_offset(slot) + sizeof(struct btrfs_item) >
  447. btrfs_item_ptr_offset(leaf, slot)) {
  448. generic_err(root, leaf, slot,
  449. "slot overlaps with its data, item end %lu data start %lu",
  450. btrfs_item_nr_offset(slot) +
  451. sizeof(struct btrfs_item),
  452. btrfs_item_ptr_offset(leaf, slot));
  453. return -EUCLEAN;
  454. }
  455. if (check_item_data) {
  456. /*
  457. * Check if the item size and content meet other
  458. * criteria
  459. */
  460. ret = check_leaf_item(root, leaf, &key, slot);
  461. if (ret < 0)
  462. return ret;
  463. }
  464. prev_key.objectid = key.objectid;
  465. prev_key.type = key.type;
  466. prev_key.offset = key.offset;
  467. }
  468. return 0;
  469. }
  470. int btrfs_check_leaf_full(struct btrfs_root *root, struct extent_buffer *leaf)
  471. {
  472. return check_leaf(root, leaf, true);
  473. }
  474. int btrfs_check_leaf_relaxed(struct btrfs_root *root,
  475. struct extent_buffer *leaf)
  476. {
  477. return check_leaf(root, leaf, false);
  478. }
  479. int btrfs_check_node(struct btrfs_root *root, struct extent_buffer *node)
  480. {
  481. unsigned long nr = btrfs_header_nritems(node);
  482. struct btrfs_key key, next_key;
  483. int slot;
  484. u64 bytenr;
  485. int ret = 0;
  486. if (nr == 0 || nr > BTRFS_NODEPTRS_PER_BLOCK(root->fs_info)) {
  487. btrfs_crit(root->fs_info,
  488. "corrupt node: root=%llu block=%llu, nritems too %s, have %lu expect range [1,%u]",
  489. root->objectid, node->start,
  490. nr == 0 ? "small" : "large", nr,
  491. BTRFS_NODEPTRS_PER_BLOCK(root->fs_info));
  492. return -EUCLEAN;
  493. }
  494. for (slot = 0; slot < nr - 1; slot++) {
  495. bytenr = btrfs_node_blockptr(node, slot);
  496. btrfs_node_key_to_cpu(node, &key, slot);
  497. btrfs_node_key_to_cpu(node, &next_key, slot + 1);
  498. if (!bytenr) {
  499. generic_err(root, node, slot,
  500. "invalid NULL node pointer");
  501. ret = -EUCLEAN;
  502. goto out;
  503. }
  504. if (!IS_ALIGNED(bytenr, root->fs_info->sectorsize)) {
  505. generic_err(root, node, slot,
  506. "unaligned pointer, have %llu should be aligned to %u",
  507. bytenr, root->fs_info->sectorsize);
  508. ret = -EUCLEAN;
  509. goto out;
  510. }
  511. if (btrfs_comp_cpu_keys(&key, &next_key) >= 0) {
  512. generic_err(root, node, slot,
  513. "bad key order, current (%llu %u %llu) next (%llu %u %llu)",
  514. key.objectid, key.type, key.offset,
  515. next_key.objectid, next_key.type,
  516. next_key.offset);
  517. ret = -EUCLEAN;
  518. goto out;
  519. }
  520. }
  521. out:
  522. return ret;
  523. }