debug.c 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563
  1. /*
  2. * Assorted bcache debug code
  3. *
  4. * Copyright 2010, 2011 Kent Overstreet <kent.overstreet@gmail.com>
  5. * Copyright 2012 Google, Inc.
  6. */
  7. #include "bcache.h"
  8. #include "btree.h"
  9. #include "debug.h"
  10. #include "request.h"
  11. #include <linux/console.h>
  12. #include <linux/debugfs.h>
  13. #include <linux/module.h>
  14. #include <linux/random.h>
  15. #include <linux/seq_file.h>
  16. static struct dentry *debug;
  17. const char *bch_ptr_status(struct cache_set *c, const struct bkey *k)
  18. {
  19. unsigned i;
  20. for (i = 0; i < KEY_PTRS(k); i++)
  21. if (ptr_available(c, k, i)) {
  22. struct cache *ca = PTR_CACHE(c, k, i);
  23. size_t bucket = PTR_BUCKET_NR(c, k, i);
  24. size_t r = bucket_remainder(c, PTR_OFFSET(k, i));
  25. if (KEY_SIZE(k) + r > c->sb.bucket_size)
  26. return "bad, length too big";
  27. if (bucket < ca->sb.first_bucket)
  28. return "bad, short offset";
  29. if (bucket >= ca->sb.nbuckets)
  30. return "bad, offset past end of device";
  31. if (ptr_stale(c, k, i))
  32. return "stale";
  33. }
  34. if (!bkey_cmp(k, &ZERO_KEY))
  35. return "bad, null key";
  36. if (!KEY_PTRS(k))
  37. return "bad, no pointers";
  38. if (!KEY_SIZE(k))
  39. return "zeroed key";
  40. return "";
  41. }
  42. struct keyprint_hack bch_pkey(const struct bkey *k)
  43. {
  44. unsigned i = 0;
  45. struct keyprint_hack r;
  46. char *out = r.s, *end = r.s + KEYHACK_SIZE;
  47. #define p(...) (out += scnprintf(out, end - out, __VA_ARGS__))
  48. p("%llu:%llu len %llu -> [", KEY_INODE(k), KEY_OFFSET(k), KEY_SIZE(k));
  49. if (KEY_PTRS(k))
  50. while (1) {
  51. p("%llu:%llu gen %llu",
  52. PTR_DEV(k, i), PTR_OFFSET(k, i), PTR_GEN(k, i));
  53. if (++i == KEY_PTRS(k))
  54. break;
  55. p(", ");
  56. }
  57. p("]");
  58. if (KEY_DIRTY(k))
  59. p(" dirty");
  60. if (KEY_CSUM(k))
  61. p(" cs%llu %llx", KEY_CSUM(k), k->ptr[1]);
  62. #undef p
  63. return r;
  64. }
  65. struct keyprint_hack bch_pbtree(const struct btree *b)
  66. {
  67. struct keyprint_hack r;
  68. snprintf(r.s, 40, "%li level %i/%i", PTR_BUCKET_NR(b->c, &b->key, 0),
  69. b->level, b->c->root ? b->c->root->level : -1);
  70. return r;
  71. }
  72. #if defined(CONFIG_BCACHE_DEBUG) || defined(CONFIG_BCACHE_EDEBUG)
  73. static bool skipped_backwards(struct btree *b, struct bkey *k)
  74. {
  75. return bkey_cmp(k, (!b->level)
  76. ? &START_KEY(bkey_next(k))
  77. : bkey_next(k)) > 0;
  78. }
  79. static void dump_bset(struct btree *b, struct bset *i)
  80. {
  81. struct bkey *k;
  82. unsigned j;
  83. for (k = i->start; k < end(i); k = bkey_next(k)) {
  84. printk(KERN_ERR "block %zu key %zi/%u: %s", index(i, b),
  85. (uint64_t *) k - i->d, i->keys, pkey(k));
  86. for (j = 0; j < KEY_PTRS(k); j++) {
  87. size_t n = PTR_BUCKET_NR(b->c, k, j);
  88. printk(" bucket %zu", n);
  89. if (n >= b->c->sb.first_bucket && n < b->c->sb.nbuckets)
  90. printk(" prio %i",
  91. PTR_BUCKET(b->c, k, j)->prio);
  92. }
  93. printk(" %s\n", bch_ptr_status(b->c, k));
  94. if (bkey_next(k) < end(i) &&
  95. skipped_backwards(b, k))
  96. printk(KERN_ERR "Key skipped backwards\n");
  97. }
  98. }
  99. #endif
  100. #ifdef CONFIG_BCACHE_DEBUG
  101. void bch_btree_verify(struct btree *b, struct bset *new)
  102. {
  103. struct btree *v = b->c->verify_data;
  104. struct closure cl;
  105. closure_init_stack(&cl);
  106. if (!b->c->verify)
  107. return;
  108. closure_wait_event(&b->io.wait, &cl,
  109. atomic_read(&b->io.cl.remaining) == -1);
  110. mutex_lock(&b->c->verify_lock);
  111. bkey_copy(&v->key, &b->key);
  112. v->written = 0;
  113. v->level = b->level;
  114. bch_btree_read(v);
  115. closure_wait_event(&v->io.wait, &cl,
  116. atomic_read(&b->io.cl.remaining) == -1);
  117. if (new->keys != v->sets[0].data->keys ||
  118. memcmp(new->start,
  119. v->sets[0].data->start,
  120. (void *) end(new) - (void *) new->start)) {
  121. unsigned i, j;
  122. console_lock();
  123. printk(KERN_ERR "*** original memory node:\n");
  124. for (i = 0; i <= b->nsets; i++)
  125. dump_bset(b, b->sets[i].data);
  126. printk(KERN_ERR "*** sorted memory node:\n");
  127. dump_bset(b, new);
  128. printk(KERN_ERR "*** on disk node:\n");
  129. dump_bset(v, v->sets[0].data);
  130. for (j = 0; j < new->keys; j++)
  131. if (new->d[j] != v->sets[0].data->d[j])
  132. break;
  133. console_unlock();
  134. panic("verify failed at %u\n", j);
  135. }
  136. mutex_unlock(&b->c->verify_lock);
  137. }
  138. static void data_verify_endio(struct bio *bio, int error)
  139. {
  140. struct closure *cl = bio->bi_private;
  141. closure_put(cl);
  142. }
  143. void bch_data_verify(struct search *s)
  144. {
  145. char name[BDEVNAME_SIZE];
  146. struct cached_dev *dc = container_of(s->d, struct cached_dev, disk);
  147. struct closure *cl = &s->cl;
  148. struct bio *check;
  149. struct bio_vec *bv;
  150. int i;
  151. if (!s->unaligned_bvec)
  152. bio_for_each_segment(bv, s->orig_bio, i)
  153. bv->bv_offset = 0, bv->bv_len = PAGE_SIZE;
  154. check = bio_clone(s->orig_bio, GFP_NOIO);
  155. if (!check)
  156. return;
  157. if (bio_alloc_pages(check, GFP_NOIO))
  158. goto out_put;
  159. check->bi_rw = READ_SYNC;
  160. check->bi_private = cl;
  161. check->bi_end_io = data_verify_endio;
  162. closure_bio_submit(check, cl, &dc->disk);
  163. closure_sync(cl);
  164. bio_for_each_segment(bv, s->orig_bio, i) {
  165. void *p1 = kmap(bv->bv_page);
  166. void *p2 = kmap(check->bi_io_vec[i].bv_page);
  167. if (memcmp(p1 + bv->bv_offset,
  168. p2 + bv->bv_offset,
  169. bv->bv_len))
  170. printk(KERN_ERR
  171. "bcache (%s): verify failed at sector %llu\n",
  172. bdevname(dc->bdev, name),
  173. (uint64_t) s->orig_bio->bi_sector);
  174. kunmap(bv->bv_page);
  175. kunmap(check->bi_io_vec[i].bv_page);
  176. }
  177. __bio_for_each_segment(bv, check, i, 0)
  178. __free_page(bv->bv_page);
  179. out_put:
  180. bio_put(check);
  181. }
  182. #endif
  183. #ifdef CONFIG_BCACHE_EDEBUG
  184. unsigned bch_count_data(struct btree *b)
  185. {
  186. unsigned ret = 0;
  187. struct btree_iter iter;
  188. struct bkey *k;
  189. if (!b->level)
  190. for_each_key(b, k, &iter)
  191. ret += KEY_SIZE(k);
  192. return ret;
  193. }
  194. static void vdump_bucket_and_panic(struct btree *b, const char *fmt,
  195. va_list args)
  196. {
  197. unsigned i;
  198. console_lock();
  199. for (i = 0; i <= b->nsets; i++)
  200. dump_bset(b, b->sets[i].data);
  201. vprintk(fmt, args);
  202. console_unlock();
  203. panic("at %s\n", pbtree(b));
  204. }
  205. void bch_check_key_order_msg(struct btree *b, struct bset *i,
  206. const char *fmt, ...)
  207. {
  208. struct bkey *k;
  209. if (!i->keys)
  210. return;
  211. for (k = i->start; bkey_next(k) < end(i); k = bkey_next(k))
  212. if (skipped_backwards(b, k)) {
  213. va_list args;
  214. va_start(args, fmt);
  215. vdump_bucket_and_panic(b, fmt, args);
  216. va_end(args);
  217. }
  218. }
  219. void bch_check_keys(struct btree *b, const char *fmt, ...)
  220. {
  221. va_list args;
  222. struct bkey *k, *p = NULL;
  223. struct btree_iter iter;
  224. if (b->level)
  225. return;
  226. for_each_key(b, k, &iter) {
  227. if (p && bkey_cmp(&START_KEY(p), &START_KEY(k)) > 0) {
  228. printk(KERN_ERR "Keys out of order:\n");
  229. goto bug;
  230. }
  231. if (bch_ptr_invalid(b, k))
  232. continue;
  233. if (p && bkey_cmp(p, &START_KEY(k)) > 0) {
  234. printk(KERN_ERR "Overlapping keys:\n");
  235. goto bug;
  236. }
  237. p = k;
  238. }
  239. return;
  240. bug:
  241. va_start(args, fmt);
  242. vdump_bucket_and_panic(b, fmt, args);
  243. va_end(args);
  244. }
  245. #endif
  246. #ifdef CONFIG_DEBUG_FS
  247. /* XXX: cache set refcounting */
  248. struct dump_iterator {
  249. char buf[PAGE_SIZE];
  250. size_t bytes;
  251. struct cache_set *c;
  252. struct keybuf keys;
  253. };
  254. static bool dump_pred(struct keybuf *buf, struct bkey *k)
  255. {
  256. return true;
  257. }
  258. static ssize_t bch_dump_read(struct file *file, char __user *buf,
  259. size_t size, loff_t *ppos)
  260. {
  261. struct dump_iterator *i = file->private_data;
  262. ssize_t ret = 0;
  263. while (size) {
  264. struct keybuf_key *w;
  265. unsigned bytes = min(i->bytes, size);
  266. int err = copy_to_user(buf, i->buf, bytes);
  267. if (err)
  268. return err;
  269. ret += bytes;
  270. buf += bytes;
  271. size -= bytes;
  272. i->bytes -= bytes;
  273. memmove(i->buf, i->buf + bytes, i->bytes);
  274. if (i->bytes)
  275. break;
  276. w = bch_keybuf_next_rescan(i->c, &i->keys, &MAX_KEY);
  277. if (!w)
  278. break;
  279. i->bytes = snprintf(i->buf, PAGE_SIZE, "%s\n", pkey(&w->key));
  280. bch_keybuf_del(&i->keys, w);
  281. }
  282. return ret;
  283. }
  284. static int bch_dump_open(struct inode *inode, struct file *file)
  285. {
  286. struct cache_set *c = inode->i_private;
  287. struct dump_iterator *i;
  288. i = kzalloc(sizeof(struct dump_iterator), GFP_KERNEL);
  289. if (!i)
  290. return -ENOMEM;
  291. file->private_data = i;
  292. i->c = c;
  293. bch_keybuf_init(&i->keys, dump_pred);
  294. i->keys.last_scanned = KEY(0, 0, 0);
  295. return 0;
  296. }
  297. static int bch_dump_release(struct inode *inode, struct file *file)
  298. {
  299. kfree(file->private_data);
  300. return 0;
  301. }
  302. static const struct file_operations cache_set_debug_ops = {
  303. .owner = THIS_MODULE,
  304. .open = bch_dump_open,
  305. .read = bch_dump_read,
  306. .release = bch_dump_release
  307. };
  308. void bch_debug_init_cache_set(struct cache_set *c)
  309. {
  310. if (!IS_ERR_OR_NULL(debug)) {
  311. char name[50];
  312. snprintf(name, 50, "bcache-%pU", c->sb.set_uuid);
  313. c->debug = debugfs_create_file(name, 0400, debug, c,
  314. &cache_set_debug_ops);
  315. }
  316. }
  317. #endif
  318. #ifdef CONFIG_BCACHE_DEBUG
  319. static ssize_t btree_fuzz(struct kobject *k, struct kobj_attribute *a,
  320. const char *buffer, size_t size)
  321. {
  322. void dump(struct btree *b)
  323. {
  324. struct bset *i;
  325. for (i = b->sets[0].data;
  326. index(i, b) < btree_blocks(b) &&
  327. i->seq == b->sets[0].data->seq;
  328. i = ((void *) i) + set_blocks(i, b->c) * block_bytes(b->c))
  329. dump_bset(b, i);
  330. }
  331. struct cache_sb *sb;
  332. struct cache_set *c;
  333. struct btree *all[3], *b, *fill, *orig;
  334. int j;
  335. struct btree_op op;
  336. bch_btree_op_init_stack(&op);
  337. sb = kzalloc(sizeof(struct cache_sb), GFP_KERNEL);
  338. if (!sb)
  339. return -ENOMEM;
  340. sb->bucket_size = 128;
  341. sb->block_size = 4;
  342. c = bch_cache_set_alloc(sb);
  343. if (!c)
  344. return -ENOMEM;
  345. for (j = 0; j < 3; j++) {
  346. BUG_ON(list_empty(&c->btree_cache));
  347. all[j] = list_first_entry(&c->btree_cache, struct btree, list);
  348. list_del_init(&all[j]->list);
  349. all[j]->key = KEY(0, 0, c->sb.bucket_size);
  350. bkey_copy_key(&all[j]->key, &MAX_KEY);
  351. }
  352. b = all[0];
  353. fill = all[1];
  354. orig = all[2];
  355. while (1) {
  356. for (j = 0; j < 3; j++)
  357. all[j]->written = all[j]->nsets = 0;
  358. bch_bset_init_next(b);
  359. while (1) {
  360. struct bset *i = write_block(b);
  361. struct bkey *k = op.keys.top;
  362. unsigned rand;
  363. bkey_init(k);
  364. rand = get_random_int();
  365. op.type = rand & 1
  366. ? BTREE_INSERT
  367. : BTREE_REPLACE;
  368. rand >>= 1;
  369. SET_KEY_SIZE(k, bucket_remainder(c, rand));
  370. rand >>= c->bucket_bits;
  371. rand &= 1024 * 512 - 1;
  372. rand += c->sb.bucket_size;
  373. SET_KEY_OFFSET(k, rand);
  374. #if 0
  375. SET_KEY_PTRS(k, 1);
  376. #endif
  377. bch_keylist_push(&op.keys);
  378. bch_btree_insert_keys(b, &op);
  379. if (should_split(b) ||
  380. set_blocks(i, b->c) !=
  381. __set_blocks(i, i->keys + 15, b->c)) {
  382. i->csum = csum_set(i);
  383. memcpy(write_block(fill),
  384. i, set_bytes(i));
  385. b->written += set_blocks(i, b->c);
  386. fill->written = b->written;
  387. if (b->written == btree_blocks(b))
  388. break;
  389. bch_btree_sort_lazy(b);
  390. bch_bset_init_next(b);
  391. }
  392. }
  393. memcpy(orig->sets[0].data,
  394. fill->sets[0].data,
  395. btree_bytes(c));
  396. bch_btree_sort(b);
  397. fill->written = 0;
  398. bch_btree_read_done(&fill->io.cl);
  399. if (b->sets[0].data->keys != fill->sets[0].data->keys ||
  400. memcmp(b->sets[0].data->start,
  401. fill->sets[0].data->start,
  402. b->sets[0].data->keys * sizeof(uint64_t))) {
  403. struct bset *i = b->sets[0].data;
  404. struct bkey *k, *l;
  405. for (k = i->start,
  406. l = fill->sets[0].data->start;
  407. k < end(i);
  408. k = bkey_next(k), l = bkey_next(l))
  409. if (bkey_cmp(k, l) ||
  410. KEY_SIZE(k) != KEY_SIZE(l))
  411. pr_err("key %zi differs: %s != %s",
  412. (uint64_t *) k - i->d,
  413. pkey(k), pkey(l));
  414. for (j = 0; j < 3; j++) {
  415. pr_err("**** Set %i ****", j);
  416. dump(all[j]);
  417. }
  418. panic("\n");
  419. }
  420. pr_info("fuzz complete: %i keys", b->sets[0].data->keys);
  421. }
  422. }
  423. kobj_attribute_write(fuzz, btree_fuzz);
  424. #endif
  425. void bch_debug_exit(void)
  426. {
  427. if (!IS_ERR_OR_NULL(debug))
  428. debugfs_remove_recursive(debug);
  429. }
  430. int __init bch_debug_init(struct kobject *kobj)
  431. {
  432. int ret = 0;
  433. #ifdef CONFIG_BCACHE_DEBUG
  434. ret = sysfs_create_file(kobj, &ksysfs_fuzz.attr);
  435. if (ret)
  436. return ret;
  437. #endif
  438. debug = debugfs_create_dir("bcache", NULL);
  439. return ret;
  440. }