- /*
- * Assorted bcache debug code
- *
- * Copyright 2010, 2011 Kent Overstreet <kent.overstreet@gmail.com>
- * Copyright 2012 Google, Inc.
- */
- #include "bcache.h"
- #include "btree.h"
- #include "debug.h"
- #include "request.h"
- #include <linux/console.h>
- #include <linux/debugfs.h>
- #include <linux/module.h>
- #include <linux/random.h>
- #include <linux/seq_file.h>
- static struct dentry *debug;
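- /*
- * Returns a short status string describing why a key looks suspect
- * ("bad, length too big", "stale", ...) or "" if it passes the checks.
- */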
- const char *bch_ptr_status(struct cache_set *c, const struct bkey *k)
- {
- unsigned i;
- for (i = 0; i < KEY_PTRS(k); i++)
- if (ptr_available(c, k, i)) {
- struct cache *ca = PTR_CACHE(c, k, i);
- size_t bucket = PTR_BUCKET_NR(c, k, i);
- size_t r = bucket_remainder(c, PTR_OFFSET(k, i));
- if (KEY_SIZE(k) + r > c->sb.bucket_size)
- return "bad, length too big";
- if (bucket < ca->sb.first_bucket)
- return "bad, short offset";
- if (bucket >= ca->sb.nbuckets)
- return "bad, offset past end of device";
- if (ptr_stale(c, k, i))
- return "stale";
- }
- if (!bkey_cmp(k, &ZERO_KEY))
- return "bad, null key";
- if (!KEY_PTRS(k))
- return "bad, no pointers";
- if (!KEY_SIZE(k))
- return "zeroed key";
- return "";
- }
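- /* Formats a bkey (inode:offset, size, pointers, flags) into r.s for debug output. */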
- struct keyprint_hack bch_pkey(const struct bkey *k)
- {
- unsigned i = 0;
- struct keyprint_hack r;
- char *out = r.s, *end = r.s + KEYHACK_SIZE;
- #define p(...) (out += scnprintf(out, end - out, __VA_ARGS__))
- p("%llu:%llu len %llu -> [", KEY_INODE(k), KEY_OFFSET(k), KEY_SIZE(k));
- if (KEY_PTRS(k))
- while (1) {
- p("%llu:%llu gen %llu",
- PTR_DEV(k, i), PTR_OFFSET(k, i), PTR_GEN(k, i));
- if (++i == KEY_PTRS(k))
- break;
- p(", ");
- }
- p("]");
- if (KEY_DIRTY(k))
- p(" dirty");
- if (KEY_CSUM(k))
- p(" cs%llu %llx", KEY_CSUM(k), k->ptr[1]);
- #undef p
- return r;
- }
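- /* Formats a btree node's first bucket number and its level versus the root's level. */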
- struct keyprint_hack bch_pbtree(const struct btree *b)
- {
- struct keyprint_hack r;
- snprintf(r.s, 40, "%li level %i/%i", PTR_BUCKET_NR(b->c, &b->key, 0),
- b->level, b->c->root ? b->c->root->level : -1);
- return r;
- }
- #if defined(CONFIG_BCACHE_DEBUG) || defined(CONFIG_BCACHE_EDEBUG)
- static bool skipped_backwards(struct btree *b, struct bkey *k)
- {
- return bkey_cmp(k, (!b->level)
- ? &START_KEY(bkey_next(k))
- : bkey_next(k)) > 0;
- }
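- /*
- * Prints each key in the bset with its bucket numbers (and priorities for
- * in-range buckets) plus its pointer status, and reports any key that sorts
- * after its successor.
- */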
- static void dump_bset(struct btree *b, struct bset *i)
- {
- struct bkey *k;
- unsigned j;
- for (k = i->start; k < end(i); k = bkey_next(k)) {
- printk(KERN_ERR "block %zu key %zi/%u: %s", index(i, b),
- (uint64_t *) k - i->d, i->keys, pkey(k));
- for (j = 0; j < KEY_PTRS(k); j++) {
- size_t n = PTR_BUCKET_NR(b->c, k, j);
- printk(" bucket %zu", n);
- if (n >= b->c->sb.first_bucket && n < b->c->sb.nbuckets)
- printk(" prio %i",
- PTR_BUCKET(b->c, k, j)->prio);
- }
- printk(" %s\n", bch_ptr_status(b->c, k));
- if (bkey_next(k) < end(i) &&
- skipped_backwards(b, k))
- printk(KERN_ERR "Key skipped backwards\n");
- }
- }
- #endif
- #ifdef CONFIG_BCACHE_DEBUG
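- /*
- * Waits for outstanding I/O on the node, re-reads it from disk into
- * c->verify_data, and compares the on-disk keys against the freshly sorted
- * in-memory bset; on mismatch it dumps all three versions and panics.
- */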
- void bch_btree_verify(struct btree *b, struct bset *new)
- {
- struct btree *v = b->c->verify_data;
- struct closure cl;
- closure_init_stack(&cl);
- if (!b->c->verify)
- return;
- closure_wait_event(&b->io.wait, &cl,
- atomic_read(&b->io.cl.remaining) == -1);
- mutex_lock(&b->c->verify_lock);
- bkey_copy(&v->key, &b->key);
- v->written = 0;
- v->level = b->level;
- bch_btree_read(v);
- closure_wait_event(&v->io.wait, &cl,
- atomic_read(&v->io.cl.remaining) == -1);
- if (new->keys != v->sets[0].data->keys ||
- memcmp(new->start,
- v->sets[0].data->start,
- (void *) end(new) - (void *) new->start)) {
- unsigned i, j;
- console_lock();
- printk(KERN_ERR "*** original memory node:\n");
- for (i = 0; i <= b->nsets; i++)
- dump_bset(b, b->sets[i].data);
- printk(KERN_ERR "*** sorted memory node:\n");
- dump_bset(b, new);
- printk(KERN_ERR "*** on disk node:\n");
- dump_bset(v, v->sets[0].data);
- for (j = 0; j < new->keys; j++)
- if (new->d[j] != v->sets[0].data->d[j])
- break;
- console_unlock();
- panic("verify failed at %u\n", j);
- }
- mutex_unlock(&b->c->verify_lock);
- }
- static void data_verify_endio(struct bio *bio, int error)
- {
- struct closure *cl = bio->bi_private;
- closure_put(cl);
- }
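- /*
- * Re-issues the original read as a cloned bio and compares the returned
- * pages against what was handed to the caller, logging the sector of any
- * mismatch.
- */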
- void bch_data_verify(struct search *s)
- {
- char name[BDEVNAME_SIZE];
- struct cached_dev *dc = container_of(s->d, struct cached_dev, disk);
- struct closure *cl = &s->cl;
- struct bio *check;
- struct bio_vec *bv;
- int i;
- if (!s->unaligned_bvec)
- bio_for_each_segment(bv, s->orig_bio, i)
- bv->bv_offset = 0, bv->bv_len = PAGE_SIZE;
- check = bio_clone(s->orig_bio, GFP_NOIO);
- if (!check)
- return;
- if (bio_alloc_pages(check, GFP_NOIO))
- goto out_put;
- check->bi_rw = READ_SYNC;
- check->bi_private = cl;
- check->bi_end_io = data_verify_endio;
- closure_bio_submit(check, cl, &dc->disk);
- closure_sync(cl);
- bio_for_each_segment(bv, s->orig_bio, i) {
- void *p1 = kmap(bv->bv_page);
- void *p2 = kmap(check->bi_io_vec[i].bv_page);
- if (memcmp(p1 + bv->bv_offset,
- p2 + bv->bv_offset,
- bv->bv_len))
- printk(KERN_ERR
- "bcache (%s): verify failed at sector %llu\n",
- bdevname(dc->bdev, name),
- (uint64_t) s->orig_bio->bi_sector);
- kunmap(bv->bv_page);
- kunmap(check->bi_io_vec[i].bv_page);
- }
- __bio_for_each_segment(bv, check, i, 0)
- __free_page(bv->bv_page);
- out_put:
- bio_put(check);
- }
- #endif
- #ifdef CONFIG_BCACHE_EDEBUG
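- /* Sums KEY_SIZE() over every key in a leaf node; returns 0 for internal nodes. */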
- unsigned bch_count_data(struct btree *b)
- {
- unsigned ret = 0;
- struct btree_iter iter;
- struct bkey *k;
- if (!b->level)
- for_each_key(b, k, &iter)
- ret += KEY_SIZE(k);
- return ret;
- }
- static void vdump_bucket_and_panic(struct btree *b, const char *fmt,
- va_list args)
- {
- unsigned i;
- console_lock();
- for (i = 0; i <= b->nsets; i++)
- dump_bset(b, b->sets[i].data);
- vprintk(fmt, args);
- console_unlock();
- panic("at %s\n", pbtree(b));
- }
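- /* Panics, after dumping the node, if any key in the bset sorts after its successor. */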
- void bch_check_key_order_msg(struct btree *b, struct bset *i,
- const char *fmt, ...)
- {
- struct bkey *k;
- if (!i->keys)
- return;
- for (k = i->start; bkey_next(k) < end(i); k = bkey_next(k))
- if (skipped_backwards(b, k)) {
- va_list args;
- va_start(args, fmt);
- vdump_bucket_and_panic(b, fmt, args);
- va_end(args);
- }
- }
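- /* For leaf nodes, panics if iterated keys are out of order or if valid keys overlap. */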
- void bch_check_keys(struct btree *b, const char *fmt, ...)
- {
- va_list args;
- struct bkey *k, *p = NULL;
- struct btree_iter iter;
- if (b->level)
- return;
- for_each_key(b, k, &iter) {
- if (p && bkey_cmp(&START_KEY(p), &START_KEY(k)) > 0) {
- printk(KERN_ERR "Keys out of order:\n");
- goto bug;
- }
- if (bch_ptr_invalid(b, k))
- continue;
- if (p && bkey_cmp(p, &START_KEY(k)) > 0) {
- printk(KERN_ERR "Overlapping keys:\n");
- goto bug;
- }
- p = k;
- }
- return;
- bug:
- va_start(args, fmt);
- vdump_bucket_and_panic(b, fmt, args);
- va_end(args);
- }
- #endif
- #ifdef CONFIG_DEBUG_FS
- /* XXX: cache set refcounting */
- struct dump_iterator {
- char buf[PAGE_SIZE];
- size_t bytes;
- struct cache_set *c;
- struct keybuf keys;
- };
- static bool dump_pred(struct keybuf *buf, struct bkey *k)
- {
- return true;
- }
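- /*
- * debugfs read(): drains the formatted key buffer to userspace, refilling it
- * one key at a time from a keybuf rescan until the whole keyspace has been
- * walked.
- */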
- static ssize_t bch_dump_read(struct file *file, char __user *buf,
- size_t size, loff_t *ppos)
- {
- struct dump_iterator *i = file->private_data;
- ssize_t ret = 0;
- while (size) {
- struct keybuf_key *w;
- unsigned bytes = min(i->bytes, size);
- if (copy_to_user(buf, i->buf, bytes))
- return -EFAULT;
- ret += bytes;
- buf += bytes;
- size -= bytes;
- i->bytes -= bytes;
- memmove(i->buf, i->buf + bytes, i->bytes);
- if (i->bytes)
- break;
- w = bch_keybuf_next_rescan(i->c, &i->keys, &MAX_KEY);
- if (!w)
- break;
- i->bytes = snprintf(i->buf, PAGE_SIZE, "%s\n", pkey(&w->key));
- bch_keybuf_del(&i->keys, w);
- }
- return ret;
- }
- static int bch_dump_open(struct inode *inode, struct file *file)
- {
- struct cache_set *c = inode->i_private;
- struct dump_iterator *i;
- i = kzalloc(sizeof(struct dump_iterator), GFP_KERNEL);
- if (!i)
- return -ENOMEM;
- file->private_data = i;
- i->c = c;
- bch_keybuf_init(&i->keys, dump_pred);
- i->keys.last_scanned = KEY(0, 0, 0);
- return 0;
- }
- static int bch_dump_release(struct inode *inode, struct file *file)
- {
- kfree(file->private_data);
- return 0;
- }
- static const struct file_operations cache_set_debug_ops = {
- .owner = THIS_MODULE,
- .open = bch_dump_open,
- .read = bch_dump_read,
- .release = bch_dump_release
- };
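- /* Creates the per-cache-set debugfs file, named "bcache-<set uuid>". */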
- void bch_debug_init_cache_set(struct cache_set *c)
- {
- if (!IS_ERR_OR_NULL(debug)) {
- char name[50];
- snprintf(name, 50, "bcache-%pU", c->sb.set_uuid);
- c->debug = debugfs_create_file(name, 0400, debug, c,
- &cache_set_debug_ops);
- }
- }
- #endif
- #ifdef CONFIG_BCACHE_DEBUG
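- /*
- * Sysfs-triggered fuzz test: inserts random keys into an in-memory node while
- * mirroring each written block into a second node, then compares the result of
- * an in-memory sort against the simulated read path and panics on any
- * difference.
- */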
- static ssize_t btree_fuzz(struct kobject *k, struct kobj_attribute *a,
- const char *buffer, size_t size)
- {
- void dump(struct btree *b)
- {
- struct bset *i;
- for (i = b->sets[0].data;
- index(i, b) < btree_blocks(b) &&
- i->seq == b->sets[0].data->seq;
- i = ((void *) i) + set_blocks(i, b->c) * block_bytes(b->c))
- dump_bset(b, i);
- }
- struct cache_sb *sb;
- struct cache_set *c;
- struct btree *all[3], *b, *fill, *orig;
- int j;
- struct btree_op op;
- bch_btree_op_init_stack(&op);
- sb = kzalloc(sizeof(struct cache_sb), GFP_KERNEL);
- if (!sb)
- return -ENOMEM;
- sb->bucket_size = 128;
- sb->block_size = 4;
- c = bch_cache_set_alloc(sb);
- if (!c) {
- kfree(sb);
- return -ENOMEM;
- }
- for (j = 0; j < 3; j++) {
- BUG_ON(list_empty(&c->btree_cache));
- all[j] = list_first_entry(&c->btree_cache, struct btree, list);
- list_del_init(&all[j]->list);
- all[j]->key = KEY(0, 0, c->sb.bucket_size);
- bkey_copy_key(&all[j]->key, &MAX_KEY);
- }
- b = all[0];
- fill = all[1];
- orig = all[2];
- while (1) {
- for (j = 0; j < 3; j++)
- all[j]->written = all[j]->nsets = 0;
- bch_bset_init_next(b);
- while (1) {
- struct bset *i = write_block(b);
- struct bkey *k = op.keys.top;
- unsigned rand;
- bkey_init(k);
- rand = get_random_int();
- op.type = rand & 1
- ? BTREE_INSERT
- : BTREE_REPLACE;
- rand >>= 1;
- SET_KEY_SIZE(k, bucket_remainder(c, rand));
- rand >>= c->bucket_bits;
- rand &= 1024 * 512 - 1;
- rand += c->sb.bucket_size;
- SET_KEY_OFFSET(k, rand);
- #if 0
- SET_KEY_PTRS(k, 1);
- #endif
- bch_keylist_push(&op.keys);
- bch_btree_insert_keys(b, &op);
- if (should_split(b) ||
- set_blocks(i, b->c) !=
- __set_blocks(i, i->keys + 15, b->c)) {
- i->csum = csum_set(i);
- memcpy(write_block(fill),
- i, set_bytes(i));
- b->written += set_blocks(i, b->c);
- fill->written = b->written;
- if (b->written == btree_blocks(b))
- break;
- bch_btree_sort_lazy(b);
- bch_bset_init_next(b);
- }
- }
- memcpy(orig->sets[0].data,
- fill->sets[0].data,
- btree_bytes(c));
- bch_btree_sort(b);
- fill->written = 0;
- bch_btree_read_done(&fill->io.cl);
- if (b->sets[0].data->keys != fill->sets[0].data->keys ||
- memcmp(b->sets[0].data->start,
- fill->sets[0].data->start,
- b->sets[0].data->keys * sizeof(uint64_t))) {
- struct bset *i = b->sets[0].data;
- struct bkey *k, *l;
- for (k = i->start,
- l = fill->sets[0].data->start;
- k < end(i);
- k = bkey_next(k), l = bkey_next(l))
- if (bkey_cmp(k, l) ||
- KEY_SIZE(k) != KEY_SIZE(l))
- pr_err("key %zi differs: %s != %s",
- (uint64_t *) k - i->d,
- pkey(k), pkey(l));
- for (j = 0; j < 3; j++) {
- pr_err("**** Set %i ****", j);
- dump(all[j]);
- }
- panic("\n");
- }
- pr_info("fuzz complete: %i keys", b->sets[0].data->keys);
- }
- }
- kobj_attribute_write(fuzz, btree_fuzz);
- #endif
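- /* Removes the top-level "bcache" debugfs directory created by bch_debug_init(). */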
- void bch_debug_exit(void)
- {
- if (!IS_ERR_OR_NULL(debug))
- debugfs_remove_recursive(debug);
- }
- int __init bch_debug_init(struct kobject *kobj)
- {
- int ret = 0;
- #ifdef CONFIG_BCACHE_DEBUG
- ret = sysfs_create_file(kobj, &ksysfs_fuzz.attr);
- if (ret)
- return ret;
- #endif
- debug = debugfs_create_dir("bcache", NULL);
- return ret;
- }