/*
 * Assorted bcache debug code
 *
 * Copyright 2010, 2011 Kent Overstreet <kent.overstreet@gmail.com>
 * Copyright 2012 Google, Inc.
 */

#include "bcache.h"
#include "btree.h"
#include "debug.h"
#include "request.h"

#include <linux/console.h>
#include <linux/debugfs.h>
#include <linux/module.h>
#include <linux/random.h>
#include <linux/seq_file.h>

static struct dentry *debug;

const char *bch_ptr_status(struct cache_set *c, const struct bkey *k)
{
	unsigned i;

	for (i = 0; i < KEY_PTRS(k); i++)
		if (ptr_available(c, k, i)) {
			struct cache *ca = PTR_CACHE(c, k, i);
			size_t bucket = PTR_BUCKET_NR(c, k, i);
			size_t r = bucket_remainder(c, PTR_OFFSET(k, i));

			if (KEY_SIZE(k) + r > c->sb.bucket_size)
				return "bad, length too big";
			if (bucket < ca->sb.first_bucket)
				return "bad, short offset";
			if (bucket >= ca->sb.nbuckets)
				return "bad, offset past end of device";
			if (ptr_stale(c, k, i))
				return "stale";
		}

	if (!bkey_cmp(k, &ZERO_KEY))
		return "bad, null key";
	if (!KEY_PTRS(k))
		return "bad, no pointers";
	if (!KEY_SIZE(k))
		return "zeroed key";
	return "";
}

struct keyprint_hack bch_pkey(const struct bkey *k)
{
	unsigned i = 0;
	struct keyprint_hack r;
	char *out = r.s, *end = r.s + KEYHACK_SIZE;

	/* Bounded append: scnprintf() never writes past the end of r.s */
#define p(...)	(out += scnprintf(out, end - out, __VA_ARGS__))

	p("%llu:%llu len %llu -> [", KEY_INODE(k), KEY_OFFSET(k), KEY_SIZE(k));

	if (KEY_PTRS(k))
		while (1) {
			p("%llu:%llu gen %llu",
			  PTR_DEV(k, i), PTR_OFFSET(k, i), PTR_GEN(k, i));

			if (++i == KEY_PTRS(k))
				break;

			p(", ");
		}

	p("]");

	if (KEY_DIRTY(k))
		p(" dirty");
	if (KEY_CSUM(k))
		p(" cs%llu %llx", KEY_CSUM(k), k->ptr[1]);
#undef p
	return r;
}

struct keyprint_hack bch_pbtree(const struct btree *b)
{
	struct keyprint_hack r;

	snprintf(r.s, 40, "%li level %i/%i", PTR_BUCKET_NR(b->c, &b->key, 0),
		 b->level, b->c->root ? b->c->root->level : -1);
	return r;
}
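
/*
 * Consistency checks shared by CONFIG_BCACHE_DEBUG and CONFIG_BCACHE_EDEBUG:
 * a bkey names the *end* of its extent, so in a sorted leaf node a key must
 * not compare greater than the start of the key that follows it (that would
 * mean the extents overlap); in interior nodes whole keys must simply be
 * ascending. skipped_backwards() detects violations, and dump_bset() prints
 * a bset's keys with their pointer status for post-mortem output.
 */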

#if defined(CONFIG_BCACHE_DEBUG) || defined(CONFIG_BCACHE_EDEBUG)

static bool skipped_backwards(struct btree *b, struct bkey *k)
{
	return bkey_cmp(k, (!b->level)
			? &START_KEY(bkey_next(k))
			: bkey_next(k)) > 0;
}

static void dump_bset(struct btree *b, struct bset *i)
{
	struct bkey *k;
	unsigned j;

	for (k = i->start; k < end(i); k = bkey_next(k)) {
		printk(KERN_ERR "block %zu key %zi/%u: %s", index(i, b),
		       (uint64_t *) k - i->d, i->keys, pkey(k));

		for (j = 0; j < KEY_PTRS(k); j++) {
			size_t n = PTR_BUCKET_NR(b->c, k, j);
			printk(" bucket %zu", n);

			if (n >= b->c->sb.first_bucket &&
			    n < b->c->sb.nbuckets)
				printk(" prio %i",
				       PTR_BUCKET(b->c, k, j)->prio);
		}

		printk(" %s\n", bch_ptr_status(b->c, k));

		if (bkey_next(k) < end(i) &&
		    skipped_backwards(b, k))
			printk(KERN_ERR "Key skipped backwards\n");
	}
}

#endif

#ifdef CONFIG_BCACHE_DEBUG

void bch_btree_verify(struct btree *b, struct bset *new)
{
	struct btree *v = b->c->verify_data;
	struct closure cl;
	closure_init_stack(&cl);

	if (!b->c->verify)
		return;

	/* Wait for any in-flight i/o on b before touching the verify node */
	closure_wait_event(&b->io.wait, &cl,
			   atomic_read(&b->io.cl.remaining) == -1);

	mutex_lock(&b->c->verify_lock);

	bkey_copy(&v->key, &b->key);
	v->written = 0;
	v->level = b->level;

	bch_btree_read(v);
	/* Wait for the read of the verify node to complete */
	closure_wait_event(&v->io.wait, &cl,
			   atomic_read(&v->io.cl.remaining) == -1);

	if (new->keys != v->sets[0].data->keys ||
	    memcmp(new->start,
		   v->sets[0].data->start,
		   (void *) end(new) - (void *) new->start)) {
		unsigned i, j;

		console_lock();

		printk(KERN_ERR "*** original memory node:\n");
		for (i = 0; i <= b->nsets; i++)
			dump_bset(b, b->sets[i].data);

		printk(KERN_ERR "*** sorted memory node:\n");
		dump_bset(b, new);

		printk(KERN_ERR "*** on disk node:\n");
		dump_bset(v, v->sets[0].data);

		for (j = 0; j < new->keys; j++)
			if (new->d[j] != v->sets[0].data->d[j])
				break;

		console_unlock();
		panic("verify failed at %u\n", j);
	}

	mutex_unlock(&b->c->verify_lock);
}

static void data_verify_endio(struct bio *bio, int error)
{
	struct closure *cl = bio->bi_private;
	closure_put(cl);
}

void bch_data_verify(struct search *s)
{
	char name[BDEVNAME_SIZE];
	struct cached_dev *dc = container_of(s->d, struct cached_dev, disk);
	struct closure *cl = &s->cl;
	struct bio *check;
	struct bio_vec *bv;
	int i;

	if (!s->unaligned_bvec)
		bio_for_each_segment(bv, s->orig_bio, i)
			bv->bv_offset = 0, bv->bv_len = PAGE_SIZE;

	check = bio_clone(s->orig_bio, GFP_NOIO);
	if (!check)
		return;

	if (bch_bio_alloc_pages(check, GFP_NOIO))
		goto out_put;

	/* Submit a synchronous read of the same range to compare against */
	check->bi_rw		= READ_SYNC;
	check->bi_private	= cl;
	check->bi_end_io	= data_verify_endio;

	closure_bio_submit(check, cl, &dc->disk);
	closure_sync(cl);

	bio_for_each_segment(bv, s->orig_bio, i) {
		void *p1 = kmap(bv->bv_page);
		void *p2 = kmap(check->bi_io_vec[i].bv_page);

		if (memcmp(p1 + bv->bv_offset,
			   p2 + bv->bv_offset,
			   bv->bv_len))
			printk(KERN_ERR
			       "bcache (%s): verify failed at sector %llu\n",
			       bdevname(dc->bdev, name),
			       (uint64_t) s->orig_bio->bi_sector);

		kunmap(bv->bv_page);
		kunmap(check->bi_io_vec[i].bv_page);
	}

	__bio_for_each_segment(bv, check, i, 0)
		__free_page(bv->bv_page);
out_put:
	bio_put(check);
}

#endif

#ifdef CONFIG_BCACHE_EDEBUG

unsigned bch_count_data(struct btree *b)
{
	unsigned ret = 0;
	struct btree_iter iter;
	struct bkey *k;

	if (!b->level)
		for_each_key(b, k, &iter)
			ret += KEY_SIZE(k);
	return ret;
}

static void vdump_bucket_and_panic(struct btree *b, const char *fmt,
				   va_list args)
{
	unsigned i;

	console_lock();

	for (i = 0; i <= b->nsets; i++)
		dump_bset(b, b->sets[i].data);

	vprintk(fmt, args);

	console_unlock();

	panic("at %s\n", pbtree(b));
}
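
/*
 * Both checkers below walk a node's keys and panic via
 * vdump_bucket_and_panic() on the first violation, dumping every bset in
 * the node first: bch_check_key_order_msg() verifies that a single bset
 * is sorted, while bch_check_keys() iterates the whole node and also
 * checks that extents in a leaf don't overlap.
 */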
void bch_check_key_order_msg(struct btree *b, struct bset *i,
			     const char *fmt, ...)
{
	struct bkey *k;

	if (!i->keys)
		return;

	for (k = i->start; bkey_next(k) < end(i); k = bkey_next(k))
		if (skipped_backwards(b, k)) {
			va_list args;
			va_start(args, fmt);

			vdump_bucket_and_panic(b, fmt, args);
			va_end(args);
		}
}

void bch_check_keys(struct btree *b, const char *fmt, ...)
{
	va_list args;
	struct bkey *k, *p = NULL;
	struct btree_iter iter;

	if (b->level)
		return;

	for_each_key(b, k, &iter) {
		if (p && bkey_cmp(&START_KEY(p), &START_KEY(k)) > 0) {
			printk(KERN_ERR "Keys out of order:\n");
			goto bug;
		}

		if (bch_ptr_invalid(b, k))
			continue;

		if (p && bkey_cmp(p, &START_KEY(k)) > 0) {
			printk(KERN_ERR "Overlapping keys:\n");
			goto bug;
		}
		p = k;
	}
	return;
bug:
	va_start(args, fmt);
	vdump_bucket_and_panic(b, fmt, args);
	va_end(args);
}

#endif

#ifdef CONFIG_DEBUG_FS

/* XXX: cache set refcounting */

struct dump_iterator {
	char			buf[PAGE_SIZE];
	size_t			bytes;
	struct cache_set	*c;
	struct keybuf		keys;
};

static bool dump_pred(struct keybuf *buf, struct bkey *k)
{
	return true;
}

static ssize_t bch_dump_read(struct file *file, char __user *buf,
			     size_t size, loff_t *ppos)
{
	struct dump_iterator *i = file->private_data;
	ssize_t ret = 0;

	while (size) {
		struct keybuf_key *w;
		unsigned bytes = min(i->bytes, size);

		if (copy_to_user(buf, i->buf, bytes))
			return -EFAULT;

		ret	 += bytes;
		buf	 += bytes;
		size	 -= bytes;
		i->bytes -= bytes;
		memmove(i->buf, i->buf + bytes, i->bytes);

		/* Buffer not fully drained: the user buffer is full */
		if (i->bytes)
			break;

		w = bch_keybuf_next_rescan(i->c, &i->keys, &MAX_KEY);
		if (!w)
			break;

		/* Refill the buffer with the next key's text */
		i->bytes = snprintf(i->buf, PAGE_SIZE, "%s\n", pkey(&w->key));
		bch_keybuf_del(&i->keys, w);
	}

	return ret;
}

static int bch_dump_open(struct inode *inode, struct file *file)
{
	struct cache_set *c = inode->i_private;
	struct dump_iterator *i;

	i = kzalloc(sizeof(struct dump_iterator), GFP_KERNEL);
	if (!i)
		return -ENOMEM;

	file->private_data = i;
	i->c = c;
	bch_keybuf_init(&i->keys, dump_pred);
	i->keys.last_scanned = KEY(0, 0, 0);

	return 0;
}

static int bch_dump_release(struct inode *inode, struct file *file)
{
	kfree(file->private_data);
	return 0;
}

static const struct file_operations cache_set_debug_ops = {
	.owner		= THIS_MODULE,
	.open		= bch_dump_open,
	.read		= bch_dump_read,
	.release	= bch_dump_release
};

void bch_debug_init_cache_set(struct cache_set *c)
{
	if (!IS_ERR_OR_NULL(debug)) {
		char name[50];
		snprintf(name, 50, "bcache-%pU", c->sb.set_uuid);

		c->debug = debugfs_create_file(name, 0400, debug, c,
					       &cache_set_debug_ops);
	}
}

#endif
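
/*
 * Randomized self test: btree_fuzz() builds a throwaway cache set, keeps
 * inserting randomly generated keys into one in-memory node while
 * mirroring each finished bset into a second node, then sorts the first
 * node and runs the mirror through the btree read path; the two results
 * must be identical, or all three nodes are dumped and we panic.
 */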
#ifdef CONFIG_BCACHE_DEBUG

static ssize_t btree_fuzz(struct kobject *k, struct kobj_attribute *a,
			  const char *buffer, size_t size)
{
	/* GCC nested function: dump every bset in a node */
	void dump(struct btree *b)
	{
		struct bset *i;

		for (i = b->sets[0].data;
		     index(i, b) < btree_blocks(b) &&
		     i->seq == b->sets[0].data->seq;
		     i = ((void *) i) + set_blocks(i, b->c) *
			     block_bytes(b->c))
			dump_bset(b, i);
	}

	struct cache_sb *sb;
	struct cache_set *c;
	struct btree *all[3], *b, *fill, *orig;
	int j;

	struct btree_op op;
	bch_btree_op_init_stack(&op);

	sb = kzalloc(sizeof(struct cache_sb), GFP_KERNEL);
	if (!sb)
		return -ENOMEM;

	sb->bucket_size = 128;
	sb->block_size = 4;

	c = bch_cache_set_alloc(sb);
	if (!c)
		return -ENOMEM;

	for (j = 0; j < 3; j++) {
		BUG_ON(list_empty(&c->btree_cache));
		all[j] = list_first_entry(&c->btree_cache,
					  struct btree, list);
		list_del_init(&all[j]->list);

		all[j]->key = KEY(0, 0, c->sb.bucket_size);
		bkey_copy_key(&all[j]->key, &MAX_KEY);
	}

	b = all[0];
	fill = all[1];
	orig = all[2];

	while (1) {
		for (j = 0; j < 3; j++)
			all[j]->written = all[j]->nsets = 0;

		bch_bset_init_next(b);

		while (1) {
			struct bset *i = write_block(b);
			struct bkey *k = op.keys.top;
			unsigned rand;

			bkey_init(k);
			rand = get_random_int();

			op.type = rand & 1
				? BTREE_INSERT
				: BTREE_REPLACE;
			rand >>= 1;

			SET_KEY_SIZE(k, bucket_remainder(c, rand));
			rand >>= c->bucket_bits;
			rand &= 1024 * 512 - 1;
			rand += c->sb.bucket_size;
			SET_KEY_OFFSET(k, rand);
#if 0
			SET_KEY_PTRS(k, 1);
#endif
			bch_keylist_push(&op.keys);
			bch_btree_insert_keys(b, &op);

			if (should_split(b) ||
			    set_blocks(i, b->c) !=
			    __set_blocks(i, i->keys + 15, b->c)) {
				i->csum = csum_set(i);

				memcpy(write_block(fill),
				       i, set_bytes(i));

				b->written += set_blocks(i, b->c);
				fill->written = b->written;
				if (b->written == btree_blocks(b))
					break;

				bch_btree_sort_lazy(b);
				bch_bset_init_next(b);
			}
		}

		memcpy(orig->sets[0].data,
		       fill->sets[0].data,
		       btree_bytes(c));

		bch_btree_sort(b);
		fill->written = 0;
		bch_btree_read_done(&fill->io.cl);

		if (b->sets[0].data->keys != fill->sets[0].data->keys ||
		    memcmp(b->sets[0].data->start,
			   fill->sets[0].data->start,
			   b->sets[0].data->keys * sizeof(uint64_t))) {
			struct bset *i = b->sets[0].data;
			struct bkey *k, *l;

			for (k = i->start,
			     l = fill->sets[0].data->start;
			     k < end(i);
			     k = bkey_next(k), l = bkey_next(l))
				if (bkey_cmp(k, l) ||
				    KEY_SIZE(k) != KEY_SIZE(l))
					pr_err("key %zi differs: %s != %s",
					       (uint64_t *) k - i->d,
					       pkey(k), pkey(l));

			for (j = 0; j < 3; j++) {
				pr_err("**** Set %i ****", j);
				dump(all[j]);
			}
			panic("\n");
		}

		pr_info("fuzz complete: %i keys", b->sets[0].data->keys);
	}
}

kobj_attribute_write(fuzz, btree_fuzz);
#endif

void bch_debug_exit(void)
{
	if (!IS_ERR_OR_NULL(debug))
		debugfs_remove_recursive(debug);
}

int __init bch_debug_init(struct kobject *kobj)
{
	int ret = 0;
#ifdef CONFIG_BCACHE_DEBUG
	ret = sysfs_create_file(kobj, &ksysfs_fuzz.attr);
	if (ret)
		return ret;
#endif

	debug = debugfs_create_dir("bcache", NULL);
	return ret;
}
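
/*
 * Usage: bch_debug_init() receives the module's kobject at init time;
 * with CONFIG_BCACHE_DEBUG set, writing anything to the resulting sysfs
 * "fuzz" attribute runs btree_fuzz(). With debugfs mounted at the usual
 * /sys/kernel/debug, each cache set's keys can be dumped by reading
 * /sys/kernel/debug/bcache/bcache-<set uuid>.
 */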