4f024f3797
Immutable biovecs are going to require an explicit iterator. To implement immutable bvecs, a later patch is going to add a bi_bvec_done member to this struct; for now, this patch effectively just renames things. Signed-off-by: Kent Overstreet <kmo@daterainc.com> Cc: Jens Axboe <axboe@kernel.dk> Cc: Geert Uytterhoeven <geert@linux-m68k.org> Cc: Benjamin Herrenschmidt <benh@kernel.crashing.org> Cc: Paul Mackerras <paulus@samba.org> Cc: "Ed L. Cashin" <ecashin@coraid.com> Cc: Nick Piggin <npiggin@kernel.dk> Cc: Lars Ellenberg <drbd-dev@lists.linbit.com> Cc: Jiri Kosina <jkosina@suse.cz> Cc: Matthew Wilcox <willy@linux.intel.com> Cc: Geoff Levand <geoff@infradead.org> Cc: Yehuda Sadeh <yehuda@inktank.com> Cc: Sage Weil <sage@inktank.com> Cc: Alex Elder <elder@inktank.com> Cc: ceph-devel@vger.kernel.org Cc: Joshua Morris <josh.h.morris@us.ibm.com> Cc: Philip Kelleher <pjk1939@linux.vnet.ibm.com> Cc: Rusty Russell <rusty@rustcorp.com.au> Cc: "Michael S. Tsirkin" <mst@redhat.com> Cc: Konrad Rzeszutek Wilk <konrad.wilk@oracle.com> Cc: Jeremy Fitzhardinge <jeremy@goop.org> Cc: Neil Brown <neilb@suse.de> Cc: Alasdair Kergon <agk@redhat.com> Cc: Mike Snitzer <snitzer@redhat.com> Cc: dm-devel@redhat.com Cc: Martin Schwidefsky <schwidefsky@de.ibm.com> Cc: Heiko Carstens <heiko.carstens@de.ibm.com> Cc: linux390@de.ibm.com Cc: Boaz Harrosh <bharrosh@panasas.com> Cc: Benny Halevy <bhalevy@tonian.com> Cc: "James E.J. Bottomley" <JBottomley@parallels.com> Cc: Greg Kroah-Hartman <gregkh@linuxfoundation.org> Cc: "Nicholas A. 
Bellinger" <nab@linux-iscsi.org> Cc: Alexander Viro <viro@zeniv.linux.org.uk> Cc: Chris Mason <chris.mason@fusionio.com> Cc: "Theodore Ts'o" <tytso@mit.edu> Cc: Andreas Dilger <adilger.kernel@dilger.ca> Cc: Jaegeuk Kim <jaegeuk.kim@samsung.com> Cc: Steven Whitehouse <swhiteho@redhat.com> Cc: Dave Kleikamp <shaggy@kernel.org> Cc: Joern Engel <joern@logfs.org> Cc: Prasad Joshi <prasadjoshi.linux@gmail.com> Cc: Trond Myklebust <Trond.Myklebust@netapp.com> Cc: KONISHI Ryusuke <konishi.ryusuke@lab.ntt.co.jp> Cc: Mark Fasheh <mfasheh@suse.com> Cc: Joel Becker <jlbec@evilplan.org> Cc: Ben Myers <bpm@sgi.com> Cc: xfs@oss.sgi.com Cc: Steven Rostedt <rostedt@goodmis.org> Cc: Frederic Weisbecker <fweisbec@gmail.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: Len Brown <len.brown@intel.com> Cc: Pavel Machek <pavel@ucw.cz> Cc: "Rafael J. Wysocki" <rjw@sisk.pl> Cc: Herton Ronaldo Krzesinski <herton.krzesinski@canonical.com> Cc: Ben Hutchings <ben@decadent.org.uk> Cc: Andrew Morton <akpm@linux-foundation.org> Cc: Guo Chao <yan@linux.vnet.ibm.com> Cc: Tejun Heo <tj@kernel.org> Cc: Asai Thambi S P <asamymuthupa@micron.com> Cc: Selvan Mani <smani@micron.com> Cc: Sam Bradshaw <sbradshaw@micron.com> Cc: Wei Yongjun <yongjun_wei@trendmicro.com.cn> Cc: "Roger Pau Monné" <roger.pau@citrix.com> Cc: Jan Beulich <jbeulich@suse.com> Cc: Stefano Stabellini <stefano.stabellini@eu.citrix.com> Cc: Ian Campbell <Ian.Campbell@citrix.com> Cc: Sebastian Ott <sebott@linux.vnet.ibm.com> Cc: Christian Borntraeger <borntraeger@de.ibm.com> Cc: Minchan Kim <minchan@kernel.org> Cc: Jiang Liu <jiang.liu@huawei.com> Cc: Nitin Gupta <ngupta@vflare.org> Cc: Jerome Marchand <jmarchand@redhat.com> Cc: Joe Perches <joe@perches.com> Cc: Peng Tao <tao.peng@emc.com> Cc: Andy Adamson <andros@netapp.com> Cc: fanchaoting <fanchaoting@cn.fujitsu.com> Cc: Jie Liu <jeff.liu@oracle.com> Cc: Sunil Mushran <sunil.mushran@gmail.com> Cc: "Martin K. 
Petersen" <martin.petersen@oracle.com> Cc: Namjae Jeon <namjae.jeon@samsung.com> Cc: Pankaj Kumar <pankaj.km@samsung.com> Cc: Dan Magenheimer <dan.magenheimer@oracle.com> Cc: Mel Gorman <mgorman@suse.de>6
387 lines
7.6 KiB
C
387 lines
7.6 KiB
C
/*
|
|
* Assorted bcache debug code
|
|
*
|
|
* Copyright 2010, 2011 Kent Overstreet <kent.overstreet@gmail.com>
|
|
* Copyright 2012 Google, Inc.
|
|
*/
|
|
|
|
#include "bcache.h"
|
|
#include "btree.h"
|
|
#include "debug.h"
|
|
|
|
#include <linux/console.h>
|
|
#include <linux/debugfs.h>
|
|
#include <linux/module.h>
|
|
#include <linux/random.h>
|
|
#include <linux/seq_file.h>
|
|
|
|
/*
 * Dentry returned by debugfs_create_dir("bcache", NULL) in bch_debug_init().
 * Users test it with IS_ERR_OR_NULL() before relying on it.
 */
static struct dentry *debug;
|
|
|
|
const char *bch_ptr_status(struct cache_set *c, const struct bkey *k)
|
|
{
|
|
unsigned i;
|
|
|
|
for (i = 0; i < KEY_PTRS(k); i++)
|
|
if (ptr_available(c, k, i)) {
|
|
struct cache *ca = PTR_CACHE(c, k, i);
|
|
size_t bucket = PTR_BUCKET_NR(c, k, i);
|
|
size_t r = bucket_remainder(c, PTR_OFFSET(k, i));
|
|
|
|
if (KEY_SIZE(k) + r > c->sb.bucket_size)
|
|
return "bad, length too big";
|
|
if (bucket < ca->sb.first_bucket)
|
|
return "bad, short offset";
|
|
if (bucket >= ca->sb.nbuckets)
|
|
return "bad, offset past end of device";
|
|
if (ptr_stale(c, k, i))
|
|
return "stale";
|
|
}
|
|
|
|
if (!bkey_cmp(k, &ZERO_KEY))
|
|
return "bad, null key";
|
|
if (!KEY_PTRS(k))
|
|
return "bad, no pointers";
|
|
if (!KEY_SIZE(k))
|
|
return "zeroed key";
|
|
return "";
|
|
}
|
|
|
|
/*
 * Format key @k into @buf (at most @size bytes, via scnprintf()).
 *
 * Layout: "inode:offset len size -> [dev:offset gen g, ...]", followed by
 * " dirty" when KEY_DIRTY() is set and " cs<type> <hex>" when KEY_CSUM() is
 * set.
 *
 * Returns the number of characters written, as accumulated from the
 * scnprintf() return values.
 */
int bch_bkey_to_text(char *buf, size_t size, const struct bkey *k)
{
	char *out = buf;
	char *limit = buf + size;
	unsigned ptr;

#define emit(...)	(out += scnprintf(out, limit - out, __VA_ARGS__))

	emit("%llu:%llu len %llu -> [", KEY_INODE(k), KEY_OFFSET(k), KEY_SIZE(k));

	for (ptr = 0; ptr < KEY_PTRS(k); ptr++) {
		/* Separator goes between pointers, never after the last one. */
		if (ptr)
			emit(", ");

		emit("%llu:%llu gen %llu",
		     PTR_DEV(k, ptr), PTR_OFFSET(k, ptr), PTR_GEN(k, ptr));
	}

	emit("]");

	if (KEY_DIRTY(k))
		emit(" dirty");

	if (KEY_CSUM(k))
		emit(" cs%llu %llx", KEY_CSUM(k), k->ptr[1]);

#undef emit

	return out - buf;
}
|
|
|
|
#ifdef CONFIG_BCACHE_DEBUG
|
|
|
|
static void dump_bset(struct btree *b, struct bset *i)
|
|
{
|
|
struct bkey *k, *next;
|
|
unsigned j;
|
|
char buf[80];
|
|
|
|
for (k = i->start; k < end(i); k = next) {
|
|
next = bkey_next(k);
|
|
|
|
bch_bkey_to_text(buf, sizeof(buf), k);
|
|
printk(KERN_ERR "block %zu key %zi/%u: %s", index(i, b),
|
|
(uint64_t *) k - i->d, i->keys, buf);
|
|
|
|
for (j = 0; j < KEY_PTRS(k); j++) {
|
|
size_t n = PTR_BUCKET_NR(b->c, k, j);
|
|
printk(" bucket %zu", n);
|
|
|
|
if (n >= b->c->sb.first_bucket && n < b->c->sb.nbuckets)
|
|
printk(" prio %i",
|
|
PTR_BUCKET(b->c, k, j)->prio);
|
|
}
|
|
|
|
printk(" %s\n", bch_ptr_status(b->c, k));
|
|
|
|
if (next < end(i) &&
|
|
bkey_cmp(k, !b->level ? &START_KEY(next) : next) > 0)
|
|
printk(KERN_ERR "Key skipped backwards\n");
|
|
}
|
|
}
|
|
|
|
static void bch_dump_bucket(struct btree *b)
|
|
{
|
|
unsigned i;
|
|
|
|
console_lock();
|
|
for (i = 0; i <= b->nsets; i++)
|
|
dump_bset(b, b->sets[i].data);
|
|
console_unlock();
|
|
}
|
|
|
|
void bch_btree_verify(struct btree *b, struct bset *new)
|
|
{
|
|
struct btree *v = b->c->verify_data;
|
|
struct closure cl;
|
|
closure_init_stack(&cl);
|
|
|
|
if (!b->c->verify)
|
|
return;
|
|
|
|
closure_wait_event(&b->io.wait, &cl,
|
|
atomic_read(&b->io.cl.remaining) == -1);
|
|
|
|
mutex_lock(&b->c->verify_lock);
|
|
|
|
bkey_copy(&v->key, &b->key);
|
|
v->written = 0;
|
|
v->level = b->level;
|
|
|
|
bch_btree_node_read(v);
|
|
closure_wait_event(&v->io.wait, &cl,
|
|
atomic_read(&b->io.cl.remaining) == -1);
|
|
|
|
if (new->keys != v->sets[0].data->keys ||
|
|
memcmp(new->start,
|
|
v->sets[0].data->start,
|
|
(void *) end(new) - (void *) new->start)) {
|
|
unsigned i, j;
|
|
|
|
console_lock();
|
|
|
|
printk(KERN_ERR "*** original memory node:\n");
|
|
for (i = 0; i <= b->nsets; i++)
|
|
dump_bset(b, b->sets[i].data);
|
|
|
|
printk(KERN_ERR "*** sorted memory node:\n");
|
|
dump_bset(b, new);
|
|
|
|
printk(KERN_ERR "*** on disk node:\n");
|
|
dump_bset(v, v->sets[0].data);
|
|
|
|
for (j = 0; j < new->keys; j++)
|
|
if (new->d[j] != v->sets[0].data->d[j])
|
|
break;
|
|
|
|
console_unlock();
|
|
panic("verify failed at %u\n", j);
|
|
}
|
|
|
|
mutex_unlock(&b->c->verify_lock);
|
|
}
|
|
|
|
void bch_data_verify(struct cached_dev *dc, struct bio *bio)
|
|
{
|
|
char name[BDEVNAME_SIZE];
|
|
struct bio *check;
|
|
struct bio_vec *bv;
|
|
int i;
|
|
|
|
check = bio_clone(bio, GFP_NOIO);
|
|
if (!check)
|
|
return;
|
|
|
|
if (bio_alloc_pages(check, GFP_NOIO))
|
|
goto out_put;
|
|
|
|
submit_bio_wait(READ_SYNC, check);
|
|
|
|
bio_for_each_segment(bv, bio, i) {
|
|
void *p1 = kmap_atomic(bv->bv_page);
|
|
void *p2 = page_address(check->bi_io_vec[i].bv_page);
|
|
|
|
cache_set_err_on(memcmp(p1 + bv->bv_offset,
|
|
p2 + bv->bv_offset,
|
|
bv->bv_len),
|
|
dc->disk.c,
|
|
"verify failed at dev %s sector %llu",
|
|
bdevname(dc->bdev, name),
|
|
(uint64_t) bio->bi_iter.bi_sector);
|
|
|
|
kunmap_atomic(p1);
|
|
}
|
|
|
|
bio_for_each_segment_all(bv, check, i)
|
|
__free_page(bv->bv_page);
|
|
out_put:
|
|
bio_put(check);
|
|
}
|
|
|
|
int __bch_count_data(struct btree *b)
|
|
{
|
|
unsigned ret = 0;
|
|
struct btree_iter iter;
|
|
struct bkey *k;
|
|
|
|
if (!b->level)
|
|
for_each_key(b, k, &iter)
|
|
ret += KEY_SIZE(k);
|
|
return ret;
|
|
}
|
|
|
|
void __bch_check_keys(struct btree *b, const char *fmt, ...)
|
|
{
|
|
va_list args;
|
|
struct bkey *k, *p = NULL;
|
|
struct btree_iter iter;
|
|
const char *err;
|
|
|
|
for_each_key(b, k, &iter) {
|
|
if (!b->level) {
|
|
err = "Keys out of order";
|
|
if (p && bkey_cmp(&START_KEY(p), &START_KEY(k)) > 0)
|
|
goto bug;
|
|
|
|
if (bch_ptr_invalid(b, k))
|
|
continue;
|
|
|
|
err = "Overlapping keys";
|
|
if (p && bkey_cmp(p, &START_KEY(k)) > 0)
|
|
goto bug;
|
|
} else {
|
|
if (bch_ptr_bad(b, k))
|
|
continue;
|
|
|
|
err = "Duplicate keys";
|
|
if (p && !bkey_cmp(p, k))
|
|
goto bug;
|
|
}
|
|
p = k;
|
|
}
|
|
|
|
err = "Key larger than btree node key";
|
|
if (p && bkey_cmp(p, &b->key) > 0)
|
|
goto bug;
|
|
|
|
return;
|
|
bug:
|
|
bch_dump_bucket(b);
|
|
|
|
va_start(args, fmt);
|
|
vprintk(fmt, args);
|
|
va_end(args);
|
|
|
|
panic("bcache error: %s:\n", err);
|
|
}
|
|
|
|
void bch_btree_iter_next_check(struct btree_iter *iter)
|
|
{
|
|
struct bkey *k = iter->data->k, *next = bkey_next(k);
|
|
|
|
if (next < iter->data->end &&
|
|
bkey_cmp(k, iter->b->level ? next : &START_KEY(next)) > 0) {
|
|
bch_dump_bucket(iter->b);
|
|
panic("Key skipped backwards\n");
|
|
}
|
|
}
|
|
|
|
#endif
|
|
|
|
#ifdef CONFIG_DEBUG_FS
|
|
|
|
/* XXX: cache set refcounting */
|
|
|
|
struct dump_iterator {
|
|
char buf[PAGE_SIZE];
|
|
size_t bytes;
|
|
struct cache_set *c;
|
|
struct keybuf keys;
|
|
};
|
|
|
|
static bool dump_pred(struct keybuf *buf, struct bkey *k)
|
|
{
|
|
return true;
|
|
}
|
|
|
|
/*
 * read() handler for the per-cache-set debugfs dump file.
 *
 * Drains any text left in the iterator's buffer into @buf, then formats the
 * next key returned by bch_keybuf_next_rescan() (one key per line) and
 * repeats until @size bytes were produced, the user buffer filled up
 * mid-line, or no more keys are returned.
 *
 * Returns the number of bytes copied to userspace, or -EFAULT if the user
 * buffer could not be written.
 */
static ssize_t bch_dump_read(struct file *file, char __user *buf,
			     size_t size, loff_t *ppos)
{
	struct dump_iterator *i = file->private_data;
	ssize_t ret = 0;
	char kbuf[80];

	while (size) {
		struct keybuf_key *w;
		unsigned bytes = min(i->bytes, size);

		/*
		 * copy_to_user() returns the number of bytes it failed to
		 * copy, not an errno.  Handing that positive count back from
		 * read() would look like a successful short read, so turn
		 * any failure into -EFAULT.
		 */
		if (copy_to_user(buf, i->buf, bytes))
			return -EFAULT;

		ret += bytes;
		buf += bytes;
		size -= bytes;
		i->bytes -= bytes;
		/* Shift whatever did not fit to the front of the buffer. */
		memmove(i->buf, i->buf + bytes, i->bytes);

		/* Leftover text means the user buffer is full. */
		if (i->bytes)
			break;

		w = bch_keybuf_next_rescan(i->c, &i->keys, &MAX_KEY, dump_pred);
		if (!w)
			break;

		bch_bkey_to_text(kbuf, sizeof(kbuf), &w->key);
		i->bytes = snprintf(i->buf, PAGE_SIZE, "%s\n", kbuf);
		bch_keybuf_del(&i->keys, w);
	}

	return ret;
}
|
|
|
|
static int bch_dump_open(struct inode *inode, struct file *file)
|
|
{
|
|
struct cache_set *c = inode->i_private;
|
|
struct dump_iterator *i;
|
|
|
|
i = kzalloc(sizeof(struct dump_iterator), GFP_KERNEL);
|
|
if (!i)
|
|
return -ENOMEM;
|
|
|
|
file->private_data = i;
|
|
i->c = c;
|
|
bch_keybuf_init(&i->keys);
|
|
i->keys.last_scanned = KEY(0, 0, 0);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int bch_dump_release(struct inode *inode, struct file *file)
|
|
{
|
|
kfree(file->private_data);
|
|
return 0;
|
|
}
|
|
|
|
static const struct file_operations cache_set_debug_ops = {
|
|
.owner = THIS_MODULE,
|
|
.open = bch_dump_open,
|
|
.read = bch_dump_read,
|
|
.release = bch_dump_release
|
|
};
|
|
|
|
void bch_debug_init_cache_set(struct cache_set *c)
|
|
{
|
|
if (!IS_ERR_OR_NULL(debug)) {
|
|
char name[50];
|
|
snprintf(name, 50, "bcache-%pU", c->sb.set_uuid);
|
|
|
|
c->debug = debugfs_create_file(name, 0400, debug, c,
|
|
&cache_set_debug_ops);
|
|
}
|
|
}
|
|
|
|
#endif
|
|
|
|
void bch_debug_exit(void)
|
|
{
|
|
if (!IS_ERR_OR_NULL(debug))
|
|
debugfs_remove_recursive(debug);
|
|
}
|
|
|
|
/*
 * Create the top-level "bcache" debugfs directory.
 *
 * The result of debugfs_create_dir() is only stored, never checked here, so
 * this always returns 0.  @kobj is unused.
 */
int __init bch_debug_init(struct kobject *kobj)
{
	debug = debugfs_create_dir("bcache", NULL);

	return 0;
}
|