From: Liu Bo <liubo2009@cn.fujitsu.com>
To: Stefan Behrens <sbehrens@giantdisaster.de>
Cc: linux-btrfs@vger.kernel.org
Subject: Re: [PATCH v3 3/3] Btrfs: read device stats on mount, write modified ones during commit
Date: Thu, 17 May 2012 09:52:48 +0800 [thread overview]
Message-ID: <4FB459F0.3050502@cn.fujitsu.com> (raw)
In-Reply-To: <f7e60650b3463d028f86b38ef3e6aaf77efa665b.1337185201.git.sbehrens@giantdisaster.de>
On 05/17/2012 12:50 AM, Stefan Behrens wrote:
> The device statistics are written into the device tree with each
> transaction commit. Only modified statistics are written.
> When a filesystem is mounted, the device statistics for each involved
> device are read from the device tree and used to initialize the
> counters.
>
Hi Stefan,
I just scanned the patch briefly and have a question:
Adding a new key type usually means changing the on-disk format,
so have you done anything to handle that?
thanks,
liubo
> Signed-off-by: Stefan Behrens <sbehrens@giantdisaster.de>
> ---
> fs/btrfs/ctree.h | 51 ++++++++++++
> fs/btrfs/disk-io.c | 7 ++
> fs/btrfs/print-tree.c | 3 +
> fs/btrfs/transaction.c | 4 +
> fs/btrfs/volumes.c | 205 ++++++++++++++++++++++++++++++++++++++++++++++++
> fs/btrfs/volumes.h | 9 +++
> 6 files changed, 279 insertions(+)
>
> diff --git a/fs/btrfs/ctree.h b/fs/btrfs/ctree.h
> index ec42a24..1dd7651 100644
> --- a/fs/btrfs/ctree.h
> +++ b/fs/btrfs/ctree.h
> @@ -823,6 +823,26 @@ struct btrfs_csum_item {
> u8 csum;
> } __attribute__ ((__packed__));
>
> +struct btrfs_device_stats_item {
> + /*
> + * grow this item struct at the end for future enhancements and keep
> + * the existing values unchanged
> + */
> + __le64 cnt_write_io_errs; /* EIO or EREMOTEIO from lower layers */
> + __le64 cnt_read_io_errs; /* EIO or EREMOTEIO from lower layers */
> + __le64 cnt_flush_io_errs; /* EIO or EREMOTEIO from lower layers */
> +
> + /* stats for indirect indications for I/O failures */
> + __le64 cnt_corruption_errs; /* checksum error, bytenr error or
> + * contents is illegal: this is an
> + * indication that the block was damaged
> + * during read or write, or written to
> + * wrong location or read from wrong
> + * location */
> + __le64 cnt_generation_errs; /* an indication that blocks have not
> + * been written */
> +} __attribute__ ((__packed__));
> +
> /* different types of block groups (and chunks) */
> #define BTRFS_BLOCK_GROUP_DATA (1ULL << 0)
> #define BTRFS_BLOCK_GROUP_SYSTEM (1ULL << 1)
> @@ -1508,6 +1528,12 @@ struct btrfs_ioctl_defrag_range_args {
> #define BTRFS_BALANCE_ITEM_KEY 248
>
> /*
> + * Persistently stores the io stats in the device tree.
> + * One key for all stats, (0, BTRFS_DEVICE_STATS_KEY, devid).
> + */
> +#define BTRFS_DEVICE_STATS_KEY 249
> +
> +/*
> * string items are for debugging. They just store a short string of
> * data in the FS
> */
> @@ -2415,6 +2441,31 @@ static inline u32 btrfs_file_extent_inline_item_len(struct extent_buffer *eb,
> return btrfs_item_size(eb, e) - offset;
> }
>
> +/* btrfs_device_stats_item */
> +BTRFS_SETGET_FUNCS(device_stats_cnt_write_io_errs,
> + struct btrfs_device_stats_item, cnt_write_io_errs, 64);
> +BTRFS_SETGET_FUNCS(device_stats_cnt_read_io_errs,
> + struct btrfs_device_stats_item, cnt_read_io_errs, 64);
> +BTRFS_SETGET_FUNCS(device_stats_cnt_flush_io_errs,
> + struct btrfs_device_stats_item, cnt_flush_io_errs, 64);
> +BTRFS_SETGET_FUNCS(device_stats_cnt_corruption_errs,
> + struct btrfs_device_stats_item, cnt_corruption_errs, 64);
> +BTRFS_SETGET_FUNCS(device_stats_cnt_generation_errs,
> + struct btrfs_device_stats_item, cnt_generation_errs, 64);
> +
> +BTRFS_SETGET_STACK_FUNCS(stack_device_stats_cnt_write_io_errs,
> + struct btrfs_device_stats_item, cnt_write_io_errs, 64);
> +BTRFS_SETGET_STACK_FUNCS(stack_device_stats_cnt_read_io_errs,
> + struct btrfs_device_stats_item, cnt_read_io_errs, 64);
> +BTRFS_SETGET_STACK_FUNCS(stack_device_stats_cnt_flush_io_errs,
> + struct btrfs_device_stats_item, cnt_flush_io_errs, 64);
> +BTRFS_SETGET_STACK_FUNCS(stack_device_stats_cnt_corruption_errs,
> + struct btrfs_device_stats_item, cnt_corruption_errs,
> + 64);
> +BTRFS_SETGET_STACK_FUNCS(stack_device_stats_cnt_generation_errs,
> + struct btrfs_device_stats_item, cnt_generation_errs,
> + 64);
> +
> static inline struct btrfs_fs_info *btrfs_sb(struct super_block *sb)
> {
> return sb->s_fs_info;
> diff --git a/fs/btrfs/disk-io.c b/fs/btrfs/disk-io.c
> index e123629..7ba08f7 100644
> --- a/fs/btrfs/disk-io.c
> +++ b/fs/btrfs/disk-io.c
> @@ -2353,6 +2353,13 @@ retry_root_backup:
> fs_info->generation = generation;
> fs_info->last_trans_committed = generation;
>
> + ret = btrfs_init_device_stats(fs_info);
> + if (ret) {
> + printk(KERN_ERR "btrfs: failed to init device_stats: %d\n",
> + ret);
> + goto fail_block_groups;
> + }
> +
> ret = btrfs_init_space_info(fs_info);
> if (ret) {
> printk(KERN_ERR "Failed to initial space info: %d\n", ret);
> diff --git a/fs/btrfs/print-tree.c b/fs/btrfs/print-tree.c
> index f38e452..a9e45e4 100644
> --- a/fs/btrfs/print-tree.c
> +++ b/fs/btrfs/print-tree.c
> @@ -294,6 +294,9 @@ void btrfs_print_leaf(struct btrfs_root *root, struct extent_buffer *l)
> btrfs_dev_extent_chunk_offset(l, dev_extent),
> (unsigned long long)
> btrfs_dev_extent_length(l, dev_extent));
> + case BTRFS_DEVICE_STATS_KEY:
> + printk(KERN_INFO "\t\tdevice stats\n");
> + break;
> };
> }
> }
> diff --git a/fs/btrfs/transaction.c b/fs/btrfs/transaction.c
> index 3642225..1722af0 100644
> --- a/fs/btrfs/transaction.c
> +++ b/fs/btrfs/transaction.c
> @@ -28,6 +28,7 @@
> #include "locking.h"
> #include "tree-log.h"
> #include "inode-map.h"
> +#include "volumes.h"
>
> #define BTRFS_ROOT_TRANS_TAG 0
>
> @@ -758,6 +759,9 @@ static noinline int commit_cowonly_roots(struct btrfs_trans_handle *trans,
> if (ret)
> return ret;
>
> + ret = btrfs_run_device_stats(trans, root->fs_info);
> + BUG_ON(ret);
> +
> while (!list_empty(&fs_info->dirty_cowonly_roots)) {
> next = fs_info->dirty_cowonly_roots.next;
> list_del_init(next);
> diff --git a/fs/btrfs/volumes.c b/fs/btrfs/volumes.c
> index 5f5a6ce..80d1a50 100644
> --- a/fs/btrfs/volumes.c
> +++ b/fs/btrfs/volumes.c
> @@ -40,6 +40,8 @@ static int init_first_rw_device(struct btrfs_trans_handle *trans,
> struct btrfs_root *root,
> struct btrfs_device *device);
> static int btrfs_relocate_sys_chunks(struct btrfs_root *root);
> +static void __btrfs_reset_device_stats(struct btrfs_device *dev);
> +static void btrfs_device_stat_print_on_load(struct btrfs_device *device);
>
> static DEFINE_MUTEX(uuid_mutex);
> static LIST_HEAD(fs_uuids);
> @@ -362,6 +364,7 @@ static noinline int device_list_add(const char *path,
> return -ENOMEM;
> }
> device->devid = devid;
> + device->device_stats_valid = 0;
> device->work.func = pending_bios_fn;
> memcpy(device->uuid, disk_super->dev_item.uuid,
> BTRFS_UUID_SIZE);
> @@ -4626,8 +4629,194 @@ error:
> return ret;
> }
>
> +static void __btrfs_reset_device_stats(struct btrfs_device *device)
> +{
> + btrfs_device_stat_reset(&device->cnt_write_io_errs);
> + btrfs_device_stat_reset(&device->cnt_read_io_errs);
> + btrfs_device_stat_reset(&device->cnt_flush_io_errs);
> + btrfs_device_stat_reset(&device->cnt_corruption_errs);
> + btrfs_device_stat_reset(&device->cnt_generation_errs);
> +}
> +
> +int btrfs_init_device_stats(struct btrfs_fs_info *fs_info)
> +{
> + struct btrfs_key key;
> + struct btrfs_key found_key;
> + struct btrfs_root *dev_root = fs_info->dev_root;
> + struct btrfs_fs_devices *fs_devices = fs_info->fs_devices;
> + struct extent_buffer *eb;
> + int slot;
> + int ret = 0;
> + struct btrfs_device *device;
> + struct btrfs_path *path = NULL;
> +
> + path = btrfs_alloc_path();
> + if (!path) {
> + ret = -ENOMEM;
> + goto out;
> + }
> +
> + mutex_lock(&fs_devices->device_list_mutex);
> + list_for_each_entry(device, &fs_devices->devices, dev_list) {
> + int item_size;
> + struct btrfs_device_stats_item *ptr;
> +
> + key.objectid = 0;
> + key.type = BTRFS_DEVICE_STATS_KEY;
> + key.offset = device->devid;
> + ret = btrfs_search_slot(NULL, dev_root, &key, path, 0, 0);
> + if (ret) {
> + printk(KERN_WARNING "btrfs: no device_stats entry found for device %s (devid %llu) (OK on first mount after mkfs)\n",
> + device->name, (unsigned long long)device->devid);
> + __btrfs_reset_device_stats(device);
> + device->device_stats_valid = 1;
> + device->device_stats_dirty = 1;
> + btrfs_release_path(path);
> + continue;
> + }
> + slot = path->slots[0];
> + eb = path->nodes[0];
> + btrfs_item_key_to_cpu(eb, &found_key, slot);
> + item_size = btrfs_item_size_nr(eb, slot);
> +
> + ptr = btrfs_item_ptr(eb, slot,
> + struct btrfs_device_stats_item);
> +
> + if (item_size >= 1 * sizeof(__le64))
> + btrfs_device_stat_set(&device->cnt_write_io_errs,
> + btrfs_device_stats_cnt_write_io_errs(eb, ptr));
> + else
> + btrfs_device_stat_reset(&device->cnt_write_io_errs);
> + if (item_size >= 2 * sizeof(__le64))
> + btrfs_device_stat_set(&device->cnt_read_io_errs,
> + btrfs_device_stats_cnt_read_io_errs(eb, ptr));
> + else
> + btrfs_device_stat_reset(&device->cnt_read_io_errs);
> + if (item_size >= 3 * sizeof(__le64))
> + btrfs_device_stat_set(&device->cnt_flush_io_errs,
> + btrfs_device_stats_cnt_flush_io_errs(eb, ptr));
> + else
> + btrfs_device_stat_reset(&device->cnt_flush_io_errs);
> + if (item_size >= 4 * sizeof(__le64))
> + btrfs_device_stat_set(&device->cnt_corruption_errs,
> + btrfs_device_stats_cnt_corruption_errs(eb,
> + ptr));
> + else
> + btrfs_device_stat_reset(&device->cnt_corruption_errs);
> + if (item_size >= 5 * sizeof(__le64))
> + btrfs_device_stat_set(&device->cnt_generation_errs,
> + btrfs_device_stats_cnt_generation_errs(eb,
> + ptr));
> + else
> + btrfs_device_stat_reset(&device->cnt_generation_errs);
> +
> + btrfs_device_stat_print_on_load(device);
> + device->device_stats_valid = 1;
> + btrfs_release_path(path);
> + }
> + mutex_unlock(&fs_devices->device_list_mutex);
> +
> +out:
> + btrfs_free_path(path);
> + return ret < 0 ? ret : 0;
> +}
> +
> +static int update_device_stat_item(struct btrfs_trans_handle *trans,
> + struct btrfs_root *dev_root,
> + struct btrfs_device *device)
> +{
> + struct btrfs_path *path;
> + struct btrfs_key key;
> + struct extent_buffer *eb;
> + struct btrfs_device_stats_item *ptr;
> + int ret;
> +
> + key.objectid = 0;
> + key.type = BTRFS_DEVICE_STATS_KEY;
> + key.offset = device->devid;
> +
> + path = btrfs_alloc_path();
> + BUG_ON(!path);
> + ret = btrfs_search_slot(trans, dev_root, &key, path, 0, 1);
> + if (ret < 0) {
> + printk(KERN_WARNING "btrfs: error %d while searching for device_stats item for device %s!\n",
> + ret, device->name);
> + goto out;
> + }
> +
> + if (0 == ret &&
> + btrfs_item_size_nr(path->nodes[0], path->slots[0]) < sizeof(*ptr)) {
> + /* need to delete old one and insert a new one */
> + ret = btrfs_del_item(trans, dev_root, path);
> + if (0 != ret) {
> + printk(KERN_WARNING "btrfs: delete too small device_stats item for device %s failed %d!\n",
> + device->name, ret);
> + goto out;
> + }
> + ret = 1;
> + }
> +
> + if (1 == ret) {
> + /* need to insert a new item */
> + btrfs_release_path(path);
> + ret = btrfs_insert_empty_item(trans, dev_root, path,
> + &key, sizeof(*ptr));
> + if (ret < 0) {
> + printk(KERN_WARNING "btrfs: insert device_stats item for device %s failed %d!\n",
> + device->name, ret);
> + goto out;
> + }
> + }
> +
> + eb = path->nodes[0];
> + ptr = btrfs_item_ptr(eb, path->slots[0],
> + struct btrfs_device_stats_item);
> + btrfs_set_device_stats_cnt_write_io_errs(eb, ptr,
> + btrfs_device_stat_read(&device->cnt_write_io_errs));
> + btrfs_set_device_stats_cnt_read_io_errs(eb, ptr,
> + btrfs_device_stat_read(&device->cnt_read_io_errs));
> + btrfs_set_device_stats_cnt_flush_io_errs(eb, ptr,
> + btrfs_device_stat_read(&device->cnt_flush_io_errs));
> + btrfs_set_device_stats_cnt_corruption_errs(eb, ptr,
> + btrfs_device_stat_read(&device->cnt_corruption_errs));
> + btrfs_set_device_stats_cnt_generation_errs(eb, ptr,
> + btrfs_device_stat_read(&device->cnt_generation_errs));
> + btrfs_mark_buffer_dirty(eb);
> +
> +out:
> + btrfs_free_path(path);
> + return ret;
> +}
> +
> +/*
> + * Called from commit_cowonly_roots() during transaction commit.
> + * Writes all changed device stats to disk.
> + */
> +int btrfs_run_device_stats(struct btrfs_trans_handle *trans,
> + struct btrfs_fs_info *fs_info)
> +{
> + struct btrfs_root *dev_root = fs_info->dev_root;
> + struct btrfs_fs_devices *fs_devices = fs_info->fs_devices;
> + struct btrfs_device *device;
> + int ret = 0;
> +
> + mutex_lock(&fs_devices->device_list_mutex);
> + list_for_each_entry(device, &fs_devices->devices, dev_list) {
> + if (!device->device_stats_valid || !device->device_stats_dirty)
> + continue;
> +
> + ret = update_device_stat_item(trans, dev_root, device);
> + if (!ret)
> + device->device_stats_dirty = 0;
> + }
> + mutex_unlock(&fs_devices->device_list_mutex);
> +
> + return ret;
> +}
> +
> void btrfs_device_stat_print_on_error(struct btrfs_device *device)
> {
> + if (!device->device_stats_valid)
> + return;
> printk_ratelimited(KERN_ERR
> "btrfs: bdev %s errs: wr %u, rd %u, flush %u, corrupt %u, gen %u\n",
> device->name,
> @@ -4639,6 +4828,18 @@ void btrfs_device_stat_print_on_error(struct btrfs_device *device)
> &device->cnt_generation_errs));
> }
>
> +static void btrfs_device_stat_print_on_load(struct btrfs_device *device)
> +{
> + printk(KERN_INFO "btrfs: bdev %s errs: wr %u, rd %u, flush %u,"
> + " corrupt %u, gen %u\n",
> + device->name,
> + btrfs_device_stat_read(&device->cnt_write_io_errs),
> + btrfs_device_stat_read(&device->cnt_read_io_errs),
> + btrfs_device_stat_read(&device->cnt_flush_io_errs),
> + btrfs_device_stat_read(&device->cnt_corruption_errs),
> + btrfs_device_stat_read(&device->cnt_generation_errs));
> +}
> +
> int btrfs_get_device_stats(struct btrfs_root *root,
> struct btrfs_ioctl_get_device_stats *stats,
> int reset_after_read)
> @@ -4654,6 +4855,10 @@ int btrfs_get_device_stats(struct btrfs_root *root,
> printk(KERN_WARNING
> "btrfs: get device_stats failed, device not found\n");
> return -ENODEV;
> + } else if (!dev->device_stats_valid) {
> + printk(KERN_WARNING
> + "btrfs: get device_stats failed, not yet valid\n");
> + return -ENODEV;
> } else if (reset_after_read) {
> if (stats->nr_items >= 1)
> stats->cnt_write_io_errs =
> diff --git a/fs/btrfs/volumes.h b/fs/btrfs/volumes.h
> index e0b31f1..3134662 100644
> --- a/fs/btrfs/volumes.h
> +++ b/fs/btrfs/volumes.h
> @@ -108,6 +108,7 @@ struct btrfs_device {
>
> /* disk I/O failure stats. For detailed description refer to
> * struct btrfs_device_stats_item in ctree.h */
> + int device_stats_valid;
> int device_stats_dirty; /* counters need to be written to disk */
> atomic_t cnt_write_io_errs;
> atomic_t cnt_read_io_errs;
> @@ -291,6 +292,9 @@ int find_free_dev_extent(struct btrfs_device *device, u64 num_bytes,
> u64 *start, u64 *max_avail);
> struct btrfs_device *btrfs_find_device_for_logical(struct btrfs_root *root,
> u64 logical, int mirror_num);
> +int btrfs_init_device_stats(struct btrfs_fs_info *fs_info);
> +int btrfs_run_device_stats(struct btrfs_trans_handle *trans,
> + struct btrfs_fs_info *fs_info);
> void btrfs_device_stat_print_on_error(struct btrfs_device *device);
> int btrfs_get_device_stats(struct btrfs_root *root,
> struct btrfs_ioctl_get_device_stats *stats,
> @@ -315,4 +319,9 @@ static inline void btrfs_device_stat_reset(atomic_t *cnt)
> {
> atomic_set(cnt, 0);
> }
> +
> +static inline void btrfs_device_stat_set(atomic_t *cnt, unsigned long val)
> +{
> + atomic_set(cnt, val);
> +}
> #endif
next prev parent reply other threads:[~2012-05-17 1:48 UTC|newest]
Thread overview: 8+ messages / expand[flat|nested] mbox.gz Atom feed top
2012-05-16 16:50 [PATCH v3 0/3] Btrfs: add IO error device stats Stefan Behrens
2012-05-16 16:50 ` [PATCH v3 1/3] Btrfs: add device counters for detected IO and checksum errors Stefan Behrens
2012-05-16 16:50 ` [PATCH v3 2/3] Btrfs: add ioctl to get and reset the device stats Stefan Behrens
2012-05-16 16:50 ` [PATCH v3 3/3] Btrfs: read device stats on mount, write modified ones during commit Stefan Behrens
2012-05-17 1:52 ` Liu Bo [this message]
2012-05-17 8:49 ` Stefan Behrens
2012-05-18 11:57 ` David Sterba
2012-05-21 14:57 ` Stefan Behrens
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=4FB459F0.3050502@cn.fujitsu.com \
--to=liubo2009@cn.fujitsu.com \
--cc=linux-btrfs@vger.kernel.org \
--cc=sbehrens@giantdisaster.de \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.