All of lore.kernel.org
 help / color / mirror / Atom feed
From: Eric Sandeen <sandeen@redhat.com>
To: "Theodore Ts'o" <tytso@mit.edu>
Cc: Ext4 Developers List <linux-ext4@vger.kernel.org>
Subject: Re: [PATCH] ext4: add ratelimiting to ext4 messages
Date: Fri, 18 Oct 2013 09:08:40 -0500	[thread overview]
Message-ID: <526140E8.7000002@redhat.com> (raw)
In-Reply-To: <1382059728-29483-1-git-send-email-tytso@mit.edu>

On 10/17/13 8:28 PM, Theodore Ts'o wrote:
> In the case of a storage device that suddenly disappears, or in the
> case of significant file system corruption, this can result in a huge
> flood of messages being sent to the console.  This can overflow the
> file system containing /var/log/messages, or if a serial console is
> configured, this can slow down the system so much that a hardware
> watchdog can end up triggering, forcing a system reboot.

Just out of curiosity, after the fs shuts down, is there still a flood
of messages?  Shouldn't that clamp down on the errors?

If not, shouldn't it do so?  xfs has a lot of short-circuiting if
the filesystem is shut down, so it (I think) won't get into paths that
will generate more errors.

(If not, would just shutting up ext4_* error messages post-shutdown accomplish
the same thing w/ fewer lines & fewer /proc configuration knobs?)

Just a thought,

-Eric

> Google-Bug-Id: 7258357
> 
> Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
> ---
>  fs/ext4/ext4.h  |   6 +++
>  fs/ext4/super.c | 152 +++++++++++++++++++++++++++++++++++---------------------
>  2 files changed, 100 insertions(+), 58 deletions(-)
> 
> diff --git a/fs/ext4/ext4.h b/fs/ext4/ext4.h
> index af815ea..65485ab 100644
> --- a/fs/ext4/ext4.h
> +++ b/fs/ext4/ext4.h
> @@ -29,6 +29,7 @@
>  #include <linux/wait.h>
>  #include <linux/blockgroup_lock.h>
>  #include <linux/percpu_counter.h>
> +#include <linux/ratelimit.h>
>  #include <crypto/hash.h>
>  #ifdef __KERNEL__
>  #include <linux/compat.h>
> @@ -1314,6 +1315,11 @@ struct ext4_sb_info {
>  	unsigned long s_es_last_sorted;
>  	struct percpu_counter s_extent_cache_cnt;
>  	spinlock_t s_es_lru_lock ____cacheline_aligned_in_smp;
> +
> +	/* Ratelimit ext4 messages. */
> +	struct ratelimit_state s_err_ratelimit_state;
> +	struct ratelimit_state s_warning_ratelimit_state;
> +	struct ratelimit_state s_msg_ratelimit_state;
>  };
>  
>  static inline struct ext4_sb_info *EXT4_SB(struct super_block *sb)
> diff --git a/fs/ext4/super.c b/fs/ext4/super.c
> index 2c2e6cb..d3a857b 100644
> --- a/fs/ext4/super.c
> +++ b/fs/ext4/super.c
> @@ -411,20 +411,26 @@ static void ext4_handle_error(struct super_block *sb)
>  			sb->s_id);
>  }
>  
> +#define ext4_error_ratelimit(sb)					\
> +		___ratelimit(&(EXT4_SB(sb)->s_err_ratelimit_state),	\
> +			     "EXT4-fs error")
> +
>  void __ext4_error(struct super_block *sb, const char *function,
>  		  unsigned int line, const char *fmt, ...)
>  {
>  	struct va_format vaf;
>  	va_list args;
>  
> -	va_start(args, fmt);
> -	vaf.fmt = fmt;
> -	vaf.va = &args;
> -	printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: comm %s: %pV\n",
> -	       sb->s_id, function, line, current->comm, &vaf);
> -	va_end(args);
> +	if (ext4_error_ratelimit(sb)) {
> +		va_start(args, fmt);
> +		vaf.fmt = fmt;
> +		vaf.va = &args;
> +		printk(KERN_CRIT
> +		       "EXT4-fs error (device %s): %s:%d: comm %s: %pV\n",
> +		       sb->s_id, function, line, current->comm, &vaf);
> +		va_end(args);
> +	}
>  	save_error_info(sb, function, line);
> -
>  	ext4_handle_error(sb);
>  }
>  
> @@ -438,22 +444,23 @@ void __ext4_error_inode(struct inode *inode, const char *function,
>  
>  	es->s_last_error_ino = cpu_to_le32(inode->i_ino);
>  	es->s_last_error_block = cpu_to_le64(block);
> +	if (ext4_error_ratelimit(inode->i_sb)) {
> +		va_start(args, fmt);
> +		vaf.fmt = fmt;
> +		vaf.va = &args;
> +		if (block)
> +			printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
> +			       "inode #%lu: block %llu: comm %s: %pV\n",
> +			       inode->i_sb->s_id, function, line, inode->i_ino,
> +			       block, current->comm, &vaf);
> +		else
> +			printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
> +			       "inode #%lu: comm %s: %pV\n",
> +			       inode->i_sb->s_id, function, line, inode->i_ino,
> +			       current->comm, &vaf);
> +		va_end(args);
> +	}
>  	save_error_info(inode->i_sb, function, line);
> -	va_start(args, fmt);
> -	vaf.fmt = fmt;
> -	vaf.va = &args;
> -	if (block)
> -		printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
> -		       "inode #%lu: block %llu: comm %s: %pV\n",
> -		       inode->i_sb->s_id, function, line, inode->i_ino,
> -		       block, current->comm, &vaf);
> -	else
> -		printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
> -		       "inode #%lu: comm %s: %pV\n",
> -		       inode->i_sb->s_id, function, line, inode->i_ino,
> -		       current->comm, &vaf);
> -	va_end(args);
> -
>  	ext4_handle_error(inode->i_sb);
>  }
>  
> @@ -469,27 +476,28 @@ void __ext4_error_file(struct file *file, const char *function,
>  
>  	es = EXT4_SB(inode->i_sb)->s_es;
>  	es->s_last_error_ino = cpu_to_le32(inode->i_ino);
> +	if (ext4_error_ratelimit(inode->i_sb)) {
> +		path = d_path(&(file->f_path), pathname, sizeof(pathname));
> +		if (IS_ERR(path))
> +			path = "(unknown)";
> +		va_start(args, fmt);
> +		vaf.fmt = fmt;
> +		vaf.va = &args;
> +		if (block)
> +			printk(KERN_CRIT
> +			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
> +			       "block %llu: comm %s: path %s: %pV\n",
> +			       inode->i_sb->s_id, function, line, inode->i_ino,
> +			       block, current->comm, path, &vaf);
> +		else
> +			printk(KERN_CRIT
> +			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
> +			       "comm %s: path %s: %pV\n",
> +			       inode->i_sb->s_id, function, line, inode->i_ino,
> +			       current->comm, path, &vaf);
> +		va_end(args);
> +	}
>  	save_error_info(inode->i_sb, function, line);
> -	path = d_path(&(file->f_path), pathname, sizeof(pathname));
> -	if (IS_ERR(path))
> -		path = "(unknown)";
> -	va_start(args, fmt);
> -	vaf.fmt = fmt;
> -	vaf.va = &args;
> -	if (block)
> -		printk(KERN_CRIT
> -		       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
> -		       "block %llu: comm %s: path %s: %pV\n",
> -		       inode->i_sb->s_id, function, line, inode->i_ino,
> -		       block, current->comm, path, &vaf);
> -	else
> -		printk(KERN_CRIT
> -		       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
> -		       "comm %s: path %s: %pV\n",
> -		       inode->i_sb->s_id, function, line, inode->i_ino,
> -		       current->comm, path, &vaf);
> -	va_end(args);
> -
>  	ext4_handle_error(inode->i_sb);
>  }
>  
> @@ -543,11 +551,13 @@ void __ext4_std_error(struct super_block *sb, const char *function,
>  	    (sb->s_flags & MS_RDONLY))
>  		return;
>  
> -	errstr = ext4_decode_error(sb, errno, nbuf);
> -	printk(KERN_CRIT "EXT4-fs error (device %s) in %s:%d: %s\n",
> -	       sb->s_id, function, line, errstr);
> -	save_error_info(sb, function, line);
> +	if (ext4_error_ratelimit(sb)) {
> +		errstr = ext4_decode_error(sb, errno, nbuf);
> +		printk(KERN_CRIT "EXT4-fs error (device %s) in %s:%d: %s\n",
> +		       sb->s_id, function, line, errstr);
> +	}
>  
> +	save_error_info(sb, function, line);
>  	ext4_handle_error(sb);
>  }
>  
> @@ -597,6 +607,9 @@ void __ext4_msg(struct super_block *sb,
>  	struct va_format vaf;
>  	va_list args;
>  
> +	if (!___ratelimit(&(EXT4_SB(sb)->s_msg_ratelimit_state), "EXT4-fs"))
> +		return;
> +
>  	va_start(args, fmt);
>  	vaf.fmt = fmt;
>  	vaf.va = &args;
> @@ -610,6 +623,10 @@ void __ext4_warning(struct super_block *sb, const char *function,
>  	struct va_format vaf;
>  	va_list args;
>  
> +	if (!___ratelimit(&(EXT4_SB(sb)->s_warning_ratelimit_state),
> +			  "EXT4-fs warning"))
> +		return;
> +
>  	va_start(args, fmt);
>  	vaf.fmt = fmt;
>  	vaf.va = &args;
> @@ -633,18 +650,20 @@ __acquires(bitlock)
>  	es->s_last_error_block = cpu_to_le64(block);
>  	__save_error_info(sb, function, line);
>  
> -	va_start(args, fmt);
> -
> -	vaf.fmt = fmt;
> -	vaf.va = &args;
> -	printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: group %u, ",
> -	       sb->s_id, function, line, grp);
> -	if (ino)
> -		printk(KERN_CONT "inode %lu: ", ino);
> -	if (block)
> -		printk(KERN_CONT "block %llu:", (unsigned long long) block);
> -	printk(KERN_CONT "%pV\n", &vaf);
> -	va_end(args);
> +	if (ext4_error_ratelimit(sb)) {
> +		va_start(args, fmt);
> +		vaf.fmt = fmt;
> +		vaf.va = &args;
> +		printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: group %u, ",
> +		       sb->s_id, function, line, grp);
> +		if (ino)
> +			printk(KERN_CONT "inode %lu: ", ino);
> +		if (block)
> +			printk(KERN_CONT "block %llu:",
> +			       (unsigned long long) block);
> +		printk(KERN_CONT "%pV\n", &vaf);
> +		va_end(args);
> +	}
>  
>  	if (test_opt(sb, ERRORS_CONT)) {
>  		ext4_commit_super(sb, 0);
> @@ -2606,6 +2625,12 @@ EXT4_RW_ATTR_SBI_UI(mb_group_prealloc, s_mb_group_prealloc);
>  EXT4_DEPRECATED_ATTR(max_writeback_mb_bump, 128);
>  EXT4_RW_ATTR_SBI_UI(extent_max_zeroout_kb, s_extent_max_zeroout_kb);
>  EXT4_ATTR(trigger_fs_error, 0200, NULL, trigger_test_error);
> +EXT4_RW_ATTR_SBI_UI(err_ratelimit_interval_ms, s_err_ratelimit_state.interval);
> +EXT4_RW_ATTR_SBI_UI(err_ratelimit_burst, s_err_ratelimit_state.burst);
> +EXT4_RW_ATTR_SBI_UI(warning_ratelimit_interval_ms, s_warning_ratelimit_state.interval);
> +EXT4_RW_ATTR_SBI_UI(warning_ratelimit_burst, s_warning_ratelimit_state.burst);
> +EXT4_RW_ATTR_SBI_UI(msg_ratelimit_interval_ms, s_msg_ratelimit_state.interval);
> +EXT4_RW_ATTR_SBI_UI(msg_ratelimit_burst, s_msg_ratelimit_state.burst);
>  
>  static struct attribute *ext4_attrs[] = {
>  	ATTR_LIST(delayed_allocation_blocks),
> @@ -2623,6 +2648,12 @@ static struct attribute *ext4_attrs[] = {
>  	ATTR_LIST(max_writeback_mb_bump),
>  	ATTR_LIST(extent_max_zeroout_kb),
>  	ATTR_LIST(trigger_fs_error),
> +	ATTR_LIST(err_ratelimit_interval_ms),
> +	ATTR_LIST(err_ratelimit_burst),
> +	ATTR_LIST(warning_ratelimit_interval_ms),
> +	ATTR_LIST(warning_ratelimit_burst),
> +	ATTR_LIST(msg_ratelimit_interval_ms),
> +	ATTR_LIST(msg_ratelimit_burst),
>  	NULL,
>  };
>  
> @@ -4118,6 +4149,11 @@ no_journal:
>  	if (es->s_error_count)
>  		mod_timer(&sbi->s_err_report, jiffies + 300*HZ); /* 5 minutes */
>  
> +	/* Enable message ratelimiting. Default is 10 messages per 5 secs. */
> +	ratelimit_state_init(&sbi->s_err_ratelimit_state, 5 * HZ, 10);
> +	ratelimit_state_init(&sbi->s_warning_ratelimit_state, 5 * HZ, 10);
> +	ratelimit_state_init(&sbi->s_msg_ratelimit_state, 5 * HZ, 10);
> +
>  	kfree(orig_data);
>  	return 0;
>  
> 


  parent reply	other threads:[~2013-10-18 14:08 UTC|newest]

Thread overview: 8+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2013-10-18  1:28 [PATCH] ext4: add ratelimiting to ext4 messages Theodore Ts'o
2013-10-18 13:08 ` Lukáš Czerner
2013-10-18 14:08 ` Eric Sandeen [this message]
2013-10-18 18:59   ` Theodore Ts'o
2013-10-19 23:04     ` Eric Sandeen
2013-10-20 11:18       ` Theodore Ts'o
2013-10-20 23:15         ` Dave Chinner
2013-10-21  9:43     ` Zheng Liu

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=526140E8.7000002@redhat.com \
    --to=sandeen@redhat.com \
    --cc=linux-ext4@vger.kernel.org \
    --cc=tytso@mit.edu \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.