From: "Darrick J. Wong" <djwong@kernel.org>
To: "Ritesh Harjani (IBM)" <ritesh.list@gmail.com>
Cc: linux-xfs@vger.kernel.org, linux-fsdevel@vger.kernel.org,
Matthew Wilcox <willy@infradead.org>,
Christoph Hellwig <hch@infradead.org>,
Brian Foster <bfoster@redhat.com>,
Andreas Gruenbacher <agruenba@redhat.com>,
Christoph Hellwig <hch@lst.de>
Subject: Re: [PATCHv11 1/8] iomap: Rename iomap_page to iomap_folio_state and others
Date: Wed, 12 Jul 2023 21:31:14 -0700
Message-ID: <20230713043114.GA108251@frogsfrogsfrogs>
In-Reply-To: <b41b605a29e1306bc3cafa4e1c577c051e8dd8bd.1688188958.git.ritesh.list@gmail.com>
On Sat, Jul 01, 2023 at 01:04:34PM +0530, Ritesh Harjani (IBM) wrote:
> struct iomap_page actually tracks per-block state of a folio.
> Hence it makes sense to rename some of these functions and data
> structures, for example:
> 1. struct iomap_page (iop) -> struct iomap_folio_state (ifs)
> 2. iomap_page_create() -> ifs_alloc()
> 3. iomap_page_release() -> ifs_free()
> 4. iomap_iop_set_range_uptodate() -> ifs_set_range_uptodate()
> 5. to_iomap_page() -> folio->private
>
> Since later patches will also add per-block dirty state tracking to
> iomap_folio_state, this patch also renames the "uptodate" and
> "uptodate_lock" members of iomap_folio_state to "state" and "state_lock".
>
> We don't really need the to_iomap_page() helper anymore; instead,
> directly open code it as folio->private.
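>
> For clarity, the open-coded form used throughout the diff below is
> (sketch only; folio->private is NULL whenever no per-block state is
> attached, so the NULL check that to_iomap_page() used to do is implicit):
>
>	/* before: helper that checked folio_test_private() first */
>	struct iomap_page *iop = to_iomap_page(folio);
>
>	/* after: read folio->private directly; NULL means no per-block state */
>	struct iomap_folio_state *ifs = folio->private;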
>
> Reviewed-by: Christoph Hellwig <hch@lst.de>
> Signed-off-by: Ritesh Harjani (IBM) <ritesh.list@gmail.com>
Reviewed-by: Darrick J. Wong <djwong@kernel.org>
--D
> ---
> fs/iomap/buffered-io.c | 151 ++++++++++++++++++++---------------------
> 1 file changed, 72 insertions(+), 79 deletions(-)
>
> diff --git a/fs/iomap/buffered-io.c b/fs/iomap/buffered-io.c
> index 063133ec77f4..2675a3e0ac1d 100644
> --- a/fs/iomap/buffered-io.c
> +++ b/fs/iomap/buffered-io.c
> @@ -24,64 +24,57 @@
> #define IOEND_BATCH_SIZE 4096
>
> /*
> - * Structure allocated for each folio when block size < folio size
> - * to track sub-folio uptodate status and I/O completions.
> + * Structure allocated for each folio to track per-block uptodate state
> + * and I/O completions.
> */
> -struct iomap_page {
> +struct iomap_folio_state {
> atomic_t read_bytes_pending;
> atomic_t write_bytes_pending;
> - spinlock_t uptodate_lock;
> - unsigned long uptodate[];
> + spinlock_t state_lock;
> + unsigned long state[];
> };
>
> -static inline struct iomap_page *to_iomap_page(struct folio *folio)
> -{
> - if (folio_test_private(folio))
> - return folio_get_private(folio);
> - return NULL;
> -}
> -
> static struct bio_set iomap_ioend_bioset;
>
> -static struct iomap_page *
> -iomap_page_create(struct inode *inode, struct folio *folio, unsigned int flags)
> +static struct iomap_folio_state *ifs_alloc(struct inode *inode,
> + struct folio *folio, unsigned int flags)
> {
> - struct iomap_page *iop = to_iomap_page(folio);
> + struct iomap_folio_state *ifs = folio->private;
> unsigned int nr_blocks = i_blocks_per_folio(inode, folio);
> gfp_t gfp;
>
> - if (iop || nr_blocks <= 1)
> - return iop;
> + if (ifs || nr_blocks <= 1)
> + return ifs;
>
> if (flags & IOMAP_NOWAIT)
> gfp = GFP_NOWAIT;
> else
> gfp = GFP_NOFS | __GFP_NOFAIL;
>
> - iop = kzalloc(struct_size(iop, uptodate, BITS_TO_LONGS(nr_blocks)),
> + ifs = kzalloc(struct_size(ifs, state, BITS_TO_LONGS(nr_blocks)),
> gfp);
> - if (iop) {
> - spin_lock_init(&iop->uptodate_lock);
> + if (ifs) {
> + spin_lock_init(&ifs->state_lock);
> if (folio_test_uptodate(folio))
> - bitmap_fill(iop->uptodate, nr_blocks);
> - folio_attach_private(folio, iop);
> + bitmap_fill(ifs->state, nr_blocks);
> + folio_attach_private(folio, ifs);
> }
> - return iop;
> + return ifs;
> }
>
> -static void iomap_page_release(struct folio *folio)
> +static void ifs_free(struct folio *folio)
> {
> - struct iomap_page *iop = folio_detach_private(folio);
> + struct iomap_folio_state *ifs = folio_detach_private(folio);
> struct inode *inode = folio->mapping->host;
> unsigned int nr_blocks = i_blocks_per_folio(inode, folio);
>
> - if (!iop)
> + if (!ifs)
> return;
> - WARN_ON_ONCE(atomic_read(&iop->read_bytes_pending));
> - WARN_ON_ONCE(atomic_read(&iop->write_bytes_pending));
> - WARN_ON_ONCE(bitmap_full(iop->uptodate, nr_blocks) !=
> + WARN_ON_ONCE(atomic_read(&ifs->read_bytes_pending));
> + WARN_ON_ONCE(atomic_read(&ifs->write_bytes_pending));
> + WARN_ON_ONCE(bitmap_full(ifs->state, nr_blocks) !=
> folio_test_uptodate(folio));
> - kfree(iop);
> + kfree(ifs);
> }
>
> /*
> @@ -90,7 +83,7 @@ static void iomap_page_release(struct folio *folio)
> static void iomap_adjust_read_range(struct inode *inode, struct folio *folio,
> loff_t *pos, loff_t length, size_t *offp, size_t *lenp)
> {
> - struct iomap_page *iop = to_iomap_page(folio);
> + struct iomap_folio_state *ifs = folio->private;
> loff_t orig_pos = *pos;
> loff_t isize = i_size_read(inode);
> unsigned block_bits = inode->i_blkbits;
> @@ -105,12 +98,12 @@ static void iomap_adjust_read_range(struct inode *inode, struct folio *folio,
> * per-block uptodate status and adjust the offset and length if needed
> * to avoid reading in already uptodate ranges.
> */
> - if (iop) {
> + if (ifs) {
> unsigned int i;
>
> /* move forward for each leading block marked uptodate */
> for (i = first; i <= last; i++) {
> - if (!test_bit(i, iop->uptodate))
> + if (!test_bit(i, ifs->state))
> break;
> *pos += block_size;
> poff += block_size;
> @@ -120,7 +113,7 @@ static void iomap_adjust_read_range(struct inode *inode, struct folio *folio,
>
> /* truncate len if we find any trailing uptodate block(s) */
> for ( ; i <= last; i++) {
> - if (test_bit(i, iop->uptodate)) {
> + if (test_bit(i, ifs->state)) {
> plen -= (last - i + 1) * block_size;
> last = i - 1;
> break;
> @@ -144,26 +137,26 @@ static void iomap_adjust_read_range(struct inode *inode, struct folio *folio,
> *lenp = plen;
> }
>
> -static void iomap_iop_set_range_uptodate(struct folio *folio,
> - struct iomap_page *iop, size_t off, size_t len)
> +static void ifs_set_range_uptodate(struct folio *folio,
> + struct iomap_folio_state *ifs, size_t off, size_t len)
> {
> struct inode *inode = folio->mapping->host;
> unsigned first = off >> inode->i_blkbits;
> unsigned last = (off + len - 1) >> inode->i_blkbits;
> unsigned long flags;
>
> - spin_lock_irqsave(&iop->uptodate_lock, flags);
> - bitmap_set(iop->uptodate, first, last - first + 1);
> - if (bitmap_full(iop->uptodate, i_blocks_per_folio(inode, folio)))
> + spin_lock_irqsave(&ifs->state_lock, flags);
> + bitmap_set(ifs->state, first, last - first + 1);
> + if (bitmap_full(ifs->state, i_blocks_per_folio(inode, folio)))
> folio_mark_uptodate(folio);
> - spin_unlock_irqrestore(&iop->uptodate_lock, flags);
> + spin_unlock_irqrestore(&ifs->state_lock, flags);
> }
>
> static void iomap_set_range_uptodate(struct folio *folio,
> - struct iomap_page *iop, size_t off, size_t len)
> + struct iomap_folio_state *ifs, size_t off, size_t len)
> {
> - if (iop)
> - iomap_iop_set_range_uptodate(folio, iop, off, len);
> + if (ifs)
> + ifs_set_range_uptodate(folio, ifs, off, len);
> else
> folio_mark_uptodate(folio);
> }
> @@ -171,16 +164,16 @@ static void iomap_set_range_uptodate(struct folio *folio,
> static void iomap_finish_folio_read(struct folio *folio, size_t offset,
> size_t len, int error)
> {
> - struct iomap_page *iop = to_iomap_page(folio);
> + struct iomap_folio_state *ifs = folio->private;
>
> if (unlikely(error)) {
> folio_clear_uptodate(folio);
> folio_set_error(folio);
> } else {
> - iomap_set_range_uptodate(folio, iop, offset, len);
> + iomap_set_range_uptodate(folio, ifs, offset, len);
> }
>
> - if (!iop || atomic_sub_and_test(len, &iop->read_bytes_pending))
> + if (!ifs || atomic_sub_and_test(len, &ifs->read_bytes_pending))
> folio_unlock(folio);
> }
>
> @@ -213,7 +206,7 @@ struct iomap_readpage_ctx {
> static int iomap_read_inline_data(const struct iomap_iter *iter,
> struct folio *folio)
> {
> - struct iomap_page *iop;
> + struct iomap_folio_state *ifs;
> const struct iomap *iomap = iomap_iter_srcmap(iter);
> size_t size = i_size_read(iter->inode) - iomap->offset;
> size_t poff = offset_in_page(iomap->offset);
> @@ -231,15 +224,15 @@ static int iomap_read_inline_data(const struct iomap_iter *iter,
> if (WARN_ON_ONCE(size > iomap->length))
> return -EIO;
> if (offset > 0)
> - iop = iomap_page_create(iter->inode, folio, iter->flags);
> + ifs = ifs_alloc(iter->inode, folio, iter->flags);
> else
> - iop = to_iomap_page(folio);
> + ifs = folio->private;
>
> addr = kmap_local_folio(folio, offset);
> memcpy(addr, iomap->inline_data, size);
> memset(addr + size, 0, PAGE_SIZE - poff - size);
> kunmap_local(addr);
> - iomap_set_range_uptodate(folio, iop, offset, PAGE_SIZE - poff);
> + iomap_set_range_uptodate(folio, ifs, offset, PAGE_SIZE - poff);
> return 0;
> }
>
> @@ -260,7 +253,7 @@ static loff_t iomap_readpage_iter(const struct iomap_iter *iter,
> loff_t pos = iter->pos + offset;
> loff_t length = iomap_length(iter) - offset;
> struct folio *folio = ctx->cur_folio;
> - struct iomap_page *iop;
> + struct iomap_folio_state *ifs;
> loff_t orig_pos = pos;
> size_t poff, plen;
> sector_t sector;
> @@ -269,20 +262,20 @@ static loff_t iomap_readpage_iter(const struct iomap_iter *iter,
> return iomap_read_inline_data(iter, folio);
>
> /* zero post-eof blocks as the page may be mapped */
> - iop = iomap_page_create(iter->inode, folio, iter->flags);
> + ifs = ifs_alloc(iter->inode, folio, iter->flags);
> iomap_adjust_read_range(iter->inode, folio, &pos, length, &poff, &plen);
> if (plen == 0)
> goto done;
>
> if (iomap_block_needs_zeroing(iter, pos)) {
> folio_zero_range(folio, poff, plen);
> - iomap_set_range_uptodate(folio, iop, poff, plen);
> + iomap_set_range_uptodate(folio, ifs, poff, plen);
> goto done;
> }
>
> ctx->cur_folio_in_bio = true;
> - if (iop)
> - atomic_add(plen, &iop->read_bytes_pending);
> + if (ifs)
> + atomic_add(plen, &ifs->read_bytes_pending);
>
> sector = iomap_sector(iomap, pos);
> if (!ctx->bio ||
> @@ -436,11 +429,11 @@ EXPORT_SYMBOL_GPL(iomap_readahead);
> */
> bool iomap_is_partially_uptodate(struct folio *folio, size_t from, size_t count)
> {
> - struct iomap_page *iop = to_iomap_page(folio);
> + struct iomap_folio_state *ifs = folio->private;
> struct inode *inode = folio->mapping->host;
> unsigned first, last, i;
>
> - if (!iop)
> + if (!ifs)
> return false;
>
> /* Caller's range may extend past the end of this folio */
> @@ -451,7 +444,7 @@ bool iomap_is_partially_uptodate(struct folio *folio, size_t from, size_t count)
> last = (from + count - 1) >> inode->i_blkbits;
>
> for (i = first; i <= last; i++)
> - if (!test_bit(i, iop->uptodate))
> + if (!test_bit(i, ifs->state))
> return false;
> return true;
> }
> @@ -490,7 +483,7 @@ bool iomap_release_folio(struct folio *folio, gfp_t gfp_flags)
> */
> if (folio_test_dirty(folio) || folio_test_writeback(folio))
> return false;
> - iomap_page_release(folio);
> + ifs_free(folio);
> return true;
> }
> EXPORT_SYMBOL_GPL(iomap_release_folio);
> @@ -507,12 +500,12 @@ void iomap_invalidate_folio(struct folio *folio, size_t offset, size_t len)
> if (offset == 0 && len == folio_size(folio)) {
> WARN_ON_ONCE(folio_test_writeback(folio));
> folio_cancel_dirty(folio);
> - iomap_page_release(folio);
> + ifs_free(folio);
> } else if (folio_test_large(folio)) {
> - /* Must release the iop so the page can be split */
> + /* Must release the ifs so the page can be split */
> WARN_ON_ONCE(!folio_test_uptodate(folio) &&
> folio_test_dirty(folio));
> - iomap_page_release(folio);
> + ifs_free(folio);
> }
> }
> EXPORT_SYMBOL_GPL(iomap_invalidate_folio);
> @@ -547,7 +540,7 @@ static int __iomap_write_begin(const struct iomap_iter *iter, loff_t pos,
> size_t len, struct folio *folio)
> {
> const struct iomap *srcmap = iomap_iter_srcmap(iter);
> - struct iomap_page *iop;
> + struct iomap_folio_state *ifs;
> loff_t block_size = i_blocksize(iter->inode);
> loff_t block_start = round_down(pos, block_size);
> loff_t block_end = round_up(pos + len, block_size);
> @@ -559,8 +552,8 @@ static int __iomap_write_begin(const struct iomap_iter *iter, loff_t pos,
> return 0;
> folio_clear_error(folio);
>
> - iop = iomap_page_create(iter->inode, folio, iter->flags);
> - if ((iter->flags & IOMAP_NOWAIT) && !iop && nr_blocks > 1)
> + ifs = ifs_alloc(iter->inode, folio, iter->flags);
> + if ((iter->flags & IOMAP_NOWAIT) && !ifs && nr_blocks > 1)
> return -EAGAIN;
>
> do {
> @@ -589,7 +582,7 @@ static int __iomap_write_begin(const struct iomap_iter *iter, loff_t pos,
> if (status)
> return status;
> }
> - iomap_set_range_uptodate(folio, iop, poff, plen);
> + iomap_set_range_uptodate(folio, ifs, poff, plen);
> } while ((block_start += plen) < block_end);
>
> return 0;
> @@ -696,7 +689,7 @@ static int iomap_write_begin(struct iomap_iter *iter, loff_t pos,
> static size_t __iomap_write_end(struct inode *inode, loff_t pos, size_t len,
> size_t copied, struct folio *folio)
> {
> - struct iomap_page *iop = to_iomap_page(folio);
> + struct iomap_folio_state *ifs = folio->private;
> flush_dcache_folio(folio);
>
> /*
> @@ -712,7 +705,7 @@ static size_t __iomap_write_end(struct inode *inode, loff_t pos, size_t len,
> */
> if (unlikely(copied < len && !folio_test_uptodate(folio)))
> return 0;
> - iomap_set_range_uptodate(folio, iop, offset_in_folio(folio, pos), len);
> + iomap_set_range_uptodate(folio, ifs, offset_in_folio(folio, pos), len);
> filemap_dirty_folio(inode->i_mapping, folio);
> return copied;
> }
> @@ -1290,17 +1283,17 @@ EXPORT_SYMBOL_GPL(iomap_page_mkwrite);
> static void iomap_finish_folio_write(struct inode *inode, struct folio *folio,
> size_t len, int error)
> {
> - struct iomap_page *iop = to_iomap_page(folio);
> + struct iomap_folio_state *ifs = folio->private;
>
> if (error) {
> folio_set_error(folio);
> mapping_set_error(inode->i_mapping, error);
> }
>
> - WARN_ON_ONCE(i_blocks_per_folio(inode, folio) > 1 && !iop);
> - WARN_ON_ONCE(iop && atomic_read(&iop->write_bytes_pending) <= 0);
> + WARN_ON_ONCE(i_blocks_per_folio(inode, folio) > 1 && !ifs);
> + WARN_ON_ONCE(ifs && atomic_read(&ifs->write_bytes_pending) <= 0);
>
> - if (!iop || atomic_sub_and_test(len, &iop->write_bytes_pending))
> + if (!ifs || atomic_sub_and_test(len, &ifs->write_bytes_pending))
> folio_end_writeback(folio);
> }
>
> @@ -1567,7 +1560,7 @@ iomap_can_add_to_ioend(struct iomap_writepage_ctx *wpc, loff_t offset,
> */
> static void
> iomap_add_to_ioend(struct inode *inode, loff_t pos, struct folio *folio,
> - struct iomap_page *iop, struct iomap_writepage_ctx *wpc,
> + struct iomap_folio_state *ifs, struct iomap_writepage_ctx *wpc,
> struct writeback_control *wbc, struct list_head *iolist)
> {
> sector_t sector = iomap_sector(&wpc->iomap, pos);
> @@ -1585,8 +1578,8 @@ iomap_add_to_ioend(struct inode *inode, loff_t pos, struct folio *folio,
> bio_add_folio(wpc->ioend->io_bio, folio, len, poff);
> }
>
> - if (iop)
> - atomic_add(len, &iop->write_bytes_pending);
> + if (ifs)
> + atomic_add(len, &ifs->write_bytes_pending);
> wpc->ioend->io_size += len;
> wbc_account_cgroup_owner(wbc, &folio->page, len);
> }
> @@ -1612,7 +1605,7 @@ iomap_writepage_map(struct iomap_writepage_ctx *wpc,
> struct writeback_control *wbc, struct inode *inode,
> struct folio *folio, u64 end_pos)
> {
> - struct iomap_page *iop = iomap_page_create(inode, folio, 0);
> + struct iomap_folio_state *ifs = ifs_alloc(inode, folio, 0);
> struct iomap_ioend *ioend, *next;
> unsigned len = i_blocksize(inode);
> unsigned nblocks = i_blocks_per_folio(inode, folio);
> @@ -1620,7 +1613,7 @@ iomap_writepage_map(struct iomap_writepage_ctx *wpc,
> int error = 0, count = 0, i;
> LIST_HEAD(submit_list);
>
> - WARN_ON_ONCE(iop && atomic_read(&iop->write_bytes_pending) != 0);
> + WARN_ON_ONCE(ifs && atomic_read(&ifs->write_bytes_pending) != 0);
>
> /*
> * Walk through the folio to find areas to write back. If we
> @@ -1628,7 +1621,7 @@ iomap_writepage_map(struct iomap_writepage_ctx *wpc,
> * invalid, grab a new one.
> */
> for (i = 0; i < nblocks && pos < end_pos; i++, pos += len) {
> - if (iop && !test_bit(i, iop->uptodate))
> + if (ifs && !test_bit(i, ifs->state))
> continue;
>
> error = wpc->ops->map_blocks(wpc, inode, pos);
> @@ -1639,7 +1632,7 @@ iomap_writepage_map(struct iomap_writepage_ctx *wpc,
> continue;
> if (wpc->iomap.type == IOMAP_HOLE)
> continue;
> - iomap_add_to_ioend(inode, pos, folio, iop, wpc, wbc,
> + iomap_add_to_ioend(inode, pos, folio, ifs, wpc, wbc,
> &submit_list);
> count++;
> }
> --
> 2.40.1
>