Received: by 2002:a05:6a10:1287:0:0:0:0 with SMTP id d7csp3748623pxv; Mon, 19 Jul 2021 07:53:06 -0700 (PDT) X-Google-Smtp-Source: ABdhPJw603izbNYjyBrdzkUhFhIH2v1aXGhylQ4Qy4WHr7XPBvnGZ5EqIPvgLSvAYFq5J+LDKckD X-Received: by 2002:a05:6638:14c1:: with SMTP id l1mr16794943jak.97.1626706386785; Mon, 19 Jul 2021 07:53:06 -0700 (PDT) ARC-Seal: i=1; a=rsa-sha256; t=1626706386; cv=none; d=google.com; s=arc-20160816; b=kEz6aEptmWT9ZV55roieXKmgfLyLjIpsofZIyndPaYwD0RMbCMr28jEG63JdaFJsmW z/7jxvhRUhl4vzbhmq4EARnKSsrxdkz3zPebVLmQ8/WF67gOlp6xF3DkgIVETTwO9q2Z 1hCvGFF3ZqUhhqPpV53tPBFyChYbJCJfJE0sRmPW5KMAIDOaN3SZDpx21gnSaYNj3M7h AN9jnH1zZv6iOZSMXGKevrDqwRbQBjHy4LL2ZWTmln4FPPmWgKdv92TSokAsu4Csb4Hg dDetdF7jj32Hma1TCF7ZvtBwUDEEuebiA3Ss8cwSkZJzCs6rcapJHsQ4GcMYF8SwGatm KX7A== ARC-Message-Signature: i=1; a=rsa-sha256; c=relaxed/relaxed; d=google.com; s=arc-20160816; h=list-id:precedence:content-transfer-encoding:mime-version :message-id:date:subject:cc:to:from; bh=3YDIAwKrXlE6JtYcNvzCdrRtTSoo4qxz4Y3qZtLWGwg=; b=Ex6SdxYIT2+MhTDy6A45KDRBdCkYndwk72BwL7KA2mIDcdt9FJFFM4NnWEjy4mW44m jwZZMz5RuXlNnyG5eH3tJCIoJVfdW6TUwBMjSA+YVY+o9cOVX4UTaNrjVzV7zuwrRXJX ocQcacNVqKL7vEC59sKwRMzV24CQRW4STHkAW6snx5FuO5vS1Gn6SBgvstyLGS4Qf7tt VHy2lb9ogOK5pQhZzo9KML06NZTXkimeHxHXs4Z3whZ2rKT256VF4jyrOCFV6YYUKsYz RT2dI1jOS87dhP/drfqG8QgDGc3FNFWE2fJ6JbzhOr5vhTYAxVlyGjwSzVUG/nRf4T2C M7/A== ARC-Authentication-Results: i=1; mx.google.com; spf=pass (google.com: domain of linux-kernel-owner@vger.kernel.org designates 23.128.96.18 as permitted sender) smtp.mailfrom=linux-kernel-owner@vger.kernel.org; dmarc=fail (p=NONE sp=NONE dis=NONE) header.from=alibaba.com Return-Path: Received: from vger.kernel.org (vger.kernel.org. 
[23.128.96.18]) by mx.google.com with ESMTP id f2si20447562jat.114.2021.07.19.07.52.55; Mon, 19 Jul 2021 07:53:06 -0700 (PDT) Received-SPF: pass (google.com: domain of linux-kernel-owner@vger.kernel.org designates 23.128.96.18 as permitted sender) client-ip=23.128.96.18; Authentication-Results: mx.google.com; spf=pass (google.com: domain of linux-kernel-owner@vger.kernel.org designates 23.128.96.18 as permitted sender) smtp.mailfrom=linux-kernel-owner@vger.kernel.org; dmarc=fail (p=NONE sp=NONE dis=NONE) header.from=alibaba.com Received: (majordomo@vger.kernel.org) by vger.kernel.org via listexpand id S241141AbhGSOLg (ORCPT + 99 others); Mon, 19 Jul 2021 10:11:36 -0400 Received: from out30-43.freemail.mail.aliyun.com ([115.124.30.43]:49938 "EHLO out30-43.freemail.mail.aliyun.com" rhost-flags-OK-OK-OK-OK) by vger.kernel.org with ESMTP id S240298AbhGSOJO (ORCPT ); Mon, 19 Jul 2021 10:09:14 -0400 X-Alimail-AntiSpam: AC=PASS;BC=-1|-1;BR=01201311R211e4;CH=green;DM=||false|;DS=||;FP=0|-1|-1|-1|0|-1|-1|-1;HT=e01e04420;MF=hsiangkao@linux.alibaba.com;NM=1;PH=DS;RN=8;SR=0;TI=SMTPD_---0UgIJ0CV_1626706070; Received: from e18g09479.et15sqa.tbsite.net(mailfrom:hsiangkao@linux.alibaba.com fp:SMTPD_---0UgIJ0CV_1626706070) by smtp.aliyun-inc.com(127.0.0.1); Mon, 19 Jul 2021 22:48:00 +0800 From: Gao Xiang To: linux-erofs@lists.ozlabs.org, linux-fsdevel@vger.kernel.org Cc: LKML , Gao Xiang , Christoph Hellwig , "Darrick J . Wong" , Matthew Wilcox , Andreas Gruenbacher Subject: [PATCH v3] iomap: support tail packing inline read Date: Mon, 19 Jul 2021 22:47:47 +0800 Message-Id: <20210719144747.189634-1-hsiangkao@linux.alibaba.com> X-Mailer: git-send-email 2.24.4 MIME-Version: 1.0 Content-Transfer-Encoding: 8bit Precedence: bulk List-ID: X-Mailing-List: linux-kernel@vger.kernel.org This adds tail-packing inline read support to iomap, which can handle several inline tail blocks. Similar to the previous approach, it zeroes the post-EOF part of the page in one iteration. 
The write path remains untouched since EROFS cannot be used for testing it. It would be better to implement it once upcoming real users need it, rather than leaving untested dead code around. Cc: Christoph Hellwig Cc: Darrick J. Wong Cc: Matthew Wilcox Cc: Andreas Gruenbacher Signed-off-by: Gao Xiang --- v2: https://lore.kernel.org/r/YPLdSja%2F4FBsjss%2F@B-P7TQMD6M-0146.local/ changes since v2: - apply the suggestions from Christoph: https://lore.kernel.org/r/YPVe41YqpfGLNsBS@infradead.org/ Hi Andreas, would you mind testing this on the gfs2 side? Thanks in advance! Thanks, Gao Xiang fs/iomap/buffered-io.c | 50 ++++++++++++++++++++++++++---------------- fs/iomap/direct-io.c | 11 ++++++---- 2 files changed, 38 insertions(+), 23 deletions(-) diff --git a/fs/iomap/buffered-io.c b/fs/iomap/buffered-io.c index 87ccb3438bec..cac8a88660d8 100644 --- a/fs/iomap/buffered-io.c +++ b/fs/iomap/buffered-io.c @@ -207,23 +207,22 @@ struct iomap_readpage_ctx { static void iomap_read_inline_data(struct inode *inode, struct page *page, - struct iomap *iomap) + struct iomap *iomap, loff_t pos) { - size_t size = i_size_read(inode); + unsigned int size, poff = offset_in_page(pos); void *addr; - if (PageUptodate(page)) - return; - - BUG_ON(page_has_private(page)); - BUG_ON(page->index); - BUG_ON(size > PAGE_SIZE - offset_in_page(iomap->inline_data)); + /* inline source data must be inside a single page */ + BUG_ON(iomap->length > PAGE_SIZE - offset_in_page(iomap->inline_data)); + /* handle tail-packing blocks cross the current page into the next */ + size = min_t(unsigned int, iomap->length + pos - iomap->offset, + PAGE_SIZE - poff); addr = kmap_atomic(page); - memcpy(addr, iomap->inline_data, size); - memset(addr + size, 0, PAGE_SIZE - size); + memcpy(addr + poff, iomap->inline_data - iomap->offset + pos, size); + memset(addr + poff + size, 0, PAGE_SIZE - poff - size); kunmap_atomic(addr); - SetPageUptodate(page); + iomap_set_range_uptodate(page, poff, PAGE_SIZE - poff); } static inline bool 
iomap_block_needs_zeroing(struct inode *inode, @@ -246,18 +245,19 @@ iomap_readpage_actor(struct inode *inode, loff_t pos, loff_t length, void *data, unsigned poff, plen; sector_t sector; - if (iomap->type == IOMAP_INLINE) { - WARN_ON_ONCE(pos); - iomap_read_inline_data(inode, page, iomap); - return PAGE_SIZE; - } - - /* zero post-eof blocks as the page may be mapped */ iop = iomap_page_create(inode, page); + /* needs to skip some leading uptodated blocks */ iomap_adjust_read_range(inode, iop, &pos, length, &poff, &plen); if (plen == 0) goto done; + if (iomap->type == IOMAP_INLINE) { + iomap_read_inline_data(inode, page, iomap, pos); + plen = PAGE_SIZE - poff; + goto done; + } + + /* zero post-eof blocks as the page may be mapped */ if (iomap_block_needs_zeroing(inode, iomap, pos)) { zero_user(page, poff, plen); iomap_set_range_uptodate(page, poff, plen); @@ -589,6 +589,18 @@ __iomap_write_begin(struct inode *inode, loff_t pos, unsigned len, int flags, return 0; } +static int iomap_write_begin_inline(struct inode *inode, loff_t pos, + struct page *page, struct iomap *srcmap) +{ + /* needs more work for the tailpacking case, disable for now */ + if (WARN_ON_ONCE(pos != 0)) + return -EIO; + if (PageUptodate(page)) + return 0; + iomap_read_inline_data(inode, page, srcmap, pos); + return 0; +} + static int iomap_write_begin(struct inode *inode, loff_t pos, unsigned len, unsigned flags, struct page **pagep, struct iomap *iomap, struct iomap *srcmap) @@ -618,7 +630,7 @@ iomap_write_begin(struct inode *inode, loff_t pos, unsigned len, unsigned flags, } if (srcmap->type == IOMAP_INLINE) - iomap_read_inline_data(inode, page, srcmap); + status = iomap_write_begin_inline(inode, pos, page, srcmap); else if (iomap->flags & IOMAP_F_BUFFER_HEAD) status = __block_write_begin_int(page, pos, len, NULL, srcmap); else diff --git a/fs/iomap/direct-io.c b/fs/iomap/direct-io.c index 9398b8c31323..ee6309967b77 100644 --- a/fs/iomap/direct-io.c +++ b/fs/iomap/direct-io.c @@ -379,22 +379,25 
@@ iomap_dio_inline_actor(struct inode *inode, loff_t pos, loff_t length, { struct iov_iter *iter = dio->submit.iter; size_t copied; + void *dst = iomap->inline_data + pos - iomap->offset; - BUG_ON(pos + length > PAGE_SIZE - offset_in_page(iomap->inline_data)); + /* inline data must be inside a single page */ + BUG_ON(length > PAGE_SIZE - offset_in_page(iomap->inline_data)); if (dio->flags & IOMAP_DIO_WRITE) { loff_t size = inode->i_size; if (pos > size) - memset(iomap->inline_data + size, 0, pos - size); - copied = copy_from_iter(iomap->inline_data + pos, length, iter); + memset(iomap->inline_data + size - iomap->offset, + 0, pos - size); + copied = copy_from_iter(dst, length, iter); if (copied) { if (pos + copied > size) i_size_write(inode, pos + copied); mark_inode_dirty(inode); } } else { - copied = copy_to_iter(iomap->inline_data + pos, length, iter); + copied = copy_to_iter(dst, length, iter); } dio->size += copied; return copied; -- 2.24.4