// SPDX-License-Identifier: GPL-2.0
/*
 * linux/drivers/staging/erofs/data.c
 *
 * Copyright (C) 2017-2018 HUAWEI, Inc.
 *             http://www.huawei.com/
 * Created by Gao Xiang <gaoxiang25@huawei.com>
 *
 * This file is subject to the terms and conditions of the GNU General Public
 * License.  See the file COPYING in the main directory of the Linux
 * distribution for more details.
 */
#include "internal.h"
#include <linux/prefetch.h>

#include <trace/events/erofs.h>

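/*
 * bio completion callback for raw (uncompressed) reads: mark each page
 * uptodate on success or flag an error, unlock it for any waiters, and
 * finally drop the bio reference.
 */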
static inline void read_endio(struct bio *bio)
{
	int i;
	struct bio_vec *bvec;
	const blk_status_t err = bio->bi_status;
	struct bvec_iter_all iter_all;

	bio_for_each_segment_all(bvec, bio, i, iter_all) {
		struct page *page = bvec->bv_page;

		/* page is already locked */
		DBG_BUGON(PageUptodate(page));

		if (unlikely(err))
			SetPageError(page);
		else
			SetPageUptodate(page);

		unlock_page(page);
		/* page could be reclaimed now */
	}
	bio_put(bio);
}

/*
 * Get the metadata page at @blkaddr via the block device page cache and
 * read it in if needed (prio -- true marks the I/O with REQ_PRIO and is
 * used for directories).
 */
struct page *__erofs_get_meta_page(struct super_block *sb,
				   erofs_blk_t blkaddr, bool prio, bool nofail)
{
	struct inode *const bd_inode = sb->s_bdev->bd_inode;
	struct address_space *const mapping = bd_inode->i_mapping;
	/* prefer retrying in the allocator to blindly looping below */
	const gfp_t gfp = mapping_gfp_constraint(mapping, ~__GFP_FS) |
		(nofail ? __GFP_NOFAIL : 0);
	unsigned int io_retries = nofail ? EROFS_IO_MAX_RETRIES_NOFAIL : 0;
	struct page *page;
	int err;

repeat:
	page = find_or_create_page(mapping, blkaddr, gfp);
	if (unlikely(!page)) {
		DBG_BUGON(nofail);
		return ERR_PTR(-ENOMEM);
	}
	DBG_BUGON(!PageLocked(page));

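	/*
	 * the cached page is not uptodate yet: submit a one-page read and
	 * wait for it via lock_page() below, which only returns once
	 * read_endio() has unlocked the page.
	 */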
	if (!PageUptodate(page)) {
		struct bio *bio;

		bio = erofs_grab_bio(sb, blkaddr, 1, read_endio, nofail);
		if (IS_ERR(bio)) {
			DBG_BUGON(nofail);
			err = PTR_ERR(bio);
			goto err_out;
		}

		err = bio_add_page(bio, page, PAGE_SIZE, 0);
		if (unlikely(err != PAGE_SIZE)) {
			err = -EFAULT;
			goto err_out;
		}

		__submit_bio(bio, REQ_OP_READ,
			     REQ_META | (prio ? REQ_PRIO : 0));

		lock_page(page);

		/* this page has been truncated by others */
		if (unlikely(page->mapping != mapping)) {
unlock_repeat:
			unlock_page(page);
			put_page(page);
			goto repeat;
		}

		/* more likely a read error */
		if (unlikely(!PageUptodate(page))) {
			if (io_retries) {
				--io_retries;
				goto unlock_repeat;
			}
			err = -EIO;
			goto err_out;
		}
	}
	return page;

err_out:
	unlock_page(page);
	put_page(page);
	return ERR_PTR(err);
}

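/*
 * Map a logical extent of a flat (uncompressed) inode: the block-aligned
 * part is stored contiguously starting at raw_blkaddr, while an inline
 * tail, if present, lives in the inode's metadata block right after the
 * inode and its xattrs.
 */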
static int erofs_map_blocks_flatmode(struct inode *inode,
				     struct erofs_map_blocks *map,
				     int flags)
{
	int err = 0;
	erofs_blk_t nblocks, lastblk;
	u64 offset = map->m_la;
	struct erofs_vnode *vi = EROFS_V(inode);

	trace_erofs_map_blocks_flatmode_enter(inode, map, flags);

	nblocks = DIV_ROUND_UP(inode->i_size, PAGE_SIZE);
	lastblk = nblocks - is_inode_layout_inline(inode);

	if (unlikely(offset >= inode->i_size)) {
		/* leave out-of-bound access unmapped */
		map->m_flags = 0;
		map->m_plen = 0;
		goto out;
	}

	/* there is no hole in flatmode */
	map->m_flags = EROFS_MAP_MAPPED;

	if (offset < blknr_to_addr(lastblk)) {
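		/* blocks before the tail map contiguously from raw_blkaddr */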
		map->m_pa = blknr_to_addr(vi->raw_blkaddr) + map->m_la;
		map->m_plen = blknr_to_addr(lastblk) - offset;
	} else if (is_inode_layout_inline(inode)) {
		/* 2 - inode inline B: inode, [xattrs], inline last blk... */
		struct erofs_sb_info *sbi = EROFS_SB(inode->i_sb);

		map->m_pa = iloc(sbi, vi->nid) + vi->inode_isize +
			vi->xattr_isize + erofs_blkoff(map->m_la);
		map->m_plen = inode->i_size - offset;

		/* inline data should be located in one meta block */
		if (erofs_blkoff(map->m_pa) + map->m_plen > PAGE_SIZE) {
			DBG_BUGON(1);
			err = -EIO;
			goto err_out;
		}

		map->m_flags |= EROFS_MAP_META;
	} else {
		errln("internal error @ nid: %llu (size %llu), m_la 0x%llx",
		      vi->nid, inode->i_size, map->m_la);
		DBG_BUGON(1);
		err = -EIO;
		goto err_out;
	}

out:
	map->m_llen = map->m_plen;

err_out:
	trace_erofs_map_blocks_flatmode_exit(inode, map, flags, 0);
	return err;
}

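/*
 * Dispatch block mapping: compressed inodes go through the z_erofs
 * iterator (any meta page it pinned is dropped here), all other inodes
 * use the flat-mode mapping above.
 */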
int erofs_map_blocks(struct inode *inode,
		     struct erofs_map_blocks *map, int flags)
{
	if (unlikely(is_inode_layout_compression(inode))) {
		int err = z_erofs_map_blocks_iter(inode, map, flags);

		if (map->mpage) {
			put_page(map->mpage);
			map->mpage = NULL;
		}
		return err;
	}
	return erofs_map_blocks_flatmode(inode, map, flags);
}

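/*
 * Read one page of raw data, reusing @bio as long as the physical blocks
 * stay contiguous; holes are zeroed, inline tails are copied out of the
 * meta block, and the (possibly newly allocated) bio is returned so the
 * caller can keep chaining pages onto it.
 */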
static inline struct bio *erofs_read_raw_page(struct bio *bio,
					      struct address_space *mapping,
					      struct page *page,
					      erofs_off_t *last_block,
					      unsigned int nblocks,
					      bool ra)
{
	struct inode *inode = mapping->host;
	erofs_off_t current_block = (erofs_off_t)page->index;
	int err;

	DBG_BUGON(!nblocks);

	if (PageUptodate(page)) {
		err = 0;
		goto has_updated;
	}

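	/* a cleancache hit fills the page without issuing any block I/O */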
	if (cleancache_get_page(page) == 0) {
		err = 0;
		SetPageUptodate(page);
		goto has_updated;
	}

	/* note that in the readpage case, bio is NULL as well */
	if (bio &&
	    /* not continuous */
	    *last_block + 1 != current_block) {
submit_bio_retry:
		__submit_bio(bio, REQ_OP_READ, 0);
		bio = NULL;
	}

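	/* no bio to extend: map the current block and start a fresh one */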
	if (!bio) {
		struct erofs_map_blocks map = {
			.m_la = blknr_to_addr(current_block),
		};
		erofs_blk_t blknr;
		unsigned int blkoff;

		err = erofs_map_blocks(inode, &map, EROFS_GET_BLOCKS_RAW);
		if (unlikely(err))
			goto err_out;

		/* zero out the holed page */
		if (unlikely(!(map.m_flags & EROFS_MAP_MAPPED))) {
			zero_user_segment(page, 0, PAGE_SIZE);
			SetPageUptodate(page);

			/* imply err = 0, see erofs_map_blocks */
			goto has_updated;
		}

		/* for RAW access mode, m_plen must be equal to m_llen */
		DBG_BUGON(map.m_plen != map.m_llen);

		blknr = erofs_blknr(map.m_pa);
		blkoff = erofs_blkoff(map.m_pa);

		/* deal with inline page */
		if (map.m_flags & EROFS_MAP_META) {
			void *vsrc, *vto;
			struct page *ipage;

			DBG_BUGON(map.m_plen > PAGE_SIZE);

			ipage = erofs_get_meta_page(inode->i_sb, blknr, 0);

			if (IS_ERR(ipage)) {
				err = PTR_ERR(ipage);
				goto err_out;
			}

			vsrc = kmap_atomic(ipage);
			vto = kmap_atomic(page);
			memcpy(vto, vsrc + blkoff, map.m_plen);
			memset(vto + map.m_plen, 0, PAGE_SIZE - map.m_plen);
			kunmap_atomic(vto);
			kunmap_atomic(vsrc);
			flush_dcache_page(page);

			SetPageUptodate(page);
			/* TODO: could we unlock the page earlier? */
			unlock_page(ipage);
			put_page(ipage);

			/* imply err = 0, see erofs_map_blocks */
			goto has_updated;
		}

		/* pa must be block-aligned for raw reading */
		DBG_BUGON(erofs_blkoff(map.m_pa));

		/* max # of continuous pages */
		if (nblocks > DIV_ROUND_UP(map.m_plen, PAGE_SIZE))
			nblocks = DIV_ROUND_UP(map.m_plen, PAGE_SIZE);
		if (nblocks > BIO_MAX_PAGES)
			nblocks = BIO_MAX_PAGES;

		bio = erofs_grab_bio(inode->i_sb,
				     blknr, nblocks, read_endio, false);

		if (IS_ERR(bio)) {
			err = PTR_ERR(bio);
			bio = NULL;
			goto err_out;
		}
	}

	err = bio_add_page(bio, page, PAGE_SIZE, 0);
	/* out of the extent or bio is full */
	if (err < PAGE_SIZE)
		goto submit_bio_retry;

	*last_block = current_block;

	/* submit the bio in advance in case it is followed by too many gaps */
	if (bio->bi_iter.bi_size >= bio->bi_max_vecs * PAGE_SIZE) {
		/* err still holds bio_add_page()'s return value, reset it */
		err = 0;
		goto submit_bio_out;
	}

	return bio;

err_out:
	/* for sync reading, set page error immediately */
	if (!ra) {
		SetPageError(page);
		ClearPageUptodate(page);
	}
has_updated:
	unlock_page(page);

	/* if updated manually, continuous pages have a gap */
	if (bio)
submit_bio_out:
		__submit_bio(bio, REQ_OP_READ, 0);

	return unlikely(err) ? ERR_PTR(err) : NULL;
}

/*
 * since we don't have write or truncate flows, no inode
 * locking needs to be held at the moment.
 */
static int erofs_raw_access_readpage(struct file *file, struct page *page)
{
	erofs_off_t last_block;
	struct bio *bio;

	trace_erofs_readpage(page, true);

	bio = erofs_read_raw_page(NULL, page->mapping,
				  page, &last_block, 1, false);

	if (IS_ERR(bio))
		return PTR_ERR(bio);

	DBG_BUGON(bio);	/* since we have only one bio -- must be NULL */
	return 0;
}

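/*
 * Readahead entry point: add each page to the page cache and chain as many
 * physically contiguous reads as possible into a single bio before
 * submitting it.
 */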
static int erofs_raw_access_readpages(struct file *filp,
				      struct address_space *mapping,
				      struct list_head *pages,
				      unsigned int nr_pages)
{
	erofs_off_t last_block;
	struct bio *bio = NULL;
	gfp_t gfp = readahead_gfp_mask(mapping);
	struct page *page = list_last_entry(pages, struct page, lru);

	trace_erofs_readpages(mapping->host, page, nr_pages, true);

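	/* consume pages from the tail of the list, one per iteration */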
	for (; nr_pages; --nr_pages) {
		page = list_entry(pages->prev, struct page, lru);

		prefetchw(&page->flags);
		list_del(&page->lru);

		if (!add_to_page_cache_lru(page, mapping, page->index, gfp)) {
			bio = erofs_read_raw_page(bio, mapping, page,
						  &last_block, nr_pages, true);

			/* all page errors are ignored during readahead */
			if (IS_ERR(bio)) {
				pr_err("%s, readahead error at page %lu of nid %llu\n",
				       __func__, page->index,
				       EROFS_V(mapping->host)->nid);

				bio = NULL;
			}
		}

		/* pages could still be locked */
		put_page(page);
	}
	DBG_BUGON(!list_empty(pages));

	/* the rare case (end in gaps) */
	if (unlikely(bio))
		__submit_bio(bio, REQ_OP_READ, 0);
	return 0;
}

/* for uncompressed (aligned) files and raw access for other files */
const struct address_space_operations erofs_raw_access_aops = {
	.readpage = erofs_raw_access_readpage,
	.readpages = erofs_raw_access_readpages,
};