// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2017-2018 HUAWEI, Inc.
 *             http://www.huawei.com/
 * Created by Gao Xiang <gaoxiang25@huawei.com>
 */
#include "internal.h"
#include <linux/prefetch.h>

#include <trace/events/erofs.h>
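
/*
 * Read completion handler for raw (uncompressed) data bios: on success each
 * page is marked up-to-date, on failure it is flagged with a page error;
 * either way the page is unlocked so waiting readers can proceed, and the
 * bio itself is released.
 */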
static void erofs_readendio(struct bio *bio)
{
	struct bio_vec *bvec;
	blk_status_t err = bio->bi_status;
	struct bvec_iter_all iter_all;

	bio_for_each_segment_all(bvec, bio, iter_all) {
		struct page *page = bvec->bv_page;

		/* page is already locked */
		DBG_BUGON(PageUptodate(page));

		if (err)
			SetPageError(page);
		else
			SetPageUptodate(page);

		unlock_page(page);
		/* page could be reclaimed now */
	}
	bio_put(bio);
}
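
/*
 * Read one metadata block (indexed by absolute block address) through the
 * block device's page cache.  __GFP_FS is masked off to avoid recursing
 * into filesystem reclaim, and the page is returned locked and up-to-date
 * (or as an ERR_PTR on failure).
 */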
struct page *erofs_get_meta_page(struct super_block *sb, erofs_blk_t blkaddr)
{
	struct address_space *const mapping = sb->s_bdev->bd_inode->i_mapping;
	struct page *page;

	page = read_cache_page_gfp(mapping, blkaddr,
				   mapping_gfp_constraint(mapping, ~__GFP_FS));
	/* should already be PageUptodate */
	if (!IS_ERR(page))
		lock_page(page);
	return page;
}
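
/*
 * Translate a logical extent of an uncompressed inode (starting at
 * map->m_la) into its physical location.  Plain flat inodes map linearly
 * from vi->raw_blkaddr; for EROFS_INODE_FLAT_INLINE inodes the last block
 * is tail-packed right after the on-disk inode and xattrs, so it is
 * reported with EROFS_MAP_META and must not cross a block boundary.
 */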
static int erofs_map_blocks_flatmode(struct inode *inode,
				     struct erofs_map_blocks *map,
				     int flags)
{
	int err = 0;
	erofs_blk_t nblocks, lastblk;
	u64 offset = map->m_la;
	struct erofs_inode *vi = EROFS_I(inode);
	bool tailendpacking = (vi->datalayout == EROFS_INODE_FLAT_INLINE);

	trace_erofs_map_blocks_flatmode_enter(inode, map, flags);

	nblocks = DIV_ROUND_UP(inode->i_size, PAGE_SIZE);
	lastblk = nblocks - tailendpacking;

	if (offset >= inode->i_size) {
		/* leave out-of-bound access unmapped */
		map->m_flags = 0;
		map->m_plen = 0;
		goto out;
	}

	/* there is no hole in flatmode */
	map->m_flags = EROFS_MAP_MAPPED;

	if (offset < blknr_to_addr(lastblk)) {
		map->m_pa = blknr_to_addr(vi->raw_blkaddr) + map->m_la;
		map->m_plen = blknr_to_addr(lastblk) - offset;
	} else if (tailendpacking) {
		/* 2 - inode inline B: inode, [xattrs], inline last blk... */
		struct erofs_sb_info *sbi = EROFS_SB(inode->i_sb);

		map->m_pa = iloc(sbi, vi->nid) + vi->inode_isize +
			vi->xattr_isize + erofs_blkoff(map->m_la);
		map->m_plen = inode->i_size - offset;

		/* inline data should be located in one meta block */
		if (erofs_blkoff(map->m_pa) + map->m_plen > PAGE_SIZE) {
			erofs_err(inode->i_sb,
				  "inline data cross block boundary @ nid %llu",
				  vi->nid);
			DBG_BUGON(1);
			err = -EFSCORRUPTED;
			goto err_out;
		}

		map->m_flags |= EROFS_MAP_META;
	} else {
		erofs_err(inode->i_sb,
			  "internal error @ nid: %llu (size %llu), m_la 0x%llx",
			  vi->nid, inode->i_size, map->m_la);
		DBG_BUGON(1);
		err = -EIO;
		goto err_out;
	}

out:
	map->m_llen = map->m_plen;

err_out:
	trace_erofs_map_blocks_flatmode_exit(inode, map, flags, 0);
	return err;
}
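
/*
 * Generic block mapping entry point: compressed inodes are handed over to
 * the z_erofs mapping code, everything else falls back to the flat-mode
 * helper above.
 */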
int erofs_map_blocks(struct inode *inode,
		     struct erofs_map_blocks *map, int flags)
{
	if (erofs_inode_is_data_compressed(EROFS_I(inode)->datalayout)) {
		int err = z_erofs_map_blocks_iter(inode, map, flags);

		if (map->mpage) {
			put_page(map->mpage);
			map->mpage = NULL;
		}
		return err;
	}
	return erofs_map_blocks_flatmode(inode, map, flags);
}
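
/*
 * Read one page of raw data.  Physically contiguous pages are batched into
 * a single bio that is carried across calls via the 'bio' argument and the
 * '*last_block' cursor; the pending bio is submitted once a logical
 * discontiguity is hit or it runs out of room (its vector count is clamped
 * to the mapped extent).  Inline (tail-packed) pages are not read through a
 * bio at all but copied out of their metadata block.
 */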
static inline struct bio *erofs_read_raw_page(struct bio *bio,
					      struct address_space *mapping,
					      struct page *page,
					      erofs_off_t *last_block,
					      unsigned int nblocks,
					      bool ra)
{
	struct inode *const inode = mapping->host;
	struct super_block *const sb = inode->i_sb;
	erofs_off_t current_block = (erofs_off_t)page->index;
	int err;

	DBG_BUGON(!nblocks);

	if (PageUptodate(page)) {
		err = 0;
		goto has_updated;
	}

	/* note that for the readpage case, bio is also NULL */
	if (bio &&
	    /* not continuous */
	    *last_block + 1 != current_block) {
submit_bio_retry:
		submit_bio(bio);
		bio = NULL;
	}

	if (!bio) {
		struct erofs_map_blocks map = {
			.m_la = blknr_to_addr(current_block),
		};
		erofs_blk_t blknr;
		unsigned int blkoff;

		err = erofs_map_blocks(inode, &map, EROFS_GET_BLOCKS_RAW);
		if (err)
			goto err_out;

		/* zero out the holed page */
		if (!(map.m_flags & EROFS_MAP_MAPPED)) {
			zero_user_segment(page, 0, PAGE_SIZE);
			SetPageUptodate(page);

			/* imply err = 0, see erofs_map_blocks */
			goto has_updated;
		}

		/* for RAW access mode, m_plen must be equal to m_llen */
		DBG_BUGON(map.m_plen != map.m_llen);

		blknr = erofs_blknr(map.m_pa);
		blkoff = erofs_blkoff(map.m_pa);

		/* deal with inline page */
		if (map.m_flags & EROFS_MAP_META) {
			void *vsrc, *vto;
			struct page *ipage;

			DBG_BUGON(map.m_plen > PAGE_SIZE);

			ipage = erofs_get_meta_page(inode->i_sb, blknr);

			if (IS_ERR(ipage)) {
				err = PTR_ERR(ipage);
				goto err_out;
			}

			vsrc = kmap_atomic(ipage);
			vto = kmap_atomic(page);
			memcpy(vto, vsrc + blkoff, map.m_plen);
			memset(vto + map.m_plen, 0, PAGE_SIZE - map.m_plen);
			kunmap_atomic(vto);
			kunmap_atomic(vsrc);
			flush_dcache_page(page);

			SetPageUptodate(page);
			/* TODO: could we unlock the page earlier? */
			unlock_page(ipage);
			put_page(ipage);

			/* imply err = 0, see erofs_map_blocks */
			goto has_updated;
		}

		/* pa must be block-aligned for raw reading */
		DBG_BUGON(erofs_blkoff(map.m_pa));

		/* max # of continuous pages */
		if (nblocks > DIV_ROUND_UP(map.m_plen, PAGE_SIZE))
			nblocks = DIV_ROUND_UP(map.m_plen, PAGE_SIZE);
		if (nblocks > BIO_MAX_PAGES)
			nblocks = BIO_MAX_PAGES;

		bio = bio_alloc(GFP_NOIO, nblocks);

		bio->bi_end_io = erofs_readendio;
		bio_set_dev(bio, sb->s_bdev);
		bio->bi_iter.bi_sector = (sector_t)blknr <<
			LOG_SECTORS_PER_BLOCK;
		bio->bi_opf = REQ_OP_READ;
	}

	err = bio_add_page(bio, page, PAGE_SIZE, 0);
	/* out of the extent or bio is full */
	if (err < PAGE_SIZE)
		goto submit_bio_retry;

	*last_block = current_block;

	/* submit in advance in case it's followed by too many gaps */
	if (bio->bi_iter.bi_size >= bio->bi_max_vecs * PAGE_SIZE) {
		/* err should be reassigned to 0 after submitting */
		err = 0;
		goto submit_bio_out;
	}

	return bio;

err_out:
	/* for sync reading, set the page error immediately */
	if (!ra) {
		SetPageError(page);
		ClearPageUptodate(page);
	}
has_updated:
	unlock_page(page);

	/* if updated manually, continuous pages have a gap */
	if (bio)
submit_bio_out:
		submit_bio(bio);
	return err ? ERR_PTR(err) : NULL;
}
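
/*
 * ->readpage() entry for uncompressed inodes: a single page is read
 * synchronously through erofs_read_raw_page(), so no partially-built bio
 * can remain on return.
 */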
/*
 * Since we don't have write or truncate flows, no inode
 * locking needs to be held at the moment.
 */
static int erofs_raw_access_readpage(struct file *file, struct page *page)
{
	erofs_off_t last_block;
	struct bio *bio;

	trace_erofs_readpage(page, true);

	bio = erofs_read_raw_page(NULL, page->mapping,
				  page, &last_block, 1, false);

	if (IS_ERR(bio))
		return PTR_ERR(bio);

	DBG_BUGON(bio);	/* since we have only one bio -- must be NULL */
	return 0;
}
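
/*
 * ->readpages() entry: pages arrive on a list in reverse order, so they are
 * popped from the tail to be read in ascending index order.  Pages that
 * cannot be added to the page cache are simply skipped, and a readahead
 * error only resets the current bio instead of failing the whole call.
 */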
static int erofs_raw_access_readpages(struct file *filp,
				      struct address_space *mapping,
				      struct list_head *pages,
				      unsigned int nr_pages)
{
	erofs_off_t last_block;
	struct bio *bio = NULL;
	gfp_t gfp = readahead_gfp_mask(mapping);
	struct page *page = list_last_entry(pages, struct page, lru);

	trace_erofs_readpages(mapping->host, page, nr_pages, true);

	for (; nr_pages; --nr_pages) {
		page = list_entry(pages->prev, struct page, lru);

		prefetchw(&page->flags);
		list_del(&page->lru);

		if (!add_to_page_cache_lru(page, mapping, page->index, gfp)) {
			bio = erofs_read_raw_page(bio, mapping, page,
						  &last_block, nr_pages, true);

			/* all page errors are ignored during readahead */
			if (IS_ERR(bio)) {
				pr_err("%s, readahead error at page %lu of nid %llu\n",
				       __func__, page->index,
				       EROFS_I(mapping->host)->nid);

				bio = NULL;
			}
		}

		/* pages could still be locked */
		put_page(page);
	}
	DBG_BUGON(!list_empty(pages));

	/* the rare case (end in gaps) */
	if (bio)
		submit_bio(bio);
	return 0;
}
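
/*
 * Minimal get_block_t helper used only by the bmap path below: it resolves
 * the 512-byte sector 'iblock' through erofs_map_blocks() and reports the
 * physical block number; 'create' is ignored since the filesystem is
 * read-only.
 */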
static int erofs_get_block(struct inode *inode, sector_t iblock,
			   struct buffer_head *bh, int create)
{
	struct erofs_map_blocks map = {
		.m_la = iblock << 9,
	};
	int err;

	err = erofs_map_blocks(inode, &map, EROFS_GET_BLOCKS_RAW);
	if (err)
		return err;

	if (map.m_flags & EROFS_MAP_MAPPED)
		bh->b_blocknr = erofs_blknr(map.m_pa);

	return err;
}
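
/*
 * ->bmap() entry (e.g. for the FIBMAP ioctl).  The tail-packed block of an
 * EROFS_INODE_FLAT_INLINE inode lives inside metadata rather than in the
 * raw data area, so it is reported as unmapped (0) here.
 */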
static sector_t erofs_bmap(struct address_space *mapping, sector_t block)
{
	struct inode *inode = mapping->host;

	if (EROFS_I(inode)->datalayout == EROFS_INODE_FLAT_INLINE) {
		erofs_blk_t blks = i_size_read(inode) >> LOG_BLOCK_SIZE;

		if (block >> LOG_SECTORS_PER_BLOCK >= blks)
			return 0;
	}

	return generic_block_bmap(mapping, block, erofs_get_block);
}

/* for uncompressed (aligned) files and raw access for other files */
const struct address_space_operations erofs_raw_access_aops = {
	.readpage = erofs_raw_access_readpage,
	.readpages = erofs_raw_access_readpages,
	.bmap = erofs_bmap,
};