blob: 0ad6d812c78b6a5aef336ecf8eab688007ccd138 [file] [log] [blame]
David Teiglandb3b94fa2006-01-16 16:50:04 +00001/*
2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
Steven Whitehouse3a8a9a12006-05-18 15:09:15 -04003 * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
David Teiglandb3b94fa2006-01-16 16:50:04 +00004 *
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
Steven Whitehousee9fc2aa2006-09-01 11:05:15 -04007 * of the GNU General Public License version 2.
David Teiglandb3b94fa2006-01-16 16:50:04 +00008 */
9
David Teiglandb3b94fa2006-01-16 16:50:04 +000010#include <linux/spinlock.h>
11#include <linux/completion.h>
12#include <linux/buffer_head.h>
Benjamin Marzinski64dd1532011-09-12 18:15:24 -050013#include <linux/blkdev.h>
Steven Whitehouse5c676f62006-02-27 17:23:27 -050014#include <linux/gfs2_ondisk.h>
Steven Whitehouse71b86f52006-03-28 14:14:04 -050015#include <linux/crc32.h>
Bob Peterson39743202017-02-16 10:27:16 -050016#include <linux/iomap.h>
David Teiglandb3b94fa2006-01-16 16:50:04 +000017
18#include "gfs2.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050019#include "incore.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000020#include "bmap.h"
21#include "glock.h"
22#include "inode.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000023#include "meta_io.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000024#include "quota.h"
25#include "rgrp.h"
Steven Whitehouse45138992013-01-28 09:30:07 +000026#include "log.h"
Bob Peterson4c16c362011-02-23 16:11:33 -050027#include "super.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000028#include "trans.h"
Steven Whitehouse18ec7d52006-02-08 11:50:51 +000029#include "dir.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050030#include "util.h"
Steven Whitehouse63997772009-06-12 08:49:20 +010031#include "trace_gfs2.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000032
33/* This doesn't need to be that large as max 64 bit pointers in a 4k
34 * block is 512, so __u16 is fine for that. It saves stack space to
35 * keep it small.
36 */
37struct metapath {
Steven Whitehousedbac6712008-01-29 09:12:55 +000038 struct buffer_head *mp_bh[GFS2_MAX_META_HEIGHT];
David Teiglandb3b94fa2006-01-16 16:50:04 +000039 __u16 mp_list[GFS2_MAX_META_HEIGHT];
Bob Peterson5f8bd442016-10-28 14:29:29 -050040 int mp_fheight; /* find_metapath height */
41 int mp_aheight; /* actual height (lookup height) */
David Teiglandb3b94fa2006-01-16 16:50:04 +000042};
43
David Teiglandb3b94fa2006-01-16 16:50:04 +000044/**
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040045 * gfs2_unstuffer_page - unstuff a stuffed inode into a block cached by a page
46 * @ip: the inode
47 * @dibh: the dinode buffer
48 * @block: the block number that was allocated
Steven Whitehouseff8f33c2010-08-11 09:37:53 +010049 * @page: The (optional) page. This is looked up if @page is NULL
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040050 *
51 * Returns: errno
52 */
53
54static int gfs2_unstuffer_page(struct gfs2_inode *ip, struct buffer_head *dibh,
Steven Whitehousecd915492006-09-04 12:49:07 -040055 u64 block, struct page *page)
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040056{
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040057 struct inode *inode = &ip->i_inode;
58 struct buffer_head *bh;
59 int release = 0;
60
61 if (!page || page->index) {
Bob Peterson220cca22012-03-19 15:25:50 -040062 page = find_or_create_page(inode->i_mapping, 0, GFP_NOFS);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040063 if (!page)
64 return -ENOMEM;
65 release = 1;
66 }
67
68 if (!PageUptodate(page)) {
69 void *kaddr = kmap(page);
Steven Whitehouse602c89d2010-03-25 14:32:43 +000070 u64 dsize = i_size_read(inode);
71
72 if (dsize > (dibh->b_size - sizeof(struct gfs2_dinode)))
73 dsize = dibh->b_size - sizeof(struct gfs2_dinode);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040074
Steven Whitehouse602c89d2010-03-25 14:32:43 +000075 memcpy(kaddr, dibh->b_data + sizeof(struct gfs2_dinode), dsize);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +030076 memset(kaddr + dsize, 0, PAGE_SIZE - dsize);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040077 kunmap(page);
78
79 SetPageUptodate(page);
80 }
81
82 if (!page_has_buffers(page))
Fabian Frederick47a9a522016-08-02 12:05:27 -050083 create_empty_buffers(page, BIT(inode->i_blkbits),
84 BIT(BH_Uptodate));
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040085
86 bh = page_buffers(page);
87
88 if (!buffer_mapped(bh))
89 map_bh(bh, inode->i_sb, block);
90
91 set_buffer_uptodate(bh);
Steven Whitehouseeaf96522007-08-27 09:49:37 +010092 if (!gfs2_is_jdata(ip))
93 mark_buffer_dirty(bh);
Steven Whitehousebf36a712007-10-17 08:35:19 +010094 if (!gfs2_is_writeback(ip))
Steven Whitehouse350a9b02012-12-14 12:36:02 +000095 gfs2_trans_add_data(ip->i_gl, bh);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040096
97 if (release) {
98 unlock_page(page);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +030099 put_page(page);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -0400100 }
101
102 return 0;
103}
104
105/**
David Teiglandb3b94fa2006-01-16 16:50:04 +0000106 * gfs2_unstuff_dinode - Unstuff a dinode when the data has grown too big
107 * @ip: The GFS2 inode to unstuff
Steven Whitehouseff8f33c2010-08-11 09:37:53 +0100108 * @page: The (optional) page. This is looked up if the @page is NULL
David Teiglandb3b94fa2006-01-16 16:50:04 +0000109 *
110 * This routine unstuffs a dinode and returns it to a "normal" state such
111 * that the height can be grown in the traditional way.
112 *
113 * Returns: errno
114 */
115
Steven Whitehousef25ef0c2006-07-26 10:51:20 -0400116int gfs2_unstuff_dinode(struct gfs2_inode *ip, struct page *page)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000117{
118 struct buffer_head *bh, *dibh;
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400119 struct gfs2_dinode *di;
Steven Whitehousecd915492006-09-04 12:49:07 -0400120 u64 block = 0;
Steven Whitehouse18ec7d52006-02-08 11:50:51 +0000121 int isdir = gfs2_is_dir(ip);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000122 int error;
123
124 down_write(&ip->i_rw_mutex);
125
126 error = gfs2_meta_inode_buffer(ip, &dibh);
127 if (error)
128 goto out;
Steven Whitehouse907b9bc2006-09-25 09:26:04 -0400129
Steven Whitehousea2e0f792010-08-11 09:53:11 +0100130 if (i_size_read(&ip->i_inode)) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000131 /* Get a free block, fill it with the stuffed data,
132 and write it out to disk */
133
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000134 unsigned int n = 1;
Bob Peterson6e87ed02011-11-18 10:58:32 -0500135 error = gfs2_alloc_blocks(ip, &block, &n, 0, NULL);
Steven Whitehouse09010972009-05-20 10:48:47 +0100136 if (error)
137 goto out_brelse;
Steven Whitehouse18ec7d52006-02-08 11:50:51 +0000138 if (isdir) {
Steven Whitehouse5731be52008-02-01 13:16:55 +0000139 gfs2_trans_add_unrevoke(GFS2_SB(&ip->i_inode), block, 1);
Steven Whitehouse61e085a2006-04-24 10:07:13 -0400140 error = gfs2_dir_get_new_buffer(ip, block, &bh);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000141 if (error)
142 goto out_brelse;
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400143 gfs2_buffer_copy_tail(bh, sizeof(struct gfs2_meta_header),
David Teiglandb3b94fa2006-01-16 16:50:04 +0000144 dibh, sizeof(struct gfs2_dinode));
145 brelse(bh);
146 } else {
Steven Whitehousef25ef0c2006-07-26 10:51:20 -0400147 error = gfs2_unstuffer_page(ip, dibh, block, page);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000148 if (error)
149 goto out_brelse;
150 }
151 }
152
153 /* Set up the pointer to the new block */
154
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000155 gfs2_trans_add_meta(ip->i_gl, dibh);
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400156 di = (struct gfs2_dinode *)dibh->b_data;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000157 gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode));
158
Steven Whitehousea2e0f792010-08-11 09:53:11 +0100159 if (i_size_read(&ip->i_inode)) {
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400160 *(__be64 *)(di + 1) = cpu_to_be64(block);
Steven Whitehouse77658aa2008-02-12 14:17:27 +0000161 gfs2_add_inode_blocks(&ip->i_inode, 1);
162 di->di_blocks = cpu_to_be64(gfs2_get_inode_blocks(&ip->i_inode));
David Teiglandb3b94fa2006-01-16 16:50:04 +0000163 }
164
Steven Whitehouseecc30c72008-01-28 10:37:35 +0000165 ip->i_height = 1;
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400166 di->di_height = cpu_to_be16(1);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000167
Steven Whitehousea91ea692006-09-04 12:04:26 -0400168out_brelse:
David Teiglandb3b94fa2006-01-16 16:50:04 +0000169 brelse(dibh);
Steven Whitehousea91ea692006-09-04 12:04:26 -0400170out:
David Teiglandb3b94fa2006-01-16 16:50:04 +0000171 up_write(&ip->i_rw_mutex);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000172 return error;
173}
174
David Teiglandb3b94fa2006-01-16 16:50:04 +0000175
176/**
177 * find_metapath - Find path through the metadata tree
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000178 * @sdp: The superblock
David Teiglandb3b94fa2006-01-16 16:50:04 +0000179 * @mp: The metapath to return the result in
180 * @block: The disk block to look up
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000181 * @height: The pre-calculated height of the metadata tree
David Teiglandb3b94fa2006-01-16 16:50:04 +0000182 *
183 * This routine returns a struct metapath structure that defines a path
184 * through the metadata of inode "ip" to get to block "block".
185 *
186 * Example:
187 * Given: "ip" is a height 3 file, "offset" is 101342453, and this is a
188 * filesystem with a blocksize of 4096.
189 *
190 * find_metapath() would return a struct metapath structure set to:
 * mp_fheight = 3, mp_list[0] = 0, mp_list[1] = 48,
 * and mp_list[2] = 165.
193 *
194 * That means that in order to get to the block containing the byte at
195 * offset 101342453, we would load the indirect block pointed to by pointer
196 * 0 in the dinode. We would then load the indirect block pointed to by
197 * pointer 48 in that indirect block. We would then load the data block
198 * pointed to by pointer 165 in that indirect block.
199 *
200 * ----------------------------------------
201 * | Dinode | |
202 * | | 4|
203 * | |0 1 2 3 4 5 9|
204 * | | 6|
205 * ----------------------------------------
206 * |
207 * |
208 * V
209 * ----------------------------------------
210 * | Indirect Block |
211 * | 5|
212 * | 4 4 4 4 4 5 5 1|
213 * |0 5 6 7 8 9 0 1 2|
214 * ----------------------------------------
215 * |
216 * |
217 * V
218 * ----------------------------------------
219 * | Indirect Block |
220 * | 1 1 1 1 1 5|
221 * | 6 6 6 6 6 1|
222 * |0 3 4 5 6 7 2|
223 * ----------------------------------------
224 * |
225 * |
226 * V
227 * ----------------------------------------
228 * | Data block containing offset |
229 * | 101342453 |
230 * | |
231 * | |
232 * ----------------------------------------
233 *
234 */
235
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000236static void find_metapath(const struct gfs2_sbd *sdp, u64 block,
237 struct metapath *mp, unsigned int height)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000238{
David Teiglandb3b94fa2006-01-16 16:50:04 +0000239 unsigned int i;
240
Bob Peterson5f8bd442016-10-28 14:29:29 -0500241 mp->mp_fheight = height;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000242 for (i = height; i--;)
Bob Peterson7eabb772008-01-28 11:24:35 -0600243 mp->mp_list[i] = do_div(block, sdp->sd_inptrs);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000244}
245
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500246static inline unsigned int metapath_branch_start(const struct metapath *mp)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000247{
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500248 if (mp->mp_list[0] == 0)
249 return 2;
250 return 1;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000251}
252
David Teiglandb3b94fa2006-01-16 16:50:04 +0000253/**
Andreas Gruenbacher20cdc192017-09-22 07:39:54 -0500254 * metaptr1 - Return the first possible metadata pointer in a metapath buffer
Bob Petersond552a2b2017-02-06 08:28:32 -0500255 * @height: The metadata height (0 = dinode)
256 * @mp: The metapath
257 */
258static inline __be64 *metaptr1(unsigned int height, const struct metapath *mp)
259{
260 struct buffer_head *bh = mp->mp_bh[height];
261 if (height == 0)
262 return ((__be64 *)(bh->b_data + sizeof(struct gfs2_dinode)));
263 return ((__be64 *)(bh->b_data + sizeof(struct gfs2_meta_header)));
264}
265
266/**
David Teiglandb3b94fa2006-01-16 16:50:04 +0000267 * metapointer - Return pointer to start of metadata in a buffer
David Teiglandb3b94fa2006-01-16 16:50:04 +0000268 * @height: The metadata height (0 = dinode)
269 * @mp: The metapath
270 *
271 * Return a pointer to the block number of the next height of the metadata
272 * tree given a buffer containing the pointer to the current height of the
273 * metadata tree.
274 */
275
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000276static inline __be64 *metapointer(unsigned int height, const struct metapath *mp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000277{
Bob Petersond552a2b2017-02-06 08:28:32 -0500278 __be64 *p = metaptr1(height, mp);
279 return p + mp->mp_list[height];
David Teiglandb3b94fa2006-01-16 16:50:04 +0000280}
281
Steven Whitehouseb99b98d2011-09-21 11:05:16 +0100282static void gfs2_metapath_ra(struct gfs2_glock *gl,
283 const struct buffer_head *bh, const __be64 *pos)
284{
285 struct buffer_head *rabh;
286 const __be64 *endp = (const __be64 *)(bh->b_data + bh->b_size);
287 const __be64 *t;
288
289 for (t = pos; t < endp; t++) {
290 if (!*t)
291 continue;
292
293 rabh = gfs2_getbuf(gl, be64_to_cpu(*t), CREATE);
294 if (trylock_buffer(rabh)) {
295 if (!buffer_uptodate(rabh)) {
296 rabh->b_end_io = end_buffer_read_sync;
Coly Lie477b242017-07-21 07:48:22 -0500297 submit_bh(REQ_OP_READ,
298 REQ_RAHEAD | REQ_META | REQ_PRIO,
299 rabh);
Steven Whitehouseb99b98d2011-09-21 11:05:16 +0100300 continue;
301 }
302 unlock_buffer(rabh);
303 }
304 brelse(rabh);
305 }
306}
307
David Teiglandb3b94fa2006-01-16 16:50:04 +0000308/**
Bob Petersond552a2b2017-02-06 08:28:32 -0500309 * lookup_mp_height - helper function for lookup_metapath
310 * @ip: the inode
311 * @mp: the metapath
312 * @h: the height which needs looking up
313 */
314static int lookup_mp_height(struct gfs2_inode *ip, struct metapath *mp, int h)
315{
316 __be64 *ptr = metapointer(h, mp);
317 u64 dblock = be64_to_cpu(*ptr);
318
319 if (!dblock)
320 return h + 1;
321
322 return gfs2_meta_indirect_buffer(ip, h + 1, dblock, &mp->mp_bh[h + 1]);
323}
324
325/**
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000326 * lookup_metapath - Walk the metadata tree to a specific point
327 * @ip: The inode
David Teiglandb3b94fa2006-01-16 16:50:04 +0000328 * @mp: The metapath
David Teiglandb3b94fa2006-01-16 16:50:04 +0000329 *
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000330 * Assumes that the inode's buffer has already been looked up and
331 * hooked onto mp->mp_bh[0] and that the metapath has been initialised
332 * by find_metapath().
David Teiglandb3b94fa2006-01-16 16:50:04 +0000333 *
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000334 * If this function encounters part of the tree which has not been
335 * allocated, it returns the current height of the tree at the point
336 * at which it found the unallocated block. Blocks which are found are
337 * added to the mp->mp_bh[] list.
338 *
339 * Returns: error or height of metadata tree
David Teiglandb3b94fa2006-01-16 16:50:04 +0000340 */
341
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000342static int lookup_metapath(struct gfs2_inode *ip, struct metapath *mp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000343{
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000344 unsigned int end_of_metadata = ip->i_height - 1;
345 unsigned int x;
Steven Whitehousee23159d2008-02-12 14:48:39 +0000346 int ret;
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000347
348 for (x = 0; x < end_of_metadata; x++) {
Bob Petersond552a2b2017-02-06 08:28:32 -0500349 ret = lookup_mp_height(ip, mp, x);
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000350 if (ret)
Bob Peterson5f8bd442016-10-28 14:29:29 -0500351 goto out;
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000352 }
353
Bob Peterson5f8bd442016-10-28 14:29:29 -0500354 ret = ip->i_height;
355out:
356 mp->mp_aheight = ret;
357 return ret;
Steven Whitehousedbac6712008-01-29 09:12:55 +0000358}
359
Bob Petersond552a2b2017-02-06 08:28:32 -0500360/**
361 * fillup_metapath - fill up buffers for the metadata path to a specific height
362 * @ip: The inode
363 * @mp: The metapath
364 * @h: The height to which it should be mapped
365 *
366 * Similar to lookup_metapath, but does lookups for a range of heights
367 *
368 * Returns: error or height of metadata tree
369 */
370
371static int fillup_metapath(struct gfs2_inode *ip, struct metapath *mp, int h)
372{
373 unsigned int start_h = h - 1;
374 int ret;
375
376 if (h) {
377 /* find the first buffer we need to look up. */
378 while (start_h > 0 && mp->mp_bh[start_h] == NULL)
379 start_h--;
380 for (; start_h < h; start_h++) {
381 ret = lookup_mp_height(ip, mp, start_h);
382 if (ret)
383 return ret;
384 }
385 }
386 return ip->i_height;
387}
388
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000389static inline void release_metapath(struct metapath *mp)
Steven Whitehousedbac6712008-01-29 09:12:55 +0000390{
391 int i;
392
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000393 for (i = 0; i < GFS2_MAX_META_HEIGHT; i++) {
394 if (mp->mp_bh[i] == NULL)
395 break;
396 brelse(mp->mp_bh[i]);
397 }
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000398}
399
Steven Whitehouse30cbf182008-02-08 13:18:11 +0000400/**
401 * gfs2_extent_length - Returns length of an extent of blocks
402 * @start: Start of the buffer
403 * @len: Length of the buffer in bytes
404 * @ptr: Current position in the buffer
405 * @limit: Max extent length to return (0 = unlimited)
406 * @eob: Set to 1 if we hit "end of block"
407 *
408 * If the first block is zero (unallocated) it will return the number of
409 * unallocated blocks in the extent, otherwise it will return the number
410 * of contiguous blocks in the extent.
411 *
412 * Returns: The length of the extent (minimum of one block)
413 */
414
Bob Petersonb6507382014-08-06 09:08:36 -0400415static inline unsigned int gfs2_extent_length(void *start, unsigned int len, __be64 *ptr, size_t limit, int *eob)
Steven Whitehouse30cbf182008-02-08 13:18:11 +0000416{
417 const __be64 *end = (start + len);
418 const __be64 *first = ptr;
419 u64 d = be64_to_cpu(*ptr);
420
421 *eob = 0;
422 do {
423 ptr++;
424 if (ptr >= end)
425 break;
426 if (limit && --limit == 0)
427 break;
428 if (d)
429 d++;
430 } while(be64_to_cpu(*ptr) == d);
431 if (ptr >= end)
432 *eob = 1;
433 return (ptr - first);
434}
435
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000436static inline void bmap_lock(struct gfs2_inode *ip, int create)
Steven Whitehousefd88de562006-05-05 16:59:11 -0400437{
Steven Whitehousefd88de562006-05-05 16:59:11 -0400438 if (create)
439 down_write(&ip->i_rw_mutex);
440 else
441 down_read(&ip->i_rw_mutex);
442}
443
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000444static inline void bmap_unlock(struct gfs2_inode *ip, int create)
Steven Whitehousefd88de562006-05-05 16:59:11 -0400445{
David Teiglandb3b94fa2006-01-16 16:50:04 +0000446 if (create)
447 up_write(&ip->i_rw_mutex);
448 else
449 up_read(&ip->i_rw_mutex);
Steven Whitehousefd88de562006-05-05 16:59:11 -0400450}
David Teiglandb3b94fa2006-01-16 16:50:04 +0000451
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000452static inline __be64 *gfs2_indirect_init(struct metapath *mp,
453 struct gfs2_glock *gl, unsigned int i,
454 unsigned offset, u64 bn)
455{
456 __be64 *ptr = (__be64 *)(mp->mp_bh[i - 1]->b_data +
457 ((i > 1) ? sizeof(struct gfs2_meta_header) :
458 sizeof(struct gfs2_dinode)));
459 BUG_ON(i < 1);
460 BUG_ON(mp->mp_bh[i] != NULL);
461 mp->mp_bh[i] = gfs2_meta_new(gl, bn);
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000462 gfs2_trans_add_meta(gl, mp->mp_bh[i]);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000463 gfs2_metatype_set(mp->mp_bh[i], GFS2_METATYPE_IN, GFS2_FORMAT_IN);
464 gfs2_buffer_clear_tail(mp->mp_bh[i], sizeof(struct gfs2_meta_header));
465 ptr += offset;
466 *ptr = cpu_to_be64(bn);
467 return ptr;
468}
469
/* States of the block-initialisation state machine in gfs2_iomap_alloc() */
enum alloc_state {
	/* tree complete, adding data blocks */
	ALLOC_DATA = 0,
	/* branching from the existing tree */
	ALLOC_GROW_DEPTH = 1,
	/* growing the height of the tree */
	ALLOC_GROW_HEIGHT = 2,
	/* ALLOC_UNSTUFF = 3,   TBD and rather complicated */
};
476
Bob Petersond552a2b2017-02-06 08:28:32 -0500477static inline unsigned int hptrs(struct gfs2_sbd *sdp, const unsigned int hgt)
478{
479 if (hgt)
480 return sdp->sd_inptrs;
481 return sdp->sd_diptrs;
482}
483
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000484/**
485 * gfs2_bmap_alloc - Build a metadata tree of the requested height
486 * @inode: The GFS2 inode
487 * @lblock: The logical starting block of the extent
488 * @bh_map: This is used to return the mapping details
Bob Peterson5f8bd442016-10-28 14:29:29 -0500489 * @zero_new: True if newly allocated blocks should be zeroed
490 * @mp: The metapath, with proper height information calculated
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000491 * @maxlen: The max number of data blocks to alloc
Bob Peterson5f8bd442016-10-28 14:29:29 -0500492 * @dblock: Pointer to return the resulting new block
493 * @dblks: Pointer to return the number of blocks allocated
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000494 *
495 * In this routine we may have to alloc:
496 * i) Indirect blocks to grow the metadata tree height
497 * ii) Indirect blocks to fill in lower part of the metadata tree
498 * iii) Data blocks
499 *
500 * The function is in two parts. The first part works out the total
501 * number of blocks which we need. The second part does the actual
502 * allocation asking for an extent at a time (if enough contiguous free
503 * blocks are available, there will only be one request per bmap call)
504 * and uses the state machine to initialise the blocks in order.
505 *
506 * Returns: errno on error
507 */
508
Bob Peterson39743202017-02-16 10:27:16 -0500509static int gfs2_iomap_alloc(struct inode *inode, struct iomap *iomap,
510 unsigned flags, struct metapath *mp)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000511{
512 struct gfs2_inode *ip = GFS2_I(inode);
513 struct gfs2_sbd *sdp = GFS2_SB(inode);
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500514 struct super_block *sb = sdp->sd_vfs;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000515 struct buffer_head *dibh = mp->mp_bh[0];
Bob Peterson5f8bd442016-10-28 14:29:29 -0500516 u64 bn;
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500517 unsigned n, i, blks, alloced = 0, iblks = 0, branch_start = 0;
Bob Peterson39743202017-02-16 10:27:16 -0500518 unsigned dblks = 0;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000519 unsigned ptrs_per_blk;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500520 const unsigned end_of_metadata = mp->mp_fheight - 1;
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500521 int ret;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000522 enum alloc_state state;
523 __be64 *ptr;
524 __be64 zero_bn = 0;
Bob Peterson39743202017-02-16 10:27:16 -0500525 size_t maxlen = iomap->length >> inode->i_blkbits;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000526
Bob Peterson5f8bd442016-10-28 14:29:29 -0500527 BUG_ON(mp->mp_aheight < 1);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000528 BUG_ON(dibh == NULL);
529
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000530 gfs2_trans_add_meta(ip->i_gl, dibh);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000531
Bob Peterson5f8bd442016-10-28 14:29:29 -0500532 if (mp->mp_fheight == mp->mp_aheight) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000533 struct buffer_head *bh;
Bob Peterson39743202017-02-16 10:27:16 -0500534 int eob;
535
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000536 /* Bottom indirect block exists, find unalloced extent size */
537 ptr = metapointer(end_of_metadata, mp);
538 bh = mp->mp_bh[end_of_metadata];
Bob Peterson39743202017-02-16 10:27:16 -0500539 dblks = gfs2_extent_length(bh->b_data, bh->b_size, ptr,
540 maxlen, &eob);
541 BUG_ON(dblks < 1);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000542 state = ALLOC_DATA;
543 } else {
544 /* Need to allocate indirect blocks */
Bob Peterson5f8bd442016-10-28 14:29:29 -0500545 ptrs_per_blk = mp->mp_fheight > 1 ? sdp->sd_inptrs :
546 sdp->sd_diptrs;
Bob Peterson39743202017-02-16 10:27:16 -0500547 dblks = min(maxlen, (size_t)(ptrs_per_blk -
548 mp->mp_list[end_of_metadata]));
Bob Peterson5f8bd442016-10-28 14:29:29 -0500549 if (mp->mp_fheight == ip->i_height) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000550 /* Writing into existing tree, extend tree down */
Bob Peterson5f8bd442016-10-28 14:29:29 -0500551 iblks = mp->mp_fheight - mp->mp_aheight;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000552 state = ALLOC_GROW_DEPTH;
553 } else {
554 /* Building up tree height */
555 state = ALLOC_GROW_HEIGHT;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500556 iblks = mp->mp_fheight - ip->i_height;
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500557 branch_start = metapath_branch_start(mp);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500558 iblks += (mp->mp_fheight - branch_start);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000559 }
560 }
561
562 /* start of the second part of the function (state machine) */
563
Bob Peterson39743202017-02-16 10:27:16 -0500564 blks = dblks + iblks;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500565 i = mp->mp_aheight;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000566 do {
Steven Whitehouse09010972009-05-20 10:48:47 +0100567 int error;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000568 n = blks - alloced;
Bob Peterson6e87ed02011-11-18 10:58:32 -0500569 error = gfs2_alloc_blocks(ip, &bn, &n, 0, NULL);
Steven Whitehouse09010972009-05-20 10:48:47 +0100570 if (error)
571 return error;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000572 alloced += n;
573 if (state != ALLOC_DATA || gfs2_is_jdata(ip))
574 gfs2_trans_add_unrevoke(sdp, bn, n);
575 switch (state) {
576 /* Growing height of tree */
577 case ALLOC_GROW_HEIGHT:
578 if (i == 1) {
579 ptr = (__be64 *)(dibh->b_data +
580 sizeof(struct gfs2_dinode));
581 zero_bn = *ptr;
582 }
Bob Peterson5f8bd442016-10-28 14:29:29 -0500583 for (; i - 1 < mp->mp_fheight - ip->i_height && n > 0;
584 i++, n--)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000585 gfs2_indirect_init(mp, ip->i_gl, i, 0, bn++);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500586 if (i - 1 == mp->mp_fheight - ip->i_height) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000587 i--;
588 gfs2_buffer_copy_tail(mp->mp_bh[i],
589 sizeof(struct gfs2_meta_header),
590 dibh, sizeof(struct gfs2_dinode));
591 gfs2_buffer_clear_tail(dibh,
592 sizeof(struct gfs2_dinode) +
593 sizeof(__be64));
594 ptr = (__be64 *)(mp->mp_bh[i]->b_data +
595 sizeof(struct gfs2_meta_header));
596 *ptr = zero_bn;
597 state = ALLOC_GROW_DEPTH;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500598 for(i = branch_start; i < mp->mp_fheight; i++) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000599 if (mp->mp_bh[i] == NULL)
600 break;
601 brelse(mp->mp_bh[i]);
602 mp->mp_bh[i] = NULL;
603 }
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500604 i = branch_start;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000605 }
606 if (n == 0)
607 break;
608 /* Branching from existing tree */
609 case ALLOC_GROW_DEPTH:
Bob Peterson5f8bd442016-10-28 14:29:29 -0500610 if (i > 1 && i < mp->mp_fheight)
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000611 gfs2_trans_add_meta(ip->i_gl, mp->mp_bh[i-1]);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500612 for (; i < mp->mp_fheight && n > 0; i++, n--)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000613 gfs2_indirect_init(mp, ip->i_gl, i,
614 mp->mp_list[i-1], bn++);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500615 if (i == mp->mp_fheight)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000616 state = ALLOC_DATA;
617 if (n == 0)
618 break;
619 /* Tree complete, adding data blocks */
620 case ALLOC_DATA:
Bob Peterson39743202017-02-16 10:27:16 -0500621 BUG_ON(n > dblks);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000622 BUG_ON(mp->mp_bh[end_of_metadata] == NULL);
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000623 gfs2_trans_add_meta(ip->i_gl, mp->mp_bh[end_of_metadata]);
Bob Peterson39743202017-02-16 10:27:16 -0500624 dblks = n;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000625 ptr = metapointer(end_of_metadata, mp);
Bob Peterson39743202017-02-16 10:27:16 -0500626 iomap->addr = bn << inode->i_blkbits;
627 iomap->flags |= IOMAP_F_NEW;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000628 while (n-- > 0)
629 *ptr++ = cpu_to_be64(bn++);
Bob Peterson39743202017-02-16 10:27:16 -0500630 if (flags & IOMAP_ZERO) {
631 ret = sb_issue_zeroout(sb, iomap->addr >> inode->i_blkbits,
632 dblks, GFP_NOFS);
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500633 if (ret) {
634 fs_err(sdp,
635 "Failed to zero data buffers\n");
Bob Peterson39743202017-02-16 10:27:16 -0500636 flags &= ~IOMAP_ZERO;
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500637 }
638 }
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000639 break;
640 }
Bob Peterson39743202017-02-16 10:27:16 -0500641 } while (iomap->addr == IOMAP_NULL_ADDR);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000642
Bob Peterson39743202017-02-16 10:27:16 -0500643 iomap->length = (u64)dblks << inode->i_blkbits;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500644 ip->i_height = mp->mp_fheight;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000645 gfs2_add_inode_blocks(&ip->i_inode, alloced);
646 gfs2_dinode_out(ip, mp->mp_bh[0]->b_data);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000647 return 0;
648}
649
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500650/**
Bob Peterson39743202017-02-16 10:27:16 -0500651 * hole_size - figure out the size of a hole
652 * @inode: The inode
653 * @lblock: The logical starting block number
654 * @mp: The metapath
655 *
656 * Returns: The hole size in bytes
657 *
658 */
659static u64 hole_size(struct inode *inode, sector_t lblock, struct metapath *mp)
660{
661 struct gfs2_inode *ip = GFS2_I(inode);
662 struct gfs2_sbd *sdp = GFS2_SB(inode);
663 struct metapath mp_eof;
664 u64 factor = 1;
665 int hgt;
666 u64 holesz = 0;
667 const __be64 *first, *end, *ptr;
668 const struct buffer_head *bh;
669 u64 lblock_stop = (i_size_read(inode) - 1) >> inode->i_blkbits;
670 int zeroptrs;
671 bool done = false;
672
673 /* Get another metapath, to the very last byte */
674 find_metapath(sdp, lblock_stop, &mp_eof, ip->i_height);
675 for (hgt = ip->i_height - 1; hgt >= 0 && !done; hgt--) {
676 bh = mp->mp_bh[hgt];
677 if (bh) {
678 zeroptrs = 0;
679 first = metapointer(hgt, mp);
680 end = (const __be64 *)(bh->b_data + bh->b_size);
681
682 for (ptr = first; ptr < end; ptr++) {
683 if (*ptr) {
684 done = true;
685 break;
686 } else {
687 zeroptrs++;
688 }
689 }
690 } else {
691 zeroptrs = sdp->sd_inptrs;
692 }
693 if (factor * zeroptrs >= lblock_stop - lblock + 1) {
694 holesz = lblock_stop - lblock + 1;
695 break;
696 }
697 holesz += factor * zeroptrs;
698
699 factor *= sdp->sd_inptrs;
700 if (hgt && (mp->mp_list[hgt - 1] < mp_eof.mp_list[hgt - 1]))
701 (mp->mp_list[hgt - 1])++;
702 }
703 return holesz << inode->i_blkbits;
704}
705
706static void gfs2_stuffed_iomap(struct inode *inode, struct iomap *iomap)
707{
708 struct gfs2_inode *ip = GFS2_I(inode);
709
710 iomap->addr = (ip->i_no_addr << inode->i_blkbits) +
711 sizeof(struct gfs2_dinode);
712 iomap->offset = 0;
713 iomap->length = i_size_read(inode);
714 iomap->type = IOMAP_MAPPED;
715 iomap->flags = IOMAP_F_DATA_INLINE;
716}
717
718/**
719 * gfs2_iomap_begin - Map blocks from an inode to disk blocks
720 * @inode: The inode
721 * @pos: Starting position in bytes
722 * @length: Length to map, in bytes
723 * @flags: iomap flags
724 * @iomap: The iomap structure
725 *
726 * Returns: errno
727 */
728int gfs2_iomap_begin(struct inode *inode, loff_t pos, loff_t length,
729 unsigned flags, struct iomap *iomap)
730{
731 struct gfs2_inode *ip = GFS2_I(inode);
732 struct gfs2_sbd *sdp = GFS2_SB(inode);
733 struct metapath mp = { .mp_aheight = 1, };
734 unsigned int factor = sdp->sd_sb.sb_bsize;
735 const u64 *arr = sdp->sd_heightsize;
736 __be64 *ptr;
737 sector_t lblock;
738 sector_t lend;
739 int ret;
740 int eob;
741 unsigned int len;
742 struct buffer_head *bh;
743 u8 height;
744
745 trace_gfs2_iomap_start(ip, pos, length, flags);
746 if (!length) {
747 ret = -EINVAL;
748 goto out;
749 }
750
751 if ((flags & IOMAP_REPORT) && gfs2_is_stuffed(ip)) {
752 gfs2_stuffed_iomap(inode, iomap);
753 if (pos >= iomap->length)
754 return -ENOENT;
755 ret = 0;
756 goto out;
757 }
758
759 lblock = pos >> inode->i_blkbits;
760 lend = (pos + length + sdp->sd_sb.sb_bsize - 1) >> inode->i_blkbits;
761
762 iomap->offset = lblock << inode->i_blkbits;
763 iomap->addr = IOMAP_NULL_ADDR;
764 iomap->type = IOMAP_HOLE;
765 iomap->length = (u64)(lend - lblock) << inode->i_blkbits;
766 iomap->flags = IOMAP_F_MERGED;
767 bmap_lock(ip, 0);
768
769 /*
770 * Directory data blocks have a struct gfs2_meta_header header, so the
771 * remaining size is smaller than the filesystem block size. Logical
772 * block numbers for directories are in units of this remaining size!
773 */
774 if (gfs2_is_dir(ip)) {
775 factor = sdp->sd_jbsize;
776 arr = sdp->sd_jheightsize;
777 }
778
779 ret = gfs2_meta_inode_buffer(ip, &mp.mp_bh[0]);
780 if (ret)
781 goto out_release;
782
783 height = ip->i_height;
784 while ((lblock + 1) * factor > arr[height])
785 height++;
786 find_metapath(sdp, lblock, &mp, height);
787 if (height > ip->i_height || gfs2_is_stuffed(ip))
788 goto do_alloc;
789
790 ret = lookup_metapath(ip, &mp);
791 if (ret < 0)
792 goto out_release;
793
794 if (mp.mp_aheight != ip->i_height)
795 goto do_alloc;
796
797 ptr = metapointer(ip->i_height - 1, &mp);
798 if (*ptr == 0)
799 goto do_alloc;
800
801 iomap->type = IOMAP_MAPPED;
802 iomap->addr = be64_to_cpu(*ptr) << inode->i_blkbits;
803
804 bh = mp.mp_bh[ip->i_height - 1];
805 len = gfs2_extent_length(bh->b_data, bh->b_size, ptr, lend - lblock, &eob);
806 if (eob)
807 iomap->flags |= IOMAP_F_BOUNDARY;
808 iomap->length = (u64)len << inode->i_blkbits;
809
810 ret = 0;
811
812out_release:
813 release_metapath(&mp);
814 bmap_unlock(ip, 0);
815out:
816 trace_gfs2_iomap_end(ip, iomap, ret);
817 return ret;
818
819do_alloc:
820 if (!(flags & IOMAP_WRITE)) {
821 if (pos >= i_size_read(inode)) {
822 ret = -ENOENT;
823 goto out_release;
824 }
825 ret = 0;
826 iomap->length = hole_size(inode, lblock, &mp);
827 goto out_release;
828 }
829
830 ret = gfs2_iomap_alloc(inode, iomap, flags, &mp);
831 goto out_release;
832}
833
834/**
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500835 * gfs2_block_map - Map a block from an inode to a disk block
836 * @inode: The inode
837 * @lblock: The logical block number
838 * @bh_map: The bh to be mapped
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000839 * @create: True if its ok to alloc blocks to satify the request
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500840 *
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000841 * Sets buffer_mapped() if successful, sets buffer_boundary() if a
842 * read of metadata will be required before the next block can be
843 * mapped. Sets buffer_new() if new blocks were allocated.
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500844 *
845 * Returns: errno
846 */
847
Bob Petersone9e1ef22007-12-10 14:13:27 -0600848int gfs2_block_map(struct inode *inode, sector_t lblock,
849 struct buffer_head *bh_map, int create)
Steven Whitehousefd88de562006-05-05 16:59:11 -0400850{
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500851 struct gfs2_inode *ip = GFS2_I(inode);
Bob Peterson39743202017-02-16 10:27:16 -0500852 struct iomap iomap;
853 int ret, flags = 0;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000854
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500855 clear_buffer_mapped(bh_map);
856 clear_buffer_new(bh_map);
857 clear_buffer_boundary(bh_map);
Steven Whitehouse63997772009-06-12 08:49:20 +0100858 trace_gfs2_bmap(ip, bh_map, lblock, create, 1);
Andreas Gruenbacher20cdc192017-09-22 07:39:54 -0500859
Bob Peterson39743202017-02-16 10:27:16 -0500860 if (create)
861 flags |= IOMAP_WRITE;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500862 if (buffer_zeronew(bh_map))
Bob Peterson39743202017-02-16 10:27:16 -0500863 flags |= IOMAP_ZERO;
864 ret = gfs2_iomap_begin(inode, (loff_t)lblock << inode->i_blkbits,
865 bh_map->b_size, flags, &iomap);
866 if (ret) {
867 if (!create && ret == -ENOENT) {
868 /* Return unmapped buffer beyond the end of file. */
869 ret = 0;
870 }
871 goto out;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500872 }
Bob Peterson39743202017-02-16 10:27:16 -0500873
874 if (iomap.length > bh_map->b_size) {
875 iomap.length = bh_map->b_size;
876 iomap.flags &= ~IOMAP_F_BOUNDARY;
877 }
878 if (iomap.addr != IOMAP_NULL_ADDR)
879 map_bh(bh_map, inode->i_sb, iomap.addr >> inode->i_blkbits);
880 bh_map->b_size = iomap.length;
881 if (iomap.flags & IOMAP_F_BOUNDARY)
882 set_buffer_boundary(bh_map);
883 if (iomap.flags & IOMAP_F_NEW)
884 set_buffer_new(bh_map);
885
886out:
887 trace_gfs2_bmap(ip, bh_map, lblock, create, ret);
888 return ret;
Steven Whitehousefd88de562006-05-05 16:59:11 -0400889}
890
Steven Whitehouse941e6d72008-01-28 08:47:38 +0000891/*
892 * Deprecated: do not use in new code
893 */
Steven Whitehousefd88de562006-05-05 16:59:11 -0400894int gfs2_extent_map(struct inode *inode, u64 lblock, int *new, u64 *dblock, unsigned *extlen)
895{
Steven Whitehouse23591252006-10-13 17:25:45 -0400896 struct buffer_head bh = { .b_state = 0, .b_blocknr = 0 };
Steven Whitehouse7a6bbac2006-09-18 17:18:23 -0400897 int ret;
Steven Whitehousefd88de562006-05-05 16:59:11 -0400898 int create = *new;
899
900 BUG_ON(!extlen);
901 BUG_ON(!dblock);
902 BUG_ON(!new);
903
Fabian Frederick47a9a522016-08-02 12:05:27 -0500904 bh.b_size = BIT(inode->i_blkbits + (create ? 0 : 5));
Bob Petersone9e1ef22007-12-10 14:13:27 -0600905 ret = gfs2_block_map(inode, lblock, &bh, create);
Steven Whitehouse7a6bbac2006-09-18 17:18:23 -0400906 *extlen = bh.b_size >> inode->i_blkbits;
907 *dblock = bh.b_blocknr;
908 if (buffer_new(&bh))
909 *new = 1;
910 else
911 *new = 0;
912 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000913}
914
915/**
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400916 * gfs2_block_truncate_page - Deal with zeroing out data for truncate
917 *
918 * This is partly borrowed from ext3.
919 */
Steven Whitehouseff8f33c2010-08-11 09:37:53 +0100920static int gfs2_block_truncate_page(struct address_space *mapping, loff_t from)
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400921{
922 struct inode *inode = mapping->host;
923 struct gfs2_inode *ip = GFS2_I(inode);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300924 unsigned long index = from >> PAGE_SHIFT;
925 unsigned offset = from & (PAGE_SIZE-1);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400926 unsigned blocksize, iblock, length, pos;
927 struct buffer_head *bh;
928 struct page *page;
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400929 int err;
930
Bob Peterson220cca22012-03-19 15:25:50 -0400931 page = find_or_create_page(mapping, index, GFP_NOFS);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400932 if (!page)
933 return 0;
934
935 blocksize = inode->i_sb->s_blocksize;
936 length = blocksize - (offset & (blocksize - 1));
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300937 iblock = index << (PAGE_SHIFT - inode->i_sb->s_blocksize_bits);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400938
939 if (!page_has_buffers(page))
940 create_empty_buffers(page, blocksize, 0);
941
942 /* Find the buffer that contains "offset" */
943 bh = page_buffers(page);
944 pos = blocksize;
945 while (offset >= pos) {
946 bh = bh->b_this_page;
947 iblock++;
948 pos += blocksize;
949 }
950
951 err = 0;
952
953 if (!buffer_mapped(bh)) {
Bob Petersone9e1ef22007-12-10 14:13:27 -0600954 gfs2_block_map(inode, iblock, bh, 0);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400955 /* unmapped? It's a hole - nothing to do */
956 if (!buffer_mapped(bh))
957 goto unlock;
958 }
959
960 /* Ok, it's mapped. Make sure it's up-to-date */
961 if (PageUptodate(page))
962 set_buffer_uptodate(bh);
963
964 if (!buffer_uptodate(bh)) {
965 err = -EIO;
Mike Christiedfec8a12016-06-05 14:31:44 -0500966 ll_rw_block(REQ_OP_READ, 0, 1, &bh);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400967 wait_on_buffer(bh);
968 /* Uhhuh. Read error. Complain and punt. */
969 if (!buffer_uptodate(bh))
970 goto unlock;
S. Wendy Cheng1875f2f2007-06-25 21:14:31 -0400971 err = 0;
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400972 }
973
Steven Whitehousebf36a712007-10-17 08:35:19 +0100974 if (!gfs2_is_writeback(ip))
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000975 gfs2_trans_add_data(ip->i_gl, bh);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400976
Christoph Lametereebd2aa2008-02-04 22:28:29 -0800977 zero_user(page, offset, length);
Steven Whitehouse40bc9a22009-06-10 09:09:40 +0100978 mark_buffer_dirty(bh);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400979unlock:
980 unlock_page(page);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300981 put_page(page);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400982 return err;
983}
984
Fabian Frederickc62baf62014-05-14 18:32:31 +0200985#define GFS2_JTRUNC_REVOKES 8192
986
Steven Whitehousefa731fc2012-11-13 09:50:28 +0000987/**
988 * gfs2_journaled_truncate - Wrapper for truncate_pagecache for jdata files
989 * @inode: The inode being truncated
990 * @oldsize: The original (larger) size
991 * @newsize: The new smaller size
992 *
993 * With jdata files, we have to journal a revoke for each block which is
994 * truncated. As a result, we need to split this into separate transactions
995 * if the number of pages being truncated gets too large.
996 */
997
Steven Whitehousefa731fc2012-11-13 09:50:28 +0000998static int gfs2_journaled_truncate(struct inode *inode, u64 oldsize, u64 newsize)
999{
1000 struct gfs2_sbd *sdp = GFS2_SB(inode);
1001 u64 max_chunk = GFS2_JTRUNC_REVOKES * sdp->sd_vfs->s_blocksize;
1002 u64 chunk;
1003 int error;
1004
1005 while (oldsize != newsize) {
1006 chunk = oldsize - newsize;
1007 if (chunk > max_chunk)
1008 chunk = max_chunk;
Kirill A. Shutemov7caef262013-09-12 15:13:56 -07001009 truncate_pagecache(inode, oldsize - chunk);
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001010 oldsize -= chunk;
1011 gfs2_trans_end(sdp);
1012 error = gfs2_trans_begin(sdp, RES_DINODE, GFS2_JTRUNC_REVOKES);
1013 if (error)
1014 return error;
1015 }
1016
1017 return 0;
1018}
1019
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001020static int trunc_start(struct inode *inode, u64 oldsize, u64 newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001021{
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001022 struct gfs2_inode *ip = GFS2_I(inode);
1023 struct gfs2_sbd *sdp = GFS2_SB(inode);
1024 struct address_space *mapping = inode->i_mapping;
Andreas Gruenbacher80990f42017-12-12 16:42:01 +01001025 struct buffer_head *dibh = NULL;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001026 int journaled = gfs2_is_jdata(ip);
1027 int error;
1028
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001029 if (journaled)
1030 error = gfs2_trans_begin(sdp, RES_DINODE + RES_JDATA, GFS2_JTRUNC_REVOKES);
1031 else
1032 error = gfs2_trans_begin(sdp, RES_DINODE, 0);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001033 if (error)
1034 return error;
1035
1036 error = gfs2_meta_inode_buffer(ip, &dibh);
1037 if (error)
1038 goto out;
1039
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001040 gfs2_trans_add_meta(ip->i_gl, dibh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001041
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001042 if (gfs2_is_stuffed(ip)) {
1043 gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode) + newsize);
1044 } else {
1045 if (newsize & (u64)(sdp->sd_sb.sb_bsize - 1)) {
1046 error = gfs2_block_truncate_page(mapping, newsize);
1047 if (error)
Andreas Gruenbacher80990f42017-12-12 16:42:01 +01001048 goto out;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001049 }
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001050 ip->i_diskflags |= GFS2_DIF_TRUNC_IN_PROG;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001051 }
1052
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001053 i_size_write(inode, newsize);
Deepa Dinamani078cd822016-09-14 07:48:04 -07001054 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001055 gfs2_dinode_out(ip, dibh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001056
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001057 if (journaled)
1058 error = gfs2_journaled_truncate(inode, oldsize, newsize);
1059 else
Kirill A. Shutemov7caef262013-09-12 15:13:56 -07001060 truncate_pagecache(inode, newsize);
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001061
Steven Whitehousea91ea692006-09-04 12:04:26 -04001062out:
Andreas Gruenbacher80990f42017-12-12 16:42:01 +01001063 brelse(dibh);
1064 if (current->journal_info)
1065 gfs2_trans_end(sdp);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001066 return error;
1067}
1068
Bob Petersond552a2b2017-02-06 08:28:32 -05001069/**
1070 * sweep_bh_for_rgrps - find an rgrp in a meta buffer and free blocks therein
1071 * @ip: inode
1072 * @rg_gh: holder of resource group glock
1073 * @mp: current metapath fully populated with buffers
1074 * @btotal: place to keep count of total blocks freed
1075 * @hgt: height we're processing
1076 * @first: true if this is the first call to this function for this height
1077 *
1078 * We sweep a metadata buffer (provided by the metapath) for blocks we need to
1079 * free, and free them all. However, we do it one rgrp at a time. If this
1080 * block has references to multiple rgrps, we break it into individual
1081 * transactions. This allows other processes to use the rgrps while we're
1082 * focused on a single one, for better concurrency / performance.
1083 * At every transaction boundary, we rewrite the inode into the journal.
1084 * That way the bitmaps are kept consistent with the inode and we can recover
1085 * if we're interrupted by power-outages.
1086 *
1087 * Returns: 0, or return code if an error occurred.
1088 * *btotal has the total number of blocks freed
1089 */
1090static int sweep_bh_for_rgrps(struct gfs2_inode *ip, struct gfs2_holder *rd_gh,
1091 const struct metapath *mp, u32 *btotal, int hgt,
1092 bool preserve1)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001093{
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +00001094 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Bob Petersond552a2b2017-02-06 08:28:32 -05001095 struct gfs2_rgrpd *rgd;
1096 struct gfs2_trans *tr;
1097 struct buffer_head *bh = mp->mp_bh[hgt];
1098 __be64 *top, *bottom, *p;
1099 int blks_outside_rgrp;
1100 u64 bn, bstart, isize_blks;
1101 s64 blen; /* needs to be s64 or gfs2_add_inode_blocks breaks */
1102 int meta = ((hgt != ip->i_height - 1) ? 1 : 0);
1103 int ret = 0;
1104 bool buf_in_tr = false; /* buffer was added to transaction */
David Teiglandb3b94fa2006-01-16 16:50:04 +00001105
Bob Petersond552a2b2017-02-06 08:28:32 -05001106 if (gfs2_metatype_check(sdp, bh,
1107 (hgt ? GFS2_METATYPE_IN : GFS2_METATYPE_DI)))
1108 return -EIO;
1109
1110more_rgrps:
1111 blks_outside_rgrp = 0;
1112 bstart = 0;
1113 blen = 0;
1114 top = metapointer(hgt, mp); /* first ptr from metapath */
1115 /* If we're keeping some data at the truncation point, we've got to
1116 preserve the metadata tree by adding 1 to the starting metapath. */
1117 if (preserve1)
1118 top++;
1119
1120 bottom = (__be64 *)(bh->b_data + bh->b_size);
1121
1122 for (p = top; p < bottom; p++) {
1123 if (!*p)
1124 continue;
1125 bn = be64_to_cpu(*p);
1126 if (gfs2_holder_initialized(rd_gh)) {
Andreas Gruenbacher6f6597ba2017-06-30 07:55:08 -05001127 rgd = gfs2_glock2rgrp(rd_gh->gh_gl);
Bob Petersond552a2b2017-02-06 08:28:32 -05001128 gfs2_assert_withdraw(sdp,
1129 gfs2_glock_is_locked_by_me(rd_gh->gh_gl));
1130 } else {
Steven Whitehouse90bcab92017-12-22 13:13:07 +01001131 rgd = gfs2_blk2rgrpd(sdp, bn, true);
Bob Petersond552a2b2017-02-06 08:28:32 -05001132 ret = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_EXCLUSIVE,
1133 0, rd_gh);
1134 if (ret)
1135 goto out;
1136
1137 /* Must be done with the rgrp glock held: */
1138 if (gfs2_rs_active(&ip->i_res) &&
1139 rgd == ip->i_res.rs_rbm.rgd)
1140 gfs2_rs_deltree(&ip->i_res);
1141 }
1142
1143 if (!rgrp_contains_block(rgd, bn)) {
1144 blks_outside_rgrp++;
1145 continue;
1146 }
1147
1148 /* The size of our transactions will be unknown until we
1149 actually process all the metadata blocks that relate to
1150 the rgrp. So we estimate. We know it can't be more than
1151 the dinode's i_blocks and we don't want to exceed the
1152 journal flush threshold, sd_log_thresh2. */
1153 if (current->journal_info == NULL) {
1154 unsigned int jblocks_rqsted, revokes;
1155
1156 jblocks_rqsted = rgd->rd_length + RES_DINODE +
1157 RES_INDIRECT;
1158 isize_blks = gfs2_get_inode_blocks(&ip->i_inode);
1159 if (isize_blks > atomic_read(&sdp->sd_log_thresh2))
1160 jblocks_rqsted +=
1161 atomic_read(&sdp->sd_log_thresh2);
1162 else
1163 jblocks_rqsted += isize_blks;
1164 revokes = jblocks_rqsted;
1165 if (meta)
1166 revokes += hptrs(sdp, hgt);
1167 else if (ip->i_depth)
1168 revokes += sdp->sd_inptrs;
1169 ret = gfs2_trans_begin(sdp, jblocks_rqsted, revokes);
1170 if (ret)
1171 goto out_unlock;
1172 down_write(&ip->i_rw_mutex);
1173 }
1174 /* check if we will exceed the transaction blocks requested */
1175 tr = current->journal_info;
1176 if (tr->tr_num_buf_new + RES_STATFS +
1177 RES_QUOTA >= atomic_read(&sdp->sd_log_thresh2)) {
1178 /* We set blks_outside_rgrp to ensure the loop will
1179 be repeated for the same rgrp, but with a new
1180 transaction. */
1181 blks_outside_rgrp++;
1182 /* This next part is tricky. If the buffer was added
1183 to the transaction, we've already set some block
1184 pointers to 0, so we better follow through and free
1185 them, or we will introduce corruption (so break).
1186 This may be impossible, or at least rare, but I
1187 decided to cover the case regardless.
1188
1189 If the buffer was not added to the transaction
1190 (this call), doing so would exceed our transaction
1191 size, so we need to end the transaction and start a
1192 new one (so goto). */
1193
1194 if (buf_in_tr)
1195 break;
1196 goto out_unlock;
1197 }
1198
1199 gfs2_trans_add_meta(ip->i_gl, bh);
1200 buf_in_tr = true;
1201 *p = 0;
1202 if (bstart + blen == bn) {
1203 blen++;
1204 continue;
1205 }
1206 if (bstart) {
1207 __gfs2_free_blocks(ip, bstart, (u32)blen, meta);
1208 (*btotal) += blen;
1209 gfs2_add_inode_blocks(&ip->i_inode, -blen);
1210 }
1211 bstart = bn;
1212 blen = 1;
1213 }
1214 if (bstart) {
1215 __gfs2_free_blocks(ip, bstart, (u32)blen, meta);
1216 (*btotal) += blen;
1217 gfs2_add_inode_blocks(&ip->i_inode, -blen);
1218 }
1219out_unlock:
1220 if (!ret && blks_outside_rgrp) { /* If buffer still has non-zero blocks
1221 outside the rgrp we just processed,
1222 do it all over again. */
1223 if (current->journal_info) {
1224 struct buffer_head *dibh = mp->mp_bh[0];
1225
1226 /* Every transaction boundary, we rewrite the dinode
1227 to keep its di_blocks current in case of failure. */
1228 ip->i_inode.i_mtime = ip->i_inode.i_ctime =
Stephen Rothwellb32c8c72017-05-08 15:59:34 -07001229 current_time(&ip->i_inode);
Bob Petersond552a2b2017-02-06 08:28:32 -05001230 gfs2_trans_add_meta(ip->i_gl, dibh);
1231 gfs2_dinode_out(ip, dibh->b_data);
1232 up_write(&ip->i_rw_mutex);
1233 gfs2_trans_end(sdp);
1234 }
1235 gfs2_glock_dq_uninit(rd_gh);
1236 cond_resched();
1237 goto more_rgrps;
1238 }
1239out:
1240 return ret;
1241}
1242
1243/**
1244 * find_nonnull_ptr - find a non-null pointer given a metapath and height
1245 * assumes the metapath is valid (with buffers) out to height h
1246 * @mp: starting metapath
1247 * @h: desired height to search
1248 *
1249 * Returns: true if a non-null pointer was found in the metapath buffer
1250 * false if all remaining pointers are NULL in the buffer
1251 */
1252static bool find_nonnull_ptr(struct gfs2_sbd *sdp, struct metapath *mp,
1253 unsigned int h)
1254{
1255 __be64 *ptr;
1256 unsigned int ptrs = hptrs(sdp, h) - 1;
1257
1258 while (true) {
1259 ptr = metapointer(h, mp);
Bob Petersonc4a9d182017-08-30 09:26:09 -05001260 if (*ptr) { /* if we have a non-null pointer */
1261 /* Now zero the metapath after the current height. */
1262 h++;
1263 if (h < GFS2_MAX_META_HEIGHT)
1264 memset(&mp->mp_list[h], 0,
1265 (GFS2_MAX_META_HEIGHT - h) *
1266 sizeof(mp->mp_list[0]));
Bob Petersond552a2b2017-02-06 08:28:32 -05001267 return true;
Bob Petersonc4a9d182017-08-30 09:26:09 -05001268 }
Bob Petersond552a2b2017-02-06 08:28:32 -05001269
1270 if (mp->mp_list[h] < ptrs)
1271 mp->mp_list[h]++;
1272 else
1273 return false; /* no more pointers in this buffer */
1274 }
1275}
1276
/* States of the trunc_dealloc() state machine (numbered from 0 upwards) */
enum dealloc_states {
	DEALLOC_MP_FULL,	/* Strip a metapath with all buffers read in */
	DEALLOC_MP_LOWER,	/* lower the metapath strip height */
	DEALLOC_FILL_MP,	/* Fill in the metapath to the given height. */
	DEALLOC_DONE,		/* process complete */
};
1283
Bob Petersonc4a9d182017-08-30 09:26:09 -05001284static bool mp_eq_to_hgt(struct metapath *mp, __u16 *nbof, unsigned int h)
1285{
1286 if (memcmp(mp->mp_list, nbof, h * sizeof(mp->mp_list[0])))
1287 return false;
1288 return true;
1289}
1290
Bob Petersond552a2b2017-02-06 08:28:32 -05001291/**
1292 * trunc_dealloc - truncate a file down to a desired size
1293 * @ip: inode to truncate
1294 * @newsize: The desired size of the file
1295 *
1296 * This function truncates a file to newsize. It works from the
1297 * bottom up, and from the right to the left. In other words, it strips off
1298 * the highest layer (data) before stripping any of the metadata. Doing it
1299 * this way is best in case the operation is interrupted by power failure, etc.
1300 * The dinode is rewritten in every transaction to guarantee integrity.
1301 */
1302static int trunc_dealloc(struct gfs2_inode *ip, u64 newsize)
1303{
1304 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1305 struct metapath mp;
1306 struct buffer_head *dibh, *bh;
1307 struct gfs2_holder rd_gh;
1308 u64 lblock;
1309 __u16 nbof[GFS2_MAX_META_HEIGHT]; /* new beginning of truncation */
1310 unsigned int strip_h = ip->i_height - 1;
1311 u32 btotal = 0;
1312 int ret, state;
1313 int mp_h; /* metapath buffers are read in to this height */
1314 sector_t last_ra = 0;
1315 u64 prev_bnr = 0;
1316 bool preserve1; /* need to preserve the first meta pointer? */
1317
1318 if (!newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001319 lblock = 0;
Steven Whitehouse18ec7d52006-02-08 11:50:51 +00001320 else
Bob Petersond552a2b2017-02-06 08:28:32 -05001321 lblock = (newsize - 1) >> sdp->sd_sb.sb_bsize_shift;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001322
Bob Petersond552a2b2017-02-06 08:28:32 -05001323 memset(&mp, 0, sizeof(mp));
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +00001324 find_metapath(sdp, lblock, &mp, ip->i_height);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001325
Bob Petersond552a2b2017-02-06 08:28:32 -05001326 memcpy(&nbof, &mp.mp_list, sizeof(nbof));
David Teiglandb3b94fa2006-01-16 16:50:04 +00001327
Bob Petersond552a2b2017-02-06 08:28:32 -05001328 ret = gfs2_meta_inode_buffer(ip, &dibh);
1329 if (ret)
1330 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001331
Bob Petersond552a2b2017-02-06 08:28:32 -05001332 mp.mp_bh[0] = dibh;
1333 ret = lookup_metapath(ip, &mp);
1334 if (ret == ip->i_height)
1335 state = DEALLOC_MP_FULL; /* We have a complete metapath */
1336 else
1337 state = DEALLOC_FILL_MP; /* deal with partial metapath */
1338
1339 ret = gfs2_rindex_update(sdp);
1340 if (ret)
1341 goto out_metapath;
1342
1343 ret = gfs2_quota_hold(ip, NO_UID_QUOTA_CHANGE, NO_GID_QUOTA_CHANGE);
1344 if (ret)
1345 goto out_metapath;
1346 gfs2_holder_mark_uninitialized(&rd_gh);
1347
1348 mp_h = strip_h;
1349
1350 while (state != DEALLOC_DONE) {
1351 switch (state) {
1352 /* Truncate a full metapath at the given strip height.
1353 * Note that strip_h == mp_h in order to be in this state. */
1354 case DEALLOC_MP_FULL:
1355 if (mp_h > 0) { /* issue read-ahead on metadata */
1356 __be64 *top;
1357
1358 bh = mp.mp_bh[mp_h - 1];
1359 if (bh->b_blocknr != last_ra) {
1360 last_ra = bh->b_blocknr;
1361 top = metaptr1(mp_h - 1, &mp);
1362 gfs2_metapath_ra(ip->i_gl, bh, top);
1363 }
1364 }
1365 /* If we're truncating to a non-zero size and the mp is
1366 at the beginning of file for the strip height, we
1367 need to preserve the first metadata pointer. */
Bob Petersonc4a9d182017-08-30 09:26:09 -05001368 preserve1 = (newsize && mp_eq_to_hgt(&mp, nbof, mp_h));
Bob Petersond552a2b2017-02-06 08:28:32 -05001369 bh = mp.mp_bh[mp_h];
1370 gfs2_assert_withdraw(sdp, bh);
1371 if (gfs2_assert_withdraw(sdp,
1372 prev_bnr != bh->b_blocknr)) {
1373 printk(KERN_EMERG "GFS2: fsid=%s:inode %llu, "
1374 "block:%llu, i_h:%u, s_h:%u, mp_h:%u\n",
1375 sdp->sd_fsname,
1376 (unsigned long long)ip->i_no_addr,
1377 prev_bnr, ip->i_height, strip_h, mp_h);
1378 }
1379 prev_bnr = bh->b_blocknr;
1380 ret = sweep_bh_for_rgrps(ip, &rd_gh, &mp, &btotal,
1381 mp_h, preserve1);
1382 /* If we hit an error or just swept dinode buffer,
1383 just exit. */
1384 if (ret || !mp_h) {
1385 state = DEALLOC_DONE;
1386 break;
1387 }
1388 state = DEALLOC_MP_LOWER;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001389 break;
Bob Petersond552a2b2017-02-06 08:28:32 -05001390
1391 /* lower the metapath strip height */
1392 case DEALLOC_MP_LOWER:
1393 /* We're done with the current buffer, so release it,
1394 unless it's the dinode buffer. Then back up to the
1395 previous pointer. */
1396 if (mp_h) {
1397 brelse(mp.mp_bh[mp_h]);
1398 mp.mp_bh[mp_h] = NULL;
1399 }
1400 /* If we can't get any lower in height, we've stripped
1401 off all we can. Next step is to back up and start
1402 stripping the previous level of metadata. */
1403 if (mp_h == 0) {
1404 strip_h--;
1405 memcpy(&mp.mp_list, &nbof, sizeof(nbof));
1406 mp_h = strip_h;
1407 state = DEALLOC_FILL_MP;
1408 break;
1409 }
1410 mp.mp_list[mp_h] = 0;
1411 mp_h--; /* search one metadata height down */
1412 if (mp.mp_list[mp_h] >= hptrs(sdp, mp_h) - 1)
1413 break; /* loop around in the same state */
1414 mp.mp_list[mp_h]++;
1415 /* Here we've found a part of the metapath that is not
1416 * allocated. We need to search at that height for the
1417 * next non-null pointer. */
1418 if (find_nonnull_ptr(sdp, &mp, mp_h)) {
1419 state = DEALLOC_FILL_MP;
1420 mp_h++;
1421 }
1422 /* No more non-null pointers at this height. Back up
1423 to the previous height and try again. */
1424 break; /* loop around in the same state */
1425
1426 /* Fill the metapath with buffers to the given height. */
1427 case DEALLOC_FILL_MP:
1428 /* Fill the buffers out to the current height. */
1429 ret = fillup_metapath(ip, &mp, mp_h);
1430 if (ret < 0)
1431 goto out;
1432
1433 /* If buffers found for the entire strip height */
1434 if ((ret == ip->i_height) && (mp_h == strip_h)) {
1435 state = DEALLOC_MP_FULL;
1436 break;
1437 }
1438 if (ret < ip->i_height) /* We have a partial height */
1439 mp_h = ret - 1;
1440
1441 /* If we find a non-null block pointer, crawl a bit
1442 higher up in the metapath and try again, otherwise
1443 we need to look lower for a new starting point. */
1444 if (find_nonnull_ptr(sdp, &mp, mp_h))
1445 mp_h++;
1446 else
1447 state = DEALLOC_MP_LOWER;
1448 break;
1449 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001450 }
1451
Bob Petersond552a2b2017-02-06 08:28:32 -05001452 if (btotal) {
1453 if (current->journal_info == NULL) {
1454 ret = gfs2_trans_begin(sdp, RES_DINODE + RES_STATFS +
1455 RES_QUOTA, 0);
1456 if (ret)
1457 goto out;
1458 down_write(&ip->i_rw_mutex);
1459 }
1460 gfs2_statfs_change(sdp, 0, +btotal, 0);
1461 gfs2_quota_change(ip, -(s64)btotal, ip->i_inode.i_uid,
1462 ip->i_inode.i_gid);
Stephen Rothwellb32c8c72017-05-08 15:59:34 -07001463 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Bob Petersond552a2b2017-02-06 08:28:32 -05001464 gfs2_trans_add_meta(ip->i_gl, dibh);
1465 gfs2_dinode_out(ip, dibh->b_data);
1466 up_write(&ip->i_rw_mutex);
1467 gfs2_trans_end(sdp);
1468 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001469
Bob Petersond552a2b2017-02-06 08:28:32 -05001470out:
1471 if (gfs2_holder_initialized(&rd_gh))
1472 gfs2_glock_dq_uninit(&rd_gh);
1473 if (current->journal_info) {
1474 up_write(&ip->i_rw_mutex);
1475 gfs2_trans_end(sdp);
1476 cond_resched();
1477 }
1478 gfs2_quota_unhold(ip);
1479out_metapath:
1480 release_metapath(&mp);
1481 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001482}
1483
1484static int trunc_end(struct gfs2_inode *ip)
1485{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001486 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001487 struct buffer_head *dibh;
1488 int error;
1489
1490 error = gfs2_trans_begin(sdp, RES_DINODE, 0);
1491 if (error)
1492 return error;
1493
1494 down_write(&ip->i_rw_mutex);
1495
1496 error = gfs2_meta_inode_buffer(ip, &dibh);
1497 if (error)
1498 goto out;
1499
Steven Whitehousea2e0f792010-08-11 09:53:11 +01001500 if (!i_size_read(&ip->i_inode)) {
Steven Whitehouseecc30c72008-01-28 10:37:35 +00001501 ip->i_height = 0;
Steven Whitehousece276b02008-02-06 09:25:45 +00001502 ip->i_goal = ip->i_no_addr;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001503 gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode));
Steven Whitehouse45138992013-01-28 09:30:07 +00001504 gfs2_ordered_del_inode(ip);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001505 }
Deepa Dinamani078cd822016-09-14 07:48:04 -07001506 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Steven Whitehouse383f01f2008-11-04 10:05:22 +00001507 ip->i_diskflags &= ~GFS2_DIF_TRUNC_IN_PROG;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001508
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001509 gfs2_trans_add_meta(ip->i_gl, dibh);
Steven Whitehouse539e5d62006-10-31 15:07:05 -05001510 gfs2_dinode_out(ip, dibh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001511 brelse(dibh);
1512
Steven Whitehousea91ea692006-09-04 12:04:26 -04001513out:
David Teiglandb3b94fa2006-01-16 16:50:04 +00001514 up_write(&ip->i_rw_mutex);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001515 gfs2_trans_end(sdp);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001516 return error;
1517}
1518
1519/**
1520 * do_shrink - make a file smaller
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001521 * @inode: the inode
1522 * @oldsize: the current inode size
1523 * @newsize: the size to make the file
David Teiglandb3b94fa2006-01-16 16:50:04 +00001524 *
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001525 * Called with an exclusive lock on @inode. The @size must
1526 * be equal to or smaller than the current inode size.
David Teiglandb3b94fa2006-01-16 16:50:04 +00001527 *
1528 * Returns: errno
1529 */
1530
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001531static int do_shrink(struct inode *inode, u64 oldsize, u64 newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001532{
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001533 struct gfs2_inode *ip = GFS2_I(inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001534 int error;
1535
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001536 error = trunc_start(inode, oldsize, newsize);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001537 if (error < 0)
1538 return error;
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001539 if (gfs2_is_stuffed(ip))
David Teiglandb3b94fa2006-01-16 16:50:04 +00001540 return 0;
1541
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001542 error = trunc_dealloc(ip, newsize);
1543 if (error == 0)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001544 error = trunc_end(ip);
1545
1546 return error;
1547}
1548
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001549void gfs2_trim_blocks(struct inode *inode)
Wendy Chenga13b8c52007-08-20 09:29:53 -04001550{
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001551 u64 size = inode->i_size;
1552 int ret;
1553
1554 ret = do_shrink(inode, size, size);
1555 WARN_ON(ret != 0);
1556}
1557
1558/**
1559 * do_grow - Touch and update inode size
1560 * @inode: The inode
1561 * @size: The new size
1562 *
1563 * This function updates the timestamps on the inode and
1564 * may also increase the size of the inode. This function
1565 * must not be called with @size any smaller than the current
1566 * inode size.
1567 *
1568 * Although it is not strictly required to unstuff files here,
1569 * earlier versions of GFS2 have a bug in the stuffed file reading
1570 * code which will result in a buffer overrun if the size is larger
1571 * than the max stuffed file size. In order to prevent this from
Lucas De Marchi25985ed2011-03-30 22:57:33 -03001572 * occurring, such files are unstuffed, but in other cases we can
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001573 * just update the inode size directly.
1574 *
1575 * Returns: 0 on success, or -ve on error
1576 */
1577
1578static int do_grow(struct inode *inode, u64 size)
1579{
1580 struct gfs2_inode *ip = GFS2_I(inode);
1581 struct gfs2_sbd *sdp = GFS2_SB(inode);
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001582 struct gfs2_alloc_parms ap = { .target = 1, };
Wendy Chenga13b8c52007-08-20 09:29:53 -04001583 struct buffer_head *dibh;
1584 int error;
Bob Peterson2f7ee352012-04-12 09:19:30 -04001585 int unstuff = 0;
Wendy Chenga13b8c52007-08-20 09:29:53 -04001586
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001587 if (gfs2_is_stuffed(ip) &&
1588 (size > (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode)))) {
Abhi Dasb8fbf472015-03-18 12:03:41 -05001589 error = gfs2_quota_lock_check(ip, &ap);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001590 if (error)
Bob Peterson5407e242012-05-18 09:28:23 -04001591 return error;
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001592
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001593 error = gfs2_inplace_reserve(ip, &ap);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001594 if (error)
1595 goto do_grow_qunlock;
Bob Peterson2f7ee352012-04-12 09:19:30 -04001596 unstuff = 1;
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001597 }
1598
Bob Petersona01aedf2013-06-27 12:47:51 -04001599 error = gfs2_trans_begin(sdp, RES_DINODE + RES_STATFS + RES_RG_BIT +
1600 (sdp->sd_args.ar_quota == GFS2_QUOTA_OFF ?
1601 0 : RES_QUOTA), 0);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001602 if (error)
1603 goto do_grow_release;
1604
Bob Peterson2f7ee352012-04-12 09:19:30 -04001605 if (unstuff) {
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001606 error = gfs2_unstuff_dinode(ip, NULL);
1607 if (error)
1608 goto do_end_trans;
1609 }
Wendy Chenga13b8c52007-08-20 09:29:53 -04001610
1611 error = gfs2_meta_inode_buffer(ip, &dibh);
1612 if (error)
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001613 goto do_end_trans;
Wendy Chenga13b8c52007-08-20 09:29:53 -04001614
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001615 i_size_write(inode, size);
Deepa Dinamani078cd822016-09-14 07:48:04 -07001616 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001617 gfs2_trans_add_meta(ip->i_gl, dibh);
Wendy Chenga13b8c52007-08-20 09:29:53 -04001618 gfs2_dinode_out(ip, dibh->b_data);
1619 brelse(dibh);
1620
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001621do_end_trans:
Wendy Chenga13b8c52007-08-20 09:29:53 -04001622 gfs2_trans_end(sdp);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001623do_grow_release:
Bob Peterson2f7ee352012-04-12 09:19:30 -04001624 if (unstuff) {
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001625 gfs2_inplace_release(ip);
1626do_grow_qunlock:
1627 gfs2_quota_unlock(ip);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001628 }
Wendy Chenga13b8c52007-08-20 09:29:53 -04001629 return error;
1630}
1631
David Teiglandb3b94fa2006-01-16 16:50:04 +00001632/**
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001633 * gfs2_setattr_size - make a file a given size
1634 * @inode: the inode
1635 * @newsize: the size to make the file
David Teiglandb3b94fa2006-01-16 16:50:04 +00001636 *
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001637 * The file size can grow, shrink, or stay the same size. This
1638 * is called holding i_mutex and an exclusive glock on the inode
1639 * in question.
David Teiglandb3b94fa2006-01-16 16:50:04 +00001640 *
1641 * Returns: errno
1642 */
1643
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001644int gfs2_setattr_size(struct inode *inode, u64 newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001645{
Steven Whitehouseaf5c2692013-09-27 12:49:33 +01001646 struct gfs2_inode *ip = GFS2_I(inode);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001647 int ret;
1648 u64 oldsize;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001649
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001650 BUG_ON(!S_ISREG(inode->i_mode));
David Teiglandb3b94fa2006-01-16 16:50:04 +00001651
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001652 ret = inode_newsize_ok(inode, newsize);
1653 if (ret)
1654 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001655
Christoph Hellwig562c72a2011-06-24 14:29:45 -04001656 inode_dio_wait(inode);
1657
Bob Petersonb54e9a02015-10-26 10:40:28 -05001658 ret = gfs2_rsqa_alloc(ip);
Bob Petersond2b47cf2013-02-01 12:03:02 -05001659 if (ret)
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001660 goto out;
Bob Petersond2b47cf2013-02-01 12:03:02 -05001661
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001662 oldsize = inode->i_size;
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001663 if (newsize >= oldsize) {
1664 ret = do_grow(inode, newsize);
1665 goto out;
1666 }
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001667
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001668 ret = do_shrink(inode, oldsize, newsize);
1669out:
Bob Petersona097dc7e2015-07-16 08:28:04 -05001670 gfs2_rsqa_delete(ip, NULL);
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001671 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001672}
1673
1674int gfs2_truncatei_resume(struct gfs2_inode *ip)
1675{
1676 int error;
Steven Whitehousea2e0f792010-08-11 09:53:11 +01001677 error = trunc_dealloc(ip, i_size_read(&ip->i_inode));
David Teiglandb3b94fa2006-01-16 16:50:04 +00001678 if (!error)
1679 error = trunc_end(ip);
1680 return error;
1681}
1682
1683int gfs2_file_dealloc(struct gfs2_inode *ip)
1684{
1685 return trunc_dealloc(ip, 0);
1686}
1687
1688/**
Steven Whitehouseb50f2272014-03-03 13:35:57 +00001689 * gfs2_free_journal_extents - Free cached journal bmap info
1690 * @jd: The journal
1691 *
1692 */
1693
1694void gfs2_free_journal_extents(struct gfs2_jdesc *jd)
1695{
1696 struct gfs2_journal_extent *jext;
1697
1698 while(!list_empty(&jd->extent_list)) {
1699 jext = list_entry(jd->extent_list.next, struct gfs2_journal_extent, list);
1700 list_del(&jext->list);
1701 kfree(jext);
1702 }
1703}
1704
1705/**
1706 * gfs2_add_jextent - Add or merge a new extent to extent cache
1707 * @jd: The journal descriptor
1708 * @lblock: The logical block at start of new extent
Fabian Frederickc62baf62014-05-14 18:32:31 +02001709 * @dblock: The physical block at start of new extent
Steven Whitehouseb50f2272014-03-03 13:35:57 +00001710 * @blocks: Size of extent in fs blocks
1711 *
1712 * Returns: 0 on success or -ENOMEM
1713 */
1714
1715static int gfs2_add_jextent(struct gfs2_jdesc *jd, u64 lblock, u64 dblock, u64 blocks)
1716{
1717 struct gfs2_journal_extent *jext;
1718
1719 if (!list_empty(&jd->extent_list)) {
1720 jext = list_entry(jd->extent_list.prev, struct gfs2_journal_extent, list);
1721 if ((jext->dblock + jext->blocks) == dblock) {
1722 jext->blocks += blocks;
1723 return 0;
1724 }
1725 }
1726
1727 jext = kzalloc(sizeof(struct gfs2_journal_extent), GFP_NOFS);
1728 if (jext == NULL)
1729 return -ENOMEM;
1730 jext->dblock = dblock;
1731 jext->lblock = lblock;
1732 jext->blocks = blocks;
1733 list_add_tail(&jext->list, &jd->extent_list);
1734 jd->nr_extents++;
1735 return 0;
1736}
1737
1738/**
1739 * gfs2_map_journal_extents - Cache journal bmap info
1740 * @sdp: The super block
1741 * @jd: The journal to map
1742 *
1743 * Create a reusable "extent" mapping from all logical
1744 * blocks to all physical blocks for the given journal. This will save
1745 * us time when writing journal blocks. Most journals will have only one
1746 * extent that maps all their logical blocks. That's because gfs2.mkfs
1747 * arranges the journal blocks sequentially to maximize performance.
1748 * So the extent would map the first block for the entire file length.
1749 * However, gfs2_jadd can happen while file activity is happening, so
1750 * those journals may not be sequential. Less likely is the case where
1751 * the users created their own journals by mounting the metafs and
1752 * laying it out. But it's still possible. These journals might have
1753 * several extents.
1754 *
1755 * Returns: 0 on success, or error on failure
1756 */
1757
1758int gfs2_map_journal_extents(struct gfs2_sbd *sdp, struct gfs2_jdesc *jd)
1759{
1760 u64 lblock = 0;
1761 u64 lblock_stop;
1762 struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
1763 struct buffer_head bh;
1764 unsigned int shift = sdp->sd_sb.sb_bsize_shift;
1765 u64 size;
1766 int rc;
1767
1768 lblock_stop = i_size_read(jd->jd_inode) >> shift;
1769 size = (lblock_stop - lblock) << shift;
1770 jd->nr_extents = 0;
1771 WARN_ON(!list_empty(&jd->extent_list));
1772
1773 do {
1774 bh.b_state = 0;
1775 bh.b_blocknr = 0;
1776 bh.b_size = size;
1777 rc = gfs2_block_map(jd->jd_inode, lblock, &bh, 0);
1778 if (rc || !buffer_mapped(&bh))
1779 goto fail;
1780 rc = gfs2_add_jextent(jd, lblock, bh.b_blocknr, bh.b_size >> shift);
1781 if (rc)
1782 goto fail;
1783 size -= bh.b_size;
1784 lblock += (bh.b_size >> ip->i_inode.i_blkbits);
1785 } while(size > 0);
1786
1787 fs_info(sdp, "journal %d mapped with %u extents\n", jd->jd_jid,
1788 jd->nr_extents);
1789 return 0;
1790
1791fail:
1792 fs_warn(sdp, "error %d mapping journal %u at offset %llu (extent %u)\n",
1793 rc, jd->jd_jid,
1794 (unsigned long long)(i_size_read(jd->jd_inode) - size),
1795 jd->nr_extents);
1796 fs_warn(sdp, "bmap=%d lblock=%llu block=%llu, state=0x%08lx, size=%llu\n",
1797 rc, (unsigned long long)lblock, (unsigned long long)bh.b_blocknr,
1798 bh.b_state, (unsigned long long)bh.b_size);
1799 gfs2_free_journal_extents(jd);
1800 return rc;
1801}
1802
1803/**
David Teiglandb3b94fa2006-01-16 16:50:04 +00001804 * gfs2_write_alloc_required - figure out if a write will require an allocation
1805 * @ip: the file being written to
1806 * @offset: the offset to write to
1807 * @len: the number of bytes being written
David Teiglandb3b94fa2006-01-16 16:50:04 +00001808 *
Bob Peterson461cb412010-06-24 19:21:20 -04001809 * Returns: 1 if an alloc is required, 0 otherwise
David Teiglandb3b94fa2006-01-16 16:50:04 +00001810 */
1811
Steven Whitehousecd915492006-09-04 12:49:07 -04001812int gfs2_write_alloc_required(struct gfs2_inode *ip, u64 offset,
Bob Peterson461cb412010-06-24 19:21:20 -04001813 unsigned int len)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001814{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001815 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001816 struct buffer_head bh;
1817 unsigned int shift;
1818 u64 lblock, lblock_stop, size;
Steven Whitehouse7ed122e2008-12-10 10:28:10 +00001819 u64 end_of_file;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001820
David Teiglandb3b94fa2006-01-16 16:50:04 +00001821 if (!len)
1822 return 0;
1823
1824 if (gfs2_is_stuffed(ip)) {
1825 if (offset + len >
1826 sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode))
Bob Peterson461cb412010-06-24 19:21:20 -04001827 return 1;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001828 return 0;
1829 }
1830
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001831 shift = sdp->sd_sb.sb_bsize_shift;
Steven Whitehouse7ed122e2008-12-10 10:28:10 +00001832 BUG_ON(gfs2_is_dir(ip));
Steven Whitehousea2e0f792010-08-11 09:53:11 +01001833 end_of_file = (i_size_read(&ip->i_inode) + sdp->sd_sb.sb_bsize - 1) >> shift;
Steven Whitehouse7ed122e2008-12-10 10:28:10 +00001834 lblock = offset >> shift;
1835 lblock_stop = (offset + len + sdp->sd_sb.sb_bsize - 1) >> shift;
1836 if (lblock_stop > end_of_file)
Bob Peterson461cb412010-06-24 19:21:20 -04001837 return 1;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001838
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001839 size = (lblock_stop - lblock) << shift;
1840 do {
1841 bh.b_state = 0;
1842 bh.b_size = size;
1843 gfs2_block_map(&ip->i_inode, lblock, &bh, 0);
1844 if (!buffer_mapped(&bh))
Bob Peterson461cb412010-06-24 19:21:20 -04001845 return 1;
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001846 size -= bh.b_size;
1847 lblock += (bh.b_size >> ip->i_inode.i_blkbits);
1848 } while(size > 0);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001849
1850 return 0;
1851}
1852