blob: 963117f704bf09175d535a180be5039bcdfc6666 [file] [log] [blame]
David Teiglandb3b94fa2006-01-16 16:50:04 +00001/*
2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
Steven Whitehouse3a8a9a12006-05-18 15:09:15 -04003 * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
David Teiglandb3b94fa2006-01-16 16:50:04 +00004 *
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
Steven Whitehousee9fc2aa2006-09-01 11:05:15 -04007 * of the GNU General Public License version 2.
David Teiglandb3b94fa2006-01-16 16:50:04 +00008 */
9
David Teiglandb3b94fa2006-01-16 16:50:04 +000010#include <linux/spinlock.h>
11#include <linux/completion.h>
12#include <linux/buffer_head.h>
Benjamin Marzinski64dd1532011-09-12 18:15:24 -050013#include <linux/blkdev.h>
Steven Whitehouse5c676f62006-02-27 17:23:27 -050014#include <linux/gfs2_ondisk.h>
Steven Whitehouse71b86f52006-03-28 14:14:04 -050015#include <linux/crc32.h>
Bob Peterson39743202017-02-16 10:27:16 -050016#include <linux/iomap.h>
David Teiglandb3b94fa2006-01-16 16:50:04 +000017
18#include "gfs2.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050019#include "incore.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000020#include "bmap.h"
21#include "glock.h"
22#include "inode.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000023#include "meta_io.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000024#include "quota.h"
25#include "rgrp.h"
Steven Whitehouse45138992013-01-28 09:30:07 +000026#include "log.h"
Bob Peterson4c16c362011-02-23 16:11:33 -050027#include "super.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000028#include "trans.h"
Steven Whitehouse18ec7d52006-02-08 11:50:51 +000029#include "dir.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050030#include "util.h"
Steven Whitehouse63997772009-06-12 08:49:20 +010031#include "trace_gfs2.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000032
33/* This doesn't need to be that large as max 64 bit pointers in a 4k
34 * block is 512, so __u16 is fine for that. It saves stack space to
35 * keep it small.
36 */
37struct metapath {
Steven Whitehousedbac6712008-01-29 09:12:55 +000038 struct buffer_head *mp_bh[GFS2_MAX_META_HEIGHT];
David Teiglandb3b94fa2006-01-16 16:50:04 +000039 __u16 mp_list[GFS2_MAX_META_HEIGHT];
Bob Peterson5f8bd442016-10-28 14:29:29 -050040 int mp_fheight; /* find_metapath height */
41 int mp_aheight; /* actual height (lookup height) */
David Teiglandb3b94fa2006-01-16 16:50:04 +000042};
43
David Teiglandb3b94fa2006-01-16 16:50:04 +000044/**
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040045 * gfs2_unstuffer_page - unstuff a stuffed inode into a block cached by a page
46 * @ip: the inode
47 * @dibh: the dinode buffer
48 * @block: the block number that was allocated
Steven Whitehouseff8f33c2010-08-11 09:37:53 +010049 * @page: The (optional) page. This is looked up if @page is NULL
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040050 *
51 * Returns: errno
52 */
53
54static int gfs2_unstuffer_page(struct gfs2_inode *ip, struct buffer_head *dibh,
Steven Whitehousecd915492006-09-04 12:49:07 -040055 u64 block, struct page *page)
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040056{
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040057 struct inode *inode = &ip->i_inode;
58 struct buffer_head *bh;
59 int release = 0;
60
61 if (!page || page->index) {
Bob Peterson220cca22012-03-19 15:25:50 -040062 page = find_or_create_page(inode->i_mapping, 0, GFP_NOFS);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040063 if (!page)
64 return -ENOMEM;
65 release = 1;
66 }
67
68 if (!PageUptodate(page)) {
69 void *kaddr = kmap(page);
Steven Whitehouse602c89d2010-03-25 14:32:43 +000070 u64 dsize = i_size_read(inode);
71
72 if (dsize > (dibh->b_size - sizeof(struct gfs2_dinode)))
73 dsize = dibh->b_size - sizeof(struct gfs2_dinode);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040074
Steven Whitehouse602c89d2010-03-25 14:32:43 +000075 memcpy(kaddr, dibh->b_data + sizeof(struct gfs2_dinode), dsize);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +030076 memset(kaddr + dsize, 0, PAGE_SIZE - dsize);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040077 kunmap(page);
78
79 SetPageUptodate(page);
80 }
81
82 if (!page_has_buffers(page))
Fabian Frederick47a9a522016-08-02 12:05:27 -050083 create_empty_buffers(page, BIT(inode->i_blkbits),
84 BIT(BH_Uptodate));
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040085
86 bh = page_buffers(page);
87
88 if (!buffer_mapped(bh))
89 map_bh(bh, inode->i_sb, block);
90
91 set_buffer_uptodate(bh);
Steven Whitehouseeaf96522007-08-27 09:49:37 +010092 if (!gfs2_is_jdata(ip))
93 mark_buffer_dirty(bh);
Steven Whitehousebf36a712007-10-17 08:35:19 +010094 if (!gfs2_is_writeback(ip))
Steven Whitehouse350a9b02012-12-14 12:36:02 +000095 gfs2_trans_add_data(ip->i_gl, bh);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -040096
97 if (release) {
98 unlock_page(page);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +030099 put_page(page);
Steven Whitehousef25ef0c2006-07-26 10:51:20 -0400100 }
101
102 return 0;
103}
104
105/**
David Teiglandb3b94fa2006-01-16 16:50:04 +0000106 * gfs2_unstuff_dinode - Unstuff a dinode when the data has grown too big
107 * @ip: The GFS2 inode to unstuff
Steven Whitehouseff8f33c2010-08-11 09:37:53 +0100108 * @page: The (optional) page. This is looked up if the @page is NULL
David Teiglandb3b94fa2006-01-16 16:50:04 +0000109 *
110 * This routine unstuffs a dinode and returns it to a "normal" state such
111 * that the height can be grown in the traditional way.
112 *
113 * Returns: errno
114 */
115
Steven Whitehousef25ef0c2006-07-26 10:51:20 -0400116int gfs2_unstuff_dinode(struct gfs2_inode *ip, struct page *page)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000117{
118 struct buffer_head *bh, *dibh;
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400119 struct gfs2_dinode *di;
Steven Whitehousecd915492006-09-04 12:49:07 -0400120 u64 block = 0;
Steven Whitehouse18ec7d52006-02-08 11:50:51 +0000121 int isdir = gfs2_is_dir(ip);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000122 int error;
123
124 down_write(&ip->i_rw_mutex);
125
126 error = gfs2_meta_inode_buffer(ip, &dibh);
127 if (error)
128 goto out;
Steven Whitehouse907b9bc2006-09-25 09:26:04 -0400129
Steven Whitehousea2e0f792010-08-11 09:53:11 +0100130 if (i_size_read(&ip->i_inode)) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000131 /* Get a free block, fill it with the stuffed data,
132 and write it out to disk */
133
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000134 unsigned int n = 1;
Bob Peterson6e87ed02011-11-18 10:58:32 -0500135 error = gfs2_alloc_blocks(ip, &block, &n, 0, NULL);
Steven Whitehouse09010972009-05-20 10:48:47 +0100136 if (error)
137 goto out_brelse;
Steven Whitehouse18ec7d52006-02-08 11:50:51 +0000138 if (isdir) {
Steven Whitehouse5731be52008-02-01 13:16:55 +0000139 gfs2_trans_add_unrevoke(GFS2_SB(&ip->i_inode), block, 1);
Steven Whitehouse61e085a2006-04-24 10:07:13 -0400140 error = gfs2_dir_get_new_buffer(ip, block, &bh);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000141 if (error)
142 goto out_brelse;
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400143 gfs2_buffer_copy_tail(bh, sizeof(struct gfs2_meta_header),
David Teiglandb3b94fa2006-01-16 16:50:04 +0000144 dibh, sizeof(struct gfs2_dinode));
145 brelse(bh);
146 } else {
Steven Whitehousef25ef0c2006-07-26 10:51:20 -0400147 error = gfs2_unstuffer_page(ip, dibh, block, page);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000148 if (error)
149 goto out_brelse;
150 }
151 }
152
153 /* Set up the pointer to the new block */
154
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000155 gfs2_trans_add_meta(ip->i_gl, dibh);
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400156 di = (struct gfs2_dinode *)dibh->b_data;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000157 gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode));
158
Steven Whitehousea2e0f792010-08-11 09:53:11 +0100159 if (i_size_read(&ip->i_inode)) {
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400160 *(__be64 *)(di + 1) = cpu_to_be64(block);
Steven Whitehouse77658aa2008-02-12 14:17:27 +0000161 gfs2_add_inode_blocks(&ip->i_inode, 1);
162 di->di_blocks = cpu_to_be64(gfs2_get_inode_blocks(&ip->i_inode));
David Teiglandb3b94fa2006-01-16 16:50:04 +0000163 }
164
Steven Whitehouseecc30c72008-01-28 10:37:35 +0000165 ip->i_height = 1;
Steven Whitehouse48516ce2006-10-02 12:39:19 -0400166 di->di_height = cpu_to_be16(1);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000167
Steven Whitehousea91ea692006-09-04 12:04:26 -0400168out_brelse:
David Teiglandb3b94fa2006-01-16 16:50:04 +0000169 brelse(dibh);
Steven Whitehousea91ea692006-09-04 12:04:26 -0400170out:
David Teiglandb3b94fa2006-01-16 16:50:04 +0000171 up_write(&ip->i_rw_mutex);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000172 return error;
173}
174
David Teiglandb3b94fa2006-01-16 16:50:04 +0000175
176/**
177 * find_metapath - Find path through the metadata tree
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000178 * @sdp: The superblock
David Teiglandb3b94fa2006-01-16 16:50:04 +0000179 * @mp: The metapath to return the result in
180 * @block: The disk block to look up
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000181 * @height: The pre-calculated height of the metadata tree
David Teiglandb3b94fa2006-01-16 16:50:04 +0000182 *
183 * This routine returns a struct metapath structure that defines a path
184 * through the metadata of inode "ip" to get to block "block".
185 *
186 * Example:
187 * Given: "ip" is a height 3 file, "offset" is 101342453, and this is a
188 * filesystem with a blocksize of 4096.
189 *
190 * find_metapath() would return a struct metapath structure set to:
191 * mp_offset = 101342453, mp_height = 3, mp_list[0] = 0, mp_list[1] = 48,
192 * and mp_list[2] = 165.
193 *
194 * That means that in order to get to the block containing the byte at
195 * offset 101342453, we would load the indirect block pointed to by pointer
196 * 0 in the dinode. We would then load the indirect block pointed to by
197 * pointer 48 in that indirect block. We would then load the data block
198 * pointed to by pointer 165 in that indirect block.
199 *
200 * ----------------------------------------
201 * | Dinode | |
202 * | | 4|
203 * | |0 1 2 3 4 5 9|
204 * | | 6|
205 * ----------------------------------------
206 * |
207 * |
208 * V
209 * ----------------------------------------
210 * | Indirect Block |
211 * | 5|
212 * | 4 4 4 4 4 5 5 1|
213 * |0 5 6 7 8 9 0 1 2|
214 * ----------------------------------------
215 * |
216 * |
217 * V
218 * ----------------------------------------
219 * | Indirect Block |
220 * | 1 1 1 1 1 5|
221 * | 6 6 6 6 6 1|
222 * |0 3 4 5 6 7 2|
223 * ----------------------------------------
224 * |
225 * |
226 * V
227 * ----------------------------------------
228 * | Data block containing offset |
229 * | 101342453 |
230 * | |
231 * | |
232 * ----------------------------------------
233 *
234 */
235
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000236static void find_metapath(const struct gfs2_sbd *sdp, u64 block,
237 struct metapath *mp, unsigned int height)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000238{
David Teiglandb3b94fa2006-01-16 16:50:04 +0000239 unsigned int i;
240
Bob Peterson5f8bd442016-10-28 14:29:29 -0500241 mp->mp_fheight = height;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000242 for (i = height; i--;)
Bob Peterson7eabb772008-01-28 11:24:35 -0600243 mp->mp_list[i] = do_div(block, sdp->sd_inptrs);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000244}
245
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500246static inline unsigned int metapath_branch_start(const struct metapath *mp)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000247{
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500248 if (mp->mp_list[0] == 0)
249 return 2;
250 return 1;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000251}
252
David Teiglandb3b94fa2006-01-16 16:50:04 +0000253/**
Andreas Gruenbacher20cdc192017-09-22 07:39:54 -0500254 * metaptr1 - Return the first possible metadata pointer in a metapath buffer
Bob Petersond552a2b2017-02-06 08:28:32 -0500255 * @height: The metadata height (0 = dinode)
256 * @mp: The metapath
257 */
258static inline __be64 *metaptr1(unsigned int height, const struct metapath *mp)
259{
260 struct buffer_head *bh = mp->mp_bh[height];
261 if (height == 0)
262 return ((__be64 *)(bh->b_data + sizeof(struct gfs2_dinode)));
263 return ((__be64 *)(bh->b_data + sizeof(struct gfs2_meta_header)));
264}
265
266/**
David Teiglandb3b94fa2006-01-16 16:50:04 +0000267 * metapointer - Return pointer to start of metadata in a buffer
David Teiglandb3b94fa2006-01-16 16:50:04 +0000268 * @height: The metadata height (0 = dinode)
269 * @mp: The metapath
270 *
271 * Return a pointer to the block number of the next height of the metadata
272 * tree given a buffer containing the pointer to the current height of the
273 * metadata tree.
274 */
275
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000276static inline __be64 *metapointer(unsigned int height, const struct metapath *mp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000277{
Bob Petersond552a2b2017-02-06 08:28:32 -0500278 __be64 *p = metaptr1(height, mp);
279 return p + mp->mp_list[height];
David Teiglandb3b94fa2006-01-16 16:50:04 +0000280}
281
Steven Whitehouseb99b98d2011-09-21 11:05:16 +0100282static void gfs2_metapath_ra(struct gfs2_glock *gl,
283 const struct buffer_head *bh, const __be64 *pos)
284{
285 struct buffer_head *rabh;
286 const __be64 *endp = (const __be64 *)(bh->b_data + bh->b_size);
287 const __be64 *t;
288
289 for (t = pos; t < endp; t++) {
290 if (!*t)
291 continue;
292
293 rabh = gfs2_getbuf(gl, be64_to_cpu(*t), CREATE);
294 if (trylock_buffer(rabh)) {
295 if (!buffer_uptodate(rabh)) {
296 rabh->b_end_io = end_buffer_read_sync;
Coly Lie477b242017-07-21 07:48:22 -0500297 submit_bh(REQ_OP_READ,
298 REQ_RAHEAD | REQ_META | REQ_PRIO,
299 rabh);
Steven Whitehouseb99b98d2011-09-21 11:05:16 +0100300 continue;
301 }
302 unlock_buffer(rabh);
303 }
304 brelse(rabh);
305 }
306}
307
David Teiglandb3b94fa2006-01-16 16:50:04 +0000308/**
Bob Petersond552a2b2017-02-06 08:28:32 -0500309 * lookup_mp_height - helper function for lookup_metapath
310 * @ip: the inode
311 * @mp: the metapath
312 * @h: the height which needs looking up
313 */
314static int lookup_mp_height(struct gfs2_inode *ip, struct metapath *mp, int h)
315{
316 __be64 *ptr = metapointer(h, mp);
317 u64 dblock = be64_to_cpu(*ptr);
318
319 if (!dblock)
320 return h + 1;
321
322 return gfs2_meta_indirect_buffer(ip, h + 1, dblock, &mp->mp_bh[h + 1]);
323}
324
325/**
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000326 * lookup_metapath - Walk the metadata tree to a specific point
327 * @ip: The inode
David Teiglandb3b94fa2006-01-16 16:50:04 +0000328 * @mp: The metapath
David Teiglandb3b94fa2006-01-16 16:50:04 +0000329 *
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000330 * Assumes that the inode's buffer has already been looked up and
331 * hooked onto mp->mp_bh[0] and that the metapath has been initialised
332 * by find_metapath().
David Teiglandb3b94fa2006-01-16 16:50:04 +0000333 *
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000334 * If this function encounters part of the tree which has not been
335 * allocated, it returns the current height of the tree at the point
336 * at which it found the unallocated block. Blocks which are found are
337 * added to the mp->mp_bh[] list.
338 *
339 * Returns: error or height of metadata tree
David Teiglandb3b94fa2006-01-16 16:50:04 +0000340 */
341
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000342static int lookup_metapath(struct gfs2_inode *ip, struct metapath *mp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000343{
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000344 unsigned int end_of_metadata = ip->i_height - 1;
345 unsigned int x;
Steven Whitehousee23159d2008-02-12 14:48:39 +0000346 int ret;
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000347
348 for (x = 0; x < end_of_metadata; x++) {
Bob Petersond552a2b2017-02-06 08:28:32 -0500349 ret = lookup_mp_height(ip, mp, x);
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000350 if (ret)
Bob Peterson5f8bd442016-10-28 14:29:29 -0500351 goto out;
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000352 }
353
Bob Peterson5f8bd442016-10-28 14:29:29 -0500354 ret = ip->i_height;
355out:
356 mp->mp_aheight = ret;
357 return ret;
Steven Whitehousedbac6712008-01-29 09:12:55 +0000358}
359
Bob Petersond552a2b2017-02-06 08:28:32 -0500360/**
361 * fillup_metapath - fill up buffers for the metadata path to a specific height
362 * @ip: The inode
363 * @mp: The metapath
364 * @h: The height to which it should be mapped
365 *
366 * Similar to lookup_metapath, but does lookups for a range of heights
367 *
368 * Returns: error or height of metadata tree
369 */
370
371static int fillup_metapath(struct gfs2_inode *ip, struct metapath *mp, int h)
372{
373 unsigned int start_h = h - 1;
374 int ret;
375
376 if (h) {
377 /* find the first buffer we need to look up. */
378 while (start_h > 0 && mp->mp_bh[start_h] == NULL)
379 start_h--;
380 for (; start_h < h; start_h++) {
381 ret = lookup_mp_height(ip, mp, start_h);
382 if (ret)
383 return ret;
384 }
385 }
386 return ip->i_height;
387}
388
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000389static inline void release_metapath(struct metapath *mp)
Steven Whitehousedbac6712008-01-29 09:12:55 +0000390{
391 int i;
392
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000393 for (i = 0; i < GFS2_MAX_META_HEIGHT; i++) {
394 if (mp->mp_bh[i] == NULL)
395 break;
396 brelse(mp->mp_bh[i]);
397 }
Steven Whitehouse11707ea2008-01-28 15:10:29 +0000398}
399
Steven Whitehouse30cbf182008-02-08 13:18:11 +0000400/**
401 * gfs2_extent_length - Returns length of an extent of blocks
402 * @start: Start of the buffer
403 * @len: Length of the buffer in bytes
404 * @ptr: Current position in the buffer
405 * @limit: Max extent length to return (0 = unlimited)
406 * @eob: Set to 1 if we hit "end of block"
407 *
408 * If the first block is zero (unallocated) it will return the number of
409 * unallocated blocks in the extent, otherwise it will return the number
410 * of contiguous blocks in the extent.
411 *
412 * Returns: The length of the extent (minimum of one block)
413 */
414
Bob Petersonb6507382014-08-06 09:08:36 -0400415static inline unsigned int gfs2_extent_length(void *start, unsigned int len, __be64 *ptr, size_t limit, int *eob)
Steven Whitehouse30cbf182008-02-08 13:18:11 +0000416{
417 const __be64 *end = (start + len);
418 const __be64 *first = ptr;
419 u64 d = be64_to_cpu(*ptr);
420
421 *eob = 0;
422 do {
423 ptr++;
424 if (ptr >= end)
425 break;
426 if (limit && --limit == 0)
427 break;
428 if (d)
429 d++;
430 } while(be64_to_cpu(*ptr) == d);
431 if (ptr >= end)
432 *eob = 1;
433 return (ptr - first);
434}
435
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000436static inline void bmap_lock(struct gfs2_inode *ip, int create)
Steven Whitehousefd88de562006-05-05 16:59:11 -0400437{
Steven Whitehousefd88de562006-05-05 16:59:11 -0400438 if (create)
439 down_write(&ip->i_rw_mutex);
440 else
441 down_read(&ip->i_rw_mutex);
442}
443
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000444static inline void bmap_unlock(struct gfs2_inode *ip, int create)
Steven Whitehousefd88de562006-05-05 16:59:11 -0400445{
David Teiglandb3b94fa2006-01-16 16:50:04 +0000446 if (create)
447 up_write(&ip->i_rw_mutex);
448 else
449 up_read(&ip->i_rw_mutex);
Steven Whitehousefd88de562006-05-05 16:59:11 -0400450}
David Teiglandb3b94fa2006-01-16 16:50:04 +0000451
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000452static inline __be64 *gfs2_indirect_init(struct metapath *mp,
453 struct gfs2_glock *gl, unsigned int i,
454 unsigned offset, u64 bn)
455{
456 __be64 *ptr = (__be64 *)(mp->mp_bh[i - 1]->b_data +
457 ((i > 1) ? sizeof(struct gfs2_meta_header) :
458 sizeof(struct gfs2_dinode)));
459 BUG_ON(i < 1);
460 BUG_ON(mp->mp_bh[i] != NULL);
461 mp->mp_bh[i] = gfs2_meta_new(gl, bn);
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000462 gfs2_trans_add_meta(gl, mp->mp_bh[i]);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000463 gfs2_metatype_set(mp->mp_bh[i], GFS2_METATYPE_IN, GFS2_FORMAT_IN);
464 gfs2_buffer_clear_tail(mp->mp_bh[i], sizeof(struct gfs2_meta_header));
465 ptr += offset;
466 *ptr = cpu_to_be64(bn);
467 return ptr;
468}
469
/* States of the allocation state machine in gfs2_iomap_alloc() */
enum alloc_state {
	/* Tree complete, adding data blocks */
	ALLOC_DATA = 0,
	/* Branching from existing tree */
	ALLOC_GROW_DEPTH = 1,
	/* Growing height of tree */
	ALLOC_GROW_HEIGHT = 2,
	/* ALLOC_UNSTUFF = 3,   TBD and rather complicated */
};
476
Bob Petersond552a2b2017-02-06 08:28:32 -0500477static inline unsigned int hptrs(struct gfs2_sbd *sdp, const unsigned int hgt)
478{
479 if (hgt)
480 return sdp->sd_inptrs;
481 return sdp->sd_diptrs;
482}
483
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000484/**
485 * gfs2_bmap_alloc - Build a metadata tree of the requested height
486 * @inode: The GFS2 inode
487 * @lblock: The logical starting block of the extent
488 * @bh_map: This is used to return the mapping details
Bob Peterson5f8bd442016-10-28 14:29:29 -0500489 * @zero_new: True if newly allocated blocks should be zeroed
490 * @mp: The metapath, with proper height information calculated
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000491 * @maxlen: The max number of data blocks to alloc
Bob Peterson5f8bd442016-10-28 14:29:29 -0500492 * @dblock: Pointer to return the resulting new block
493 * @dblks: Pointer to return the number of blocks allocated
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000494 *
495 * In this routine we may have to alloc:
496 * i) Indirect blocks to grow the metadata tree height
497 * ii) Indirect blocks to fill in lower part of the metadata tree
498 * iii) Data blocks
499 *
500 * The function is in two parts. The first part works out the total
501 * number of blocks which we need. The second part does the actual
502 * allocation asking for an extent at a time (if enough contiguous free
503 * blocks are available, there will only be one request per bmap call)
504 * and uses the state machine to initialise the blocks in order.
505 *
506 * Returns: errno on error
507 */
508
Bob Peterson39743202017-02-16 10:27:16 -0500509static int gfs2_iomap_alloc(struct inode *inode, struct iomap *iomap,
510 unsigned flags, struct metapath *mp)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000511{
512 struct gfs2_inode *ip = GFS2_I(inode);
513 struct gfs2_sbd *sdp = GFS2_SB(inode);
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500514 struct super_block *sb = sdp->sd_vfs;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000515 struct buffer_head *dibh = mp->mp_bh[0];
Bob Peterson5f8bd442016-10-28 14:29:29 -0500516 u64 bn;
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500517 unsigned n, i, blks, alloced = 0, iblks = 0, branch_start = 0;
Bob Peterson39743202017-02-16 10:27:16 -0500518 unsigned dblks = 0;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000519 unsigned ptrs_per_blk;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500520 const unsigned end_of_metadata = mp->mp_fheight - 1;
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500521 int ret;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000522 enum alloc_state state;
523 __be64 *ptr;
524 __be64 zero_bn = 0;
Bob Peterson39743202017-02-16 10:27:16 -0500525 size_t maxlen = iomap->length >> inode->i_blkbits;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000526
Bob Peterson5f8bd442016-10-28 14:29:29 -0500527 BUG_ON(mp->mp_aheight < 1);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000528 BUG_ON(dibh == NULL);
529
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000530 gfs2_trans_add_meta(ip->i_gl, dibh);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000531
Bob Peterson5f8bd442016-10-28 14:29:29 -0500532 if (mp->mp_fheight == mp->mp_aheight) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000533 struct buffer_head *bh;
Bob Peterson39743202017-02-16 10:27:16 -0500534 int eob;
535
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000536 /* Bottom indirect block exists, find unalloced extent size */
537 ptr = metapointer(end_of_metadata, mp);
538 bh = mp->mp_bh[end_of_metadata];
Bob Peterson39743202017-02-16 10:27:16 -0500539 dblks = gfs2_extent_length(bh->b_data, bh->b_size, ptr,
540 maxlen, &eob);
541 BUG_ON(dblks < 1);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000542 state = ALLOC_DATA;
543 } else {
544 /* Need to allocate indirect blocks */
Bob Peterson5f8bd442016-10-28 14:29:29 -0500545 ptrs_per_blk = mp->mp_fheight > 1 ? sdp->sd_inptrs :
546 sdp->sd_diptrs;
Bob Peterson39743202017-02-16 10:27:16 -0500547 dblks = min(maxlen, (size_t)(ptrs_per_blk -
548 mp->mp_list[end_of_metadata]));
Bob Peterson5f8bd442016-10-28 14:29:29 -0500549 if (mp->mp_fheight == ip->i_height) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000550 /* Writing into existing tree, extend tree down */
Bob Peterson5f8bd442016-10-28 14:29:29 -0500551 iblks = mp->mp_fheight - mp->mp_aheight;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000552 state = ALLOC_GROW_DEPTH;
553 } else {
554 /* Building up tree height */
555 state = ALLOC_GROW_HEIGHT;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500556 iblks = mp->mp_fheight - ip->i_height;
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500557 branch_start = metapath_branch_start(mp);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500558 iblks += (mp->mp_fheight - branch_start);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000559 }
560 }
561
562 /* start of the second part of the function (state machine) */
563
Bob Peterson39743202017-02-16 10:27:16 -0500564 blks = dblks + iblks;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500565 i = mp->mp_aheight;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000566 do {
Steven Whitehouse09010972009-05-20 10:48:47 +0100567 int error;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000568 n = blks - alloced;
Bob Peterson6e87ed02011-11-18 10:58:32 -0500569 error = gfs2_alloc_blocks(ip, &bn, &n, 0, NULL);
Steven Whitehouse09010972009-05-20 10:48:47 +0100570 if (error)
571 return error;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000572 alloced += n;
573 if (state != ALLOC_DATA || gfs2_is_jdata(ip))
574 gfs2_trans_add_unrevoke(sdp, bn, n);
575 switch (state) {
576 /* Growing height of tree */
577 case ALLOC_GROW_HEIGHT:
578 if (i == 1) {
579 ptr = (__be64 *)(dibh->b_data +
580 sizeof(struct gfs2_dinode));
581 zero_bn = *ptr;
582 }
Bob Peterson5f8bd442016-10-28 14:29:29 -0500583 for (; i - 1 < mp->mp_fheight - ip->i_height && n > 0;
584 i++, n--)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000585 gfs2_indirect_init(mp, ip->i_gl, i, 0, bn++);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500586 if (i - 1 == mp->mp_fheight - ip->i_height) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000587 i--;
588 gfs2_buffer_copy_tail(mp->mp_bh[i],
589 sizeof(struct gfs2_meta_header),
590 dibh, sizeof(struct gfs2_dinode));
591 gfs2_buffer_clear_tail(dibh,
592 sizeof(struct gfs2_dinode) +
593 sizeof(__be64));
594 ptr = (__be64 *)(mp->mp_bh[i]->b_data +
595 sizeof(struct gfs2_meta_header));
596 *ptr = zero_bn;
597 state = ALLOC_GROW_DEPTH;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500598 for(i = branch_start; i < mp->mp_fheight; i++) {
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000599 if (mp->mp_bh[i] == NULL)
600 break;
601 brelse(mp->mp_bh[i]);
602 mp->mp_bh[i] = NULL;
603 }
Benjamin Marzinski5af4e7a2008-06-24 12:53:38 -0500604 i = branch_start;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000605 }
606 if (n == 0)
607 break;
608 /* Branching from existing tree */
609 case ALLOC_GROW_DEPTH:
Bob Peterson5f8bd442016-10-28 14:29:29 -0500610 if (i > 1 && i < mp->mp_fheight)
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000611 gfs2_trans_add_meta(ip->i_gl, mp->mp_bh[i-1]);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500612 for (; i < mp->mp_fheight && n > 0; i++, n--)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000613 gfs2_indirect_init(mp, ip->i_gl, i,
614 mp->mp_list[i-1], bn++);
Bob Peterson5f8bd442016-10-28 14:29:29 -0500615 if (i == mp->mp_fheight)
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000616 state = ALLOC_DATA;
617 if (n == 0)
618 break;
619 /* Tree complete, adding data blocks */
620 case ALLOC_DATA:
Bob Peterson39743202017-02-16 10:27:16 -0500621 BUG_ON(n > dblks);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000622 BUG_ON(mp->mp_bh[end_of_metadata] == NULL);
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000623 gfs2_trans_add_meta(ip->i_gl, mp->mp_bh[end_of_metadata]);
Bob Peterson39743202017-02-16 10:27:16 -0500624 dblks = n;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000625 ptr = metapointer(end_of_metadata, mp);
Bob Peterson39743202017-02-16 10:27:16 -0500626 iomap->addr = bn << inode->i_blkbits;
627 iomap->flags |= IOMAP_F_NEW;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000628 while (n-- > 0)
629 *ptr++ = cpu_to_be64(bn++);
Bob Peterson39743202017-02-16 10:27:16 -0500630 if (flags & IOMAP_ZERO) {
631 ret = sb_issue_zeroout(sb, iomap->addr >> inode->i_blkbits,
632 dblks, GFP_NOFS);
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500633 if (ret) {
634 fs_err(sdp,
635 "Failed to zero data buffers\n");
Bob Peterson39743202017-02-16 10:27:16 -0500636 flags &= ~IOMAP_ZERO;
Benjamin Marzinski64dd1532011-09-12 18:15:24 -0500637 }
638 }
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000639 break;
640 }
Bob Peterson39743202017-02-16 10:27:16 -0500641 } while (iomap->addr == IOMAP_NULL_ADDR);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000642
Bob Peterson39743202017-02-16 10:27:16 -0500643 iomap->length = (u64)dblks << inode->i_blkbits;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500644 ip->i_height = mp->mp_fheight;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000645 gfs2_add_inode_blocks(&ip->i_inode, alloced);
646 gfs2_dinode_out(ip, mp->mp_bh[0]->b_data);
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000647 return 0;
648}
649
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500650/**
Bob Peterson39743202017-02-16 10:27:16 -0500651 * hole_size - figure out the size of a hole
652 * @inode: The inode
653 * @lblock: The logical starting block number
654 * @mp: The metapath
655 *
656 * Returns: The hole size in bytes
657 *
658 */
659static u64 hole_size(struct inode *inode, sector_t lblock, struct metapath *mp)
660{
661 struct gfs2_inode *ip = GFS2_I(inode);
662 struct gfs2_sbd *sdp = GFS2_SB(inode);
663 struct metapath mp_eof;
664 u64 factor = 1;
665 int hgt;
666 u64 holesz = 0;
667 const __be64 *first, *end, *ptr;
668 const struct buffer_head *bh;
669 u64 lblock_stop = (i_size_read(inode) - 1) >> inode->i_blkbits;
670 int zeroptrs;
671 bool done = false;
672
673 /* Get another metapath, to the very last byte */
674 find_metapath(sdp, lblock_stop, &mp_eof, ip->i_height);
675 for (hgt = ip->i_height - 1; hgt >= 0 && !done; hgt--) {
676 bh = mp->mp_bh[hgt];
677 if (bh) {
678 zeroptrs = 0;
679 first = metapointer(hgt, mp);
680 end = (const __be64 *)(bh->b_data + bh->b_size);
681
682 for (ptr = first; ptr < end; ptr++) {
683 if (*ptr) {
684 done = true;
685 break;
686 } else {
687 zeroptrs++;
688 }
689 }
690 } else {
691 zeroptrs = sdp->sd_inptrs;
692 }
693 if (factor * zeroptrs >= lblock_stop - lblock + 1) {
694 holesz = lblock_stop - lblock + 1;
695 break;
696 }
697 holesz += factor * zeroptrs;
698
699 factor *= sdp->sd_inptrs;
700 if (hgt && (mp->mp_list[hgt - 1] < mp_eof.mp_list[hgt - 1]))
701 (mp->mp_list[hgt - 1])++;
702 }
703 return holesz << inode->i_blkbits;
704}
705
706static void gfs2_stuffed_iomap(struct inode *inode, struct iomap *iomap)
707{
708 struct gfs2_inode *ip = GFS2_I(inode);
709
710 iomap->addr = (ip->i_no_addr << inode->i_blkbits) +
711 sizeof(struct gfs2_dinode);
712 iomap->offset = 0;
713 iomap->length = i_size_read(inode);
714 iomap->type = IOMAP_MAPPED;
715 iomap->flags = IOMAP_F_DATA_INLINE;
716}
717
718/**
719 * gfs2_iomap_begin - Map blocks from an inode to disk blocks
720 * @inode: The inode
721 * @pos: Starting position in bytes
722 * @length: Length to map, in bytes
723 * @flags: iomap flags
724 * @iomap: The iomap structure
725 *
726 * Returns: errno
727 */
728int gfs2_iomap_begin(struct inode *inode, loff_t pos, loff_t length,
729 unsigned flags, struct iomap *iomap)
730{
731 struct gfs2_inode *ip = GFS2_I(inode);
732 struct gfs2_sbd *sdp = GFS2_SB(inode);
733 struct metapath mp = { .mp_aheight = 1, };
734 unsigned int factor = sdp->sd_sb.sb_bsize;
735 const u64 *arr = sdp->sd_heightsize;
736 __be64 *ptr;
737 sector_t lblock;
738 sector_t lend;
739 int ret;
740 int eob;
741 unsigned int len;
742 struct buffer_head *bh;
743 u8 height;
744
745 trace_gfs2_iomap_start(ip, pos, length, flags);
746 if (!length) {
747 ret = -EINVAL;
748 goto out;
749 }
750
751 if ((flags & IOMAP_REPORT) && gfs2_is_stuffed(ip)) {
752 gfs2_stuffed_iomap(inode, iomap);
753 if (pos >= iomap->length)
754 return -ENOENT;
755 ret = 0;
756 goto out;
757 }
758
759 lblock = pos >> inode->i_blkbits;
760 lend = (pos + length + sdp->sd_sb.sb_bsize - 1) >> inode->i_blkbits;
761
762 iomap->offset = lblock << inode->i_blkbits;
763 iomap->addr = IOMAP_NULL_ADDR;
764 iomap->type = IOMAP_HOLE;
765 iomap->length = (u64)(lend - lblock) << inode->i_blkbits;
766 iomap->flags = IOMAP_F_MERGED;
767 bmap_lock(ip, 0);
768
769 /*
770 * Directory data blocks have a struct gfs2_meta_header header, so the
771 * remaining size is smaller than the filesystem block size. Logical
772 * block numbers for directories are in units of this remaining size!
773 */
774 if (gfs2_is_dir(ip)) {
775 factor = sdp->sd_jbsize;
776 arr = sdp->sd_jheightsize;
777 }
778
779 ret = gfs2_meta_inode_buffer(ip, &mp.mp_bh[0]);
780 if (ret)
781 goto out_release;
782
783 height = ip->i_height;
784 while ((lblock + 1) * factor > arr[height])
785 height++;
786 find_metapath(sdp, lblock, &mp, height);
787 if (height > ip->i_height || gfs2_is_stuffed(ip))
788 goto do_alloc;
789
790 ret = lookup_metapath(ip, &mp);
791 if (ret < 0)
792 goto out_release;
793
794 if (mp.mp_aheight != ip->i_height)
795 goto do_alloc;
796
797 ptr = metapointer(ip->i_height - 1, &mp);
798 if (*ptr == 0)
799 goto do_alloc;
800
801 iomap->type = IOMAP_MAPPED;
802 iomap->addr = be64_to_cpu(*ptr) << inode->i_blkbits;
803
804 bh = mp.mp_bh[ip->i_height - 1];
805 len = gfs2_extent_length(bh->b_data, bh->b_size, ptr, lend - lblock, &eob);
806 if (eob)
807 iomap->flags |= IOMAP_F_BOUNDARY;
808 iomap->length = (u64)len << inode->i_blkbits;
809
810 ret = 0;
811
812out_release:
813 release_metapath(&mp);
814 bmap_unlock(ip, 0);
815out:
816 trace_gfs2_iomap_end(ip, iomap, ret);
817 return ret;
818
819do_alloc:
820 if (!(flags & IOMAP_WRITE)) {
821 if (pos >= i_size_read(inode)) {
822 ret = -ENOENT;
823 goto out_release;
824 }
825 ret = 0;
826 iomap->length = hole_size(inode, lblock, &mp);
827 goto out_release;
828 }
829
830 ret = gfs2_iomap_alloc(inode, iomap, flags, &mp);
831 goto out_release;
832}
833
834/**
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500835 * gfs2_block_map - Map a block from an inode to a disk block
836 * @inode: The inode
837 * @lblock: The logical block number
838 * @bh_map: The bh to be mapped
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000839 * @create: True if its ok to alloc blocks to satify the request
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500840 *
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000841 * Sets buffer_mapped() if successful, sets buffer_boundary() if a
842 * read of metadata will be required before the next block can be
843 * mapped. Sets buffer_new() if new blocks were allocated.
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500844 *
845 * Returns: errno
846 */
847
Bob Petersone9e1ef22007-12-10 14:13:27 -0600848int gfs2_block_map(struct inode *inode, sector_t lblock,
849 struct buffer_head *bh_map, int create)
Steven Whitehousefd88de562006-05-05 16:59:11 -0400850{
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500851 struct gfs2_inode *ip = GFS2_I(inode);
Bob Peterson39743202017-02-16 10:27:16 -0500852 struct iomap iomap;
853 int ret, flags = 0;
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +0000854
Steven Whitehouse4cf1ed82006-11-15 15:21:06 -0500855 clear_buffer_mapped(bh_map);
856 clear_buffer_new(bh_map);
857 clear_buffer_boundary(bh_map);
Steven Whitehouse63997772009-06-12 08:49:20 +0100858 trace_gfs2_bmap(ip, bh_map, lblock, create, 1);
Andreas Gruenbacher20cdc192017-09-22 07:39:54 -0500859
Bob Peterson39743202017-02-16 10:27:16 -0500860 if (create)
861 flags |= IOMAP_WRITE;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500862 if (buffer_zeronew(bh_map))
Bob Peterson39743202017-02-16 10:27:16 -0500863 flags |= IOMAP_ZERO;
864 ret = gfs2_iomap_begin(inode, (loff_t)lblock << inode->i_blkbits,
865 bh_map->b_size, flags, &iomap);
866 if (ret) {
867 if (!create && ret == -ENOENT) {
868 /* Return unmapped buffer beyond the end of file. */
869 ret = 0;
870 }
871 goto out;
Bob Peterson5f8bd442016-10-28 14:29:29 -0500872 }
Bob Peterson39743202017-02-16 10:27:16 -0500873
874 if (iomap.length > bh_map->b_size) {
875 iomap.length = bh_map->b_size;
876 iomap.flags &= ~IOMAP_F_BOUNDARY;
877 }
878 if (iomap.addr != IOMAP_NULL_ADDR)
879 map_bh(bh_map, inode->i_sb, iomap.addr >> inode->i_blkbits);
880 bh_map->b_size = iomap.length;
881 if (iomap.flags & IOMAP_F_BOUNDARY)
882 set_buffer_boundary(bh_map);
883 if (iomap.flags & IOMAP_F_NEW)
884 set_buffer_new(bh_map);
885
886out:
887 trace_gfs2_bmap(ip, bh_map, lblock, create, ret);
888 return ret;
Steven Whitehousefd88de562006-05-05 16:59:11 -0400889}
890
Steven Whitehouse941e6d72008-01-28 08:47:38 +0000891/*
892 * Deprecated: do not use in new code
893 */
Steven Whitehousefd88de562006-05-05 16:59:11 -0400894int gfs2_extent_map(struct inode *inode, u64 lblock, int *new, u64 *dblock, unsigned *extlen)
895{
Steven Whitehouse23591252006-10-13 17:25:45 -0400896 struct buffer_head bh = { .b_state = 0, .b_blocknr = 0 };
Steven Whitehouse7a6bbac2006-09-18 17:18:23 -0400897 int ret;
Steven Whitehousefd88de562006-05-05 16:59:11 -0400898 int create = *new;
899
900 BUG_ON(!extlen);
901 BUG_ON(!dblock);
902 BUG_ON(!new);
903
Fabian Frederick47a9a522016-08-02 12:05:27 -0500904 bh.b_size = BIT(inode->i_blkbits + (create ? 0 : 5));
Bob Petersone9e1ef22007-12-10 14:13:27 -0600905 ret = gfs2_block_map(inode, lblock, &bh, create);
Steven Whitehouse7a6bbac2006-09-18 17:18:23 -0400906 *extlen = bh.b_size >> inode->i_blkbits;
907 *dblock = bh.b_blocknr;
908 if (buffer_new(&bh))
909 *new = 1;
910 else
911 *new = 0;
912 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000913}
914
915/**
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400916 * gfs2_block_truncate_page - Deal with zeroing out data for truncate
917 *
918 * This is partly borrowed from ext3.
919 */
Steven Whitehouseff8f33c2010-08-11 09:37:53 +0100920static int gfs2_block_truncate_page(struct address_space *mapping, loff_t from)
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400921{
922 struct inode *inode = mapping->host;
923 struct gfs2_inode *ip = GFS2_I(inode);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300924 unsigned long index = from >> PAGE_SHIFT;
925 unsigned offset = from & (PAGE_SIZE-1);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400926 unsigned blocksize, iblock, length, pos;
927 struct buffer_head *bh;
928 struct page *page;
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400929 int err;
930
Bob Peterson220cca22012-03-19 15:25:50 -0400931 page = find_or_create_page(mapping, index, GFP_NOFS);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400932 if (!page)
933 return 0;
934
935 blocksize = inode->i_sb->s_blocksize;
936 length = blocksize - (offset & (blocksize - 1));
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300937 iblock = index << (PAGE_SHIFT - inode->i_sb->s_blocksize_bits);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400938
939 if (!page_has_buffers(page))
940 create_empty_buffers(page, blocksize, 0);
941
942 /* Find the buffer that contains "offset" */
943 bh = page_buffers(page);
944 pos = blocksize;
945 while (offset >= pos) {
946 bh = bh->b_this_page;
947 iblock++;
948 pos += blocksize;
949 }
950
951 err = 0;
952
953 if (!buffer_mapped(bh)) {
Bob Petersone9e1ef22007-12-10 14:13:27 -0600954 gfs2_block_map(inode, iblock, bh, 0);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400955 /* unmapped? It's a hole - nothing to do */
956 if (!buffer_mapped(bh))
957 goto unlock;
958 }
959
960 /* Ok, it's mapped. Make sure it's up-to-date */
961 if (PageUptodate(page))
962 set_buffer_uptodate(bh);
963
964 if (!buffer_uptodate(bh)) {
965 err = -EIO;
Mike Christiedfec8a12016-06-05 14:31:44 -0500966 ll_rw_block(REQ_OP_READ, 0, 1, &bh);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400967 wait_on_buffer(bh);
968 /* Uhhuh. Read error. Complain and punt. */
969 if (!buffer_uptodate(bh))
970 goto unlock;
S. Wendy Cheng1875f2f2007-06-25 21:14:31 -0400971 err = 0;
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400972 }
973
Steven Whitehousebf36a712007-10-17 08:35:19 +0100974 if (!gfs2_is_writeback(ip))
Steven Whitehouse350a9b02012-12-14 12:36:02 +0000975 gfs2_trans_add_data(ip->i_gl, bh);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400976
Christoph Lametereebd2aa2008-02-04 22:28:29 -0800977 zero_user(page, offset, length);
Steven Whitehouse40bc9a22009-06-10 09:09:40 +0100978 mark_buffer_dirty(bh);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400979unlock:
980 unlock_page(page);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300981 put_page(page);
Steven Whitehouseba7f7292006-07-26 11:27:10 -0400982 return err;
983}
984
Fabian Frederickc62baf62014-05-14 18:32:31 +0200985#define GFS2_JTRUNC_REVOKES 8192
986
Steven Whitehousefa731fc2012-11-13 09:50:28 +0000987/**
988 * gfs2_journaled_truncate - Wrapper for truncate_pagecache for jdata files
989 * @inode: The inode being truncated
990 * @oldsize: The original (larger) size
991 * @newsize: The new smaller size
992 *
993 * With jdata files, we have to journal a revoke for each block which is
994 * truncated. As a result, we need to split this into separate transactions
995 * if the number of pages being truncated gets too large.
996 */
997
Steven Whitehousefa731fc2012-11-13 09:50:28 +0000998static int gfs2_journaled_truncate(struct inode *inode, u64 oldsize, u64 newsize)
999{
1000 struct gfs2_sbd *sdp = GFS2_SB(inode);
1001 u64 max_chunk = GFS2_JTRUNC_REVOKES * sdp->sd_vfs->s_blocksize;
1002 u64 chunk;
1003 int error;
1004
1005 while (oldsize != newsize) {
1006 chunk = oldsize - newsize;
1007 if (chunk > max_chunk)
1008 chunk = max_chunk;
Kirill A. Shutemov7caef262013-09-12 15:13:56 -07001009 truncate_pagecache(inode, oldsize - chunk);
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001010 oldsize -= chunk;
1011 gfs2_trans_end(sdp);
1012 error = gfs2_trans_begin(sdp, RES_DINODE, GFS2_JTRUNC_REVOKES);
1013 if (error)
1014 return error;
1015 }
1016
1017 return 0;
1018}
1019
Andreas Gruenbacher8b5860a2017-12-12 20:49:05 +01001020static int trunc_start(struct inode *inode, u64 newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001021{
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001022 struct gfs2_inode *ip = GFS2_I(inode);
1023 struct gfs2_sbd *sdp = GFS2_SB(inode);
1024 struct address_space *mapping = inode->i_mapping;
Andreas Gruenbacher80990f42017-12-12 16:42:01 +01001025 struct buffer_head *dibh = NULL;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001026 int journaled = gfs2_is_jdata(ip);
Andreas Gruenbacher8b5860a2017-12-12 20:49:05 +01001027 u64 oldsize = inode->i_size;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001028 int error;
1029
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001030 if (journaled)
1031 error = gfs2_trans_begin(sdp, RES_DINODE + RES_JDATA, GFS2_JTRUNC_REVOKES);
1032 else
1033 error = gfs2_trans_begin(sdp, RES_DINODE, 0);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001034 if (error)
1035 return error;
1036
1037 error = gfs2_meta_inode_buffer(ip, &dibh);
1038 if (error)
1039 goto out;
1040
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001041 gfs2_trans_add_meta(ip->i_gl, dibh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001042
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001043 if (gfs2_is_stuffed(ip)) {
1044 gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode) + newsize);
1045 } else {
1046 if (newsize & (u64)(sdp->sd_sb.sb_bsize - 1)) {
1047 error = gfs2_block_truncate_page(mapping, newsize);
1048 if (error)
Andreas Gruenbacher80990f42017-12-12 16:42:01 +01001049 goto out;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001050 }
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001051 ip->i_diskflags |= GFS2_DIF_TRUNC_IN_PROG;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001052 }
1053
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001054 i_size_write(inode, newsize);
Deepa Dinamani078cd822016-09-14 07:48:04 -07001055 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001056 gfs2_dinode_out(ip, dibh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001057
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001058 if (journaled)
1059 error = gfs2_journaled_truncate(inode, oldsize, newsize);
1060 else
Kirill A. Shutemov7caef262013-09-12 15:13:56 -07001061 truncate_pagecache(inode, newsize);
Steven Whitehousefa731fc2012-11-13 09:50:28 +00001062
Steven Whitehousea91ea692006-09-04 12:04:26 -04001063out:
Andreas Gruenbacher80990f42017-12-12 16:42:01 +01001064 brelse(dibh);
1065 if (current->journal_info)
1066 gfs2_trans_end(sdp);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001067 return error;
1068}
1069
Bob Petersond552a2b2017-02-06 08:28:32 -05001070/**
1071 * sweep_bh_for_rgrps - find an rgrp in a meta buffer and free blocks therein
1072 * @ip: inode
1073 * @rg_gh: holder of resource group glock
1074 * @mp: current metapath fully populated with buffers
1075 * @btotal: place to keep count of total blocks freed
1076 * @hgt: height we're processing
1077 * @first: true if this is the first call to this function for this height
1078 *
1079 * We sweep a metadata buffer (provided by the metapath) for blocks we need to
1080 * free, and free them all. However, we do it one rgrp at a time. If this
1081 * block has references to multiple rgrps, we break it into individual
1082 * transactions. This allows other processes to use the rgrps while we're
1083 * focused on a single one, for better concurrency / performance.
1084 * At every transaction boundary, we rewrite the inode into the journal.
1085 * That way the bitmaps are kept consistent with the inode and we can recover
1086 * if we're interrupted by power-outages.
1087 *
1088 * Returns: 0, or return code if an error occurred.
1089 * *btotal has the total number of blocks freed
1090 */
1091static int sweep_bh_for_rgrps(struct gfs2_inode *ip, struct gfs2_holder *rd_gh,
1092 const struct metapath *mp, u32 *btotal, int hgt,
1093 bool preserve1)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001094{
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +00001095 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Bob Petersond552a2b2017-02-06 08:28:32 -05001096 struct gfs2_rgrpd *rgd;
1097 struct gfs2_trans *tr;
1098 struct buffer_head *bh = mp->mp_bh[hgt];
1099 __be64 *top, *bottom, *p;
1100 int blks_outside_rgrp;
1101 u64 bn, bstart, isize_blks;
1102 s64 blen; /* needs to be s64 or gfs2_add_inode_blocks breaks */
1103 int meta = ((hgt != ip->i_height - 1) ? 1 : 0);
1104 int ret = 0;
1105 bool buf_in_tr = false; /* buffer was added to transaction */
David Teiglandb3b94fa2006-01-16 16:50:04 +00001106
Bob Petersond552a2b2017-02-06 08:28:32 -05001107 if (gfs2_metatype_check(sdp, bh,
1108 (hgt ? GFS2_METATYPE_IN : GFS2_METATYPE_DI)))
1109 return -EIO;
1110
1111more_rgrps:
1112 blks_outside_rgrp = 0;
1113 bstart = 0;
1114 blen = 0;
1115 top = metapointer(hgt, mp); /* first ptr from metapath */
1116 /* If we're keeping some data at the truncation point, we've got to
1117 preserve the metadata tree by adding 1 to the starting metapath. */
1118 if (preserve1)
1119 top++;
1120
1121 bottom = (__be64 *)(bh->b_data + bh->b_size);
1122
1123 for (p = top; p < bottom; p++) {
1124 if (!*p)
1125 continue;
1126 bn = be64_to_cpu(*p);
1127 if (gfs2_holder_initialized(rd_gh)) {
Andreas Gruenbacher6f6597ba2017-06-30 07:55:08 -05001128 rgd = gfs2_glock2rgrp(rd_gh->gh_gl);
Bob Petersond552a2b2017-02-06 08:28:32 -05001129 gfs2_assert_withdraw(sdp,
1130 gfs2_glock_is_locked_by_me(rd_gh->gh_gl));
1131 } else {
Steven Whitehouse90bcab92017-12-22 13:13:07 +01001132 rgd = gfs2_blk2rgrpd(sdp, bn, true);
Bob Petersond552a2b2017-02-06 08:28:32 -05001133 ret = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_EXCLUSIVE,
1134 0, rd_gh);
1135 if (ret)
1136 goto out;
1137
1138 /* Must be done with the rgrp glock held: */
1139 if (gfs2_rs_active(&ip->i_res) &&
1140 rgd == ip->i_res.rs_rbm.rgd)
1141 gfs2_rs_deltree(&ip->i_res);
1142 }
1143
1144 if (!rgrp_contains_block(rgd, bn)) {
1145 blks_outside_rgrp++;
1146 continue;
1147 }
1148
1149 /* The size of our transactions will be unknown until we
1150 actually process all the metadata blocks that relate to
1151 the rgrp. So we estimate. We know it can't be more than
1152 the dinode's i_blocks and we don't want to exceed the
1153 journal flush threshold, sd_log_thresh2. */
1154 if (current->journal_info == NULL) {
1155 unsigned int jblocks_rqsted, revokes;
1156
1157 jblocks_rqsted = rgd->rd_length + RES_DINODE +
1158 RES_INDIRECT;
1159 isize_blks = gfs2_get_inode_blocks(&ip->i_inode);
1160 if (isize_blks > atomic_read(&sdp->sd_log_thresh2))
1161 jblocks_rqsted +=
1162 atomic_read(&sdp->sd_log_thresh2);
1163 else
1164 jblocks_rqsted += isize_blks;
1165 revokes = jblocks_rqsted;
1166 if (meta)
1167 revokes += hptrs(sdp, hgt);
1168 else if (ip->i_depth)
1169 revokes += sdp->sd_inptrs;
1170 ret = gfs2_trans_begin(sdp, jblocks_rqsted, revokes);
1171 if (ret)
1172 goto out_unlock;
1173 down_write(&ip->i_rw_mutex);
1174 }
1175 /* check if we will exceed the transaction blocks requested */
1176 tr = current->journal_info;
1177 if (tr->tr_num_buf_new + RES_STATFS +
1178 RES_QUOTA >= atomic_read(&sdp->sd_log_thresh2)) {
1179 /* We set blks_outside_rgrp to ensure the loop will
1180 be repeated for the same rgrp, but with a new
1181 transaction. */
1182 blks_outside_rgrp++;
1183 /* This next part is tricky. If the buffer was added
1184 to the transaction, we've already set some block
1185 pointers to 0, so we better follow through and free
1186 them, or we will introduce corruption (so break).
1187 This may be impossible, or at least rare, but I
1188 decided to cover the case regardless.
1189
1190 If the buffer was not added to the transaction
1191 (this call), doing so would exceed our transaction
1192 size, so we need to end the transaction and start a
1193 new one (so goto). */
1194
1195 if (buf_in_tr)
1196 break;
1197 goto out_unlock;
1198 }
1199
1200 gfs2_trans_add_meta(ip->i_gl, bh);
1201 buf_in_tr = true;
1202 *p = 0;
1203 if (bstart + blen == bn) {
1204 blen++;
1205 continue;
1206 }
1207 if (bstart) {
1208 __gfs2_free_blocks(ip, bstart, (u32)blen, meta);
1209 (*btotal) += blen;
1210 gfs2_add_inode_blocks(&ip->i_inode, -blen);
1211 }
1212 bstart = bn;
1213 blen = 1;
1214 }
1215 if (bstart) {
1216 __gfs2_free_blocks(ip, bstart, (u32)blen, meta);
1217 (*btotal) += blen;
1218 gfs2_add_inode_blocks(&ip->i_inode, -blen);
1219 }
1220out_unlock:
1221 if (!ret && blks_outside_rgrp) { /* If buffer still has non-zero blocks
1222 outside the rgrp we just processed,
1223 do it all over again. */
1224 if (current->journal_info) {
1225 struct buffer_head *dibh = mp->mp_bh[0];
1226
1227 /* Every transaction boundary, we rewrite the dinode
1228 to keep its di_blocks current in case of failure. */
1229 ip->i_inode.i_mtime = ip->i_inode.i_ctime =
Stephen Rothwellb32c8c72017-05-08 15:59:34 -07001230 current_time(&ip->i_inode);
Bob Petersond552a2b2017-02-06 08:28:32 -05001231 gfs2_trans_add_meta(ip->i_gl, dibh);
1232 gfs2_dinode_out(ip, dibh->b_data);
1233 up_write(&ip->i_rw_mutex);
1234 gfs2_trans_end(sdp);
1235 }
1236 gfs2_glock_dq_uninit(rd_gh);
1237 cond_resched();
1238 goto more_rgrps;
1239 }
1240out:
1241 return ret;
1242}
1243
1244/**
1245 * find_nonnull_ptr - find a non-null pointer given a metapath and height
1246 * assumes the metapath is valid (with buffers) out to height h
1247 * @mp: starting metapath
1248 * @h: desired height to search
1249 *
1250 * Returns: true if a non-null pointer was found in the metapath buffer
1251 * false if all remaining pointers are NULL in the buffer
1252 */
1253static bool find_nonnull_ptr(struct gfs2_sbd *sdp, struct metapath *mp,
1254 unsigned int h)
1255{
1256 __be64 *ptr;
1257 unsigned int ptrs = hptrs(sdp, h) - 1;
1258
1259 while (true) {
1260 ptr = metapointer(h, mp);
Bob Petersonc4a9d182017-08-30 09:26:09 -05001261 if (*ptr) { /* if we have a non-null pointer */
1262 /* Now zero the metapath after the current height. */
1263 h++;
1264 if (h < GFS2_MAX_META_HEIGHT)
1265 memset(&mp->mp_list[h], 0,
1266 (GFS2_MAX_META_HEIGHT - h) *
1267 sizeof(mp->mp_list[0]));
Bob Petersond552a2b2017-02-06 08:28:32 -05001268 return true;
Bob Petersonc4a9d182017-08-30 09:26:09 -05001269 }
Bob Petersond552a2b2017-02-06 08:28:32 -05001270
1271 if (mp->mp_list[h] < ptrs)
1272 mp->mp_list[h]++;
1273 else
1274 return false; /* no more pointers in this buffer */
1275 }
1276}
1277
/* States of the loop in trunc_dealloc() */
enum dealloc_states {
	/* Strip a metapath with all buffers read in */
	DEALLOC_MP_FULL = 0,
	/* Lower the metapath strip height */
	DEALLOC_MP_LOWER,
	/* Fill in the metapath to the given height */
	DEALLOC_FILL_MP,
	/* Process complete */
	DEALLOC_DONE,
};
1284
Bob Petersonc4a9d182017-08-30 09:26:09 -05001285static bool mp_eq_to_hgt(struct metapath *mp, __u16 *nbof, unsigned int h)
1286{
1287 if (memcmp(mp->mp_list, nbof, h * sizeof(mp->mp_list[0])))
1288 return false;
1289 return true;
1290}
1291
Bob Petersond552a2b2017-02-06 08:28:32 -05001292/**
1293 * trunc_dealloc - truncate a file down to a desired size
1294 * @ip: inode to truncate
1295 * @newsize: The desired size of the file
1296 *
1297 * This function truncates a file to newsize. It works from the
1298 * bottom up, and from the right to the left. In other words, it strips off
1299 * the highest layer (data) before stripping any of the metadata. Doing it
1300 * this way is best in case the operation is interrupted by power failure, etc.
1301 * The dinode is rewritten in every transaction to guarantee integrity.
1302 */
1303static int trunc_dealloc(struct gfs2_inode *ip, u64 newsize)
1304{
1305 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1306 struct metapath mp;
1307 struct buffer_head *dibh, *bh;
1308 struct gfs2_holder rd_gh;
1309 u64 lblock;
1310 __u16 nbof[GFS2_MAX_META_HEIGHT]; /* new beginning of truncation */
1311 unsigned int strip_h = ip->i_height - 1;
1312 u32 btotal = 0;
1313 int ret, state;
1314 int mp_h; /* metapath buffers are read in to this height */
1315 sector_t last_ra = 0;
1316 u64 prev_bnr = 0;
1317 bool preserve1; /* need to preserve the first meta pointer? */
1318
1319 if (!newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001320 lblock = 0;
Steven Whitehouse18ec7d52006-02-08 11:50:51 +00001321 else
Bob Petersond552a2b2017-02-06 08:28:32 -05001322 lblock = (newsize - 1) >> sdp->sd_sb.sb_bsize_shift;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001323
Bob Petersond552a2b2017-02-06 08:28:32 -05001324 memset(&mp, 0, sizeof(mp));
Steven Whitehouse9b8c81d2008-02-22 16:09:31 +00001325 find_metapath(sdp, lblock, &mp, ip->i_height);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001326
Bob Petersond552a2b2017-02-06 08:28:32 -05001327 memcpy(&nbof, &mp.mp_list, sizeof(nbof));
David Teiglandb3b94fa2006-01-16 16:50:04 +00001328
Bob Petersond552a2b2017-02-06 08:28:32 -05001329 ret = gfs2_meta_inode_buffer(ip, &dibh);
1330 if (ret)
1331 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001332
Bob Petersond552a2b2017-02-06 08:28:32 -05001333 mp.mp_bh[0] = dibh;
1334 ret = lookup_metapath(ip, &mp);
1335 if (ret == ip->i_height)
1336 state = DEALLOC_MP_FULL; /* We have a complete metapath */
1337 else
1338 state = DEALLOC_FILL_MP; /* deal with partial metapath */
1339
1340 ret = gfs2_rindex_update(sdp);
1341 if (ret)
1342 goto out_metapath;
1343
1344 ret = gfs2_quota_hold(ip, NO_UID_QUOTA_CHANGE, NO_GID_QUOTA_CHANGE);
1345 if (ret)
1346 goto out_metapath;
1347 gfs2_holder_mark_uninitialized(&rd_gh);
1348
1349 mp_h = strip_h;
1350
1351 while (state != DEALLOC_DONE) {
1352 switch (state) {
1353 /* Truncate a full metapath at the given strip height.
1354 * Note that strip_h == mp_h in order to be in this state. */
1355 case DEALLOC_MP_FULL:
1356 if (mp_h > 0) { /* issue read-ahead on metadata */
1357 __be64 *top;
1358
1359 bh = mp.mp_bh[mp_h - 1];
1360 if (bh->b_blocknr != last_ra) {
1361 last_ra = bh->b_blocknr;
1362 top = metaptr1(mp_h - 1, &mp);
1363 gfs2_metapath_ra(ip->i_gl, bh, top);
1364 }
1365 }
1366 /* If we're truncating to a non-zero size and the mp is
1367 at the beginning of file for the strip height, we
1368 need to preserve the first metadata pointer. */
Bob Petersonc4a9d182017-08-30 09:26:09 -05001369 preserve1 = (newsize && mp_eq_to_hgt(&mp, nbof, mp_h));
Bob Petersond552a2b2017-02-06 08:28:32 -05001370 bh = mp.mp_bh[mp_h];
1371 gfs2_assert_withdraw(sdp, bh);
1372 if (gfs2_assert_withdraw(sdp,
1373 prev_bnr != bh->b_blocknr)) {
1374 printk(KERN_EMERG "GFS2: fsid=%s:inode %llu, "
1375 "block:%llu, i_h:%u, s_h:%u, mp_h:%u\n",
1376 sdp->sd_fsname,
1377 (unsigned long long)ip->i_no_addr,
1378 prev_bnr, ip->i_height, strip_h, mp_h);
1379 }
1380 prev_bnr = bh->b_blocknr;
1381 ret = sweep_bh_for_rgrps(ip, &rd_gh, &mp, &btotal,
1382 mp_h, preserve1);
1383 /* If we hit an error or just swept dinode buffer,
1384 just exit. */
1385 if (ret || !mp_h) {
1386 state = DEALLOC_DONE;
1387 break;
1388 }
1389 state = DEALLOC_MP_LOWER;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001390 break;
Bob Petersond552a2b2017-02-06 08:28:32 -05001391
1392 /* lower the metapath strip height */
1393 case DEALLOC_MP_LOWER:
1394 /* We're done with the current buffer, so release it,
1395 unless it's the dinode buffer. Then back up to the
1396 previous pointer. */
1397 if (mp_h) {
1398 brelse(mp.mp_bh[mp_h]);
1399 mp.mp_bh[mp_h] = NULL;
1400 }
1401 /* If we can't get any lower in height, we've stripped
1402 off all we can. Next step is to back up and start
1403 stripping the previous level of metadata. */
1404 if (mp_h == 0) {
1405 strip_h--;
1406 memcpy(&mp.mp_list, &nbof, sizeof(nbof));
1407 mp_h = strip_h;
1408 state = DEALLOC_FILL_MP;
1409 break;
1410 }
1411 mp.mp_list[mp_h] = 0;
1412 mp_h--; /* search one metadata height down */
1413 if (mp.mp_list[mp_h] >= hptrs(sdp, mp_h) - 1)
1414 break; /* loop around in the same state */
1415 mp.mp_list[mp_h]++;
1416 /* Here we've found a part of the metapath that is not
1417 * allocated. We need to search at that height for the
1418 * next non-null pointer. */
1419 if (find_nonnull_ptr(sdp, &mp, mp_h)) {
1420 state = DEALLOC_FILL_MP;
1421 mp_h++;
1422 }
1423 /* No more non-null pointers at this height. Back up
1424 to the previous height and try again. */
1425 break; /* loop around in the same state */
1426
1427 /* Fill the metapath with buffers to the given height. */
1428 case DEALLOC_FILL_MP:
1429 /* Fill the buffers out to the current height. */
1430 ret = fillup_metapath(ip, &mp, mp_h);
1431 if (ret < 0)
1432 goto out;
1433
1434 /* If buffers found for the entire strip height */
1435 if ((ret == ip->i_height) && (mp_h == strip_h)) {
1436 state = DEALLOC_MP_FULL;
1437 break;
1438 }
1439 if (ret < ip->i_height) /* We have a partial height */
1440 mp_h = ret - 1;
1441
1442 /* If we find a non-null block pointer, crawl a bit
1443 higher up in the metapath and try again, otherwise
1444 we need to look lower for a new starting point. */
1445 if (find_nonnull_ptr(sdp, &mp, mp_h))
1446 mp_h++;
1447 else
1448 state = DEALLOC_MP_LOWER;
1449 break;
1450 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001451 }
1452
Bob Petersond552a2b2017-02-06 08:28:32 -05001453 if (btotal) {
1454 if (current->journal_info == NULL) {
1455 ret = gfs2_trans_begin(sdp, RES_DINODE + RES_STATFS +
1456 RES_QUOTA, 0);
1457 if (ret)
1458 goto out;
1459 down_write(&ip->i_rw_mutex);
1460 }
1461 gfs2_statfs_change(sdp, 0, +btotal, 0);
1462 gfs2_quota_change(ip, -(s64)btotal, ip->i_inode.i_uid,
1463 ip->i_inode.i_gid);
Stephen Rothwellb32c8c72017-05-08 15:59:34 -07001464 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Bob Petersond552a2b2017-02-06 08:28:32 -05001465 gfs2_trans_add_meta(ip->i_gl, dibh);
1466 gfs2_dinode_out(ip, dibh->b_data);
1467 up_write(&ip->i_rw_mutex);
1468 gfs2_trans_end(sdp);
1469 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001470
Bob Petersond552a2b2017-02-06 08:28:32 -05001471out:
1472 if (gfs2_holder_initialized(&rd_gh))
1473 gfs2_glock_dq_uninit(&rd_gh);
1474 if (current->journal_info) {
1475 up_write(&ip->i_rw_mutex);
1476 gfs2_trans_end(sdp);
1477 cond_resched();
1478 }
1479 gfs2_quota_unhold(ip);
1480out_metapath:
1481 release_metapath(&mp);
1482 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001483}
1484
1485static int trunc_end(struct gfs2_inode *ip)
1486{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001487 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001488 struct buffer_head *dibh;
1489 int error;
1490
1491 error = gfs2_trans_begin(sdp, RES_DINODE, 0);
1492 if (error)
1493 return error;
1494
1495 down_write(&ip->i_rw_mutex);
1496
1497 error = gfs2_meta_inode_buffer(ip, &dibh);
1498 if (error)
1499 goto out;
1500
Steven Whitehousea2e0f792010-08-11 09:53:11 +01001501 if (!i_size_read(&ip->i_inode)) {
Steven Whitehouseecc30c72008-01-28 10:37:35 +00001502 ip->i_height = 0;
Steven Whitehousece276b02008-02-06 09:25:45 +00001503 ip->i_goal = ip->i_no_addr;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001504 gfs2_buffer_clear_tail(dibh, sizeof(struct gfs2_dinode));
Steven Whitehouse45138992013-01-28 09:30:07 +00001505 gfs2_ordered_del_inode(ip);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001506 }
Deepa Dinamani078cd822016-09-14 07:48:04 -07001507 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Steven Whitehouse383f01f2008-11-04 10:05:22 +00001508 ip->i_diskflags &= ~GFS2_DIF_TRUNC_IN_PROG;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001509
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001510 gfs2_trans_add_meta(ip->i_gl, dibh);
Steven Whitehouse539e5d62006-10-31 15:07:05 -05001511 gfs2_dinode_out(ip, dibh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001512 brelse(dibh);
1513
Steven Whitehousea91ea692006-09-04 12:04:26 -04001514out:
David Teiglandb3b94fa2006-01-16 16:50:04 +00001515 up_write(&ip->i_rw_mutex);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001516 gfs2_trans_end(sdp);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001517 return error;
1518}
1519
1520/**
1521 * do_shrink - make a file smaller
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001522 * @inode: the inode
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001523 * @newsize: the size to make the file
David Teiglandb3b94fa2006-01-16 16:50:04 +00001524 *
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001525 * Called with an exclusive lock on @inode. The @size must
1526 * be equal to or smaller than the current inode size.
David Teiglandb3b94fa2006-01-16 16:50:04 +00001527 *
1528 * Returns: errno
1529 */
1530
Andreas Gruenbacher8b5860a2017-12-12 20:49:05 +01001531static int do_shrink(struct inode *inode, u64 newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001532{
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001533 struct gfs2_inode *ip = GFS2_I(inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001534 int error;
1535
Andreas Gruenbacher8b5860a2017-12-12 20:49:05 +01001536 error = trunc_start(inode, newsize);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001537 if (error < 0)
1538 return error;
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001539 if (gfs2_is_stuffed(ip))
David Teiglandb3b94fa2006-01-16 16:50:04 +00001540 return 0;
1541
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001542 error = trunc_dealloc(ip, newsize);
1543 if (error == 0)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001544 error = trunc_end(ip);
1545
1546 return error;
1547}
1548
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001549void gfs2_trim_blocks(struct inode *inode)
Wendy Chenga13b8c52007-08-20 09:29:53 -04001550{
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001551 int ret;
1552
Andreas Gruenbacher8b5860a2017-12-12 20:49:05 +01001553 ret = do_shrink(inode, inode->i_size);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001554 WARN_ON(ret != 0);
1555}
1556
1557/**
1558 * do_grow - Touch and update inode size
1559 * @inode: The inode
1560 * @size: The new size
1561 *
1562 * This function updates the timestamps on the inode and
1563 * may also increase the size of the inode. This function
1564 * must not be called with @size any smaller than the current
1565 * inode size.
1566 *
1567 * Although it is not strictly required to unstuff files here,
1568 * earlier versions of GFS2 have a bug in the stuffed file reading
1569 * code which will result in a buffer overrun if the size is larger
1570 * than the max stuffed file size. In order to prevent this from
Lucas De Marchi25985ed2011-03-30 22:57:33 -03001571 * occurring, such files are unstuffed, but in other cases we can
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001572 * just update the inode size directly.
1573 *
1574 * Returns: 0 on success, or -ve on error
1575 */
1576
1577static int do_grow(struct inode *inode, u64 size)
1578{
1579 struct gfs2_inode *ip = GFS2_I(inode);
1580 struct gfs2_sbd *sdp = GFS2_SB(inode);
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001581 struct gfs2_alloc_parms ap = { .target = 1, };
Wendy Chenga13b8c52007-08-20 09:29:53 -04001582 struct buffer_head *dibh;
1583 int error;
Bob Peterson2f7ee352012-04-12 09:19:30 -04001584 int unstuff = 0;
Wendy Chenga13b8c52007-08-20 09:29:53 -04001585
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001586 if (gfs2_is_stuffed(ip) &&
1587 (size > (sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode)))) {
Abhi Dasb8fbf472015-03-18 12:03:41 -05001588 error = gfs2_quota_lock_check(ip, &ap);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001589 if (error)
Bob Peterson5407e242012-05-18 09:28:23 -04001590 return error;
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001591
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001592 error = gfs2_inplace_reserve(ip, &ap);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001593 if (error)
1594 goto do_grow_qunlock;
Bob Peterson2f7ee352012-04-12 09:19:30 -04001595 unstuff = 1;
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001596 }
1597
Bob Petersona01aedf2013-06-27 12:47:51 -04001598 error = gfs2_trans_begin(sdp, RES_DINODE + RES_STATFS + RES_RG_BIT +
1599 (sdp->sd_args.ar_quota == GFS2_QUOTA_OFF ?
1600 0 : RES_QUOTA), 0);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001601 if (error)
1602 goto do_grow_release;
1603
Bob Peterson2f7ee352012-04-12 09:19:30 -04001604 if (unstuff) {
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001605 error = gfs2_unstuff_dinode(ip, NULL);
1606 if (error)
1607 goto do_end_trans;
1608 }
Wendy Chenga13b8c52007-08-20 09:29:53 -04001609
1610 error = gfs2_meta_inode_buffer(ip, &dibh);
1611 if (error)
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001612 goto do_end_trans;
Wendy Chenga13b8c52007-08-20 09:29:53 -04001613
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001614 i_size_write(inode, size);
Deepa Dinamani078cd822016-09-14 07:48:04 -07001615 ip->i_inode.i_mtime = ip->i_inode.i_ctime = current_time(&ip->i_inode);
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001616 gfs2_trans_add_meta(ip->i_gl, dibh);
Wendy Chenga13b8c52007-08-20 09:29:53 -04001617 gfs2_dinode_out(ip, dibh->b_data);
1618 brelse(dibh);
1619
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001620do_end_trans:
Wendy Chenga13b8c52007-08-20 09:29:53 -04001621 gfs2_trans_end(sdp);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001622do_grow_release:
Bob Peterson2f7ee352012-04-12 09:19:30 -04001623 if (unstuff) {
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001624 gfs2_inplace_release(ip);
1625do_grow_qunlock:
1626 gfs2_quota_unlock(ip);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001627 }
Wendy Chenga13b8c52007-08-20 09:29:53 -04001628 return error;
1629}
1630
David Teiglandb3b94fa2006-01-16 16:50:04 +00001631/**
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001632 * gfs2_setattr_size - make a file a given size
1633 * @inode: the inode
1634 * @newsize: the size to make the file
David Teiglandb3b94fa2006-01-16 16:50:04 +00001635 *
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001636 * The file size can grow, shrink, or stay the same size. This
1637 * is called holding i_mutex and an exclusive glock on the inode
1638 * in question.
David Teiglandb3b94fa2006-01-16 16:50:04 +00001639 *
1640 * Returns: errno
1641 */
1642
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001643int gfs2_setattr_size(struct inode *inode, u64 newsize)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001644{
Steven Whitehouseaf5c2692013-09-27 12:49:33 +01001645 struct gfs2_inode *ip = GFS2_I(inode);
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001646 int ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001647
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001648 BUG_ON(!S_ISREG(inode->i_mode));
David Teiglandb3b94fa2006-01-16 16:50:04 +00001649
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001650 ret = inode_newsize_ok(inode, newsize);
1651 if (ret)
1652 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001653
Christoph Hellwig562c72a2011-06-24 14:29:45 -04001654 inode_dio_wait(inode);
1655
Bob Petersonb54e9a02015-10-26 10:40:28 -05001656 ret = gfs2_rsqa_alloc(ip);
Bob Petersond2b47cf2013-02-01 12:03:02 -05001657 if (ret)
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001658 goto out;
Bob Petersond2b47cf2013-02-01 12:03:02 -05001659
Andreas Gruenbacher8b5860a2017-12-12 20:49:05 +01001660 if (newsize >= inode->i_size) {
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001661 ret = do_grow(inode, newsize);
1662 goto out;
1663 }
Steven Whitehouseff8f33c2010-08-11 09:37:53 +01001664
Andreas Gruenbacher8b5860a2017-12-12 20:49:05 +01001665 ret = do_shrink(inode, newsize);
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001666out:
Bob Petersona097dc7e2015-07-16 08:28:04 -05001667 gfs2_rsqa_delete(ip, NULL);
Bob Peterson2b3dcf32013-05-28 10:04:44 -04001668 return ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001669}
1670
1671int gfs2_truncatei_resume(struct gfs2_inode *ip)
1672{
1673 int error;
Steven Whitehousea2e0f792010-08-11 09:53:11 +01001674 error = trunc_dealloc(ip, i_size_read(&ip->i_inode));
David Teiglandb3b94fa2006-01-16 16:50:04 +00001675 if (!error)
1676 error = trunc_end(ip);
1677 return error;
1678}
1679
/* Deallocate via trunc_dealloc() with a target size of zero. */
int gfs2_file_dealloc(struct gfs2_inode *ip)
{
	int ret = trunc_dealloc(ip, 0);

	return ret;
}
1684
1685/**
Steven Whitehouseb50f2272014-03-03 13:35:57 +00001686 * gfs2_free_journal_extents - Free cached journal bmap info
1687 * @jd: The journal
1688 *
1689 */
1690
1691void gfs2_free_journal_extents(struct gfs2_jdesc *jd)
1692{
1693 struct gfs2_journal_extent *jext;
1694
1695 while(!list_empty(&jd->extent_list)) {
1696 jext = list_entry(jd->extent_list.next, struct gfs2_journal_extent, list);
1697 list_del(&jext->list);
1698 kfree(jext);
1699 }
1700}
1701
1702/**
1703 * gfs2_add_jextent - Add or merge a new extent to extent cache
1704 * @jd: The journal descriptor
1705 * @lblock: The logical block at start of new extent
Fabian Frederickc62baf62014-05-14 18:32:31 +02001706 * @dblock: The physical block at start of new extent
Steven Whitehouseb50f2272014-03-03 13:35:57 +00001707 * @blocks: Size of extent in fs blocks
1708 *
1709 * Returns: 0 on success or -ENOMEM
1710 */
1711
1712static int gfs2_add_jextent(struct gfs2_jdesc *jd, u64 lblock, u64 dblock, u64 blocks)
1713{
1714 struct gfs2_journal_extent *jext;
1715
1716 if (!list_empty(&jd->extent_list)) {
1717 jext = list_entry(jd->extent_list.prev, struct gfs2_journal_extent, list);
1718 if ((jext->dblock + jext->blocks) == dblock) {
1719 jext->blocks += blocks;
1720 return 0;
1721 }
1722 }
1723
1724 jext = kzalloc(sizeof(struct gfs2_journal_extent), GFP_NOFS);
1725 if (jext == NULL)
1726 return -ENOMEM;
1727 jext->dblock = dblock;
1728 jext->lblock = lblock;
1729 jext->blocks = blocks;
1730 list_add_tail(&jext->list, &jd->extent_list);
1731 jd->nr_extents++;
1732 return 0;
1733}
1734
1735/**
1736 * gfs2_map_journal_extents - Cache journal bmap info
1737 * @sdp: The super block
1738 * @jd: The journal to map
1739 *
1740 * Create a reusable "extent" mapping from all logical
1741 * blocks to all physical blocks for the given journal. This will save
1742 * us time when writing journal blocks. Most journals will have only one
1743 * extent that maps all their logical blocks. That's because gfs2.mkfs
1744 * arranges the journal blocks sequentially to maximize performance.
1745 * So the extent would map the first block for the entire file length.
1746 * However, gfs2_jadd can happen while file activity is happening, so
1747 * those journals may not be sequential. Less likely is the case where
1748 * the users created their own journals by mounting the metafs and
1749 * laying it out. But it's still possible. These journals might have
1750 * several extents.
1751 *
1752 * Returns: 0 on success, or error on failure
1753 */
1754
1755int gfs2_map_journal_extents(struct gfs2_sbd *sdp, struct gfs2_jdesc *jd)
1756{
1757 u64 lblock = 0;
1758 u64 lblock_stop;
1759 struct gfs2_inode *ip = GFS2_I(jd->jd_inode);
1760 struct buffer_head bh;
1761 unsigned int shift = sdp->sd_sb.sb_bsize_shift;
1762 u64 size;
1763 int rc;
1764
1765 lblock_stop = i_size_read(jd->jd_inode) >> shift;
1766 size = (lblock_stop - lblock) << shift;
1767 jd->nr_extents = 0;
1768 WARN_ON(!list_empty(&jd->extent_list));
1769
1770 do {
1771 bh.b_state = 0;
1772 bh.b_blocknr = 0;
1773 bh.b_size = size;
1774 rc = gfs2_block_map(jd->jd_inode, lblock, &bh, 0);
1775 if (rc || !buffer_mapped(&bh))
1776 goto fail;
1777 rc = gfs2_add_jextent(jd, lblock, bh.b_blocknr, bh.b_size >> shift);
1778 if (rc)
1779 goto fail;
1780 size -= bh.b_size;
1781 lblock += (bh.b_size >> ip->i_inode.i_blkbits);
1782 } while(size > 0);
1783
1784 fs_info(sdp, "journal %d mapped with %u extents\n", jd->jd_jid,
1785 jd->nr_extents);
1786 return 0;
1787
1788fail:
1789 fs_warn(sdp, "error %d mapping journal %u at offset %llu (extent %u)\n",
1790 rc, jd->jd_jid,
1791 (unsigned long long)(i_size_read(jd->jd_inode) - size),
1792 jd->nr_extents);
1793 fs_warn(sdp, "bmap=%d lblock=%llu block=%llu, state=0x%08lx, size=%llu\n",
1794 rc, (unsigned long long)lblock, (unsigned long long)bh.b_blocknr,
1795 bh.b_state, (unsigned long long)bh.b_size);
1796 gfs2_free_journal_extents(jd);
1797 return rc;
1798}
1799
1800/**
David Teiglandb3b94fa2006-01-16 16:50:04 +00001801 * gfs2_write_alloc_required - figure out if a write will require an allocation
1802 * @ip: the file being written to
1803 * @offset: the offset to write to
1804 * @len: the number of bytes being written
David Teiglandb3b94fa2006-01-16 16:50:04 +00001805 *
Bob Peterson461cb412010-06-24 19:21:20 -04001806 * Returns: 1 if an alloc is required, 0 otherwise
David Teiglandb3b94fa2006-01-16 16:50:04 +00001807 */
1808
Steven Whitehousecd915492006-09-04 12:49:07 -04001809int gfs2_write_alloc_required(struct gfs2_inode *ip, u64 offset,
Bob Peterson461cb412010-06-24 19:21:20 -04001810 unsigned int len)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001811{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001812 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001813 struct buffer_head bh;
1814 unsigned int shift;
1815 u64 lblock, lblock_stop, size;
Steven Whitehouse7ed122e2008-12-10 10:28:10 +00001816 u64 end_of_file;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001817
David Teiglandb3b94fa2006-01-16 16:50:04 +00001818 if (!len)
1819 return 0;
1820
1821 if (gfs2_is_stuffed(ip)) {
1822 if (offset + len >
1823 sdp->sd_sb.sb_bsize - sizeof(struct gfs2_dinode))
Bob Peterson461cb412010-06-24 19:21:20 -04001824 return 1;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001825 return 0;
1826 }
1827
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001828 shift = sdp->sd_sb.sb_bsize_shift;
Steven Whitehouse7ed122e2008-12-10 10:28:10 +00001829 BUG_ON(gfs2_is_dir(ip));
Steven Whitehousea2e0f792010-08-11 09:53:11 +01001830 end_of_file = (i_size_read(&ip->i_inode) + sdp->sd_sb.sb_bsize - 1) >> shift;
Steven Whitehouse7ed122e2008-12-10 10:28:10 +00001831 lblock = offset >> shift;
1832 lblock_stop = (offset + len + sdp->sd_sb.sb_bsize - 1) >> shift;
1833 if (lblock_stop > end_of_file)
Bob Peterson461cb412010-06-24 19:21:20 -04001834 return 1;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001835
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001836 size = (lblock_stop - lblock) << shift;
1837 do {
1838 bh.b_state = 0;
1839 bh.b_size = size;
1840 gfs2_block_map(&ip->i_inode, lblock, &bh, 0);
1841 if (!buffer_mapped(&bh))
Bob Peterson461cb412010-06-24 19:21:20 -04001842 return 1;
Steven Whitehouse941e6d72008-01-28 08:47:38 +00001843 size -= bh.b_size;
1844 lblock += (bh.b_size >> ip->i_inode.i_blkbits);
1845 } while(size > 0);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001846
1847 return 0;
1848}
1849