blob: 6af2396a317c3de22e9d8bd86e28246b28067523 [file] [log] [blame]
David Teiglandb3b94fa2006-01-16 16:50:04 +00001/*
2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
Bob Petersonfe6c9912008-01-28 11:13:02 -06003 * Copyright (C) 2004-2008 Red Hat, Inc. All rights reserved.
David Teiglandb3b94fa2006-01-16 16:50:04 +00004 *
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
Steven Whitehousee9fc2aa2006-09-01 11:05:15 -04007 * of the GNU General Public License version 2.
David Teiglandb3b94fa2006-01-16 16:50:04 +00008 */
9
Joe Perchesd77d1b52014-03-06 12:10:45 -080010#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
11
David Teiglandb3b94fa2006-01-16 16:50:04 +000012#include <linux/slab.h>
13#include <linux/spinlock.h>
14#include <linux/completion.h>
15#include <linux/buffer_head.h>
Steven Whitehousef42faf42006-01-30 18:34:10 +000016#include <linux/fs.h>
Steven Whitehouse5c676f62006-02-27 17:23:27 -050017#include <linux/gfs2_ondisk.h>
Bob Peterson1f466a42008-03-10 18:17:47 -050018#include <linux/prefetch.h>
Steven Whitehousef15ab562009-02-09 09:25:01 +000019#include <linux/blkdev.h>
Bob Peterson7c9ca622011-08-31 09:53:19 +010020#include <linux/rbtree.h>
Steven Whitehouse9dbe9612012-10-31 10:37:10 +000021#include <linux/random.h>
David Teiglandb3b94fa2006-01-16 16:50:04 +000022
23#include "gfs2.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050024#include "incore.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000025#include "glock.h"
26#include "glops.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000027#include "lops.h"
28#include "meta_io.h"
29#include "quota.h"
30#include "rgrp.h"
31#include "super.h"
32#include "trans.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050033#include "util.h"
Benjamin Marzinski172e0452007-03-23 14:51:56 -060034#include "log.h"
Steven Whitehousec8cdf472007-06-08 10:05:33 +010035#include "inode.h"
Steven Whitehouse63997772009-06-12 08:49:20 +010036#include "trace_gfs2.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000037
/* "Nothing found" sentinel returned by gfs2_bitfit(): all 32 bits set. */
#define BFITNOENT ((u32)~0)
/* All-ones 64-bit block number. */
#define NO_BLOCK ((u64)~0)

/*
 * unsigned long sized bit patterns.  0x55... has the low bit of every
 * two-bit bitmap entry set.
 */
#if BITS_PER_LONG != 32
#define LBITMASK   (0x5555555555555555UL)
#define LBITSKIP55 (0x5555555555555555UL)
#define LBITSKIP00 (0x0000000000000000UL)
#else
#define LBITMASK   (0x55555555UL)
#define LBITSKIP55 (0x55555555UL)
#define LBITSKIP00 (0x00000000UL)
#endif
50
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040051/*
52 * These routines are used by the resource group routines (rgrp.c)
53 * to keep track of block allocation. Each block is represented by two
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -040054 * bits. So, each byte represents GFS2_NBBY (i.e. 4) blocks.
55 *
56 * 0 = Free
57 * 1 = Used (not metadata)
58 * 2 = Unlinked (still in use) inode
59 * 3 = Used (metadata)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040060 */
61
/*
 * A position within a resource group's bitmaps (rbm) paired with a length.
 * NOTE(review): the users of this struct are outside this section; len is
 * presumably a count of blocks - confirm against the callers.
 */
struct gfs2_extent {
	struct gfs2_rbm rbm;
	u32 len;
};
66
/*
 * Table of permitted block state changes, looked up by gfs2_setbit() as
 * valid_change[new_state * 4 + cur_state]; a non-zero entry means the
 * change is allowed.  Each row is one new state (0..3), each column one
 * current state (0..3), with 0 = free, 1 = used, 2 = unlinked inode and
 * 3 = used metadata:
 *
 *   new 0: allowed from states 1, 2 and 3
 *   new 1: allowed from state 0 only
 *   new 2: allowed from state 3 only
 *   new 3: allowed from state 0 only
 */
static const char valid_change[16] = {
	        /* current */
	/* n */ 0, 1, 1, 1,
	/* e */ 1, 0, 0, 0,
	/* w */ 0, 0, 0, 1,
	        1, 0, 0, 0
};
74
/*
 * Forward declaration of a static function whose definition is not part
 * of this section of the file.
 */
static int gfs2_rbm_find(struct gfs2_rbm *rbm, u8 state, u32 *minext,
			 const struct gfs2_inode *ip, bool nowrap,
			 const struct gfs2_alloc_parms *ap);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +010078
79
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040080/**
81 * gfs2_setbit - Set a bit in the bitmaps
Steven Whitehouse3e6339d2012-08-13 11:37:51 +010082 * @rbm: The position of the bit to set
83 * @do_clone: Also set the clone bitmap, if it exists
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040084 * @new_state: the new state of the block
85 *
86 */
87
Steven Whitehouse3e6339d2012-08-13 11:37:51 +010088static inline void gfs2_setbit(const struct gfs2_rbm *rbm, bool do_clone,
Bob Peterson06344b92012-04-26 12:44:35 -040089 unsigned char new_state)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040090{
Steven Whitehouseb45e41d2008-02-06 10:11:15 +000091 unsigned char *byte1, *byte2, *end, cur_state;
Bob Petersone579ed42013-09-17 13:12:15 -040092 struct gfs2_bitmap *bi = rbm_bi(rbm);
93 unsigned int buflen = bi->bi_len;
Steven Whitehouse3e6339d2012-08-13 11:37:51 +010094 const unsigned int bit = (rbm->offset % GFS2_NBBY) * GFS2_BIT_SIZE;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040095
Bob Petersone579ed42013-09-17 13:12:15 -040096 byte1 = bi->bi_bh->b_data + bi->bi_offset + (rbm->offset / GFS2_NBBY);
97 end = bi->bi_bh->b_data + bi->bi_offset + buflen;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040098
Steven Whitehouseb45e41d2008-02-06 10:11:15 +000099 BUG_ON(byte1 >= end);
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400100
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000101 cur_state = (*byte1 >> bit) & GFS2_BIT_MASK;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400102
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000103 if (unlikely(!valid_change[new_state * 4 + cur_state])) {
Joe Perchesd77d1b52014-03-06 12:10:45 -0800104 pr_warn("buf_blk = 0x%x old_state=%d, new_state=%d\n",
105 rbm->offset, cur_state, new_state);
106 pr_warn("rgrp=0x%llx bi_start=0x%x\n",
107 (unsigned long long)rbm->rgd->rd_addr, bi->bi_start);
108 pr_warn("bi_offset=0x%x bi_len=0x%x\n",
109 bi->bi_offset, bi->bi_len);
Bob Peterson95c8e172011-03-22 10:49:12 -0400110 dump_stack();
Steven Whitehouse3e6339d2012-08-13 11:37:51 +0100111 gfs2_consist_rgrpd(rbm->rgd);
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000112 return;
113 }
114 *byte1 ^= (cur_state ^ new_state) << bit;
115
Bob Petersone579ed42013-09-17 13:12:15 -0400116 if (do_clone && bi->bi_clone) {
117 byte2 = bi->bi_clone + bi->bi_offset + (rbm->offset / GFS2_NBBY);
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000118 cur_state = (*byte2 >> bit) & GFS2_BIT_MASK;
119 *byte2 ^= (cur_state ^ new_state) << bit;
120 }
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400121}
122
123/**
124 * gfs2_testbit - test a bit in the bitmaps
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100125 * @rbm: The bit to test
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400126 *
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100127 * Returns: The two bit block state of the requested bit
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400128 */
129
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100130static inline u8 gfs2_testbit(const struct gfs2_rbm *rbm)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400131{
Bob Petersone579ed42013-09-17 13:12:15 -0400132 struct gfs2_bitmap *bi = rbm_bi(rbm);
133 const u8 *buffer = bi->bi_bh->b_data + bi->bi_offset;
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100134 const u8 *byte;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400135 unsigned int bit;
136
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100137 byte = buffer + (rbm->offset / GFS2_NBBY);
138 bit = (rbm->offset % GFS2_NBBY) * GFS2_BIT_SIZE;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400139
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100140 return (*byte >> bit) & GFS2_BIT_MASK;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400141}
142
143/**
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000144 * gfs2_bit_search
145 * @ptr: Pointer to bitmap data
146 * @mask: Mask to use (normally 0x55555.... but adjusted for search start)
147 * @state: The state we are searching for
148 *
149 * We xor the bitmap data with a patter which is the bitwise opposite
150 * of what we are looking for, this gives rise to a pattern of ones
151 * wherever there is a match. Since we have two bits per entry, we
152 * take this pattern, shift it down by one place and then and it with
153 * the original. All the even bit positions (0,2,4, etc) then represent
154 * successful matches, so we mask with 0x55555..... to remove the unwanted
155 * odd bit positions.
156 *
157 * This allows searching of a whole u64 at once (32 blocks) with a
158 * single test (on 64 bit arches).
159 */
160
161static inline u64 gfs2_bit_search(const __le64 *ptr, u64 mask, u8 state)
162{
163 u64 tmp;
164 static const u64 search[] = {
Hannes Eder075ac442009-02-21 02:11:42 +0100165 [0] = 0xffffffffffffffffULL,
166 [1] = 0xaaaaaaaaaaaaaaaaULL,
167 [2] = 0x5555555555555555ULL,
168 [3] = 0x0000000000000000ULL,
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000169 };
170 tmp = le64_to_cpu(*ptr) ^ search[state];
171 tmp &= (tmp >> 1);
172 tmp &= mask;
173 return tmp;
174}
175
176/**
Bob Peterson8e2e0042012-07-19 08:12:40 -0400177 * rs_cmp - multi-block reservation range compare
178 * @blk: absolute file system block number of the new reservation
179 * @len: number of blocks in the new reservation
180 * @rs: existing reservation to compare against
181 *
182 * returns: 1 if the block range is beyond the reach of the reservation
183 * -1 if the block range is before the start of the reservation
184 * 0 if the block range overlaps with the reservation
185 */
186static inline int rs_cmp(u64 blk, u32 len, struct gfs2_blkreserv *rs)
187{
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100188 u64 startblk = gfs2_rbm_to_block(&rs->rs_rbm);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400189
190 if (blk >= startblk + rs->rs_free)
191 return 1;
192 if (blk + len - 1 < startblk)
193 return -1;
194 return 0;
195}
196
197/**
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400198 * gfs2_bitfit - Search an rgrp's bitmap buffer to find a bit-pair representing
199 * a block in a given allocation state.
Bob Peterson886b1412012-04-11 13:03:52 -0400200 * @buf: the buffer that holds the bitmaps
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000201 * @len: the length (in bytes) of the buffer
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400202 * @goal: start search at this block's bit-pair (within @buffer)
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000203 * @state: GFS2_BLKST_XXX the state of the block we're looking for.
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400204 *
205 * Scope of @goal and returned block number is only within this bitmap buffer,
206 * not entire rgrp or filesystem. @buffer will be offset from the actual
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000207 * beginning of a bitmap block buffer, skipping any header structures, but
208 * headers are always a multiple of 64 bits long so that the buffer is
209 * always aligned to a 64 bit boundary.
210 *
211 * The size of the buffer is in bytes, but is it assumed that it is
Anand Gadiyarfd589a82009-07-16 17:13:03 +0200212 * always ok to read a complete multiple of 64 bits at the end
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000213 * of the block in case the end is no aligned to a natural boundary.
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400214 *
215 * Return: the block number (bitmap buffer scope) that was found
216 */
217
Hannes Eder02ab1722009-02-21 02:12:05 +0100218static u32 gfs2_bitfit(const u8 *buf, const unsigned int len,
219 u32 goal, u8 state)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400220{
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000221 u32 spoint = (goal << 1) & ((8*sizeof(u64)) - 1);
222 const __le64 *ptr = ((__le64 *)buf) + (goal >> 5);
223 const __le64 *end = (__le64 *)(buf + ALIGN(len, sizeof(u64)));
224 u64 tmp;
Hannes Eder075ac442009-02-21 02:11:42 +0100225 u64 mask = 0x5555555555555555ULL;
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000226 u32 bit;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400227
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000228 /* Mask off bits we don't care about at the start of the search */
229 mask <<= spoint;
230 tmp = gfs2_bit_search(ptr, mask, state);
231 ptr++;
232 while(tmp == 0 && ptr < end) {
Hannes Eder075ac442009-02-21 02:11:42 +0100233 tmp = gfs2_bit_search(ptr, 0x5555555555555555ULL, state);
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000234 ptr++;
Bob Peterson1f466a42008-03-10 18:17:47 -0500235 }
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000236 /* Mask off any bits which are more than len bytes from the start */
237 if (ptr == end && (len & (sizeof(u64) - 1)))
238 tmp &= (((u64)~0) >> (64 - 8*(len & (sizeof(u64) - 1))));
239 /* Didn't find anything, so return */
240 if (tmp == 0)
241 return BFITNOENT;
242 ptr--;
Steven Whitehoused8bd5042009-04-23 08:54:02 +0100243 bit = __ffs64(tmp);
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000244 bit /= 2; /* two bits per entry in the bitmap */
245 return (((const unsigned char *)ptr - buf) * GFS2_NBBY) + bit;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400246}
247
248/**
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100249 * gfs2_rbm_from_block - Set the rbm based upon rgd and block number
250 * @rbm: The rbm with rgd already set correctly
251 * @block: The block number (filesystem relative)
252 *
253 * This sets the bi and offset members of an rbm based on a
254 * resource group and a filesystem relative block number. The
255 * resource group must be set in the rbm on entry, the bi and
256 * offset members will be set by this function.
257 *
258 * Returns: 0 on success, or an error code
259 */
260
261static int gfs2_rbm_from_block(struct gfs2_rbm *rbm, u64 block)
262{
263 u64 rblock = block - rbm->rgd->rd_data0;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100264
265 if (WARN_ON_ONCE(rblock > UINT_MAX))
266 return -EINVAL;
267 if (block >= rbm->rgd->rd_data0 + rbm->rgd->rd_data)
268 return -E2BIG;
269
Bob Petersone579ed42013-09-17 13:12:15 -0400270 rbm->bii = 0;
Bob Petersona68a0a32012-10-19 08:32:51 -0400271 rbm->offset = (u32)(rblock);
272 /* Check if the block is within the first block */
Bob Petersone579ed42013-09-17 13:12:15 -0400273 if (rbm->offset < rbm_bi(rbm)->bi_blocks)
Bob Petersona68a0a32012-10-19 08:32:51 -0400274 return 0;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100275
Bob Petersona68a0a32012-10-19 08:32:51 -0400276 /* Adjust for the size diff between gfs2_meta_header and gfs2_rgrp */
277 rbm->offset += (sizeof(struct gfs2_rgrp) -
278 sizeof(struct gfs2_meta_header)) * GFS2_NBBY;
Bob Petersone579ed42013-09-17 13:12:15 -0400279 rbm->bii = rbm->offset / rbm->rgd->rd_sbd->sd_blocks_per_bitmap;
280 rbm->offset -= rbm->bii * rbm->rgd->rd_sbd->sd_blocks_per_bitmap;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100281 return 0;
282}
283
284/**
Bob Peterson149ed7f2013-09-17 13:14:35 -0400285 * gfs2_rbm_incr - increment an rbm structure
286 * @rbm: The rbm with rgd already set correctly
287 *
288 * This function takes an existing rbm structure and increments it to the next
289 * viable block offset.
290 *
291 * Returns: If incrementing the offset would cause the rbm to go past the
292 * end of the rgrp, true is returned, otherwise false.
293 *
294 */
295
296static bool gfs2_rbm_incr(struct gfs2_rbm *rbm)
297{
298 if (rbm->offset + 1 < rbm_bi(rbm)->bi_blocks) { /* in the same bitmap */
299 rbm->offset++;
300 return false;
301 }
302 if (rbm->bii == rbm->rgd->rd_length - 1) /* at the last bitmap */
303 return true;
304
305 rbm->offset = 0;
306 rbm->bii++;
307 return false;
308}
309
310/**
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100311 * gfs2_unaligned_extlen - Look for free blocks which are not byte aligned
312 * @rbm: Position to search (value/result)
313 * @n_unaligned: Number of unaligned blocks to check
314 * @len: Decremented for each block found (terminate on zero)
315 *
316 * Returns: true if a non-free block is encountered
317 */
318
319static bool gfs2_unaligned_extlen(struct gfs2_rbm *rbm, u32 n_unaligned, u32 *len)
320{
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100321 u32 n;
322 u8 res;
323
324 for (n = 0; n < n_unaligned; n++) {
325 res = gfs2_testbit(rbm);
326 if (res != GFS2_BLKST_FREE)
327 return true;
328 (*len)--;
329 if (*len == 0)
330 return true;
Bob Peterson149ed7f2013-09-17 13:14:35 -0400331 if (gfs2_rbm_incr(rbm))
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100332 return true;
333 }
334
335 return false;
336}
337
338/**
339 * gfs2_free_extlen - Return extent length of free blocks
Fabian Frederick27ff6a02014-07-02 22:05:27 +0200340 * @rrbm: Starting position
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100341 * @len: Max length to check
342 *
343 * Starting at the block specified by the rbm, see how many free blocks
344 * there are, not reading more than len blocks ahead. This can be done
345 * using memchr_inv when the blocks are byte aligned, but has to be done
346 * on a block by block basis in case of unaligned blocks. Also this
347 * function can cope with bitmap boundaries (although it must stop on
348 * a resource group boundary)
349 *
350 * Returns: Number of free blocks in the extent
351 */
352
353static u32 gfs2_free_extlen(const struct gfs2_rbm *rrbm, u32 len)
354{
355 struct gfs2_rbm rbm = *rrbm;
356 u32 n_unaligned = rbm.offset & 3;
357 u32 size = len;
358 u32 bytes;
359 u32 chunk_size;
360 u8 *ptr, *start, *end;
361 u64 block;
Bob Petersone579ed42013-09-17 13:12:15 -0400362 struct gfs2_bitmap *bi;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100363
364 if (n_unaligned &&
365 gfs2_unaligned_extlen(&rbm, 4 - n_unaligned, &len))
366 goto out;
367
Bob Peterson37015302012-09-12 09:40:31 -0400368 n_unaligned = len & 3;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100369 /* Start is now byte aligned */
370 while (len > 3) {
Bob Petersone579ed42013-09-17 13:12:15 -0400371 bi = rbm_bi(&rbm);
372 start = bi->bi_bh->b_data;
373 if (bi->bi_clone)
374 start = bi->bi_clone;
375 end = start + bi->bi_bh->b_size;
376 start += bi->bi_offset;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100377 BUG_ON(rbm.offset & 3);
378 start += (rbm.offset / GFS2_NBBY);
379 bytes = min_t(u32, len / GFS2_NBBY, (end - start));
380 ptr = memchr_inv(start, 0, bytes);
381 chunk_size = ((ptr == NULL) ? bytes : (ptr - start));
382 chunk_size *= GFS2_NBBY;
383 BUG_ON(len < chunk_size);
384 len -= chunk_size;
385 block = gfs2_rbm_to_block(&rbm);
Bob Peterson15bd50a2012-12-20 13:21:07 -0500386 if (gfs2_rbm_from_block(&rbm, block + chunk_size)) {
387 n_unaligned = 0;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100388 break;
Bob Peterson15bd50a2012-12-20 13:21:07 -0500389 }
390 if (ptr) {
391 n_unaligned = 3;
392 break;
393 }
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100394 n_unaligned = len & 3;
395 }
396
397 /* Deal with any bits left over at the end */
398 if (n_unaligned)
399 gfs2_unaligned_extlen(&rbm, n_unaligned, &len);
400out:
401 return size - len;
402}
403
404/**
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400405 * gfs2_bitcount - count the number of bits in a certain state
Bob Peterson886b1412012-04-11 13:03:52 -0400406 * @rgd: the resource group descriptor
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400407 * @buffer: the buffer that holds the bitmaps
408 * @buflen: the length (in bytes) of the buffer
409 * @state: the state of the block we're looking for
410 *
411 * Returns: The number of bits
412 */
413
Steven Whitehouse110acf32008-01-29 13:30:20 +0000414static u32 gfs2_bitcount(struct gfs2_rgrpd *rgd, const u8 *buffer,
415 unsigned int buflen, u8 state)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400416{
Steven Whitehouse110acf32008-01-29 13:30:20 +0000417 const u8 *byte = buffer;
418 const u8 *end = buffer + buflen;
419 const u8 state1 = state << 2;
420 const u8 state2 = state << 4;
421 const u8 state3 = state << 6;
Steven Whitehousecd915492006-09-04 12:49:07 -0400422 u32 count = 0;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400423
424 for (; byte < end; byte++) {
425 if (((*byte) & 0x03) == state)
426 count++;
427 if (((*byte) & 0x0C) == state1)
428 count++;
429 if (((*byte) & 0x30) == state2)
430 count++;
431 if (((*byte) & 0xC0) == state3)
432 count++;
433 }
434
435 return count;
436}
437
David Teiglandb3b94fa2006-01-16 16:50:04 +0000438/**
439 * gfs2_rgrp_verify - Verify that a resource group is consistent
David Teiglandb3b94fa2006-01-16 16:50:04 +0000440 * @rgd: the rgrp
441 *
442 */
443
444void gfs2_rgrp_verify(struct gfs2_rgrpd *rgd)
445{
446 struct gfs2_sbd *sdp = rgd->rd_sbd;
447 struct gfs2_bitmap *bi = NULL;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100448 u32 length = rgd->rd_length;
Steven Whitehousecd915492006-09-04 12:49:07 -0400449 u32 count[4], tmp;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000450 int buf, x;
451
Steven Whitehousecd915492006-09-04 12:49:07 -0400452 memset(count, 0, 4 * sizeof(u32));
David Teiglandb3b94fa2006-01-16 16:50:04 +0000453
454 /* Count # blocks in each of 4 possible allocation states */
455 for (buf = 0; buf < length; buf++) {
456 bi = rgd->rd_bits + buf;
457 for (x = 0; x < 4; x++)
458 count[x] += gfs2_bitcount(rgd,
459 bi->bi_bh->b_data +
460 bi->bi_offset,
461 bi->bi_len, x);
462 }
463
Steven Whitehousecfc8b542008-11-04 10:25:13 +0000464 if (count[0] != rgd->rd_free) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000465 if (gfs2_consist_rgrpd(rgd))
466 fs_err(sdp, "free data mismatch: %u != %u\n",
Steven Whitehousecfc8b542008-11-04 10:25:13 +0000467 count[0], rgd->rd_free);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000468 return;
469 }
470
Steven Whitehouse73f74942008-11-04 10:32:57 +0000471 tmp = rgd->rd_data - rgd->rd_free - rgd->rd_dinodes;
Benjamin Marzinski6b946172009-07-10 18:13:26 -0500472 if (count[1] != tmp) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000473 if (gfs2_consist_rgrpd(rgd))
474 fs_err(sdp, "used data mismatch: %u != %u\n",
475 count[1], tmp);
476 return;
477 }
478
Benjamin Marzinski6b946172009-07-10 18:13:26 -0500479 if (count[2] + count[3] != rgd->rd_dinodes) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000480 if (gfs2_consist_rgrpd(rgd))
481 fs_err(sdp, "used metadata mismatch: %u != %u\n",
Benjamin Marzinski6b946172009-07-10 18:13:26 -0500482 count[2] + count[3], rgd->rd_dinodes);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000483 return;
484 }
485}
486
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100487static inline int rgrp_contains_block(struct gfs2_rgrpd *rgd, u64 block)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000488{
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100489 u64 first = rgd->rd_data0;
490 u64 last = first + rgd->rd_data;
Steven Whitehouse16910422006-09-05 11:15:45 -0400491 return first <= block && block < last;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000492}
493
494/**
495 * gfs2_blk2rgrpd - Find resource group for a given data/meta block number
496 * @sdp: The GFS2 superblock
Bob Peterson886b1412012-04-11 13:03:52 -0400497 * @blk: The data block number
498 * @exact: True if this needs to be an exact match
David Teiglandb3b94fa2006-01-16 16:50:04 +0000499 *
500 * Returns: The resource group, or NULL if not found
501 */
502
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000503struct gfs2_rgrpd *gfs2_blk2rgrpd(struct gfs2_sbd *sdp, u64 blk, bool exact)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000504{
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000505 struct rb_node *n, *next;
Steven Whitehousef75bbfb2011-09-08 10:21:13 +0100506 struct gfs2_rgrpd *cur;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000507
508 spin_lock(&sdp->sd_rindex_spin);
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000509 n = sdp->sd_rindex_tree.rb_node;
510 while (n) {
511 cur = rb_entry(n, struct gfs2_rgrpd, rd_node);
512 next = NULL;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100513 if (blk < cur->rd_addr)
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000514 next = n->rb_left;
Steven Whitehousef75bbfb2011-09-08 10:21:13 +0100515 else if (blk >= cur->rd_data0 + cur->rd_data)
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000516 next = n->rb_right;
517 if (next == NULL) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000518 spin_unlock(&sdp->sd_rindex_spin);
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000519 if (exact) {
520 if (blk < cur->rd_addr)
521 return NULL;
522 if (blk >= cur->rd_data0 + cur->rd_data)
523 return NULL;
524 }
Bob Peterson7c9ca622011-08-31 09:53:19 +0100525 return cur;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000526 }
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000527 n = next;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000528 }
David Teiglandb3b94fa2006-01-16 16:50:04 +0000529 spin_unlock(&sdp->sd_rindex_spin);
530
531 return NULL;
532}
533
534/**
535 * gfs2_rgrpd_get_first - get the first Resource Group in the filesystem
536 * @sdp: The GFS2 superblock
537 *
538 * Returns: The first rgrp in the filesystem
539 */
540
541struct gfs2_rgrpd *gfs2_rgrpd_get_first(struct gfs2_sbd *sdp)
542{
Bob Peterson7c9ca622011-08-31 09:53:19 +0100543 const struct rb_node *n;
544 struct gfs2_rgrpd *rgd;
545
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100546 spin_lock(&sdp->sd_rindex_spin);
Bob Peterson7c9ca622011-08-31 09:53:19 +0100547 n = rb_first(&sdp->sd_rindex_tree);
548 rgd = rb_entry(n, struct gfs2_rgrpd, rd_node);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100549 spin_unlock(&sdp->sd_rindex_spin);
Bob Peterson7c9ca622011-08-31 09:53:19 +0100550
551 return rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000552}
553
554/**
555 * gfs2_rgrpd_get_next - get the next RG
Bob Peterson886b1412012-04-11 13:03:52 -0400556 * @rgd: the resource group descriptor
David Teiglandb3b94fa2006-01-16 16:50:04 +0000557 *
558 * Returns: The next rgrp
559 */
560
561struct gfs2_rgrpd *gfs2_rgrpd_get_next(struct gfs2_rgrpd *rgd)
562{
Bob Peterson7c9ca622011-08-31 09:53:19 +0100563 struct gfs2_sbd *sdp = rgd->rd_sbd;
564 const struct rb_node *n;
565
566 spin_lock(&sdp->sd_rindex_spin);
567 n = rb_next(&rgd->rd_node);
568 if (n == NULL)
569 n = rb_first(&sdp->sd_rindex_tree);
570
571 if (unlikely(&rgd->rd_node == n)) {
572 spin_unlock(&sdp->sd_rindex_spin);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000573 return NULL;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100574 }
575 rgd = rb_entry(n, struct gfs2_rgrpd, rd_node);
576 spin_unlock(&sdp->sd_rindex_spin);
577 return rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000578}
579
Abhi Das00a158b2014-09-18 21:40:28 -0500580void check_and_update_goal(struct gfs2_inode *ip)
581{
582 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
583 if (!ip->i_goal || gfs2_blk2rgrpd(sdp, ip->i_goal, 1) == NULL)
584 ip->i_goal = ip->i_no_addr;
585}
586
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100587void gfs2_free_clones(struct gfs2_rgrpd *rgd)
588{
589 int x;
590
591 for (x = 0; x < rgd->rd_length; x++) {
592 struct gfs2_bitmap *bi = rgd->rd_bits + x;
593 kfree(bi->bi_clone);
594 bi->bi_clone = NULL;
595 }
596}
597
Bob Peterson0a305e42012-06-06 11:17:59 +0100598/**
599 * gfs2_rs_alloc - make sure we have a reservation assigned to the inode
600 * @ip: the inode for this reservation
601 */
602int gfs2_rs_alloc(struct gfs2_inode *ip)
603{
Abhijith Dasf1213ca2012-12-19 10:48:01 -0500604 int error = 0;
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100605
Bob Peterson0a305e42012-06-06 11:17:59 +0100606 down_write(&ip->i_rw_mutex);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400607 if (ip->i_res)
Abhijith Dasf1213ca2012-12-19 10:48:01 -0500608 goto out;
609
610 ip->i_res = kmem_cache_zalloc(gfs2_rsrv_cachep, GFP_NOFS);
611 if (!ip->i_res) {
612 error = -ENOMEM;
613 goto out;
614 }
615
616 RB_CLEAR_NODE(&ip->i_res->rs_node);
617out:
Bob Peterson0a305e42012-06-06 11:17:59 +0100618 up_write(&ip->i_rw_mutex);
Wei Yongjun441362d2013-03-11 23:01:37 +0800619 return error;
Bob Peterson0a305e42012-06-06 11:17:59 +0100620}
621
Steven Whitehouse9e733d32012-08-23 15:37:59 +0100622static void dump_rs(struct seq_file *seq, const struct gfs2_blkreserv *rs)
Bob Peterson8e2e0042012-07-19 08:12:40 -0400623{
Steven Whitehouse9e733d32012-08-23 15:37:59 +0100624 gfs2_print_dbg(seq, " B: n:%llu s:%llu b:%u f:%u\n",
625 (unsigned long long)rs->rs_inum,
626 (unsigned long long)gfs2_rbm_to_block(&rs->rs_rbm),
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100627 rs->rs_rbm.offset, rs->rs_free);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400628}
629
Bob Peterson0a305e42012-06-06 11:17:59 +0100630/**
Bob Peterson8e2e0042012-07-19 08:12:40 -0400631 * __rs_deltree - remove a multi-block reservation from the rgd tree
632 * @rs: The reservation to remove
633 *
634 */
Bob Peterson20095212013-03-13 10:26:38 -0400635static void __rs_deltree(struct gfs2_blkreserv *rs)
Bob Peterson8e2e0042012-07-19 08:12:40 -0400636{
637 struct gfs2_rgrpd *rgd;
638
639 if (!gfs2_rs_active(rs))
640 return;
641
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100642 rgd = rs->rs_rbm.rgd;
Steven Whitehouse9e733d32012-08-23 15:37:59 +0100643 trace_gfs2_rs(rs, TRACE_RS_TREEDEL);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100644 rb_erase(&rs->rs_node, &rgd->rd_rstree);
Michel Lespinasse24d634e2012-08-05 22:04:08 -0700645 RB_CLEAR_NODE(&rs->rs_node);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400646
647 if (rs->rs_free) {
Bob Petersone579ed42013-09-17 13:12:15 -0400648 struct gfs2_bitmap *bi = rbm_bi(&rs->rs_rbm);
649
Bob Peterson20095212013-03-13 10:26:38 -0400650 /* return reserved blocks to the rgrp */
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100651 BUG_ON(rs->rs_rbm.rgd->rd_reserved < rs->rs_free);
652 rs->rs_rbm.rgd->rd_reserved -= rs->rs_free;
Bob Peterson5ea50502013-11-25 11:16:25 +0000653 /* The rgrp extent failure point is likely not to increase;
654 it will only do so if the freed blocks are somehow
655 contiguous with a span of free blocks that follows. Still,
656 it will force the number to be recalculated later. */
657 rgd->rd_extfail_pt += rs->rs_free;
Bob Peterson8e2e0042012-07-19 08:12:40 -0400658 rs->rs_free = 0;
Bob Petersone579ed42013-09-17 13:12:15 -0400659 clear_bit(GBF_FULL, &bi->bi_flags);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400660 }
Bob Peterson8e2e0042012-07-19 08:12:40 -0400661}
662
663/**
664 * gfs2_rs_deltree - remove a multi-block reservation from the rgd tree
665 * @rs: The reservation to remove
666 *
667 */
Bob Peterson20095212013-03-13 10:26:38 -0400668void gfs2_rs_deltree(struct gfs2_blkreserv *rs)
Bob Peterson8e2e0042012-07-19 08:12:40 -0400669{
670 struct gfs2_rgrpd *rgd;
671
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100672 rgd = rs->rs_rbm.rgd;
673 if (rgd) {
674 spin_lock(&rgd->rd_rsspin);
Bob Peterson20095212013-03-13 10:26:38 -0400675 __rs_deltree(rs);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100676 spin_unlock(&rgd->rd_rsspin);
677 }
Bob Peterson8e2e0042012-07-19 08:12:40 -0400678}
679
680/**
681 * gfs2_rs_delete - delete a multi-block reservation
Bob Peterson0a305e42012-06-06 11:17:59 +0100682 * @ip: The inode for this reservation
Steven Whitehouseaf5c2692013-09-27 12:49:33 +0100683 * @wcount: The inode's write count, or NULL
Bob Peterson0a305e42012-06-06 11:17:59 +0100684 *
685 */
Steven Whitehouseaf5c2692013-09-27 12:49:33 +0100686void gfs2_rs_delete(struct gfs2_inode *ip, atomic_t *wcount)
Bob Peterson0a305e42012-06-06 11:17:59 +0100687{
688 down_write(&ip->i_rw_mutex);
Steven Whitehouseaf5c2692013-09-27 12:49:33 +0100689 if (ip->i_res && ((wcount == NULL) || (atomic_read(wcount) <= 1))) {
Bob Peterson20095212013-03-13 10:26:38 -0400690 gfs2_rs_deltree(ip->i_res);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400691 BUG_ON(ip->i_res->rs_free);
Bob Peterson0a305e42012-06-06 11:17:59 +0100692 kmem_cache_free(gfs2_rsrv_cachep, ip->i_res);
693 ip->i_res = NULL;
694 }
695 up_write(&ip->i_rw_mutex);
696}
697
Bob Peterson8e2e0042012-07-19 08:12:40 -0400698/**
699 * return_all_reservations - return all reserved blocks back to the rgrp.
700 * @rgd: the rgrp that needs its space back
701 *
702 * We previously reserved a bunch of blocks for allocation. Now we need to
703 * give them back. This leave the reservation structures in tact, but removes
704 * all of their corresponding "no-fly zones".
705 */
706static void return_all_reservations(struct gfs2_rgrpd *rgd)
707{
708 struct rb_node *n;
709 struct gfs2_blkreserv *rs;
710
711 spin_lock(&rgd->rd_rsspin);
712 while ((n = rb_first(&rgd->rd_rstree))) {
713 rs = rb_entry(n, struct gfs2_blkreserv, rs_node);
Bob Peterson20095212013-03-13 10:26:38 -0400714 __rs_deltree(rs);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400715 }
716 spin_unlock(&rgd->rd_rsspin);
717}
718
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100719void gfs2_clear_rgrpd(struct gfs2_sbd *sdp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000720{
Bob Peterson7c9ca622011-08-31 09:53:19 +0100721 struct rb_node *n;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000722 struct gfs2_rgrpd *rgd;
723 struct gfs2_glock *gl;
724
Bob Peterson7c9ca622011-08-31 09:53:19 +0100725 while ((n = rb_first(&sdp->sd_rindex_tree))) {
726 rgd = rb_entry(n, struct gfs2_rgrpd, rd_node);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000727 gl = rgd->rd_gl;
728
Bob Peterson7c9ca622011-08-31 09:53:19 +0100729 rb_erase(n, &sdp->sd_rindex_tree);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000730
731 if (gl) {
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100732 spin_lock(&gl->gl_spin);
Steven Whitehouse5c676f62006-02-27 17:23:27 -0500733 gl->gl_object = NULL;
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100734 spin_unlock(&gl->gl_spin);
Steven Whitehouse29687a22011-03-30 16:33:25 +0100735 gfs2_glock_add_to_lru(gl);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000736 gfs2_glock_put(gl);
737 }
738
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100739 gfs2_free_clones(rgd);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000740 kfree(rgd->rd_bits);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400741 return_all_reservations(rgd);
Bob Peterson6bdd9be2008-01-28 17:20:26 -0600742 kmem_cache_free(gfs2_rgrpd_cachep, rgd);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000743 }
744}
745
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100746static void gfs2_rindex_print(const struct gfs2_rgrpd *rgd)
747{
Joe Perchesd77d1b52014-03-06 12:10:45 -0800748 pr_info("ri_addr = %llu\n", (unsigned long long)rgd->rd_addr);
749 pr_info("ri_length = %u\n", rgd->rd_length);
750 pr_info("ri_data0 = %llu\n", (unsigned long long)rgd->rd_data0);
751 pr_info("ri_data = %u\n", rgd->rd_data);
752 pr_info("ri_bitbytes = %u\n", rgd->rd_bitbytes);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100753}
754
David Teiglandb3b94fa2006-01-16 16:50:04 +0000755/**
756 * gfs2_compute_bitstructs - Compute the bitmap sizes
757 * @rgd: The resource group descriptor
758 *
759 * Calculates bitmap descriptors, one for each block that contains bitmap data
760 *
761 * Returns: errno
762 */
763
764static int compute_bitstructs(struct gfs2_rgrpd *rgd)
765{
766 struct gfs2_sbd *sdp = rgd->rd_sbd;
767 struct gfs2_bitmap *bi;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100768 u32 length = rgd->rd_length; /* # blocks in hdr & bitmap */
Steven Whitehousecd915492006-09-04 12:49:07 -0400769 u32 bytes_left, bytes;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000770 int x;
771
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -0400772 if (!length)
773 return -EINVAL;
774
Steven Whitehousedd894be2006-07-27 14:29:00 -0400775 rgd->rd_bits = kcalloc(length, sizeof(struct gfs2_bitmap), GFP_NOFS);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000776 if (!rgd->rd_bits)
777 return -ENOMEM;
778
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100779 bytes_left = rgd->rd_bitbytes;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000780
781 for (x = 0; x < length; x++) {
782 bi = rgd->rd_bits + x;
783
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +0100784 bi->bi_flags = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000785 /* small rgrp; bitmap stored completely in header block */
786 if (length == 1) {
787 bytes = bytes_left;
788 bi->bi_offset = sizeof(struct gfs2_rgrp);
789 bi->bi_start = 0;
790 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500791 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000792 /* header block */
793 } else if (x == 0) {
794 bytes = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_rgrp);
795 bi->bi_offset = sizeof(struct gfs2_rgrp);
796 bi->bi_start = 0;
797 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500798 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000799 /* last block */
800 } else if (x + 1 == length) {
801 bytes = bytes_left;
802 bi->bi_offset = sizeof(struct gfs2_meta_header);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100803 bi->bi_start = rgd->rd_bitbytes - bytes_left;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000804 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500805 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000806 /* other blocks */
807 } else {
Steven Whitehouse568f4c92006-02-27 12:00:42 -0500808 bytes = sdp->sd_sb.sb_bsize -
809 sizeof(struct gfs2_meta_header);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000810 bi->bi_offset = sizeof(struct gfs2_meta_header);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100811 bi->bi_start = rgd->rd_bitbytes - bytes_left;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000812 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500813 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000814 }
815
816 bytes_left -= bytes;
817 }
818
819 if (bytes_left) {
820 gfs2_consist_rgrpd(rgd);
821 return -EIO;
822 }
823 bi = rgd->rd_bits + (length - 1);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100824 if ((bi->bi_start + bi->bi_len) * GFS2_NBBY != rgd->rd_data) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000825 if (gfs2_consist_rgrpd(rgd)) {
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100826 gfs2_rindex_print(rgd);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000827 fs_err(sdp, "start=%u len=%u offset=%u\n",
828 bi->bi_start, bi->bi_len, bi->bi_offset);
829 }
830 return -EIO;
831 }
832
833 return 0;
834}
835
836/**
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500837 * gfs2_ri_total - Total up the file system space, according to the rindex.
Bob Peterson886b1412012-04-11 13:03:52 -0400838 * @sdp: the filesystem
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500839 *
840 */
841u64 gfs2_ri_total(struct gfs2_sbd *sdp)
842{
843 u64 total_data = 0;
844 struct inode *inode = sdp->sd_rindex;
845 struct gfs2_inode *ip = GFS2_I(inode);
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500846 char buf[sizeof(struct gfs2_rindex)];
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500847 int error, rgrps;
848
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500849 for (rgrps = 0;; rgrps++) {
850 loff_t pos = rgrps * sizeof(struct gfs2_rindex);
851
Bob Petersonbcd72782010-12-07 13:58:56 -0500852 if (pos + sizeof(struct gfs2_rindex) > i_size_read(inode))
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500853 break;
Andrew Price43066292012-04-16 16:40:55 +0100854 error = gfs2_internal_read(ip, buf, &pos,
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500855 sizeof(struct gfs2_rindex));
856 if (error != sizeof(struct gfs2_rindex))
857 break;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100858 total_data += be32_to_cpu(((struct gfs2_rindex *)buf)->ri_data);
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500859 }
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500860 return total_data;
861}
862
Bob Peterson6aad1c32012-03-05 09:20:59 -0500863static int rgd_insert(struct gfs2_rgrpd *rgd)
Bob Peterson7c9ca622011-08-31 09:53:19 +0100864{
865 struct gfs2_sbd *sdp = rgd->rd_sbd;
866 struct rb_node **newn = &sdp->sd_rindex_tree.rb_node, *parent = NULL;
867
868 /* Figure out where to put new node */
869 while (*newn) {
870 struct gfs2_rgrpd *cur = rb_entry(*newn, struct gfs2_rgrpd,
871 rd_node);
872
873 parent = *newn;
874 if (rgd->rd_addr < cur->rd_addr)
875 newn = &((*newn)->rb_left);
876 else if (rgd->rd_addr > cur->rd_addr)
877 newn = &((*newn)->rb_right);
878 else
Bob Peterson6aad1c32012-03-05 09:20:59 -0500879 return -EEXIST;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100880 }
881
882 rb_link_node(&rgd->rd_node, parent, newn);
883 rb_insert_color(&rgd->rd_node, &sdp->sd_rindex_tree);
Bob Peterson6aad1c32012-03-05 09:20:59 -0500884 sdp->sd_rgrps++;
885 return 0;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100886}
887
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500888/**
Robert Peterson6c532672007-05-10 16:54:38 -0500889 * read_rindex_entry - Pull in a new resource index entry from the disk
Andrew Price43066292012-04-16 16:40:55 +0100890 * @ip: Pointer to the rindex inode
David Teiglandb3b94fa2006-01-16 16:50:04 +0000891 *
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100892 * Returns: 0 on success, > 0 on EOF, error code otherwise
Robert Peterson6c532672007-05-10 16:54:38 -0500893 */
894
Andrew Price43066292012-04-16 16:40:55 +0100895static int read_rindex_entry(struct gfs2_inode *ip)
Robert Peterson6c532672007-05-10 16:54:38 -0500896{
897 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Steven Whitehouse7005c3e2013-12-06 10:16:14 +0000898 const unsigned bsize = sdp->sd_sb.sb_bsize;
Robert Peterson6c532672007-05-10 16:54:38 -0500899 loff_t pos = sdp->sd_rgrps * sizeof(struct gfs2_rindex);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100900 struct gfs2_rindex buf;
Robert Peterson6c532672007-05-10 16:54:38 -0500901 int error;
902 struct gfs2_rgrpd *rgd;
903
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100904 if (pos >= i_size_read(&ip->i_inode))
905 return 1;
906
Andrew Price43066292012-04-16 16:40:55 +0100907 error = gfs2_internal_read(ip, (char *)&buf, &pos,
Robert Peterson6c532672007-05-10 16:54:38 -0500908 sizeof(struct gfs2_rindex));
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100909
910 if (error != sizeof(struct gfs2_rindex))
911 return (error == 0) ? 1 : error;
Robert Peterson6c532672007-05-10 16:54:38 -0500912
Bob Peterson6bdd9be2008-01-28 17:20:26 -0600913 rgd = kmem_cache_zalloc(gfs2_rgrpd_cachep, GFP_NOFS);
Robert Peterson6c532672007-05-10 16:54:38 -0500914 error = -ENOMEM;
915 if (!rgd)
916 return error;
917
Robert Peterson6c532672007-05-10 16:54:38 -0500918 rgd->rd_sbd = sdp;
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100919 rgd->rd_addr = be64_to_cpu(buf.ri_addr);
920 rgd->rd_length = be32_to_cpu(buf.ri_length);
921 rgd->rd_data0 = be64_to_cpu(buf.ri_data0);
922 rgd->rd_data = be32_to_cpu(buf.ri_data);
923 rgd->rd_bitbytes = be32_to_cpu(buf.ri_bitbytes);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400924 spin_lock_init(&rgd->rd_rsspin);
Bob Peterson7c9ca622011-08-31 09:53:19 +0100925
Robert Peterson6c532672007-05-10 16:54:38 -0500926 error = compute_bitstructs(rgd);
927 if (error)
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100928 goto fail;
Robert Peterson6c532672007-05-10 16:54:38 -0500929
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100930 error = gfs2_glock_get(sdp, rgd->rd_addr,
Robert Peterson6c532672007-05-10 16:54:38 -0500931 &gfs2_rgrp_glops, CREATE, &rgd->rd_gl);
932 if (error)
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100933 goto fail;
Robert Peterson6c532672007-05-10 16:54:38 -0500934
935 rgd->rd_gl->gl_object = rgd;
Steven Whitehouse7005c3e2013-12-06 10:16:14 +0000936 rgd->rd_gl->gl_vm.start = rgd->rd_addr * bsize;
937 rgd->rd_gl->gl_vm.end = rgd->rd_gl->gl_vm.start + (rgd->rd_length * bsize) - 1;
David Teigland4e2f8842012-11-14 13:47:37 -0500938 rgd->rd_rgl = (struct gfs2_rgrp_lvb *)rgd->rd_gl->gl_lksb.sb_lvbptr;
Bob Peterson0e27c182014-10-29 08:02:28 -0500939 rgd->rd_flags &= ~(GFS2_RDF_UPTODATE | GFS2_RDF_PREFERRED);
Bob Peterson7c9ca622011-08-31 09:53:19 +0100940 if (rgd->rd_data > sdp->sd_max_rg_data)
941 sdp->sd_max_rg_data = rgd->rd_data;
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100942 spin_lock(&sdp->sd_rindex_spin);
Bob Peterson6aad1c32012-03-05 09:20:59 -0500943 error = rgd_insert(rgd);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100944 spin_unlock(&sdp->sd_rindex_spin);
Bob Peterson6aad1c32012-03-05 09:20:59 -0500945 if (!error)
946 return 0;
947
948 error = 0; /* someone else read in the rgrp; free it and ignore it */
Bob Petersonc1ac5392012-03-22 08:58:30 -0400949 gfs2_glock_put(rgd->rd_gl);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100950
951fail:
952 kfree(rgd->rd_bits);
953 kmem_cache_free(gfs2_rgrpd_cachep, rgd);
Robert Peterson6c532672007-05-10 16:54:38 -0500954 return error;
955}
956
957/**
Bob Peterson0e27c182014-10-29 08:02:28 -0500958 * set_rgrp_preferences - Run all the rgrps, selecting some we prefer to use
959 * @sdp: the GFS2 superblock
960 *
961 * The purpose of this function is to select a subset of the resource groups
962 * and mark them as PREFERRED. We do it in such a way that each node prefers
963 * to use a unique set of rgrps to minimize glock contention.
964 */
965static void set_rgrp_preferences(struct gfs2_sbd *sdp)
966{
967 struct gfs2_rgrpd *rgd, *first;
968 int i;
969
970 /* Skip an initial number of rgrps, based on this node's journal ID.
971 That should start each node out on its own set. */
972 rgd = gfs2_rgrpd_get_first(sdp);
973 for (i = 0; i < sdp->sd_lockstruct.ls_jid; i++)
974 rgd = gfs2_rgrpd_get_next(rgd);
975 first = rgd;
976
977 do {
978 rgd->rd_flags |= GFS2_RDF_PREFERRED;
979 for (i = 0; i < sdp->sd_journals; i++) {
980 rgd = gfs2_rgrpd_get_next(rgd);
981 if (rgd == first)
982 break;
983 }
984 } while (rgd != first);
985}
986
987/**
Robert Peterson6c532672007-05-10 16:54:38 -0500988 * gfs2_ri_update - Pull in a new resource index from the disk
989 * @ip: pointer to the rindex inode
990 *
David Teiglandb3b94fa2006-01-16 16:50:04 +0000991 * Returns: 0 on successful update, error code otherwise
992 */
993
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100994static int gfs2_ri_update(struct gfs2_inode *ip)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000995{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -0400996 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000997 int error;
998
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100999 do {
Andrew Price43066292012-04-16 16:40:55 +01001000 error = read_rindex_entry(ip);
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001001 } while (error == 0);
1002
1003 if (error < 0)
1004 return error;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001005
Bob Peterson0e27c182014-10-29 08:02:28 -05001006 set_rgrp_preferences(sdp);
1007
Bob Petersoncf45b752008-01-31 10:31:39 -06001008 sdp->sd_rindex_uptodate = 1;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001009 return 0;
Robert Peterson6c532672007-05-10 16:54:38 -05001010}
David Teiglandb3b94fa2006-01-16 16:50:04 +00001011
Robert Peterson6c532672007-05-10 16:54:38 -05001012/**
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001013 * gfs2_rindex_update - Update the rindex if required
David Teiglandb3b94fa2006-01-16 16:50:04 +00001014 * @sdp: The GFS2 superblock
David Teiglandb3b94fa2006-01-16 16:50:04 +00001015 *
1016 * We grab a lock on the rindex inode to make sure that it doesn't
1017 * change whilst we are performing an operation. We keep this lock
1018 * for quite long periods of time compared to other locks. This
1019 * doesn't matter, since it is shared and it is very, very rarely
1020 * accessed in the exclusive mode (i.e. only when expanding the filesystem).
1021 *
1022 * This makes sure that we're using the latest copy of the resource index
1023 * special file, which might have been updated if someone expanded the
1024 * filesystem (via gfs2_grow utility), which adds new resource groups.
1025 *
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001026 * Returns: 0 on succeess, error code otherwise
David Teiglandb3b94fa2006-01-16 16:50:04 +00001027 */
1028
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001029int gfs2_rindex_update(struct gfs2_sbd *sdp)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001030{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001031 struct gfs2_inode *ip = GFS2_I(sdp->sd_rindex);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001032 struct gfs2_glock *gl = ip->i_gl;
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001033 struct gfs2_holder ri_gh;
1034 int error = 0;
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001035 int unlock_required = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001036
1037 /* Read new copy from disk if we don't have the latest */
Bob Petersoncf45b752008-01-31 10:31:39 -06001038 if (!sdp->sd_rindex_uptodate) {
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001039 if (!gfs2_glock_is_locked_by_me(gl)) {
1040 error = gfs2_glock_nq_init(gl, LM_ST_SHARED, 0, &ri_gh);
1041 if (error)
Bob Peterson6aad1c32012-03-05 09:20:59 -05001042 return error;
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001043 unlock_required = 1;
1044 }
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001045 if (!sdp->sd_rindex_uptodate)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001046 error = gfs2_ri_update(ip);
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001047 if (unlock_required)
1048 gfs2_glock_dq_uninit(&ri_gh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001049 }
1050
1051 return error;
1052}
1053
Bob Peterson42d52e32008-01-28 18:38:07 -06001054static void gfs2_rgrp_in(struct gfs2_rgrpd *rgd, const void *buf)
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001055{
1056 const struct gfs2_rgrp *str = buf;
Bob Peterson42d52e32008-01-28 18:38:07 -06001057 u32 rg_flags;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001058
Bob Peterson42d52e32008-01-28 18:38:07 -06001059 rg_flags = be32_to_cpu(str->rg_flags);
Steven Whitehouse09010972009-05-20 10:48:47 +01001060 rg_flags &= ~GFS2_RDF_MASK;
Steven Whitehouse1ce97e52009-05-21 15:18:19 +01001061 rgd->rd_flags &= GFS2_RDF_MASK;
1062 rgd->rd_flags |= rg_flags;
Steven Whitehousecfc8b542008-11-04 10:25:13 +00001063 rgd->rd_free = be32_to_cpu(str->rg_free);
Steven Whitehouse73f74942008-11-04 10:32:57 +00001064 rgd->rd_dinodes = be32_to_cpu(str->rg_dinodes);
Steven Whitehoused8b71f72008-11-04 10:19:03 +00001065 rgd->rd_igeneration = be64_to_cpu(str->rg_igeneration);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001066}
1067
Bob Peterson42d52e32008-01-28 18:38:07 -06001068static void gfs2_rgrp_out(struct gfs2_rgrpd *rgd, void *buf)
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001069{
1070 struct gfs2_rgrp *str = buf;
1071
Steven Whitehouse09010972009-05-20 10:48:47 +01001072 str->rg_flags = cpu_to_be32(rgd->rd_flags & ~GFS2_RDF_MASK);
Steven Whitehousecfc8b542008-11-04 10:25:13 +00001073 str->rg_free = cpu_to_be32(rgd->rd_free);
Steven Whitehouse73f74942008-11-04 10:32:57 +00001074 str->rg_dinodes = cpu_to_be32(rgd->rd_dinodes);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001075 str->__pad = cpu_to_be32(0);
Steven Whitehoused8b71f72008-11-04 10:19:03 +00001076 str->rg_igeneration = cpu_to_be64(rgd->rd_igeneration);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001077 memset(&str->rg_reserved, 0, sizeof(str->rg_reserved));
1078}
1079
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001080static int gfs2_rgrp_lvb_valid(struct gfs2_rgrpd *rgd)
1081{
1082 struct gfs2_rgrp_lvb *rgl = rgd->rd_rgl;
1083 struct gfs2_rgrp *str = (struct gfs2_rgrp *)rgd->rd_bits[0].bi_bh->b_data;
1084
1085 if (rgl->rl_flags != str->rg_flags || rgl->rl_free != str->rg_free ||
1086 rgl->rl_dinodes != str->rg_dinodes ||
1087 rgl->rl_igeneration != str->rg_igeneration)
1088 return 0;
1089 return 1;
1090}
1091
1092static void gfs2_rgrp_ondisk2lvb(struct gfs2_rgrp_lvb *rgl, const void *buf)
1093{
1094 const struct gfs2_rgrp *str = buf;
1095
1096 rgl->rl_magic = cpu_to_be32(GFS2_MAGIC);
1097 rgl->rl_flags = str->rg_flags;
1098 rgl->rl_free = str->rg_free;
1099 rgl->rl_dinodes = str->rg_dinodes;
1100 rgl->rl_igeneration = str->rg_igeneration;
1101 rgl->__pad = 0UL;
1102}
1103
1104static void update_rgrp_lvb_unlinked(struct gfs2_rgrpd *rgd, u32 change)
1105{
1106 struct gfs2_rgrp_lvb *rgl = rgd->rd_rgl;
1107 u32 unlinked = be32_to_cpu(rgl->rl_unlinked) + change;
1108 rgl->rl_unlinked = cpu_to_be32(unlinked);
1109}
1110
1111static u32 count_unlinked(struct gfs2_rgrpd *rgd)
1112{
1113 struct gfs2_bitmap *bi;
1114 const u32 length = rgd->rd_length;
1115 const u8 *buffer = NULL;
1116 u32 i, goal, count = 0;
1117
1118 for (i = 0, bi = rgd->rd_bits; i < length; i++, bi++) {
1119 goal = 0;
1120 buffer = bi->bi_bh->b_data + bi->bi_offset;
1121 WARN_ON(!buffer_uptodate(bi->bi_bh));
1122 while (goal < bi->bi_len * GFS2_NBBY) {
1123 goal = gfs2_bitfit(buffer, bi->bi_len, goal,
1124 GFS2_BLKST_UNLINKED);
1125 if (goal == BFITNOENT)
1126 break;
1127 count++;
1128 goal++;
1129 }
1130 }
1131
1132 return count;
1133}
1134
1135
David Teiglandb3b94fa2006-01-16 16:50:04 +00001136/**
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001137 * gfs2_rgrp_bh_get - Read in a RG's header and bitmaps
1138 * @rgd: the struct gfs2_rgrpd describing the RG to read in
David Teiglandb3b94fa2006-01-16 16:50:04 +00001139 *
1140 * Read in all of a Resource Group's header and bitmap blocks.
1141 * Caller must eventually call gfs2_rgrp_relse() to free the bitmaps.
1142 *
1143 * Returns: errno
1144 */
1145
Rashika Kheriac2b0b302014-02-09 18:40:19 +05301146static int gfs2_rgrp_bh_get(struct gfs2_rgrpd *rgd)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001147{
1148 struct gfs2_sbd *sdp = rgd->rd_sbd;
1149 struct gfs2_glock *gl = rgd->rd_gl;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001150 unsigned int length = rgd->rd_length;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001151 struct gfs2_bitmap *bi;
1152 unsigned int x, y;
1153 int error;
1154
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001155 if (rgd->rd_bits[0].bi_bh != NULL)
1156 return 0;
1157
David Teiglandb3b94fa2006-01-16 16:50:04 +00001158 for (x = 0; x < length; x++) {
1159 bi = rgd->rd_bits + x;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001160 error = gfs2_meta_read(gl, rgd->rd_addr + x, 0, &bi->bi_bh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001161 if (error)
1162 goto fail;
1163 }
1164
1165 for (y = length; y--;) {
1166 bi = rgd->rd_bits + y;
Steven Whitehouse7276b3b2006-09-21 17:05:23 -04001167 error = gfs2_meta_wait(sdp, bi->bi_bh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001168 if (error)
1169 goto fail;
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001170 if (gfs2_metatype_check(sdp, bi->bi_bh, y ? GFS2_METATYPE_RB :
David Teiglandb3b94fa2006-01-16 16:50:04 +00001171 GFS2_METATYPE_RG)) {
1172 error = -EIO;
1173 goto fail;
1174 }
1175 }
1176
Bob Petersoncf45b752008-01-31 10:31:39 -06001177 if (!(rgd->rd_flags & GFS2_RDF_UPTODATE)) {
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01001178 for (x = 0; x < length; x++)
1179 clear_bit(GBF_FULL, &rgd->rd_bits[x].bi_flags);
Bob Peterson42d52e32008-01-28 18:38:07 -06001180 gfs2_rgrp_in(rgd, (rgd->rd_bits[0].bi_bh)->b_data);
Steven Whitehouse1ce97e52009-05-21 15:18:19 +01001181 rgd->rd_flags |= (GFS2_RDF_UPTODATE | GFS2_RDF_CHECK);
Bob Peterson7c9ca622011-08-31 09:53:19 +01001182 rgd->rd_free_clone = rgd->rd_free;
Bob Peterson5ea50502013-11-25 11:16:25 +00001183 /* max out the rgrp allocation failure point */
1184 rgd->rd_extfail_pt = rgd->rd_free;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001185 }
Al Viro951b4bd2013-06-02 19:53:40 -04001186 if (cpu_to_be32(GFS2_MAGIC) != rgd->rd_rgl->rl_magic) {
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001187 rgd->rd_rgl->rl_unlinked = cpu_to_be32(count_unlinked(rgd));
1188 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl,
1189 rgd->rd_bits[0].bi_bh->b_data);
1190 }
1191 else if (sdp->sd_args.ar_rgrplvb) {
1192 if (!gfs2_rgrp_lvb_valid(rgd)){
1193 gfs2_consist_rgrpd(rgd);
1194 error = -EIO;
1195 goto fail;
1196 }
1197 if (rgd->rd_rgl->rl_unlinked == 0)
1198 rgd->rd_flags &= ~GFS2_RDF_CHECK;
1199 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001200 return 0;
1201
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001202fail:
David Teiglandb3b94fa2006-01-16 16:50:04 +00001203 while (x--) {
1204 bi = rgd->rd_bits + x;
1205 brelse(bi->bi_bh);
1206 bi->bi_bh = NULL;
1207 gfs2_assert_warn(sdp, !bi->bi_clone);
1208 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001209
1210 return error;
1211}
1212
Rashika Kheriac2b0b302014-02-09 18:40:19 +05301213static int update_rgrp_lvb(struct gfs2_rgrpd *rgd)
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001214{
1215 u32 rl_flags;
1216
1217 if (rgd->rd_flags & GFS2_RDF_UPTODATE)
1218 return 0;
1219
Al Viro951b4bd2013-06-02 19:53:40 -04001220 if (cpu_to_be32(GFS2_MAGIC) != rgd->rd_rgl->rl_magic)
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001221 return gfs2_rgrp_bh_get(rgd);
1222
1223 rl_flags = be32_to_cpu(rgd->rd_rgl->rl_flags);
1224 rl_flags &= ~GFS2_RDF_MASK;
1225 rgd->rd_flags &= GFS2_RDF_MASK;
1226 rgd->rd_flags |= (rl_flags | GFS2_RDF_UPTODATE | GFS2_RDF_CHECK);
1227 if (rgd->rd_rgl->rl_unlinked == 0)
1228 rgd->rd_flags &= ~GFS2_RDF_CHECK;
1229 rgd->rd_free = be32_to_cpu(rgd->rd_rgl->rl_free);
1230 rgd->rd_free_clone = rgd->rd_free;
1231 rgd->rd_dinodes = be32_to_cpu(rgd->rd_rgl->rl_dinodes);
1232 rgd->rd_igeneration = be64_to_cpu(rgd->rd_rgl->rl_igeneration);
1233 return 0;
1234}
1235
1236int gfs2_rgrp_go_lock(struct gfs2_holder *gh)
1237{
1238 struct gfs2_rgrpd *rgd = gh->gh_gl->gl_object;
1239 struct gfs2_sbd *sdp = rgd->rd_sbd;
1240
1241 if (gh->gh_flags & GL_SKIP && sdp->sd_args.ar_rgrplvb)
1242 return 0;
Bob Peterson8b127d02014-01-16 08:52:16 -05001243 return gfs2_rgrp_bh_get(rgd);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001244}
1245
David Teiglandb3b94fa2006-01-16 16:50:04 +00001246/**
Bob Peterson7c9ca622011-08-31 09:53:19 +01001247 * gfs2_rgrp_go_unlock - Release RG bitmaps read in with gfs2_rgrp_bh_get()
Bob Peterson886b1412012-04-11 13:03:52 -04001248 * @gh: The glock holder for the resource group
David Teiglandb3b94fa2006-01-16 16:50:04 +00001249 *
1250 */
1251
Bob Peterson7c9ca622011-08-31 09:53:19 +01001252void gfs2_rgrp_go_unlock(struct gfs2_holder *gh)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001253{
Bob Peterson7c9ca622011-08-31 09:53:19 +01001254 struct gfs2_rgrpd *rgd = gh->gh_gl->gl_object;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001255 int x, length = rgd->rd_length;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001256
David Teiglandb3b94fa2006-01-16 16:50:04 +00001257 for (x = 0; x < length; x++) {
1258 struct gfs2_bitmap *bi = rgd->rd_bits + x;
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001259 if (bi->bi_bh) {
1260 brelse(bi->bi_bh);
1261 bi->bi_bh = NULL;
1262 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001263 }
1264
David Teiglandb3b94fa2006-01-16 16:50:04 +00001265}
1266
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001267int gfs2_rgrp_send_discards(struct gfs2_sbd *sdp, u64 offset,
Bob Peterson7c9ca622011-08-31 09:53:19 +01001268 struct buffer_head *bh,
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001269 const struct gfs2_bitmap *bi, unsigned minlen, u64 *ptrimmed)
Steven Whitehousef15ab562009-02-09 09:25:01 +00001270{
1271 struct super_block *sb = sdp->sd_vfs;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001272 u64 blk;
Steven Whitehouse64d576b2009-02-12 13:31:58 +00001273 sector_t start = 0;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001274 sector_t nr_blks = 0;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001275 int rv;
1276 unsigned int x;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001277 u32 trimmed = 0;
1278 u8 diff;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001279
1280 for (x = 0; x < bi->bi_len; x++) {
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001281 const u8 *clone = bi->bi_clone ? bi->bi_clone : bi->bi_bh->b_data;
1282 clone += bi->bi_offset;
1283 clone += x;
1284 if (bh) {
1285 const u8 *orig = bh->b_data + bi->bi_offset + x;
1286 diff = ~(*orig | (*orig >> 1)) & (*clone | (*clone >> 1));
1287 } else {
1288 diff = ~(*clone | (*clone >> 1));
1289 }
Steven Whitehousef15ab562009-02-09 09:25:01 +00001290 diff &= 0x55;
1291 if (diff == 0)
1292 continue;
1293 blk = offset + ((bi->bi_start + x) * GFS2_NBBY);
Steven Whitehousef15ab562009-02-09 09:25:01 +00001294 while(diff) {
1295 if (diff & 1) {
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001296 if (nr_blks == 0)
Steven Whitehousef15ab562009-02-09 09:25:01 +00001297 goto start_new_extent;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001298 if ((start + nr_blks) != blk) {
1299 if (nr_blks >= minlen) {
1300 rv = sb_issue_discard(sb,
1301 start, nr_blks,
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001302 GFP_NOFS, 0);
1303 if (rv)
1304 goto fail;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001305 trimmed += nr_blks;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001306 }
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001307 nr_blks = 0;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001308start_new_extent:
1309 start = blk;
1310 }
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001311 nr_blks++;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001312 }
1313 diff >>= 2;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001314 blk++;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001315 }
1316 }
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001317 if (nr_blks >= minlen) {
1318 rv = sb_issue_discard(sb, start, nr_blks, GFP_NOFS, 0);
Steven Whitehousef15ab562009-02-09 09:25:01 +00001319 if (rv)
1320 goto fail;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001321 trimmed += nr_blks;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001322 }
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001323 if (ptrimmed)
1324 *ptrimmed = trimmed;
1325 return 0;
1326
Steven Whitehousef15ab562009-02-09 09:25:01 +00001327fail:
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001328 if (sdp->sd_args.ar_discard)
1329 fs_warn(sdp, "error %d on discard request, turning discards off for this filesystem", rv);
Steven Whitehousef15ab562009-02-09 09:25:01 +00001330 sdp->sd_args.ar_discard = 0;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001331 return -EIO;
1332}
1333
1334/**
1335 * gfs2_fitrim - Generate discard requests for unused bits of the filesystem
1336 * @filp: Any file on the filesystem
1337 * @argp: Pointer to the arguments (also used to pass result)
1338 *
1339 * Returns: 0 on success, otherwise error code
1340 */
1341
1342int gfs2_fitrim(struct file *filp, void __user *argp)
1343{
Al Viro496ad9a2013-01-23 17:07:38 -05001344 struct inode *inode = file_inode(filp);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001345 struct gfs2_sbd *sdp = GFS2_SB(inode);
1346 struct request_queue *q = bdev_get_queue(sdp->sd_vfs->s_bdev);
1347 struct buffer_head *bh;
1348 struct gfs2_rgrpd *rgd;
1349 struct gfs2_rgrpd *rgd_end;
1350 struct gfs2_holder gh;
1351 struct fstrim_range r;
1352 int ret = 0;
1353 u64 amt;
1354 u64 trimmed = 0;
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001355 u64 start, end, minlen;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001356 unsigned int x;
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001357 unsigned bs_shift = sdp->sd_sb.sb_bsize_shift;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001358
1359 if (!capable(CAP_SYS_ADMIN))
1360 return -EPERM;
1361
1362 if (!blk_queue_discard(q))
1363 return -EOPNOTSUPP;
1364
Lukas Czerner3a238ad2012-10-16 11:39:07 +02001365 if (copy_from_user(&r, argp, sizeof(r)))
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001366 return -EFAULT;
1367
Bob Peterson5e2f7d62012-04-04 22:11:16 -04001368 ret = gfs2_rindex_update(sdp);
1369 if (ret)
1370 return ret;
1371
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001372 start = r.start >> bs_shift;
1373 end = start + (r.len >> bs_shift);
1374 minlen = max_t(u64, r.minlen,
1375 q->limits.discard_granularity) >> bs_shift;
1376
Abhijith Das6a98c332013-06-19 17:03:29 -04001377 if (end <= start || minlen > sdp->sd_max_rg_data)
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001378 return -EINVAL;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001379
Abhijith Das6a98c332013-06-19 17:03:29 -04001380 rgd = gfs2_blk2rgrpd(sdp, start, 0);
1381 rgd_end = gfs2_blk2rgrpd(sdp, end, 0);
1382
1383 if ((gfs2_rgrpd_get_first(sdp) == gfs2_rgrpd_get_next(rgd_end))
1384 && (start > rgd_end->rd_data0 + rgd_end->rd_data))
1385 return -EINVAL; /* start is beyond the end of the fs */
1386
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001387 while (1) {
1388
1389 ret = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_EXCLUSIVE, 0, &gh);
1390 if (ret)
1391 goto out;
1392
1393 if (!(rgd->rd_flags & GFS2_RGF_TRIMMED)) {
1394 /* Trim each bitmap in the rgrp */
1395 for (x = 0; x < rgd->rd_length; x++) {
1396 struct gfs2_bitmap *bi = rgd->rd_bits + x;
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001397 ret = gfs2_rgrp_send_discards(sdp,
1398 rgd->rd_data0, NULL, bi, minlen,
1399 &amt);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001400 if (ret) {
1401 gfs2_glock_dq_uninit(&gh);
1402 goto out;
1403 }
1404 trimmed += amt;
1405 }
1406
1407 /* Mark rgrp as having been trimmed */
1408 ret = gfs2_trans_begin(sdp, RES_RG_HDR, 0);
1409 if (ret == 0) {
1410 bh = rgd->rd_bits[0].bi_bh;
1411 rgd->rd_flags |= GFS2_RGF_TRIMMED;
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001412 gfs2_trans_add_meta(rgd->rd_gl, bh);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001413 gfs2_rgrp_out(rgd, bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001414 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, bh->b_data);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001415 gfs2_trans_end(sdp);
1416 }
1417 }
1418 gfs2_glock_dq_uninit(&gh);
1419
1420 if (rgd == rgd_end)
1421 break;
1422
1423 rgd = gfs2_rgrpd_get_next(rgd);
1424 }
1425
1426out:
Abhijith Das6a98c332013-06-19 17:03:29 -04001427 r.len = trimmed << bs_shift;
Lukas Czerner3a238ad2012-10-16 11:39:07 +02001428 if (copy_to_user(argp, &r, sizeof(r)))
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001429 return -EFAULT;
1430
1431 return ret;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001432}
1433
David Teiglandb3b94fa2006-01-16 16:50:04 +00001434/**
Bob Peterson8e2e0042012-07-19 08:12:40 -04001435 * rs_insert - insert a new multi-block reservation into the rgrp's rb_tree
Bob Peterson8e2e0042012-07-19 08:12:40 -04001436 * @ip: the inode structure
Bob Peterson8e2e0042012-07-19 08:12:40 -04001437 *
Bob Peterson8e2e0042012-07-19 08:12:40 -04001438 */
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001439static void rs_insert(struct gfs2_inode *ip)
Bob Peterson8e2e0042012-07-19 08:12:40 -04001440{
1441 struct rb_node **newn, *parent = NULL;
1442 int rc;
1443 struct gfs2_blkreserv *rs = ip->i_res;
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001444 struct gfs2_rgrpd *rgd = rs->rs_rbm.rgd;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001445 u64 fsblock = gfs2_rbm_to_block(&rs->rs_rbm);
1446
1447 BUG_ON(gfs2_rs_active(rs));
Bob Peterson8e2e0042012-07-19 08:12:40 -04001448
1449 spin_lock(&rgd->rd_rsspin);
1450 newn = &rgd->rd_rstree.rb_node;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001451 while (*newn) {
1452 struct gfs2_blkreserv *cur =
1453 rb_entry(*newn, struct gfs2_blkreserv, rs_node);
1454
1455 parent = *newn;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001456 rc = rs_cmp(fsblock, rs->rs_free, cur);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001457 if (rc > 0)
1458 newn = &((*newn)->rb_right);
1459 else if (rc < 0)
1460 newn = &((*newn)->rb_left);
1461 else {
1462 spin_unlock(&rgd->rd_rsspin);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001463 WARN_ON(1);
1464 return;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001465 }
1466 }
1467
Bob Peterson8e2e0042012-07-19 08:12:40 -04001468 rb_link_node(&rs->rs_node, parent, newn);
1469 rb_insert_color(&rs->rs_node, &rgd->rd_rstree);
1470
Bob Peterson8e2e0042012-07-19 08:12:40 -04001471 /* Do our rgrp accounting for the reservation */
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001472 rgd->rd_reserved += rs->rs_free; /* blocks reserved */
Bob Peterson8e2e0042012-07-19 08:12:40 -04001473 spin_unlock(&rgd->rd_rsspin);
Steven Whitehouse9e733d32012-08-23 15:37:59 +01001474 trace_gfs2_rs(rs, TRACE_RS_INSERT);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001475}
1476
1477/**
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001478 * rg_mblk_search - find a group of multiple free blocks to form a reservation
Bob Peterson8e2e0042012-07-19 08:12:40 -04001479 * @rgd: the resource group descriptor
Bob Peterson8e2e0042012-07-19 08:12:40 -04001480 * @ip: pointer to the inode for which we're reserving blocks
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001481 * @ap: the allocation parameters
Bob Peterson8e2e0042012-07-19 08:12:40 -04001482 *
Bob Peterson8e2e0042012-07-19 08:12:40 -04001483 */
1484
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001485static void rg_mblk_search(struct gfs2_rgrpd *rgd, struct gfs2_inode *ip,
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001486 const struct gfs2_alloc_parms *ap)
Bob Peterson8e2e0042012-07-19 08:12:40 -04001487{
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001488 struct gfs2_rbm rbm = { .rgd = rgd, };
1489 u64 goal;
1490 struct gfs2_blkreserv *rs = ip->i_res;
1491 u32 extlen;
1492 u32 free_blocks = rgd->rd_free_clone - rgd->rd_reserved;
1493 int ret;
Bob Petersonaf21ca82013-05-14 13:04:29 -04001494 struct inode *inode = &ip->i_inode;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001495
Bob Petersonaf21ca82013-05-14 13:04:29 -04001496 if (S_ISDIR(inode->i_mode))
1497 extlen = 1;
1498 else {
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001499 extlen = max_t(u32, atomic_read(&rs->rs_sizehint), ap->target);
Bob Petersonaf21ca82013-05-14 13:04:29 -04001500 extlen = clamp(extlen, RGRP_RSRV_MINBLKS, free_blocks);
1501 }
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001502 if ((rgd->rd_free_clone < rgd->rd_reserved) || (free_blocks < extlen))
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001503 return;
1504
Bob Peterson8e2e0042012-07-19 08:12:40 -04001505 /* Find bitmap block that contains bits for goal block */
1506 if (rgrp_contains_block(rgd, ip->i_goal))
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001507 goal = ip->i_goal;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001508 else
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001509 goal = rgd->rd_last_alloc + rgd->rd_data0;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001510
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001511 if (WARN_ON(gfs2_rbm_from_block(&rbm, goal)))
1512 return;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001513
Bob Peterson5ce13432013-11-06 10:55:52 -05001514 ret = gfs2_rbm_find(&rbm, GFS2_BLKST_FREE, &extlen, ip, true, ap);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001515 if (ret == 0) {
1516 rs->rs_rbm = rbm;
1517 rs->rs_free = extlen;
1518 rs->rs_inum = ip->i_no_addr;
1519 rs_insert(ip);
Bob Peterson13d2eb02012-12-20 13:23:04 -05001520 } else {
1521 if (goal == rgd->rd_last_alloc + rgd->rd_data0)
1522 rgd->rd_last_alloc = 0;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001523 }
Bob Petersonb3e47ca2011-11-21 11:47:08 -05001524}
1525
David Teiglandb3b94fa2006-01-16 16:50:04 +00001526/**
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001527 * gfs2_next_unreserved_block - Return next block that is not reserved
1528 * @rgd: The resource group
1529 * @block: The starting block
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001530 * @length: The required length
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001531 * @ip: Ignore any reservations for this inode
1532 *
1533 * If the block does not appear in any reservation, then return the
1534 * block number unchanged. If it does appear in the reservation, then
1535 * keep looking through the tree of reservations in order to find the
1536 * first block number which is not reserved.
1537 */
1538
1539static u64 gfs2_next_unreserved_block(struct gfs2_rgrpd *rgd, u64 block,
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001540 u32 length,
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001541 const struct gfs2_inode *ip)
1542{
1543 struct gfs2_blkreserv *rs;
1544 struct rb_node *n;
1545 int rc;
1546
1547 spin_lock(&rgd->rd_rsspin);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001548 n = rgd->rd_rstree.rb_node;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001549 while (n) {
1550 rs = rb_entry(n, struct gfs2_blkreserv, rs_node);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001551 rc = rs_cmp(block, length, rs);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001552 if (rc < 0)
1553 n = n->rb_left;
1554 else if (rc > 0)
1555 n = n->rb_right;
1556 else
1557 break;
1558 }
1559
1560 if (n) {
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001561 while ((rs_cmp(block, length, rs) == 0) && (ip->i_res != rs)) {
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001562 block = gfs2_rbm_to_block(&rs->rs_rbm) + rs->rs_free;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001563 n = n->rb_right;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001564 if (n == NULL)
1565 break;
1566 rs = rb_entry(n, struct gfs2_blkreserv, rs_node);
1567 }
1568 }
1569
1570 spin_unlock(&rgd->rd_rsspin);
1571 return block;
1572}
1573
1574/**
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001575 * gfs2_reservation_check_and_update - Check for reservations during block alloc
1576 * @rbm: The current position in the resource group
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001577 * @ip: The inode for which we are searching for blocks
1578 * @minext: The minimum extent length
Bob Peterson5ce13432013-11-06 10:55:52 -05001579 * @maxext: A pointer to the maximum extent structure
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001580 *
1581 * This checks the current position in the rgrp to see whether there is
1582 * a reservation covering this block. If not then this function is a
1583 * no-op. If there is, then the position is moved to the end of the
1584 * contiguous reservation(s) so that we are pointing at the first
1585 * non-reserved block.
1586 *
1587 * Returns: 0 if no reservation, 1 if @rbm has changed, otherwise an error
1588 */
1589
1590static int gfs2_reservation_check_and_update(struct gfs2_rbm *rbm,
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001591 const struct gfs2_inode *ip,
Bob Peterson5ce13432013-11-06 10:55:52 -05001592 u32 minext,
1593 struct gfs2_extent *maxext)
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001594{
1595 u64 block = gfs2_rbm_to_block(rbm);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001596 u32 extlen = 1;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001597 u64 nblock;
1598 int ret;
1599
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001600 /*
1601 * If we have a minimum extent length, then skip over any extent
1602 * which is less than the min extent length in size.
1603 */
1604 if (minext) {
1605 extlen = gfs2_free_extlen(rbm, minext);
Bob Peterson5ce13432013-11-06 10:55:52 -05001606 if (extlen <= maxext->len)
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001607 goto fail;
1608 }
1609
1610 /*
1611 * Check the extent which has been found against the reservations
1612 * and skip if parts of it are already reserved
1613 */
1614 nblock = gfs2_next_unreserved_block(rbm->rgd, block, extlen, ip);
Bob Peterson5ce13432013-11-06 10:55:52 -05001615 if (nblock == block) {
1616 if (!minext || extlen >= minext)
1617 return 0;
1618
1619 if (extlen > maxext->len) {
1620 maxext->len = extlen;
1621 maxext->rbm = *rbm;
1622 }
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001623fail:
Bob Peterson5ce13432013-11-06 10:55:52 -05001624 nblock = block + extlen;
1625 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001626 ret = gfs2_rbm_from_block(rbm, nblock);
1627 if (ret < 0)
1628 return ret;
1629 return 1;
1630}
1631
1632/**
1633 * gfs2_rbm_find - Look for blocks of a particular state
1634 * @rbm: Value/result starting position and final position
1635 * @state: The state which we want to find
Bob Peterson5ce13432013-11-06 10:55:52 -05001636 * @minext: Pointer to the requested extent length (NULL for a single block)
1637 * This is updated to be the actual reservation size.
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001638 * @ip: If set, check for reservations
1639 * @nowrap: Stop looking at the end of the rgrp, rather than wrapping
1640 * around until we've reached the starting point.
Bob Peterson5ce13432013-11-06 10:55:52 -05001641 * @ap: the allocation parameters
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001642 *
1643 * Side effects:
1644 * - If looking for free blocks, we set GBF_FULL on each bitmap which
1645 * has no free blocks in it.
Bob Peterson5ea50502013-11-25 11:16:25 +00001646 * - If looking for free blocks, we set rd_extfail_pt on each rgrp which
1647 * has come up short on a free block search.
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001648 *
1649 * Returns: 0 on success, -ENOSPC if there is no block of the requested state
1650 */
1651
Bob Peterson5ce13432013-11-06 10:55:52 -05001652static int gfs2_rbm_find(struct gfs2_rbm *rbm, u8 state, u32 *minext,
1653 const struct gfs2_inode *ip, bool nowrap,
1654 const struct gfs2_alloc_parms *ap)
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001655{
1656 struct buffer_head *bh;
Bob Petersone579ed42013-09-17 13:12:15 -04001657 int initial_bii;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001658 u32 initial_offset;
Bob Peterson5ea50502013-11-25 11:16:25 +00001659 int first_bii = rbm->bii;
1660 u32 first_offset = rbm->offset;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001661 u32 offset;
1662 u8 *buffer;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001663 int n = 0;
1664 int iters = rbm->rgd->rd_length;
1665 int ret;
Bob Petersone579ed42013-09-17 13:12:15 -04001666 struct gfs2_bitmap *bi;
Bob Peterson5ce13432013-11-06 10:55:52 -05001667 struct gfs2_extent maxext = { .rbm.rgd = rbm->rgd, };
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001668
1669 /* If we are not starting at the beginning of a bitmap, then we
1670 * need to add one to the bitmap count to ensure that we search
1671 * the starting bitmap twice.
1672 */
1673 if (rbm->offset != 0)
1674 iters++;
1675
1676 while(1) {
Bob Petersone579ed42013-09-17 13:12:15 -04001677 bi = rbm_bi(rbm);
1678 if (test_bit(GBF_FULL, &bi->bi_flags) &&
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001679 (state == GFS2_BLKST_FREE))
1680 goto next_bitmap;
1681
Bob Petersone579ed42013-09-17 13:12:15 -04001682 bh = bi->bi_bh;
1683 buffer = bh->b_data + bi->bi_offset;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001684 WARN_ON(!buffer_uptodate(bh));
Bob Petersone579ed42013-09-17 13:12:15 -04001685 if (state != GFS2_BLKST_UNLINKED && bi->bi_clone)
1686 buffer = bi->bi_clone + bi->bi_offset;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001687 initial_offset = rbm->offset;
Bob Petersone579ed42013-09-17 13:12:15 -04001688 offset = gfs2_bitfit(buffer, bi->bi_len, rbm->offset, state);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001689 if (offset == BFITNOENT)
1690 goto bitmap_full;
1691 rbm->offset = offset;
1692 if (ip == NULL)
1693 return 0;
1694
Bob Petersone579ed42013-09-17 13:12:15 -04001695 initial_bii = rbm->bii;
Bob Peterson5ce13432013-11-06 10:55:52 -05001696 ret = gfs2_reservation_check_and_update(rbm, ip,
1697 minext ? *minext : 0,
1698 &maxext);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001699 if (ret == 0)
1700 return 0;
1701 if (ret > 0) {
Bob Petersone579ed42013-09-17 13:12:15 -04001702 n += (rbm->bii - initial_bii);
Bob Peterson8d8b7522012-08-07 13:28:17 -04001703 goto next_iter;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001704 }
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001705 if (ret == -E2BIG) {
Bob Petersone579ed42013-09-17 13:12:15 -04001706 rbm->bii = 0;
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001707 rbm->offset = 0;
Bob Petersone579ed42013-09-17 13:12:15 -04001708 n += (rbm->bii - initial_bii);
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001709 goto res_covered_end_of_rgrp;
1710 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001711 return ret;
1712
1713bitmap_full: /* Mark bitmap as full and fall through */
Bob Petersone579ed42013-09-17 13:12:15 -04001714 if ((state == GFS2_BLKST_FREE) && initial_offset == 0) {
1715 struct gfs2_bitmap *bi = rbm_bi(rbm);
1716 set_bit(GBF_FULL, &bi->bi_flags);
1717 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001718
1719next_bitmap: /* Find next bitmap in the rgrp */
1720 rbm->offset = 0;
Bob Petersone579ed42013-09-17 13:12:15 -04001721 rbm->bii++;
1722 if (rbm->bii == rbm->rgd->rd_length)
1723 rbm->bii = 0;
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001724res_covered_end_of_rgrp:
Bob Petersone579ed42013-09-17 13:12:15 -04001725 if ((rbm->bii == 0) && nowrap)
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001726 break;
1727 n++;
Bob Peterson8d8b7522012-08-07 13:28:17 -04001728next_iter:
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001729 if (n >= iters)
1730 break;
1731 }
1732
Bob Peterson5ce13432013-11-06 10:55:52 -05001733 if (minext == NULL || state != GFS2_BLKST_FREE)
1734 return -ENOSPC;
1735
Bob Peterson5ea50502013-11-25 11:16:25 +00001736 /* If the extent was too small, and it's smaller than the smallest
1737 to have failed before, remember for future reference that it's
1738 useless to search this rgrp again for this amount or more. */
1739 if ((first_offset == 0) && (first_bii == 0) &&
1740 (*minext < rbm->rgd->rd_extfail_pt))
1741 rbm->rgd->rd_extfail_pt = *minext;
1742
Bob Peterson5ce13432013-11-06 10:55:52 -05001743 /* If the maximum extent we found is big enough to fulfill the
1744 minimum requirements, use it anyway. */
1745 if (maxext.len) {
1746 *rbm = maxext.rbm;
1747 *minext = maxext.len;
1748 return 0;
1749 }
1750
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001751 return -ENOSPC;
1752}
1753
1754/**
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001755 * try_rgrp_unlink - Look for any unlinked, allocated, but unused inodes
1756 * @rgd: The rgrp
Bob Peterson886b1412012-04-11 13:03:52 -04001757 * @last_unlinked: block address of the last dinode we unlinked
1758 * @skip: block address we should explicitly not unlink
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001759 *
Bob Peterson1a0eae82010-04-14 11:58:16 -04001760 * Returns: 0 if no error
1761 * The inode, if one has been found, in inode.
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001762 */
1763
Steven Whitehouse044b9412010-11-03 20:01:07 +00001764static void try_rgrp_unlink(struct gfs2_rgrpd *rgd, u64 *last_unlinked, u64 skip)
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001765{
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001766 u64 block;
Bob Peterson5f3eae72007-08-08 16:52:09 -05001767 struct gfs2_sbd *sdp = rgd->rd_sbd;
Steven Whitehouse044b9412010-11-03 20:01:07 +00001768 struct gfs2_glock *gl;
1769 struct gfs2_inode *ip;
1770 int error;
1771 int found = 0;
Bob Petersone579ed42013-09-17 13:12:15 -04001772 struct gfs2_rbm rbm = { .rgd = rgd, .bii = 0, .offset = 0 };
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001773
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001774 while (1) {
Bob Peterson5f3eae72007-08-08 16:52:09 -05001775 down_write(&sdp->sd_log_flush_lock);
Bob Peterson5ce13432013-11-06 10:55:52 -05001776 error = gfs2_rbm_find(&rbm, GFS2_BLKST_UNLINKED, NULL, NULL,
1777 true, NULL);
Bob Peterson5f3eae72007-08-08 16:52:09 -05001778 up_write(&sdp->sd_log_flush_lock);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001779 if (error == -ENOSPC)
1780 break;
1781 if (WARN_ON_ONCE(error))
Bob Peterson24c73872007-07-12 16:58:50 -05001782 break;
Bob Petersonb3e47ca2011-11-21 11:47:08 -05001783
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001784 block = gfs2_rbm_to_block(&rbm);
1785 if (gfs2_rbm_from_block(&rbm, block + 1))
1786 break;
1787 if (*last_unlinked != NO_BLOCK && block <= *last_unlinked)
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001788 continue;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001789 if (block == skip)
Steven Whitehouse1e19a192009-07-10 21:13:38 +01001790 continue;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001791 *last_unlinked = block;
Steven Whitehouse044b9412010-11-03 20:01:07 +00001792
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001793 error = gfs2_glock_get(sdp, block, &gfs2_inode_glops, CREATE, &gl);
Steven Whitehouse044b9412010-11-03 20:01:07 +00001794 if (error)
1795 continue;
1796
1797 /* If the inode is already in cache, we can ignore it here
1798 * because the existing inode disposal code will deal with
1799 * it when all refs have gone away. Accessing gl_object like
1800 * this is not safe in general. Here it is ok because we do
1801 * not dereference the pointer, and we only need an approx
1802 * answer to whether it is NULL or not.
1803 */
1804 ip = gl->gl_object;
1805
1806 if (ip || queue_work(gfs2_delete_workqueue, &gl->gl_delete) == 0)
1807 gfs2_glock_put(gl);
1808 else
1809 found++;
1810
1811 /* Limit reclaim to sensible number of tasks */
Bob Peterson44ad37d2011-03-17 16:19:58 -04001812 if (found > NR_CPUS)
Steven Whitehouse044b9412010-11-03 20:01:07 +00001813 return;
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001814 }
1815
1816 rgd->rd_flags &= ~GFS2_RDF_CHECK;
Steven Whitehouse044b9412010-11-03 20:01:07 +00001817 return;
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001818}
1819
Steven Whitehousebcd97c02012-10-31 09:58:42 +00001820/**
1821 * gfs2_rgrp_congested - Use stats to figure out whether an rgrp is congested
1822 * @rgd: The rgrp in question
1823 * @loops: An indication of how picky we can be (0=very, 1=less so)
1824 *
1825 * This function uses the recently added glock statistics in order to
1826 * figure out whether a parciular resource group is suffering from
1827 * contention from multiple nodes. This is done purely on the basis
1828 * of timings, since this is the only data we have to work with and
1829 * our aim here is to reject a resource group which is highly contended
1830 * but (very important) not to do this too often in order to ensure that
1831 * we do not land up introducing fragmentation by changing resource
1832 * groups when not actually required.
1833 *
1834 * The calculation is fairly simple, we want to know whether the SRTTB
1835 * (i.e. smoothed round trip time for blocking operations) to acquire
1836 * the lock for this rgrp's glock is significantly greater than the
1837 * time taken for resource groups on average. We introduce a margin in
1838 * the form of the variable @var which is computed as the sum of the two
1839 * respective variences, and multiplied by a factor depending on @loops
1840 * and whether we have a lot of data to base the decision on. This is
1841 * then tested against the square difference of the means in order to
1842 * decide whether the result is statistically significant or not.
1843 *
1844 * Returns: A boolean verdict on the congestion status
1845 */
1846
1847static bool gfs2_rgrp_congested(const struct gfs2_rgrpd *rgd, int loops)
1848{
1849 const struct gfs2_glock *gl = rgd->rd_gl;
1850 const struct gfs2_sbd *sdp = gl->gl_sbd;
1851 struct gfs2_lkstats *st;
1852 s64 r_dcount, l_dcount;
1853 s64 r_srttb, l_srttb;
1854 s64 srttb_diff;
1855 s64 sqr_diff;
1856 s64 var;
1857
1858 preempt_disable();
1859 st = &this_cpu_ptr(sdp->sd_lkstats)->lkstats[LM_TYPE_RGRP];
1860 r_srttb = st->stats[GFS2_LKS_SRTTB];
1861 r_dcount = st->stats[GFS2_LKS_DCOUNT];
1862 var = st->stats[GFS2_LKS_SRTTVARB] +
1863 gl->gl_stats.stats[GFS2_LKS_SRTTVARB];
1864 preempt_enable();
1865
1866 l_srttb = gl->gl_stats.stats[GFS2_LKS_SRTTB];
1867 l_dcount = gl->gl_stats.stats[GFS2_LKS_DCOUNT];
1868
1869 if ((l_dcount < 1) || (r_dcount < 1) || (r_srttb == 0))
1870 return false;
1871
1872 srttb_diff = r_srttb - l_srttb;
1873 sqr_diff = srttb_diff * srttb_diff;
1874
1875 var *= 2;
1876 if (l_dcount < 8 || r_dcount < 8)
1877 var *= 2;
1878 if (loops == 1)
1879 var *= 2;
1880
1881 return ((srttb_diff < 0) && (sqr_diff > var));
1882}
1883
1884/**
1885 * gfs2_rgrp_used_recently
1886 * @rs: The block reservation with the rgrp to test
1887 * @msecs: The time limit in milliseconds
1888 *
1889 * Returns: True if the rgrp glock has been used within the time limit
1890 */
1891static bool gfs2_rgrp_used_recently(const struct gfs2_blkreserv *rs,
1892 u64 msecs)
1893{
1894 u64 tdiff;
1895
1896 tdiff = ktime_to_ns(ktime_sub(ktime_get_real(),
1897 rs->rs_rbm.rgd->rd_gl->gl_dstamp));
1898
1899 return tdiff > (msecs * 1000 * 1000);
1900}
1901
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001902static u32 gfs2_orlov_skip(const struct gfs2_inode *ip)
1903{
1904 const struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1905 u32 skip;
1906
1907 get_random_bytes(&skip, sizeof(skip));
1908 return skip % sdp->sd_rgrps;
1909}
1910
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001911static bool gfs2_select_rgrp(struct gfs2_rgrpd **pos, const struct gfs2_rgrpd *begin)
1912{
1913 struct gfs2_rgrpd *rgd = *pos;
Steven Whitehouseaa8920c2012-11-13 14:50:35 +00001914 struct gfs2_sbd *sdp = rgd->rd_sbd;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001915
1916 rgd = gfs2_rgrpd_get_next(rgd);
1917 if (rgd == NULL)
Steven Whitehouseaa8920c2012-11-13 14:50:35 +00001918 rgd = gfs2_rgrpd_get_first(sdp);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001919 *pos = rgd;
1920 if (rgd != begin) /* If we didn't wrap */
1921 return true;
1922 return false;
1923}
1924
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001925/**
Bob Peterson0e27c182014-10-29 08:02:28 -05001926 * fast_to_acquire - determine if a resource group will be fast to acquire
1927 *
1928 * If this is one of our preferred rgrps, it should be quicker to acquire,
1929 * because we tried to set ourselves up as dlm lock master.
1930 */
1931static inline int fast_to_acquire(struct gfs2_rgrpd *rgd)
1932{
1933 struct gfs2_glock *gl = rgd->rd_gl;
1934
1935 if (gl->gl_state != LM_ST_UNLOCKED && list_empty(&gl->gl_holders) &&
1936 !test_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags) &&
1937 !test_bit(GLF_DEMOTE, &gl->gl_flags))
1938 return 1;
1939 if (rgd->rd_flags & GFS2_RDF_PREFERRED)
1940 return 1;
1941 return 0;
1942}
1943
1944/**
Bob Peterson666d1d82012-06-13 23:03:56 -04001945 * gfs2_inplace_reserve - Reserve space in the filesystem
David Teiglandb3b94fa2006-01-16 16:50:04 +00001946 * @ip: the inode to reserve space for
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001947 * @ap: the allocation parameters
David Teiglandb3b94fa2006-01-16 16:50:04 +00001948 *
Abhi Das25435e52015-03-18 12:04:37 -05001949 * We try our best to find an rgrp that has at least ap->target blocks
1950 * available. After a couple of passes (loops == 2), the prospects of finding
1951 * such an rgrp diminish. At this stage, we return the first rgrp that has
1952 * atleast ap->min_target blocks available. Either way, we set ap->allowed to
1953 * the number of blocks available in the chosen rgrp.
1954 *
1955 * Returns: 0 on success,
1956 * -ENOMEM if a suitable rgrp can't be found
1957 * errno otherwise
David Teiglandb3b94fa2006-01-16 16:50:04 +00001958 */
1959
Abhi Das25435e52015-03-18 12:04:37 -05001960int gfs2_inplace_reserve(struct gfs2_inode *ip, struct gfs2_alloc_parms *ap)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001961{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001962 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001963 struct gfs2_rgrpd *begin = NULL;
Bob Peterson564e12b2011-11-21 13:36:17 -05001964 struct gfs2_blkreserv *rs = ip->i_res;
Steven Whitehousebcd97c02012-10-31 09:58:42 +00001965 int error = 0, rg_locked, flags = 0;
Bob Peterson666d1d82012-06-13 23:03:56 -04001966 u64 last_unlinked = NO_BLOCK;
Bob Peterson7c9ca622011-08-31 09:53:19 +01001967 int loops = 0;
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001968 u32 skip = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001969
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001970 if (sdp->sd_args.ar_rgrplvb)
1971 flags |= GL_SKIP;
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001972 if (gfs2_assert_warn(sdp, ap->target))
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001973 return -EINVAL;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001974 if (gfs2_rs_active(rs)) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001975 begin = rs->rs_rbm.rgd;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001976 } else if (ip->i_rgd && rgrp_contains_block(ip->i_rgd, ip->i_goal)) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001977 rs->rs_rbm.rgd = begin = ip->i_rgd;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001978 } else {
Abhi Das00a158b2014-09-18 21:40:28 -05001979 check_and_update_goal(ip);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001980 rs->rs_rbm.rgd = begin = gfs2_blk2rgrpd(sdp, ip->i_goal, 1);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001981 }
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001982 if (S_ISDIR(ip->i_inode.i_mode) && (ap->aflags & GFS2_AF_ORLOV))
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001983 skip = gfs2_orlov_skip(ip);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001984 if (rs->rs_rbm.rgd == NULL)
Bob Peterson7c9ca622011-08-31 09:53:19 +01001985 return -EBADSLT;
1986
1987 while (loops < 3) {
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001988 rg_locked = 1;
Abhijith Das292c8c12007-11-29 14:13:54 -06001989
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001990 if (!gfs2_glock_is_locked_by_me(rs->rs_rbm.rgd->rd_gl)) {
1991 rg_locked = 0;
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001992 if (skip && skip--)
1993 goto next_rgrp;
Bob Peterson0e27c182014-10-29 08:02:28 -05001994 if (!gfs2_rs_active(rs)) {
1995 if (loops == 0 &&
1996 !fast_to_acquire(rs->rs_rbm.rgd))
1997 goto next_rgrp;
1998 if ((loops < 2) &&
1999 gfs2_rgrp_used_recently(rs, 1000) &&
2000 gfs2_rgrp_congested(rs->rs_rbm.rgd, loops))
2001 goto next_rgrp;
2002 }
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002003 error = gfs2_glock_nq_init(rs->rs_rbm.rgd->rd_gl,
Bob Peterson8e2e0042012-07-19 08:12:40 -04002004 LM_ST_EXCLUSIVE, flags,
2005 &rs->rs_rgd_gh);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002006 if (unlikely(error))
2007 return error;
Steven Whitehousebcd97c02012-10-31 09:58:42 +00002008 if (!gfs2_rs_active(rs) && (loops < 2) &&
2009 gfs2_rgrp_congested(rs->rs_rbm.rgd, loops))
2010 goto skip_rgrp;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002011 if (sdp->sd_args.ar_rgrplvb) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002012 error = update_rgrp_lvb(rs->rs_rbm.rgd);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002013 if (unlikely(error)) {
Benjamin Marzinski90306c42012-05-29 23:01:09 -05002014 gfs2_glock_dq_uninit(&rs->rs_rgd_gh);
2015 return error;
2016 }
2017 }
Abhijith Das292c8c12007-11-29 14:13:54 -06002018 }
Bob Peterson666d1d82012-06-13 23:03:56 -04002019
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002020 /* Skip unuseable resource groups */
Bob Peterson5ea50502013-11-25 11:16:25 +00002021 if ((rs->rs_rbm.rgd->rd_flags & (GFS2_RGF_NOALLOC |
2022 GFS2_RDF_ERROR)) ||
Abhi Das25435e52015-03-18 12:04:37 -05002023 (loops == 0 && ap->target > rs->rs_rbm.rgd->rd_extfail_pt))
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002024 goto skip_rgrp;
2025
2026 if (sdp->sd_args.ar_rgrplvb)
2027 gfs2_rgrp_bh_get(rs->rs_rbm.rgd);
2028
2029 /* Get a reservation if we don't already have one */
2030 if (!gfs2_rs_active(rs))
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01002031 rg_mblk_search(rs->rs_rbm.rgd, ip, ap);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002032
2033 /* Skip rgrps when we can't get a reservation on first pass */
2034 if (!gfs2_rs_active(rs) && (loops < 1))
2035 goto check_rgrp;
2036
2037 /* If rgrp has enough free space, use it */
Abhi Das25435e52015-03-18 12:04:37 -05002038 if (rs->rs_rbm.rgd->rd_free_clone >= ap->target ||
2039 (loops == 2 && ap->min_target &&
2040 rs->rs_rbm.rgd->rd_free_clone >= ap->min_target)) {
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002041 ip->i_rgd = rs->rs_rbm.rgd;
Abhi Das25435e52015-03-18 12:04:37 -05002042 ap->allowed = ip->i_rgd->rd_free_clone;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002043 return 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002044 }
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002045check_rgrp:
2046 /* Check for unlinked inodes which can be reclaimed */
2047 if (rs->rs_rbm.rgd->rd_flags & GFS2_RDF_CHECK)
2048 try_rgrp_unlink(rs->rs_rbm.rgd, &last_unlinked,
2049 ip->i_no_addr);
2050skip_rgrp:
Bob Peterson1330edb2013-11-06 10:58:00 -05002051 /* Drop reservation, if we couldn't use reserved rgrp */
2052 if (gfs2_rs_active(rs))
2053 gfs2_rs_deltree(rs);
2054
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002055 /* Unlock rgrp if required */
2056 if (!rg_locked)
2057 gfs2_glock_dq_uninit(&rs->rs_rgd_gh);
2058next_rgrp:
2059 /* Find the next rgrp, and continue looking */
2060 if (gfs2_select_rgrp(&rs->rs_rbm.rgd, begin))
2061 continue;
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00002062 if (skip)
2063 continue;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002064
2065 /* If we've scanned all the rgrps, but found no free blocks
2066 * then this checks for some less likely conditions before
2067 * trying again.
2068 */
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002069 loops++;
2070 /* Check that fs hasn't grown if writing to rindex */
2071 if (ip == GFS2_I(sdp->sd_rindex) && !sdp->sd_rindex_uptodate) {
2072 error = gfs2_ri_update(ip);
2073 if (error)
2074 return error;
2075 }
2076 /* Flushing the log may release space */
2077 if (loops == 2)
Benjamin Marzinski24972552014-05-01 22:26:55 -05002078 gfs2_log_flush(sdp, NULL, NORMAL_FLUSH);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002079 }
2080
2081 return -ENOSPC;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002082}
2083
2084/**
2085 * gfs2_inplace_release - release an inplace reservation
2086 * @ip: the inode the reservation was taken out on
2087 *
2088 * Release a reservation made by gfs2_inplace_reserve().
2089 */
2090
2091void gfs2_inplace_release(struct gfs2_inode *ip)
2092{
Bob Peterson564e12b2011-11-21 13:36:17 -05002093 struct gfs2_blkreserv *rs = ip->i_res;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002094
Bob Peterson564e12b2011-11-21 13:36:17 -05002095 if (rs->rs_rgd_gh.gh_gl)
2096 gfs2_glock_dq_uninit(&rs->rs_rgd_gh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002097}
2098
2099/**
2100 * gfs2_get_block_type - Check a block in a RG is of given type
2101 * @rgd: the resource group holding the block
2102 * @block: the block number
2103 *
2104 * Returns: The block type (GFS2_BLKST_*)
2105 */
2106
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002107static unsigned char gfs2_get_block_type(struct gfs2_rgrpd *rgd, u64 block)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002108{
Steven Whitehouse39839032012-08-03 11:10:30 +01002109 struct gfs2_rbm rbm = { .rgd = rgd, };
2110 int ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002111
Steven Whitehouse39839032012-08-03 11:10:30 +01002112 ret = gfs2_rbm_from_block(&rbm, block);
2113 WARN_ON_ONCE(ret != 0);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002114
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002115 return gfs2_testbit(&rbm);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002116}
2117
David Teiglandb3b94fa2006-01-16 16:50:04 +00002118
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002119/**
2120 * gfs2_alloc_extent - allocate an extent from a given bitmap
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002121 * @rbm: the resource group information
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002122 * @dinode: TRUE if the first block we allocate is for a dinode
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002123 * @n: The extent length (value/result)
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002124 *
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002125 * Add the bitmap buffer to the transaction.
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002126 * Set the found bits to @new_state to change block's allocation state.
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002127 */
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002128static void gfs2_alloc_extent(const struct gfs2_rbm *rbm, bool dinode,
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002129 unsigned int *n)
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002130{
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002131 struct gfs2_rbm pos = { .rgd = rbm->rgd, };
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002132 const unsigned int elen = *n;
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002133 u64 block;
2134 int ret;
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002135
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002136 *n = 1;
2137 block = gfs2_rbm_to_block(rbm);
Bob Petersone579ed42013-09-17 13:12:15 -04002138 gfs2_trans_add_meta(rbm->rgd->rd_gl, rbm_bi(rbm)->bi_bh);
Steven Whitehouse3e6339d2012-08-13 11:37:51 +01002139 gfs2_setbit(rbm, true, dinode ? GFS2_BLKST_DINODE : GFS2_BLKST_USED);
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002140 block++;
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002141 while (*n < elen) {
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002142 ret = gfs2_rbm_from_block(&pos, block);
Bob Peterson0688a5e2012-08-28 08:45:56 -04002143 if (ret || gfs2_testbit(&pos) != GFS2_BLKST_FREE)
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002144 break;
Bob Petersone579ed42013-09-17 13:12:15 -04002145 gfs2_trans_add_meta(pos.rgd->rd_gl, rbm_bi(&pos)->bi_bh);
Steven Whitehouse3e6339d2012-08-13 11:37:51 +01002146 gfs2_setbit(&pos, true, GFS2_BLKST_USED);
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002147 (*n)++;
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002148 block++;
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002149 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00002150}
2151
2152/**
2153 * rgblk_free - Change alloc state of given block(s)
2154 * @sdp: the filesystem
2155 * @bstart: the start of a run of blocks to free
2156 * @blen: the length of the block run (all must lie within ONE RG!)
2157 * @new_state: GFS2_BLKST_XXX the after-allocation block state
2158 *
2159 * Returns: Resource group containing the block(s)
2160 */
2161
Steven Whitehousecd915492006-09-04 12:49:07 -04002162static struct gfs2_rgrpd *rgblk_free(struct gfs2_sbd *sdp, u64 bstart,
2163 u32 blen, unsigned char new_state)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002164{
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002165 struct gfs2_rbm rbm;
Bob Petersond24e0562014-10-03 08:38:06 -04002166 struct gfs2_bitmap *bi, *bi_prev = NULL;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002167
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002168 rbm.rgd = gfs2_blk2rgrpd(sdp, bstart, 1);
2169 if (!rbm.rgd) {
David Teiglandb3b94fa2006-01-16 16:50:04 +00002170 if (gfs2_consist(sdp))
Steven Whitehouse382066d2006-05-24 10:22:09 -04002171 fs_err(sdp, "block = %llu\n", (unsigned long long)bstart);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002172 return NULL;
2173 }
2174
Bob Petersond24e0562014-10-03 08:38:06 -04002175 gfs2_rbm_from_block(&rbm, bstart);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002176 while (blen--) {
Bob Petersone579ed42013-09-17 13:12:15 -04002177 bi = rbm_bi(&rbm);
Bob Petersond24e0562014-10-03 08:38:06 -04002178 if (bi != bi_prev) {
2179 if (!bi->bi_clone) {
2180 bi->bi_clone = kmalloc(bi->bi_bh->b_size,
2181 GFP_NOFS | __GFP_NOFAIL);
2182 memcpy(bi->bi_clone + bi->bi_offset,
2183 bi->bi_bh->b_data + bi->bi_offset,
2184 bi->bi_len);
2185 }
2186 gfs2_trans_add_meta(rbm.rgd->rd_gl, bi->bi_bh);
2187 bi_prev = bi;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002188 }
Steven Whitehouse3e6339d2012-08-13 11:37:51 +01002189 gfs2_setbit(&rbm, false, new_state);
Bob Petersond24e0562014-10-03 08:38:06 -04002190 gfs2_rbm_incr(&rbm);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002191 }
2192
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002193 return rbm.rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002194}
2195
2196/**
Steven Whitehouse09010972009-05-20 10:48:47 +01002197 * gfs2_rgrp_dump - print out an rgrp
2198 * @seq: The iterator
2199 * @gl: The glock in question
David Teiglandb3b94fa2006-01-16 16:50:04 +00002200 *
David Teiglandb3b94fa2006-01-16 16:50:04 +00002201 */
2202
Steven Whitehouseac3beb62014-01-16 10:31:13 +00002203void gfs2_rgrp_dump(struct seq_file *seq, const struct gfs2_glock *gl)
Steven Whitehouse09010972009-05-20 10:48:47 +01002204{
Bob Peterson8e2e0042012-07-19 08:12:40 -04002205 struct gfs2_rgrpd *rgd = gl->gl_object;
2206 struct gfs2_blkreserv *trs;
2207 const struct rb_node *n;
2208
Steven Whitehouse09010972009-05-20 10:48:47 +01002209 if (rgd == NULL)
Steven Whitehouseac3beb62014-01-16 10:31:13 +00002210 return;
Bob Peterson5ea50502013-11-25 11:16:25 +00002211 gfs2_print_dbg(seq, " R: n:%llu f:%02x b:%u/%u i:%u r:%u e:%u\n",
Steven Whitehouse09010972009-05-20 10:48:47 +01002212 (unsigned long long)rgd->rd_addr, rgd->rd_flags,
Bob Peterson8e2e0042012-07-19 08:12:40 -04002213 rgd->rd_free, rgd->rd_free_clone, rgd->rd_dinodes,
Bob Peterson5ea50502013-11-25 11:16:25 +00002214 rgd->rd_reserved, rgd->rd_extfail_pt);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002215 spin_lock(&rgd->rd_rsspin);
2216 for (n = rb_first(&rgd->rd_rstree); n; n = rb_next(&trs->rs_node)) {
2217 trs = rb_entry(n, struct gfs2_blkreserv, rs_node);
2218 dump_rs(seq, trs);
2219 }
2220 spin_unlock(&rgd->rd_rsspin);
Steven Whitehouse09010972009-05-20 10:48:47 +01002221}
2222
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002223static void gfs2_rgrp_error(struct gfs2_rgrpd *rgd)
2224{
2225 struct gfs2_sbd *sdp = rgd->rd_sbd;
2226 fs_warn(sdp, "rgrp %llu has an error, marking it readonly until umount\n",
Steven Whitehouse86d00632009-09-14 09:50:57 +01002227 (unsigned long long)rgd->rd_addr);
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002228 fs_warn(sdp, "umount on all nodes and run fsck.gfs2 to fix the error\n");
2229 gfs2_rgrp_dump(NULL, rgd->rd_gl);
2230 rgd->rd_flags |= GFS2_RDF_ERROR;
2231}
2232
Steven Whitehouse09010972009-05-20 10:48:47 +01002233/**
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002234 * gfs2_adjust_reservation - Adjust (or remove) a reservation after allocation
2235 * @ip: The inode we have just allocated blocks for
2236 * @rbm: The start of the allocated blocks
2237 * @len: The extent length
Bob Peterson8e2e0042012-07-19 08:12:40 -04002238 *
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002239 * Adjusts a reservation after an allocation has taken place. If the
2240 * reservation does not match the allocation, or if it is now empty
2241 * then it is removed.
Bob Peterson8e2e0042012-07-19 08:12:40 -04002242 */
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002243
2244static void gfs2_adjust_reservation(struct gfs2_inode *ip,
2245 const struct gfs2_rbm *rbm, unsigned len)
Bob Peterson8e2e0042012-07-19 08:12:40 -04002246{
2247 struct gfs2_blkreserv *rs = ip->i_res;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002248 struct gfs2_rgrpd *rgd = rbm->rgd;
2249 unsigned rlen;
2250 u64 block;
2251 int ret;
Bob Peterson8e2e0042012-07-19 08:12:40 -04002252
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002253 spin_lock(&rgd->rd_rsspin);
2254 if (gfs2_rs_active(rs)) {
2255 if (gfs2_rbm_eq(&rs->rs_rbm, rbm)) {
2256 block = gfs2_rbm_to_block(rbm);
2257 ret = gfs2_rbm_from_block(&rs->rs_rbm, block + len);
2258 rlen = min(rs->rs_free, len);
2259 rs->rs_free -= rlen;
2260 rgd->rd_reserved -= rlen;
Steven Whitehouse9e733d32012-08-23 15:37:59 +01002261 trace_gfs2_rs(rs, TRACE_RS_CLAIM);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002262 if (rs->rs_free && !ret)
2263 goto out;
Bob Peterson1a855032014-10-29 08:02:30 -05002264 /* We used up our block reservation, so we should
2265 reserve more blocks next time. */
2266 atomic_add(RGRP_RSRV_ADDBLKS, &rs->rs_sizehint);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002267 }
Bob Peterson20095212013-03-13 10:26:38 -04002268 __rs_deltree(rs);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002269 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002270out:
2271 spin_unlock(&rgd->rd_rsspin);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002272}
2273
2274/**
Steven Whitehouse9e07f2c2013-10-02 14:42:45 +01002275 * gfs2_set_alloc_start - Set starting point for block allocation
2276 * @rbm: The rbm which will be set to the required location
2277 * @ip: The gfs2 inode
2278 * @dinode: Flag to say if allocation includes a new inode
2279 *
2280 * This sets the starting point from the reservation if one is active
2281 * otherwise it falls back to guessing a start point based on the
2282 * inode's goal block or the last allocation point in the rgrp.
2283 */
2284
2285static void gfs2_set_alloc_start(struct gfs2_rbm *rbm,
2286 const struct gfs2_inode *ip, bool dinode)
2287{
2288 u64 goal;
2289
2290 if (gfs2_rs_active(ip->i_res)) {
2291 *rbm = ip->i_res->rs_rbm;
2292 return;
2293 }
2294
2295 if (!dinode && rgrp_contains_block(rbm->rgd, ip->i_goal))
2296 goal = ip->i_goal;
2297 else
2298 goal = rbm->rgd->rd_last_alloc + rbm->rgd->rd_data0;
2299
2300 gfs2_rbm_from_block(rbm, goal);
2301}
2302
2303/**
Bob Peterson6e87ed02011-11-18 10:58:32 -05002304 * gfs2_alloc_blocks - Allocate one or more blocks of data and/or a dinode
Steven Whitehouse09010972009-05-20 10:48:47 +01002305 * @ip: the inode to allocate the block for
2306 * @bn: Used to return the starting block number
Bob Peterson8e2e0042012-07-19 08:12:40 -04002307 * @nblocks: requested number of blocks/extent length (value/result)
Bob Peterson6e87ed02011-11-18 10:58:32 -05002308 * @dinode: 1 if we're allocating a dinode block, else 0
Bob Peterson3c5d7852011-11-14 11:17:08 -05002309 * @generation: the generation number of the inode
Steven Whitehouse09010972009-05-20 10:48:47 +01002310 *
2311 * Returns: 0 or error
2312 */
2313
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002314int gfs2_alloc_blocks(struct gfs2_inode *ip, u64 *bn, unsigned int *nblocks,
Bob Peterson6e87ed02011-11-18 10:58:32 -05002315 bool dinode, u64 *generation)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002316{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002317 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Steven Whitehoused9ba7612009-04-23 08:59:41 +01002318 struct buffer_head *dibh;
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002319 struct gfs2_rbm rbm = { .rgd = ip->i_rgd, };
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002320 unsigned int ndata;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002321 u64 block; /* block, within the file system scope */
Steven Whitehoused9ba7612009-04-23 08:59:41 +01002322 int error;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002323
Steven Whitehouse9e07f2c2013-10-02 14:42:45 +01002324 gfs2_set_alloc_start(&rbm, ip, dinode);
Bob Peterson5ce13432013-11-06 10:55:52 -05002325 error = gfs2_rbm_find(&rbm, GFS2_BLKST_FREE, NULL, ip, false, NULL);
Steven Whitehouse62e252e2012-07-30 11:06:08 +01002326
Steven Whitehouse137834a2012-08-23 13:43:40 +01002327 if (error == -ENOSPC) {
Steven Whitehouse9e07f2c2013-10-02 14:42:45 +01002328 gfs2_set_alloc_start(&rbm, ip, dinode);
Bob Peterson5ce13432013-11-06 10:55:52 -05002329 error = gfs2_rbm_find(&rbm, GFS2_BLKST_FREE, NULL, NULL, false,
2330 NULL);
Steven Whitehouse137834a2012-08-23 13:43:40 +01002331 }
2332
Steven Whitehouse62e252e2012-07-30 11:06:08 +01002333 /* Since all blocks are reserved in advance, this shouldn't happen */
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002334 if (error) {
Bob Peterson5ea50502013-11-25 11:16:25 +00002335 fs_warn(sdp, "inum=%llu error=%d, nblocks=%u, full=%d fail_pt=%d\n",
Steven Whitehouse9e733d32012-08-23 15:37:59 +01002336 (unsigned long long)ip->i_no_addr, error, *nblocks,
Bob Peterson5ea50502013-11-25 11:16:25 +00002337 test_bit(GBF_FULL, &rbm.rgd->rd_bits->bi_flags),
2338 rbm.rgd->rd_extfail_pt);
Steven Whitehouse62e252e2012-07-30 11:06:08 +01002339 goto rgrp_error;
2340 }
2341
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002342 gfs2_alloc_extent(&rbm, dinode, nblocks);
2343 block = gfs2_rbm_to_block(&rbm);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002344 rbm.rgd->rd_last_alloc = block - rbm.rgd->rd_data0;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002345 if (gfs2_rs_active(ip->i_res))
2346 gfs2_adjust_reservation(ip, &rbm, *nblocks);
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002347 ndata = *nblocks;
2348 if (dinode)
2349 ndata--;
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002350
Bob Peterson3c5d7852011-11-14 11:17:08 -05002351 if (!dinode) {
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002352 ip->i_goal = block + ndata - 1;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002353 error = gfs2_meta_inode_buffer(ip, &dibh);
2354 if (error == 0) {
2355 struct gfs2_dinode *di =
2356 (struct gfs2_dinode *)dibh->b_data;
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002357 gfs2_trans_add_meta(ip->i_gl, dibh);
Bob Peterson3c5d7852011-11-14 11:17:08 -05002358 di->di_goal_meta = di->di_goal_data =
2359 cpu_to_be64(ip->i_goal);
2360 brelse(dibh);
2361 }
Steven Whitehoused9ba7612009-04-23 08:59:41 +01002362 }
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002363 if (rbm.rgd->rd_free < *nblocks) {
Fabian Frederickfc554ed2014-03-05 22:06:42 +08002364 pr_warn("nblocks=%u\n", *nblocks);
Steven Whitehouse09010972009-05-20 10:48:47 +01002365 goto rgrp_error;
Bob Peterson8e2e0042012-07-19 08:12:40 -04002366 }
Steven Whitehouse09010972009-05-20 10:48:47 +01002367
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002368 rbm.rgd->rd_free -= *nblocks;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002369 if (dinode) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002370 rbm.rgd->rd_dinodes++;
2371 *generation = rbm.rgd->rd_igeneration++;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002372 if (*generation == 0)
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002373 *generation = rbm.rgd->rd_igeneration++;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002374 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00002375
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002376 gfs2_trans_add_meta(rbm.rgd->rd_gl, rbm.rgd->rd_bits[0].bi_bh);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002377 gfs2_rgrp_out(rbm.rgd, rbm.rgd->rd_bits[0].bi_bh->b_data);
2378 gfs2_rgrp_ondisk2lvb(rbm.rgd->rd_rgl, rbm.rgd->rd_bits[0].bi_bh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002379
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002380 gfs2_statfs_change(sdp, 0, -(s64)*nblocks, dinode ? 1 : 0);
Bob Peterson3c5d7852011-11-14 11:17:08 -05002381 if (dinode)
Steven Whitehouseb2c8b3e2014-02-04 15:45:11 +00002382 gfs2_trans_add_unrevoke(sdp, block, *nblocks);
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002383
Steven Whitehousefd4b4e02013-02-26 16:15:20 +00002384 gfs2_quota_change(ip, *nblocks, ip->i_inode.i_uid, ip->i_inode.i_gid);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002385
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002386 rbm.rgd->rd_free_clone -= *nblocks;
2387 trace_gfs2_block_alloc(ip, rbm.rgd, block, *nblocks,
Bob Peterson6e87ed02011-11-18 10:58:32 -05002388 dinode ? GFS2_BLKST_DINODE : GFS2_BLKST_USED);
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002389 *bn = block;
2390 return 0;
2391
2392rgrp_error:
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002393 gfs2_rgrp_error(rbm.rgd);
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002394 return -EIO;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002395}
2396
2397/**
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002398 * __gfs2_free_blocks - free a contiguous run of block(s)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002399 * @ip: the inode these blocks are being freed from
2400 * @bstart: first block of a run of contiguous blocks
2401 * @blen: the length of the block run
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002402 * @meta: 1 if the blocks represent metadata
David Teiglandb3b94fa2006-01-16 16:50:04 +00002403 *
2404 */
2405
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002406void __gfs2_free_blocks(struct gfs2_inode *ip, u64 bstart, u32 blen, int meta)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002407{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002408 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002409 struct gfs2_rgrpd *rgd;
2410
2411 rgd = rgblk_free(sdp, bstart, blen, GFS2_BLKST_FREE);
2412 if (!rgd)
2413 return;
Bob Peterson41db1ab2012-05-09 12:11:35 -04002414 trace_gfs2_block_alloc(ip, rgd, bstart, blen, GFS2_BLKST_FREE);
Steven Whitehousecfc8b542008-11-04 10:25:13 +00002415 rgd->rd_free += blen;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00002416 rgd->rd_flags &= ~GFS2_RGF_TRIMMED;
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002417 gfs2_trans_add_meta(rgd->rd_gl, rgd->rd_bits[0].bi_bh);
Bob Peterson42d52e32008-01-28 18:38:07 -06002418 gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05002419 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, rgd->rd_bits[0].bi_bh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002420
Steven Whitehouse6d3117b2011-05-21 14:05:58 +01002421 /* Directories keep their data in the metadata address space */
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002422 if (meta || ip->i_depth)
Steven Whitehouse6d3117b2011-05-21 14:05:58 +01002423 gfs2_meta_wipe(ip, bstart, blen);
Bob Peterson4c16c362011-02-23 16:11:33 -05002424}
David Teiglandb3b94fa2006-01-16 16:50:04 +00002425
Bob Peterson4c16c362011-02-23 16:11:33 -05002426/**
Bob Peterson4c16c362011-02-23 16:11:33 -05002427 * gfs2_free_meta - free a contiguous run of data block(s)
2428 * @ip: the inode these blocks are being freed from
2429 * @bstart: first block of a run of contiguous blocks
2430 * @blen: the length of the block run
2431 *
2432 */
2433
Steven Whitehousecd915492006-09-04 12:49:07 -04002434void gfs2_free_meta(struct gfs2_inode *ip, u64 bstart, u32 blen)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002435{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002436 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002437
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002438 __gfs2_free_blocks(ip, bstart, blen, 1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002439 gfs2_statfs_change(sdp, 0, +blen, 0);
Steven Whitehouse2933f922006-11-01 13:23:29 -05002440 gfs2_quota_change(ip, -(s64)blen, ip->i_inode.i_uid, ip->i_inode.i_gid);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002441}
2442
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002443void gfs2_unlink_di(struct inode *inode)
2444{
2445 struct gfs2_inode *ip = GFS2_I(inode);
2446 struct gfs2_sbd *sdp = GFS2_SB(inode);
2447 struct gfs2_rgrpd *rgd;
Steven Whitehousedbb7cae2007-05-15 15:37:50 +01002448 u64 blkno = ip->i_no_addr;
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002449
2450 rgd = rgblk_free(sdp, blkno, 1, GFS2_BLKST_UNLINKED);
2451 if (!rgd)
2452 return;
Bob Peterson41db1ab2012-05-09 12:11:35 -04002453 trace_gfs2_block_alloc(ip, rgd, blkno, 1, GFS2_BLKST_UNLINKED);
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002454 gfs2_trans_add_meta(rgd->rd_gl, rgd->rd_bits[0].bi_bh);
Bob Peterson42d52e32008-01-28 18:38:07 -06002455 gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05002456 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, rgd->rd_bits[0].bi_bh->b_data);
2457 update_rgrp_lvb_unlinked(rgd, 1);
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002458}
2459
Steven Whitehousecd915492006-09-04 12:49:07 -04002460static void gfs2_free_uninit_di(struct gfs2_rgrpd *rgd, u64 blkno)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002461{
2462 struct gfs2_sbd *sdp = rgd->rd_sbd;
2463 struct gfs2_rgrpd *tmp_rgd;
2464
2465 tmp_rgd = rgblk_free(sdp, blkno, 1, GFS2_BLKST_FREE);
2466 if (!tmp_rgd)
2467 return;
2468 gfs2_assert_withdraw(sdp, rgd == tmp_rgd);
2469
Steven Whitehouse73f74942008-11-04 10:32:57 +00002470 if (!rgd->rd_dinodes)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002471 gfs2_consist_rgrpd(rgd);
Steven Whitehouse73f74942008-11-04 10:32:57 +00002472 rgd->rd_dinodes--;
Steven Whitehousecfc8b542008-11-04 10:25:13 +00002473 rgd->rd_free++;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002474
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002475 gfs2_trans_add_meta(rgd->rd_gl, rgd->rd_bits[0].bi_bh);
Bob Peterson42d52e32008-01-28 18:38:07 -06002476 gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05002477 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, rgd->rd_bits[0].bi_bh->b_data);
2478 update_rgrp_lvb_unlinked(rgd, -1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002479
2480 gfs2_statfs_change(sdp, 0, +1, -1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002481}
2482
David Teiglandb3b94fa2006-01-16 16:50:04 +00002483
2484void gfs2_free_di(struct gfs2_rgrpd *rgd, struct gfs2_inode *ip)
2485{
Steven Whitehousedbb7cae2007-05-15 15:37:50 +01002486 gfs2_free_uninit_di(rgd, ip->i_no_addr);
Bob Peterson41db1ab2012-05-09 12:11:35 -04002487 trace_gfs2_block_alloc(ip, rgd, ip->i_no_addr, 1, GFS2_BLKST_FREE);
Steven Whitehouse2933f922006-11-01 13:23:29 -05002488 gfs2_quota_change(ip, -1, ip->i_inode.i_uid, ip->i_inode.i_gid);
Steven Whitehousedbb7cae2007-05-15 15:37:50 +01002489 gfs2_meta_wipe(ip, ip->i_no_addr, 1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002490}
2491
2492/**
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002493 * gfs2_check_blk_type - Check the type of a block
2494 * @sdp: The superblock
2495 * @no_addr: The block number to check
2496 * @type: The block type we are looking for
2497 *
2498 * Returns: 0 if the block type matches the expected type
2499 * -ESTALE if it doesn't match
2500 * or -ve errno if something went wrong while checking
2501 */
2502
2503int gfs2_check_blk_type(struct gfs2_sbd *sdp, u64 no_addr, unsigned int type)
2504{
2505 struct gfs2_rgrpd *rgd;
Steven Whitehouse8339ee52011-08-31 16:38:29 +01002506 struct gfs2_holder rgd_gh;
Bob Peterson58884c42012-03-05 10:19:35 -05002507 int error = -EINVAL;
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002508
Steven Whitehouse66fc0612012-02-08 12:58:32 +00002509 rgd = gfs2_blk2rgrpd(sdp, no_addr, 1);
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002510 if (!rgd)
Steven Whitehouse8339ee52011-08-31 16:38:29 +01002511 goto fail;
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002512
2513 error = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_SHARED, 0, &rgd_gh);
2514 if (error)
Steven Whitehouse8339ee52011-08-31 16:38:29 +01002515 goto fail;
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002516
2517 if (gfs2_get_block_type(rgd, no_addr) != type)
2518 error = -ESTALE;
2519
2520 gfs2_glock_dq_uninit(&rgd_gh);
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002521fail:
2522 return error;
2523}
2524
2525/**
David Teiglandb3b94fa2006-01-16 16:50:04 +00002526 * gfs2_rlist_add - add a RG to a list of RGs
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002527 * @ip: the inode
David Teiglandb3b94fa2006-01-16 16:50:04 +00002528 * @rlist: the list of resource groups
2529 * @block: the block
2530 *
2531 * Figure out what RG a block belongs to and add that RG to the list
2532 *
2533 * FIXME: Don't use NOFAIL
2534 *
2535 */
2536
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002537void gfs2_rlist_add(struct gfs2_inode *ip, struct gfs2_rgrp_list *rlist,
Steven Whitehousecd915492006-09-04 12:49:07 -04002538 u64 block)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002539{
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002540 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002541 struct gfs2_rgrpd *rgd;
2542 struct gfs2_rgrpd **tmp;
2543 unsigned int new_space;
2544 unsigned int x;
2545
2546 if (gfs2_assert_warn(sdp, !rlist->rl_ghs))
2547 return;
2548
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002549 if (ip->i_rgd && rgrp_contains_block(ip->i_rgd, block))
2550 rgd = ip->i_rgd;
2551 else
Steven Whitehouse66fc0612012-02-08 12:58:32 +00002552 rgd = gfs2_blk2rgrpd(sdp, block, 1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002553 if (!rgd) {
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002554 fs_err(sdp, "rlist_add: no rgrp for block %llu\n", (unsigned long long)block);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002555 return;
2556 }
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002557 ip->i_rgd = rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002558
2559 for (x = 0; x < rlist->rl_rgrps; x++)
2560 if (rlist->rl_rgd[x] == rgd)
2561 return;
2562
2563 if (rlist->rl_rgrps == rlist->rl_space) {
2564 new_space = rlist->rl_space + 10;
2565
2566 tmp = kcalloc(new_space, sizeof(struct gfs2_rgrpd *),
Steven Whitehousedd894be2006-07-27 14:29:00 -04002567 GFP_NOFS | __GFP_NOFAIL);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002568
2569 if (rlist->rl_rgd) {
2570 memcpy(tmp, rlist->rl_rgd,
2571 rlist->rl_space * sizeof(struct gfs2_rgrpd *));
2572 kfree(rlist->rl_rgd);
2573 }
2574
2575 rlist->rl_space = new_space;
2576 rlist->rl_rgd = tmp;
2577 }
2578
2579 rlist->rl_rgd[rlist->rl_rgrps++] = rgd;
2580}
2581
2582/**
2583 * gfs2_rlist_alloc - all RGs have been added to the rlist, now allocate
2584 * and initialize an array of glock holders for them
2585 * @rlist: the list of resource groups
2586 * @state: the lock state to acquire the RG lock in
David Teiglandb3b94fa2006-01-16 16:50:04 +00002587 *
2588 * FIXME: Don't use NOFAIL
2589 *
2590 */
2591
Bob Petersonfe6c9912008-01-28 11:13:02 -06002592void gfs2_rlist_alloc(struct gfs2_rgrp_list *rlist, unsigned int state)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002593{
2594 unsigned int x;
2595
2596 rlist->rl_ghs = kcalloc(rlist->rl_rgrps, sizeof(struct gfs2_holder),
Steven Whitehousedd894be2006-07-27 14:29:00 -04002597 GFP_NOFS | __GFP_NOFAIL);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002598 for (x = 0; x < rlist->rl_rgrps; x++)
2599 gfs2_holder_init(rlist->rl_rgd[x]->rd_gl,
Bob Petersonfe6c9912008-01-28 11:13:02 -06002600 state, 0,
David Teiglandb3b94fa2006-01-16 16:50:04 +00002601 &rlist->rl_ghs[x]);
2602}
2603
2604/**
2605 * gfs2_rlist_free - free a resource group list
Fabian Frederick27ff6a02014-07-02 22:05:27 +02002606 * @rlist: the list of resource groups
David Teiglandb3b94fa2006-01-16 16:50:04 +00002607 *
2608 */
2609
2610void gfs2_rlist_free(struct gfs2_rgrp_list *rlist)
2611{
2612 unsigned int x;
2613
2614 kfree(rlist->rl_rgd);
2615
2616 if (rlist->rl_ghs) {
2617 for (x = 0; x < rlist->rl_rgrps; x++)
2618 gfs2_holder_uninit(&rlist->rl_ghs[x]);
2619 kfree(rlist->rl_ghs);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002620 rlist->rl_ghs = NULL;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002621 }
2622}
2623