blob: 55ef72dc5b13c80c8c9dcb37a45b5dd18e93dd29 [file] [log] [blame]
David Teiglandb3b94fa2006-01-16 16:50:04 +00001/*
2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
Bob Petersonfe6c9912008-01-28 11:13:02 -06003 * Copyright (C) 2004-2008 Red Hat, Inc. All rights reserved.
David Teiglandb3b94fa2006-01-16 16:50:04 +00004 *
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
Steven Whitehousee9fc2aa2006-09-01 11:05:15 -04007 * of the GNU General Public License version 2.
David Teiglandb3b94fa2006-01-16 16:50:04 +00008 */
9
Joe Perchesd77d1b52014-03-06 12:10:45 -080010#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
11
David Teiglandb3b94fa2006-01-16 16:50:04 +000012#include <linux/slab.h>
13#include <linux/spinlock.h>
14#include <linux/completion.h>
15#include <linux/buffer_head.h>
Steven Whitehousef42faf42006-01-30 18:34:10 +000016#include <linux/fs.h>
Steven Whitehouse5c676f62006-02-27 17:23:27 -050017#include <linux/gfs2_ondisk.h>
Bob Peterson1f466a42008-03-10 18:17:47 -050018#include <linux/prefetch.h>
Steven Whitehousef15ab562009-02-09 09:25:01 +000019#include <linux/blkdev.h>
Bob Peterson7c9ca622011-08-31 09:53:19 +010020#include <linux/rbtree.h>
Steven Whitehouse9dbe9612012-10-31 10:37:10 +000021#include <linux/random.h>
David Teiglandb3b94fa2006-01-16 16:50:04 +000022
23#include "gfs2.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050024#include "incore.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000025#include "glock.h"
26#include "glops.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000027#include "lops.h"
28#include "meta_io.h"
29#include "quota.h"
30#include "rgrp.h"
31#include "super.h"
32#include "trans.h"
Steven Whitehouse5c676f62006-02-27 17:23:27 -050033#include "util.h"
Benjamin Marzinski172e0452007-03-23 14:51:56 -060034#include "log.h"
Steven Whitehousec8cdf472007-06-08 10:05:33 +010035#include "inode.h"
Steven Whitehouse63997772009-06-12 08:49:20 +010036#include "trace_gfs2.h"
David Teiglandb3b94fa2006-01-16 16:50:04 +000037
Steven Whitehouse2c1e52a2006-09-05 15:41:57 -040038#define BFITNOENT ((u32)~0)
Bob Peterson6760bdc2007-07-24 14:09:32 -050039#define NO_BLOCK ((u64)~0)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040040
Bob Peterson1f466a42008-03-10 18:17:47 -050041#if BITS_PER_LONG == 32
42#define LBITMASK (0x55555555UL)
43#define LBITSKIP55 (0x55555555UL)
44#define LBITSKIP00 (0x00000000UL)
45#else
46#define LBITMASK (0x5555555555555555UL)
47#define LBITSKIP55 (0x5555555555555555UL)
48#define LBITSKIP00 (0x0000000000000000UL)
49#endif
50
/*
 * These routines are used by the resource group routines (rgrp.c)
 * to keep track of block allocation.  Each block is represented by two
 * bits, so each byte represents GFS2_NBBY (i.e. 4) blocks.
 *
 * 0 = Free
 * 1 = Used (not metadata)
 * 2 = Unlinked (still in use) inode
 * 3 = Used (metadata)
 */
61
Bob Peterson5ce13432013-11-06 10:55:52 -050062struct gfs2_extent {
63 struct gfs2_rbm rbm;
64 u32 len;
65};
66
/*
 * Table of permitted block state changes, indexed by
 * (new_state * 4 + cur_state).  A non-zero entry means that a block
 * currently in cur_state may be switched to new_state.
 */
static const char valid_change[16] = {
	/* current state:    0  1  2  3 */
	/* new state 0 */    0, 1, 1, 1,
	/* new state 1 */    1, 0, 0, 0,
	/* new state 2 */    0, 0, 0, 1,
	/* new state 3 */    1, 0, 0, 0
};
74
Bob Peterson5ce13432013-11-06 10:55:52 -050075static int gfs2_rbm_find(struct gfs2_rbm *rbm, u8 state, u32 *minext,
76 const struct gfs2_inode *ip, bool nowrap,
77 const struct gfs2_alloc_parms *ap);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +010078
79
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040080/**
81 * gfs2_setbit - Set a bit in the bitmaps
Steven Whitehouse3e6339d2012-08-13 11:37:51 +010082 * @rbm: The position of the bit to set
83 * @do_clone: Also set the clone bitmap, if it exists
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040084 * @new_state: the new state of the block
85 *
86 */
87
Steven Whitehouse3e6339d2012-08-13 11:37:51 +010088static inline void gfs2_setbit(const struct gfs2_rbm *rbm, bool do_clone,
Bob Peterson06344b92012-04-26 12:44:35 -040089 unsigned char new_state)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040090{
Steven Whitehouseb45e41d2008-02-06 10:11:15 +000091 unsigned char *byte1, *byte2, *end, cur_state;
Bob Petersone579ed42013-09-17 13:12:15 -040092 struct gfs2_bitmap *bi = rbm_bi(rbm);
93 unsigned int buflen = bi->bi_len;
Steven Whitehouse3e6339d2012-08-13 11:37:51 +010094 const unsigned int bit = (rbm->offset % GFS2_NBBY) * GFS2_BIT_SIZE;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040095
Bob Petersone579ed42013-09-17 13:12:15 -040096 byte1 = bi->bi_bh->b_data + bi->bi_offset + (rbm->offset / GFS2_NBBY);
97 end = bi->bi_bh->b_data + bi->bi_offset + buflen;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -040098
Steven Whitehouseb45e41d2008-02-06 10:11:15 +000099 BUG_ON(byte1 >= end);
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400100
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000101 cur_state = (*byte1 >> bit) & GFS2_BIT_MASK;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400102
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000103 if (unlikely(!valid_change[new_state * 4 + cur_state])) {
Joe Perchesd77d1b52014-03-06 12:10:45 -0800104 pr_warn("buf_blk = 0x%x old_state=%d, new_state=%d\n",
105 rbm->offset, cur_state, new_state);
106 pr_warn("rgrp=0x%llx bi_start=0x%x\n",
107 (unsigned long long)rbm->rgd->rd_addr, bi->bi_start);
108 pr_warn("bi_offset=0x%x bi_len=0x%x\n",
109 bi->bi_offset, bi->bi_len);
Bob Peterson95c8e172011-03-22 10:49:12 -0400110 dump_stack();
Steven Whitehouse3e6339d2012-08-13 11:37:51 +0100111 gfs2_consist_rgrpd(rbm->rgd);
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000112 return;
113 }
114 *byte1 ^= (cur_state ^ new_state) << bit;
115
Bob Petersone579ed42013-09-17 13:12:15 -0400116 if (do_clone && bi->bi_clone) {
117 byte2 = bi->bi_clone + bi->bi_offset + (rbm->offset / GFS2_NBBY);
Steven Whitehouseb45e41d2008-02-06 10:11:15 +0000118 cur_state = (*byte2 >> bit) & GFS2_BIT_MASK;
119 *byte2 ^= (cur_state ^ new_state) << bit;
120 }
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400121}
122
123/**
124 * gfs2_testbit - test a bit in the bitmaps
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100125 * @rbm: The bit to test
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400126 *
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100127 * Returns: The two bit block state of the requested bit
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400128 */
129
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100130static inline u8 gfs2_testbit(const struct gfs2_rbm *rbm)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400131{
Bob Petersone579ed42013-09-17 13:12:15 -0400132 struct gfs2_bitmap *bi = rbm_bi(rbm);
133 const u8 *buffer = bi->bi_bh->b_data + bi->bi_offset;
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100134 const u8 *byte;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400135 unsigned int bit;
136
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100137 byte = buffer + (rbm->offset / GFS2_NBBY);
138 bit = (rbm->offset % GFS2_NBBY) * GFS2_BIT_SIZE;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400139
Steven Whitehousec04a2ef2012-08-13 11:14:57 +0100140 return (*byte >> bit) & GFS2_BIT_MASK;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400141}
142
143/**
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000144 * gfs2_bit_search
145 * @ptr: Pointer to bitmap data
146 * @mask: Mask to use (normally 0x55555.... but adjusted for search start)
147 * @state: The state we are searching for
148 *
149 * We xor the bitmap data with a patter which is the bitwise opposite
150 * of what we are looking for, this gives rise to a pattern of ones
151 * wherever there is a match. Since we have two bits per entry, we
152 * take this pattern, shift it down by one place and then and it with
153 * the original. All the even bit positions (0,2,4, etc) then represent
154 * successful matches, so we mask with 0x55555..... to remove the unwanted
155 * odd bit positions.
156 *
157 * This allows searching of a whole u64 at once (32 blocks) with a
158 * single test (on 64 bit arches).
159 */
160
161static inline u64 gfs2_bit_search(const __le64 *ptr, u64 mask, u8 state)
162{
163 u64 tmp;
164 static const u64 search[] = {
Hannes Eder075ac442009-02-21 02:11:42 +0100165 [0] = 0xffffffffffffffffULL,
166 [1] = 0xaaaaaaaaaaaaaaaaULL,
167 [2] = 0x5555555555555555ULL,
168 [3] = 0x0000000000000000ULL,
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000169 };
170 tmp = le64_to_cpu(*ptr) ^ search[state];
171 tmp &= (tmp >> 1);
172 tmp &= mask;
173 return tmp;
174}
175
176/**
Bob Peterson8e2e0042012-07-19 08:12:40 -0400177 * rs_cmp - multi-block reservation range compare
178 * @blk: absolute file system block number of the new reservation
179 * @len: number of blocks in the new reservation
180 * @rs: existing reservation to compare against
181 *
182 * returns: 1 if the block range is beyond the reach of the reservation
183 * -1 if the block range is before the start of the reservation
184 * 0 if the block range overlaps with the reservation
185 */
186static inline int rs_cmp(u64 blk, u32 len, struct gfs2_blkreserv *rs)
187{
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100188 u64 startblk = gfs2_rbm_to_block(&rs->rs_rbm);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400189
190 if (blk >= startblk + rs->rs_free)
191 return 1;
192 if (blk + len - 1 < startblk)
193 return -1;
194 return 0;
195}
196
197/**
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400198 * gfs2_bitfit - Search an rgrp's bitmap buffer to find a bit-pair representing
199 * a block in a given allocation state.
Bob Peterson886b1412012-04-11 13:03:52 -0400200 * @buf: the buffer that holds the bitmaps
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000201 * @len: the length (in bytes) of the buffer
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400202 * @goal: start search at this block's bit-pair (within @buffer)
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000203 * @state: GFS2_BLKST_XXX the state of the block we're looking for.
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400204 *
205 * Scope of @goal and returned block number is only within this bitmap buffer,
206 * not entire rgrp or filesystem. @buffer will be offset from the actual
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000207 * beginning of a bitmap block buffer, skipping any header structures, but
208 * headers are always a multiple of 64 bits long so that the buffer is
209 * always aligned to a 64 bit boundary.
210 *
211 * The size of the buffer is in bytes, but is it assumed that it is
Anand Gadiyarfd589a82009-07-16 17:13:03 +0200212 * always ok to read a complete multiple of 64 bits at the end
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000213 * of the block in case the end is no aligned to a natural boundary.
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400214 *
215 * Return: the block number (bitmap buffer scope) that was found
216 */
217
Hannes Eder02ab1722009-02-21 02:12:05 +0100218static u32 gfs2_bitfit(const u8 *buf, const unsigned int len,
219 u32 goal, u8 state)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400220{
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000221 u32 spoint = (goal << 1) & ((8*sizeof(u64)) - 1);
222 const __le64 *ptr = ((__le64 *)buf) + (goal >> 5);
223 const __le64 *end = (__le64 *)(buf + ALIGN(len, sizeof(u64)));
224 u64 tmp;
Hannes Eder075ac442009-02-21 02:11:42 +0100225 u64 mask = 0x5555555555555555ULL;
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000226 u32 bit;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400227
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000228 /* Mask off bits we don't care about at the start of the search */
229 mask <<= spoint;
230 tmp = gfs2_bit_search(ptr, mask, state);
231 ptr++;
232 while(tmp == 0 && ptr < end) {
Hannes Eder075ac442009-02-21 02:11:42 +0100233 tmp = gfs2_bit_search(ptr, 0x5555555555555555ULL, state);
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000234 ptr++;
Bob Peterson1f466a42008-03-10 18:17:47 -0500235 }
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000236 /* Mask off any bits which are more than len bytes from the start */
237 if (ptr == end && (len & (sizeof(u64) - 1)))
238 tmp &= (((u64)~0) >> (64 - 8*(len & (sizeof(u64) - 1))));
239 /* Didn't find anything, so return */
240 if (tmp == 0)
241 return BFITNOENT;
242 ptr--;
Steven Whitehoused8bd5042009-04-23 08:54:02 +0100243 bit = __ffs64(tmp);
Steven Whitehouse223b2b82009-02-17 14:13:35 +0000244 bit /= 2; /* two bits per entry in the bitmap */
245 return (((const unsigned char *)ptr - buf) * GFS2_NBBY) + bit;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400246}
247
248/**
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100249 * gfs2_rbm_from_block - Set the rbm based upon rgd and block number
250 * @rbm: The rbm with rgd already set correctly
251 * @block: The block number (filesystem relative)
252 *
253 * This sets the bi and offset members of an rbm based on a
254 * resource group and a filesystem relative block number. The
255 * resource group must be set in the rbm on entry, the bi and
256 * offset members will be set by this function.
257 *
258 * Returns: 0 on success, or an error code
259 */
260
261static int gfs2_rbm_from_block(struct gfs2_rbm *rbm, u64 block)
262{
263 u64 rblock = block - rbm->rgd->rd_data0;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100264
265 if (WARN_ON_ONCE(rblock > UINT_MAX))
266 return -EINVAL;
267 if (block >= rbm->rgd->rd_data0 + rbm->rgd->rd_data)
268 return -E2BIG;
269
Bob Petersone579ed42013-09-17 13:12:15 -0400270 rbm->bii = 0;
Bob Petersona68a0a32012-10-19 08:32:51 -0400271 rbm->offset = (u32)(rblock);
272 /* Check if the block is within the first block */
Bob Petersone579ed42013-09-17 13:12:15 -0400273 if (rbm->offset < rbm_bi(rbm)->bi_blocks)
Bob Petersona68a0a32012-10-19 08:32:51 -0400274 return 0;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100275
Bob Petersona68a0a32012-10-19 08:32:51 -0400276 /* Adjust for the size diff between gfs2_meta_header and gfs2_rgrp */
277 rbm->offset += (sizeof(struct gfs2_rgrp) -
278 sizeof(struct gfs2_meta_header)) * GFS2_NBBY;
Bob Petersone579ed42013-09-17 13:12:15 -0400279 rbm->bii = rbm->offset / rbm->rgd->rd_sbd->sd_blocks_per_bitmap;
280 rbm->offset -= rbm->bii * rbm->rgd->rd_sbd->sd_blocks_per_bitmap;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100281 return 0;
282}
283
284/**
Bob Peterson149ed7f2013-09-17 13:14:35 -0400285 * gfs2_rbm_incr - increment an rbm structure
286 * @rbm: The rbm with rgd already set correctly
287 *
288 * This function takes an existing rbm structure and increments it to the next
289 * viable block offset.
290 *
291 * Returns: If incrementing the offset would cause the rbm to go past the
292 * end of the rgrp, true is returned, otherwise false.
293 *
294 */
295
296static bool gfs2_rbm_incr(struct gfs2_rbm *rbm)
297{
298 if (rbm->offset + 1 < rbm_bi(rbm)->bi_blocks) { /* in the same bitmap */
299 rbm->offset++;
300 return false;
301 }
302 if (rbm->bii == rbm->rgd->rd_length - 1) /* at the last bitmap */
303 return true;
304
305 rbm->offset = 0;
306 rbm->bii++;
307 return false;
308}
309
310/**
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100311 * gfs2_unaligned_extlen - Look for free blocks which are not byte aligned
312 * @rbm: Position to search (value/result)
313 * @n_unaligned: Number of unaligned blocks to check
314 * @len: Decremented for each block found (terminate on zero)
315 *
316 * Returns: true if a non-free block is encountered
317 */
318
319static bool gfs2_unaligned_extlen(struct gfs2_rbm *rbm, u32 n_unaligned, u32 *len)
320{
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100321 u32 n;
322 u8 res;
323
324 for (n = 0; n < n_unaligned; n++) {
325 res = gfs2_testbit(rbm);
326 if (res != GFS2_BLKST_FREE)
327 return true;
328 (*len)--;
329 if (*len == 0)
330 return true;
Bob Peterson149ed7f2013-09-17 13:14:35 -0400331 if (gfs2_rbm_incr(rbm))
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100332 return true;
333 }
334
335 return false;
336}
337
338/**
339 * gfs2_free_extlen - Return extent length of free blocks
Fabian Frederick27ff6a02014-07-02 22:05:27 +0200340 * @rrbm: Starting position
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100341 * @len: Max length to check
342 *
343 * Starting at the block specified by the rbm, see how many free blocks
344 * there are, not reading more than len blocks ahead. This can be done
345 * using memchr_inv when the blocks are byte aligned, but has to be done
346 * on a block by block basis in case of unaligned blocks. Also this
347 * function can cope with bitmap boundaries (although it must stop on
348 * a resource group boundary)
349 *
350 * Returns: Number of free blocks in the extent
351 */
352
353static u32 gfs2_free_extlen(const struct gfs2_rbm *rrbm, u32 len)
354{
355 struct gfs2_rbm rbm = *rrbm;
356 u32 n_unaligned = rbm.offset & 3;
357 u32 size = len;
358 u32 bytes;
359 u32 chunk_size;
360 u8 *ptr, *start, *end;
361 u64 block;
Bob Petersone579ed42013-09-17 13:12:15 -0400362 struct gfs2_bitmap *bi;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100363
364 if (n_unaligned &&
365 gfs2_unaligned_extlen(&rbm, 4 - n_unaligned, &len))
366 goto out;
367
Bob Peterson37015302012-09-12 09:40:31 -0400368 n_unaligned = len & 3;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100369 /* Start is now byte aligned */
370 while (len > 3) {
Bob Petersone579ed42013-09-17 13:12:15 -0400371 bi = rbm_bi(&rbm);
372 start = bi->bi_bh->b_data;
373 if (bi->bi_clone)
374 start = bi->bi_clone;
375 end = start + bi->bi_bh->b_size;
376 start += bi->bi_offset;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100377 BUG_ON(rbm.offset & 3);
378 start += (rbm.offset / GFS2_NBBY);
379 bytes = min_t(u32, len / GFS2_NBBY, (end - start));
380 ptr = memchr_inv(start, 0, bytes);
381 chunk_size = ((ptr == NULL) ? bytes : (ptr - start));
382 chunk_size *= GFS2_NBBY;
383 BUG_ON(len < chunk_size);
384 len -= chunk_size;
385 block = gfs2_rbm_to_block(&rbm);
Bob Peterson15bd50a2012-12-20 13:21:07 -0500386 if (gfs2_rbm_from_block(&rbm, block + chunk_size)) {
387 n_unaligned = 0;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100388 break;
Bob Peterson15bd50a2012-12-20 13:21:07 -0500389 }
390 if (ptr) {
391 n_unaligned = 3;
392 break;
393 }
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +0100394 n_unaligned = len & 3;
395 }
396
397 /* Deal with any bits left over at the end */
398 if (n_unaligned)
399 gfs2_unaligned_extlen(&rbm, n_unaligned, &len);
400out:
401 return size - len;
402}
403
404/**
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400405 * gfs2_bitcount - count the number of bits in a certain state
Bob Peterson886b1412012-04-11 13:03:52 -0400406 * @rgd: the resource group descriptor
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400407 * @buffer: the buffer that holds the bitmaps
408 * @buflen: the length (in bytes) of the buffer
409 * @state: the state of the block we're looking for
410 *
411 * Returns: The number of bits
412 */
413
Steven Whitehouse110acf32008-01-29 13:30:20 +0000414static u32 gfs2_bitcount(struct gfs2_rgrpd *rgd, const u8 *buffer,
415 unsigned int buflen, u8 state)
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400416{
Steven Whitehouse110acf32008-01-29 13:30:20 +0000417 const u8 *byte = buffer;
418 const u8 *end = buffer + buflen;
419 const u8 state1 = state << 2;
420 const u8 state2 = state << 4;
421 const u8 state3 = state << 6;
Steven Whitehousecd915492006-09-04 12:49:07 -0400422 u32 count = 0;
Steven Whitehouse88c8ab1f2006-05-18 13:52:39 -0400423
424 for (; byte < end; byte++) {
425 if (((*byte) & 0x03) == state)
426 count++;
427 if (((*byte) & 0x0C) == state1)
428 count++;
429 if (((*byte) & 0x30) == state2)
430 count++;
431 if (((*byte) & 0xC0) == state3)
432 count++;
433 }
434
435 return count;
436}
437
David Teiglandb3b94fa2006-01-16 16:50:04 +0000438/**
439 * gfs2_rgrp_verify - Verify that a resource group is consistent
David Teiglandb3b94fa2006-01-16 16:50:04 +0000440 * @rgd: the rgrp
441 *
442 */
443
444void gfs2_rgrp_verify(struct gfs2_rgrpd *rgd)
445{
446 struct gfs2_sbd *sdp = rgd->rd_sbd;
447 struct gfs2_bitmap *bi = NULL;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100448 u32 length = rgd->rd_length;
Steven Whitehousecd915492006-09-04 12:49:07 -0400449 u32 count[4], tmp;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000450 int buf, x;
451
Steven Whitehousecd915492006-09-04 12:49:07 -0400452 memset(count, 0, 4 * sizeof(u32));
David Teiglandb3b94fa2006-01-16 16:50:04 +0000453
454 /* Count # blocks in each of 4 possible allocation states */
455 for (buf = 0; buf < length; buf++) {
456 bi = rgd->rd_bits + buf;
457 for (x = 0; x < 4; x++)
458 count[x] += gfs2_bitcount(rgd,
459 bi->bi_bh->b_data +
460 bi->bi_offset,
461 bi->bi_len, x);
462 }
463
Steven Whitehousecfc8b542008-11-04 10:25:13 +0000464 if (count[0] != rgd->rd_free) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000465 if (gfs2_consist_rgrpd(rgd))
466 fs_err(sdp, "free data mismatch: %u != %u\n",
Steven Whitehousecfc8b542008-11-04 10:25:13 +0000467 count[0], rgd->rd_free);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000468 return;
469 }
470
Steven Whitehouse73f74942008-11-04 10:32:57 +0000471 tmp = rgd->rd_data - rgd->rd_free - rgd->rd_dinodes;
Benjamin Marzinski6b946172009-07-10 18:13:26 -0500472 if (count[1] != tmp) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000473 if (gfs2_consist_rgrpd(rgd))
474 fs_err(sdp, "used data mismatch: %u != %u\n",
475 count[1], tmp);
476 return;
477 }
478
Benjamin Marzinski6b946172009-07-10 18:13:26 -0500479 if (count[2] + count[3] != rgd->rd_dinodes) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000480 if (gfs2_consist_rgrpd(rgd))
481 fs_err(sdp, "used metadata mismatch: %u != %u\n",
Benjamin Marzinski6b946172009-07-10 18:13:26 -0500482 count[2] + count[3], rgd->rd_dinodes);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000483 return;
484 }
485}
486
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100487static inline int rgrp_contains_block(struct gfs2_rgrpd *rgd, u64 block)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000488{
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100489 u64 first = rgd->rd_data0;
490 u64 last = first + rgd->rd_data;
Steven Whitehouse16910422006-09-05 11:15:45 -0400491 return first <= block && block < last;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000492}
493
494/**
495 * gfs2_blk2rgrpd - Find resource group for a given data/meta block number
496 * @sdp: The GFS2 superblock
Bob Peterson886b1412012-04-11 13:03:52 -0400497 * @blk: The data block number
498 * @exact: True if this needs to be an exact match
David Teiglandb3b94fa2006-01-16 16:50:04 +0000499 *
500 * Returns: The resource group, or NULL if not found
501 */
502
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000503struct gfs2_rgrpd *gfs2_blk2rgrpd(struct gfs2_sbd *sdp, u64 blk, bool exact)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000504{
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000505 struct rb_node *n, *next;
Steven Whitehousef75bbfb2011-09-08 10:21:13 +0100506 struct gfs2_rgrpd *cur;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000507
508 spin_lock(&sdp->sd_rindex_spin);
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000509 n = sdp->sd_rindex_tree.rb_node;
510 while (n) {
511 cur = rb_entry(n, struct gfs2_rgrpd, rd_node);
512 next = NULL;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100513 if (blk < cur->rd_addr)
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000514 next = n->rb_left;
Steven Whitehousef75bbfb2011-09-08 10:21:13 +0100515 else if (blk >= cur->rd_data0 + cur->rd_data)
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000516 next = n->rb_right;
517 if (next == NULL) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000518 spin_unlock(&sdp->sd_rindex_spin);
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000519 if (exact) {
520 if (blk < cur->rd_addr)
521 return NULL;
522 if (blk >= cur->rd_data0 + cur->rd_data)
523 return NULL;
524 }
Bob Peterson7c9ca622011-08-31 09:53:19 +0100525 return cur;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000526 }
Steven Whitehouse66fc0612012-02-08 12:58:32 +0000527 n = next;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000528 }
David Teiglandb3b94fa2006-01-16 16:50:04 +0000529 spin_unlock(&sdp->sd_rindex_spin);
530
531 return NULL;
532}
533
534/**
535 * gfs2_rgrpd_get_first - get the first Resource Group in the filesystem
536 * @sdp: The GFS2 superblock
537 *
538 * Returns: The first rgrp in the filesystem
539 */
540
541struct gfs2_rgrpd *gfs2_rgrpd_get_first(struct gfs2_sbd *sdp)
542{
Bob Peterson7c9ca622011-08-31 09:53:19 +0100543 const struct rb_node *n;
544 struct gfs2_rgrpd *rgd;
545
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100546 spin_lock(&sdp->sd_rindex_spin);
Bob Peterson7c9ca622011-08-31 09:53:19 +0100547 n = rb_first(&sdp->sd_rindex_tree);
548 rgd = rb_entry(n, struct gfs2_rgrpd, rd_node);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100549 spin_unlock(&sdp->sd_rindex_spin);
Bob Peterson7c9ca622011-08-31 09:53:19 +0100550
551 return rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000552}
553
554/**
555 * gfs2_rgrpd_get_next - get the next RG
Bob Peterson886b1412012-04-11 13:03:52 -0400556 * @rgd: the resource group descriptor
David Teiglandb3b94fa2006-01-16 16:50:04 +0000557 *
558 * Returns: The next rgrp
559 */
560
561struct gfs2_rgrpd *gfs2_rgrpd_get_next(struct gfs2_rgrpd *rgd)
562{
Bob Peterson7c9ca622011-08-31 09:53:19 +0100563 struct gfs2_sbd *sdp = rgd->rd_sbd;
564 const struct rb_node *n;
565
566 spin_lock(&sdp->sd_rindex_spin);
567 n = rb_next(&rgd->rd_node);
568 if (n == NULL)
569 n = rb_first(&sdp->sd_rindex_tree);
570
571 if (unlikely(&rgd->rd_node == n)) {
572 spin_unlock(&sdp->sd_rindex_spin);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000573 return NULL;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100574 }
575 rgd = rb_entry(n, struct gfs2_rgrpd, rd_node);
576 spin_unlock(&sdp->sd_rindex_spin);
577 return rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000578}
579
Abhi Das00a158b2014-09-18 21:40:28 -0500580void check_and_update_goal(struct gfs2_inode *ip)
581{
582 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
583 if (!ip->i_goal || gfs2_blk2rgrpd(sdp, ip->i_goal, 1) == NULL)
584 ip->i_goal = ip->i_no_addr;
585}
586
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100587void gfs2_free_clones(struct gfs2_rgrpd *rgd)
588{
589 int x;
590
591 for (x = 0; x < rgd->rd_length; x++) {
592 struct gfs2_bitmap *bi = rgd->rd_bits + x;
593 kfree(bi->bi_clone);
594 bi->bi_clone = NULL;
595 }
596}
597
Bob Peterson0a305e42012-06-06 11:17:59 +0100598/**
599 * gfs2_rs_alloc - make sure we have a reservation assigned to the inode
600 * @ip: the inode for this reservation
601 */
602int gfs2_rs_alloc(struct gfs2_inode *ip)
603{
Abhijith Dasf1213ca2012-12-19 10:48:01 -0500604 int error = 0;
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100605
Bob Peterson0a305e42012-06-06 11:17:59 +0100606 down_write(&ip->i_rw_mutex);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400607 if (ip->i_res)
Abhijith Dasf1213ca2012-12-19 10:48:01 -0500608 goto out;
609
610 ip->i_res = kmem_cache_zalloc(gfs2_rsrv_cachep, GFP_NOFS);
611 if (!ip->i_res) {
612 error = -ENOMEM;
613 goto out;
614 }
615
616 RB_CLEAR_NODE(&ip->i_res->rs_node);
617out:
Bob Peterson0a305e42012-06-06 11:17:59 +0100618 up_write(&ip->i_rw_mutex);
Wei Yongjun441362d2013-03-11 23:01:37 +0800619 return error;
Bob Peterson0a305e42012-06-06 11:17:59 +0100620}
621
Steven Whitehouse9e733d32012-08-23 15:37:59 +0100622static void dump_rs(struct seq_file *seq, const struct gfs2_blkreserv *rs)
Bob Peterson8e2e0042012-07-19 08:12:40 -0400623{
Steven Whitehouse9e733d32012-08-23 15:37:59 +0100624 gfs2_print_dbg(seq, " B: n:%llu s:%llu b:%u f:%u\n",
625 (unsigned long long)rs->rs_inum,
626 (unsigned long long)gfs2_rbm_to_block(&rs->rs_rbm),
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100627 rs->rs_rbm.offset, rs->rs_free);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400628}
629
Bob Peterson0a305e42012-06-06 11:17:59 +0100630/**
Bob Peterson8e2e0042012-07-19 08:12:40 -0400631 * __rs_deltree - remove a multi-block reservation from the rgd tree
632 * @rs: The reservation to remove
633 *
634 */
Bob Peterson20095212013-03-13 10:26:38 -0400635static void __rs_deltree(struct gfs2_blkreserv *rs)
Bob Peterson8e2e0042012-07-19 08:12:40 -0400636{
637 struct gfs2_rgrpd *rgd;
638
639 if (!gfs2_rs_active(rs))
640 return;
641
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100642 rgd = rs->rs_rbm.rgd;
Steven Whitehouse9e733d32012-08-23 15:37:59 +0100643 trace_gfs2_rs(rs, TRACE_RS_TREEDEL);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100644 rb_erase(&rs->rs_node, &rgd->rd_rstree);
Michel Lespinasse24d634e2012-08-05 22:04:08 -0700645 RB_CLEAR_NODE(&rs->rs_node);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400646
647 if (rs->rs_free) {
Bob Petersone579ed42013-09-17 13:12:15 -0400648 struct gfs2_bitmap *bi = rbm_bi(&rs->rs_rbm);
649
Bob Peterson20095212013-03-13 10:26:38 -0400650 /* return reserved blocks to the rgrp */
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100651 BUG_ON(rs->rs_rbm.rgd->rd_reserved < rs->rs_free);
652 rs->rs_rbm.rgd->rd_reserved -= rs->rs_free;
Bob Peterson5ea50502013-11-25 11:16:25 +0000653 /* The rgrp extent failure point is likely not to increase;
654 it will only do so if the freed blocks are somehow
655 contiguous with a span of free blocks that follows. Still,
656 it will force the number to be recalculated later. */
657 rgd->rd_extfail_pt += rs->rs_free;
Bob Peterson8e2e0042012-07-19 08:12:40 -0400658 rs->rs_free = 0;
Bob Petersone579ed42013-09-17 13:12:15 -0400659 clear_bit(GBF_FULL, &bi->bi_flags);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400660 }
Bob Peterson8e2e0042012-07-19 08:12:40 -0400661}
662
663/**
664 * gfs2_rs_deltree - remove a multi-block reservation from the rgd tree
665 * @rs: The reservation to remove
666 *
667 */
Bob Peterson20095212013-03-13 10:26:38 -0400668void gfs2_rs_deltree(struct gfs2_blkreserv *rs)
Bob Peterson8e2e0042012-07-19 08:12:40 -0400669{
670 struct gfs2_rgrpd *rgd;
671
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100672 rgd = rs->rs_rbm.rgd;
673 if (rgd) {
674 spin_lock(&rgd->rd_rsspin);
Bob Peterson20095212013-03-13 10:26:38 -0400675 __rs_deltree(rs);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +0100676 spin_unlock(&rgd->rd_rsspin);
677 }
Bob Peterson8e2e0042012-07-19 08:12:40 -0400678}
679
680/**
681 * gfs2_rs_delete - delete a multi-block reservation
Bob Peterson0a305e42012-06-06 11:17:59 +0100682 * @ip: The inode for this reservation
Steven Whitehouseaf5c2692013-09-27 12:49:33 +0100683 * @wcount: The inode's write count, or NULL
Bob Peterson0a305e42012-06-06 11:17:59 +0100684 *
685 */
Steven Whitehouseaf5c2692013-09-27 12:49:33 +0100686void gfs2_rs_delete(struct gfs2_inode *ip, atomic_t *wcount)
Bob Peterson0a305e42012-06-06 11:17:59 +0100687{
688 down_write(&ip->i_rw_mutex);
Steven Whitehouseaf5c2692013-09-27 12:49:33 +0100689 if (ip->i_res && ((wcount == NULL) || (atomic_read(wcount) <= 1))) {
Bob Peterson20095212013-03-13 10:26:38 -0400690 gfs2_rs_deltree(ip->i_res);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400691 BUG_ON(ip->i_res->rs_free);
Bob Peterson0a305e42012-06-06 11:17:59 +0100692 kmem_cache_free(gfs2_rsrv_cachep, ip->i_res);
693 ip->i_res = NULL;
694 }
695 up_write(&ip->i_rw_mutex);
696}
697
Bob Peterson8e2e0042012-07-19 08:12:40 -0400698/**
699 * return_all_reservations - return all reserved blocks back to the rgrp.
700 * @rgd: the rgrp that needs its space back
701 *
702 * We previously reserved a bunch of blocks for allocation. Now we need to
703 * give them back. This leave the reservation structures in tact, but removes
704 * all of their corresponding "no-fly zones".
705 */
706static void return_all_reservations(struct gfs2_rgrpd *rgd)
707{
708 struct rb_node *n;
709 struct gfs2_blkreserv *rs;
710
711 spin_lock(&rgd->rd_rsspin);
712 while ((n = rb_first(&rgd->rd_rstree))) {
713 rs = rb_entry(n, struct gfs2_blkreserv, rs_node);
Bob Peterson20095212013-03-13 10:26:38 -0400714 __rs_deltree(rs);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400715 }
716 spin_unlock(&rgd->rd_rsspin);
717}
718
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100719void gfs2_clear_rgrpd(struct gfs2_sbd *sdp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000720{
Bob Peterson7c9ca622011-08-31 09:53:19 +0100721 struct rb_node *n;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000722 struct gfs2_rgrpd *rgd;
723 struct gfs2_glock *gl;
724
Bob Peterson7c9ca622011-08-31 09:53:19 +0100725 while ((n = rb_first(&sdp->sd_rindex_tree))) {
726 rgd = rb_entry(n, struct gfs2_rgrpd, rd_node);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000727 gl = rgd->rd_gl;
728
Bob Peterson7c9ca622011-08-31 09:53:19 +0100729 rb_erase(n, &sdp->sd_rindex_tree);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000730
731 if (gl) {
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100732 spin_lock(&gl->gl_spin);
Steven Whitehouse5c676f62006-02-27 17:23:27 -0500733 gl->gl_object = NULL;
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100734 spin_unlock(&gl->gl_spin);
Steven Whitehouse29687a22011-03-30 16:33:25 +0100735 gfs2_glock_add_to_lru(gl);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000736 gfs2_glock_put(gl);
737 }
738
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100739 gfs2_free_clones(rgd);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000740 kfree(rgd->rd_bits);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400741 return_all_reservations(rgd);
Bob Peterson6bdd9be2008-01-28 17:20:26 -0600742 kmem_cache_free(gfs2_rgrpd_cachep, rgd);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000743 }
744}
745
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100746static void gfs2_rindex_print(const struct gfs2_rgrpd *rgd)
747{
Joe Perchesd77d1b52014-03-06 12:10:45 -0800748 pr_info("ri_addr = %llu\n", (unsigned long long)rgd->rd_addr);
749 pr_info("ri_length = %u\n", rgd->rd_length);
750 pr_info("ri_data0 = %llu\n", (unsigned long long)rgd->rd_data0);
751 pr_info("ri_data = %u\n", rgd->rd_data);
752 pr_info("ri_bitbytes = %u\n", rgd->rd_bitbytes);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100753}
754
David Teiglandb3b94fa2006-01-16 16:50:04 +0000755/**
756 * gfs2_compute_bitstructs - Compute the bitmap sizes
757 * @rgd: The resource group descriptor
758 *
759 * Calculates bitmap descriptors, one for each block that contains bitmap data
760 *
761 * Returns: errno
762 */
763
764static int compute_bitstructs(struct gfs2_rgrpd *rgd)
765{
766 struct gfs2_sbd *sdp = rgd->rd_sbd;
767 struct gfs2_bitmap *bi;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100768 u32 length = rgd->rd_length; /* # blocks in hdr & bitmap */
Steven Whitehousecd915492006-09-04 12:49:07 -0400769 u32 bytes_left, bytes;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000770 int x;
771
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -0400772 if (!length)
773 return -EINVAL;
774
Steven Whitehousedd894be2006-07-27 14:29:00 -0400775 rgd->rd_bits = kcalloc(length, sizeof(struct gfs2_bitmap), GFP_NOFS);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000776 if (!rgd->rd_bits)
777 return -ENOMEM;
778
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100779 bytes_left = rgd->rd_bitbytes;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000780
781 for (x = 0; x < length; x++) {
782 bi = rgd->rd_bits + x;
783
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +0100784 bi->bi_flags = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000785 /* small rgrp; bitmap stored completely in header block */
786 if (length == 1) {
787 bytes = bytes_left;
788 bi->bi_offset = sizeof(struct gfs2_rgrp);
789 bi->bi_start = 0;
790 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500791 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000792 /* header block */
793 } else if (x == 0) {
794 bytes = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_rgrp);
795 bi->bi_offset = sizeof(struct gfs2_rgrp);
796 bi->bi_start = 0;
797 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500798 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000799 /* last block */
800 } else if (x + 1 == length) {
801 bytes = bytes_left;
802 bi->bi_offset = sizeof(struct gfs2_meta_header);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100803 bi->bi_start = rgd->rd_bitbytes - bytes_left;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000804 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500805 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000806 /* other blocks */
807 } else {
Steven Whitehouse568f4c92006-02-27 12:00:42 -0500808 bytes = sdp->sd_sb.sb_bsize -
809 sizeof(struct gfs2_meta_header);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000810 bi->bi_offset = sizeof(struct gfs2_meta_header);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100811 bi->bi_start = rgd->rd_bitbytes - bytes_left;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000812 bi->bi_len = bytes;
Bob Peterson7e230f52013-09-11 13:44:02 -0500813 bi->bi_blocks = bytes * GFS2_NBBY;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000814 }
815
816 bytes_left -= bytes;
817 }
818
819 if (bytes_left) {
820 gfs2_consist_rgrpd(rgd);
821 return -EIO;
822 }
823 bi = rgd->rd_bits + (length - 1);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100824 if ((bi->bi_start + bi->bi_len) * GFS2_NBBY != rgd->rd_data) {
David Teiglandb3b94fa2006-01-16 16:50:04 +0000825 if (gfs2_consist_rgrpd(rgd)) {
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100826 gfs2_rindex_print(rgd);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000827 fs_err(sdp, "start=%u len=%u offset=%u\n",
828 bi->bi_start, bi->bi_len, bi->bi_offset);
829 }
830 return -EIO;
831 }
832
833 return 0;
834}
835
836/**
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500837 * gfs2_ri_total - Total up the file system space, according to the rindex.
Bob Peterson886b1412012-04-11 13:03:52 -0400838 * @sdp: the filesystem
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500839 *
840 */
841u64 gfs2_ri_total(struct gfs2_sbd *sdp)
842{
843 u64 total_data = 0;
844 struct inode *inode = sdp->sd_rindex;
845 struct gfs2_inode *ip = GFS2_I(inode);
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500846 char buf[sizeof(struct gfs2_rindex)];
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500847 int error, rgrps;
848
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500849 for (rgrps = 0;; rgrps++) {
850 loff_t pos = rgrps * sizeof(struct gfs2_rindex);
851
Bob Petersonbcd72782010-12-07 13:58:56 -0500852 if (pos + sizeof(struct gfs2_rindex) > i_size_read(inode))
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500853 break;
Andrew Price43066292012-04-16 16:40:55 +0100854 error = gfs2_internal_read(ip, buf, &pos,
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500855 sizeof(struct gfs2_rindex));
856 if (error != sizeof(struct gfs2_rindex))
857 break;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100858 total_data += be32_to_cpu(((struct gfs2_rindex *)buf)->ri_data);
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500859 }
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500860 return total_data;
861}
862
Bob Peterson6aad1c32012-03-05 09:20:59 -0500863static int rgd_insert(struct gfs2_rgrpd *rgd)
Bob Peterson7c9ca622011-08-31 09:53:19 +0100864{
865 struct gfs2_sbd *sdp = rgd->rd_sbd;
866 struct rb_node **newn = &sdp->sd_rindex_tree.rb_node, *parent = NULL;
867
868 /* Figure out where to put new node */
869 while (*newn) {
870 struct gfs2_rgrpd *cur = rb_entry(*newn, struct gfs2_rgrpd,
871 rd_node);
872
873 parent = *newn;
874 if (rgd->rd_addr < cur->rd_addr)
875 newn = &((*newn)->rb_left);
876 else if (rgd->rd_addr > cur->rd_addr)
877 newn = &((*newn)->rb_right);
878 else
Bob Peterson6aad1c32012-03-05 09:20:59 -0500879 return -EEXIST;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100880 }
881
882 rb_link_node(&rgd->rd_node, parent, newn);
883 rb_insert_color(&rgd->rd_node, &sdp->sd_rindex_tree);
Bob Peterson6aad1c32012-03-05 09:20:59 -0500884 sdp->sd_rgrps++;
885 return 0;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100886}
887
Robert Peterson7ae8fa82007-05-09 09:37:57 -0500888/**
Robert Peterson6c532672007-05-10 16:54:38 -0500889 * read_rindex_entry - Pull in a new resource index entry from the disk
Andrew Price43066292012-04-16 16:40:55 +0100890 * @ip: Pointer to the rindex inode
David Teiglandb3b94fa2006-01-16 16:50:04 +0000891 *
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100892 * Returns: 0 on success, > 0 on EOF, error code otherwise
Robert Peterson6c532672007-05-10 16:54:38 -0500893 */
894
Andrew Price43066292012-04-16 16:40:55 +0100895static int read_rindex_entry(struct gfs2_inode *ip)
Robert Peterson6c532672007-05-10 16:54:38 -0500896{
897 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Steven Whitehouse7005c3e2013-12-06 10:16:14 +0000898 const unsigned bsize = sdp->sd_sb.sb_bsize;
Robert Peterson6c532672007-05-10 16:54:38 -0500899 loff_t pos = sdp->sd_rgrps * sizeof(struct gfs2_rindex);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100900 struct gfs2_rindex buf;
Robert Peterson6c532672007-05-10 16:54:38 -0500901 int error;
902 struct gfs2_rgrpd *rgd;
903
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100904 if (pos >= i_size_read(&ip->i_inode))
905 return 1;
906
Andrew Price43066292012-04-16 16:40:55 +0100907 error = gfs2_internal_read(ip, (char *)&buf, &pos,
Robert Peterson6c532672007-05-10 16:54:38 -0500908 sizeof(struct gfs2_rindex));
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100909
910 if (error != sizeof(struct gfs2_rindex))
911 return (error == 0) ? 1 : error;
Robert Peterson6c532672007-05-10 16:54:38 -0500912
Bob Peterson6bdd9be2008-01-28 17:20:26 -0600913 rgd = kmem_cache_zalloc(gfs2_rgrpd_cachep, GFP_NOFS);
Robert Peterson6c532672007-05-10 16:54:38 -0500914 error = -ENOMEM;
915 if (!rgd)
916 return error;
917
Robert Peterson6c532672007-05-10 16:54:38 -0500918 rgd->rd_sbd = sdp;
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100919 rgd->rd_addr = be64_to_cpu(buf.ri_addr);
920 rgd->rd_length = be32_to_cpu(buf.ri_length);
921 rgd->rd_data0 = be64_to_cpu(buf.ri_data0);
922 rgd->rd_data = be32_to_cpu(buf.ri_data);
923 rgd->rd_bitbytes = be32_to_cpu(buf.ri_bitbytes);
Bob Peterson8e2e0042012-07-19 08:12:40 -0400924 spin_lock_init(&rgd->rd_rsspin);
Bob Peterson7c9ca622011-08-31 09:53:19 +0100925
Robert Peterson6c532672007-05-10 16:54:38 -0500926 error = compute_bitstructs(rgd);
927 if (error)
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100928 goto fail;
Robert Peterson6c532672007-05-10 16:54:38 -0500929
Steven Whitehousebb8d8a62007-06-01 14:11:58 +0100930 error = gfs2_glock_get(sdp, rgd->rd_addr,
Robert Peterson6c532672007-05-10 16:54:38 -0500931 &gfs2_rgrp_glops, CREATE, &rgd->rd_gl);
932 if (error)
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100933 goto fail;
Robert Peterson6c532672007-05-10 16:54:38 -0500934
935 rgd->rd_gl->gl_object = rgd;
Steven Whitehouse7005c3e2013-12-06 10:16:14 +0000936 rgd->rd_gl->gl_vm.start = rgd->rd_addr * bsize;
937 rgd->rd_gl->gl_vm.end = rgd->rd_gl->gl_vm.start + (rgd->rd_length * bsize) - 1;
David Teigland4e2f8842012-11-14 13:47:37 -0500938 rgd->rd_rgl = (struct gfs2_rgrp_lvb *)rgd->rd_gl->gl_lksb.sb_lvbptr;
Bob Petersoncf45b752008-01-31 10:31:39 -0600939 rgd->rd_flags &= ~GFS2_RDF_UPTODATE;
Bob Peterson7c9ca622011-08-31 09:53:19 +0100940 if (rgd->rd_data > sdp->sd_max_rg_data)
941 sdp->sd_max_rg_data = rgd->rd_data;
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100942 spin_lock(&sdp->sd_rindex_spin);
Bob Peterson6aad1c32012-03-05 09:20:59 -0500943 error = rgd_insert(rgd);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100944 spin_unlock(&sdp->sd_rindex_spin);
Bob Peterson6aad1c32012-03-05 09:20:59 -0500945 if (!error)
946 return 0;
947
948 error = 0; /* someone else read in the rgrp; free it and ignore it */
Bob Petersonc1ac5392012-03-22 08:58:30 -0400949 gfs2_glock_put(rgd->rd_gl);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100950
951fail:
952 kfree(rgd->rd_bits);
953 kmem_cache_free(gfs2_rgrpd_cachep, rgd);
Robert Peterson6c532672007-05-10 16:54:38 -0500954 return error;
955}
956
957/**
958 * gfs2_ri_update - Pull in a new resource index from the disk
959 * @ip: pointer to the rindex inode
960 *
David Teiglandb3b94fa2006-01-16 16:50:04 +0000961 * Returns: 0 on successful update, error code otherwise
962 */
963
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100964static int gfs2_ri_update(struct gfs2_inode *ip)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000965{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -0400966 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +0000967 int error;
968
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100969 do {
Andrew Price43066292012-04-16 16:40:55 +0100970 error = read_rindex_entry(ip);
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100971 } while (error == 0);
972
973 if (error < 0)
974 return error;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000975
Bob Petersoncf45b752008-01-31 10:31:39 -0600976 sdp->sd_rindex_uptodate = 1;
David Teiglandb3b94fa2006-01-16 16:50:04 +0000977 return 0;
Robert Peterson6c532672007-05-10 16:54:38 -0500978}
David Teiglandb3b94fa2006-01-16 16:50:04 +0000979
Robert Peterson6c532672007-05-10 16:54:38 -0500980/**
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100981 * gfs2_rindex_update - Update the rindex if required
David Teiglandb3b94fa2006-01-16 16:50:04 +0000982 * @sdp: The GFS2 superblock
David Teiglandb3b94fa2006-01-16 16:50:04 +0000983 *
984 * We grab a lock on the rindex inode to make sure that it doesn't
985 * change whilst we are performing an operation. We keep this lock
986 * for quite long periods of time compared to other locks. This
987 * doesn't matter, since it is shared and it is very, very rarely
988 * accessed in the exclusive mode (i.e. only when expanding the filesystem).
989 *
990 * This makes sure that we're using the latest copy of the resource index
991 * special file, which might have been updated if someone expanded the
992 * filesystem (via gfs2_grow utility), which adds new resource groups.
993 *
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100994 * Returns: 0 on succeess, error code otherwise
David Teiglandb3b94fa2006-01-16 16:50:04 +0000995 */
996
Steven Whitehouse8339ee52011-08-31 16:38:29 +0100997int gfs2_rindex_update(struct gfs2_sbd *sdp)
David Teiglandb3b94fa2006-01-16 16:50:04 +0000998{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -0400999 struct gfs2_inode *ip = GFS2_I(sdp->sd_rindex);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001000 struct gfs2_glock *gl = ip->i_gl;
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001001 struct gfs2_holder ri_gh;
1002 int error = 0;
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001003 int unlock_required = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001004
1005 /* Read new copy from disk if we don't have the latest */
Bob Petersoncf45b752008-01-31 10:31:39 -06001006 if (!sdp->sd_rindex_uptodate) {
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001007 if (!gfs2_glock_is_locked_by_me(gl)) {
1008 error = gfs2_glock_nq_init(gl, LM_ST_SHARED, 0, &ri_gh);
1009 if (error)
Bob Peterson6aad1c32012-03-05 09:20:59 -05001010 return error;
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001011 unlock_required = 1;
1012 }
Steven Whitehouse8339ee52011-08-31 16:38:29 +01001013 if (!sdp->sd_rindex_uptodate)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001014 error = gfs2_ri_update(ip);
Steven Whitehousea365fbf2012-02-24 15:09:14 +00001015 if (unlock_required)
1016 gfs2_glock_dq_uninit(&ri_gh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001017 }
1018
1019 return error;
1020}
1021
Bob Peterson42d52e32008-01-28 18:38:07 -06001022static void gfs2_rgrp_in(struct gfs2_rgrpd *rgd, const void *buf)
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001023{
1024 const struct gfs2_rgrp *str = buf;
Bob Peterson42d52e32008-01-28 18:38:07 -06001025 u32 rg_flags;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001026
Bob Peterson42d52e32008-01-28 18:38:07 -06001027 rg_flags = be32_to_cpu(str->rg_flags);
Steven Whitehouse09010972009-05-20 10:48:47 +01001028 rg_flags &= ~GFS2_RDF_MASK;
Steven Whitehouse1ce97e52009-05-21 15:18:19 +01001029 rgd->rd_flags &= GFS2_RDF_MASK;
1030 rgd->rd_flags |= rg_flags;
Steven Whitehousecfc8b542008-11-04 10:25:13 +00001031 rgd->rd_free = be32_to_cpu(str->rg_free);
Steven Whitehouse73f74942008-11-04 10:32:57 +00001032 rgd->rd_dinodes = be32_to_cpu(str->rg_dinodes);
Steven Whitehoused8b71f72008-11-04 10:19:03 +00001033 rgd->rd_igeneration = be64_to_cpu(str->rg_igeneration);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001034}
1035
Bob Peterson42d52e32008-01-28 18:38:07 -06001036static void gfs2_rgrp_out(struct gfs2_rgrpd *rgd, void *buf)
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001037{
1038 struct gfs2_rgrp *str = buf;
1039
Steven Whitehouse09010972009-05-20 10:48:47 +01001040 str->rg_flags = cpu_to_be32(rgd->rd_flags & ~GFS2_RDF_MASK);
Steven Whitehousecfc8b542008-11-04 10:25:13 +00001041 str->rg_free = cpu_to_be32(rgd->rd_free);
Steven Whitehouse73f74942008-11-04 10:32:57 +00001042 str->rg_dinodes = cpu_to_be32(rgd->rd_dinodes);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001043 str->__pad = cpu_to_be32(0);
Steven Whitehoused8b71f72008-11-04 10:19:03 +00001044 str->rg_igeneration = cpu_to_be64(rgd->rd_igeneration);
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001045 memset(&str->rg_reserved, 0, sizeof(str->rg_reserved));
1046}
1047
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001048static int gfs2_rgrp_lvb_valid(struct gfs2_rgrpd *rgd)
1049{
1050 struct gfs2_rgrp_lvb *rgl = rgd->rd_rgl;
1051 struct gfs2_rgrp *str = (struct gfs2_rgrp *)rgd->rd_bits[0].bi_bh->b_data;
1052
1053 if (rgl->rl_flags != str->rg_flags || rgl->rl_free != str->rg_free ||
1054 rgl->rl_dinodes != str->rg_dinodes ||
1055 rgl->rl_igeneration != str->rg_igeneration)
1056 return 0;
1057 return 1;
1058}
1059
1060static void gfs2_rgrp_ondisk2lvb(struct gfs2_rgrp_lvb *rgl, const void *buf)
1061{
1062 const struct gfs2_rgrp *str = buf;
1063
1064 rgl->rl_magic = cpu_to_be32(GFS2_MAGIC);
1065 rgl->rl_flags = str->rg_flags;
1066 rgl->rl_free = str->rg_free;
1067 rgl->rl_dinodes = str->rg_dinodes;
1068 rgl->rl_igeneration = str->rg_igeneration;
1069 rgl->__pad = 0UL;
1070}
1071
1072static void update_rgrp_lvb_unlinked(struct gfs2_rgrpd *rgd, u32 change)
1073{
1074 struct gfs2_rgrp_lvb *rgl = rgd->rd_rgl;
1075 u32 unlinked = be32_to_cpu(rgl->rl_unlinked) + change;
1076 rgl->rl_unlinked = cpu_to_be32(unlinked);
1077}
1078
1079static u32 count_unlinked(struct gfs2_rgrpd *rgd)
1080{
1081 struct gfs2_bitmap *bi;
1082 const u32 length = rgd->rd_length;
1083 const u8 *buffer = NULL;
1084 u32 i, goal, count = 0;
1085
1086 for (i = 0, bi = rgd->rd_bits; i < length; i++, bi++) {
1087 goal = 0;
1088 buffer = bi->bi_bh->b_data + bi->bi_offset;
1089 WARN_ON(!buffer_uptodate(bi->bi_bh));
1090 while (goal < bi->bi_len * GFS2_NBBY) {
1091 goal = gfs2_bitfit(buffer, bi->bi_len, goal,
1092 GFS2_BLKST_UNLINKED);
1093 if (goal == BFITNOENT)
1094 break;
1095 count++;
1096 goal++;
1097 }
1098 }
1099
1100 return count;
1101}
1102
1103
David Teiglandb3b94fa2006-01-16 16:50:04 +00001104/**
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001105 * gfs2_rgrp_bh_get - Read in a RG's header and bitmaps
1106 * @rgd: the struct gfs2_rgrpd describing the RG to read in
David Teiglandb3b94fa2006-01-16 16:50:04 +00001107 *
1108 * Read in all of a Resource Group's header and bitmap blocks.
1109 * Caller must eventually call gfs2_rgrp_relse() to free the bitmaps.
1110 *
1111 * Returns: errno
1112 */
1113
Rashika Kheriac2b0b302014-02-09 18:40:19 +05301114static int gfs2_rgrp_bh_get(struct gfs2_rgrpd *rgd)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001115{
1116 struct gfs2_sbd *sdp = rgd->rd_sbd;
1117 struct gfs2_glock *gl = rgd->rd_gl;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001118 unsigned int length = rgd->rd_length;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001119 struct gfs2_bitmap *bi;
1120 unsigned int x, y;
1121 int error;
1122
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001123 if (rgd->rd_bits[0].bi_bh != NULL)
1124 return 0;
1125
David Teiglandb3b94fa2006-01-16 16:50:04 +00001126 for (x = 0; x < length; x++) {
1127 bi = rgd->rd_bits + x;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001128 error = gfs2_meta_read(gl, rgd->rd_addr + x, 0, &bi->bi_bh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001129 if (error)
1130 goto fail;
1131 }
1132
1133 for (y = length; y--;) {
1134 bi = rgd->rd_bits + y;
Steven Whitehouse7276b3b2006-09-21 17:05:23 -04001135 error = gfs2_meta_wait(sdp, bi->bi_bh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00001136 if (error)
1137 goto fail;
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001138 if (gfs2_metatype_check(sdp, bi->bi_bh, y ? GFS2_METATYPE_RB :
David Teiglandb3b94fa2006-01-16 16:50:04 +00001139 GFS2_METATYPE_RG)) {
1140 error = -EIO;
1141 goto fail;
1142 }
1143 }
1144
Bob Petersoncf45b752008-01-31 10:31:39 -06001145 if (!(rgd->rd_flags & GFS2_RDF_UPTODATE)) {
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01001146 for (x = 0; x < length; x++)
1147 clear_bit(GBF_FULL, &rgd->rd_bits[x].bi_flags);
Bob Peterson42d52e32008-01-28 18:38:07 -06001148 gfs2_rgrp_in(rgd, (rgd->rd_bits[0].bi_bh)->b_data);
Steven Whitehouse1ce97e52009-05-21 15:18:19 +01001149 rgd->rd_flags |= (GFS2_RDF_UPTODATE | GFS2_RDF_CHECK);
Bob Peterson7c9ca622011-08-31 09:53:19 +01001150 rgd->rd_free_clone = rgd->rd_free;
Bob Peterson5ea50502013-11-25 11:16:25 +00001151 /* max out the rgrp allocation failure point */
1152 rgd->rd_extfail_pt = rgd->rd_free;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001153 }
Al Viro951b4bd2013-06-02 19:53:40 -04001154 if (cpu_to_be32(GFS2_MAGIC) != rgd->rd_rgl->rl_magic) {
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001155 rgd->rd_rgl->rl_unlinked = cpu_to_be32(count_unlinked(rgd));
1156 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl,
1157 rgd->rd_bits[0].bi_bh->b_data);
1158 }
1159 else if (sdp->sd_args.ar_rgrplvb) {
1160 if (!gfs2_rgrp_lvb_valid(rgd)){
1161 gfs2_consist_rgrpd(rgd);
1162 error = -EIO;
1163 goto fail;
1164 }
1165 if (rgd->rd_rgl->rl_unlinked == 0)
1166 rgd->rd_flags &= ~GFS2_RDF_CHECK;
1167 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001168 return 0;
1169
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001170fail:
David Teiglandb3b94fa2006-01-16 16:50:04 +00001171 while (x--) {
1172 bi = rgd->rd_bits + x;
1173 brelse(bi->bi_bh);
1174 bi->bi_bh = NULL;
1175 gfs2_assert_warn(sdp, !bi->bi_clone);
1176 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001177
1178 return error;
1179}
1180
Rashika Kheriac2b0b302014-02-09 18:40:19 +05301181static int update_rgrp_lvb(struct gfs2_rgrpd *rgd)
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001182{
1183 u32 rl_flags;
1184
1185 if (rgd->rd_flags & GFS2_RDF_UPTODATE)
1186 return 0;
1187
Al Viro951b4bd2013-06-02 19:53:40 -04001188 if (cpu_to_be32(GFS2_MAGIC) != rgd->rd_rgl->rl_magic)
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001189 return gfs2_rgrp_bh_get(rgd);
1190
1191 rl_flags = be32_to_cpu(rgd->rd_rgl->rl_flags);
1192 rl_flags &= ~GFS2_RDF_MASK;
1193 rgd->rd_flags &= GFS2_RDF_MASK;
1194 rgd->rd_flags |= (rl_flags | GFS2_RDF_UPTODATE | GFS2_RDF_CHECK);
1195 if (rgd->rd_rgl->rl_unlinked == 0)
1196 rgd->rd_flags &= ~GFS2_RDF_CHECK;
1197 rgd->rd_free = be32_to_cpu(rgd->rd_rgl->rl_free);
1198 rgd->rd_free_clone = rgd->rd_free;
1199 rgd->rd_dinodes = be32_to_cpu(rgd->rd_rgl->rl_dinodes);
1200 rgd->rd_igeneration = be64_to_cpu(rgd->rd_rgl->rl_igeneration);
1201 return 0;
1202}
1203
1204int gfs2_rgrp_go_lock(struct gfs2_holder *gh)
1205{
1206 struct gfs2_rgrpd *rgd = gh->gh_gl->gl_object;
1207 struct gfs2_sbd *sdp = rgd->rd_sbd;
1208
1209 if (gh->gh_flags & GL_SKIP && sdp->sd_args.ar_rgrplvb)
1210 return 0;
Bob Peterson8b127d02014-01-16 08:52:16 -05001211 return gfs2_rgrp_bh_get(rgd);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001212}
1213
David Teiglandb3b94fa2006-01-16 16:50:04 +00001214/**
Bob Peterson7c9ca622011-08-31 09:53:19 +01001215 * gfs2_rgrp_go_unlock - Release RG bitmaps read in with gfs2_rgrp_bh_get()
Bob Peterson886b1412012-04-11 13:03:52 -04001216 * @gh: The glock holder for the resource group
David Teiglandb3b94fa2006-01-16 16:50:04 +00001217 *
1218 */
1219
Bob Peterson7c9ca622011-08-31 09:53:19 +01001220void gfs2_rgrp_go_unlock(struct gfs2_holder *gh)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001221{
Bob Peterson7c9ca622011-08-31 09:53:19 +01001222 struct gfs2_rgrpd *rgd = gh->gh_gl->gl_object;
Steven Whitehousebb8d8a62007-06-01 14:11:58 +01001223 int x, length = rgd->rd_length;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001224
David Teiglandb3b94fa2006-01-16 16:50:04 +00001225 for (x = 0; x < length; x++) {
1226 struct gfs2_bitmap *bi = rgd->rd_bits + x;
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001227 if (bi->bi_bh) {
1228 brelse(bi->bi_bh);
1229 bi->bi_bh = NULL;
1230 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001231 }
1232
David Teiglandb3b94fa2006-01-16 16:50:04 +00001233}
1234
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001235int gfs2_rgrp_send_discards(struct gfs2_sbd *sdp, u64 offset,
Bob Peterson7c9ca622011-08-31 09:53:19 +01001236 struct buffer_head *bh,
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001237 const struct gfs2_bitmap *bi, unsigned minlen, u64 *ptrimmed)
Steven Whitehousef15ab562009-02-09 09:25:01 +00001238{
1239 struct super_block *sb = sdp->sd_vfs;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001240 u64 blk;
Steven Whitehouse64d576b2009-02-12 13:31:58 +00001241 sector_t start = 0;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001242 sector_t nr_blks = 0;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001243 int rv;
1244 unsigned int x;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001245 u32 trimmed = 0;
1246 u8 diff;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001247
1248 for (x = 0; x < bi->bi_len; x++) {
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001249 const u8 *clone = bi->bi_clone ? bi->bi_clone : bi->bi_bh->b_data;
1250 clone += bi->bi_offset;
1251 clone += x;
1252 if (bh) {
1253 const u8 *orig = bh->b_data + bi->bi_offset + x;
1254 diff = ~(*orig | (*orig >> 1)) & (*clone | (*clone >> 1));
1255 } else {
1256 diff = ~(*clone | (*clone >> 1));
1257 }
Steven Whitehousef15ab562009-02-09 09:25:01 +00001258 diff &= 0x55;
1259 if (diff == 0)
1260 continue;
1261 blk = offset + ((bi->bi_start + x) * GFS2_NBBY);
Steven Whitehousef15ab562009-02-09 09:25:01 +00001262 while(diff) {
1263 if (diff & 1) {
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001264 if (nr_blks == 0)
Steven Whitehousef15ab562009-02-09 09:25:01 +00001265 goto start_new_extent;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001266 if ((start + nr_blks) != blk) {
1267 if (nr_blks >= minlen) {
1268 rv = sb_issue_discard(sb,
1269 start, nr_blks,
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001270 GFP_NOFS, 0);
1271 if (rv)
1272 goto fail;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001273 trimmed += nr_blks;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001274 }
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001275 nr_blks = 0;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001276start_new_extent:
1277 start = blk;
1278 }
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001279 nr_blks++;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001280 }
1281 diff >>= 2;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001282 blk++;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001283 }
1284 }
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001285 if (nr_blks >= minlen) {
1286 rv = sb_issue_discard(sb, start, nr_blks, GFP_NOFS, 0);
Steven Whitehousef15ab562009-02-09 09:25:01 +00001287 if (rv)
1288 goto fail;
Bob Petersonb2c87ca2013-03-22 10:07:24 -04001289 trimmed += nr_blks;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001290 }
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001291 if (ptrimmed)
1292 *ptrimmed = trimmed;
1293 return 0;
1294
Steven Whitehousef15ab562009-02-09 09:25:01 +00001295fail:
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001296 if (sdp->sd_args.ar_discard)
1297 fs_warn(sdp, "error %d on discard request, turning discards off for this filesystem", rv);
Steven Whitehousef15ab562009-02-09 09:25:01 +00001298 sdp->sd_args.ar_discard = 0;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001299 return -EIO;
1300}
1301
1302/**
1303 * gfs2_fitrim - Generate discard requests for unused bits of the filesystem
1304 * @filp: Any file on the filesystem
1305 * @argp: Pointer to the arguments (also used to pass result)
1306 *
1307 * Returns: 0 on success, otherwise error code
1308 */
1309
1310int gfs2_fitrim(struct file *filp, void __user *argp)
1311{
Al Viro496ad9a2013-01-23 17:07:38 -05001312 struct inode *inode = file_inode(filp);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001313 struct gfs2_sbd *sdp = GFS2_SB(inode);
1314 struct request_queue *q = bdev_get_queue(sdp->sd_vfs->s_bdev);
1315 struct buffer_head *bh;
1316 struct gfs2_rgrpd *rgd;
1317 struct gfs2_rgrpd *rgd_end;
1318 struct gfs2_holder gh;
1319 struct fstrim_range r;
1320 int ret = 0;
1321 u64 amt;
1322 u64 trimmed = 0;
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001323 u64 start, end, minlen;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001324 unsigned int x;
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001325 unsigned bs_shift = sdp->sd_sb.sb_bsize_shift;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001326
1327 if (!capable(CAP_SYS_ADMIN))
1328 return -EPERM;
1329
1330 if (!blk_queue_discard(q))
1331 return -EOPNOTSUPP;
1332
Lukas Czerner3a238ad2012-10-16 11:39:07 +02001333 if (copy_from_user(&r, argp, sizeof(r)))
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001334 return -EFAULT;
1335
Bob Peterson5e2f7d62012-04-04 22:11:16 -04001336 ret = gfs2_rindex_update(sdp);
1337 if (ret)
1338 return ret;
1339
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001340 start = r.start >> bs_shift;
1341 end = start + (r.len >> bs_shift);
1342 minlen = max_t(u64, r.minlen,
1343 q->limits.discard_granularity) >> bs_shift;
1344
Abhijith Das6a98c332013-06-19 17:03:29 -04001345 if (end <= start || minlen > sdp->sd_max_rg_data)
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001346 return -EINVAL;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001347
Abhijith Das6a98c332013-06-19 17:03:29 -04001348 rgd = gfs2_blk2rgrpd(sdp, start, 0);
1349 rgd_end = gfs2_blk2rgrpd(sdp, end, 0);
1350
1351 if ((gfs2_rgrpd_get_first(sdp) == gfs2_rgrpd_get_next(rgd_end))
1352 && (start > rgd_end->rd_data0 + rgd_end->rd_data))
1353 return -EINVAL; /* start is beyond the end of the fs */
1354
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001355 while (1) {
1356
1357 ret = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_EXCLUSIVE, 0, &gh);
1358 if (ret)
1359 goto out;
1360
1361 if (!(rgd->rd_flags & GFS2_RGF_TRIMMED)) {
1362 /* Trim each bitmap in the rgrp */
1363 for (x = 0; x < rgd->rd_length; x++) {
1364 struct gfs2_bitmap *bi = rgd->rd_bits + x;
Lukas Czerner076f0fa2012-10-16 11:39:08 +02001365 ret = gfs2_rgrp_send_discards(sdp,
1366 rgd->rd_data0, NULL, bi, minlen,
1367 &amt);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001368 if (ret) {
1369 gfs2_glock_dq_uninit(&gh);
1370 goto out;
1371 }
1372 trimmed += amt;
1373 }
1374
1375 /* Mark rgrp as having been trimmed */
1376 ret = gfs2_trans_begin(sdp, RES_RG_HDR, 0);
1377 if (ret == 0) {
1378 bh = rgd->rd_bits[0].bi_bh;
1379 rgd->rd_flags |= GFS2_RGF_TRIMMED;
Steven Whitehouse350a9b02012-12-14 12:36:02 +00001380 gfs2_trans_add_meta(rgd->rd_gl, bh);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001381 gfs2_rgrp_out(rgd, bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001382 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, bh->b_data);
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001383 gfs2_trans_end(sdp);
1384 }
1385 }
1386 gfs2_glock_dq_uninit(&gh);
1387
1388 if (rgd == rgd_end)
1389 break;
1390
1391 rgd = gfs2_rgrpd_get_next(rgd);
1392 }
1393
1394out:
Abhijith Das6a98c332013-06-19 17:03:29 -04001395 r.len = trimmed << bs_shift;
Lukas Czerner3a238ad2012-10-16 11:39:07 +02001396 if (copy_to_user(argp, &r, sizeof(r)))
Steven Whitehouse66fc0612012-02-08 12:58:32 +00001397 return -EFAULT;
1398
1399 return ret;
Steven Whitehousef15ab562009-02-09 09:25:01 +00001400}
1401
David Teiglandb3b94fa2006-01-16 16:50:04 +00001402/**
Bob Peterson8e2e0042012-07-19 08:12:40 -04001403 * rs_insert - insert a new multi-block reservation into the rgrp's rb_tree
Bob Peterson8e2e0042012-07-19 08:12:40 -04001404 * @ip: the inode structure
Bob Peterson8e2e0042012-07-19 08:12:40 -04001405 *
Bob Peterson8e2e0042012-07-19 08:12:40 -04001406 */
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001407static void rs_insert(struct gfs2_inode *ip)
Bob Peterson8e2e0042012-07-19 08:12:40 -04001408{
1409 struct rb_node **newn, *parent = NULL;
1410 int rc;
1411 struct gfs2_blkreserv *rs = ip->i_res;
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001412 struct gfs2_rgrpd *rgd = rs->rs_rbm.rgd;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001413 u64 fsblock = gfs2_rbm_to_block(&rs->rs_rbm);
1414
1415 BUG_ON(gfs2_rs_active(rs));
Bob Peterson8e2e0042012-07-19 08:12:40 -04001416
1417 spin_lock(&rgd->rd_rsspin);
1418 newn = &rgd->rd_rstree.rb_node;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001419 while (*newn) {
1420 struct gfs2_blkreserv *cur =
1421 rb_entry(*newn, struct gfs2_blkreserv, rs_node);
1422
1423 parent = *newn;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001424 rc = rs_cmp(fsblock, rs->rs_free, cur);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001425 if (rc > 0)
1426 newn = &((*newn)->rb_right);
1427 else if (rc < 0)
1428 newn = &((*newn)->rb_left);
1429 else {
1430 spin_unlock(&rgd->rd_rsspin);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001431 WARN_ON(1);
1432 return;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001433 }
1434 }
1435
Bob Peterson8e2e0042012-07-19 08:12:40 -04001436 rb_link_node(&rs->rs_node, parent, newn);
1437 rb_insert_color(&rs->rs_node, &rgd->rd_rstree);
1438
Bob Peterson8e2e0042012-07-19 08:12:40 -04001439 /* Do our rgrp accounting for the reservation */
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001440 rgd->rd_reserved += rs->rs_free; /* blocks reserved */
Bob Peterson8e2e0042012-07-19 08:12:40 -04001441 spin_unlock(&rgd->rd_rsspin);
Steven Whitehouse9e733d32012-08-23 15:37:59 +01001442 trace_gfs2_rs(rs, TRACE_RS_INSERT);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001443}
1444
1445/**
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001446 * rg_mblk_search - find a group of multiple free blocks to form a reservation
Bob Peterson8e2e0042012-07-19 08:12:40 -04001447 * @rgd: the resource group descriptor
Bob Peterson8e2e0042012-07-19 08:12:40 -04001448 * @ip: pointer to the inode for which we're reserving blocks
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001449 * @ap: the allocation parameters
Bob Peterson8e2e0042012-07-19 08:12:40 -04001450 *
Bob Peterson8e2e0042012-07-19 08:12:40 -04001451 */
1452
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001453static void rg_mblk_search(struct gfs2_rgrpd *rgd, struct gfs2_inode *ip,
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001454 const struct gfs2_alloc_parms *ap)
Bob Peterson8e2e0042012-07-19 08:12:40 -04001455{
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001456 struct gfs2_rbm rbm = { .rgd = rgd, };
1457 u64 goal;
1458 struct gfs2_blkreserv *rs = ip->i_res;
1459 u32 extlen;
1460 u32 free_blocks = rgd->rd_free_clone - rgd->rd_reserved;
1461 int ret;
Bob Petersonaf21ca82013-05-14 13:04:29 -04001462 struct inode *inode = &ip->i_inode;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001463
Bob Petersonaf21ca82013-05-14 13:04:29 -04001464 if (S_ISDIR(inode->i_mode))
1465 extlen = 1;
1466 else {
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001467 extlen = max_t(u32, atomic_read(&rs->rs_sizehint), ap->target);
Bob Petersonaf21ca82013-05-14 13:04:29 -04001468 extlen = clamp(extlen, RGRP_RSRV_MINBLKS, free_blocks);
1469 }
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001470 if ((rgd->rd_free_clone < rgd->rd_reserved) || (free_blocks < extlen))
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001471 return;
1472
Bob Peterson8e2e0042012-07-19 08:12:40 -04001473 /* Find bitmap block that contains bits for goal block */
1474 if (rgrp_contains_block(rgd, ip->i_goal))
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001475 goal = ip->i_goal;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001476 else
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001477 goal = rgd->rd_last_alloc + rgd->rd_data0;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001478
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001479 if (WARN_ON(gfs2_rbm_from_block(&rbm, goal)))
1480 return;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001481
Bob Peterson5ce13432013-11-06 10:55:52 -05001482 ret = gfs2_rbm_find(&rbm, GFS2_BLKST_FREE, &extlen, ip, true, ap);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001483 if (ret == 0) {
1484 rs->rs_rbm = rbm;
1485 rs->rs_free = extlen;
1486 rs->rs_inum = ip->i_no_addr;
1487 rs_insert(ip);
Bob Peterson13d2eb02012-12-20 13:23:04 -05001488 } else {
1489 if (goal == rgd->rd_last_alloc + rgd->rd_data0)
1490 rgd->rd_last_alloc = 0;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001491 }
Bob Petersonb3e47ca2011-11-21 11:47:08 -05001492}
1493
David Teiglandb3b94fa2006-01-16 16:50:04 +00001494/**
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001495 * gfs2_next_unreserved_block - Return next block that is not reserved
1496 * @rgd: The resource group
1497 * @block: The starting block
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001498 * @length: The required length
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001499 * @ip: Ignore any reservations for this inode
1500 *
1501 * If the block does not appear in any reservation, then return the
1502 * block number unchanged. If it does appear in the reservation, then
1503 * keep looking through the tree of reservations in order to find the
1504 * first block number which is not reserved.
1505 */
1506
1507static u64 gfs2_next_unreserved_block(struct gfs2_rgrpd *rgd, u64 block,
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001508 u32 length,
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001509 const struct gfs2_inode *ip)
1510{
1511 struct gfs2_blkreserv *rs;
1512 struct rb_node *n;
1513 int rc;
1514
1515 spin_lock(&rgd->rd_rsspin);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001516 n = rgd->rd_rstree.rb_node;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001517 while (n) {
1518 rs = rb_entry(n, struct gfs2_blkreserv, rs_node);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001519 rc = rs_cmp(block, length, rs);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001520 if (rc < 0)
1521 n = n->rb_left;
1522 else if (rc > 0)
1523 n = n->rb_right;
1524 else
1525 break;
1526 }
1527
1528 if (n) {
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001529 while ((rs_cmp(block, length, rs) == 0) && (ip->i_res != rs)) {
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001530 block = gfs2_rbm_to_block(&rs->rs_rbm) + rs->rs_free;
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001531 n = n->rb_right;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001532 if (n == NULL)
1533 break;
1534 rs = rb_entry(n, struct gfs2_blkreserv, rs_node);
1535 }
1536 }
1537
1538 spin_unlock(&rgd->rd_rsspin);
1539 return block;
1540}
1541
1542/**
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001543 * gfs2_reservation_check_and_update - Check for reservations during block alloc
1544 * @rbm: The current position in the resource group
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001545 * @ip: The inode for which we are searching for blocks
1546 * @minext: The minimum extent length
Bob Peterson5ce13432013-11-06 10:55:52 -05001547 * @maxext: A pointer to the maximum extent structure
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001548 *
1549 * This checks the current position in the rgrp to see whether there is
1550 * a reservation covering this block. If not then this function is a
1551 * no-op. If there is, then the position is moved to the end of the
1552 * contiguous reservation(s) so that we are pointing at the first
1553 * non-reserved block.
1554 *
1555 * Returns: 0 if no reservation, 1 if @rbm has changed, otherwise an error
1556 */
1557
1558static int gfs2_reservation_check_and_update(struct gfs2_rbm *rbm,
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001559 const struct gfs2_inode *ip,
Bob Peterson5ce13432013-11-06 10:55:52 -05001560 u32 minext,
1561 struct gfs2_extent *maxext)
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001562{
1563 u64 block = gfs2_rbm_to_block(rbm);
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001564 u32 extlen = 1;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001565 u64 nblock;
1566 int ret;
1567
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001568 /*
1569 * If we have a minimum extent length, then skip over any extent
1570 * which is less than the min extent length in size.
1571 */
1572 if (minext) {
1573 extlen = gfs2_free_extlen(rbm, minext);
Bob Peterson5ce13432013-11-06 10:55:52 -05001574 if (extlen <= maxext->len)
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001575 goto fail;
1576 }
1577
1578 /*
1579 * Check the extent which has been found against the reservations
1580 * and skip if parts of it are already reserved
1581 */
1582 nblock = gfs2_next_unreserved_block(rbm->rgd, block, extlen, ip);
Bob Peterson5ce13432013-11-06 10:55:52 -05001583 if (nblock == block) {
1584 if (!minext || extlen >= minext)
1585 return 0;
1586
1587 if (extlen > maxext->len) {
1588 maxext->len = extlen;
1589 maxext->rbm = *rbm;
1590 }
Steven Whitehouseff7f4cb2012-09-10 10:03:50 +01001591fail:
Bob Peterson5ce13432013-11-06 10:55:52 -05001592 nblock = block + extlen;
1593 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001594 ret = gfs2_rbm_from_block(rbm, nblock);
1595 if (ret < 0)
1596 return ret;
1597 return 1;
1598}
1599
1600/**
1601 * gfs2_rbm_find - Look for blocks of a particular state
1602 * @rbm: Value/result starting position and final position
1603 * @state: The state which we want to find
Bob Peterson5ce13432013-11-06 10:55:52 -05001604 * @minext: Pointer to the requested extent length (NULL for a single block)
1605 * This is updated to be the actual reservation size.
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001606 * @ip: If set, check for reservations
1607 * @nowrap: Stop looking at the end of the rgrp, rather than wrapping
1608 * around until we've reached the starting point.
Bob Peterson5ce13432013-11-06 10:55:52 -05001609 * @ap: the allocation parameters
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001610 *
1611 * Side effects:
1612 * - If looking for free blocks, we set GBF_FULL on each bitmap which
1613 * has no free blocks in it.
Bob Peterson5ea50502013-11-25 11:16:25 +00001614 * - If looking for free blocks, we set rd_extfail_pt on each rgrp which
1615 * has come up short on a free block search.
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001616 *
1617 * Returns: 0 on success, -ENOSPC if there is no block of the requested state
1618 */
1619
Bob Peterson5ce13432013-11-06 10:55:52 -05001620static int gfs2_rbm_find(struct gfs2_rbm *rbm, u8 state, u32 *minext,
1621 const struct gfs2_inode *ip, bool nowrap,
1622 const struct gfs2_alloc_parms *ap)
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001623{
1624 struct buffer_head *bh;
Bob Petersone579ed42013-09-17 13:12:15 -04001625 int initial_bii;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001626 u32 initial_offset;
Bob Peterson5ea50502013-11-25 11:16:25 +00001627 int first_bii = rbm->bii;
1628 u32 first_offset = rbm->offset;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001629 u32 offset;
1630 u8 *buffer;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001631 int n = 0;
1632 int iters = rbm->rgd->rd_length;
1633 int ret;
Bob Petersone579ed42013-09-17 13:12:15 -04001634 struct gfs2_bitmap *bi;
Bob Peterson5ce13432013-11-06 10:55:52 -05001635 struct gfs2_extent maxext = { .rbm.rgd = rbm->rgd, };
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001636
1637 /* If we are not starting at the beginning of a bitmap, then we
1638 * need to add one to the bitmap count to ensure that we search
1639 * the starting bitmap twice.
1640 */
1641 if (rbm->offset != 0)
1642 iters++;
1643
1644 while(1) {
Bob Petersone579ed42013-09-17 13:12:15 -04001645 bi = rbm_bi(rbm);
1646 if (test_bit(GBF_FULL, &bi->bi_flags) &&
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001647 (state == GFS2_BLKST_FREE))
1648 goto next_bitmap;
1649
Bob Petersone579ed42013-09-17 13:12:15 -04001650 bh = bi->bi_bh;
1651 buffer = bh->b_data + bi->bi_offset;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001652 WARN_ON(!buffer_uptodate(bh));
Bob Petersone579ed42013-09-17 13:12:15 -04001653 if (state != GFS2_BLKST_UNLINKED && bi->bi_clone)
1654 buffer = bi->bi_clone + bi->bi_offset;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001655 initial_offset = rbm->offset;
Bob Petersone579ed42013-09-17 13:12:15 -04001656 offset = gfs2_bitfit(buffer, bi->bi_len, rbm->offset, state);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001657 if (offset == BFITNOENT)
1658 goto bitmap_full;
1659 rbm->offset = offset;
1660 if (ip == NULL)
1661 return 0;
1662
Bob Petersone579ed42013-09-17 13:12:15 -04001663 initial_bii = rbm->bii;
Bob Peterson5ce13432013-11-06 10:55:52 -05001664 ret = gfs2_reservation_check_and_update(rbm, ip,
1665 minext ? *minext : 0,
1666 &maxext);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001667 if (ret == 0)
1668 return 0;
1669 if (ret > 0) {
Bob Petersone579ed42013-09-17 13:12:15 -04001670 n += (rbm->bii - initial_bii);
Bob Peterson8d8b7522012-08-07 13:28:17 -04001671 goto next_iter;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001672 }
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001673 if (ret == -E2BIG) {
Bob Petersone579ed42013-09-17 13:12:15 -04001674 rbm->bii = 0;
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001675 rbm->offset = 0;
Bob Petersone579ed42013-09-17 13:12:15 -04001676 n += (rbm->bii - initial_bii);
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001677 goto res_covered_end_of_rgrp;
1678 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001679 return ret;
1680
1681bitmap_full: /* Mark bitmap as full and fall through */
Bob Petersone579ed42013-09-17 13:12:15 -04001682 if ((state == GFS2_BLKST_FREE) && initial_offset == 0) {
1683 struct gfs2_bitmap *bi = rbm_bi(rbm);
1684 set_bit(GBF_FULL, &bi->bi_flags);
1685 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001686
1687next_bitmap: /* Find next bitmap in the rgrp */
1688 rbm->offset = 0;
Bob Petersone579ed42013-09-17 13:12:15 -04001689 rbm->bii++;
1690 if (rbm->bii == rbm->rgd->rd_length)
1691 rbm->bii = 0;
Steven Whitehouse5d50d532012-08-07 13:47:12 +01001692res_covered_end_of_rgrp:
Bob Petersone579ed42013-09-17 13:12:15 -04001693 if ((rbm->bii == 0) && nowrap)
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001694 break;
1695 n++;
Bob Peterson8d8b7522012-08-07 13:28:17 -04001696next_iter:
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001697 if (n >= iters)
1698 break;
1699 }
1700
Bob Peterson5ce13432013-11-06 10:55:52 -05001701 if (minext == NULL || state != GFS2_BLKST_FREE)
1702 return -ENOSPC;
1703
Bob Peterson5ea50502013-11-25 11:16:25 +00001704 /* If the extent was too small, and it's smaller than the smallest
1705 to have failed before, remember for future reference that it's
1706 useless to search this rgrp again for this amount or more. */
1707 if ((first_offset == 0) && (first_bii == 0) &&
1708 (*minext < rbm->rgd->rd_extfail_pt))
1709 rbm->rgd->rd_extfail_pt = *minext;
1710
Bob Peterson5ce13432013-11-06 10:55:52 -05001711 /* If the maximum extent we found is big enough to fulfill the
1712 minimum requirements, use it anyway. */
1713 if (maxext.len) {
1714 *rbm = maxext.rbm;
1715 *minext = maxext.len;
1716 return 0;
1717 }
1718
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001719 return -ENOSPC;
1720}
1721
1722/**
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001723 * try_rgrp_unlink - Look for any unlinked, allocated, but unused inodes
1724 * @rgd: The rgrp
Bob Peterson886b1412012-04-11 13:03:52 -04001725 * @last_unlinked: block address of the last dinode we unlinked
1726 * @skip: block address we should explicitly not unlink
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001727 *
Bob Peterson1a0eae82010-04-14 11:58:16 -04001728 * Returns: 0 if no error
1729 * The inode, if one has been found, in inode.
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001730 */
1731
Steven Whitehouse044b9412010-11-03 20:01:07 +00001732static void try_rgrp_unlink(struct gfs2_rgrpd *rgd, u64 *last_unlinked, u64 skip)
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001733{
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001734 u64 block;
Bob Peterson5f3eae72007-08-08 16:52:09 -05001735 struct gfs2_sbd *sdp = rgd->rd_sbd;
Steven Whitehouse044b9412010-11-03 20:01:07 +00001736 struct gfs2_glock *gl;
1737 struct gfs2_inode *ip;
1738 int error;
1739 int found = 0;
Bob Petersone579ed42013-09-17 13:12:15 -04001740 struct gfs2_rbm rbm = { .rgd = rgd, .bii = 0, .offset = 0 };
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001741
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001742 while (1) {
Bob Peterson5f3eae72007-08-08 16:52:09 -05001743 down_write(&sdp->sd_log_flush_lock);
Bob Peterson5ce13432013-11-06 10:55:52 -05001744 error = gfs2_rbm_find(&rbm, GFS2_BLKST_UNLINKED, NULL, NULL,
1745 true, NULL);
Bob Peterson5f3eae72007-08-08 16:52:09 -05001746 up_write(&sdp->sd_log_flush_lock);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001747 if (error == -ENOSPC)
1748 break;
1749 if (WARN_ON_ONCE(error))
Bob Peterson24c73872007-07-12 16:58:50 -05001750 break;
Bob Petersonb3e47ca2011-11-21 11:47:08 -05001751
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001752 block = gfs2_rbm_to_block(&rbm);
1753 if (gfs2_rbm_from_block(&rbm, block + 1))
1754 break;
1755 if (*last_unlinked != NO_BLOCK && block <= *last_unlinked)
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001756 continue;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001757 if (block == skip)
Steven Whitehouse1e19a192009-07-10 21:13:38 +01001758 continue;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001759 *last_unlinked = block;
Steven Whitehouse044b9412010-11-03 20:01:07 +00001760
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01001761 error = gfs2_glock_get(sdp, block, &gfs2_inode_glops, CREATE, &gl);
Steven Whitehouse044b9412010-11-03 20:01:07 +00001762 if (error)
1763 continue;
1764
1765 /* If the inode is already in cache, we can ignore it here
1766 * because the existing inode disposal code will deal with
1767 * it when all refs have gone away. Accessing gl_object like
1768 * this is not safe in general. Here it is ok because we do
1769 * not dereference the pointer, and we only need an approx
1770 * answer to whether it is NULL or not.
1771 */
1772 ip = gl->gl_object;
1773
1774 if (ip || queue_work(gfs2_delete_workqueue, &gl->gl_delete) == 0)
1775 gfs2_glock_put(gl);
1776 else
1777 found++;
1778
1779 /* Limit reclaim to sensible number of tasks */
Bob Peterson44ad37d2011-03-17 16:19:58 -04001780 if (found > NR_CPUS)
Steven Whitehouse044b9412010-11-03 20:01:07 +00001781 return;
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001782 }
1783
1784 rgd->rd_flags &= ~GFS2_RDF_CHECK;
Steven Whitehouse044b9412010-11-03 20:01:07 +00001785 return;
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001786}
1787
Steven Whitehousebcd97c02012-10-31 09:58:42 +00001788/**
1789 * gfs2_rgrp_congested - Use stats to figure out whether an rgrp is congested
1790 * @rgd: The rgrp in question
1791 * @loops: An indication of how picky we can be (0=very, 1=less so)
1792 *
1793 * This function uses the recently added glock statistics in order to
1794 * figure out whether a parciular resource group is suffering from
1795 * contention from multiple nodes. This is done purely on the basis
1796 * of timings, since this is the only data we have to work with and
1797 * our aim here is to reject a resource group which is highly contended
1798 * but (very important) not to do this too often in order to ensure that
1799 * we do not land up introducing fragmentation by changing resource
1800 * groups when not actually required.
1801 *
1802 * The calculation is fairly simple, we want to know whether the SRTTB
1803 * (i.e. smoothed round trip time for blocking operations) to acquire
1804 * the lock for this rgrp's glock is significantly greater than the
1805 * time taken for resource groups on average. We introduce a margin in
1806 * the form of the variable @var which is computed as the sum of the two
1807 * respective variences, and multiplied by a factor depending on @loops
1808 * and whether we have a lot of data to base the decision on. This is
1809 * then tested against the square difference of the means in order to
1810 * decide whether the result is statistically significant or not.
1811 *
1812 * Returns: A boolean verdict on the congestion status
1813 */
1814
1815static bool gfs2_rgrp_congested(const struct gfs2_rgrpd *rgd, int loops)
1816{
1817 const struct gfs2_glock *gl = rgd->rd_gl;
1818 const struct gfs2_sbd *sdp = gl->gl_sbd;
1819 struct gfs2_lkstats *st;
1820 s64 r_dcount, l_dcount;
1821 s64 r_srttb, l_srttb;
1822 s64 srttb_diff;
1823 s64 sqr_diff;
1824 s64 var;
1825
1826 preempt_disable();
1827 st = &this_cpu_ptr(sdp->sd_lkstats)->lkstats[LM_TYPE_RGRP];
1828 r_srttb = st->stats[GFS2_LKS_SRTTB];
1829 r_dcount = st->stats[GFS2_LKS_DCOUNT];
1830 var = st->stats[GFS2_LKS_SRTTVARB] +
1831 gl->gl_stats.stats[GFS2_LKS_SRTTVARB];
1832 preempt_enable();
1833
1834 l_srttb = gl->gl_stats.stats[GFS2_LKS_SRTTB];
1835 l_dcount = gl->gl_stats.stats[GFS2_LKS_DCOUNT];
1836
1837 if ((l_dcount < 1) || (r_dcount < 1) || (r_srttb == 0))
1838 return false;
1839
1840 srttb_diff = r_srttb - l_srttb;
1841 sqr_diff = srttb_diff * srttb_diff;
1842
1843 var *= 2;
1844 if (l_dcount < 8 || r_dcount < 8)
1845 var *= 2;
1846 if (loops == 1)
1847 var *= 2;
1848
1849 return ((srttb_diff < 0) && (sqr_diff > var));
1850}
1851
1852/**
1853 * gfs2_rgrp_used_recently
1854 * @rs: The block reservation with the rgrp to test
1855 * @msecs: The time limit in milliseconds
1856 *
1857 * Returns: True if the rgrp glock has been used within the time limit
1858 */
1859static bool gfs2_rgrp_used_recently(const struct gfs2_blkreserv *rs,
1860 u64 msecs)
1861{
1862 u64 tdiff;
1863
1864 tdiff = ktime_to_ns(ktime_sub(ktime_get_real(),
1865 rs->rs_rbm.rgd->rd_gl->gl_dstamp));
1866
1867 return tdiff > (msecs * 1000 * 1000);
1868}
1869
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001870static u32 gfs2_orlov_skip(const struct gfs2_inode *ip)
1871{
1872 const struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1873 u32 skip;
1874
1875 get_random_bytes(&skip, sizeof(skip));
1876 return skip % sdp->sd_rgrps;
1877}
1878
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001879static bool gfs2_select_rgrp(struct gfs2_rgrpd **pos, const struct gfs2_rgrpd *begin)
1880{
1881 struct gfs2_rgrpd *rgd = *pos;
Steven Whitehouseaa8920c2012-11-13 14:50:35 +00001882 struct gfs2_sbd *sdp = rgd->rd_sbd;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001883
1884 rgd = gfs2_rgrpd_get_next(rgd);
1885 if (rgd == NULL)
Steven Whitehouseaa8920c2012-11-13 14:50:35 +00001886 rgd = gfs2_rgrpd_get_first(sdp);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001887 *pos = rgd;
1888 if (rgd != begin) /* If we didn't wrap */
1889 return true;
1890 return false;
1891}
1892
Steven Whitehousec8cdf472007-06-08 10:05:33 +01001893/**
Bob Peterson666d1d82012-06-13 23:03:56 -04001894 * gfs2_inplace_reserve - Reserve space in the filesystem
David Teiglandb3b94fa2006-01-16 16:50:04 +00001895 * @ip: the inode to reserve space for
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001896 * @ap: the allocation parameters
David Teiglandb3b94fa2006-01-16 16:50:04 +00001897 *
1898 * Returns: errno
1899 */
1900
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001901int gfs2_inplace_reserve(struct gfs2_inode *ip, const struct gfs2_alloc_parms *ap)
David Teiglandb3b94fa2006-01-16 16:50:04 +00001902{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04001903 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001904 struct gfs2_rgrpd *begin = NULL;
Bob Peterson564e12b2011-11-21 13:36:17 -05001905 struct gfs2_blkreserv *rs = ip->i_res;
Steven Whitehousebcd97c02012-10-31 09:58:42 +00001906 int error = 0, rg_locked, flags = 0;
Bob Peterson666d1d82012-06-13 23:03:56 -04001907 u64 last_unlinked = NO_BLOCK;
Bob Peterson7c9ca622011-08-31 09:53:19 +01001908 int loops = 0;
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001909 u32 skip = 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001910
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001911 if (sdp->sd_args.ar_rgrplvb)
1912 flags |= GL_SKIP;
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001913 if (gfs2_assert_warn(sdp, ap->target))
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001914 return -EINVAL;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001915 if (gfs2_rs_active(rs)) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001916 begin = rs->rs_rbm.rgd;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001917 } else if (ip->i_rgd && rgrp_contains_block(ip->i_rgd, ip->i_goal)) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001918 rs->rs_rbm.rgd = begin = ip->i_rgd;
Bob Peterson8e2e0042012-07-19 08:12:40 -04001919 } else {
Abhi Das00a158b2014-09-18 21:40:28 -05001920 check_and_update_goal(ip);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001921 rs->rs_rbm.rgd = begin = gfs2_blk2rgrpd(sdp, ip->i_goal, 1);
Bob Peterson8e2e0042012-07-19 08:12:40 -04001922 }
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001923 if (S_ISDIR(ip->i_inode.i_mode) && (ap->aflags & GFS2_AF_ORLOV))
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001924 skip = gfs2_orlov_skip(ip);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001925 if (rs->rs_rbm.rgd == NULL)
Bob Peterson7c9ca622011-08-31 09:53:19 +01001926 return -EBADSLT;
1927
1928 while (loops < 3) {
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001929 rg_locked = 1;
Abhijith Das292c8c12007-11-29 14:13:54 -06001930
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001931 if (!gfs2_glock_is_locked_by_me(rs->rs_rbm.rgd->rd_gl)) {
1932 rg_locked = 0;
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001933 if (skip && skip--)
1934 goto next_rgrp;
Steven Whitehousebcd97c02012-10-31 09:58:42 +00001935 if (!gfs2_rs_active(rs) && (loops < 2) &&
1936 gfs2_rgrp_used_recently(rs, 1000) &&
1937 gfs2_rgrp_congested(rs->rs_rbm.rgd, loops))
1938 goto next_rgrp;
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001939 error = gfs2_glock_nq_init(rs->rs_rbm.rgd->rd_gl,
Bob Peterson8e2e0042012-07-19 08:12:40 -04001940 LM_ST_EXCLUSIVE, flags,
1941 &rs->rs_rgd_gh);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001942 if (unlikely(error))
1943 return error;
Steven Whitehousebcd97c02012-10-31 09:58:42 +00001944 if (!gfs2_rs_active(rs) && (loops < 2) &&
1945 gfs2_rgrp_congested(rs->rs_rbm.rgd, loops))
1946 goto skip_rgrp;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001947 if (sdp->sd_args.ar_rgrplvb) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01001948 error = update_rgrp_lvb(rs->rs_rbm.rgd);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001949 if (unlikely(error)) {
Benjamin Marzinski90306c42012-05-29 23:01:09 -05001950 gfs2_glock_dq_uninit(&rs->rs_rgd_gh);
1951 return error;
1952 }
1953 }
Abhijith Das292c8c12007-11-29 14:13:54 -06001954 }
Bob Peterson666d1d82012-06-13 23:03:56 -04001955
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001956 /* Skip unuseable resource groups */
Bob Peterson5ea50502013-11-25 11:16:25 +00001957 if ((rs->rs_rbm.rgd->rd_flags & (GFS2_RGF_NOALLOC |
1958 GFS2_RDF_ERROR)) ||
Steven Whitehouse7de41d32013-12-04 11:14:05 +00001959 (ap->target > rs->rs_rbm.rgd->rd_extfail_pt))
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001960 goto skip_rgrp;
1961
1962 if (sdp->sd_args.ar_rgrplvb)
1963 gfs2_rgrp_bh_get(rs->rs_rbm.rgd);
1964
1965 /* Get a reservation if we don't already have one */
1966 if (!gfs2_rs_active(rs))
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001967 rg_mblk_search(rs->rs_rbm.rgd, ip, ap);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001968
1969 /* Skip rgrps when we can't get a reservation on first pass */
1970 if (!gfs2_rs_active(rs) && (loops < 1))
1971 goto check_rgrp;
1972
1973 /* If rgrp has enough free space, use it */
Steven Whitehouse7b9cff42013-10-02 11:13:25 +01001974 if (rs->rs_rbm.rgd->rd_free_clone >= ap->target) {
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001975 ip->i_rgd = rs->rs_rbm.rgd;
1976 return 0;
David Teiglandb3b94fa2006-01-16 16:50:04 +00001977 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00001978
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001979check_rgrp:
1980 /* Check for unlinked inodes which can be reclaimed */
1981 if (rs->rs_rbm.rgd->rd_flags & GFS2_RDF_CHECK)
1982 try_rgrp_unlink(rs->rs_rbm.rgd, &last_unlinked,
1983 ip->i_no_addr);
1984skip_rgrp:
Bob Peterson1330edb2013-11-06 10:58:00 -05001985 /* Drop reservation, if we couldn't use reserved rgrp */
1986 if (gfs2_rs_active(rs))
1987 gfs2_rs_deltree(rs);
1988
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001989 /* Unlock rgrp if required */
1990 if (!rg_locked)
1991 gfs2_glock_dq_uninit(&rs->rs_rgd_gh);
1992next_rgrp:
1993 /* Find the next rgrp, and continue looking */
1994 if (gfs2_select_rgrp(&rs->rs_rbm.rgd, begin))
1995 continue;
Steven Whitehouse9dbe9612012-10-31 10:37:10 +00001996 if (skip)
1997 continue;
Steven Whitehousec743ffd2012-08-25 18:21:47 +01001998
1999 /* If we've scanned all the rgrps, but found no free blocks
2000 * then this checks for some less likely conditions before
2001 * trying again.
2002 */
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002003 loops++;
2004 /* Check that fs hasn't grown if writing to rindex */
2005 if (ip == GFS2_I(sdp->sd_rindex) && !sdp->sd_rindex_uptodate) {
2006 error = gfs2_ri_update(ip);
2007 if (error)
2008 return error;
2009 }
2010 /* Flushing the log may release space */
2011 if (loops == 2)
Benjamin Marzinski24972552014-05-01 22:26:55 -05002012 gfs2_log_flush(sdp, NULL, NORMAL_FLUSH);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002013 }
2014
2015 return -ENOSPC;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002016}
2017
2018/**
2019 * gfs2_inplace_release - release an inplace reservation
2020 * @ip: the inode the reservation was taken out on
2021 *
2022 * Release a reservation made by gfs2_inplace_reserve().
2023 */
2024
2025void gfs2_inplace_release(struct gfs2_inode *ip)
2026{
Bob Peterson564e12b2011-11-21 13:36:17 -05002027 struct gfs2_blkreserv *rs = ip->i_res;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002028
Bob Peterson564e12b2011-11-21 13:36:17 -05002029 if (rs->rs_rgd_gh.gh_gl)
2030 gfs2_glock_dq_uninit(&rs->rs_rgd_gh);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002031}
2032
2033/**
2034 * gfs2_get_block_type - Check a block in a RG is of given type
2035 * @rgd: the resource group holding the block
2036 * @block: the block number
2037 *
2038 * Returns: The block type (GFS2_BLKST_*)
2039 */
2040
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002041static unsigned char gfs2_get_block_type(struct gfs2_rgrpd *rgd, u64 block)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002042{
Steven Whitehouse39839032012-08-03 11:10:30 +01002043 struct gfs2_rbm rbm = { .rgd = rgd, };
2044 int ret;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002045
Steven Whitehouse39839032012-08-03 11:10:30 +01002046 ret = gfs2_rbm_from_block(&rbm, block);
2047 WARN_ON_ONCE(ret != 0);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002048
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002049 return gfs2_testbit(&rbm);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002050}
2051
David Teiglandb3b94fa2006-01-16 16:50:04 +00002052
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002053/**
2054 * gfs2_alloc_extent - allocate an extent from a given bitmap
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002055 * @rbm: the resource group information
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002056 * @dinode: TRUE if the first block we allocate is for a dinode
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002057 * @n: The extent length (value/result)
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002058 *
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002059 * Add the bitmap buffer to the transaction.
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002060 * Set the found bits to @new_state to change block's allocation state.
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002061 */
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002062static void gfs2_alloc_extent(const struct gfs2_rbm *rbm, bool dinode,
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002063 unsigned int *n)
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002064{
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002065 struct gfs2_rbm pos = { .rgd = rbm->rgd, };
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002066 const unsigned int elen = *n;
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002067 u64 block;
2068 int ret;
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002069
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002070 *n = 1;
2071 block = gfs2_rbm_to_block(rbm);
Bob Petersone579ed42013-09-17 13:12:15 -04002072 gfs2_trans_add_meta(rbm->rgd->rd_gl, rbm_bi(rbm)->bi_bh);
Steven Whitehouse3e6339d2012-08-13 11:37:51 +01002073 gfs2_setbit(rbm, true, dinode ? GFS2_BLKST_DINODE : GFS2_BLKST_USED);
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002074 block++;
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002075 while (*n < elen) {
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002076 ret = gfs2_rbm_from_block(&pos, block);
Bob Peterson0688a5e2012-08-28 08:45:56 -04002077 if (ret || gfs2_testbit(&pos) != GFS2_BLKST_FREE)
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002078 break;
Bob Petersone579ed42013-09-17 13:12:15 -04002079 gfs2_trans_add_meta(pos.rgd->rd_gl, rbm_bi(&pos)->bi_bh);
Steven Whitehouse3e6339d2012-08-13 11:37:51 +01002080 gfs2_setbit(&pos, true, GFS2_BLKST_USED);
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002081 (*n)++;
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002082 block++;
Steven Whitehouse60a0b8f2009-05-21 12:23:12 +01002083 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00002084}
2085
2086/**
2087 * rgblk_free - Change alloc state of given block(s)
2088 * @sdp: the filesystem
2089 * @bstart: the start of a run of blocks to free
2090 * @blen: the length of the block run (all must lie within ONE RG!)
2091 * @new_state: GFS2_BLKST_XXX the after-allocation block state
2092 *
2093 * Returns: Resource group containing the block(s)
2094 */
2095
Steven Whitehousecd915492006-09-04 12:49:07 -04002096static struct gfs2_rgrpd *rgblk_free(struct gfs2_sbd *sdp, u64 bstart,
2097 u32 blen, unsigned char new_state)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002098{
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002099 struct gfs2_rbm rbm;
Bob Petersone579ed42013-09-17 13:12:15 -04002100 struct gfs2_bitmap *bi;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002101
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002102 rbm.rgd = gfs2_blk2rgrpd(sdp, bstart, 1);
2103 if (!rbm.rgd) {
David Teiglandb3b94fa2006-01-16 16:50:04 +00002104 if (gfs2_consist(sdp))
Steven Whitehouse382066d2006-05-24 10:22:09 -04002105 fs_err(sdp, "block = %llu\n", (unsigned long long)bstart);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002106 return NULL;
2107 }
2108
David Teiglandb3b94fa2006-01-16 16:50:04 +00002109 while (blen--) {
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002110 gfs2_rbm_from_block(&rbm, bstart);
Bob Petersone579ed42013-09-17 13:12:15 -04002111 bi = rbm_bi(&rbm);
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002112 bstart++;
Bob Petersone579ed42013-09-17 13:12:15 -04002113 if (!bi->bi_clone) {
2114 bi->bi_clone = kmalloc(bi->bi_bh->b_size,
2115 GFP_NOFS | __GFP_NOFAIL);
2116 memcpy(bi->bi_clone + bi->bi_offset,
2117 bi->bi_bh->b_data + bi->bi_offset, bi->bi_len);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002118 }
Bob Petersone579ed42013-09-17 13:12:15 -04002119 gfs2_trans_add_meta(rbm.rgd->rd_gl, bi->bi_bh);
Steven Whitehouse3e6339d2012-08-13 11:37:51 +01002120 gfs2_setbit(&rbm, false, new_state);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002121 }
2122
Steven Whitehouse3b1d0b92012-08-03 11:23:28 +01002123 return rbm.rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002124}
2125
2126/**
Steven Whitehouse09010972009-05-20 10:48:47 +01002127 * gfs2_rgrp_dump - print out an rgrp
2128 * @seq: The iterator
2129 * @gl: The glock in question
David Teiglandb3b94fa2006-01-16 16:50:04 +00002130 *
David Teiglandb3b94fa2006-01-16 16:50:04 +00002131 */
2132
Steven Whitehouseac3beb62014-01-16 10:31:13 +00002133void gfs2_rgrp_dump(struct seq_file *seq, const struct gfs2_glock *gl)
Steven Whitehouse09010972009-05-20 10:48:47 +01002134{
Bob Peterson8e2e0042012-07-19 08:12:40 -04002135 struct gfs2_rgrpd *rgd = gl->gl_object;
2136 struct gfs2_blkreserv *trs;
2137 const struct rb_node *n;
2138
Steven Whitehouse09010972009-05-20 10:48:47 +01002139 if (rgd == NULL)
Steven Whitehouseac3beb62014-01-16 10:31:13 +00002140 return;
Bob Peterson5ea50502013-11-25 11:16:25 +00002141 gfs2_print_dbg(seq, " R: n:%llu f:%02x b:%u/%u i:%u r:%u e:%u\n",
Steven Whitehouse09010972009-05-20 10:48:47 +01002142 (unsigned long long)rgd->rd_addr, rgd->rd_flags,
Bob Peterson8e2e0042012-07-19 08:12:40 -04002143 rgd->rd_free, rgd->rd_free_clone, rgd->rd_dinodes,
Bob Peterson5ea50502013-11-25 11:16:25 +00002144 rgd->rd_reserved, rgd->rd_extfail_pt);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002145 spin_lock(&rgd->rd_rsspin);
2146 for (n = rb_first(&rgd->rd_rstree); n; n = rb_next(&trs->rs_node)) {
2147 trs = rb_entry(n, struct gfs2_blkreserv, rs_node);
2148 dump_rs(seq, trs);
2149 }
2150 spin_unlock(&rgd->rd_rsspin);
Steven Whitehouse09010972009-05-20 10:48:47 +01002151}
2152
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002153static void gfs2_rgrp_error(struct gfs2_rgrpd *rgd)
2154{
2155 struct gfs2_sbd *sdp = rgd->rd_sbd;
2156 fs_warn(sdp, "rgrp %llu has an error, marking it readonly until umount\n",
Steven Whitehouse86d00632009-09-14 09:50:57 +01002157 (unsigned long long)rgd->rd_addr);
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002158 fs_warn(sdp, "umount on all nodes and run fsck.gfs2 to fix the error\n");
2159 gfs2_rgrp_dump(NULL, rgd->rd_gl);
2160 rgd->rd_flags |= GFS2_RDF_ERROR;
2161}
2162
Steven Whitehouse09010972009-05-20 10:48:47 +01002163/**
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002164 * gfs2_adjust_reservation - Adjust (or remove) a reservation after allocation
2165 * @ip: The inode we have just allocated blocks for
2166 * @rbm: The start of the allocated blocks
2167 * @len: The extent length
Bob Peterson8e2e0042012-07-19 08:12:40 -04002168 *
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002169 * Adjusts a reservation after an allocation has taken place. If the
2170 * reservation does not match the allocation, or if it is now empty
2171 * then it is removed.
Bob Peterson8e2e0042012-07-19 08:12:40 -04002172 */
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002173
2174static void gfs2_adjust_reservation(struct gfs2_inode *ip,
2175 const struct gfs2_rbm *rbm, unsigned len)
Bob Peterson8e2e0042012-07-19 08:12:40 -04002176{
2177 struct gfs2_blkreserv *rs = ip->i_res;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002178 struct gfs2_rgrpd *rgd = rbm->rgd;
2179 unsigned rlen;
2180 u64 block;
2181 int ret;
Bob Peterson8e2e0042012-07-19 08:12:40 -04002182
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002183 spin_lock(&rgd->rd_rsspin);
2184 if (gfs2_rs_active(rs)) {
2185 if (gfs2_rbm_eq(&rs->rs_rbm, rbm)) {
2186 block = gfs2_rbm_to_block(rbm);
2187 ret = gfs2_rbm_from_block(&rs->rs_rbm, block + len);
2188 rlen = min(rs->rs_free, len);
2189 rs->rs_free -= rlen;
2190 rgd->rd_reserved -= rlen;
Steven Whitehouse9e733d32012-08-23 15:37:59 +01002191 trace_gfs2_rs(rs, TRACE_RS_CLAIM);
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002192 if (rs->rs_free && !ret)
2193 goto out;
2194 }
Bob Peterson20095212013-03-13 10:26:38 -04002195 __rs_deltree(rs);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002196 }
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002197out:
2198 spin_unlock(&rgd->rd_rsspin);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002199}
2200
2201/**
Steven Whitehouse9e07f2c2013-10-02 14:42:45 +01002202 * gfs2_set_alloc_start - Set starting point for block allocation
2203 * @rbm: The rbm which will be set to the required location
2204 * @ip: The gfs2 inode
2205 * @dinode: Flag to say if allocation includes a new inode
2206 *
2207 * This sets the starting point from the reservation if one is active
2208 * otherwise it falls back to guessing a start point based on the
2209 * inode's goal block or the last allocation point in the rgrp.
2210 */
2211
2212static void gfs2_set_alloc_start(struct gfs2_rbm *rbm,
2213 const struct gfs2_inode *ip, bool dinode)
2214{
2215 u64 goal;
2216
2217 if (gfs2_rs_active(ip->i_res)) {
2218 *rbm = ip->i_res->rs_rbm;
2219 return;
2220 }
2221
2222 if (!dinode && rgrp_contains_block(rbm->rgd, ip->i_goal))
2223 goal = ip->i_goal;
2224 else
2225 goal = rbm->rgd->rd_last_alloc + rbm->rgd->rd_data0;
2226
2227 gfs2_rbm_from_block(rbm, goal);
2228}
2229
2230/**
Bob Peterson6e87ed02011-11-18 10:58:32 -05002231 * gfs2_alloc_blocks - Allocate one or more blocks of data and/or a dinode
Steven Whitehouse09010972009-05-20 10:48:47 +01002232 * @ip: the inode to allocate the block for
2233 * @bn: Used to return the starting block number
Bob Peterson8e2e0042012-07-19 08:12:40 -04002234 * @nblocks: requested number of blocks/extent length (value/result)
Bob Peterson6e87ed02011-11-18 10:58:32 -05002235 * @dinode: 1 if we're allocating a dinode block, else 0
Bob Peterson3c5d7852011-11-14 11:17:08 -05002236 * @generation: the generation number of the inode
Steven Whitehouse09010972009-05-20 10:48:47 +01002237 *
2238 * Returns: 0 or error
2239 */
2240
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002241int gfs2_alloc_blocks(struct gfs2_inode *ip, u64 *bn, unsigned int *nblocks,
Bob Peterson6e87ed02011-11-18 10:58:32 -05002242 bool dinode, u64 *generation)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002243{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002244 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
Steven Whitehoused9ba7612009-04-23 08:59:41 +01002245 struct buffer_head *dibh;
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002246 struct gfs2_rbm rbm = { .rgd = ip->i_rgd, };
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002247 unsigned int ndata;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002248 u64 block; /* block, within the file system scope */
Steven Whitehoused9ba7612009-04-23 08:59:41 +01002249 int error;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002250
Steven Whitehouse9e07f2c2013-10-02 14:42:45 +01002251 gfs2_set_alloc_start(&rbm, ip, dinode);
Bob Peterson5ce13432013-11-06 10:55:52 -05002252 error = gfs2_rbm_find(&rbm, GFS2_BLKST_FREE, NULL, ip, false, NULL);
Steven Whitehouse62e252e2012-07-30 11:06:08 +01002253
Steven Whitehouse137834a2012-08-23 13:43:40 +01002254 if (error == -ENOSPC) {
Steven Whitehouse9e07f2c2013-10-02 14:42:45 +01002255 gfs2_set_alloc_start(&rbm, ip, dinode);
Bob Peterson5ce13432013-11-06 10:55:52 -05002256 error = gfs2_rbm_find(&rbm, GFS2_BLKST_FREE, NULL, NULL, false,
2257 NULL);
Steven Whitehouse137834a2012-08-23 13:43:40 +01002258 }
2259
Steven Whitehouse62e252e2012-07-30 11:06:08 +01002260 /* Since all blocks are reserved in advance, this shouldn't happen */
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002261 if (error) {
Bob Peterson5ea50502013-11-25 11:16:25 +00002262 fs_warn(sdp, "inum=%llu error=%d, nblocks=%u, full=%d fail_pt=%d\n",
Steven Whitehouse9e733d32012-08-23 15:37:59 +01002263 (unsigned long long)ip->i_no_addr, error, *nblocks,
Bob Peterson5ea50502013-11-25 11:16:25 +00002264 test_bit(GBF_FULL, &rbm.rgd->rd_bits->bi_flags),
2265 rbm.rgd->rd_extfail_pt);
Steven Whitehouse62e252e2012-07-30 11:06:08 +01002266 goto rgrp_error;
2267 }
2268
Steven Whitehousec04a2ef2012-08-13 11:14:57 +01002269 gfs2_alloc_extent(&rbm, dinode, nblocks);
2270 block = gfs2_rbm_to_block(&rbm);
Steven Whitehousec743ffd2012-08-25 18:21:47 +01002271 rbm.rgd->rd_last_alloc = block - rbm.rgd->rd_data0;
Steven Whitehouse5b924ae2012-08-01 20:35:05 +01002272 if (gfs2_rs_active(ip->i_res))
2273 gfs2_adjust_reservation(ip, &rbm, *nblocks);
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002274 ndata = *nblocks;
2275 if (dinode)
2276 ndata--;
Bob Petersonb3e47ca2011-11-21 11:47:08 -05002277
Bob Peterson3c5d7852011-11-14 11:17:08 -05002278 if (!dinode) {
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002279 ip->i_goal = block + ndata - 1;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002280 error = gfs2_meta_inode_buffer(ip, &dibh);
2281 if (error == 0) {
2282 struct gfs2_dinode *di =
2283 (struct gfs2_dinode *)dibh->b_data;
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002284 gfs2_trans_add_meta(ip->i_gl, dibh);
Bob Peterson3c5d7852011-11-14 11:17:08 -05002285 di->di_goal_meta = di->di_goal_data =
2286 cpu_to_be64(ip->i_goal);
2287 brelse(dibh);
2288 }
Steven Whitehoused9ba7612009-04-23 08:59:41 +01002289 }
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002290 if (rbm.rgd->rd_free < *nblocks) {
Fabian Frederickfc554ed2014-03-05 22:06:42 +08002291 pr_warn("nblocks=%u\n", *nblocks);
Steven Whitehouse09010972009-05-20 10:48:47 +01002292 goto rgrp_error;
Bob Peterson8e2e0042012-07-19 08:12:40 -04002293 }
Steven Whitehouse09010972009-05-20 10:48:47 +01002294
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002295 rbm.rgd->rd_free -= *nblocks;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002296 if (dinode) {
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002297 rbm.rgd->rd_dinodes++;
2298 *generation = rbm.rgd->rd_igeneration++;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002299 if (*generation == 0)
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002300 *generation = rbm.rgd->rd_igeneration++;
Bob Peterson3c5d7852011-11-14 11:17:08 -05002301 }
David Teiglandb3b94fa2006-01-16 16:50:04 +00002302
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002303 gfs2_trans_add_meta(rbm.rgd->rd_gl, rbm.rgd->rd_bits[0].bi_bh);
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002304 gfs2_rgrp_out(rbm.rgd, rbm.rgd->rd_bits[0].bi_bh->b_data);
2305 gfs2_rgrp_ondisk2lvb(rbm.rgd->rd_rgl, rbm.rgd->rd_bits[0].bi_bh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002306
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002307 gfs2_statfs_change(sdp, 0, -(s64)*nblocks, dinode ? 1 : 0);
Bob Peterson3c5d7852011-11-14 11:17:08 -05002308 if (dinode)
Steven Whitehouseb2c8b3e2014-02-04 15:45:11 +00002309 gfs2_trans_add_unrevoke(sdp, block, *nblocks);
Steven Whitehouse6a8099e2011-11-22 12:18:51 +00002310
Steven Whitehousefd4b4e02013-02-26 16:15:20 +00002311 gfs2_quota_change(ip, *nblocks, ip->i_inode.i_uid, ip->i_inode.i_gid);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002312
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002313 rbm.rgd->rd_free_clone -= *nblocks;
2314 trace_gfs2_block_alloc(ip, rbm.rgd, block, *nblocks,
Bob Peterson6e87ed02011-11-18 10:58:32 -05002315 dinode ? GFS2_BLKST_DINODE : GFS2_BLKST_USED);
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002316 *bn = block;
2317 return 0;
2318
2319rgrp_error:
Steven Whitehouse4a993fb2012-07-31 15:21:20 +01002320 gfs2_rgrp_error(rbm.rgd);
Steven Whitehouse6050b9c2009-07-31 16:19:40 +01002321 return -EIO;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002322}
2323
2324/**
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002325 * __gfs2_free_blocks - free a contiguous run of block(s)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002326 * @ip: the inode these blocks are being freed from
2327 * @bstart: first block of a run of contiguous blocks
2328 * @blen: the length of the block run
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002329 * @meta: 1 if the blocks represent metadata
David Teiglandb3b94fa2006-01-16 16:50:04 +00002330 *
2331 */
2332
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002333void __gfs2_free_blocks(struct gfs2_inode *ip, u64 bstart, u32 blen, int meta)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002334{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002335 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002336 struct gfs2_rgrpd *rgd;
2337
2338 rgd = rgblk_free(sdp, bstart, blen, GFS2_BLKST_FREE);
2339 if (!rgd)
2340 return;
Bob Peterson41db1ab2012-05-09 12:11:35 -04002341 trace_gfs2_block_alloc(ip, rgd, bstart, blen, GFS2_BLKST_FREE);
Steven Whitehousecfc8b542008-11-04 10:25:13 +00002342 rgd->rd_free += blen;
Steven Whitehouse66fc0612012-02-08 12:58:32 +00002343 rgd->rd_flags &= ~GFS2_RGF_TRIMMED;
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002344 gfs2_trans_add_meta(rgd->rd_gl, rgd->rd_bits[0].bi_bh);
Bob Peterson42d52e32008-01-28 18:38:07 -06002345 gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05002346 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, rgd->rd_bits[0].bi_bh->b_data);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002347
Steven Whitehouse6d3117b2011-05-21 14:05:58 +01002348 /* Directories keep their data in the metadata address space */
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002349 if (meta || ip->i_depth)
Steven Whitehouse6d3117b2011-05-21 14:05:58 +01002350 gfs2_meta_wipe(ip, bstart, blen);
Bob Peterson4c16c362011-02-23 16:11:33 -05002351}
David Teiglandb3b94fa2006-01-16 16:50:04 +00002352
Bob Peterson4c16c362011-02-23 16:11:33 -05002353/**
Bob Peterson4c16c362011-02-23 16:11:33 -05002354 * gfs2_free_meta - free a contiguous run of data block(s)
2355 * @ip: the inode these blocks are being freed from
2356 * @bstart: first block of a run of contiguous blocks
2357 * @blen: the length of the block run
2358 *
2359 */
2360
Steven Whitehousecd915492006-09-04 12:49:07 -04002361void gfs2_free_meta(struct gfs2_inode *ip, u64 bstart, u32 blen)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002362{
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002363 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002364
Eric Sandeen46fcb2e2011-06-23 10:39:34 -05002365 __gfs2_free_blocks(ip, bstart, blen, 1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002366 gfs2_statfs_change(sdp, 0, +blen, 0);
Steven Whitehouse2933f922006-11-01 13:23:29 -05002367 gfs2_quota_change(ip, -(s64)blen, ip->i_inode.i_uid, ip->i_inode.i_gid);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002368}
2369
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002370void gfs2_unlink_di(struct inode *inode)
2371{
2372 struct gfs2_inode *ip = GFS2_I(inode);
2373 struct gfs2_sbd *sdp = GFS2_SB(inode);
2374 struct gfs2_rgrpd *rgd;
Steven Whitehousedbb7cae2007-05-15 15:37:50 +01002375 u64 blkno = ip->i_no_addr;
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002376
2377 rgd = rgblk_free(sdp, blkno, 1, GFS2_BLKST_UNLINKED);
2378 if (!rgd)
2379 return;
Bob Peterson41db1ab2012-05-09 12:11:35 -04002380 trace_gfs2_block_alloc(ip, rgd, blkno, 1, GFS2_BLKST_UNLINKED);
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002381 gfs2_trans_add_meta(rgd->rd_gl, rgd->rd_bits[0].bi_bh);
Bob Peterson42d52e32008-01-28 18:38:07 -06002382 gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05002383 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, rgd->rd_bits[0].bi_bh->b_data);
2384 update_rgrp_lvb_unlinked(rgd, 1);
Steven Whitehousefeaa7bb2006-06-14 15:32:57 -04002385}
2386
Steven Whitehousecd915492006-09-04 12:49:07 -04002387static void gfs2_free_uninit_di(struct gfs2_rgrpd *rgd, u64 blkno)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002388{
2389 struct gfs2_sbd *sdp = rgd->rd_sbd;
2390 struct gfs2_rgrpd *tmp_rgd;
2391
2392 tmp_rgd = rgblk_free(sdp, blkno, 1, GFS2_BLKST_FREE);
2393 if (!tmp_rgd)
2394 return;
2395 gfs2_assert_withdraw(sdp, rgd == tmp_rgd);
2396
Steven Whitehouse73f74942008-11-04 10:32:57 +00002397 if (!rgd->rd_dinodes)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002398 gfs2_consist_rgrpd(rgd);
Steven Whitehouse73f74942008-11-04 10:32:57 +00002399 rgd->rd_dinodes--;
Steven Whitehousecfc8b542008-11-04 10:25:13 +00002400 rgd->rd_free++;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002401
Steven Whitehouse350a9b02012-12-14 12:36:02 +00002402 gfs2_trans_add_meta(rgd->rd_gl, rgd->rd_bits[0].bi_bh);
Bob Peterson42d52e32008-01-28 18:38:07 -06002403 gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
Benjamin Marzinski90306c42012-05-29 23:01:09 -05002404 gfs2_rgrp_ondisk2lvb(rgd->rd_rgl, rgd->rd_bits[0].bi_bh->b_data);
2405 update_rgrp_lvb_unlinked(rgd, -1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002406
2407 gfs2_statfs_change(sdp, 0, +1, -1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002408}
2409
David Teiglandb3b94fa2006-01-16 16:50:04 +00002410
2411void gfs2_free_di(struct gfs2_rgrpd *rgd, struct gfs2_inode *ip)
2412{
Steven Whitehousedbb7cae2007-05-15 15:37:50 +01002413 gfs2_free_uninit_di(rgd, ip->i_no_addr);
Bob Peterson41db1ab2012-05-09 12:11:35 -04002414 trace_gfs2_block_alloc(ip, rgd, ip->i_no_addr, 1, GFS2_BLKST_FREE);
Steven Whitehouse2933f922006-11-01 13:23:29 -05002415 gfs2_quota_change(ip, -1, ip->i_inode.i_uid, ip->i_inode.i_gid);
Steven Whitehousedbb7cae2007-05-15 15:37:50 +01002416 gfs2_meta_wipe(ip, ip->i_no_addr, 1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002417}
2418
2419/**
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002420 * gfs2_check_blk_type - Check the type of a block
2421 * @sdp: The superblock
2422 * @no_addr: The block number to check
2423 * @type: The block type we are looking for
2424 *
2425 * Returns: 0 if the block type matches the expected type
2426 * -ESTALE if it doesn't match
2427 * or -ve errno if something went wrong while checking
2428 */
2429
2430int gfs2_check_blk_type(struct gfs2_sbd *sdp, u64 no_addr, unsigned int type)
2431{
2432 struct gfs2_rgrpd *rgd;
Steven Whitehouse8339ee52011-08-31 16:38:29 +01002433 struct gfs2_holder rgd_gh;
Bob Peterson58884c42012-03-05 10:19:35 -05002434 int error = -EINVAL;
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002435
Steven Whitehouse66fc0612012-02-08 12:58:32 +00002436 rgd = gfs2_blk2rgrpd(sdp, no_addr, 1);
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002437 if (!rgd)
Steven Whitehouse8339ee52011-08-31 16:38:29 +01002438 goto fail;
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002439
2440 error = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_SHARED, 0, &rgd_gh);
2441 if (error)
Steven Whitehouse8339ee52011-08-31 16:38:29 +01002442 goto fail;
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002443
2444 if (gfs2_get_block_type(rgd, no_addr) != type)
2445 error = -ESTALE;
2446
2447 gfs2_glock_dq_uninit(&rgd_gh);
Steven Whitehouseacf7e242009-09-08 18:00:30 +01002448fail:
2449 return error;
2450}
2451
2452/**
David Teiglandb3b94fa2006-01-16 16:50:04 +00002453 * gfs2_rlist_add - add a RG to a list of RGs
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002454 * @ip: the inode
David Teiglandb3b94fa2006-01-16 16:50:04 +00002455 * @rlist: the list of resource groups
2456 * @block: the block
2457 *
2458 * Figure out what RG a block belongs to and add that RG to the list
2459 *
2460 * FIXME: Don't use NOFAIL
2461 *
2462 */
2463
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002464void gfs2_rlist_add(struct gfs2_inode *ip, struct gfs2_rgrp_list *rlist,
Steven Whitehousecd915492006-09-04 12:49:07 -04002465 u64 block)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002466{
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002467 struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002468 struct gfs2_rgrpd *rgd;
2469 struct gfs2_rgrpd **tmp;
2470 unsigned int new_space;
2471 unsigned int x;
2472
2473 if (gfs2_assert_warn(sdp, !rlist->rl_ghs))
2474 return;
2475
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002476 if (ip->i_rgd && rgrp_contains_block(ip->i_rgd, block))
2477 rgd = ip->i_rgd;
2478 else
Steven Whitehouse66fc0612012-02-08 12:58:32 +00002479 rgd = gfs2_blk2rgrpd(sdp, block, 1);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002480 if (!rgd) {
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002481 fs_err(sdp, "rlist_add: no rgrp for block %llu\n", (unsigned long long)block);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002482 return;
2483 }
Steven Whitehouse70b0c362011-09-02 16:08:09 +01002484 ip->i_rgd = rgd;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002485
2486 for (x = 0; x < rlist->rl_rgrps; x++)
2487 if (rlist->rl_rgd[x] == rgd)
2488 return;
2489
2490 if (rlist->rl_rgrps == rlist->rl_space) {
2491 new_space = rlist->rl_space + 10;
2492
2493 tmp = kcalloc(new_space, sizeof(struct gfs2_rgrpd *),
Steven Whitehousedd894be2006-07-27 14:29:00 -04002494 GFP_NOFS | __GFP_NOFAIL);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002495
2496 if (rlist->rl_rgd) {
2497 memcpy(tmp, rlist->rl_rgd,
2498 rlist->rl_space * sizeof(struct gfs2_rgrpd *));
2499 kfree(rlist->rl_rgd);
2500 }
2501
2502 rlist->rl_space = new_space;
2503 rlist->rl_rgd = tmp;
2504 }
2505
2506 rlist->rl_rgd[rlist->rl_rgrps++] = rgd;
2507}
2508
2509/**
2510 * gfs2_rlist_alloc - all RGs have been added to the rlist, now allocate
2511 * and initialize an array of glock holders for them
2512 * @rlist: the list of resource groups
2513 * @state: the lock state to acquire the RG lock in
David Teiglandb3b94fa2006-01-16 16:50:04 +00002514 *
2515 * FIXME: Don't use NOFAIL
2516 *
2517 */
2518
Bob Petersonfe6c9912008-01-28 11:13:02 -06002519void gfs2_rlist_alloc(struct gfs2_rgrp_list *rlist, unsigned int state)
David Teiglandb3b94fa2006-01-16 16:50:04 +00002520{
2521 unsigned int x;
2522
2523 rlist->rl_ghs = kcalloc(rlist->rl_rgrps, sizeof(struct gfs2_holder),
Steven Whitehousedd894be2006-07-27 14:29:00 -04002524 GFP_NOFS | __GFP_NOFAIL);
David Teiglandb3b94fa2006-01-16 16:50:04 +00002525 for (x = 0; x < rlist->rl_rgrps; x++)
2526 gfs2_holder_init(rlist->rl_rgd[x]->rd_gl,
Bob Petersonfe6c9912008-01-28 11:13:02 -06002527 state, 0,
David Teiglandb3b94fa2006-01-16 16:50:04 +00002528 &rlist->rl_ghs[x]);
2529}
2530
2531/**
2532 * gfs2_rlist_free - free a resource group list
Fabian Frederick27ff6a02014-07-02 22:05:27 +02002533 * @rlist: the list of resource groups
David Teiglandb3b94fa2006-01-16 16:50:04 +00002534 *
2535 */
2536
2537void gfs2_rlist_free(struct gfs2_rgrp_list *rlist)
2538{
2539 unsigned int x;
2540
2541 kfree(rlist->rl_rgd);
2542
2543 if (rlist->rl_ghs) {
2544 for (x = 0; x < rlist->rl_rgrps; x++)
2545 gfs2_holder_uninit(&rlist->rl_ghs[x]);
2546 kfree(rlist->rl_ghs);
Bob Peterson8e2e0042012-07-19 08:12:40 -04002547 rlist->rl_ghs = NULL;
David Teiglandb3b94fa2006-01-16 16:50:04 +00002548 }
2549}
2550