1 /*
2  * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
3  * Copyright (C) 2004-2008 Red Hat, Inc.  All rights reserved.
4  *
5  * This copyrighted material is made available to anyone wishing to use,
6  * modify, copy, or redistribute it subject to the terms and conditions
7  * of the GNU General Public License version 2.
8  */
9 
10 #include <linux/slab.h>
11 #include <linux/spinlock.h>
12 #include <linux/completion.h>
13 #include <linux/buffer_head.h>
14 #include <linux/fs.h>
15 #include <linux/gfs2_ondisk.h>
16 #include <linux/prefetch.h>
17 #include <linux/blkdev.h>
18 
19 #include "gfs2.h"
20 #include "incore.h"
21 #include "glock.h"
22 #include "glops.h"
23 #include "lops.h"
24 #include "meta_io.h"
25 #include "quota.h"
26 #include "rgrp.h"
27 #include "super.h"
28 #include "trans.h"
29 #include "util.h"
30 #include "log.h"
31 #include "inode.h"
32 #include "trace_gfs2.h"
33 
34 #define BFITNOENT ((u32)~0)
35 #define NO_BLOCK ((u64)~0)
36 
37 #if BITS_PER_LONG == 32
38 #define LBITMASK   (0x55555555UL)
39 #define LBITSKIP55 (0x55555555UL)
40 #define LBITSKIP00 (0x00000000UL)
41 #else
42 #define LBITMASK   (0x5555555555555555UL)
43 #define LBITSKIP55 (0x5555555555555555UL)
44 #define LBITSKIP00 (0x0000000000000000UL)
45 #endif
46 
47 /*
48  * These routines are used by the resource group routines (rgrp.c)
49  * to keep track of block allocation.  Each block is represented by two
50  * bits.  So, each byte represents GFS2_NBBY (i.e. 4) blocks.
51  *
52  * 0 = Free
53  * 1 = Used (not metadata)
54  * 2 = Unlinked (still in use) inode
55  * 3 = Used (metadata)
56  */
57 
58 static const char valid_change[16] = {
59 	        /* current */
60 	/* n */ 0, 1, 1, 1,
61 	/* e */ 1, 0, 0, 0,
62 	/* w */ 0, 0, 0, 1,
63 	        1, 0, 0, 0
64 };
65 
66 static u32 rgblk_search(struct gfs2_rgrpd *rgd, u32 goal,
67                         unsigned char old_state, unsigned char new_state,
68 			unsigned int *n);
69 
70 /**
71  * gfs2_setbit - Set a bit in the bitmaps
72  * @buffer: the buffer that holds the bitmaps
73  * @buflen: the length (in bytes) of the buffer
74  * @block: the block to set
75  * @new_state: the new state of the block
76  *
77  */
78 
gfs2_setbit(struct gfs2_rgrpd * rgd,unsigned char * buf1,unsigned char * buf2,unsigned int offset,unsigned int buflen,u32 block,unsigned char new_state)79 static inline void gfs2_setbit(struct gfs2_rgrpd *rgd, unsigned char *buf1,
80 			       unsigned char *buf2, unsigned int offset,
81 			       unsigned int buflen, u32 block,
82 			       unsigned char new_state)
83 {
84 	unsigned char *byte1, *byte2, *end, cur_state;
85 	const unsigned int bit = (block % GFS2_NBBY) * GFS2_BIT_SIZE;
86 
87 	byte1 = buf1 + offset + (block / GFS2_NBBY);
88 	end = buf1 + offset + buflen;
89 
90 	BUG_ON(byte1 >= end);
91 
92 	cur_state = (*byte1 >> bit) & GFS2_BIT_MASK;
93 
94 	if (unlikely(!valid_change[new_state * 4 + cur_state])) {
95 		gfs2_consist_rgrpd(rgd);
96 		return;
97 	}
98 	*byte1 ^= (cur_state ^ new_state) << bit;
99 
100 	if (buf2) {
101 		byte2 = buf2 + offset + (block / GFS2_NBBY);
102 		cur_state = (*byte2 >> bit) & GFS2_BIT_MASK;
103 		*byte2 ^= (cur_state ^ new_state) << bit;
104 	}
105 }
106 
107 /**
108  * gfs2_testbit - test a bit in the bitmaps
109  * @buffer: the buffer that holds the bitmaps
110  * @buflen: the length (in bytes) of the buffer
111  * @block: the block to read
112  *
113  */
114 
gfs2_testbit(struct gfs2_rgrpd * rgd,const unsigned char * buffer,unsigned int buflen,u32 block)115 static inline unsigned char gfs2_testbit(struct gfs2_rgrpd *rgd,
116 					 const unsigned char *buffer,
117 					 unsigned int buflen, u32 block)
118 {
119 	const unsigned char *byte, *end;
120 	unsigned char cur_state;
121 	unsigned int bit;
122 
123 	byte = buffer + (block / GFS2_NBBY);
124 	bit = (block % GFS2_NBBY) * GFS2_BIT_SIZE;
125 	end = buffer + buflen;
126 
127 	gfs2_assert(rgd->rd_sbd, byte < end);
128 
129 	cur_state = (*byte >> bit) & GFS2_BIT_MASK;
130 
131 	return cur_state;
132 }
133 
134 /**
135  * gfs2_bit_search
136  * @ptr: Pointer to bitmap data
137  * @mask: Mask to use (normally 0x55555.... but adjusted for search start)
138  * @state: The state we are searching for
139  *
140  * We xor the bitmap data with a patter which is the bitwise opposite
141  * of what we are looking for, this gives rise to a pattern of ones
142  * wherever there is a match. Since we have two bits per entry, we
143  * take this pattern, shift it down by one place and then and it with
144  * the original. All the even bit positions (0,2,4, etc) then represent
145  * successful matches, so we mask with 0x55555..... to remove the unwanted
146  * odd bit positions.
147  *
148  * This allows searching of a whole u64 at once (32 blocks) with a
149  * single test (on 64 bit arches).
150  */
151 
gfs2_bit_search(const __le64 * ptr,u64 mask,u8 state)152 static inline u64 gfs2_bit_search(const __le64 *ptr, u64 mask, u8 state)
153 {
154 	u64 tmp;
155 	static const u64 search[] = {
156 		[0] = 0xffffffffffffffffULL,
157 		[1] = 0xaaaaaaaaaaaaaaaaULL,
158 		[2] = 0x5555555555555555ULL,
159 		[3] = 0x0000000000000000ULL,
160 	};
161 	tmp = le64_to_cpu(*ptr) ^ search[state];
162 	tmp &= (tmp >> 1);
163 	tmp &= mask;
164 	return tmp;
165 }
166 
167 /**
168  * gfs2_bitfit - Search an rgrp's bitmap buffer to find a bit-pair representing
169  *       a block in a given allocation state.
170  * @buffer: the buffer that holds the bitmaps
171  * @len: the length (in bytes) of the buffer
172  * @goal: start search at this block's bit-pair (within @buffer)
173  * @state: GFS2_BLKST_XXX the state of the block we're looking for.
174  *
175  * Scope of @goal and returned block number is only within this bitmap buffer,
176  * not entire rgrp or filesystem.  @buffer will be offset from the actual
177  * beginning of a bitmap block buffer, skipping any header structures, but
178  * headers are always a multiple of 64 bits long so that the buffer is
179  * always aligned to a 64 bit boundary.
180  *
181  * The size of the buffer is in bytes, but is it assumed that it is
182  * always ok to read a complete multiple of 64 bits at the end
183  * of the block in case the end is no aligned to a natural boundary.
184  *
185  * Return: the block number (bitmap buffer scope) that was found
186  */
187 
gfs2_bitfit(const u8 * buf,const unsigned int len,u32 goal,u8 state)188 static u32 gfs2_bitfit(const u8 *buf, const unsigned int len,
189 		       u32 goal, u8 state)
190 {
191 	u32 spoint = (goal << 1) & ((8*sizeof(u64)) - 1);
192 	const __le64 *ptr = ((__le64 *)buf) + (goal >> 5);
193 	const __le64 *end = (__le64 *)(buf + ALIGN(len, sizeof(u64)));
194 	u64 tmp;
195 	u64 mask = 0x5555555555555555ULL;
196 	u32 bit;
197 
198 	BUG_ON(state > 3);
199 
200 	/* Mask off bits we don't care about at the start of the search */
201 	mask <<= spoint;
202 	tmp = gfs2_bit_search(ptr, mask, state);
203 	ptr++;
204 	while(tmp == 0 && ptr < end) {
205 		tmp = gfs2_bit_search(ptr, 0x5555555555555555ULL, state);
206 		ptr++;
207 	}
208 	/* Mask off any bits which are more than len bytes from the start */
209 	if (ptr == end && (len & (sizeof(u64) - 1)))
210 		tmp &= (((u64)~0) >> (64 - 8*(len & (sizeof(u64) - 1))));
211 	/* Didn't find anything, so return */
212 	if (tmp == 0)
213 		return BFITNOENT;
214 	ptr--;
215 	bit = __ffs64(tmp);
216 	bit /= 2;	/* two bits per entry in the bitmap */
217 	return (((const unsigned char *)ptr - buf) * GFS2_NBBY) + bit;
218 }
219 
220 /**
221  * gfs2_bitcount - count the number of bits in a certain state
222  * @buffer: the buffer that holds the bitmaps
223  * @buflen: the length (in bytes) of the buffer
224  * @state: the state of the block we're looking for
225  *
226  * Returns: The number of bits
227  */
228 
gfs2_bitcount(struct gfs2_rgrpd * rgd,const u8 * buffer,unsigned int buflen,u8 state)229 static u32 gfs2_bitcount(struct gfs2_rgrpd *rgd, const u8 *buffer,
230 			 unsigned int buflen, u8 state)
231 {
232 	const u8 *byte = buffer;
233 	const u8 *end = buffer + buflen;
234 	const u8 state1 = state << 2;
235 	const u8 state2 = state << 4;
236 	const u8 state3 = state << 6;
237 	u32 count = 0;
238 
239 	for (; byte < end; byte++) {
240 		if (((*byte) & 0x03) == state)
241 			count++;
242 		if (((*byte) & 0x0C) == state1)
243 			count++;
244 		if (((*byte) & 0x30) == state2)
245 			count++;
246 		if (((*byte) & 0xC0) == state3)
247 			count++;
248 	}
249 
250 	return count;
251 }
252 
253 /**
254  * gfs2_rgrp_verify - Verify that a resource group is consistent
255  * @sdp: the filesystem
256  * @rgd: the rgrp
257  *
258  */
259 
gfs2_rgrp_verify(struct gfs2_rgrpd * rgd)260 void gfs2_rgrp_verify(struct gfs2_rgrpd *rgd)
261 {
262 	struct gfs2_sbd *sdp = rgd->rd_sbd;
263 	struct gfs2_bitmap *bi = NULL;
264 	u32 length = rgd->rd_length;
265 	u32 count[4], tmp;
266 	int buf, x;
267 
268 	memset(count, 0, 4 * sizeof(u32));
269 
270 	/* Count # blocks in each of 4 possible allocation states */
271 	for (buf = 0; buf < length; buf++) {
272 		bi = rgd->rd_bits + buf;
273 		for (x = 0; x < 4; x++)
274 			count[x] += gfs2_bitcount(rgd,
275 						  bi->bi_bh->b_data +
276 						  bi->bi_offset,
277 						  bi->bi_len, x);
278 	}
279 
280 	if (count[0] != rgd->rd_free) {
281 		if (gfs2_consist_rgrpd(rgd))
282 			fs_err(sdp, "free data mismatch:  %u != %u\n",
283 			       count[0], rgd->rd_free);
284 		return;
285 	}
286 
287 	tmp = rgd->rd_data - rgd->rd_free - rgd->rd_dinodes;
288 	if (count[1] != tmp) {
289 		if (gfs2_consist_rgrpd(rgd))
290 			fs_err(sdp, "used data mismatch:  %u != %u\n",
291 			       count[1], tmp);
292 		return;
293 	}
294 
295 	if (count[2] + count[3] != rgd->rd_dinodes) {
296 		if (gfs2_consist_rgrpd(rgd))
297 			fs_err(sdp, "used metadata mismatch:  %u != %u\n",
298 			       count[2] + count[3], rgd->rd_dinodes);
299 		return;
300 	}
301 }
302 
rgrp_contains_block(struct gfs2_rgrpd * rgd,u64 block)303 static inline int rgrp_contains_block(struct gfs2_rgrpd *rgd, u64 block)
304 {
305 	u64 first = rgd->rd_data0;
306 	u64 last = first + rgd->rd_data;
307 	return first <= block && block < last;
308 }
309 
310 /**
311  * gfs2_blk2rgrpd - Find resource group for a given data/meta block number
312  * @sdp: The GFS2 superblock
313  * @n: The data block number
314  *
315  * Returns: The resource group, or NULL if not found
316  */
317 
gfs2_blk2rgrpd(struct gfs2_sbd * sdp,u64 blk)318 struct gfs2_rgrpd *gfs2_blk2rgrpd(struct gfs2_sbd *sdp, u64 blk)
319 {
320 	struct gfs2_rgrpd *rgd;
321 
322 	spin_lock(&sdp->sd_rindex_spin);
323 
324 	list_for_each_entry(rgd, &sdp->sd_rindex_mru_list, rd_list_mru) {
325 		if (rgrp_contains_block(rgd, blk)) {
326 			list_move(&rgd->rd_list_mru, &sdp->sd_rindex_mru_list);
327 			spin_unlock(&sdp->sd_rindex_spin);
328 			return rgd;
329 		}
330 	}
331 
332 	spin_unlock(&sdp->sd_rindex_spin);
333 
334 	return NULL;
335 }
336 
337 /**
338  * gfs2_rgrpd_get_first - get the first Resource Group in the filesystem
339  * @sdp: The GFS2 superblock
340  *
341  * Returns: The first rgrp in the filesystem
342  */
343 
gfs2_rgrpd_get_first(struct gfs2_sbd * sdp)344 struct gfs2_rgrpd *gfs2_rgrpd_get_first(struct gfs2_sbd *sdp)
345 {
346 	gfs2_assert(sdp, !list_empty(&sdp->sd_rindex_list));
347 	return list_entry(sdp->sd_rindex_list.next, struct gfs2_rgrpd, rd_list);
348 }
349 
350 /**
351  * gfs2_rgrpd_get_next - get the next RG
352  * @rgd: A RG
353  *
354  * Returns: The next rgrp
355  */
356 
gfs2_rgrpd_get_next(struct gfs2_rgrpd * rgd)357 struct gfs2_rgrpd *gfs2_rgrpd_get_next(struct gfs2_rgrpd *rgd)
358 {
359 	if (rgd->rd_list.next == &rgd->rd_sbd->sd_rindex_list)
360 		return NULL;
361 	return list_entry(rgd->rd_list.next, struct gfs2_rgrpd, rd_list);
362 }
363 
clear_rgrpdi(struct gfs2_sbd * sdp)364 static void clear_rgrpdi(struct gfs2_sbd *sdp)
365 {
366 	struct list_head *head;
367 	struct gfs2_rgrpd *rgd;
368 	struct gfs2_glock *gl;
369 
370 	spin_lock(&sdp->sd_rindex_spin);
371 	sdp->sd_rindex_forward = NULL;
372 	spin_unlock(&sdp->sd_rindex_spin);
373 
374 	head = &sdp->sd_rindex_list;
375 	while (!list_empty(head)) {
376 		rgd = list_entry(head->next, struct gfs2_rgrpd, rd_list);
377 		gl = rgd->rd_gl;
378 
379 		list_del(&rgd->rd_list);
380 		list_del(&rgd->rd_list_mru);
381 
382 		if (gl) {
383 			gl->gl_object = NULL;
384 			gfs2_glock_put(gl);
385 		}
386 
387 		kfree(rgd->rd_bits);
388 		kmem_cache_free(gfs2_rgrpd_cachep, rgd);
389 	}
390 }
391 
gfs2_clear_rgrpd(struct gfs2_sbd * sdp)392 void gfs2_clear_rgrpd(struct gfs2_sbd *sdp)
393 {
394 	mutex_lock(&sdp->sd_rindex_mutex);
395 	clear_rgrpdi(sdp);
396 	mutex_unlock(&sdp->sd_rindex_mutex);
397 }
398 
gfs2_rindex_print(const struct gfs2_rgrpd * rgd)399 static void gfs2_rindex_print(const struct gfs2_rgrpd *rgd)
400 {
401 	printk(KERN_INFO "  ri_addr = %llu\n", (unsigned long long)rgd->rd_addr);
402 	printk(KERN_INFO "  ri_length = %u\n", rgd->rd_length);
403 	printk(KERN_INFO "  ri_data0 = %llu\n", (unsigned long long)rgd->rd_data0);
404 	printk(KERN_INFO "  ri_data = %u\n", rgd->rd_data);
405 	printk(KERN_INFO "  ri_bitbytes = %u\n", rgd->rd_bitbytes);
406 }
407 
408 /**
409  * gfs2_compute_bitstructs - Compute the bitmap sizes
410  * @rgd: The resource group descriptor
411  *
412  * Calculates bitmap descriptors, one for each block that contains bitmap data
413  *
414  * Returns: errno
415  */
416 
compute_bitstructs(struct gfs2_rgrpd * rgd)417 static int compute_bitstructs(struct gfs2_rgrpd *rgd)
418 {
419 	struct gfs2_sbd *sdp = rgd->rd_sbd;
420 	struct gfs2_bitmap *bi;
421 	u32 length = rgd->rd_length; /* # blocks in hdr & bitmap */
422 	u32 bytes_left, bytes;
423 	int x;
424 
425 	if (!length)
426 		return -EINVAL;
427 
428 	rgd->rd_bits = kcalloc(length, sizeof(struct gfs2_bitmap), GFP_NOFS);
429 	if (!rgd->rd_bits)
430 		return -ENOMEM;
431 
432 	bytes_left = rgd->rd_bitbytes;
433 
434 	for (x = 0; x < length; x++) {
435 		bi = rgd->rd_bits + x;
436 
437 		bi->bi_flags = 0;
438 		/* small rgrp; bitmap stored completely in header block */
439 		if (length == 1) {
440 			bytes = bytes_left;
441 			bi->bi_offset = sizeof(struct gfs2_rgrp);
442 			bi->bi_start = 0;
443 			bi->bi_len = bytes;
444 		/* header block */
445 		} else if (x == 0) {
446 			bytes = sdp->sd_sb.sb_bsize - sizeof(struct gfs2_rgrp);
447 			bi->bi_offset = sizeof(struct gfs2_rgrp);
448 			bi->bi_start = 0;
449 			bi->bi_len = bytes;
450 		/* last block */
451 		} else if (x + 1 == length) {
452 			bytes = bytes_left;
453 			bi->bi_offset = sizeof(struct gfs2_meta_header);
454 			bi->bi_start = rgd->rd_bitbytes - bytes_left;
455 			bi->bi_len = bytes;
456 		/* other blocks */
457 		} else {
458 			bytes = sdp->sd_sb.sb_bsize -
459 				sizeof(struct gfs2_meta_header);
460 			bi->bi_offset = sizeof(struct gfs2_meta_header);
461 			bi->bi_start = rgd->rd_bitbytes - bytes_left;
462 			bi->bi_len = bytes;
463 		}
464 
465 		bytes_left -= bytes;
466 	}
467 
468 	if (bytes_left) {
469 		gfs2_consist_rgrpd(rgd);
470 		return -EIO;
471 	}
472 	bi = rgd->rd_bits + (length - 1);
473 	if ((bi->bi_start + bi->bi_len) * GFS2_NBBY != rgd->rd_data) {
474 		if (gfs2_consist_rgrpd(rgd)) {
475 			gfs2_rindex_print(rgd);
476 			fs_err(sdp, "start=%u len=%u offset=%u\n",
477 			       bi->bi_start, bi->bi_len, bi->bi_offset);
478 		}
479 		return -EIO;
480 	}
481 
482 	return 0;
483 }
484 
485 /**
486  * gfs2_ri_total - Total up the file system space, according to the rindex.
487  *
488  */
gfs2_ri_total(struct gfs2_sbd * sdp)489 u64 gfs2_ri_total(struct gfs2_sbd *sdp)
490 {
491 	u64 total_data = 0;
492 	struct inode *inode = sdp->sd_rindex;
493 	struct gfs2_inode *ip = GFS2_I(inode);
494 	char buf[sizeof(struct gfs2_rindex)];
495 	struct file_ra_state ra_state;
496 	int error, rgrps;
497 
498 	mutex_lock(&sdp->sd_rindex_mutex);
499 	file_ra_state_init(&ra_state, inode->i_mapping);
500 	for (rgrps = 0;; rgrps++) {
501 		loff_t pos = rgrps * sizeof(struct gfs2_rindex);
502 
503 		if (pos + sizeof(struct gfs2_rindex) > i_size_read(inode))
504 			break;
505 		error = gfs2_internal_read(ip, &ra_state, buf, &pos,
506 					   sizeof(struct gfs2_rindex));
507 		if (error != sizeof(struct gfs2_rindex))
508 			break;
509 		total_data += be32_to_cpu(((struct gfs2_rindex *)buf)->ri_data);
510 	}
511 	mutex_unlock(&sdp->sd_rindex_mutex);
512 	return total_data;
513 }
514 
gfs2_rindex_in(struct gfs2_rgrpd * rgd,const void * buf)515 static void gfs2_rindex_in(struct gfs2_rgrpd *rgd, const void *buf)
516 {
517 	const struct gfs2_rindex *str = buf;
518 
519 	rgd->rd_addr = be64_to_cpu(str->ri_addr);
520 	rgd->rd_length = be32_to_cpu(str->ri_length);
521 	rgd->rd_data0 = be64_to_cpu(str->ri_data0);
522 	rgd->rd_data = be32_to_cpu(str->ri_data);
523 	rgd->rd_bitbytes = be32_to_cpu(str->ri_bitbytes);
524 }
525 
526 /**
527  * read_rindex_entry - Pull in a new resource index entry from the disk
528  * @gl: The glock covering the rindex inode
529  *
530  * Returns: 0 on success, error code otherwise
531  */
532 
read_rindex_entry(struct gfs2_inode * ip,struct file_ra_state * ra_state)533 static int read_rindex_entry(struct gfs2_inode *ip,
534 			     struct file_ra_state *ra_state)
535 {
536 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
537 	loff_t pos = sdp->sd_rgrps * sizeof(struct gfs2_rindex);
538 	char buf[sizeof(struct gfs2_rindex)];
539 	int error;
540 	struct gfs2_rgrpd *rgd;
541 
542 	error = gfs2_internal_read(ip, ra_state, buf, &pos,
543 				   sizeof(struct gfs2_rindex));
544 	if (!error)
545 		return 0;
546 	if (error != sizeof(struct gfs2_rindex)) {
547 		if (error > 0)
548 			error = -EIO;
549 		return error;
550 	}
551 
552 	rgd = kmem_cache_zalloc(gfs2_rgrpd_cachep, GFP_NOFS);
553 	error = -ENOMEM;
554 	if (!rgd)
555 		return error;
556 
557 	mutex_init(&rgd->rd_mutex);
558 	lops_init_le(&rgd->rd_le, &gfs2_rg_lops);
559 	rgd->rd_sbd = sdp;
560 
561 	list_add_tail(&rgd->rd_list, &sdp->sd_rindex_list);
562 	list_add_tail(&rgd->rd_list_mru, &sdp->sd_rindex_mru_list);
563 
564 	gfs2_rindex_in(rgd, buf);
565 	error = compute_bitstructs(rgd);
566 	if (error)
567 		return error;
568 
569 	error = gfs2_glock_get(sdp, rgd->rd_addr,
570 			       &gfs2_rgrp_glops, CREATE, &rgd->rd_gl);
571 	if (error)
572 		return error;
573 
574 	rgd->rd_gl->gl_object = rgd;
575 	rgd->rd_flags &= ~GFS2_RDF_UPTODATE;
576 	return error;
577 }
578 
579 /**
580  * gfs2_ri_update - Pull in a new resource index from the disk
581  * @ip: pointer to the rindex inode
582  *
583  * Returns: 0 on successful update, error code otherwise
584  */
585 
gfs2_ri_update(struct gfs2_inode * ip)586 int gfs2_ri_update(struct gfs2_inode *ip)
587 {
588 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
589 	struct inode *inode = &ip->i_inode;
590 	struct file_ra_state ra_state;
591 	u64 rgrp_count = i_size_read(inode);
592 	struct gfs2_rgrpd *rgd;
593 	unsigned int max_data = 0;
594 	int error;
595 
596 	do_div(rgrp_count, sizeof(struct gfs2_rindex));
597 	clear_rgrpdi(sdp);
598 
599 	file_ra_state_init(&ra_state, inode->i_mapping);
600 	for (sdp->sd_rgrps = 0; sdp->sd_rgrps < rgrp_count; sdp->sd_rgrps++) {
601 		error = read_rindex_entry(ip, &ra_state);
602 		if (error) {
603 			clear_rgrpdi(sdp);
604 			return error;
605 		}
606 	}
607 
608 	list_for_each_entry(rgd, &sdp->sd_rindex_list, rd_list)
609 		if (rgd->rd_data > max_data)
610 			max_data = rgd->rd_data;
611 	sdp->sd_max_rg_data = max_data;
612 	sdp->sd_rindex_uptodate = 1;
613 	return 0;
614 }
615 
616 /**
617  * gfs2_rindex_hold - Grab a lock on the rindex
618  * @sdp: The GFS2 superblock
619  * @ri_gh: the glock holder
620  *
621  * We grab a lock on the rindex inode to make sure that it doesn't
622  * change whilst we are performing an operation. We keep this lock
623  * for quite long periods of time compared to other locks. This
624  * doesn't matter, since it is shared and it is very, very rarely
625  * accessed in the exclusive mode (i.e. only when expanding the filesystem).
626  *
627  * This makes sure that we're using the latest copy of the resource index
628  * special file, which might have been updated if someone expanded the
629  * filesystem (via gfs2_grow utility), which adds new resource groups.
630  *
631  * Returns: 0 on success, error code otherwise
632  */
633 
gfs2_rindex_hold(struct gfs2_sbd * sdp,struct gfs2_holder * ri_gh)634 int gfs2_rindex_hold(struct gfs2_sbd *sdp, struct gfs2_holder *ri_gh)
635 {
636 	struct gfs2_inode *ip = GFS2_I(sdp->sd_rindex);
637 	struct gfs2_glock *gl = ip->i_gl;
638 	int error;
639 
640 	error = gfs2_glock_nq_init(gl, LM_ST_SHARED, 0, ri_gh);
641 	if (error)
642 		return error;
643 
644 	/* Read new copy from disk if we don't have the latest */
645 	if (!sdp->sd_rindex_uptodate) {
646 		mutex_lock(&sdp->sd_rindex_mutex);
647 		if (!sdp->sd_rindex_uptodate) {
648 			error = gfs2_ri_update(ip);
649 			if (error)
650 				gfs2_glock_dq_uninit(ri_gh);
651 		}
652 		mutex_unlock(&sdp->sd_rindex_mutex);
653 	}
654 
655 	return error;
656 }
657 
gfs2_rgrp_in(struct gfs2_rgrpd * rgd,const void * buf)658 static void gfs2_rgrp_in(struct gfs2_rgrpd *rgd, const void *buf)
659 {
660 	const struct gfs2_rgrp *str = buf;
661 	u32 rg_flags;
662 
663 	rg_flags = be32_to_cpu(str->rg_flags);
664 	rg_flags &= ~GFS2_RDF_MASK;
665 	rgd->rd_flags &= GFS2_RDF_MASK;
666 	rgd->rd_flags |= rg_flags;
667 	rgd->rd_free = be32_to_cpu(str->rg_free);
668 	rgd->rd_dinodes = be32_to_cpu(str->rg_dinodes);
669 	rgd->rd_igeneration = be64_to_cpu(str->rg_igeneration);
670 }
671 
gfs2_rgrp_out(struct gfs2_rgrpd * rgd,void * buf)672 static void gfs2_rgrp_out(struct gfs2_rgrpd *rgd, void *buf)
673 {
674 	struct gfs2_rgrp *str = buf;
675 
676 	str->rg_flags = cpu_to_be32(rgd->rd_flags & ~GFS2_RDF_MASK);
677 	str->rg_free = cpu_to_be32(rgd->rd_free);
678 	str->rg_dinodes = cpu_to_be32(rgd->rd_dinodes);
679 	str->__pad = cpu_to_be32(0);
680 	str->rg_igeneration = cpu_to_be64(rgd->rd_igeneration);
681 	memset(&str->rg_reserved, 0, sizeof(str->rg_reserved));
682 }
683 
684 /**
685  * gfs2_rgrp_bh_get - Read in a RG's header and bitmaps
686  * @rgd: the struct gfs2_rgrpd describing the RG to read in
687  *
688  * Read in all of a Resource Group's header and bitmap blocks.
689  * Caller must eventually call gfs2_rgrp_relse() to free the bitmaps.
690  *
691  * Returns: errno
692  */
693 
gfs2_rgrp_bh_get(struct gfs2_rgrpd * rgd)694 int gfs2_rgrp_bh_get(struct gfs2_rgrpd *rgd)
695 {
696 	struct gfs2_sbd *sdp = rgd->rd_sbd;
697 	struct gfs2_glock *gl = rgd->rd_gl;
698 	unsigned int length = rgd->rd_length;
699 	struct gfs2_bitmap *bi;
700 	unsigned int x, y;
701 	int error;
702 
703 	mutex_lock(&rgd->rd_mutex);
704 
705 	spin_lock(&sdp->sd_rindex_spin);
706 	if (rgd->rd_bh_count) {
707 		rgd->rd_bh_count++;
708 		spin_unlock(&sdp->sd_rindex_spin);
709 		mutex_unlock(&rgd->rd_mutex);
710 		return 0;
711 	}
712 	spin_unlock(&sdp->sd_rindex_spin);
713 
714 	for (x = 0; x < length; x++) {
715 		bi = rgd->rd_bits + x;
716 		error = gfs2_meta_read(gl, rgd->rd_addr + x, 0, &bi->bi_bh);
717 		if (error)
718 			goto fail;
719 	}
720 
721 	for (y = length; y--;) {
722 		bi = rgd->rd_bits + y;
723 		error = gfs2_meta_wait(sdp, bi->bi_bh);
724 		if (error)
725 			goto fail;
726 		if (gfs2_metatype_check(sdp, bi->bi_bh, y ? GFS2_METATYPE_RB :
727 					      GFS2_METATYPE_RG)) {
728 			error = -EIO;
729 			goto fail;
730 		}
731 	}
732 
733 	if (!(rgd->rd_flags & GFS2_RDF_UPTODATE)) {
734 		for (x = 0; x < length; x++)
735 			clear_bit(GBF_FULL, &rgd->rd_bits[x].bi_flags);
736 		gfs2_rgrp_in(rgd, (rgd->rd_bits[0].bi_bh)->b_data);
737 		rgd->rd_flags |= (GFS2_RDF_UPTODATE | GFS2_RDF_CHECK);
738 	}
739 
740 	spin_lock(&sdp->sd_rindex_spin);
741 	rgd->rd_free_clone = rgd->rd_free;
742 	rgd->rd_bh_count++;
743 	spin_unlock(&sdp->sd_rindex_spin);
744 
745 	mutex_unlock(&rgd->rd_mutex);
746 
747 	return 0;
748 
749 fail:
750 	while (x--) {
751 		bi = rgd->rd_bits + x;
752 		brelse(bi->bi_bh);
753 		bi->bi_bh = NULL;
754 		gfs2_assert_warn(sdp, !bi->bi_clone);
755 	}
756 	mutex_unlock(&rgd->rd_mutex);
757 
758 	return error;
759 }
760 
gfs2_rgrp_bh_hold(struct gfs2_rgrpd * rgd)761 void gfs2_rgrp_bh_hold(struct gfs2_rgrpd *rgd)
762 {
763 	struct gfs2_sbd *sdp = rgd->rd_sbd;
764 
765 	spin_lock(&sdp->sd_rindex_spin);
766 	gfs2_assert_warn(rgd->rd_sbd, rgd->rd_bh_count);
767 	rgd->rd_bh_count++;
768 	spin_unlock(&sdp->sd_rindex_spin);
769 }
770 
771 /**
772  * gfs2_rgrp_bh_put - Release RG bitmaps read in with gfs2_rgrp_bh_get()
773  * @rgd: the struct gfs2_rgrpd describing the RG to read in
774  *
775  */
776 
gfs2_rgrp_bh_put(struct gfs2_rgrpd * rgd)777 void gfs2_rgrp_bh_put(struct gfs2_rgrpd *rgd)
778 {
779 	struct gfs2_sbd *sdp = rgd->rd_sbd;
780 	int x, length = rgd->rd_length;
781 
782 	spin_lock(&sdp->sd_rindex_spin);
783 	gfs2_assert_warn(rgd->rd_sbd, rgd->rd_bh_count);
784 	if (--rgd->rd_bh_count) {
785 		spin_unlock(&sdp->sd_rindex_spin);
786 		return;
787 	}
788 
789 	for (x = 0; x < length; x++) {
790 		struct gfs2_bitmap *bi = rgd->rd_bits + x;
791 		kfree(bi->bi_clone);
792 		bi->bi_clone = NULL;
793 		brelse(bi->bi_bh);
794 		bi->bi_bh = NULL;
795 	}
796 
797 	spin_unlock(&sdp->sd_rindex_spin);
798 }
799 
gfs2_rgrp_send_discards(struct gfs2_sbd * sdp,u64 offset,const struct gfs2_bitmap * bi)800 static void gfs2_rgrp_send_discards(struct gfs2_sbd *sdp, u64 offset,
801 				    const struct gfs2_bitmap *bi)
802 {
803 	struct super_block *sb = sdp->sd_vfs;
804 	struct block_device *bdev = sb->s_bdev;
805 	const unsigned int sects_per_blk = sdp->sd_sb.sb_bsize /
806 					   bdev_logical_block_size(sb->s_bdev);
807 	u64 blk;
808 	sector_t start = 0;
809 	sector_t nr_sects = 0;
810 	int rv;
811 	unsigned int x;
812 
813 	for (x = 0; x < bi->bi_len; x++) {
814 		const u8 *orig = bi->bi_bh->b_data + bi->bi_offset + x;
815 		const u8 *clone = bi->bi_clone + bi->bi_offset + x;
816 		u8 diff = ~(*orig | (*orig >> 1)) & (*clone | (*clone >> 1));
817 		diff &= 0x55;
818 		if (diff == 0)
819 			continue;
820 		blk = offset + ((bi->bi_start + x) * GFS2_NBBY);
821 		blk *= sects_per_blk; /* convert to sectors */
822 		while(diff) {
823 			if (diff & 1) {
824 				if (nr_sects == 0)
825 					goto start_new_extent;
826 				if ((start + nr_sects) != blk) {
827 					rv = blkdev_issue_discard(bdev, start,
828 							    nr_sects, GFP_NOFS,
829 							    0);
830 					if (rv)
831 						goto fail;
832 					nr_sects = 0;
833 start_new_extent:
834 					start = blk;
835 				}
836 				nr_sects += sects_per_blk;
837 			}
838 			diff >>= 2;
839 			blk += sects_per_blk;
840 		}
841 	}
842 	if (nr_sects) {
843 		rv = blkdev_issue_discard(bdev, start, nr_sects, GFP_NOFS, 0);
844 		if (rv)
845 			goto fail;
846 	}
847 	return;
848 fail:
849 	fs_warn(sdp, "error %d on discard request, turning discards off for this filesystem", rv);
850 	sdp->sd_args.ar_discard = 0;
851 }
852 
gfs2_rgrp_repolish_clones(struct gfs2_rgrpd * rgd)853 void gfs2_rgrp_repolish_clones(struct gfs2_rgrpd *rgd)
854 {
855 	struct gfs2_sbd *sdp = rgd->rd_sbd;
856 	unsigned int length = rgd->rd_length;
857 	unsigned int x;
858 
859 	for (x = 0; x < length; x++) {
860 		struct gfs2_bitmap *bi = rgd->rd_bits + x;
861 		if (!bi->bi_clone)
862 			continue;
863 		if (sdp->sd_args.ar_discard)
864 			gfs2_rgrp_send_discards(sdp, rgd->rd_data0, bi);
865 		clear_bit(GBF_FULL, &bi->bi_flags);
866 		memcpy(bi->bi_clone + bi->bi_offset,
867 		       bi->bi_bh->b_data + bi->bi_offset, bi->bi_len);
868 	}
869 
870 	spin_lock(&sdp->sd_rindex_spin);
871 	rgd->rd_free_clone = rgd->rd_free;
872 	spin_unlock(&sdp->sd_rindex_spin);
873 }
874 
875 /**
876  * gfs2_alloc_get - get the struct gfs2_alloc structure for an inode
877  * @ip: the incore GFS2 inode structure
878  *
879  * Returns: the struct gfs2_alloc
880  */
881 
gfs2_alloc_get(struct gfs2_inode * ip)882 struct gfs2_alloc *gfs2_alloc_get(struct gfs2_inode *ip)
883 {
884 	BUG_ON(ip->i_alloc != NULL);
885 	ip->i_alloc = kzalloc(sizeof(struct gfs2_alloc), GFP_NOFS);
886 	return ip->i_alloc;
887 }
888 
889 /**
890  * try_rgrp_fit - See if a given reservation will fit in a given RG
891  * @rgd: the RG data
892  * @al: the struct gfs2_alloc structure describing the reservation
893  *
894  * If there's room for the requested blocks to be allocated from the RG:
895  *   Sets the $al_rgd field in @al.
896  *
897  * Returns: 1 on success (it fits), 0 on failure (it doesn't fit)
898  */
899 
try_rgrp_fit(struct gfs2_rgrpd * rgd,struct gfs2_alloc * al)900 static int try_rgrp_fit(struct gfs2_rgrpd *rgd, struct gfs2_alloc *al)
901 {
902 	struct gfs2_sbd *sdp = rgd->rd_sbd;
903 	int ret = 0;
904 
905 	if (rgd->rd_flags & (GFS2_RGF_NOALLOC | GFS2_RDF_ERROR))
906 		return 0;
907 
908 	spin_lock(&sdp->sd_rindex_spin);
909 	if (rgd->rd_free_clone >= al->al_requested) {
910 		al->al_rgd = rgd;
911 		ret = 1;
912 	}
913 	spin_unlock(&sdp->sd_rindex_spin);
914 
915 	return ret;
916 }
917 
918 /**
919  * try_rgrp_unlink - Look for any unlinked, allocated, but unused inodes
920  * @rgd: The rgrp
921  *
922  * Returns: 0 if no error
923  *          The inode, if one has been found, in inode.
924  */
925 
try_rgrp_unlink(struct gfs2_rgrpd * rgd,u64 * last_unlinked,u64 skip)926 static void try_rgrp_unlink(struct gfs2_rgrpd *rgd, u64 *last_unlinked, u64 skip)
927 {
928 	u32 goal = 0, block;
929 	u64 no_addr;
930 	struct gfs2_sbd *sdp = rgd->rd_sbd;
931 	unsigned int n;
932 	struct gfs2_glock *gl;
933 	struct gfs2_inode *ip;
934 	int error;
935 	int found = 0;
936 
937 	while (goal < rgd->rd_data) {
938 		down_write(&sdp->sd_log_flush_lock);
939 		n = 1;
940 		block = rgblk_search(rgd, goal, GFS2_BLKST_UNLINKED,
941 				     GFS2_BLKST_UNLINKED, &n);
942 		up_write(&sdp->sd_log_flush_lock);
943 		if (block == BFITNOENT)
944 			break;
945 		/* rgblk_search can return a block < goal, so we need to
946 		   keep it marching forward. */
947 		no_addr = block + rgd->rd_data0;
948 		goal = max(block + 1, goal + 1);
949 		if (*last_unlinked != NO_BLOCK && no_addr <= *last_unlinked)
950 			continue;
951 		if (no_addr == skip)
952 			continue;
953 		*last_unlinked = no_addr;
954 
955 		error = gfs2_glock_get(sdp, no_addr, &gfs2_inode_glops, CREATE, &gl);
956 		if (error)
957 			continue;
958 
959 		/* If the inode is already in cache, we can ignore it here
960 		 * because the existing inode disposal code will deal with
961 		 * it when all refs have gone away. Accessing gl_object like
962 		 * this is not safe in general. Here it is ok because we do
963 		 * not dereference the pointer, and we only need an approx
964 		 * answer to whether it is NULL or not.
965 		 */
966 		ip = gl->gl_object;
967 
968 		if (ip || queue_work(gfs2_delete_workqueue, &gl->gl_delete) == 0)
969 			gfs2_glock_put(gl);
970 		else
971 			found++;
972 
973 		/* Limit reclaim to sensible number of tasks */
974 		if (found > NR_CPUS)
975 			return;
976 	}
977 
978 	rgd->rd_flags &= ~GFS2_RDF_CHECK;
979 	return;
980 }
981 
982 /**
983  * recent_rgrp_next - get next RG from "recent" list
984  * @cur_rgd: current rgrp
985  *
986  * Returns: The next rgrp in the recent list
987  */
988 
recent_rgrp_next(struct gfs2_rgrpd * cur_rgd)989 static struct gfs2_rgrpd *recent_rgrp_next(struct gfs2_rgrpd *cur_rgd)
990 {
991 	struct gfs2_sbd *sdp = cur_rgd->rd_sbd;
992 	struct list_head *head;
993 	struct gfs2_rgrpd *rgd;
994 
995 	spin_lock(&sdp->sd_rindex_spin);
996 	head = &sdp->sd_rindex_mru_list;
997 	if (unlikely(cur_rgd->rd_list_mru.next == head)) {
998 		spin_unlock(&sdp->sd_rindex_spin);
999 		return NULL;
1000 	}
1001 	rgd = list_entry(cur_rgd->rd_list_mru.next, struct gfs2_rgrpd, rd_list_mru);
1002 	spin_unlock(&sdp->sd_rindex_spin);
1003 	return rgd;
1004 }
1005 
1006 /**
1007  * forward_rgrp_get - get an rgrp to try next from full list
1008  * @sdp: The GFS2 superblock
1009  *
1010  * Returns: The rgrp to try next
1011  */
1012 
forward_rgrp_get(struct gfs2_sbd * sdp)1013 static struct gfs2_rgrpd *forward_rgrp_get(struct gfs2_sbd *sdp)
1014 {
1015 	struct gfs2_rgrpd *rgd;
1016 	unsigned int journals = gfs2_jindex_size(sdp);
1017 	unsigned int rg = 0, x;
1018 
1019 	spin_lock(&sdp->sd_rindex_spin);
1020 
1021 	rgd = sdp->sd_rindex_forward;
1022 	if (!rgd) {
1023 		if (sdp->sd_rgrps >= journals)
1024 			rg = sdp->sd_rgrps * sdp->sd_jdesc->jd_jid / journals;
1025 
1026 		for (x = 0, rgd = gfs2_rgrpd_get_first(sdp); x < rg;
1027 		     x++, rgd = gfs2_rgrpd_get_next(rgd))
1028 			/* Do Nothing */;
1029 
1030 		sdp->sd_rindex_forward = rgd;
1031 	}
1032 
1033 	spin_unlock(&sdp->sd_rindex_spin);
1034 
1035 	return rgd;
1036 }
1037 
1038 /**
1039  * forward_rgrp_set - set the forward rgrp pointer
1040  * @sdp: the filesystem
1041  * @rgd: The new forward rgrp
1042  *
1043  */
1044 
forward_rgrp_set(struct gfs2_sbd * sdp,struct gfs2_rgrpd * rgd)1045 static void forward_rgrp_set(struct gfs2_sbd *sdp, struct gfs2_rgrpd *rgd)
1046 {
1047 	spin_lock(&sdp->sd_rindex_spin);
1048 	sdp->sd_rindex_forward = rgd;
1049 	spin_unlock(&sdp->sd_rindex_spin);
1050 }
1051 
1052 /**
1053  * get_local_rgrp - Choose and lock a rgrp for allocation
1054  * @ip: the inode to reserve space for
1055  * @rgp: the chosen and locked rgrp
1056  *
1057  * Try to acquire rgrp in way which avoids contending with others.
1058  *
1059  * Returns: errno
1060  */
1061 
get_local_rgrp(struct gfs2_inode * ip,u64 * last_unlinked)1062 static int get_local_rgrp(struct gfs2_inode *ip, u64 *last_unlinked)
1063 {
1064 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1065 	struct gfs2_rgrpd *rgd, *begin = NULL;
1066 	struct gfs2_alloc *al = ip->i_alloc;
1067 	int flags = LM_FLAG_TRY;
1068 	int skipped = 0;
1069 	int loops = 0;
1070 	int error, rg_locked;
1071 
1072 	rgd = gfs2_blk2rgrpd(sdp, ip->i_goal);
1073 
1074 	while (rgd) {
1075 		rg_locked = 0;
1076 
1077 		if (gfs2_glock_is_locked_by_me(rgd->rd_gl)) {
1078 			rg_locked = 1;
1079 			error = 0;
1080 		} else {
1081 			error = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_EXCLUSIVE,
1082 						   LM_FLAG_TRY, &al->al_rgd_gh);
1083 		}
1084 		switch (error) {
1085 		case 0:
1086 			if (try_rgrp_fit(rgd, al))
1087 				goto out;
1088 			if (rgd->rd_flags & GFS2_RDF_CHECK)
1089 				try_rgrp_unlink(rgd, last_unlinked, ip->i_no_addr);
1090 			if (!rg_locked)
1091 				gfs2_glock_dq_uninit(&al->al_rgd_gh);
1092 			/* fall through */
1093 		case GLR_TRYFAILED:
1094 			rgd = recent_rgrp_next(rgd);
1095 			break;
1096 
1097 		default:
1098 			return error;
1099 		}
1100 	}
1101 
1102 	/* Go through full list of rgrps */
1103 
1104 	begin = rgd = forward_rgrp_get(sdp);
1105 
1106 	for (;;) {
1107 		rg_locked = 0;
1108 
1109 		if (gfs2_glock_is_locked_by_me(rgd->rd_gl)) {
1110 			rg_locked = 1;
1111 			error = 0;
1112 		} else {
1113 			error = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_EXCLUSIVE, flags,
1114 						   &al->al_rgd_gh);
1115 		}
1116 		switch (error) {
1117 		case 0:
1118 			if (try_rgrp_fit(rgd, al))
1119 				goto out;
1120 			if (rgd->rd_flags & GFS2_RDF_CHECK)
1121 				try_rgrp_unlink(rgd, last_unlinked, ip->i_no_addr);
1122 			if (!rg_locked)
1123 				gfs2_glock_dq_uninit(&al->al_rgd_gh);
1124 			break;
1125 
1126 		case GLR_TRYFAILED:
1127 			skipped++;
1128 			break;
1129 
1130 		default:
1131 			return error;
1132 		}
1133 
1134 		rgd = gfs2_rgrpd_get_next(rgd);
1135 		if (!rgd)
1136 			rgd = gfs2_rgrpd_get_first(sdp);
1137 
1138 		if (rgd == begin) {
1139 			if (++loops >= 3)
1140 				return -ENOSPC;
1141 			if (!skipped)
1142 				loops++;
1143 			flags = 0;
1144 			if (loops == 2)
1145 				gfs2_log_flush(sdp, NULL);
1146 		}
1147 	}
1148 
1149 out:
1150 	if (begin) {
1151 		spin_lock(&sdp->sd_rindex_spin);
1152 		list_move(&rgd->rd_list_mru, &sdp->sd_rindex_mru_list);
1153 		spin_unlock(&sdp->sd_rindex_spin);
1154 		rgd = gfs2_rgrpd_get_next(rgd);
1155 		if (!rgd)
1156 			rgd = gfs2_rgrpd_get_first(sdp);
1157 		forward_rgrp_set(sdp, rgd);
1158 	}
1159 
1160 	return 0;
1161 }
1162 
1163 /**
1164  * gfs2_inplace_reserve_i - Reserve space in the filesystem
1165  * @ip: the inode to reserve space for
1166  *
1167  * Returns: errno
1168  */
1169 
gfs2_inplace_reserve_i(struct gfs2_inode * ip,int hold_rindex,char * file,unsigned int line)1170 int gfs2_inplace_reserve_i(struct gfs2_inode *ip, int hold_rindex,
1171 			   char *file, unsigned int line)
1172 {
1173 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1174 	struct gfs2_alloc *al = ip->i_alloc;
1175 	int error = 0;
1176 	u64 last_unlinked = NO_BLOCK;
1177 	int tries = 0;
1178 
1179 	if (gfs2_assert_warn(sdp, al->al_requested))
1180 		return -EINVAL;
1181 
1182 	if (hold_rindex) {
1183 		/* We need to hold the rindex unless the inode we're using is
1184 		   the rindex itself, in which case it's already held. */
1185 		if (ip != GFS2_I(sdp->sd_rindex))
1186 			error = gfs2_rindex_hold(sdp, &al->al_ri_gh);
1187 		else if (!sdp->sd_rgrps) /* We may not have the rindex read
1188 					    in, so: */
1189 			error = gfs2_ri_update(ip);
1190 		if (error)
1191 			return error;
1192 	}
1193 
1194 try_again:
1195 	do {
1196 		error = get_local_rgrp(ip, &last_unlinked);
1197 		/* If there is no space, flushing the log may release some */
1198 		if (error) {
1199 			if (ip == GFS2_I(sdp->sd_rindex) &&
1200 			    !sdp->sd_rindex_uptodate) {
1201 				error = gfs2_ri_update(ip);
1202 				if (error)
1203 					return error;
1204 				goto try_again;
1205 			}
1206 			gfs2_log_flush(sdp, NULL);
1207 		}
1208 	} while (error && tries++ < 3);
1209 
1210 	if (error) {
1211 		if (hold_rindex && ip != GFS2_I(sdp->sd_rindex))
1212 			gfs2_glock_dq_uninit(&al->al_ri_gh);
1213 		return error;
1214 	}
1215 
1216 	/* no error, so we have the rgrp set in the inode's allocation. */
1217 	al->al_file = file;
1218 	al->al_line = line;
1219 
1220 	return 0;
1221 }
1222 
1223 /**
1224  * gfs2_inplace_release - release an inplace reservation
1225  * @ip: the inode the reservation was taken out on
1226  *
1227  * Release a reservation made by gfs2_inplace_reserve().
1228  */
1229 
gfs2_inplace_release(struct gfs2_inode * ip)1230 void gfs2_inplace_release(struct gfs2_inode *ip)
1231 {
1232 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1233 	struct gfs2_alloc *al = ip->i_alloc;
1234 
1235 	if (gfs2_assert_warn(sdp, al->al_alloced <= al->al_requested) == -1)
1236 		fs_warn(sdp, "al_alloced = %u, al_requested = %u "
1237 			     "al_file = %s, al_line = %u\n",
1238 		             al->al_alloced, al->al_requested, al->al_file,
1239 			     al->al_line);
1240 
1241 	al->al_rgd = NULL;
1242 	if (al->al_rgd_gh.gh_gl)
1243 		gfs2_glock_dq_uninit(&al->al_rgd_gh);
1244 	if (ip != GFS2_I(sdp->sd_rindex) && al->al_ri_gh.gh_gl)
1245 		gfs2_glock_dq_uninit(&al->al_ri_gh);
1246 }
1247 
1248 /**
1249  * gfs2_get_block_type - Check a block in a RG is of given type
1250  * @rgd: the resource group holding the block
1251  * @block: the block number
1252  *
1253  * Returns: The block type (GFS2_BLKST_*)
1254  */
1255 
gfs2_get_block_type(struct gfs2_rgrpd * rgd,u64 block)1256 static unsigned char gfs2_get_block_type(struct gfs2_rgrpd *rgd, u64 block)
1257 {
1258 	struct gfs2_bitmap *bi = NULL;
1259 	u32 length, rgrp_block, buf_block;
1260 	unsigned int buf;
1261 	unsigned char type;
1262 
1263 	length = rgd->rd_length;
1264 	rgrp_block = block - rgd->rd_data0;
1265 
1266 	for (buf = 0; buf < length; buf++) {
1267 		bi = rgd->rd_bits + buf;
1268 		if (rgrp_block < (bi->bi_start + bi->bi_len) * GFS2_NBBY)
1269 			break;
1270 	}
1271 
1272 	gfs2_assert(rgd->rd_sbd, buf < length);
1273 	buf_block = rgrp_block - bi->bi_start * GFS2_NBBY;
1274 
1275 	type = gfs2_testbit(rgd, bi->bi_bh->b_data + bi->bi_offset,
1276 			   bi->bi_len, buf_block);
1277 
1278 	return type;
1279 }
1280 
1281 /**
1282  * rgblk_search - find a block in @old_state, change allocation
1283  *           state to @new_state
1284  * @rgd: the resource group descriptor
1285  * @goal: the goal block within the RG (start here to search for avail block)
1286  * @old_state: GFS2_BLKST_XXX the before-allocation state to find
1287  * @new_state: GFS2_BLKST_XXX the after-allocation block state
1288  * @n: The extent length
1289  *
1290  * Walk rgrp's bitmap to find bits that represent a block in @old_state.
1291  * Add the found bitmap buffer to the transaction.
1292  * Set the found bits to @new_state to change block's allocation state.
1293  *
1294  * This function never fails, because we wouldn't call it unless we
1295  * know (from reservation results, etc.) that a block is available.
1296  *
1297  * Scope of @goal and returned block is just within rgrp, not the whole
1298  * filesystem.
1299  *
1300  * Returns:  the block number allocated
1301  */
1302 
rgblk_search(struct gfs2_rgrpd * rgd,u32 goal,unsigned char old_state,unsigned char new_state,unsigned int * n)1303 static u32 rgblk_search(struct gfs2_rgrpd *rgd, u32 goal,
1304 			unsigned char old_state, unsigned char new_state,
1305 			unsigned int *n)
1306 {
1307 	struct gfs2_bitmap *bi = NULL;
1308 	const u32 length = rgd->rd_length;
1309 	u32 blk = BFITNOENT;
1310 	unsigned int buf, x;
1311 	const unsigned int elen = *n;
1312 	const u8 *buffer = NULL;
1313 
1314 	*n = 0;
1315 	/* Find bitmap block that contains bits for goal block */
1316 	for (buf = 0; buf < length; buf++) {
1317 		bi = rgd->rd_bits + buf;
1318 		/* Convert scope of "goal" from rgrp-wide to within found bit block */
1319 		if (goal < (bi->bi_start + bi->bi_len) * GFS2_NBBY) {
1320 			goal -= bi->bi_start * GFS2_NBBY;
1321 			goto do_search;
1322 		}
1323 	}
1324 	buf = 0;
1325 	goal = 0;
1326 
1327 do_search:
1328 	/* Search (up to entire) bitmap in this rgrp for allocatable block.
1329 	   "x <= length", instead of "x < length", because we typically start
1330 	   the search in the middle of a bit block, but if we can't find an
1331 	   allocatable block anywhere else, we want to be able wrap around and
1332 	   search in the first part of our first-searched bit block.  */
1333 	for (x = 0; x <= length; x++) {
1334 		bi = rgd->rd_bits + buf;
1335 
1336 		if (test_bit(GBF_FULL, &bi->bi_flags) &&
1337 		    (old_state == GFS2_BLKST_FREE))
1338 			goto skip;
1339 
1340 		/* The GFS2_BLKST_UNLINKED state doesn't apply to the clone
1341 		   bitmaps, so we must search the originals for that. */
1342 		buffer = bi->bi_bh->b_data + bi->bi_offset;
1343 		if (old_state != GFS2_BLKST_UNLINKED && bi->bi_clone)
1344 			buffer = bi->bi_clone + bi->bi_offset;
1345 
1346 		blk = gfs2_bitfit(buffer, bi->bi_len, goal, old_state);
1347 		if (blk != BFITNOENT)
1348 			break;
1349 
1350 		if ((goal == 0) && (old_state == GFS2_BLKST_FREE))
1351 			set_bit(GBF_FULL, &bi->bi_flags);
1352 
1353 		/* Try next bitmap block (wrap back to rgrp header if at end) */
1354 skip:
1355 		buf++;
1356 		buf %= length;
1357 		goal = 0;
1358 	}
1359 
1360 	if (blk == BFITNOENT)
1361 		return blk;
1362 	*n = 1;
1363 	if (old_state == new_state)
1364 		goto out;
1365 
1366 	gfs2_trans_add_bh(rgd->rd_gl, bi->bi_bh, 1);
1367 	gfs2_setbit(rgd, bi->bi_bh->b_data, bi->bi_clone, bi->bi_offset,
1368 		    bi->bi_len, blk, new_state);
1369 	goal = blk;
1370 	while (*n < elen) {
1371 		goal++;
1372 		if (goal >= (bi->bi_len * GFS2_NBBY))
1373 			break;
1374 		if (gfs2_testbit(rgd, buffer, bi->bi_len, goal) !=
1375 		    GFS2_BLKST_FREE)
1376 			break;
1377 		gfs2_setbit(rgd, bi->bi_bh->b_data, bi->bi_clone, bi->bi_offset,
1378 			    bi->bi_len, goal, new_state);
1379 		(*n)++;
1380 	}
1381 out:
1382 	return (bi->bi_start * GFS2_NBBY) + blk;
1383 }
1384 
1385 /**
1386  * rgblk_free - Change alloc state of given block(s)
1387  * @sdp: the filesystem
1388  * @bstart: the start of a run of blocks to free
1389  * @blen: the length of the block run (all must lie within ONE RG!)
1390  * @new_state: GFS2_BLKST_XXX the after-allocation block state
1391  *
1392  * Returns:  Resource group containing the block(s)
1393  */
1394 
rgblk_free(struct gfs2_sbd * sdp,u64 bstart,u32 blen,unsigned char new_state)1395 static struct gfs2_rgrpd *rgblk_free(struct gfs2_sbd *sdp, u64 bstart,
1396 				     u32 blen, unsigned char new_state)
1397 {
1398 	struct gfs2_rgrpd *rgd;
1399 	struct gfs2_bitmap *bi = NULL;
1400 	u32 length, rgrp_blk, buf_blk;
1401 	unsigned int buf;
1402 
1403 	rgd = gfs2_blk2rgrpd(sdp, bstart);
1404 	if (!rgd) {
1405 		if (gfs2_consist(sdp))
1406 			fs_err(sdp, "block = %llu\n", (unsigned long long)bstart);
1407 		return NULL;
1408 	}
1409 
1410 	length = rgd->rd_length;
1411 
1412 	rgrp_blk = bstart - rgd->rd_data0;
1413 
1414 	while (blen--) {
1415 		for (buf = 0; buf < length; buf++) {
1416 			bi = rgd->rd_bits + buf;
1417 			if (rgrp_blk < (bi->bi_start + bi->bi_len) * GFS2_NBBY)
1418 				break;
1419 		}
1420 
1421 		gfs2_assert(rgd->rd_sbd, buf < length);
1422 
1423 		buf_blk = rgrp_blk - bi->bi_start * GFS2_NBBY;
1424 		rgrp_blk++;
1425 
1426 		if (!bi->bi_clone) {
1427 			bi->bi_clone = kmalloc(bi->bi_bh->b_size,
1428 					       GFP_NOFS | __GFP_NOFAIL);
1429 			memcpy(bi->bi_clone + bi->bi_offset,
1430 			       bi->bi_bh->b_data + bi->bi_offset,
1431 			       bi->bi_len);
1432 		}
1433 		gfs2_trans_add_bh(rgd->rd_gl, bi->bi_bh, 1);
1434 		gfs2_setbit(rgd, bi->bi_bh->b_data, NULL, bi->bi_offset,
1435 			    bi->bi_len, buf_blk, new_state);
1436 	}
1437 
1438 	return rgd;
1439 }
1440 
1441 /**
1442  * gfs2_rgrp_dump - print out an rgrp
1443  * @seq: The iterator
1444  * @gl: The glock in question
1445  *
1446  */
1447 
gfs2_rgrp_dump(struct seq_file * seq,const struct gfs2_glock * gl)1448 int gfs2_rgrp_dump(struct seq_file *seq, const struct gfs2_glock *gl)
1449 {
1450 	const struct gfs2_rgrpd *rgd = gl->gl_object;
1451 	if (rgd == NULL)
1452 		return 0;
1453 	gfs2_print_dbg(seq, " R: n:%llu f:%02x b:%u/%u i:%u\n",
1454 		       (unsigned long long)rgd->rd_addr, rgd->rd_flags,
1455 		       rgd->rd_free, rgd->rd_free_clone, rgd->rd_dinodes);
1456 	return 0;
1457 }
1458 
gfs2_rgrp_error(struct gfs2_rgrpd * rgd)1459 static void gfs2_rgrp_error(struct gfs2_rgrpd *rgd)
1460 {
1461 	struct gfs2_sbd *sdp = rgd->rd_sbd;
1462 	fs_warn(sdp, "rgrp %llu has an error, marking it readonly until umount\n",
1463 		(unsigned long long)rgd->rd_addr);
1464 	fs_warn(sdp, "umount on all nodes and run fsck.gfs2 to fix the error\n");
1465 	gfs2_rgrp_dump(NULL, rgd->rd_gl);
1466 	rgd->rd_flags |= GFS2_RDF_ERROR;
1467 }
1468 
1469 /**
1470  * gfs2_alloc_block - Allocate one or more blocks
1471  * @ip: the inode to allocate the block for
1472  * @bn: Used to return the starting block number
1473  * @n: requested number of blocks/extent length (value/result)
1474  *
1475  * Returns: 0 or error
1476  */
1477 
gfs2_alloc_block(struct gfs2_inode * ip,u64 * bn,unsigned int * n)1478 int gfs2_alloc_block(struct gfs2_inode *ip, u64 *bn, unsigned int *n)
1479 {
1480 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1481 	struct buffer_head *dibh;
1482 	struct gfs2_alloc *al = ip->i_alloc;
1483 	struct gfs2_rgrpd *rgd;
1484 	u32 goal, blk;
1485 	u64 block;
1486 	int error;
1487 
1488 	/* Only happens if there is a bug in gfs2, return something distinctive
1489 	 * to ensure that it is noticed.
1490 	 */
1491 	if (al == NULL)
1492 		return -ECANCELED;
1493 
1494 	rgd = al->al_rgd;
1495 
1496 	if (rgrp_contains_block(rgd, ip->i_goal))
1497 		goal = ip->i_goal - rgd->rd_data0;
1498 	else
1499 		goal = rgd->rd_last_alloc;
1500 
1501 	blk = rgblk_search(rgd, goal, GFS2_BLKST_FREE, GFS2_BLKST_USED, n);
1502 
1503 	/* Since all blocks are reserved in advance, this shouldn't happen */
1504 	if (blk == BFITNOENT)
1505 		goto rgrp_error;
1506 
1507 	rgd->rd_last_alloc = blk;
1508 	block = rgd->rd_data0 + blk;
1509 	ip->i_goal = block;
1510 	error = gfs2_meta_inode_buffer(ip, &dibh);
1511 	if (error == 0) {
1512 		struct gfs2_dinode *di = (struct gfs2_dinode *)dibh->b_data;
1513 		gfs2_trans_add_bh(ip->i_gl, dibh, 1);
1514 		di->di_goal_meta = di->di_goal_data = cpu_to_be64(ip->i_goal);
1515 		brelse(dibh);
1516 	}
1517 	if (rgd->rd_free < *n)
1518 		goto rgrp_error;
1519 
1520 	rgd->rd_free -= *n;
1521 
1522 	gfs2_trans_add_bh(rgd->rd_gl, rgd->rd_bits[0].bi_bh, 1);
1523 	gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
1524 
1525 	al->al_alloced += *n;
1526 
1527 	gfs2_statfs_change(sdp, 0, -(s64)*n, 0);
1528 	gfs2_quota_change(ip, *n, ip->i_inode.i_uid, ip->i_inode.i_gid);
1529 
1530 	spin_lock(&sdp->sd_rindex_spin);
1531 	rgd->rd_free_clone -= *n;
1532 	spin_unlock(&sdp->sd_rindex_spin);
1533 	trace_gfs2_block_alloc(ip, block, *n, GFS2_BLKST_USED);
1534 	*bn = block;
1535 	return 0;
1536 
1537 rgrp_error:
1538 	gfs2_rgrp_error(rgd);
1539 	return -EIO;
1540 }
1541 
1542 /**
1543  * gfs2_alloc_di - Allocate a dinode
1544  * @dip: the directory that the inode is going in
1545  * @bn: the block number which is allocated
1546  * @generation: the generation number of the inode
1547  *
1548  * Returns: 0 on success or error
1549  */
1550 
gfs2_alloc_di(struct gfs2_inode * dip,u64 * bn,u64 * generation)1551 int gfs2_alloc_di(struct gfs2_inode *dip, u64 *bn, u64 *generation)
1552 {
1553 	struct gfs2_sbd *sdp = GFS2_SB(&dip->i_inode);
1554 	struct gfs2_alloc *al = dip->i_alloc;
1555 	struct gfs2_rgrpd *rgd = al->al_rgd;
1556 	u32 blk;
1557 	u64 block;
1558 	unsigned int n = 1;
1559 
1560 	blk = rgblk_search(rgd, rgd->rd_last_alloc,
1561 			   GFS2_BLKST_FREE, GFS2_BLKST_DINODE, &n);
1562 
1563 	/* Since all blocks are reserved in advance, this shouldn't happen */
1564 	if (blk == BFITNOENT)
1565 		goto rgrp_error;
1566 
1567 	rgd->rd_last_alloc = blk;
1568 	block = rgd->rd_data0 + blk;
1569 	if (rgd->rd_free == 0)
1570 		goto rgrp_error;
1571 
1572 	rgd->rd_free--;
1573 	rgd->rd_dinodes++;
1574 	*generation = rgd->rd_igeneration++;
1575 	if (*generation == 0)
1576 		*generation = rgd->rd_igeneration++;
1577 	gfs2_trans_add_bh(rgd->rd_gl, rgd->rd_bits[0].bi_bh, 1);
1578 	gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
1579 
1580 	al->al_alloced++;
1581 
1582 	gfs2_statfs_change(sdp, 0, -1, +1);
1583 	gfs2_trans_add_unrevoke(sdp, block, 1);
1584 
1585 	spin_lock(&sdp->sd_rindex_spin);
1586 	rgd->rd_free_clone--;
1587 	spin_unlock(&sdp->sd_rindex_spin);
1588 	trace_gfs2_block_alloc(dip, block, 1, GFS2_BLKST_DINODE);
1589 	*bn = block;
1590 	return 0;
1591 
1592 rgrp_error:
1593 	gfs2_rgrp_error(rgd);
1594 	return -EIO;
1595 }
1596 
1597 /**
1598  * gfs2_free_data - free a contiguous run of data block(s)
1599  * @ip: the inode these blocks are being freed from
1600  * @bstart: first block of a run of contiguous blocks
1601  * @blen: the length of the block run
1602  *
1603  */
1604 
__gfs2_free_data(struct gfs2_inode * ip,u64 bstart,u32 blen)1605 void __gfs2_free_data(struct gfs2_inode *ip, u64 bstart, u32 blen)
1606 {
1607 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1608 	struct gfs2_rgrpd *rgd;
1609 
1610 	rgd = rgblk_free(sdp, bstart, blen, GFS2_BLKST_FREE);
1611 	if (!rgd)
1612 		return;
1613 	trace_gfs2_block_alloc(ip, bstart, blen, GFS2_BLKST_FREE);
1614 	rgd->rd_free += blen;
1615 
1616 	gfs2_trans_add_bh(rgd->rd_gl, rgd->rd_bits[0].bi_bh, 1);
1617 	gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
1618 
1619 	gfs2_trans_add_rg(rgd);
1620 }
1621 
1622 /**
1623  * gfs2_free_data - free a contiguous run of data block(s)
1624  * @ip: the inode these blocks are being freed from
1625  * @bstart: first block of a run of contiguous blocks
1626  * @blen: the length of the block run
1627  *
1628  */
1629 
gfs2_free_data(struct gfs2_inode * ip,u64 bstart,u32 blen)1630 void gfs2_free_data(struct gfs2_inode *ip, u64 bstart, u32 blen)
1631 {
1632 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1633 
1634 	__gfs2_free_data(ip, bstart, blen);
1635 	gfs2_statfs_change(sdp, 0, +blen, 0);
1636 	gfs2_quota_change(ip, -(s64)blen, ip->i_inode.i_uid, ip->i_inode.i_gid);
1637 }
1638 
1639 /**
1640  * gfs2_free_meta - free a contiguous run of data block(s)
1641  * @ip: the inode these blocks are being freed from
1642  * @bstart: first block of a run of contiguous blocks
1643  * @blen: the length of the block run
1644  *
1645  */
1646 
__gfs2_free_meta(struct gfs2_inode * ip,u64 bstart,u32 blen)1647 void __gfs2_free_meta(struct gfs2_inode *ip, u64 bstart, u32 blen)
1648 {
1649 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1650 	struct gfs2_rgrpd *rgd;
1651 
1652 	rgd = rgblk_free(sdp, bstart, blen, GFS2_BLKST_FREE);
1653 	if (!rgd)
1654 		return;
1655 	trace_gfs2_block_alloc(ip, bstart, blen, GFS2_BLKST_FREE);
1656 	rgd->rd_free += blen;
1657 
1658 	gfs2_trans_add_bh(rgd->rd_gl, rgd->rd_bits[0].bi_bh, 1);
1659 	gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
1660 
1661 	gfs2_trans_add_rg(rgd);
1662 	gfs2_meta_wipe(ip, bstart, blen);
1663 }
1664 
1665 /**
1666  * gfs2_free_meta - free a contiguous run of data block(s)
1667  * @ip: the inode these blocks are being freed from
1668  * @bstart: first block of a run of contiguous blocks
1669  * @blen: the length of the block run
1670  *
1671  */
1672 
gfs2_free_meta(struct gfs2_inode * ip,u64 bstart,u32 blen)1673 void gfs2_free_meta(struct gfs2_inode *ip, u64 bstart, u32 blen)
1674 {
1675 	struct gfs2_sbd *sdp = GFS2_SB(&ip->i_inode);
1676 
1677 	__gfs2_free_meta(ip, bstart, blen);
1678 	gfs2_statfs_change(sdp, 0, +blen, 0);
1679 	gfs2_quota_change(ip, -(s64)blen, ip->i_inode.i_uid, ip->i_inode.i_gid);
1680 }
1681 
gfs2_unlink_di(struct inode * inode)1682 void gfs2_unlink_di(struct inode *inode)
1683 {
1684 	struct gfs2_inode *ip = GFS2_I(inode);
1685 	struct gfs2_sbd *sdp = GFS2_SB(inode);
1686 	struct gfs2_rgrpd *rgd;
1687 	u64 blkno = ip->i_no_addr;
1688 
1689 	rgd = rgblk_free(sdp, blkno, 1, GFS2_BLKST_UNLINKED);
1690 	if (!rgd)
1691 		return;
1692 	trace_gfs2_block_alloc(ip, blkno, 1, GFS2_BLKST_UNLINKED);
1693 	gfs2_trans_add_bh(rgd->rd_gl, rgd->rd_bits[0].bi_bh, 1);
1694 	gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
1695 	gfs2_trans_add_rg(rgd);
1696 }
1697 
gfs2_free_uninit_di(struct gfs2_rgrpd * rgd,u64 blkno)1698 static void gfs2_free_uninit_di(struct gfs2_rgrpd *rgd, u64 blkno)
1699 {
1700 	struct gfs2_sbd *sdp = rgd->rd_sbd;
1701 	struct gfs2_rgrpd *tmp_rgd;
1702 
1703 	tmp_rgd = rgblk_free(sdp, blkno, 1, GFS2_BLKST_FREE);
1704 	if (!tmp_rgd)
1705 		return;
1706 	gfs2_assert_withdraw(sdp, rgd == tmp_rgd);
1707 
1708 	if (!rgd->rd_dinodes)
1709 		gfs2_consist_rgrpd(rgd);
1710 	rgd->rd_dinodes--;
1711 	rgd->rd_free++;
1712 
1713 	gfs2_trans_add_bh(rgd->rd_gl, rgd->rd_bits[0].bi_bh, 1);
1714 	gfs2_rgrp_out(rgd, rgd->rd_bits[0].bi_bh->b_data);
1715 
1716 	gfs2_statfs_change(sdp, 0, +1, -1);
1717 	gfs2_trans_add_rg(rgd);
1718 }
1719 
1720 
gfs2_free_di(struct gfs2_rgrpd * rgd,struct gfs2_inode * ip)1721 void gfs2_free_di(struct gfs2_rgrpd *rgd, struct gfs2_inode *ip)
1722 {
1723 	gfs2_free_uninit_di(rgd, ip->i_no_addr);
1724 	trace_gfs2_block_alloc(ip, ip->i_no_addr, 1, GFS2_BLKST_FREE);
1725 	gfs2_quota_change(ip, -1, ip->i_inode.i_uid, ip->i_inode.i_gid);
1726 	gfs2_meta_wipe(ip, ip->i_no_addr, 1);
1727 }
1728 
1729 /**
1730  * gfs2_check_blk_type - Check the type of a block
1731  * @sdp: The superblock
1732  * @no_addr: The block number to check
1733  * @type: The block type we are looking for
1734  *
1735  * Returns: 0 if the block type matches the expected type
1736  *          -ESTALE if it doesn't match
1737  *          or -ve errno if something went wrong while checking
1738  */
1739 
gfs2_check_blk_type(struct gfs2_sbd * sdp,u64 no_addr,unsigned int type)1740 int gfs2_check_blk_type(struct gfs2_sbd *sdp, u64 no_addr, unsigned int type)
1741 {
1742 	struct gfs2_rgrpd *rgd;
1743 	struct gfs2_holder ri_gh, rgd_gh;
1744 	struct gfs2_inode *ip = GFS2_I(sdp->sd_rindex);
1745 	int ri_locked = 0;
1746 	int error;
1747 
1748 	if (!gfs2_glock_is_locked_by_me(ip->i_gl)) {
1749 		error = gfs2_rindex_hold(sdp, &ri_gh);
1750 		if (error)
1751 			goto fail;
1752 		ri_locked = 1;
1753 	}
1754 
1755 	error = -EINVAL;
1756 	rgd = gfs2_blk2rgrpd(sdp, no_addr);
1757 	if (!rgd)
1758 		goto fail_rindex;
1759 
1760 	error = gfs2_glock_nq_init(rgd->rd_gl, LM_ST_SHARED, 0, &rgd_gh);
1761 	if (error)
1762 		goto fail_rindex;
1763 
1764 	if (gfs2_get_block_type(rgd, no_addr) != type)
1765 		error = -ESTALE;
1766 
1767 	gfs2_glock_dq_uninit(&rgd_gh);
1768 fail_rindex:
1769 	if (ri_locked)
1770 		gfs2_glock_dq_uninit(&ri_gh);
1771 fail:
1772 	return error;
1773 }
1774 
1775 /**
1776  * gfs2_rlist_add - add a RG to a list of RGs
1777  * @sdp: the filesystem
1778  * @rlist: the list of resource groups
1779  * @block: the block
1780  *
1781  * Figure out what RG a block belongs to and add that RG to the list
1782  *
1783  * FIXME: Don't use NOFAIL
1784  *
1785  */
1786 
gfs2_rlist_add(struct gfs2_sbd * sdp,struct gfs2_rgrp_list * rlist,u64 block)1787 void gfs2_rlist_add(struct gfs2_sbd *sdp, struct gfs2_rgrp_list *rlist,
1788 		    u64 block)
1789 {
1790 	struct gfs2_rgrpd *rgd;
1791 	struct gfs2_rgrpd **tmp;
1792 	unsigned int new_space;
1793 	unsigned int x;
1794 
1795 	if (gfs2_assert_warn(sdp, !rlist->rl_ghs))
1796 		return;
1797 
1798 	rgd = gfs2_blk2rgrpd(sdp, block);
1799 	if (!rgd) {
1800 		if (gfs2_consist(sdp))
1801 			fs_err(sdp, "block = %llu\n", (unsigned long long)block);
1802 		return;
1803 	}
1804 
1805 	for (x = 0; x < rlist->rl_rgrps; x++)
1806 		if (rlist->rl_rgd[x] == rgd)
1807 			return;
1808 
1809 	if (rlist->rl_rgrps == rlist->rl_space) {
1810 		new_space = rlist->rl_space + 10;
1811 
1812 		tmp = kcalloc(new_space, sizeof(struct gfs2_rgrpd *),
1813 			      GFP_NOFS | __GFP_NOFAIL);
1814 
1815 		if (rlist->rl_rgd) {
1816 			memcpy(tmp, rlist->rl_rgd,
1817 			       rlist->rl_space * sizeof(struct gfs2_rgrpd *));
1818 			kfree(rlist->rl_rgd);
1819 		}
1820 
1821 		rlist->rl_space = new_space;
1822 		rlist->rl_rgd = tmp;
1823 	}
1824 
1825 	rlist->rl_rgd[rlist->rl_rgrps++] = rgd;
1826 }
1827 
1828 /**
1829  * gfs2_rlist_alloc - all RGs have been added to the rlist, now allocate
1830  *      and initialize an array of glock holders for them
1831  * @rlist: the list of resource groups
1832  * @state: the lock state to acquire the RG lock in
1833  * @flags: the modifier flags for the holder structures
1834  *
1835  * FIXME: Don't use NOFAIL
1836  *
1837  */
1838 
gfs2_rlist_alloc(struct gfs2_rgrp_list * rlist,unsigned int state)1839 void gfs2_rlist_alloc(struct gfs2_rgrp_list *rlist, unsigned int state)
1840 {
1841 	unsigned int x;
1842 
1843 	rlist->rl_ghs = kcalloc(rlist->rl_rgrps, sizeof(struct gfs2_holder),
1844 				GFP_NOFS | __GFP_NOFAIL);
1845 	for (x = 0; x < rlist->rl_rgrps; x++)
1846 		gfs2_holder_init(rlist->rl_rgd[x]->rd_gl,
1847 				state, 0,
1848 				&rlist->rl_ghs[x]);
1849 }
1850 
1851 /**
1852  * gfs2_rlist_free - free a resource group list
1853  * @list: the list of resource groups
1854  *
1855  */
1856 
gfs2_rlist_free(struct gfs2_rgrp_list * rlist)1857 void gfs2_rlist_free(struct gfs2_rgrp_list *rlist)
1858 {
1859 	unsigned int x;
1860 
1861 	kfree(rlist->rl_rgd);
1862 
1863 	if (rlist->rl_ghs) {
1864 		for (x = 0; x < rlist->rl_rgrps; x++)
1865 			gfs2_holder_uninit(&rlist->rl_ghs[x]);
1866 		kfree(rlist->rl_ghs);
1867 	}
1868 }
1869 
1870