/* -*- mode: c; c-basic-offset: 8; -*-
 * vim: noexpandtab sw=8 ts=8 sts=0:
 *
 * suballoc.c
 *
 * metadata alloc and free
 * Inspired by ext3 block groups.
 *
 * Copyright (C) 2002, 2004 Oracle.  All rights reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public
 * License along with this program; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 */
26ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
27ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include <linux/fs.h>
28ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include <linux/types.h>
29ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include <linux/slab.h>
30ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include <linux/highmem.h>
31ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
32ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include <cluster/masklog.h>
33ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
34ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "ocfs2.h"
35ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
36ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "alloc.h"
37d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker#include "blockcheck.h"
38ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "dlmglue.h"
39ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "inode.h"
40ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "journal.h"
41ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "localalloc.h"
42ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "suballoc.h"
43ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "super.h"
44ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "sysfile.h"
45ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "uptodate.h"
462f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma#include "ocfs2_trace.h"
47ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
48ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh#include "buffer_head_io.h"
49ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
/*
 * Bit flags describing block group allocation behaviour.
 * NOTE(review): presumably these are the values carried by the `flags`
 * argument of ocfs2_block_group_alloc() and
 * ocfs2_reserve_clusters_with_limit() - confirm against the callers.
 */
#define NOT_ALLOC_NEW_GROUP		0
#define ALLOC_NEW_GROUP			(1 << 0)
#define ALLOC_GROUPS_FROM_GLOBAL	(1 << 1)

/* NOTE(review): users of this limit are outside the visible section. */
#define OCFS2_MAX_TO_STEAL		1024
554d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma
567d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Beckerstruct ocfs2_suballoc_result {
572b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker	u64		sr_bg_blkno;	/* The bg we allocated from.  Set
582b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker					   to 0 when a block group is
592b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker					   contiguous. */
60e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	u64		sr_bg_stable_blkno; /*
61e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					     * Doesn't change, always
62e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					     * set to target block
63e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					     * group descriptor
64e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					     * block.
65e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					     */
66ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	u64		sr_blkno;	/* The first allocated block */
677d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	unsigned int	sr_bit_offset;	/* The bit in the bg */
687d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	unsigned int	sr_bits;	/* How many bits we claimed */
697d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker};
707d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker
71b2b6ebf5f740e015b2155343958f067e594323eaMark Fashehstatic u64 ocfs2_group_from_res(struct ocfs2_suballoc_result *res)
72b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh{
73b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh	if (res->sr_blkno == 0)
74b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh		return 0;
75b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh
76b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh	if (res->sr_bg_blkno)
77b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh		return res->sr_bg_blkno;
78b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh
79b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh	return ocfs2_which_suballoc_group(res->sr_blkno, res->sr_bit_offset);
80b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh}
81b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh
82ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline void ocfs2_debug_bg(struct ocfs2_group_desc *bg);
83ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline void ocfs2_debug_suballoc_inode(struct ocfs2_dinode *fe);
84ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline u16 ocfs2_find_victim_chain(struct ocfs2_chain_list *cl);
851fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fashehstatic int ocfs2_block_group_fill(handle_t *handle,
86ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  struct inode *alloc_inode,
87ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  struct buffer_head *bg_bh,
88ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  u64 group_blkno,
89798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				  unsigned int group_clusters,
90ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  u16 my_chain,
91ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  struct ocfs2_chain_list *cl);
92ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_block_group_alloc(struct ocfs2_super *osb,
93ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				   struct inode *alloc_inode,
941187c968852e3c668f3b9376083851f81f6eee22Joel Becker				   struct buffer_head *bh,
9560ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma				   u64 max_block,
96feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma				   u64 *last_alloc_group,
9760ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma				   int flags);
98ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
99ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_cluster_group_search(struct inode *inode,
100ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				      struct buffer_head *group_bh,
101ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				      u32 bits_wanted, u32 min_bits,
1021187c968852e3c668f3b9376083851f81f6eee22Joel Becker				      u64 max_block,
1037d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				      struct ocfs2_suballoc_result *res);
104ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_block_group_search(struct inode *inode,
105ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *group_bh,
106ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    u32 bits_wanted, u32 min_bits,
1071187c968852e3c668f3b9376083851f81f6eee22Joel Becker				    u64 max_block,
1087d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				    struct ocfs2_suballoc_result *res);
109aa8f8e93c898a0319bcd6c79a9a42fe52abac7d7Joel Beckerstatic int ocfs2_claim_suballoc_bits(struct ocfs2_alloc_context *ac,
1101fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fasheh				     handle_t *handle,
111ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				     u32 bits_wanted,
112ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				     u32 min_bits,
1137d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				     struct ocfs2_suballoc_result *res);
114ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_test_bg_bit_allocatable(struct buffer_head *bg_bh,
115ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					 int nr);
1161fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fashehstatic int ocfs2_relink_block_group(handle_t *handle,
117ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct inode *alloc_inode,
118ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *fe_bh,
119ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *bg_bh,
120ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *prev_bg_bh,
121ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    u16 chain);
122ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline int ocfs2_block_group_reasonably_empty(struct ocfs2_group_desc *bg,
123ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						     u32 wanted);
124ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline u32 ocfs2_desc_bitmap_to_cluster_off(struct inode *inode,
125ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						   u64 bg_blkno,
126ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						   u16 bg_bit_off);
127ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline void ocfs2_block_to_cluster_group(struct inode *inode,
128ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						u64 data_blkno,
129ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						u64 *bg_blkno,
130ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						u16 *bg_bit_off);
1311187c968852e3c668f3b9376083851f81f6eee22Joel Beckerstatic int ocfs2_reserve_clusters_with_limit(struct ocfs2_super *osb,
1321187c968852e3c668f3b9376083851f81f6eee22Joel Becker					     u32 bits_wanted, u64 max_block,
13360ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma					     int flags,
1341187c968852e3c668f3b9376083851f81f6eee22Joel Becker					     struct ocfs2_alloc_context **ac);
135ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1369c7af40b210e87f8fddd97b0badc0a352862234aMark Fashehvoid ocfs2_free_ac_resource(struct ocfs2_alloc_context *ac)
137ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
138da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	struct inode *inode = ac->ac_inode;
139da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh
140da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	if (inode) {
141da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		if (ac->ac_which != OCFS2_AC_USE_LOCAL)
142e63aecb651ba73dffc62f9608ee1b7ae2a0ffd4bMark Fasheh			ocfs2_inode_unlock(inode, 1);
143da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh
144da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		mutex_unlock(&inode->i_mutex);
145da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh
146da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		iput(inode);
1474d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		ac->ac_inode = NULL;
148da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	}
149a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh	brelse(ac->ac_bh);
150a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh	ac->ac_bh = NULL;
151e3b4a97dbe9741a3227c3ed857a0632532fcd386Mark Fasheh	ac->ac_resv = NULL;
152e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ac->ac_find_loc_priv) {
153e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		kfree(ac->ac_find_loc_priv);
154e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		ac->ac_find_loc_priv = NULL;
155e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	}
1564d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma}
1574d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma
/*
 * Tear down an allocation context completely: release the resources it
 * holds via ocfs2_free_ac_resource(), then free the structure itself.
 * @ac must not be used after this call.
 */
void ocfs2_free_alloc_context(struct ocfs2_alloc_context *ac)
{
	ocfs2_free_ac_resource(ac);
	kfree(ac);
}
163ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
164ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic u32 ocfs2_bits_per_group(struct ocfs2_chain_list *cl)
165ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
166ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return (u32)le16_to_cpu(cl->cl_cpg) * (u32)le16_to_cpu(cl->cl_bpc);
167ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
168ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
/*
 * Report a group descriptor validation failure.
 *
 * Relies on two names being in scope at the expansion site: `resize`
 * and `sb`.  When `resize` is zero the failure goes through
 * ocfs2_error(sb, ...); otherwise it is only logged with
 * mlog(ML_ERROR, ...) and a trailing newline is appended to the format.
 */
#define do_error(fmt, ...)						\
	do {								\
		if (!resize) {						\
			ocfs2_error(sb, fmt, ##__VA_ARGS__);		\
		} else {						\
			mlog(ML_ERROR, fmt "\n", ##__VA_ARGS__);	\
		}							\
	} while (0)
17657e3e7971136003c96766346049aa73b82cab079Joel Becker
177970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Beckerstatic int ocfs2_validate_gd_self(struct super_block *sb,
178970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker				  struct buffer_head *bh,
17978c37eb0d5e6a9727b12ea0f1821795ffaa66cfeTao Ma				  int resize)
180970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker{
181970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	struct ocfs2_group_desc *gd = (struct ocfs2_group_desc *)bh->b_data;
182970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
1837bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	if (!OCFS2_IS_VALID_GROUP_DESC(gd)) {
18468f64d471be38631d7196b938d9809802dd467faJoel Becker		do_error("Group descriptor #%llu has bad signature %.*s",
18568f64d471be38631d7196b938d9809802dd467faJoel Becker			 (unsigned long long)bh->b_blocknr, 7,
18657e3e7971136003c96766346049aa73b82cab079Joel Becker			 gd->bg_signature);
18757e3e7971136003c96766346049aa73b82cab079Joel Becker		return -EINVAL;
1887bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	}
1897bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
19068f64d471be38631d7196b938d9809802dd467faJoel Becker	if (le64_to_cpu(gd->bg_blkno) != bh->b_blocknr) {
19168f64d471be38631d7196b938d9809802dd467faJoel Becker		do_error("Group descriptor #%llu has an invalid bg_blkno "
19268f64d471be38631d7196b938d9809802dd467faJoel Becker			 "of %llu",
19368f64d471be38631d7196b938d9809802dd467faJoel Becker			 (unsigned long long)bh->b_blocknr,
19468f64d471be38631d7196b938d9809802dd467faJoel Becker			 (unsigned long long)le64_to_cpu(gd->bg_blkno));
19568f64d471be38631d7196b938d9809802dd467faJoel Becker		return -EINVAL;
19668f64d471be38631d7196b938d9809802dd467faJoel Becker	}
19768f64d471be38631d7196b938d9809802dd467faJoel Becker
19868f64d471be38631d7196b938d9809802dd467faJoel Becker	if (le32_to_cpu(gd->bg_generation) != OCFS2_SB(sb)->fs_generation) {
19968f64d471be38631d7196b938d9809802dd467faJoel Becker		do_error("Group descriptor #%llu has an invalid "
20068f64d471be38631d7196b938d9809802dd467faJoel Becker			 "fs_generation of #%u",
20168f64d471be38631d7196b938d9809802dd467faJoel Becker			 (unsigned long long)bh->b_blocknr,
20268f64d471be38631d7196b938d9809802dd467faJoel Becker			 le32_to_cpu(gd->bg_generation));
20368f64d471be38631d7196b938d9809802dd467faJoel Becker		return -EINVAL;
20468f64d471be38631d7196b938d9809802dd467faJoel Becker	}
20568f64d471be38631d7196b938d9809802dd467faJoel Becker
206970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	if (le16_to_cpu(gd->bg_free_bits_count) > le16_to_cpu(gd->bg_bits)) {
207970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker		do_error("Group descriptor #%llu has bit count %u but "
208970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 "claims that %u are free",
209970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 (unsigned long long)bh->b_blocknr,
210970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 le16_to_cpu(gd->bg_bits),
211970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 le16_to_cpu(gd->bg_free_bits_count));
212970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker		return -EINVAL;
213970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	}
214970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
215970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	if (le16_to_cpu(gd->bg_bits) > (8 * le16_to_cpu(gd->bg_size))) {
216970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker		do_error("Group descriptor #%llu has bit count %u but "
217970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 "max bitmap bits of %u",
218970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 (unsigned long long)bh->b_blocknr,
219970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 le16_to_cpu(gd->bg_bits),
220970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			 8 * le16_to_cpu(gd->bg_size));
221970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker		return -EINVAL;
222970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	}
223970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
224970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	return 0;
225970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker}
226970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
227970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Beckerstatic int ocfs2_validate_gd_parent(struct super_block *sb,
228970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker				    struct ocfs2_dinode *di,
229970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker				    struct buffer_head *bh,
23078c37eb0d5e6a9727b12ea0f1821795ffaa66cfeTao Ma				    int resize)
231970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker{
232970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	unsigned int max_bits;
233970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	struct ocfs2_group_desc *gd = (struct ocfs2_group_desc *)bh->b_data;
234970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
2357bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	if (di->i_blkno != gd->bg_parent_dinode) {
23668f64d471be38631d7196b938d9809802dd467faJoel Becker		do_error("Group descriptor #%llu has bad parent "
23757e3e7971136003c96766346049aa73b82cab079Joel Becker			 "pointer (%llu, expected %llu)",
23868f64d471be38631d7196b938d9809802dd467faJoel Becker			 (unsigned long long)bh->b_blocknr,
23957e3e7971136003c96766346049aa73b82cab079Joel Becker			 (unsigned long long)le64_to_cpu(gd->bg_parent_dinode),
24057e3e7971136003c96766346049aa73b82cab079Joel Becker			 (unsigned long long)le64_to_cpu(di->i_blkno));
24157e3e7971136003c96766346049aa73b82cab079Joel Becker		return -EINVAL;
2427bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	}
2437bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
2447bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	max_bits = le16_to_cpu(di->id2.i_chain.cl_cpg) * le16_to_cpu(di->id2.i_chain.cl_bpc);
2457bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	if (le16_to_cpu(gd->bg_bits) > max_bits) {
24668f64d471be38631d7196b938d9809802dd467faJoel Becker		do_error("Group descriptor #%llu has bit count of %u",
24768f64d471be38631d7196b938d9809802dd467faJoel Becker			 (unsigned long long)bh->b_blocknr,
24857e3e7971136003c96766346049aa73b82cab079Joel Becker			 le16_to_cpu(gd->bg_bits));
24957e3e7971136003c96766346049aa73b82cab079Joel Becker		return -EINVAL;
2507bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	}
2517bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
25278c37eb0d5e6a9727b12ea0f1821795ffaa66cfeTao Ma	/* In resize, we may meet the case bg_chain == cl_next_free_rec. */
25378c37eb0d5e6a9727b12ea0f1821795ffaa66cfeTao Ma	if ((le16_to_cpu(gd->bg_chain) >
25478c37eb0d5e6a9727b12ea0f1821795ffaa66cfeTao Ma	     le16_to_cpu(di->id2.i_chain.cl_next_free_rec)) ||
25578c37eb0d5e6a9727b12ea0f1821795ffaa66cfeTao Ma	    ((le16_to_cpu(gd->bg_chain) ==
25678c37eb0d5e6a9727b12ea0f1821795ffaa66cfeTao Ma	     le16_to_cpu(di->id2.i_chain.cl_next_free_rec)) && !resize)) {
25768f64d471be38631d7196b938d9809802dd467faJoel Becker		do_error("Group descriptor #%llu has bad chain %u",
25868f64d471be38631d7196b938d9809802dd467faJoel Becker			 (unsigned long long)bh->b_blocknr,
25957e3e7971136003c96766346049aa73b82cab079Joel Becker			 le16_to_cpu(gd->bg_chain));
26057e3e7971136003c96766346049aa73b82cab079Joel Becker		return -EINVAL;
2617bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	}
2627bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
263970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	return 0;
264970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker}
2657bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
26657e3e7971136003c96766346049aa73b82cab079Joel Becker#undef do_error
2677bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
268970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker/*
269970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker * This version only prints errors.  It does not fail the filesystem, and
270970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker * exists only for resize.
271970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker */
272970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Beckerint ocfs2_check_group_descriptor(struct super_block *sb,
273970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker				 struct ocfs2_dinode *di,
274970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker				 struct buffer_head *bh)
275970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker{
276970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	int rc;
277d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	struct ocfs2_group_desc *gd = (struct ocfs2_group_desc *)bh->b_data;
278d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker
279d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	BUG_ON(!buffer_uptodate(bh));
280970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
281d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	/*
282d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 * If the ecc fails, we return the error but otherwise
283d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 * leave the filesystem running.  We know any error is
284d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 * local to this block.
285d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 */
286d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	rc = ocfs2_validate_meta_ecc(sb, bh->b_data, &gd->bg_check);
28713723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker	if (rc) {
28813723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker		mlog(ML_ERROR,
28913723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker		     "Checksum failed for group descriptor %llu\n",
29013723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker		     (unsigned long long)bh->b_blocknr);
29113723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker	} else
292d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker		rc = ocfs2_validate_gd_self(sb, bh, 1);
293970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	if (!rc)
294970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker		rc = ocfs2_validate_gd_parent(sb, di, bh, 1);
295970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
296970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	return rc;
297970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker}
298970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
299970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Beckerstatic int ocfs2_validate_group_descriptor(struct super_block *sb,
300970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker					   struct buffer_head *bh)
301970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker{
302d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	int rc;
303d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	struct ocfs2_group_desc *gd = (struct ocfs2_group_desc *)bh->b_data;
304d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker
3052f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_validate_group_descriptor(
3062f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma					(unsigned long long)bh->b_blocknr);
307970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker
308d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	BUG_ON(!buffer_uptodate(bh));
309d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker
310d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	/*
311d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 * If the ecc fails, we return the error but otherwise
312d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 * leave the filesystem running.  We know any error is
313d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 * local to this block.
314d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 */
315d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	rc = ocfs2_validate_meta_ecc(sb, bh->b_data, &gd->bg_check);
316d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	if (rc)
317d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker		return rc;
318d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker
319d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	/*
320d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 * Errors after here are fatal.
321d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker	 */
322d6b32bbb3eae3fb787f1c33bf9f767ca1ddeb208Joel Becker
323970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	return ocfs2_validate_gd_self(sb, bh, 0);
3247bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh}
3257bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
32668f64d471be38631d7196b938d9809802dd467faJoel Beckerint ocfs2_read_group_descriptor(struct inode *inode, struct ocfs2_dinode *di,
32768f64d471be38631d7196b938d9809802dd467faJoel Becker				u64 gd_blkno, struct buffer_head **bh)
32868f64d471be38631d7196b938d9809802dd467faJoel Becker{
32968f64d471be38631d7196b938d9809802dd467faJoel Becker	int rc;
33068f64d471be38631d7196b938d9809802dd467faJoel Becker	struct buffer_head *tmp = *bh;
33168f64d471be38631d7196b938d9809802dd467faJoel Becker
3328cb471e8f82506937fe5e2e9fb0bf90f6b1f1170Joel Becker	rc = ocfs2_read_block(INODE_CACHE(inode), gd_blkno, &tmp,
333970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker			      ocfs2_validate_group_descriptor);
33468f64d471be38631d7196b938d9809802dd467faJoel Becker	if (rc)
33568f64d471be38631d7196b938d9809802dd467faJoel Becker		goto out;
33668f64d471be38631d7196b938d9809802dd467faJoel Becker
337970e4936d7d15f35d00fd15a14f5343ba78b2fc8Joel Becker	rc = ocfs2_validate_gd_parent(inode->i_sb, di, tmp, 0);
33868f64d471be38631d7196b938d9809802dd467faJoel Becker	if (rc) {
33968f64d471be38631d7196b938d9809802dd467faJoel Becker		brelse(tmp);
34068f64d471be38631d7196b938d9809802dd467faJoel Becker		goto out;
34168f64d471be38631d7196b938d9809802dd467faJoel Becker	}
34268f64d471be38631d7196b938d9809802dd467faJoel Becker
34368f64d471be38631d7196b938d9809802dd467faJoel Becker	/* If ocfs2_read_block() got us a new bh, pass it up. */
34468f64d471be38631d7196b938d9809802dd467faJoel Becker	if (!*bh)
34568f64d471be38631d7196b938d9809802dd467faJoel Becker		*bh = tmp;
34668f64d471be38631d7196b938d9809802dd467faJoel Becker
34768f64d471be38631d7196b938d9809802dd467faJoel Beckerout:
34868f64d471be38631d7196b938d9809802dd467faJoel Becker	return rc;
34968f64d471be38631d7196b938d9809802dd467faJoel Becker}
35068f64d471be38631d7196b938d9809802dd467faJoel Becker
351798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerstatic void ocfs2_bg_discontig_add_extent(struct ocfs2_super *osb,
352798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					  struct ocfs2_group_desc *bg,
353798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					  struct ocfs2_chain_list *cl,
35447dea423799d98c53793237ab386a94976f305d5Tao Ma					  u64 p_blkno, unsigned int clusters)
355798db35f4649eac2778381c390ed7d12de9ec767Joel Becker{
356798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_extent_list *el = &bg->bg_list;
357798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_extent_rec *rec;
358798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
3594711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	BUG_ON(!ocfs2_supports_discontig_bg(osb));
360798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (!el->l_next_free_rec)
361798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		el->l_count = cpu_to_le16(ocfs2_extent_recs_per_gd(osb->sb));
362798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	rec = &el->l_recs[le16_to_cpu(el->l_next_free_rec)];
3634711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	rec->e_blkno = cpu_to_le64(p_blkno);
364798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	rec->e_cpos = cpu_to_le32(le16_to_cpu(bg->bg_bits) /
365798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				  le16_to_cpu(cl->cl_bpc));
36647dea423799d98c53793237ab386a94976f305d5Tao Ma	rec->e_leaf_clusters = cpu_to_le16(clusters);
367798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	le16_add_cpu(&bg->bg_bits, clusters * le16_to_cpu(cl->cl_bpc));
3684711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	le16_add_cpu(&bg->bg_free_bits_count,
3694711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		     clusters * le16_to_cpu(cl->cl_bpc));
370798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	le16_add_cpu(&el->l_next_free_rec, 1);
371798db35f4649eac2778381c390ed7d12de9ec767Joel Becker}
372798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
3731fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fashehstatic int ocfs2_block_group_fill(handle_t *handle,
374ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  struct inode *alloc_inode,
375ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  struct buffer_head *bg_bh,
376ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  u64 group_blkno,
377798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				  unsigned int group_clusters,
378ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  u16 my_chain,
379ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				  struct ocfs2_chain_list *cl)
380ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
381ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status = 0;
382798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_super *osb = OCFS2_SB(alloc_inode->i_sb);
383ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *bg = (struct ocfs2_group_desc *) bg_bh->b_data;
384ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct super_block * sb = alloc_inode->i_sb;
385ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
386ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (((unsigned long long) bg_bh->b_blocknr) != group_blkno) {
387b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh		ocfs2_error(alloc_inode->i_sb, "group block (%llu) != "
388b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh			    "b_blocknr (%llu)",
389b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh			    (unsigned long long)group_blkno,
390ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			    (unsigned long long) bg_bh->b_blocknr);
391ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = -EIO;
392ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
393ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
394ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
39513723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker	status = ocfs2_journal_access_gd(handle,
3960cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker					 INODE_CACHE(alloc_inode),
39713723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker					 bg_bh,
39813723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker					 OCFS2_JOURNAL_ACCESS_CREATE);
399ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
400ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
401ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
402ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
403ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
404ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	memset(bg, 0, sb->s_blocksize);
405ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	strcpy(bg->bg_signature, OCFS2_GROUP_DESC_SIGNATURE);
406ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg->bg_generation = cpu_to_le32(OCFS2_SB(sb)->fs_generation);
4078571882c21e5073b2f96147ec4ff9b7042339e1bTao Ma	bg->bg_size = cpu_to_le16(ocfs2_group_bitmap_size(sb, 1,
4088571882c21e5073b2f96147ec4ff9b7042339e1bTao Ma						osb->s_feature_incompat));
409ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg->bg_chain = cpu_to_le16(my_chain);
410ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg->bg_next_group = cl->cl_recs[my_chain].c_blkno;
411ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg->bg_parent_dinode = cpu_to_le64(OCFS2_I(alloc_inode)->ip_blkno);
412ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg->bg_blkno = cpu_to_le64(group_blkno);
413798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (group_clusters == le16_to_cpu(cl->cl_cpg))
414798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		bg->bg_bits = cpu_to_le16(ocfs2_bits_per_group(cl));
415798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	else
4164711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		ocfs2_bg_discontig_add_extent(osb, bg, cl, group_blkno,
417798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					      group_clusters);
418798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
419ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	/* set the 1st bit in the bitmap to account for the descriptor block */
420ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	ocfs2_set_bit(0, (unsigned long *)bg->bg_bitmap);
421ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg->bg_free_bits_count = cpu_to_le16(le16_to_cpu(bg->bg_bits) - 1);
422ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
423ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, bg_bh);
424ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
425ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	/* There is no need to zero out or otherwise initialize the
426ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * other blocks in a group - All valid FS metadata in a block
427ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * group stores the superblock fs_generation value at
428ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * allocation time. */
429ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
430ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
431c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
432c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
433ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
434ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
435ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
436ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline u16 ocfs2_find_smallest_chain(struct ocfs2_chain_list *cl)
437ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
438ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u16 curr, best;
439ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
440ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	best = curr = 0;
441ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	while (curr < le16_to_cpu(cl->cl_count)) {
442ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (le32_to_cpu(cl->cl_recs[best].c_total) >
443ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		    le32_to_cpu(cl->cl_recs[curr].c_total))
444ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			best = curr;
445ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		curr++;
446ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
447ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return best;
448ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
449ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
450798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerstatic struct buffer_head *
451798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerocfs2_block_group_alloc_contig(struct ocfs2_super *osb, handle_t *handle,
452798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			       struct inode *alloc_inode,
453798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			       struct ocfs2_alloc_context *ac,
454798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			       struct ocfs2_chain_list *cl)
455798db35f4649eac2778381c390ed7d12de9ec767Joel Becker{
456798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	int status;
457798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	u32 bit_off, num_bits;
458798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	u64 bg_blkno;
459798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct buffer_head *bg_bh;
460798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	unsigned int alloc_rec = ocfs2_find_smallest_chain(cl);
461798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
4621ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Becker	status = ocfs2_claim_clusters(handle, ac,
463798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				      le16_to_cpu(cl->cl_cpg), &bit_off,
464798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				      &num_bits);
465798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (status < 0) {
466798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		if (status != -ENOSPC)
467798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			mlog_errno(status);
468798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		goto bail;
469798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
470798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
471798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	/* setup the group */
472798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	bg_blkno = ocfs2_clusters_to_blocks(osb->sb, bit_off);
4732f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_block_group_alloc_contig(
4742f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	     (unsigned long long)bg_blkno, alloc_rec);
475798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
476798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	bg_bh = sb_getblk(osb->sb, bg_blkno);
477798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (!bg_bh) {
4787391a294b861bf2c3b762dfdcf61b9c5f1bffa1fRui Xiang		status = -ENOMEM;
479798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		mlog_errno(status);
480798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		goto bail;
481798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
482798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	ocfs2_set_new_buffer_uptodate(INODE_CACHE(alloc_inode), bg_bh);
483798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
484798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	status = ocfs2_block_group_fill(handle, alloc_inode, bg_bh,
485798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					bg_blkno, num_bits, alloc_rec, cl);
486798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (status < 0) {
487798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		brelse(bg_bh);
488798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		mlog_errno(status);
489798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
490798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
491798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerbail:
492798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	return status ? ERR_PTR(status) : bg_bh;
493798db35f4649eac2778381c390ed7d12de9ec767Joel Becker}
494798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
495798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerstatic int ocfs2_block_group_claim_bits(struct ocfs2_super *osb,
496798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					handle_t *handle,
497798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					struct ocfs2_alloc_context *ac,
498798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					unsigned int min_bits,
499798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					u32 *bit_off, u32 *num_bits)
500798db35f4649eac2778381c390ed7d12de9ec767Joel Becker{
50118d3a98f3c1b0e27ce026afa4d1ef042f2903726Joel Becker	int status = 0;
502798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
503798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	while (min_bits) {
5041ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Becker		status = ocfs2_claim_clusters(handle, ac, min_bits,
505798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					      bit_off, num_bits);
506798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		if (status != -ENOSPC)
507798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			break;
508798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
509798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		min_bits >>= 1;
510798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
511798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
512798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	return status;
513798db35f4649eac2778381c390ed7d12de9ec767Joel Becker}
514798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
515798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerstatic int ocfs2_block_group_grow_discontig(handle_t *handle,
516798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					    struct inode *alloc_inode,
517798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					    struct buffer_head *bg_bh,
518798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					    struct ocfs2_alloc_context *ac,
519798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					    struct ocfs2_chain_list *cl,
520798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					    unsigned int min_bits)
521798db35f4649eac2778381c390ed7d12de9ec767Joel Becker{
522798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	int status;
523798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_super *osb = OCFS2_SB(alloc_inode->i_sb);
524798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_group_desc *bg =
525798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		(struct ocfs2_group_desc *)bg_bh->b_data;
5264711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	unsigned int needed = le16_to_cpu(cl->cl_cpg) -
5274711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma			 le16_to_cpu(bg->bg_bits) / le16_to_cpu(cl->cl_bpc);
528798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	u32 p_cpos, clusters;
529798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	u64 p_blkno;
530798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_extent_list *el = &bg->bg_list;
531798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
532798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	status = ocfs2_journal_access_gd(handle,
533798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					 INODE_CACHE(alloc_inode),
534798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					 bg_bh,
535798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					 OCFS2_JOURNAL_ACCESS_CREATE);
536798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (status < 0) {
537798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		mlog_errno(status);
538798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		goto bail;
539798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
540798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
541798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	while ((needed > 0) && (le16_to_cpu(el->l_next_free_rec) <
542798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				le16_to_cpu(el->l_count))) {
543798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		if (min_bits > needed)
544798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			min_bits = needed;
545798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		status = ocfs2_block_group_claim_bits(osb, handle, ac,
546798db35f4649eac2778381c390ed7d12de9ec767Joel Becker						      min_bits, &p_cpos,
547798db35f4649eac2778381c390ed7d12de9ec767Joel Becker						      &clusters);
548798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		if (status < 0) {
549798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			if (status != -ENOSPC)
550798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				mlog_errno(status);
551798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			goto bail;
552798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		}
553798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		p_blkno = ocfs2_clusters_to_blocks(osb->sb, p_cpos);
554798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		ocfs2_bg_discontig_add_extent(osb, bg, cl, p_blkno,
555798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					      clusters);
556798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
557798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		min_bits = clusters;
5584711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		needed = le16_to_cpu(cl->cl_cpg) -
5594711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma			 le16_to_cpu(bg->bg_bits) / le16_to_cpu(cl->cl_bpc);
560798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
561798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
562798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (needed > 0) {
5634711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		/*
5644711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		 * We have used up all the extent rec but can't fill up
5654711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		 * the cpg. So bail out.
5664711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		 */
5674711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		status = -ENOSPC;
5684711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma		goto bail;
569798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
570798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
571798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	ocfs2_journal_dirty(handle, bg_bh);
572798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
573798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerbail:
574798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	return status;
575798db35f4649eac2778381c390ed7d12de9ec767Joel Becker}
576798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
5778b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Beckerstatic void ocfs2_bg_alloc_cleanup(handle_t *handle,
5788b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker				   struct ocfs2_alloc_context *cluster_ac,
5798b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker				   struct inode *alloc_inode,
5808b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker				   struct buffer_head *bg_bh)
581798db35f4649eac2778381c390ed7d12de9ec767Joel Becker{
5828b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker	int i, ret;
583798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_group_desc *bg;
584798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_extent_list *el;
585798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_extent_rec *rec;
586798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
587798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (!bg_bh)
588798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		return;
589798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
590798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	bg = (struct ocfs2_group_desc *)bg_bh->b_data;
591798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	el = &bg->bg_list;
592798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	for (i = 0; i < le16_to_cpu(el->l_next_free_rec); i++) {
593798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		rec = &el->l_recs[i];
5948b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker		ret = ocfs2_free_clusters(handle, cluster_ac->ac_inode,
5958b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker					  cluster_ac->ac_bh,
5968b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker					  le64_to_cpu(rec->e_blkno),
59772094e43e3af5020510f920321d71f1798fa896dAl Viro					  le16_to_cpu(rec->e_leaf_clusters));
5988b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker		if (ret)
5998b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker			mlog_errno(ret);
6008b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker		/* Try all the clusters to free */
601798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
602798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
603798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	ocfs2_remove_from_cache(INODE_CACHE(alloc_inode), bg_bh);
604798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	brelse(bg_bh);
605798db35f4649eac2778381c390ed7d12de9ec767Joel Becker}
606798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
607798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerstatic struct buffer_head *
608798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerocfs2_block_group_alloc_discontig(handle_t *handle,
609798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				  struct inode *alloc_inode,
610798db35f4649eac2778381c390ed7d12de9ec767Joel Becker				  struct ocfs2_alloc_context *ac,
6118b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker				  struct ocfs2_chain_list *cl)
612798db35f4649eac2778381c390ed7d12de9ec767Joel Becker{
613798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	int status;
614798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	u32 bit_off, num_bits;
615798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	u64 bg_blkno;
616798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	unsigned int min_bits = le16_to_cpu(cl->cl_cpg) >> 1;
617798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct buffer_head *bg_bh = NULL;
618798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	unsigned int alloc_rec = ocfs2_find_smallest_chain(cl);
619798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	struct ocfs2_super *osb = OCFS2_SB(alloc_inode->i_sb);
620798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
6214711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	if (!ocfs2_supports_discontig_bg(osb)) {
622798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		status = -ENOSPC;
623798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		goto bail;
624798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
625798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
6268b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker	status = ocfs2_extend_trans(handle,
6278b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker				    ocfs2_calc_bg_discontig_credits(osb->sb));
6288b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker	if (status) {
6298b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker		mlog_errno(status);
6308b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker		goto bail;
6318b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker	}
6328b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker
63395ec0adf0b56d6a3f0ca1ec87173311898486b2eJoel Becker	/*
63495ec0adf0b56d6a3f0ca1ec87173311898486b2eJoel Becker	 * We're going to be grabbing from multiple cluster groups.
63595ec0adf0b56d6a3f0ca1ec87173311898486b2eJoel Becker	 * We don't have enough credits to relink them all, and the
63695ec0adf0b56d6a3f0ca1ec87173311898486b2eJoel Becker	 * cluster groups will be staying in cache for the duration of
63795ec0adf0b56d6a3f0ca1ec87173311898486b2eJoel Becker	 * this operation.
63895ec0adf0b56d6a3f0ca1ec87173311898486b2eJoel Becker	 */
639309a85b6861fedbb48a22d45e0e079d1be993b3aXiaowei.Hu	ac->ac_disable_chain_relink = 1;
64095ec0adf0b56d6a3f0ca1ec87173311898486b2eJoel Becker
641798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	/* Claim the first region */
642798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	status = ocfs2_block_group_claim_bits(osb, handle, ac, min_bits,
643798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					      &bit_off, &num_bits);
644798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (status < 0) {
645798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		if (status != -ENOSPC)
646798db35f4649eac2778381c390ed7d12de9ec767Joel Becker			mlog_errno(status);
647798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		goto bail;
648798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
649798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	min_bits = num_bits;
650798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
651798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	/* setup the group */
652798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	bg_blkno = ocfs2_clusters_to_blocks(osb->sb, bit_off);
6532f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_block_group_alloc_discontig(
6542f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				(unsigned long long)bg_blkno, alloc_rec);
655798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
656798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	bg_bh = sb_getblk(osb->sb, bg_blkno);
657798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (!bg_bh) {
6587391a294b861bf2c3b762dfdcf61b9c5f1bffa1fRui Xiang		status = -ENOMEM;
659798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		mlog_errno(status);
660798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		goto bail;
661798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
662798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	ocfs2_set_new_buffer_uptodate(INODE_CACHE(alloc_inode), bg_bh);
663798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
664798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	status = ocfs2_block_group_fill(handle, alloc_inode, bg_bh,
665798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					bg_blkno, num_bits, alloc_rec, cl);
666798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (status < 0) {
667798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		mlog_errno(status);
668798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		goto bail;
669798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	}
670798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
671798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	status = ocfs2_block_group_grow_discontig(handle, alloc_inode,
672798db35f4649eac2778381c390ed7d12de9ec767Joel Becker						  bg_bh, ac, cl, min_bits);
673798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (status)
674798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		mlog_errno(status);
675798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
676798db35f4649eac2778381c390ed7d12de9ec767Joel Beckerbail:
677798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (status)
6788b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker		ocfs2_bg_alloc_cleanup(handle, ac, alloc_inode, bg_bh);
679798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	return status ? ERR_PTR(status) : bg_bh;
680798db35f4649eac2778381c390ed7d12de9ec767Joel Becker}
681798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
682ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/*
683ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * We expect the block group allocator to already be locked.
684ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh */
685ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_block_group_alloc(struct ocfs2_super *osb,
686ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				   struct inode *alloc_inode,
6871187c968852e3c668f3b9376083851f81f6eee22Joel Becker				   struct buffer_head *bh,
68860ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma				   u64 max_block,
689feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma				   u64 *last_alloc_group,
69060ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma				   int flags)
691ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
692ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status, credits;
693ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_dinode *fe = (struct ocfs2_dinode *) bh->b_data;
694ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_chain_list *cl;
695ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_alloc_context *ac = NULL;
6961fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fasheh	handle_t *handle = NULL;
6974711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	u16 alloc_rec;
698ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct buffer_head *bg_bh = NULL;
699ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *bg;
700ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
701ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ocfs2_is_cluster_bitmap(alloc_inode));
702ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
703ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	cl = &fe->id2.i_chain;
7041187c968852e3c668f3b9376083851f81f6eee22Joel Becker	status = ocfs2_reserve_clusters_with_limit(osb,
7051187c968852e3c668f3b9376083851f81f6eee22Joel Becker						   le16_to_cpu(cl->cl_cpg),
70660ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma						   max_block, flags, &ac);
707ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
708ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status != -ENOSPC)
709ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
710ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
711ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
712ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
713ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	credits = ocfs2_calc_group_alloc_credits(osb->sb,
714ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						 le16_to_cpu(cl->cl_cpg));
71565eff9ccf86d63eb5c3e9071450a36e4e4fa9564Mark Fasheh	handle = ocfs2_start_trans(osb, credits);
716ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (IS_ERR(handle)) {
717ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = PTR_ERR(handle);
718ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		handle = NULL;
719ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
720ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
721ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
722ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
723feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma	if (last_alloc_group && *last_alloc_group != 0) {
7242f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		trace_ocfs2_block_group_alloc(
7252f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				(unsigned long long)*last_alloc_group);
726feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma		ac->ac_last_group = *last_alloc_group;
727feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma	}
728798db35f4649eac2778381c390ed7d12de9ec767Joel Becker
729798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	bg_bh = ocfs2_block_group_alloc_contig(osb, handle, alloc_inode,
730798db35f4649eac2778381c390ed7d12de9ec767Joel Becker					       ac, cl);
731798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (IS_ERR(bg_bh) && (PTR_ERR(bg_bh) == -ENOSPC))
732798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		bg_bh = ocfs2_block_group_alloc_discontig(handle,
733798db35f4649eac2778381c390ed7d12de9ec767Joel Becker							  alloc_inode,
7348b06bc592ebc5a31e8d0b9c2ab17c6e78dde1f86Joel Becker							  ac, cl);
735798db35f4649eac2778381c390ed7d12de9ec767Joel Becker	if (IS_ERR(bg_bh)) {
736798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		status = PTR_ERR(bg_bh);
737798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		bg_bh = NULL;
738ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status != -ENOSPC)
739ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
740ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
741ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
742ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg = (struct ocfs2_group_desc *) bg_bh->b_data;
743ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
7440cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker	status = ocfs2_journal_access_di(handle, INODE_CACHE(alloc_inode),
74513723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker					 bh, OCFS2_JOURNAL_ACCESS_WRITE);
746ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
747ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
748ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
749ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
750ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
7514711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	alloc_rec = le16_to_cpu(bg->bg_chain);
7524711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	le32_add_cpu(&cl->cl_recs[alloc_rec].c_free,
753ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		     le16_to_cpu(bg->bg_free_bits_count));
7544711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	le32_add_cpu(&cl->cl_recs[alloc_rec].c_total,
755798db35f4649eac2778381c390ed7d12de9ec767Joel Becker		     le16_to_cpu(bg->bg_bits));
7560a463b74e7e6856b24e613de2b85237c6e11890bTao Ma	cl->cl_recs[alloc_rec].c_blkno = bg->bg_blkno;
757ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (le16_to_cpu(cl->cl_next_free_rec) < le16_to_cpu(cl->cl_count))
758ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		le16_add_cpu(&cl->cl_next_free_rec, 1);
759ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
760ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	le32_add_cpu(&fe->id1.bitmap1.i_used, le16_to_cpu(bg->bg_bits) -
761ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					le16_to_cpu(bg->bg_free_bits_count));
762ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	le32_add_cpu(&fe->id1.bitmap1.i_total, le16_to_cpu(bg->bg_bits));
763ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	le32_add_cpu(&fe->i_clusters, le16_to_cpu(cl->cl_cpg));
764ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
765ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, bh);
766ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
767ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	spin_lock(&OCFS2_I(alloc_inode)->ip_lock);
768ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	OCFS2_I(alloc_inode)->ip_clusters = le32_to_cpu(fe->i_clusters);
769ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	fe->i_size = cpu_to_le64(ocfs2_clusters_to_bytes(alloc_inode->i_sb,
770ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     le32_to_cpu(fe->i_clusters)));
771ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	spin_unlock(&OCFS2_I(alloc_inode)->ip_lock);
772ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	i_size_write(alloc_inode, le64_to_cpu(fe->i_size));
7738110b073a9135acf0a71bccfc20c0d1023f179c6Mark Fasheh	alloc_inode->i_blocks = ocfs2_inode_sector_count(alloc_inode);
7746fdb702d6262b18b1b41a35f1f81903b0a2bc2c9Darrick J. Wong	ocfs2_update_inode_fsync_trans(handle, alloc_inode, 0);
775ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
776ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = 0;
777feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma
778feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma	/* save the new last alloc group so that the caller can cache it. */
779feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma	if (last_alloc_group)
780feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma		*last_alloc_group = ac->ac_last_group;
781feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma
782ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
783ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (handle)
78402dc1af44e9fa4b8801169891b3a1ba4047537adMark Fasheh		ocfs2_commit_trans(osb, handle);
785ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
786ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (ac)
787ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ocfs2_free_alloc_context(ac);
788ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
789a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh	brelse(bg_bh);
790ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
791c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
792c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
793ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
794ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
795ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
796ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_reserve_suballoc_bits(struct ocfs2_super *osb,
797da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh				       struct ocfs2_alloc_context *ac,
798da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh				       int type,
799ffda89a3bf3b968bdc268584c6bc1da5c173cf12Tao Ma				       u32 slot,
800feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma				       u64 *last_alloc_group,
80160ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma				       int flags)
802ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
803ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
804ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u32 bits_wanted = ac->ac_bits_wanted;
805da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	struct inode *alloc_inode;
806ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct buffer_head *bh = NULL;
807ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_dinode *fe;
808ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u32 free_bits;
809ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
810da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	alloc_inode = ocfs2_get_system_file_inode(osb, type, slot);
811da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	if (!alloc_inode) {
812da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		mlog_errno(-EINVAL);
813da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		return -EINVAL;
814da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	}
815ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
816da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	mutex_lock(&alloc_inode->i_mutex);
817da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh
818e63aecb651ba73dffc62f9608ee1b7ae2a0ffd4bMark Fasheh	status = ocfs2_inode_lock(alloc_inode, &bh, 1);
819ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
820da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		mutex_unlock(&alloc_inode->i_mutex);
821da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		iput(alloc_inode);
822da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh
823ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
824da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		return status;
825ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
826ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
827da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	ac->ac_inode = alloc_inode;
828a4a4891164d4f6f383cc17e7c90828a7ca6a1146Tao Ma	ac->ac_alloc_slot = slot;
829da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh
830ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	fe = (struct ocfs2_dinode *) bh->b_data;
83110995aa2451afa20b721cc7de856cae1a13dba57Joel Becker
83210995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	/* The bh was validated by the inode read inside
83310995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	 * ocfs2_inode_lock().  Any corruption is a code bug. */
83410995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	BUG_ON(!OCFS2_IS_VALID_DINODE(fe));
83510995aa2451afa20b721cc7de856cae1a13dba57Joel Becker
836ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (!(fe->i_flags & cpu_to_le32(OCFS2_CHAIN_FL))) {
837b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh		ocfs2_error(alloc_inode->i_sb, "Invalid chain allocator %llu",
838b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh			    (unsigned long long)le64_to_cpu(fe->i_blkno));
839ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = -EIO;
840ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
841ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
842ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
843ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	free_bits = le32_to_cpu(fe->id1.bitmap1.i_total) -
844ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		le32_to_cpu(fe->id1.bitmap1.i_used);
845ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
846ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (bits_wanted > free_bits) {
847ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		/* cluster bitmap never grows */
848ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (ocfs2_is_cluster_bitmap(alloc_inode)) {
8492f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			trace_ocfs2_reserve_suballoc_bits_nospc(bits_wanted,
8502f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma								free_bits);
851ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			status = -ENOSPC;
852ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
853ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
854ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
85560ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma		if (!(flags & ALLOC_NEW_GROUP)) {
8562f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			trace_ocfs2_reserve_suballoc_bits_no_new_group(
8572f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma						slot, bits_wanted, free_bits);
858ffda89a3bf3b968bdc268584c6bc1da5c173cf12Tao Ma			status = -ENOSPC;
859ffda89a3bf3b968bdc268584c6bc1da5c173cf12Tao Ma			goto bail;
860ffda89a3bf3b968bdc268584c6bc1da5c173cf12Tao Ma		}
861ffda89a3bf3b968bdc268584c6bc1da5c173cf12Tao Ma
8621187c968852e3c668f3b9376083851f81f6eee22Joel Becker		status = ocfs2_block_group_alloc(osb, alloc_inode, bh,
863feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma						 ac->ac_max_block,
864feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma						 last_alloc_group, flags);
865ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status < 0) {
866ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			if (status != -ENOSPC)
867ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				mlog_errno(status);
868ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
869ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
870ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		atomic_inc(&osb->alloc_stats.bg_extends);
871ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
872ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		/* You should never ask for this much metadata */
873ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		BUG_ON(bits_wanted >
874ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		       (le32_to_cpu(fe->id1.bitmap1.i_total)
875ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			- le32_to_cpu(fe->id1.bitmap1.i_used)));
876ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
877ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
878ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	get_bh(bh);
879ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	ac->ac_bh = bh;
880ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
881a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh	brelse(bh);
882ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
883c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
884c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
885ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
886ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
887ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
888b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic void ocfs2_init_inode_steal_slot(struct ocfs2_super *osb)
889b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
890b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_lock(&osb->osb_lock);
891b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	osb->s_inode_steal_slot = OCFS2_INVALID_SLOT;
892b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_unlock(&osb->osb_lock);
893b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	atomic_set(&osb->s_num_inodes_stolen, 0);
894b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
895b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
896b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic void ocfs2_init_meta_steal_slot(struct ocfs2_super *osb)
897b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
898b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_lock(&osb->osb_lock);
899b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	osb->s_meta_steal_slot = OCFS2_INVALID_SLOT;
900b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_unlock(&osb->osb_lock);
901b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	atomic_set(&osb->s_num_meta_stolen, 0);
902b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
903b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
/*
 * Reset both pieces of stealing state kept in @osb: first the inode steal
 * slot and counter, then the metadata steal slot and counter.
 */
void ocfs2_init_steal_slots(struct ocfs2_super *osb)
{
	ocfs2_init_inode_steal_slot(osb);
	ocfs2_init_meta_steal_slot(osb);
}
909b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
910b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic void __ocfs2_set_steal_slot(struct ocfs2_super *osb, int slot, int type)
911b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
912b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_lock(&osb->osb_lock);
913b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	if (type == INODE_ALLOC_SYSTEM_INODE)
914b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		osb->s_inode_steal_slot = slot;
915b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	else if (type == EXTENT_ALLOC_SYSTEM_INODE)
916b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		osb->s_meta_steal_slot = slot;
917b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_unlock(&osb->osb_lock);
918b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
919b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
920b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic int __ocfs2_get_steal_slot(struct ocfs2_super *osb, int type)
921b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
922b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	int slot = OCFS2_INVALID_SLOT;
923b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
924b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_lock(&osb->osb_lock);
925b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	if (type == INODE_ALLOC_SYSTEM_INODE)
926b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		slot = osb->s_inode_steal_slot;
927b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	else if (type == EXTENT_ALLOC_SYSTEM_INODE)
928b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		slot = osb->s_meta_steal_slot;
929b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	spin_unlock(&osb->osb_lock);
930b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
931b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	return slot;
932b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
933b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
934b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic int ocfs2_get_inode_steal_slot(struct ocfs2_super *osb)
935b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
936b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	return __ocfs2_get_steal_slot(osb, INODE_ALLOC_SYSTEM_INODE);
937b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
938b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
939b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic int ocfs2_get_meta_steal_slot(struct ocfs2_super *osb)
940b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
941b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	return __ocfs2_get_steal_slot(osb, EXTENT_ALLOC_SYSTEM_INODE);
942b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
943b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
944b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic int ocfs2_steal_resource(struct ocfs2_super *osb,
945b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang				struct ocfs2_alloc_context *ac,
946b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang				int type)
947b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
948b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	int i, status = -ENOSPC;
949b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	int slot = __ocfs2_get_steal_slot(osb, type);
950b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
951b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	/* Start to steal resource from the first slot after ours. */
952b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	if (slot == OCFS2_INVALID_SLOT)
953b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		slot = osb->slot_num + 1;
954b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
955b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	for (i = 0; i < osb->max_slots; i++, slot++) {
956b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		if (slot == osb->max_slots)
957b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang			slot = 0;
958b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
959b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		if (slot == osb->slot_num)
960b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang			continue;
961b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
962b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		status = ocfs2_reserve_suballoc_bits(osb, ac,
963b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang						     type,
964b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang						     (u32)slot, NULL,
965b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang						     NOT_ALLOC_NEW_GROUP);
966b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		if (status >= 0) {
967b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang			__ocfs2_set_steal_slot(osb, slot, type);
968b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang			break;
969b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		}
970b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
971b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		ocfs2_free_ac_resource(ac);
972b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	}
973b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
974b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	return status;
975b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
976b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
977b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic int ocfs2_steal_inode(struct ocfs2_super *osb,
978b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang			     struct ocfs2_alloc_context *ac)
979b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
980b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	return ocfs2_steal_resource(osb, ac, INODE_ALLOC_SYSTEM_INODE);
981b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
982b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
983b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangstatic int ocfs2_steal_meta(struct ocfs2_super *osb,
984b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang			    struct ocfs2_alloc_context *ac)
985b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang{
986b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	return ocfs2_steal_resource(osb, ac, EXTENT_ALLOC_SYSTEM_INODE);
987b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang}
988b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
989cf1d6c763fbcb115263114302485ad17e7933d87Tiger Yangint ocfs2_reserve_new_metadata_blocks(struct ocfs2_super *osb,
990cf1d6c763fbcb115263114302485ad17e7933d87Tiger Yang				      int blocks,
991cf1d6c763fbcb115263114302485ad17e7933d87Tiger Yang				      struct ocfs2_alloc_context **ac)
992ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
993ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
994b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	int slot = ocfs2_get_meta_steal_slot(osb);
995ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
996cd86128088554d64fea1679191509f00e6353c5bRobert P. J. Day	*ac = kzalloc(sizeof(struct ocfs2_alloc_context), GFP_KERNEL);
997ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (!(*ac)) {
998ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = -ENOMEM;
999ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1000ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1001ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1002ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1003cf1d6c763fbcb115263114302485ad17e7933d87Tiger Yang	(*ac)->ac_bits_wanted = blocks;
1004ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	(*ac)->ac_which = OCFS2_AC_USE_META;
1005ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	(*ac)->ac_group_search = ocfs2_block_group_search;
1006ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1007b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	if (slot != OCFS2_INVALID_SLOT &&
1008b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		atomic_read(&osb->s_num_meta_stolen) < OCFS2_MAX_TO_STEAL)
1009b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		goto extent_steal;
1010b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
1011b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	atomic_set(&osb->s_num_meta_stolen, 0);
1012da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	status = ocfs2_reserve_suballoc_bits(osb, (*ac),
1013ffda89a3bf3b968bdc268584c6bc1da5c173cf12Tao Ma					     EXTENT_ALLOC_SYSTEM_INODE,
1014b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang					     (u32)osb->slot_num, NULL,
101533d5d380d667ad264675cfdb297dfc3c5b6542ccMark Fasheh					     ALLOC_GROUPS_FROM_GLOBAL|ALLOC_NEW_GROUP);
1016b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
1017b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
1018b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	if (status >= 0) {
1019b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		status = 0;
1020b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		if (slot != OCFS2_INVALID_SLOT)
1021b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang			ocfs2_init_meta_steal_slot(osb);
1022b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		goto bail;
1023b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	} else if (status < 0 && status != -ENOSPC) {
1024b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		mlog_errno(status);
1025b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang		goto bail;
1026b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	}
1027b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
1028b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	ocfs2_free_ac_resource(*ac);
1029b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang
1030b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yangextent_steal:
1031b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	status = ocfs2_steal_meta(osb, *ac);
1032b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	atomic_inc(&osb->s_num_meta_stolen);
1033ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
1034ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status != -ENOSPC)
1035ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
1036ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1037ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1038ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1039ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = 0;
1040ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
1041ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if ((status < 0) && *ac) {
1042ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ocfs2_free_alloc_context(*ac);
1043ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		*ac = NULL;
1044ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1045ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1046c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
1047c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
1048ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1049ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1050ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
/*
 * Reserve the number of metadata blocks that ocfs2_extend_meta_needed()
 * reports for @root_el.  The context is returned through @ac; see
 * ocfs2_reserve_new_metadata_blocks() for the return value.
 */
int ocfs2_reserve_new_metadata(struct ocfs2_super *osb,
			       struct ocfs2_extent_list *root_el,
			       struct ocfs2_alloc_context **ac)
{
	int blocks = ocfs2_extend_meta_needed(root_el);

	return ocfs2_reserve_new_metadata_blocks(osb, blocks, ac);
}
1059cf1d6c763fbcb115263114302485ad17e7933d87Tiger Yang
1060ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehint ocfs2_reserve_new_inode(struct ocfs2_super *osb,
1061ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			    struct ocfs2_alloc_context **ac)
1062ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1063ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
1064b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	int slot = ocfs2_get_inode_steal_slot(osb);
1065feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma	u64 alloc_group;
1066ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1067cd86128088554d64fea1679191509f00e6353c5bRobert P. J. Day	*ac = kzalloc(sizeof(struct ocfs2_alloc_context), GFP_KERNEL);
1068ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (!(*ac)) {
1069ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = -ENOMEM;
1070ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1071ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1072ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1073ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1074ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	(*ac)->ac_bits_wanted = 1;
1075ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	(*ac)->ac_which = OCFS2_AC_USE_INODE;
1076ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1077ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	(*ac)->ac_group_search = ocfs2_block_group_search;
1078ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
10794d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	/*
10801187c968852e3c668f3b9376083851f81f6eee22Joel Becker	 * stat(2) can't handle i_ino > 32bits, so we tell the
10811187c968852e3c668f3b9376083851f81f6eee22Joel Becker	 * lower levels not to allocate us a block group past that
108212462f1d9f0b96389497438dc2730c6f7410be82Joel Becker	 * limit.  The 'inode64' mount option avoids this behavior.
10831187c968852e3c668f3b9376083851f81f6eee22Joel Becker	 */
108412462f1d9f0b96389497438dc2730c6f7410be82Joel Becker	if (!(osb->s_mount_opt & OCFS2_MOUNT_INODE64))
108512462f1d9f0b96389497438dc2730c6f7410be82Joel Becker		(*ac)->ac_max_block = (u32)~0U;
10861187c968852e3c668f3b9376083851f81f6eee22Joel Becker
10871187c968852e3c668f3b9376083851f81f6eee22Joel Becker	/*
10884d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 * slot is set when we successfully steal inode from other nodes.
10894d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 * It is reset in 3 places:
10904d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 * 1. when we flush the truncate log
10914d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 * 2. when we complete local alloc recovery.
10924d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 * 3. when we successfully allocate from our own slot.
10934d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 * After it is set, we will go on stealing inodes until we find the
10944d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 * need to check our slots to see whether there is some space for us.
10954d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	 */
10964d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	if (slot != OCFS2_INVALID_SLOT &&
1097b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	    atomic_read(&osb->s_num_inodes_stolen) < OCFS2_MAX_TO_STEAL)
10984d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		goto inode_steal;
10994d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma
11004d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	atomic_set(&osb->s_num_inodes_stolen, 0);
1101feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma	alloc_group = osb->osb_inode_alloc_group;
1102da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	status = ocfs2_reserve_suballoc_bits(osb, *ac,
1103da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh					     INODE_ALLOC_SYSTEM_INODE,
1104b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang					     (u32)osb->slot_num,
1105feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma					     &alloc_group,
110660ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma					     ALLOC_NEW_GROUP |
110760ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma					     ALLOC_GROUPS_FROM_GLOBAL);
11084d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	if (status >= 0) {
11094d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		status = 0;
11104d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma
1111feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma		spin_lock(&osb->osb_lock);
1112feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma		osb->osb_inode_alloc_group = alloc_group;
1113feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma		spin_unlock(&osb->osb_lock);
11142f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		trace_ocfs2_reserve_new_inode_new_group(
11152f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			(unsigned long long)alloc_group);
1116feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma
11174d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		/*
11184d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		 * Some inodes must be freed by us, so try to allocate
11194d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		 * from our own next time.
11204d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		 */
11214d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		if (slot != OCFS2_INVALID_SLOT)
11224d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma			ocfs2_init_inode_steal_slot(osb);
11234d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		goto bail;
11244d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	} else if (status < 0 && status != -ENOSPC) {
11254d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		mlog_errno(status);
11264d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma		goto bail;
11274d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	}
11284d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma
11294d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	ocfs2_free_ac_resource(*ac);
11304d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma
11314d0ddb2ce25db2254d468233d942276ecf40bff8Tao Mainode_steal:
1132b89c54282db0c8634a2d2dc200f196d571750ce5Tiger Yang	status = ocfs2_steal_inode(osb, *ac);
11334d0ddb2ce25db2254d468233d942276ecf40bff8Tao Ma	atomic_inc(&osb->s_num_inodes_stolen);
1134ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
1135ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status != -ENOSPC)
1136ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
1137ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1138ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1139ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1140ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = 0;
1141ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
1142ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if ((status < 0) && *ac) {
1143ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ocfs2_free_alloc_context(*ac);
1144ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		*ac = NULL;
1145ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1146ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1147c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
1148c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
1149ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1150ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1151ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1152ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* local alloc code has to do the same thing, so rather than do this
1153ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * twice.. */
1154ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehint ocfs2_reserve_cluster_bitmap_bits(struct ocfs2_super *osb,
1155ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				      struct ocfs2_alloc_context *ac)
1156ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1157ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
1158ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1159ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	ac->ac_which = OCFS2_AC_USE_MAIN;
1160ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	ac->ac_group_search = ocfs2_cluster_group_search;
1161ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1162da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	status = ocfs2_reserve_suballoc_bits(osb, ac,
1163da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh					     GLOBAL_BITMAP_SYSTEM_INODE,
1164feb473a6e8bd19297d0f3bb377b25055c0228c0aTao Ma					     OCFS2_INVALID_SLOT, NULL,
1165ffda89a3bf3b968bdc268584c6bc1da5c173cf12Tao Ma					     ALLOC_NEW_GROUP);
1166da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	if (status < 0 && status != -ENOSPC) {
1167ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1168da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		goto bail;
1169da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh	}
1170da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh
1171ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
1172ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1173ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1174ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1175ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* Callers don't need to care which bitmap (local alloc or main) to
1176ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * use so we figure it out for them, but unfortunately this clutters
1177ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * things a bit. */
11781187c968852e3c668f3b9376083851f81f6eee22Joel Beckerstatic int ocfs2_reserve_clusters_with_limit(struct ocfs2_super *osb,
11791187c968852e3c668f3b9376083851f81f6eee22Joel Becker					     u32 bits_wanted, u64 max_block,
118060ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma					     int flags,
11811187c968852e3c668f3b9376083851f81f6eee22Joel Becker					     struct ocfs2_alloc_context **ac)
1182ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1183ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
1184ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1185cd86128088554d64fea1679191509f00e6353c5bRobert P. J. Day	*ac = kzalloc(sizeof(struct ocfs2_alloc_context), GFP_KERNEL);
1186ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (!(*ac)) {
1187ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = -ENOMEM;
1188ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1189ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1190ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1191ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1192ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	(*ac)->ac_bits_wanted = bits_wanted;
11931187c968852e3c668f3b9376083851f81f6eee22Joel Becker	(*ac)->ac_max_block = max_block;
1194ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1195ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = -ENOSPC;
119660ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma	if (!(flags & ALLOC_GROUPS_FROM_GLOBAL) &&
119760ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma	    ocfs2_alloc_should_use_local(osb, bits_wanted)) {
1198ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = ocfs2_reserve_local_alloc_bits(osb,
1199ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh							bits_wanted,
1200ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh							*ac);
1201a57c8fd2ad238258cc983049008aea5f985804b2Mark Fasheh		if ((status < 0) && (status != -ENOSPC)) {
1202ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
1203ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
1204ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1205ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1206ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1207ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status == -ENOSPC) {
1208ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = ocfs2_reserve_cluster_bitmap_bits(osb, *ac);
1209ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status < 0) {
1210ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			if (status != -ENOSPC)
1211ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				mlog_errno(status);
1212ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
1213ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1214ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1215ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1216ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = 0;
1217ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
1218ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if ((status < 0) && *ac) {
1219ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ocfs2_free_alloc_context(*ac);
1220ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		*ac = NULL;
1221ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1222ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1223c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
1224c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
1225ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1226ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1227ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
12281187c968852e3c668f3b9376083851f81f6eee22Joel Beckerint ocfs2_reserve_clusters(struct ocfs2_super *osb,
12291187c968852e3c668f3b9376083851f81f6eee22Joel Becker			   u32 bits_wanted,
12301187c968852e3c668f3b9376083851f81f6eee22Joel Becker			   struct ocfs2_alloc_context **ac)
12311187c968852e3c668f3b9376083851f81f6eee22Joel Becker{
123260ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma	return ocfs2_reserve_clusters_with_limit(osb, bits_wanted, 0,
123360ca81e82dae4aa2e8ae84cf96b4d08535931669Tao Ma						 ALLOC_NEW_GROUP, ac);
12341187c968852e3c668f3b9376083851f81f6eee22Joel Becker}
12351187c968852e3c668f3b9376083851f81f6eee22Joel Becker
1236ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/*
1237ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * More or less lifted from ext3. I'll leave their description below:
1238ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh *
1239ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * "For ext3 allocations, we must not reuse any blocks which are
1240ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * allocated in the bitmap buffer's "last committed data" copy.  This
1241ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * prevents deletes from freeing up the page for reuse until we have
1242ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * committed the delete transaction.
1243ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh *
1244ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * If we didn't do this, then deleting something and reallocating it as
1245ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * data would allow the old block to be overwritten before the
1246ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * transaction committed (because we force data to disk before commit).
1247ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * This would lead to corruption if we crashed between overwriting the
1248ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * data and committing the delete.
1249ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh *
1250ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * @@@ We may want to make this allocation behaviour conditional on
1251ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * data-writes at some point, and disable it for metadata allocations or
1252ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * sync-data inodes."
1253ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh *
1254ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * Note: OCFS2 already does this differently for metadata vs data
1255c78bad11fbf1272ea021f56458025dc98486d6f4Joe Perches * allocations, as those bitmaps are separate and undo access is never
1256ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * called on a metadata group descriptor.
1257ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh */
1258ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_test_bg_bit_allocatable(struct buffer_head *bg_bh,
1259ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					 int nr)
1260ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1261ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *bg = (struct ocfs2_group_desc *) bg_bh->b_data;
126294e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	int ret;
1263ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1264ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (ocfs2_test_bit(nr, (unsigned long *)bg->bg_bitmap))
1265ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		return 0;
126694e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran
126794e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	if (!buffer_jbd(bg_bh))
1268ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		return 1;
1269ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
127094e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	jbd_lock_bh_state(bg_bh);
1271ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg = (struct ocfs2_group_desc *) bh2jh(bg_bh)->b_committed_data;
127294e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	if (bg)
127394e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran		ret = !ocfs2_test_bit(nr, (unsigned long *)bg->bg_bitmap);
127494e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	else
127594e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran		ret = 1;
127694e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	jbd_unlock_bh_state(bg_bh);
127794e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran
127894e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	return ret;
1279ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1280ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1281ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_block_group_find_clear_bits(struct ocfs2_super *osb,
1282ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     struct buffer_head *bg_bh,
1283ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     unsigned int bits_wanted,
12847bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh					     unsigned int total_bits,
12857d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					     struct ocfs2_suballoc_result *res)
1286ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1287ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	void *bitmap;
1288ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u16 best_offset, best_size;
1289ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int offset, start, found, status = 0;
1290ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *bg = (struct ocfs2_group_desc *) bg_bh->b_data;
1291ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
12924203530613280281868b3ca36c817530bca3825cJoel Becker	/* Callers got this descriptor from
12934203530613280281868b3ca36c817530bca3825cJoel Becker	 * ocfs2_read_group_descriptor().  Any corruption is a code bug. */
12944203530613280281868b3ca36c817530bca3825cJoel Becker	BUG_ON(!OCFS2_IS_VALID_GROUP_DESC(bg));
1295ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1296ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	found = start = best_offset = best_size = 0;
1297ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bitmap = bg->bg_bitmap;
1298ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
12997bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	while((offset = ocfs2_find_next_zero_bit(bitmap, total_bits, start)) != -1) {
13007bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		if (offset == total_bits)
1301ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			break;
1302ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1303ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (!ocfs2_test_bg_bit_allocatable(bg_bh, offset)) {
1304ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			/* We found a zero, but we can't use it as it
1305ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			 * hasn't been put to disk yet! */
1306ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			found = 0;
1307ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			start = offset + 1;
1308ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		} else if (offset == start) {
1309ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			/* we found a zero */
1310ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			found++;
1311ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			/* move start to the next bit to test */
1312ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			start++;
1313ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		} else {
1314ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			/* got a zero after some ones */
1315ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			found = 1;
1316ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			start = offset + 1;
1317ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1318ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (found > best_size) {
1319ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			best_size = found;
1320ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			best_offset = start - found;
1321ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1322ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		/* we got everything we needed */
1323ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (found == bits_wanted) {
1324ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			/* mlog(0, "Found it all!\n"); */
1325ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			break;
1326ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1327ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1328ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
13297d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	if (best_size) {
13307d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker		res->sr_bit_offset = best_offset;
13317d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker		res->sr_bits = best_size;
1332ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	} else {
1333ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = -ENOSPC;
1334ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		/* No error log here -- see the comment above
1335ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		 * ocfs2_test_bg_bit_allocatable */
1336ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1337ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1338ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1339ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1340ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
13410a2fcd8988ac682f443fd5b0a7c48154a7b42ef2Younger Liuint ocfs2_block_group_set_bits(handle_t *handle,
1342ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     struct inode *alloc_inode,
1343ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     struct ocfs2_group_desc *bg,
1344ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     struct buffer_head *group_bh,
1345ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     unsigned int bit_off,
1346ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					     unsigned int num_bits)
1347ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1348ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
1349ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	void *bitmap = bg->bg_bitmap;
1350ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int journal_type = OCFS2_JOURNAL_ACCESS_WRITE;
1351ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
13524203530613280281868b3ca36c817530bca3825cJoel Becker	/* All callers get the descriptor via
13534203530613280281868b3ca36c817530bca3825cJoel Becker	 * ocfs2_read_group_descriptor().  Any corruption is a code bug. */
13544203530613280281868b3ca36c817530bca3825cJoel Becker	BUG_ON(!OCFS2_IS_VALID_GROUP_DESC(bg));
1355ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(le16_to_cpu(bg->bg_free_bits_count) < num_bits);
1356ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
13572f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_block_group_set_bits(bit_off, num_bits);
1358ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1359ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (ocfs2_is_cluster_bitmap(alloc_inode))
1360ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		journal_type = OCFS2_JOURNAL_ACCESS_UNDO;
1361ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
136213723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker	status = ocfs2_journal_access_gd(handle,
13630cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker					 INODE_CACHE(alloc_inode),
136413723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker					 group_bh,
136513723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker					 journal_type);
1366ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
1367ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1368ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1369ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1370ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1371ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	le16_add_cpu(&bg->bg_free_bits_count, -num_bits);
13729b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda	if (le16_to_cpu(bg->bg_free_bits_count) > le16_to_cpu(bg->bg_bits)) {
13739b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda		ocfs2_error(alloc_inode->i_sb, "Group descriptor # %llu has bit"
13749b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    " count %u but claims %u are freed. num_bits %d",
13759b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    (unsigned long long)le64_to_cpu(bg->bg_blkno),
13769b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    le16_to_cpu(bg->bg_bits),
13779b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    le16_to_cpu(bg->bg_free_bits_count), num_bits);
13789b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda		return -EROFS;
13799b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda	}
1380ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	while(num_bits--)
1381ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ocfs2_set_bit(bit_off++, bitmap);
1382ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1383ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, group_bh);
1384ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1385ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
1386ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1387ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1388ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1389ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* find the one with the most empty bits */
1390ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline u16 ocfs2_find_victim_chain(struct ocfs2_chain_list *cl)
1391ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1392ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u16 curr, best;
1393ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1394ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!cl->cl_next_free_rec);
1395ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1396ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	best = curr = 0;
1397ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	while (curr < le16_to_cpu(cl->cl_next_free_rec)) {
1398ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (le32_to_cpu(cl->cl_recs[curr].c_free) >
1399ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		    le32_to_cpu(cl->cl_recs[best].c_free))
1400ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			best = curr;
1401ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		curr++;
1402ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1403ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1404ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(best >= le16_to_cpu(cl->cl_next_free_rec));
1405ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return best;
1406ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1407ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
14081fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fashehstatic int ocfs2_relink_block_group(handle_t *handle,
1409ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct inode *alloc_inode,
1410ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *fe_bh,
1411ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *bg_bh,
1412ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *prev_bg_bh,
1413ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    u16 chain)
1414ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1415ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
1416ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	/* there is a really tiny chance the journal calls could fail,
1417ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * but we wouldn't want inconsistent blocks in *any* case. */
1418493098413bdb45f223ff0552e2f734849491dbbeJie Liu	u64 bg_ptr, prev_bg_ptr;
1419ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_dinode *fe = (struct ocfs2_dinode *) fe_bh->b_data;
1420ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *bg = (struct ocfs2_group_desc *) bg_bh->b_data;
1421ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *prev_bg = (struct ocfs2_group_desc *) prev_bg_bh->b_data;
1422ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
14234203530613280281868b3ca36c817530bca3825cJoel Becker	/* The caller got these descriptors from
14244203530613280281868b3ca36c817530bca3825cJoel Becker	 * ocfs2_read_group_descriptor().  Any corruption is a code bug. */
14254203530613280281868b3ca36c817530bca3825cJoel Becker	BUG_ON(!OCFS2_IS_VALID_GROUP_DESC(bg));
14264203530613280281868b3ca36c817530bca3825cJoel Becker	BUG_ON(!OCFS2_IS_VALID_GROUP_DESC(prev_bg));
1427ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
14282f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_relink_block_group(
14292f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		(unsigned long long)le64_to_cpu(fe->i_blkno), chain,
14302f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		(unsigned long long)le64_to_cpu(bg->bg_blkno),
14312f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		(unsigned long long)le64_to_cpu(prev_bg->bg_blkno));
1432ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1433ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg_ptr = le64_to_cpu(bg->bg_next_group);
1434ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	prev_bg_ptr = le64_to_cpu(prev_bg->bg_next_group);
1435ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
14360cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker	status = ocfs2_journal_access_gd(handle, INODE_CACHE(alloc_inode),
14370cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker					 prev_bg_bh,
143813723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker					 OCFS2_JOURNAL_ACCESS_WRITE);
143925e2892101ba541dce8593c698d70ccc278bc1fdAndrew Morton	if (status < 0)
1440493098413bdb45f223ff0552e2f734849491dbbeJie Liu		goto out;
1441ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1442ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	prev_bg->bg_next_group = bg->bg_next_group;
1443ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, prev_bg_bh);
1444ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
14450cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker	status = ocfs2_journal_access_gd(handle, INODE_CACHE(alloc_inode),
14460cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker					 bg_bh, OCFS2_JOURNAL_ACCESS_WRITE);
144725e2892101ba541dce8593c698d70ccc278bc1fdAndrew Morton	if (status < 0)
1448493098413bdb45f223ff0552e2f734849491dbbeJie Liu		goto out_rollback_prev_bg;
1449ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1450ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg->bg_next_group = fe->id2.i_chain.cl_recs[chain].c_blkno;
1451ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, bg_bh);
1452ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
14530cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker	status = ocfs2_journal_access_di(handle, INODE_CACHE(alloc_inode),
14540cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker					 fe_bh, OCFS2_JOURNAL_ACCESS_WRITE);
145525e2892101ba541dce8593c698d70ccc278bc1fdAndrew Morton	if (status < 0)
1456493098413bdb45f223ff0552e2f734849491dbbeJie Liu		goto out_rollback_bg;
1457ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1458ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	fe->id2.i_chain.cl_recs[chain].c_blkno = bg->bg_blkno;
1459ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, fe_bh);
1460ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1461493098413bdb45f223ff0552e2f734849491dbbeJie Liuout:
146225e2892101ba541dce8593c698d70ccc278bc1fdAndrew Morton	if (status < 0)
146325e2892101ba541dce8593c698d70ccc278bc1fdAndrew Morton		mlog_errno(status);
1464493098413bdb45f223ff0552e2f734849491dbbeJie Liu	return status;
14654203530613280281868b3ca36c817530bca3825cJoel Becker
1466493098413bdb45f223ff0552e2f734849491dbbeJie Liuout_rollback_bg:
1467493098413bdb45f223ff0552e2f734849491dbbeJie Liu	bg->bg_next_group = cpu_to_le64(bg_ptr);
1468493098413bdb45f223ff0552e2f734849491dbbeJie Liuout_rollback_prev_bg:
1469493098413bdb45f223ff0552e2f734849491dbbeJie Liu	prev_bg->bg_next_group = cpu_to_le64(prev_bg_ptr);
147025e2892101ba541dce8593c698d70ccc278bc1fdAndrew Morton	goto out;
1471ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1472ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1473ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline int ocfs2_block_group_reasonably_empty(struct ocfs2_group_desc *bg,
1474ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						     u32 wanted)
1475ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1476ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return le16_to_cpu(bg->bg_free_bits_count) > wanted;
1477ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1478ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1479ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* return 0 on success, -ENOSPC to keep searching and any other < 0
1480ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * value on error. */
1481ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_cluster_group_search(struct inode *inode,
1482ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				      struct buffer_head *group_bh,
1483ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				      u32 bits_wanted, u32 min_bits,
14841187c968852e3c668f3b9376083851f81f6eee22Joel Becker				      u64 max_block,
14857d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				      struct ocfs2_suballoc_result *res)
1486ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1487ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int search = -ENOSPC;
1488ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int ret;
14891187c968852e3c668f3b9376083851f81f6eee22Joel Becker	u64 blkoff;
14907bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	struct ocfs2_group_desc *gd = (struct ocfs2_group_desc *) group_bh->b_data;
14919c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh	struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
14927bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	unsigned int max_bits, gd_cluster_off;
1493ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1494ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!ocfs2_is_cluster_bitmap(inode));
1495ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
14967bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh	if (gd->bg_free_bits_count) {
14977bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		max_bits = le16_to_cpu(gd->bg_bits);
14987bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
14997bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		/* Tail groups in cluster bitmaps which aren't cpg
150025985edcedea6396277003854657b5f3cb31a628Lucas De Marchi		 * aligned are prone to partial extension by a failed
15017bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		 * fs resize. If the file system resize never got to
15027bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		 * update the dinode cluster count, then we don't want
15037bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		 * to trust any clusters past it, regardless of what
15047bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		 * the group descriptor says. */
15057bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		gd_cluster_off = ocfs2_blocks_to_clusters(inode->i_sb,
15067bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh							  le64_to_cpu(gd->bg_blkno));
15077bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		if ((gd_cluster_off + max_bits) >
15087bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		    OCFS2_I(inode)->ip_clusters) {
15097bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh			max_bits = OCFS2_I(inode)->ip_clusters - gd_cluster_off;
15102f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			trace_ocfs2_cluster_group_search_wrong_max_bits(
15112f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				(unsigned long long)le64_to_cpu(gd->bg_blkno),
15122f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				le16_to_cpu(gd->bg_bits),
15132f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				OCFS2_I(inode)->ip_clusters, max_bits);
15147bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh		}
15157bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh
1516ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ret = ocfs2_block_group_find_clear_bits(OCFS2_SB(inode->i_sb),
1517ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh							group_bh, bits_wanted,
15187d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker							max_bits, res);
1519ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (ret)
1520ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			return ret;
1521ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
15221187c968852e3c668f3b9376083851f81f6eee22Joel Becker		if (max_block) {
15231187c968852e3c668f3b9376083851f81f6eee22Joel Becker			blkoff = ocfs2_clusters_to_blocks(inode->i_sb,
15241187c968852e3c668f3b9376083851f81f6eee22Joel Becker							  gd_cluster_off +
15257d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker							  res->sr_bit_offset +
15267d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker							  res->sr_bits);
15272f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			trace_ocfs2_cluster_group_search_max_block(
15282f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				(unsigned long long)blkoff,
15292f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				(unsigned long long)max_block);
15301187c968852e3c668f3b9376083851f81f6eee22Joel Becker			if (blkoff > max_block)
15311187c968852e3c668f3b9376083851f81f6eee22Joel Becker				return -ENOSPC;
15321187c968852e3c668f3b9376083851f81f6eee22Joel Becker		}
15331187c968852e3c668f3b9376083851f81f6eee22Joel Becker
1534ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		/* ocfs2_block_group_find_clear_bits() might
1535ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		 * return success, but we still want to return
1536ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		 * -ENOSPC unless it found the minimum number
1537ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		 * of bits. */
15387d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker		if (min_bits <= res->sr_bits)
1539ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			search = 0; /* success */
15407d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker		else if (res->sr_bits) {
15419c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh			/*
15429c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh			 * Don't show bits which we'll be returning
15439c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh			 * for allocation to the local alloc bitmap.
15449c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh			 */
15457d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker			ocfs2_local_alloc_seen_free_bits(osb, res->sr_bits);
1546ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1547ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1548ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1549ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return search;
1550ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1551ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1552ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_block_group_search(struct inode *inode,
1553ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    struct buffer_head *group_bh,
1554ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				    u32 bits_wanted, u32 min_bits,
15551187c968852e3c668f3b9376083851f81f6eee22Joel Becker				    u64 max_block,
15567d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				    struct ocfs2_suballoc_result *res)
1557ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1558ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int ret = -ENOSPC;
15591187c968852e3c668f3b9376083851f81f6eee22Joel Becker	u64 blkoff;
1560ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *bg = (struct ocfs2_group_desc *) group_bh->b_data;
1561ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1562ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(min_bits != 1);
1563ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ocfs2_is_cluster_bitmap(inode));
1564ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
15651187c968852e3c668f3b9376083851f81f6eee22Joel Becker	if (bg->bg_free_bits_count) {
1566ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ret = ocfs2_block_group_find_clear_bits(OCFS2_SB(inode->i_sb),
1567ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh							group_bh, bits_wanted,
15687bf72edee614e10b8d470c40a326f47bfdd69992Mark Fasheh							le16_to_cpu(bg->bg_bits),
15697d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker							res);
15701187c968852e3c668f3b9376083851f81f6eee22Joel Becker		if (!ret && max_block) {
15717d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker			blkoff = le64_to_cpu(bg->bg_blkno) +
15727d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				res->sr_bit_offset + res->sr_bits;
15732f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			trace_ocfs2_block_group_search_max_block(
15742f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				(unsigned long long)blkoff,
15752f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				(unsigned long long)max_block);
15761187c968852e3c668f3b9376083851f81f6eee22Joel Becker			if (blkoff > max_block)
15771187c968852e3c668f3b9376083851f81f6eee22Joel Becker				ret = -ENOSPC;
15781187c968852e3c668f3b9376083851f81f6eee22Joel Becker		}
15791187c968852e3c668f3b9376083851f81f6eee22Joel Becker	}
1580ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1581ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return ret;
1582ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1583ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
15840a2fcd8988ac682f443fd5b0a7c48154a7b42ef2Younger Liuint ocfs2_alloc_dinode_update_counts(struct inode *inode,
15851fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fasheh				       handle_t *handle,
1586883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh				       struct buffer_head *di_bh,
1587883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh				       u32 num_bits,
1588883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh				       u16 chain)
1589883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh{
1590883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	int ret;
1591883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	u32 tmp_used;
1592883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	struct ocfs2_dinode *di = (struct ocfs2_dinode *) di_bh->b_data;
1593883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	struct ocfs2_chain_list *cl = (struct ocfs2_chain_list *) &di->id2.i_chain;
1594883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
15950cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker	ret = ocfs2_journal_access_di(handle, INODE_CACHE(inode), di_bh,
159613723d00e374c2a6d6ccb5af6de965e89c3e1b01Joel Becker				      OCFS2_JOURNAL_ACCESS_WRITE);
1597883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	if (ret < 0) {
1598883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		mlog_errno(ret);
1599883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		goto out;
1600883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	}
1601883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1602883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	tmp_used = le32_to_cpu(di->id1.bitmap1.i_used);
1603883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	di->id1.bitmap1.i_used = cpu_to_le32(num_bits + tmp_used);
1604883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	le32_add_cpu(&cl->cl_recs[chain].c_free, -num_bits);
1605ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, di_bh);
1606883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1607883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fashehout:
1608883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	return ret;
1609883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh}
1610883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1611db66c71577d525c0cd65e66ff675747565783ba4Younger Liuvoid ocfs2_rollback_alloc_dinode_counts(struct inode *inode,
1612db66c71577d525c0cd65e66ff675747565783ba4Younger Liu				       struct buffer_head *di_bh,
1613db66c71577d525c0cd65e66ff675747565783ba4Younger Liu				       u32 num_bits,
1614db66c71577d525c0cd65e66ff675747565783ba4Younger Liu				       u16 chain)
1615db66c71577d525c0cd65e66ff675747565783ba4Younger Liu{
1616db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	u32 tmp_used;
1617db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	struct ocfs2_dinode *di = (struct ocfs2_dinode *) di_bh->b_data;
1618db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	struct ocfs2_chain_list *cl;
1619db66c71577d525c0cd65e66ff675747565783ba4Younger Liu
1620db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	cl = (struct ocfs2_chain_list *)&di->id2.i_chain;
1621db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	tmp_used = le32_to_cpu(di->id1.bitmap1.i_used);
1622db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	di->id1.bitmap1.i_used = cpu_to_le32(tmp_used - num_bits);
1623db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	le32_add_cpu(&cl->cl_recs[chain].c_free, num_bits);
1624db66c71577d525c0cd65e66ff675747565783ba4Younger Liu}
1625db66c71577d525c0cd65e66ff675747565783ba4Younger Liu
1626ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Beckerstatic int ocfs2_bg_discontig_fix_by_rec(struct ocfs2_suballoc_result *res,
1627ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker					 struct ocfs2_extent_rec *rec,
1628ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker					 struct ocfs2_chain_list *cl)
162913e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker{
163013e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	unsigned int bpc = le16_to_cpu(cl->cl_bpc);
163113e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	unsigned int bitoff = le32_to_cpu(rec->e_cpos) * bpc;
163272094e43e3af5020510f920321d71f1798fa896dAl Viro	unsigned int bitcount = le16_to_cpu(rec->e_leaf_clusters) * bpc;
163313e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
163413e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	if (res->sr_bit_offset < bitoff)
163513e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker		return 0;
163613e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	if (res->sr_bit_offset >= (bitoff + bitcount))
163713e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker		return 0;
1638ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	res->sr_blkno = le64_to_cpu(rec->e_blkno) +
1639ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker		(res->sr_bit_offset - bitoff);
164013e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	if ((res->sr_bit_offset + res->sr_bits) > (bitoff + bitcount))
164113e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker		res->sr_bits = (bitoff + bitcount) - res->sr_bit_offset;
164213e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	return 1;
164313e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker}
164413e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
1645ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Beckerstatic void ocfs2_bg_discontig_fix_result(struct ocfs2_alloc_context *ac,
1646ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker					  struct ocfs2_group_desc *bg,
1647ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker					  struct ocfs2_suballoc_result *res)
164813e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker{
164913e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	int i;
16502b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker	u64 bg_blkno = res->sr_bg_blkno;  /* Save off */
165113e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	struct ocfs2_extent_rec *rec;
165213e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	struct ocfs2_dinode *di = (struct ocfs2_dinode *)ac->ac_bh->b_data;
165313e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	struct ocfs2_chain_list *cl = &di->id2.i_chain;
165413e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
1655ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	if (ocfs2_is_cluster_bitmap(ac->ac_inode)) {
1656ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker		res->sr_blkno = 0;
165713e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker		return;
1658ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	}
165913e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
1660ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	res->sr_blkno = res->sr_bg_blkno + res->sr_bit_offset;
16612b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker	res->sr_bg_blkno = 0;  /* Clear it for contig block groups */
16624711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	if (!ocfs2_supports_discontig_bg(OCFS2_SB(ac->ac_inode->i_sb)) ||
1663ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	    !bg->bg_list.l_next_free_rec)
166413e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker		return;
166513e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
166613e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	for (i = 0; i < le16_to_cpu(bg->bg_list.l_next_free_rec); i++) {
166713e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker		rec = &bg->bg_list.l_recs[i];
16682b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker		if (ocfs2_bg_discontig_fix_by_rec(res, rec, cl)) {
16692b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker			res->sr_bg_blkno = bg_blkno;  /* Restore */
167013e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker			break;
16712b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker		}
167213e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	}
167313e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker}
167413e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
1675883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fashehstatic int ocfs2_search_one_group(struct ocfs2_alloc_context *ac,
16761fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fasheh				  handle_t *handle,
1677883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh				  u32 bits_wanted,
1678883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh				  u32 min_bits,
16797d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				  struct ocfs2_suballoc_result *res,
1680883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh				  u16 *bits_left)
1681883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh{
1682883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	int ret;
1683883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	struct buffer_head *group_bh = NULL;
1684883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	struct ocfs2_group_desc *gd;
168568f64d471be38631d7196b938d9809802dd467faJoel Becker	struct ocfs2_dinode *di = (struct ocfs2_dinode *)ac->ac_bh->b_data;
1686883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	struct inode *alloc_inode = ac->ac_inode;
1687883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
16887d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	ret = ocfs2_read_group_descriptor(alloc_inode, di,
16897d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					  res->sr_bg_blkno, &group_bh);
1690883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	if (ret < 0) {
1691883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		mlog_errno(ret);
1692883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		return ret;
1693883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	}
1694883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1695883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	gd = (struct ocfs2_group_desc *) group_bh->b_data;
1696883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	ret = ac->ac_group_search(alloc_inode, group_bh, bits_wanted, min_bits,
16977d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				  ac->ac_max_block, res);
1698883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	if (ret < 0) {
1699883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		if (ret != -ENOSPC)
1700883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh			mlog_errno(ret);
1701883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		goto out;
1702883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	}
1703883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
170413e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	if (!ret)
1705ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker		ocfs2_bg_discontig_fix_result(ac, gd, res);
170613e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
1707e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	/*
1708e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * sr_bg_blkno might have been changed by
1709e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * ocfs2_bg_discontig_fix_result
1710e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 */
1711e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	res->sr_bg_stable_blkno = group_bh->b_blocknr;
1712e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
1713e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ac->ac_find_loc_only)
1714e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out_loc_only;
1715e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
1716883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	ret = ocfs2_alloc_dinode_update_counts(alloc_inode, handle, ac->ac_bh,
17177d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					       res->sr_bits,
1718883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh					       le16_to_cpu(gd->bg_chain));
1719883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	if (ret < 0) {
1720883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		mlog_errno(ret);
1721883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		goto out;
1722883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	}
1723883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1724883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	ret = ocfs2_block_group_set_bits(handle, alloc_inode, gd, group_bh,
17257d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					 res->sr_bit_offset, res->sr_bits);
1726db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	if (ret < 0) {
1727db66c71577d525c0cd65e66ff675747565783ba4Younger Liu		ocfs2_rollback_alloc_dinode_counts(alloc_inode, ac->ac_bh,
1728db66c71577d525c0cd65e66ff675747565783ba4Younger Liu					       res->sr_bits,
1729db66c71577d525c0cd65e66ff675747565783ba4Younger Liu					       le16_to_cpu(gd->bg_chain));
1730883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		mlog_errno(ret);
1731db66c71577d525c0cd65e66ff675747565783ba4Younger Liu	}
1732883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1733e49e27674d1dd2717ad90b21ece8f83102153315Mark Fashehout_loc_only:
1734883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	*bits_left = le16_to_cpu(gd->bg_free_bits_count);
1735883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1736883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fashehout:
1737883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	brelse(group_bh);
1738883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1739883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	return ret;
1740883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh}
1741883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1742ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic int ocfs2_search_chain(struct ocfs2_alloc_context *ac,
17431fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fasheh			      handle_t *handle,
1744ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			      u32 bits_wanted,
1745ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			      u32 min_bits,
17467d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker			      struct ocfs2_suballoc_result *res,
1747883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh			      u16 *bits_left)
1748ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1749ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
17507d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	u16 chain;
1751ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u64 next_group;
1752ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct inode *alloc_inode = ac->ac_inode;
1753ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct buffer_head *group_bh = NULL;
1754ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct buffer_head *prev_group_bh = NULL;
1755ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_dinode *fe = (struct ocfs2_dinode *) ac->ac_bh->b_data;
1756ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_chain_list *cl = (struct ocfs2_chain_list *) &fe->id2.i_chain;
1757ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *bg;
1758ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1759ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	chain = ac->ac_chain;
17602f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_search_chain_begin(
17612f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		(unsigned long long)OCFS2_I(alloc_inode)->ip_blkno,
17622f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		bits_wanted, chain);
1763ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
176468f64d471be38631d7196b938d9809802dd467faJoel Becker	status = ocfs2_read_group_descriptor(alloc_inode, fe,
176568f64d471be38631d7196b938d9809802dd467faJoel Becker					     le64_to_cpu(cl->cl_recs[chain].c_blkno),
176668f64d471be38631d7196b938d9809802dd467faJoel Becker					     &group_bh);
1767ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
1768ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1769ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1770ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1771ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	bg = (struct ocfs2_group_desc *) group_bh->b_data;
1772ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1773ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = -ENOSPC;
1774ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	/* for now, the chain search is a bit simplistic. We just use
1775ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * the 1st group with any empty bits. */
17761187c968852e3c668f3b9376083851f81f6eee22Joel Becker	while ((status = ac->ac_group_search(alloc_inode, group_bh,
17771187c968852e3c668f3b9376083851f81f6eee22Joel Becker					     bits_wanted, min_bits,
17787d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					     ac->ac_max_block,
17797d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					     res)) == -ENOSPC) {
1780ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (!bg->bg_next_group)
1781ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			break;
1782a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh
1783a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh		brelse(prev_group_bh);
1784a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh		prev_group_bh = NULL;
1785a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh
1786ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		next_group = le64_to_cpu(bg->bg_next_group);
1787ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		prev_group_bh = group_bh;
1788ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		group_bh = NULL;
178968f64d471be38631d7196b938d9809802dd467faJoel Becker		status = ocfs2_read_group_descriptor(alloc_inode, fe,
179068f64d471be38631d7196b938d9809802dd467faJoel Becker						     next_group, &group_bh);
1791ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status < 0) {
1792ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
1793ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
1794ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1795ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		bg = (struct ocfs2_group_desc *) group_bh->b_data;
1796ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1797ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
1798ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status != -ENOSPC)
1799ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
1800ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1801ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1802ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
18032f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_search_chain_succ(
18042f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		(unsigned long long)le64_to_cpu(bg->bg_blkno), res->sr_bits);
1805ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
18067d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	res->sr_bg_blkno = le64_to_cpu(bg->bg_blkno);
1807ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
18087d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	BUG_ON(res->sr_bits == 0);
180913e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker	if (!status)
1810ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker		ocfs2_bg_discontig_fix_result(ac, bg, res);
181113e434cf0cacd2f03a7f4cd077e3e995ef5ef710Joel Becker
1812e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	/*
1813e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * sr_bg_blkno might have been changed by
1814e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * ocfs2_bg_discontig_fix_result
1815e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 */
1816e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	res->sr_bg_stable_blkno = group_bh->b_blocknr;
1817ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1818ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	/*
1819ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * Keep track of previous block descriptor read. When
1820ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * we find a target, if we have read more than X
1821ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * number of descriptors, and the target is reasonably
1822ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * empty, relink him to top of his chain.
1823ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 *
1824ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * We've read 0 extra blocks and only send one more to
1825ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * the transaction, yet the next guy to search has a
1826ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * much easier time.
1827ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 *
1828ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * Do this *after* figuring out how many bits we're taking out
1829ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * of our target group.
1830ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 */
1831309a85b6861fedbb48a22d45e0e079d1be993b3aXiaowei.Hu	if (!ac->ac_disable_chain_relink &&
1832ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	    (prev_group_bh) &&
18337d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	    (ocfs2_block_group_reasonably_empty(bg, res->sr_bits))) {
1834ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = ocfs2_relink_block_group(handle, alloc_inode,
1835ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						  ac->ac_bh, group_bh,
1836ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						  prev_group_bh, chain);
1837ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status < 0) {
1838ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
1839ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
1840ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1841ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1842ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1843e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ac->ac_find_loc_only)
1844e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out_loc_only;
1845e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
1846d51349829c378c06ba4aa7d4b16ca23739858608Mark Fasheh	status = ocfs2_alloc_dinode_update_counts(alloc_inode, handle,
1847d51349829c378c06ba4aa7d4b16ca23739858608Mark Fasheh						  ac->ac_bh, res->sr_bits,
1848d51349829c378c06ba4aa7d4b16ca23739858608Mark Fasheh						  chain);
1849d51349829c378c06ba4aa7d4b16ca23739858608Mark Fasheh	if (status) {
1850ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1851ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1852ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1853ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1854ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = ocfs2_block_group_set_bits(handle,
1855ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					    alloc_inode,
1856ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					    bg,
1857ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					    group_bh,
18587d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					    res->sr_bit_offset,
18597d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					    res->sr_bits);
1860ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
1861db66c71577d525c0cd65e66ff675747565783ba4Younger Liu		ocfs2_rollback_alloc_dinode_counts(alloc_inode,
1862db66c71577d525c0cd65e66ff675747565783ba4Younger Liu					ac->ac_bh, res->sr_bits, chain);
1863ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1864ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1865ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1866ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
18672f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_search_chain_end(
18682f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			(unsigned long long)le64_to_cpu(fe->i_blkno),
18692f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			res->sr_bits);
1870ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1871e49e27674d1dd2717ad90b21ece8f83102153315Mark Fashehout_loc_only:
1872883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	*bits_left = le16_to_cpu(bg->bg_free_bits_count);
1873ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
1874a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh	brelse(group_bh);
1875a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh	brelse(prev_group_bh);
1876ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1877c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
1878c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
1879ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1880ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1881ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1882ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* will give out up to bits_wanted contiguous bits. */
1883aa8f8e93c898a0319bcd6c79a9a42fe52abac7d7Joel Beckerstatic int ocfs2_claim_suballoc_bits(struct ocfs2_alloc_context *ac,
18841fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fasheh				     handle_t *handle,
1885ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				     u32 bits_wanted,
1886ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				     u32 min_bits,
18877d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				     struct ocfs2_suballoc_result *res)
1888ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
1889ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
1890ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u16 victim, i;
1891883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	u16 bits_left = 0;
1892b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh	u64 hint = ac->ac_last_group;
1893ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_chain_list *cl;
1894ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_dinode *fe;
1895ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1896ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_bits_given >= ac->ac_bits_wanted);
1897ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(bits_wanted > (ac->ac_bits_wanted - ac->ac_bits_given));
1898ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!ac->ac_bh);
1899ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1900ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	fe = (struct ocfs2_dinode *) ac->ac_bh->b_data;
190110995aa2451afa20b721cc7de856cae1a13dba57Joel Becker
190210995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	/* The bh was validated by the inode read during
190310995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	 * ocfs2_reserve_suballoc_bits().  Any corruption is a code bug. */
190410995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	BUG_ON(!OCFS2_IS_VALID_DINODE(fe));
190510995aa2451afa20b721cc7de856cae1a13dba57Joel Becker
1906ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (le32_to_cpu(fe->id1.bitmap1.i_used) >=
1907ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	    le32_to_cpu(fe->id1.bitmap1.i_total)) {
1908aa8f8e93c898a0319bcd6c79a9a42fe52abac7d7Joel Becker		ocfs2_error(ac->ac_inode->i_sb,
1909aa8f8e93c898a0319bcd6c79a9a42fe52abac7d7Joel Becker			    "Chain allocator dinode %llu has %u used "
1910b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh			    "bits but only %u total.",
1911b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh			    (unsigned long long)le64_to_cpu(fe->i_blkno),
1912ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			    le32_to_cpu(fe->id1.bitmap1.i_used),
1913ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			    le32_to_cpu(fe->id1.bitmap1.i_total));
1914ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = -EIO;
1915ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1916ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1917ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1918b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh	res->sr_bg_blkno = hint;
19197d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	if (res->sr_bg_blkno) {
1920883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		/* Attempt to short-circuit the usual search mechanism
1921883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		 * by jumping straight to the most recently used
1922b595076a180a56d1bb170e6eceda6eb9d76f4cd3Uwe Kleine-König		 * allocation group. This helps us maintain some
1923883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		 * contiguousness across allocations. */
1924da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		status = ocfs2_search_one_group(ac, handle, bits_wanted,
19257d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker						min_bits, res, &bits_left);
19267d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker		if (!status)
1927883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh			goto set_hint;
1928883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		if (status < 0 && status != -ENOSPC) {
1929883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh			mlog_errno(status);
1930883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh			goto bail;
1931883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		}
1932883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	}
1933883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1934ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	cl = (struct ocfs2_chain_list *) &fe->id2.i_chain;
1935ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1936ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	victim = ocfs2_find_victim_chain(cl);
1937ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	ac->ac_chain = victim;
1938ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
19397d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	status = ocfs2_search_chain(ac, handle, bits_wanted, min_bits,
19407d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker				    res, &bits_left);
1941b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh	if (!status) {
1942b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh		hint = ocfs2_group_from_res(res);
1943883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		goto set_hint;
1944b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh	}
1945ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0 && status != -ENOSPC) {
1946ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
1947ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
1948ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1949ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
19502f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_claim_suballoc_bits(victim);
1951ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1952ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	/* If we didn't pick a good victim, then just default to
1953ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * searching each chain in order. Don't allow chain relinking
1954ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * because we only calculate enough journal credits for one
1955ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * relink per alloc. */
1956309a85b6861fedbb48a22d45e0e079d1be993b3aXiaowei.Hu	ac->ac_disable_chain_relink = 1;
1957ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	for (i = 0; i < le16_to_cpu(cl->cl_next_free_rec); i ++) {
1958ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (i == victim)
1959ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			continue;
1960ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (!cl->cl_recs[i].c_free)
1961ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			continue;
1962ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1963ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ac->ac_chain = i;
1964da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh		status = ocfs2_search_chain(ac, handle, bits_wanted, min_bits,
19657d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					    res, &bits_left);
1966b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh		if (!status) {
1967b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh			hint = ocfs2_group_from_res(res);
1968ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			break;
1969b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh		}
1970ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status < 0 && status != -ENOSPC) {
1971ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
1972ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
1973ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
1974ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
1975ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
1976883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fashehset_hint:
1977883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	if (status != -ENOSPC) {
1978883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		/* If the next search of this group is not likely to
1979883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		 * yield a suitable extent, then we reset the last
1980883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		 * group hint so as to not waste a disk read */
1981883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		if (bits_left < min_bits)
1982883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh			ac->ac_last_group = 0;
1983883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh		else
1984b2b6ebf5f740e015b2155343958f067e594323eaMark Fasheh			ac->ac_last_group = hint;
1985883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh	}
1986883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fasheh
1987883d4cae4a2b01a05193cf2665c77b7489a8b6a0Mark Fashehbail:
1988c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
1989c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
1990ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
1991ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
1992ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
19931ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Beckerint ocfs2_claim_metadata(handle_t *handle,
1994ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			 struct ocfs2_alloc_context *ac,
1995ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			 u32 bits_wanted,
19962b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker			 u64 *suballoc_loc,
1997ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			 u16 *suballoc_bit_start,
1998ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			 unsigned int *num_bits,
1999ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			 u64 *blkno_start)
2000ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2001ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
2002ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	struct ocfs2_suballoc_result res = { .sr_blkno = 0, };
2003ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2004ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!ac);
2005ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_bits_wanted < (ac->ac_bits_given + bits_wanted));
2006ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_which != OCFS2_AC_USE_META);
2007ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2008aa8f8e93c898a0319bcd6c79a9a42fe52abac7d7Joel Becker	status = ocfs2_claim_suballoc_bits(ac,
2009da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh					   handle,
2010ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					   bits_wanted,
2011ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					   1,
20127d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					   &res);
2013ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
2014ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
2015ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
2016ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
20171ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Becker	atomic_inc(&OCFS2_SB(ac->ac_inode->i_sb)->alloc_stats.bg_allocs);
2018ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
20192b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker	*suballoc_loc = res.sr_bg_blkno;
20207d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	*suballoc_bit_start = res.sr_bit_offset;
2021ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	*blkno_start = res.sr_blkno;
20227d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	ac->ac_bits_given += res.sr_bits;
20237d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	*num_bits = res.sr_bits;
2024ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = 0;
2025ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
2026c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2027c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
2028ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
2029ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2030ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2031138211515c102807a16c02fdc15feef1f6ef8124Tao Mastatic void ocfs2_init_inode_ac_group(struct inode *dir,
2032abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma				      struct buffer_head *parent_di_bh,
2033138211515c102807a16c02fdc15feef1f6ef8124Tao Ma				      struct ocfs2_alloc_context *ac)
2034138211515c102807a16c02fdc15feef1f6ef8124Tao Ma{
2035abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma	struct ocfs2_dinode *di = (struct ocfs2_dinode *)parent_di_bh->b_data;
2036138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	/*
2037138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 * Try to allocate inodes from some specific group.
2038138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 *
2039138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 * If the parent dir has recorded the last group used in allocation,
2040138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 * cool, use it. Otherwise if we try to allocate new inode from the
2041138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 * same slot the parent dir belongs to, use the same chunk.
2042138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 *
2043138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 * We are very careful here to avoid the mistake of setting
2044138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 * ac_last_group to a group descriptor from a different (unlocked) slot.
2045138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	 */
2046138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	if (OCFS2_I(dir)->ip_last_used_group &&
2047138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	    OCFS2_I(dir)->ip_last_used_slot == ac->ac_alloc_slot)
2048138211515c102807a16c02fdc15feef1f6ef8124Tao Ma		ac->ac_last_group = OCFS2_I(dir)->ip_last_used_group;
2049abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma	else if (le16_to_cpu(di->i_suballoc_slot) == ac->ac_alloc_slot) {
2050abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma		if (di->i_suballoc_loc)
2051abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma			ac->ac_last_group = le64_to_cpu(di->i_suballoc_loc);
2052abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma		else
2053abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma			ac->ac_last_group = ocfs2_which_suballoc_group(
2054abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma					le64_to_cpu(di->i_blkno),
2055abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma					le16_to_cpu(di->i_suballoc_bit));
2056abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma	}
2057138211515c102807a16c02fdc15feef1f6ef8124Tao Ma}
2058138211515c102807a16c02fdc15feef1f6ef8124Tao Ma
2059138211515c102807a16c02fdc15feef1f6ef8124Tao Mastatic inline void ocfs2_save_inode_ac_group(struct inode *dir,
2060138211515c102807a16c02fdc15feef1f6ef8124Tao Ma					     struct ocfs2_alloc_context *ac)
2061138211515c102807a16c02fdc15feef1f6ef8124Tao Ma{
2062138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	OCFS2_I(dir)->ip_last_used_group = ac->ac_last_group;
2063138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	OCFS2_I(dir)->ip_last_used_slot = ac->ac_alloc_slot;
2064138211515c102807a16c02fdc15feef1f6ef8124Tao Ma}
2065138211515c102807a16c02fdc15feef1f6ef8124Tao Ma
2066e49e27674d1dd2717ad90b21ece8f83102153315Mark Fashehint ocfs2_find_new_inode_loc(struct inode *dir,
2067e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh			     struct buffer_head *parent_fe_bh,
2068e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh			     struct ocfs2_alloc_context *ac,
2069e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh			     u64 *fe_blkno)
2070e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh{
2071e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	int ret;
2072e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	handle_t *handle = NULL;
2073e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	struct ocfs2_suballoc_result *res;
2074e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2075e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	BUG_ON(!ac);
2076e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	BUG_ON(ac->ac_bits_given != 0);
2077e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	BUG_ON(ac->ac_bits_wanted != 1);
2078e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	BUG_ON(ac->ac_which != OCFS2_AC_USE_INODE);
2079e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2080e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	res = kzalloc(sizeof(*res), GFP_NOFS);
2081e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (res == NULL) {
2082e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		ret = -ENOMEM;
2083e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		mlog_errno(ret);
2084e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out;
2085e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	}
2086e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2087e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ocfs2_init_inode_ac_group(dir, parent_fe_bh, ac);
2088e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2089e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	/*
2090e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * The handle started here is for chain relink. Alternatively,
2091e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * we could just disable relink for these calls.
2092e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 */
2093e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	handle = ocfs2_start_trans(OCFS2_SB(dir->i_sb), OCFS2_SUBALLOC_ALLOC);
2094e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (IS_ERR(handle)) {
2095e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		ret = PTR_ERR(handle);
2096e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		handle = NULL;
2097e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		mlog_errno(ret);
2098e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out;
2099e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	}
2100e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2101e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	/*
2102e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * This will instruct ocfs2_claim_suballoc_bits and
2103e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * ocfs2_search_one_group to search but save actual allocation
2104e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * for later.
2105e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 */
2106e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ac->ac_find_loc_only = 1;
2107e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2108e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ret = ocfs2_claim_suballoc_bits(ac, handle, 1, 1, res);
2109e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ret < 0) {
2110e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		mlog_errno(ret);
2111e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out;
2112e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	}
2113e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2114e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ac->ac_find_loc_priv = res;
2115e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	*fe_blkno = res->sr_blkno;
21166fdb702d6262b18b1b41a35f1f81903b0a2bc2c9Darrick J. Wong	ocfs2_update_inode_fsync_trans(handle, dir, 0);
2117e49e27674d1dd2717ad90b21ece8f83102153315Mark Fashehout:
2118e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (handle)
2119e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		ocfs2_commit_trans(OCFS2_SB(dir->i_sb), handle);
2120e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2121e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ret)
2122e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		kfree(res);
2123e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2124e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	return ret;
2125e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh}
2126e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2127e49e27674d1dd2717ad90b21ece8f83102153315Mark Fashehint ocfs2_claim_new_inode_at_loc(handle_t *handle,
2128e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh				 struct inode *dir,
2129e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh				 struct ocfs2_alloc_context *ac,
2130e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh				 u64 *suballoc_loc,
2131e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh				 u16 *suballoc_bit,
2132e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh				 u64 di_blkno)
2133e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh{
2134e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	int ret;
2135e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	u16 chain;
2136e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	struct ocfs2_suballoc_result *res = ac->ac_find_loc_priv;
2137e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	struct buffer_head *bg_bh = NULL;
2138e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	struct ocfs2_group_desc *bg;
2139e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	struct ocfs2_dinode *di = (struct ocfs2_dinode *) ac->ac_bh->b_data;
2140e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2141e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	/*
2142e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * Since di_blkno is being passed back in, we check for any
2143e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * inconsistencies which may have happened between
2144e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * calls. These are code bugs as di_blkno is not expected to
2145e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 * change once returned from ocfs2_find_new_inode_loc()
2146e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	 */
2147e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	BUG_ON(res->sr_blkno != di_blkno);
2148e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2149e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ret = ocfs2_read_group_descriptor(ac->ac_inode, di,
2150e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					  res->sr_bg_stable_blkno, &bg_bh);
2151e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ret) {
2152e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		mlog_errno(ret);
2153e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out;
2154e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	}
2155e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2156e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	bg = (struct ocfs2_group_desc *) bg_bh->b_data;
2157e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	chain = le16_to_cpu(bg->bg_chain);
2158e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2159e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ret = ocfs2_alloc_dinode_update_counts(ac->ac_inode, handle,
2160e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					       ac->ac_bh, res->sr_bits,
2161e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					       chain);
2162e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ret) {
2163e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		mlog_errno(ret);
2164e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out;
2165e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	}
2166e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2167e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ret = ocfs2_block_group_set_bits(handle,
2168e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					 ac->ac_inode,
2169e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					 bg,
2170e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					 bg_bh,
2171e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					 res->sr_bit_offset,
2172e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh					 res->sr_bits);
2173e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	if (ret < 0) {
2174db66c71577d525c0cd65e66ff675747565783ba4Younger Liu		ocfs2_rollback_alloc_dinode_counts(ac->ac_inode,
2175db66c71577d525c0cd65e66ff675747565783ba4Younger Liu					       ac->ac_bh, res->sr_bits, chain);
2176e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		mlog_errno(ret);
2177e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh		goto out;
2178e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	}
2179e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
21802f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_claim_new_inode_at_loc((unsigned long long)di_blkno,
21812f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma					   res->sr_bits);
2182e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2183e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	atomic_inc(&OCFS2_SB(ac->ac_inode->i_sb)->alloc_stats.bg_allocs);
2184e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2185e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	BUG_ON(res->sr_bits != 1);
2186e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2187e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	*suballoc_loc = res->sr_bg_blkno;
2188e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	*suballoc_bit = res->sr_bit_offset;
2189e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ac->ac_bits_given++;
2190e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	ocfs2_save_inode_ac_group(dir, ac);
2191e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2192e49e27674d1dd2717ad90b21ece8f83102153315Mark Fashehout:
2193e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	brelse(bg_bh);
2194e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
2195e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh	return ret;
2196e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh}
2197e49e27674d1dd2717ad90b21ece8f83102153315Mark Fasheh
21981ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Beckerint ocfs2_claim_new_inode(handle_t *handle,
2199138211515c102807a16c02fdc15feef1f6ef8124Tao Ma			  struct inode *dir,
2200138211515c102807a16c02fdc15feef1f6ef8124Tao Ma			  struct buffer_head *parent_fe_bh,
2201ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			  struct ocfs2_alloc_context *ac,
22022b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker			  u64 *suballoc_loc,
2203ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			  u16 *suballoc_bit,
2204ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			  u64 *fe_blkno)
2205ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2206ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
22072b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker	struct ocfs2_suballoc_result res;
2208ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2209ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!ac);
2210ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_bits_given != 0);
2211ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_bits_wanted != 1);
2212ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_which != OCFS2_AC_USE_INODE);
2213ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2214138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	ocfs2_init_inode_ac_group(dir, parent_fe_bh, ac);
2215138211515c102807a16c02fdc15feef1f6ef8124Tao Ma
2216aa8f8e93c898a0319bcd6c79a9a42fe52abac7d7Joel Becker	status = ocfs2_claim_suballoc_bits(ac,
2217da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh					   handle,
2218ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					   1,
2219ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					   1,
22207d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker					   &res);
2221ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
2222ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
2223ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
2224ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
22251ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Becker	atomic_inc(&OCFS2_SB(ac->ac_inode->i_sb)->alloc_stats.bg_allocs);
2226ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
22277d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	BUG_ON(res.sr_bits != 1);
2228ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
22292b6cb576aa80611f1f6a3c88708d1e68a8d97985Joel Becker	*suballoc_loc = res.sr_bg_blkno;
22307d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker	*suballoc_bit = res.sr_bit_offset;
2231ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	*fe_blkno = res.sr_blkno;
2232ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	ac->ac_bits_given++;
2233138211515c102807a16c02fdc15feef1f6ef8124Tao Ma	ocfs2_save_inode_ac_group(dir, ac);
2234ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = 0;
2235ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
2236c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2237c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
2238ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
2239ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2240ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2241ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* translate a group desc. blkno and it's bitmap offset into
2242ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * disk cluster offset. */
2243ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline u32 ocfs2_desc_bitmap_to_cluster_off(struct inode *inode,
2244ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						   u64 bg_blkno,
2245ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						   u16 bg_bit_off)
2246ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2247ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
2248ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u32 cluster = 0;
2249ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2250ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!ocfs2_is_cluster_bitmap(inode));
2251ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2252ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (bg_blkno != osb->first_cluster_group_blkno)
2253ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		cluster = ocfs2_blocks_to_clusters(inode->i_sb, bg_blkno);
2254ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	cluster += (u32) bg_bit_off;
2255ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return cluster;
2256ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2257ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2258ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* given a cluster offset, calculate which block group it belongs to
2259ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * and return that block offset. */
2260d659072f736837e56b6433d58e5315ad1d4d5ccfTao Mau64 ocfs2_which_cluster_group(struct inode *inode, u32 cluster)
2261ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2262ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
2263ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u32 group_no;
2264ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2265ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!ocfs2_is_cluster_bitmap(inode));
2266ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2267ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	group_no = cluster / osb->bitmap_cpg;
2268ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (!group_no)
2269ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		return osb->first_cluster_group_blkno;
2270ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return ocfs2_clusters_to_blocks(inode->i_sb,
2271ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					group_no * osb->bitmap_cpg);
2272ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2273ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2274ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/* given the block number of a cluster start, calculate which cluster
2275ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * group and descriptor bitmap offset that corresponds to. */
2276ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline void ocfs2_block_to_cluster_group(struct inode *inode,
2277ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						u64 data_blkno,
2278ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						u64 *bg_blkno,
2279ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						u16 *bg_bit_off)
2280ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2281ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
2282ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u32 data_cluster = ocfs2_blocks_to_clusters(osb->sb, data_blkno);
2283ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2284ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(!ocfs2_is_cluster_bitmap(inode));
2285ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2286ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	*bg_blkno = ocfs2_which_cluster_group(inode,
2287ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					      data_cluster);
2288ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2289ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (*bg_blkno == osb->first_cluster_group_blkno)
2290ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		*bg_bit_off = (u16) data_cluster;
2291ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	else
2292ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		*bg_bit_off = (u16) ocfs2_blocks_to_clusters(osb->sb,
2293ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh							     data_blkno - *bg_blkno);
2294ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2295ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2296ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/*
2297ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * min_bits - minimum contiguous chunk from this total allocation we
2298ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * can handle. set to what we asked for originally for a full
2299ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * contig. allocation, set to '1' to indicate we can deal with extents
2300ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * of any size.
2301ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh */
23021ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Beckerint __ocfs2_claim_clusters(handle_t *handle,
2303415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			   struct ocfs2_alloc_context *ac,
2304415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			   u32 min_clusters,
2305415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			   u32 max_clusters,
2306415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			   u32 *cluster_start,
2307415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			   u32 *num_clusters)
2308ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2309ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
2310415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh	unsigned int bits_wanted = max_clusters;
2311ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker	struct ocfs2_suballoc_result res = { .sr_blkno = 0, };
23121ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Becker	struct ocfs2_super *osb = OCFS2_SB(ac->ac_inode->i_sb);
2313ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2314ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_bits_given >= ac->ac_bits_wanted);
2315ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2316ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(ac->ac_which != OCFS2_AC_USE_LOCAL
2317ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	       && ac->ac_which != OCFS2_AC_USE_MAIN);
2318ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2319ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (ac->ac_which == OCFS2_AC_USE_LOCAL) {
232033d5d380d667ad264675cfdb297dfc3c5b6542ccMark Fasheh		WARN_ON(min_clusters > 1);
232133d5d380d667ad264675cfdb297dfc3c5b6542ccMark Fasheh
2322ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		status = ocfs2_claim_local_alloc_bits(osb,
2323ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						      handle,
2324ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						      ac,
2325ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						      bits_wanted,
2326ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						      cluster_start,
2327ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						      num_clusters);
2328ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (!status)
2329ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			atomic_inc(&osb->alloc_stats.local_data);
2330ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	} else {
2331ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (min_clusters > (osb->bitmap_cpg - 1)) {
2332ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			/* The only paths asking for contiguousness
2333ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			 * should know about this already. */
23342fbe8d1ebe004425b4f7b8bba345623d2280be82Sunil Mushran			mlog(ML_ERROR, "minimum allocation requested %u exceeds "
23352fbe8d1ebe004425b4f7b8bba345623d2280be82Sunil Mushran			     "group bitmap size %u!\n", min_clusters,
23362fbe8d1ebe004425b4f7b8bba345623d2280be82Sunil Mushran			     osb->bitmap_cpg);
2337ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			status = -ENOSPC;
2338ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			goto bail;
2339ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
2340ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		/* clamp the current request down to a realistic size. */
2341ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (bits_wanted > (osb->bitmap_cpg - 1))
2342ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			bits_wanted = osb->bitmap_cpg - 1;
2343ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2344aa8f8e93c898a0319bcd6c79a9a42fe52abac7d7Joel Becker		status = ocfs2_claim_suballoc_bits(ac,
2345da5cbf2f9df922cfdafa39351691fa83517f1e25Mark Fasheh						   handle,
2346ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						   bits_wanted,
2347ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh						   min_clusters,
23487d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker						   &res);
2349ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (!status) {
2350ba2066351b630f0205ebf725f5c81a2a07a77cd7Joel Becker			BUG_ON(res.sr_blkno); /* cluster alloc can't set */
2351ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			*cluster_start =
2352ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				ocfs2_desc_bitmap_to_cluster_off(ac->ac_inode,
23537d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker								 res.sr_bg_blkno,
23547d1fe093bf04124dcc50c5dde1765bd098464bfaJoel Becker								 res.sr_bit_offset);
2355ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			atomic_inc(&osb->alloc_stats.bitmap_data);
23564711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma			*num_clusters = res.sr_bits;
2357ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		}
2358ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2359ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
2360ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		if (status != -ENOSPC)
2361ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh			mlog_errno(status);
2362ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
2363ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2364ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
23654711954eaa8d30f653fda238cecf919f1ae40d6fTao Ma	ac->ac_bits_given += *num_clusters;
2366ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2367ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
2368c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2369c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
2370ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
2371ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2372ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
23731ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Beckerint ocfs2_claim_clusters(handle_t *handle,
2374415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			 struct ocfs2_alloc_context *ac,
2375415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			 u32 min_clusters,
2376415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			 u32 *cluster_start,
2377415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh			 u32 *num_clusters)
2378415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh{
2379415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh	unsigned int bits_wanted = ac->ac_bits_wanted - ac->ac_bits_given;
2380415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh
23811ed9b777f77929ae961d6f9cdf828a07200ba71cJoel Becker	return __ocfs2_claim_clusters(handle, ac, min_clusters,
2382415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh				      bits_wanted, cluster_start, num_clusters);
2383415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh}
2384415cb800375cc4e89fb5a6a454e484bd4adbffb4Mark Fasheh
2385b4414eea0e7b9c134262c801a87e338bf675962cMark Fashehstatic int ocfs2_block_group_clear_bits(handle_t *handle,
2386b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					struct inode *alloc_inode,
2387b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					struct ocfs2_group_desc *bg,
2388b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					struct buffer_head *group_bh,
2389b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					unsigned int bit_off,
2390b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					unsigned int num_bits,
2391b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					void (*undo_fn)(unsigned int bit,
2392b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh							unsigned long *bmap))
2393ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2394ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
2395ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	unsigned int tmp;
2396ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *undo_bg = NULL;
2397ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
23984203530613280281868b3ca36c817530bca3825cJoel Becker	/* The caller got this descriptor from
23994203530613280281868b3ca36c817530bca3825cJoel Becker	 * ocfs2_read_group_descriptor().  Any corruption is a code bug. */
24004203530613280281868b3ca36c817530bca3825cJoel Becker	BUG_ON(!OCFS2_IS_VALID_GROUP_DESC(bg));
2401ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
24022f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_block_group_clear_bits(bit_off, num_bits);
2403ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2404b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh	BUG_ON(undo_fn && !ocfs2_is_cluster_bitmap(alloc_inode));
24050cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker	status = ocfs2_journal_access_gd(handle, INODE_CACHE(alloc_inode),
2406b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					 group_bh,
2407b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					 undo_fn ?
2408b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					 OCFS2_JOURNAL_ACCESS_UNDO :
2409b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					 OCFS2_JOURNAL_ACCESS_WRITE);
2410ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
2411ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
2412ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
2413ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2414ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2415b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh	if (undo_fn) {
241694e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran		jbd_lock_bh_state(group_bh);
241794e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran		undo_bg = (struct ocfs2_group_desc *)
241894e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran					bh2jh(group_bh)->b_committed_data;
241994e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran		BUG_ON(!undo_bg);
242094e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran	}
2421ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2422ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	tmp = num_bits;
2423ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	while(tmp--) {
2424ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		ocfs2_clear_bit((bit_off + tmp),
2425ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				(unsigned long *) bg->bg_bitmap);
2426b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh		if (undo_fn)
2427b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			undo_fn(bit_off + tmp,
2428b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				(unsigned long *) undo_bg->bg_bitmap);
2429ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2430ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	le16_add_cpu(&bg->bg_free_bits_count, num_bits);
24319b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda	if (le16_to_cpu(bg->bg_free_bits_count) > le16_to_cpu(bg->bg_bits)) {
24329b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda		ocfs2_error(alloc_inode->i_sb, "Group descriptor # %llu has bit"
24339b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    " count %u but claims %u are freed. num_bits %d",
24349b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    (unsigned long long)le64_to_cpu(bg->bg_blkno),
24359b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    le16_to_cpu(bg->bg_bits),
24369b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda			    le16_to_cpu(bg->bg_free_bits_count), num_bits);
24379b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda		return -EROFS;
24389b5cd10e4c14a1a642076ace6a73be3d33c91fb6Srinivas Eeda	}
2439ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2440b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh	if (undo_fn)
244194e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran		jbd_unlock_bh_state(group_bh);
244294e41ecfe0f202df948fdbb19a53308a58cf2184Sunil Mushran
2443ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, group_bh);
2444ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
2445ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
2446ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2447ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2448ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh/*
2449ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh * expects the suballoc inode to already be locked.
2450ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh */
2451b4414eea0e7b9c134262c801a87e338bf675962cMark Fashehstatic int _ocfs2_free_suballoc_bits(handle_t *handle,
2452b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				     struct inode *alloc_inode,
2453b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				     struct buffer_head *alloc_bh,
2454b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				     unsigned int start_bit,
2455b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				     u64 bg_blkno,
2456b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				     unsigned int count,
2457b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				     void (*undo_fn)(unsigned int bit,
2458b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh						     unsigned long *bitmap))
2459ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2460ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status = 0;
2461ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u32 tmp_used;
2462ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_dinode *fe = (struct ocfs2_dinode *) alloc_bh->b_data;
2463ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_chain_list *cl = &fe->id2.i_chain;
2464ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct buffer_head *group_bh = NULL;
2465ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_group_desc *group;
2466ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
246710995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	/* The alloc_bh comes from ocfs2_free_dinode() or
246810995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	 * ocfs2_free_clusters().  The callers have all locked the
246910995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	 * allocator and gotten alloc_bh from the lock call.  This
247025985edcedea6396277003854657b5f3cb31a628Lucas De Marchi	 * validates the dinode buffer.  Any corruption that has happened
247110995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	 * is a code bug. */
247210995aa2451afa20b721cc7de856cae1a13dba57Joel Becker	BUG_ON(!OCFS2_IS_VALID_DINODE(fe));
2473ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON((count + start_bit) > ocfs2_bits_per_group(cl));
2474ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
24752f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_free_suballoc_bits(
24762f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		(unsigned long long)OCFS2_I(alloc_inode)->ip_blkno,
24772f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		(unsigned long long)bg_blkno,
24782f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma		start_bit, count);
2479ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
248068f64d471be38631d7196b938d9809802dd467faJoel Becker	status = ocfs2_read_group_descriptor(alloc_inode, fe, bg_blkno,
248168f64d471be38631d7196b938d9809802dd467faJoel Becker					     &group_bh);
2482ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
2483ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
2484ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
2485ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2486ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	group = (struct ocfs2_group_desc *) group_bh->b_data;
248768f64d471be38631d7196b938d9809802dd467faJoel Becker
2488ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON((count + start_bit) > le16_to_cpu(group->bg_bits));
2489ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2490ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	status = ocfs2_block_group_clear_bits(handle, alloc_inode,
2491ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					      group, group_bh,
2492b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					      start_bit, count, undo_fn);
2493ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
2494ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
2495ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
2496ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2497ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
24980cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker	status = ocfs2_journal_access_di(handle, INODE_CACHE(alloc_inode),
24990cf2f7632b1789b811ab20b611c4156e6de2b055Joel Becker					 alloc_bh, OCFS2_JOURNAL_ACCESS_WRITE);
2500ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	if (status < 0) {
2501ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
2502ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		goto bail;
2503ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2504ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2505ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	le32_add_cpu(&cl->cl_recs[le16_to_cpu(group->bg_chain)].c_free,
2506ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		     count);
2507ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	tmp_used = le32_to_cpu(fe->id1.bitmap1.i_used);
2508ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	fe->id1.bitmap1.i_used = cpu_to_le32(tmp_used - count);
2509ec20cec7a351584ca6c70ead012e73d61f9a8e04Joel Becker	ocfs2_journal_dirty(handle, alloc_bh);
2510ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2511ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehbail:
2512a81cb88b64a479b78c6dd5666678d50171865db8Mark Fasheh	brelse(group_bh);
2513ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2514c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2515c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
2516ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
2517ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2518ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2519b4414eea0e7b9c134262c801a87e338bf675962cMark Fashehint ocfs2_free_suballoc_bits(handle_t *handle,
2520b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			     struct inode *alloc_inode,
2521b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			     struct buffer_head *alloc_bh,
2522b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			     unsigned int start_bit,
2523b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			     u64 bg_blkno,
2524b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			     unsigned int count)
2525b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh{
2526b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh	return _ocfs2_free_suballoc_bits(handle, alloc_inode, alloc_bh,
2527b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					 start_bit, bg_blkno, count, NULL);
2528b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh}
2529b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh
25301fabe1481fac9e01bf8bffa60a2307ef379aa5deMark Fashehint ocfs2_free_dinode(handle_t *handle,
2531ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		      struct inode *inode_alloc_inode,
2532ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		      struct buffer_head *inode_alloc_bh,
2533ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		      struct ocfs2_dinode *di)
2534ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2535ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u64 blk = le64_to_cpu(di->i_blkno);
2536ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u16 bit = le16_to_cpu(di->i_suballoc_bit);
2537ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u64 bg_blkno = ocfs2_which_suballoc_group(blk, bit);
2538ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
253974380c479ad83addeff8a172ab95f59557b5b0c3Tao Ma	if (di->i_suballoc_loc)
254074380c479ad83addeff8a172ab95f59557b5b0c3Tao Ma		bg_blkno = le64_to_cpu(di->i_suballoc_loc);
2541ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return ocfs2_free_suballoc_bits(handle, inode_alloc_inode,
2542ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh					inode_alloc_bh, bit, bg_blkno, 1);
2543ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2544ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2545b4414eea0e7b9c134262c801a87e338bf675962cMark Fashehstatic int _ocfs2_free_clusters(handle_t *handle,
2546b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				struct inode *bitmap_inode,
2547b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				struct buffer_head *bitmap_bh,
2548b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				u64 start_blk,
2549b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				unsigned int num_clusters,
2550b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				void (*undo_fn)(unsigned int bit,
2551b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh						unsigned long *bitmap))
2552ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2553ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int status;
2554ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u16 bg_start_bit;
2555ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	u64 bg_blkno;
2556ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	struct ocfs2_dinode *fe;
2557ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2558ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	/* You can't ever have a contiguous set of clusters
2559ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * bigger than a block group bitmap so we never have to worry
2560ef6b689b63b9f5227ccee6f16dd9ee3faf58a464Tao Ma	 * about looping on them.
2561ef6b689b63b9f5227ccee6f16dd9ee3faf58a464Tao Ma	 * This is expensive. We can safely remove once this stuff has
2562ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	 * gotten tested really well. */
2563ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	BUG_ON(start_blk != ocfs2_clusters_to_blocks(bitmap_inode->i_sb, ocfs2_blocks_to_clusters(bitmap_inode->i_sb, start_blk)));
2564ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2565ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	fe = (struct ocfs2_dinode *) bitmap_bh->b_data;
2566ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2567ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	ocfs2_block_to_cluster_group(bitmap_inode, start_blk, &bg_blkno,
2568ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh				     &bg_start_bit);
2569ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
25702f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_free_clusters((unsigned long long)bg_blkno,
25712f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			(unsigned long long)start_blk,
25722f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma			bg_start_bit, num_clusters);
2573ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2574b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh	status = _ocfs2_free_suballoc_bits(handle, bitmap_inode, bitmap_bh,
2575b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					   bg_start_bit, bg_blkno,
2576b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh					   num_clusters, undo_fn);
25779c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh	if (status < 0) {
2578ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		mlog_errno(status);
25799c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh		goto out;
25809c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh	}
25819c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh
25829c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh	ocfs2_local_alloc_seen_free_bits(OCFS2_SB(bitmap_inode->i_sb),
25839c7af40b210e87f8fddd97b0badc0a352862234aMark Fasheh					 num_clusters);
2584ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
25859c7af40b210e87f8fddd97b0badc0a352862234aMark Fashehout:
2586c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2587c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
2588ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	return status;
2589ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2590ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2591b4414eea0e7b9c134262c801a87e338bf675962cMark Fashehint ocfs2_free_clusters(handle_t *handle,
2592b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			struct inode *bitmap_inode,
2593b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			struct buffer_head *bitmap_bh,
2594b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			u64 start_blk,
2595b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			unsigned int num_clusters)
2596b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh{
2597b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh	return _ocfs2_free_clusters(handle, bitmap_inode, bitmap_bh,
2598b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				    start_blk, num_clusters,
2599b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				    _ocfs2_set_bit);
2600b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh}
2601b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh
2602b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh/*
2603b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh * Give never-used clusters back to the global bitmap.  We don't need
2604b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh * to protect these bits in the undo buffer.
2605b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh */
2606b4414eea0e7b9c134262c801a87e338bf675962cMark Fashehint ocfs2_release_clusters(handle_t *handle,
2607b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			   struct inode *bitmap_inode,
2608b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			   struct buffer_head *bitmap_bh,
2609b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			   u64 start_blk,
2610b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh			   unsigned int num_clusters)
2611b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh{
2612b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh	return _ocfs2_free_clusters(handle, bitmap_inode, bitmap_bh,
2613b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				    start_blk, num_clusters,
2614b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh				    _ocfs2_clear_bit);
2615b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh}
2616b4414eea0e7b9c134262c801a87e338bf675962cMark Fasheh
2617ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline void ocfs2_debug_bg(struct ocfs2_group_desc *bg)
2618ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2619ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("Block Group:\n");
2620ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("bg_signature:       %s\n", bg->bg_signature);
2621ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("bg_size:            %u\n", bg->bg_size);
2622ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("bg_bits:            %u\n", bg->bg_bits);
2623ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("bg_free_bits_count: %u\n", bg->bg_free_bits_count);
2624ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("bg_chain:           %u\n", bg->bg_chain);
2625ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("bg_generation:      %u\n", le32_to_cpu(bg->bg_generation));
2626b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	printk("bg_next_group:      %llu\n",
2627b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	       (unsigned long long)bg->bg_next_group);
2628b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	printk("bg_parent_dinode:   %llu\n",
2629b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	       (unsigned long long)bg->bg_parent_dinode);
2630b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	printk("bg_blkno:           %llu\n",
2631b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	       (unsigned long long)bg->bg_blkno);
2632ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2633ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2634ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fashehstatic inline void ocfs2_debug_suballoc_inode(struct ocfs2_dinode *fe)
2635ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh{
2636ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	int i;
2637ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh
2638b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	printk("Suballoc Inode %llu:\n", (unsigned long long)fe->i_blkno);
2639ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("i_signature:                  %s\n", fe->i_signature);
2640b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	printk("i_size:                       %llu\n",
2641b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh	       (unsigned long long)fe->i_size);
2642ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("i_clusters:                   %u\n", fe->i_clusters);
2643ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("i_generation:                 %u\n",
2644ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	       le32_to_cpu(fe->i_generation));
2645ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("id1.bitmap1.i_used:           %u\n",
2646ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	       le32_to_cpu(fe->id1.bitmap1.i_used));
2647ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("id1.bitmap1.i_total:          %u\n",
2648ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	       le32_to_cpu(fe->id1.bitmap1.i_total));
2649ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("id2.i_chain.cl_cpg:           %u\n", fe->id2.i_chain.cl_cpg);
2650ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("id2.i_chain.cl_bpc:           %u\n", fe->id2.i_chain.cl_bpc);
2651ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("id2.i_chain.cl_count:         %u\n", fe->id2.i_chain.cl_count);
2652ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	printk("id2.i_chain.cl_next_free_rec: %u\n",
2653ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	       fe->id2.i_chain.cl_next_free_rec);
2654ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	for(i = 0; i < fe->id2.i_chain.cl_next_free_rec; i++) {
2655ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		printk("fe->id2.i_chain.cl_recs[%d].c_free:  %u\n", i,
2656ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		       fe->id2.i_chain.cl_recs[i].c_free);
2657ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		printk("fe->id2.i_chain.cl_recs[%d].c_total: %u\n", i,
2658ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh		       fe->id2.i_chain.cl_recs[i].c_total);
2659b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh		printk("fe->id2.i_chain.cl_recs[%d].c_blkno: %llu\n", i,
2660b0697053f9e8de9cea3d510d9e290851ece9460bMark Fasheh		       (unsigned long long)fe->id2.i_chain.cl_recs[i].c_blkno);
2661ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh	}
2662ccd979bdbce9fba8412beb3f1de68a9d0171b12cMark Fasheh}
2663e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2664e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma/*
2665e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma * For a given allocation, determine which allocators will need to be
2666e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma * accessed, and lock them, reserving the appropriate number of bits.
2667e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma *
2668e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma * Sparse file systems call this from ocfs2_write_begin_nolock()
2669e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma * and ocfs2_allocate_unwritten_extents().
2670e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma *
2671e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma * File systems which don't support holes call this from
2672e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma * ocfs2_extend_allocation().
2673e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma */
2674f99b9b7ccf6a691f653cec45f36bfdd1e94769c7Joel Beckerint ocfs2_lock_allocators(struct inode *inode,
2675f99b9b7ccf6a691f653cec45f36bfdd1e94769c7Joel Becker			  struct ocfs2_extent_tree *et,
2676e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma			  u32 clusters_to_add, u32 extents_to_split,
2677e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma			  struct ocfs2_alloc_context **data_ac,
2678f99b9b7ccf6a691f653cec45f36bfdd1e94769c7Joel Becker			  struct ocfs2_alloc_context **meta_ac)
2679e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma{
2680e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	int ret = 0, num_free_extents;
2681e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	unsigned int max_recs_needed = clusters_to_add + 2 * extents_to_split;
2682e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
2683e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2684e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	*meta_ac = NULL;
2685e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	if (data_ac)
2686e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		*data_ac = NULL;
2687e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2688e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	BUG_ON(clusters_to_add != 0 && data_ac == NULL);
2689e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
26903d03a305ded8057155bd3c801e64ffef9f534827Joel Becker	num_free_extents = ocfs2_num_free_extents(osb, et);
2691e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	if (num_free_extents < 0) {
2692e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		ret = num_free_extents;
2693e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		mlog_errno(ret);
2694e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		goto out;
2695e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	}
2696e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2697e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	/*
2698e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * Sparse allocation file systems need to be more conservative
2699e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * with reserving room for expansion - the actual allocation
2700e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * happens while we've got a journal handle open so re-taking
2701e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * a cluster lock (because we ran out of room for another
2702e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * extent) will violate ordering rules.
2703e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 *
2704e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * Most of the time we'll only be seeing this 1 cluster at a time
2705e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * anyway.
2706e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 *
2707e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * Always lock for any unwritten extents - we might want to
2708e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 * add blocks during a split.
2709e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	 */
2710e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	if (!num_free_extents ||
2711e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	    (ocfs2_sparse_alloc(osb) && num_free_extents < max_recs_needed)) {
2712f99b9b7ccf6a691f653cec45f36bfdd1e94769c7Joel Becker		ret = ocfs2_reserve_new_metadata(osb, et->et_root_el, meta_ac);
2713e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		if (ret < 0) {
2714e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma			if (ret != -ENOSPC)
2715e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma				mlog_errno(ret);
2716e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma			goto out;
2717e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		}
2718e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	}
2719e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2720e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	if (clusters_to_add == 0)
2721e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		goto out;
2722e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2723e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	ret = ocfs2_reserve_clusters(osb, clusters_to_add, data_ac);
2724e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	if (ret < 0) {
2725e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		if (ret != -ENOSPC)
2726e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma			mlog_errno(ret);
2727e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		goto out;
2728e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	}
2729e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2730e7d4cb6bc19658646357eeff134645cd9bc3479fTao Maout:
2731e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	if (ret) {
2732e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		if (*meta_ac) {
2733e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma			ocfs2_free_alloc_context(*meta_ac);
2734e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma			*meta_ac = NULL;
2735e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		}
2736e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2737e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		/*
2738e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		 * We cannot have an error and a non null *data_ac.
2739e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma		 */
2740e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	}
2741e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma
2742e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma	return ret;
2743e7d4cb6bc19658646357eeff134645cd9bc3479fTao Ma}
27446ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27456ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang/*
27466ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * Read the inode specified by blkno to get suballoc_slot and
27476ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * suballoc_bit.
27486ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang */
27496ca497a83e592d64e050c4d04b6dedb8c915f39awengang wangstatic int ocfs2_get_suballoc_slot_bit(struct ocfs2_super *osb, u64 blkno,
2750889f004a8c83d515f275078687f859bc0d5ede9dTao Ma				       u16 *suballoc_slot, u64 *group_blkno,
2751889f004a8c83d515f275078687f859bc0d5ede9dTao Ma				       u16 *suballoc_bit)
27526ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang{
27536ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	int status;
27546ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	struct buffer_head *inode_bh = NULL;
27556ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	struct ocfs2_dinode *inode_fe;
27566ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27572f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_get_suballoc_slot_bit((unsigned long long)blkno);
27586ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27596ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	/* dirty read disk */
27606ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	status = ocfs2_read_blocks_sync(osb, blkno, 1, &inode_bh);
27616ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (status < 0) {
27625b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		mlog(ML_ERROR, "read block %llu failed %d\n",
27635b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		     (unsigned long long)blkno, status);
27646ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
27656ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
27666ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27676ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	inode_fe = (struct ocfs2_dinode *) inode_bh->b_data;
27686ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (!OCFS2_IS_VALID_DINODE(inode_fe)) {
27695b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		mlog(ML_ERROR, "invalid inode %llu requested\n",
27705b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		     (unsigned long long)blkno);
27716ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		status = -EINVAL;
27726ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
27736ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
27746ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27750fba813748f16f4eaf24d492c505226c4026d58fTao Ma	if (le16_to_cpu(inode_fe->i_suballoc_slot) != (u16)OCFS2_INVALID_SLOT &&
27766ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	    (u32)le16_to_cpu(inode_fe->i_suballoc_slot) > osb->max_slots - 1) {
27776ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		mlog(ML_ERROR, "inode %llu has invalid suballoc slot %u\n",
27785b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		     (unsigned long long)blkno,
27795b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		     (u32)le16_to_cpu(inode_fe->i_suballoc_slot));
27806ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		status = -EINVAL;
27816ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
27826ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
27836ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27846ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (suballoc_slot)
27856ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		*suballoc_slot = le16_to_cpu(inode_fe->i_suballoc_slot);
27866ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (suballoc_bit)
27876ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		*suballoc_bit = le16_to_cpu(inode_fe->i_suballoc_bit);
2788889f004a8c83d515f275078687f859bc0d5ede9dTao Ma	if (group_blkno)
2789889f004a8c83d515f275078687f859bc0d5ede9dTao Ma		*group_blkno = le64_to_cpu(inode_fe->i_suballoc_loc);
27906ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27916ca497a83e592d64e050c4d04b6dedb8c915f39awengang wangbail:
27926ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	brelse(inode_bh);
27936ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
2794c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2795c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
27966ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	return status;
27976ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang}
27986ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
27996ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang/*
28006ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * test whether bit is SET in allocator bitmap or not.  on success, 0
28016ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * is returned and *res is 1 for SET; 0 otherwise.  when fails, errno
28026ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * is returned and *res is meaningless.  Call this after you have
28036ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * cluster locked against suballoc, or you may get a result based on
28046ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * non-up2date contents
28056ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang */
28066ca497a83e592d64e050c4d04b6dedb8c915f39awengang wangstatic int ocfs2_test_suballoc_bit(struct ocfs2_super *osb,
28076ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang				   struct inode *suballoc,
2808889f004a8c83d515f275078687f859bc0d5ede9dTao Ma				   struct buffer_head *alloc_bh,
2809889f004a8c83d515f275078687f859bc0d5ede9dTao Ma				   u64 group_blkno, u64 blkno,
28106ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang				   u16 bit, int *res)
28116ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang{
2812abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma	struct ocfs2_dinode *alloc_di;
28136ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	struct ocfs2_group_desc *group;
28146ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	struct buffer_head *group_bh = NULL;
28156ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	u64 bg_blkno;
28166ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	int status;
28176ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28182f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_test_suballoc_bit((unsigned long long)blkno,
28192f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma				      (unsigned int)bit);
28206ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
2821abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma	alloc_di = (struct ocfs2_dinode *)alloc_bh->b_data;
2822abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma	if ((bit + 1) > ocfs2_bits_per_group(&alloc_di->id2.i_chain)) {
28236ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		mlog(ML_ERROR, "suballoc bit %u out of range of %u\n",
28246ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		     (unsigned int)bit,
2825abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma		     ocfs2_bits_per_group(&alloc_di->id2.i_chain));
28266ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		status = -EINVAL;
28276ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
28286ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
28296ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
2830889f004a8c83d515f275078687f859bc0d5ede9dTao Ma	bg_blkno = group_blkno ? group_blkno :
2831889f004a8c83d515f275078687f859bc0d5ede9dTao Ma		   ocfs2_which_suballoc_group(blkno, bit);
2832abf1b3cb5b20fbad27ca9c7497235eeb4dd3f4fdTao Ma	status = ocfs2_read_group_descriptor(suballoc, alloc_di, bg_blkno,
28336ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang					     &group_bh);
28346ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (status < 0) {
28355b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		mlog(ML_ERROR, "read group %llu failed %d\n",
28365b09b507daaa882d888b6cd78ee89ba9caace44bJoel Becker		     (unsigned long long)bg_blkno, status);
28376ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
28386ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
28396ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28406ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	group = (struct ocfs2_group_desc *) group_bh->b_data;
28416ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	*res = ocfs2_test_bit(bit, (unsigned long *)group->bg_bitmap);
28426ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28436ca497a83e592d64e050c4d04b6dedb8c915f39awengang wangbail:
28446ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	brelse(group_bh);
28456ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
2846c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2847c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
28486ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	return status;
28496ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang}
28506ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28516ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang/*
28526ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * Test if the bit representing this inode (blkno) is set in the
28536ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * suballocator.
28546ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang *
28556ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * On success, 0 is returned and *res is 1 for SET; 0 otherwise.
28566ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang *
28576ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * In the event of failure, a negative value is returned and *res is
28586ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * meaningless.
28596ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang *
28606ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * Callers must make sure to hold nfs_sync_lock to prevent
28616ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * ocfs2_delete_inode() on another node from accessing the same
28626ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang * suballocator concurrently.
28636ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang */
28646ca497a83e592d64e050c4d04b6dedb8c915f39awengang wangint ocfs2_test_inode_bit(struct ocfs2_super *osb, u64 blkno, int *res)
28656ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang{
28666ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	int status;
2867889f004a8c83d515f275078687f859bc0d5ede9dTao Ma	u64 group_blkno = 0;
28686ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	u16 suballoc_bit = 0, suballoc_slot = 0;
28696ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	struct inode *inode_alloc_inode;
28706ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	struct buffer_head *alloc_bh = NULL;
28716ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28722f73e135b83c5001dad84cbd1d445d23fd045b83Tao Ma	trace_ocfs2_test_inode_bit((unsigned long long)blkno);
28736ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28746ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	status = ocfs2_get_suballoc_slot_bit(osb, blkno, &suballoc_slot,
2875889f004a8c83d515f275078687f859bc0d5ede9dTao Ma					     &group_blkno, &suballoc_bit);
28766ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (status < 0) {
28776ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		mlog(ML_ERROR, "get alloc slot and bit failed %d\n", status);
28786ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
28796ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
28806ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28816ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	inode_alloc_inode =
28826ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		ocfs2_get_system_file_inode(osb, INODE_ALLOC_SYSTEM_INODE,
28836ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang					    suballoc_slot);
28846ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (!inode_alloc_inode) {
28856ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		/* the error code could be inaccurate, but we are not able to
28866ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		 * get the correct one. */
28876ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		status = -EINVAL;
28886ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		mlog(ML_ERROR, "unable to get alloc inode in slot %u\n",
28896ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		     (u32)suballoc_slot);
28906ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
28916ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
28926ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
28936ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	mutex_lock(&inode_alloc_inode->i_mutex);
28946ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	status = ocfs2_inode_lock(inode_alloc_inode, &alloc_bh, 0);
28956ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (status < 0) {
28966ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		mutex_unlock(&inode_alloc_inode->i_mutex);
28977dc3e83901b342ea7fe36262329c3784f2937361jiangyiwen		iput(inode_alloc_inode);
28986ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		mlog(ML_ERROR, "lock on alloc inode on slot %u failed %d\n",
28996ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		     (u32)suballoc_slot, status);
29006ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		goto bail;
29016ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	}
29026ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
29036ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	status = ocfs2_test_suballoc_bit(osb, inode_alloc_inode, alloc_bh,
2904889f004a8c83d515f275078687f859bc0d5ede9dTao Ma					 group_blkno, blkno, suballoc_bit, res);
29056ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	if (status < 0)
29066ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang		mlog(ML_ERROR, "test suballoc bit failed %d\n", status);
29076ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
29086ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	ocfs2_inode_unlock(inode_alloc_inode, 0);
29096ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	mutex_unlock(&inode_alloc_inode->i_mutex);
29106ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang
29116ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	iput(inode_alloc_inode);
29126ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	brelse(alloc_bh);
29136ca497a83e592d64e050c4d04b6dedb8c915f39awengang wangbail:
2914c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma	if (status)
2915c1e8d35ef5ffb393b94a192034b5e3541e005d75Tao Ma		mlog_errno(status);
29166ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang	return status;
29176ca497a83e592d64e050c4d04b6dedb8c915f39awengang wang}
2918