super.c revision 4c05141df57f4ffc1a9a28f1925434924179bfe4
1/*
2 * Copyright 2000 by Hans Reiser, licensing governed by reiserfs/README
3 *
4 * Trivial changes by Alan Cox to add the LFS fixes
5 *
6 * Trivial Changes:
7 * Rights granted to Hans Reiser to redistribute under other terms providing
8 * he accepts all liability including but not limited to patent, fitness
9 * for purpose, and direct or indirect claims arising from failure to perform.
10 *
11 * NO WARRANTY
12 */
13
14#include <linux/module.h>
15#include <linux/slab.h>
16#include <linux/vmalloc.h>
17#include <linux/time.h>
18#include <asm/uaccess.h>
19#include "reiserfs.h"
20#include "acl.h"
21#include "xattr.h"
22#include <linux/init.h>
23#include <linux/blkdev.h>
24#include <linux/buffer_head.h>
25#include <linux/exportfs.h>
26#include <linux/quotaops.h>
27#include <linux/vfs.h>
28#include <linux/mount.h>
29#include <linux/namei.h>
30#include <linux/crc32.h>
31#include <linux/seq_file.h>
32
33struct file_system_type reiserfs_fs_type;
34
35static const char reiserfs_3_5_magic_string[] = REISERFS_SUPER_MAGIC_STRING;
36static const char reiserfs_3_6_magic_string[] = REISER2FS_SUPER_MAGIC_STRING;
37static const char reiserfs_jr_magic_string[] = REISER2FS_JR_SUPER_MAGIC_STRING;
38
39int is_reiserfs_3_5(struct reiserfs_super_block *rs)
40{
41	return !strncmp(rs->s_v1.s_magic, reiserfs_3_5_magic_string,
42			strlen(reiserfs_3_5_magic_string));
43}
44
45int is_reiserfs_3_6(struct reiserfs_super_block *rs)
46{
47	return !strncmp(rs->s_v1.s_magic, reiserfs_3_6_magic_string,
48			strlen(reiserfs_3_6_magic_string));
49}
50
51int is_reiserfs_jr(struct reiserfs_super_block *rs)
52{
53	return !strncmp(rs->s_v1.s_magic, reiserfs_jr_magic_string,
54			strlen(reiserfs_jr_magic_string));
55}
56
/* Return 1 when the super block carries any of the known magic strings. */
static int is_any_reiserfs_magic_string(struct reiserfs_super_block *rs)
{
	if (is_reiserfs_3_5(rs))
		return 1;
	if (is_reiserfs_3_6(rs))
		return 1;
	return is_reiserfs_jr(rs) != 0;
}
62
63static int reiserfs_remount(struct super_block *s, int *flags, char *data);
64static int reiserfs_statfs(struct dentry *dentry, struct kstatfs *buf);
65void show_alloc_options(struct seq_file *seq, struct super_block *s);
66
67static int reiserfs_sync_fs(struct super_block *s, int wait)
68{
69	struct reiserfs_transaction_handle th;
70
71	/*
72	 * Writeback quota in non-journalled quota case - journalled quota has
73	 * no dirty dquots
74	 */
75	dquot_writeback_dquots(s, -1);
76	reiserfs_write_lock(s);
77	if (!journal_begin(&th, s, 1))
78		if (!journal_end_sync(&th, s, 1))
79			reiserfs_flush_old_commits(s);
80	reiserfs_write_unlock(s);
81	return 0;
82}
83
84static void flush_old_commits(struct work_struct *work)
85{
86	struct reiserfs_sb_info *sbi;
87	struct super_block *s;
88
89	sbi = container_of(work, struct reiserfs_sb_info, old_work.work);
90	s = sbi->s_journal->j_work_sb;
91
92	spin_lock(&sbi->old_work_lock);
93	sbi->work_queued = 0;
94	spin_unlock(&sbi->old_work_lock);
95
96	reiserfs_sync_fs(s, 1);
97}
98
99void reiserfs_schedule_old_flush(struct super_block *s)
100{
101	struct reiserfs_sb_info *sbi = REISERFS_SB(s);
102	unsigned long delay;
103
104	if (s->s_flags & MS_RDONLY)
105		return;
106
107	spin_lock(&sbi->old_work_lock);
108	if (!sbi->work_queued) {
109		delay = msecs_to_jiffies(dirty_writeback_interval * 10);
110		queue_delayed_work(system_long_wq, &sbi->old_work, delay);
111		sbi->work_queued = 1;
112	}
113	spin_unlock(&sbi->old_work_lock);
114}
115
116static void cancel_old_flush(struct super_block *s)
117{
118	struct reiserfs_sb_info *sbi = REISERFS_SB(s);
119
120	cancel_delayed_work_sync(&REISERFS_SB(s)->old_work);
121	spin_lock(&sbi->old_work_lock);
122	sbi->work_queued = 0;
123	spin_unlock(&sbi->old_work_lock);
124}
125
126static int reiserfs_freeze(struct super_block *s)
127{
128	struct reiserfs_transaction_handle th;
129
130	cancel_old_flush(s);
131
132	reiserfs_write_lock(s);
133	if (!(s->s_flags & MS_RDONLY)) {
134		int err = journal_begin(&th, s, 1);
135		if (err) {
136			reiserfs_block_writes(&th);
137		} else {
138			reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s),
139						     1);
140			journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB(s));
141			reiserfs_block_writes(&th);
142			journal_end_sync(&th, s, 1);
143		}
144	}
145	reiserfs_write_unlock(s);
146	return 0;
147}
148
/* ->unfreeze_fs: let writes proceed again. Always returns 0. */
static int reiserfs_unfreeze(struct super_block *s)
{
	reiserfs_allow_writes(s);

	return 0;
}
154
155extern const struct in_core_key MAX_IN_CORE_KEY;
156
157/* this is used to delete "save link" when there are no items of a
158   file it points to. It can either happen if unlink is completed but
159   "save unlink" removal, or if file has both unlink and truncate
160   pending and as unlink completes first (because key of "save link"
161   protecting unlink is bigger that a key lf "save link" which
162   protects truncate), so there left no items to make truncate
163   completion on */
164static int remove_save_link_only(struct super_block *s,
165				 struct reiserfs_key *key, int oid_free)
166{
167	struct reiserfs_transaction_handle th;
168	int err;
169
170	/* we are going to do one balancing */
171	err = journal_begin(&th, s, JOURNAL_PER_BALANCE_CNT);
172	if (err)
173		return err;
174
175	reiserfs_delete_solid_item(&th, NULL, key);
176	if (oid_free)
177		/* removals are protected by direct items */
178		reiserfs_release_objectid(&th, le32_to_cpu(key->k_objectid));
179
180	return journal_end(&th, s, JOURNAL_PER_BALANCE_CNT);
181}
182
183#ifdef CONFIG_QUOTA
184static int reiserfs_quota_on_mount(struct super_block *, int);
185#endif
186
187/* look for uncompleted unlinks and truncates and complete them */
188static int finish_unfinished(struct super_block *s)
189{
190	INITIALIZE_PATH(path);
191	struct cpu_key max_cpu_key, obj_key;
192	struct reiserfs_key save_link_key, last_inode_key;
193	int retval = 0;
194	struct item_head *ih;
195	struct buffer_head *bh;
196	int item_pos;
197	char *item;
198	int done;
199	struct inode *inode;
200	int truncate;
201#ifdef CONFIG_QUOTA
202	int i;
203	int ms_active_set;
204	int quota_enabled[MAXQUOTAS];
205#endif
206
207	/* compose key to look for "save" links */
208	max_cpu_key.version = KEY_FORMAT_3_5;
209	max_cpu_key.on_disk_key.k_dir_id = ~0U;
210	max_cpu_key.on_disk_key.k_objectid = ~0U;
211	set_cpu_key_k_offset(&max_cpu_key, ~0U);
212	max_cpu_key.key_length = 3;
213
214	memset(&last_inode_key, 0, sizeof(last_inode_key));
215
216#ifdef CONFIG_QUOTA
217	/* Needed for iput() to work correctly and not trash data */
218	if (s->s_flags & MS_ACTIVE) {
219		ms_active_set = 0;
220	} else {
221		ms_active_set = 1;
222		s->s_flags |= MS_ACTIVE;
223	}
224	/* Turn on quotas so that they are updated correctly */
225	for (i = 0; i < MAXQUOTAS; i++) {
226		quota_enabled[i] = 1;
227		if (REISERFS_SB(s)->s_qf_names[i]) {
228			int ret;
229
230			if (sb_has_quota_active(s, i)) {
231				quota_enabled[i] = 0;
232				continue;
233			}
234			ret = reiserfs_quota_on_mount(s, i);
235			if (ret < 0)
236				reiserfs_warning(s, "reiserfs-2500",
237						 "cannot turn on journaled "
238						 "quota: error %d", ret);
239		}
240	}
241#endif
242
243	done = 0;
244	REISERFS_SB(s)->s_is_unlinked_ok = 1;
245	while (!retval) {
246		retval = search_item(s, &max_cpu_key, &path);
247		if (retval != ITEM_NOT_FOUND) {
248			reiserfs_error(s, "vs-2140",
249				       "search_by_key returned %d", retval);
250			break;
251		}
252
253		bh = get_last_bh(&path);
254		item_pos = get_item_pos(&path);
255		if (item_pos != B_NR_ITEMS(bh)) {
256			reiserfs_warning(s, "vs-2060",
257					 "wrong position found");
258			break;
259		}
260		item_pos--;
261		ih = B_N_PITEM_HEAD(bh, item_pos);
262
263		if (le32_to_cpu(ih->ih_key.k_dir_id) != MAX_KEY_OBJECTID)
264			/* there are no "save" links anymore */
265			break;
266
267		save_link_key = ih->ih_key;
268		if (is_indirect_le_ih(ih))
269			truncate = 1;
270		else
271			truncate = 0;
272
273		/* reiserfs_iget needs k_dirid and k_objectid only */
274		item = B_I_PITEM(bh, ih);
275		obj_key.on_disk_key.k_dir_id = le32_to_cpu(*(__le32 *) item);
276		obj_key.on_disk_key.k_objectid =
277		    le32_to_cpu(ih->ih_key.k_objectid);
278		obj_key.on_disk_key.k_offset = 0;
279		obj_key.on_disk_key.k_type = 0;
280
281		pathrelse(&path);
282
283		inode = reiserfs_iget(s, &obj_key);
284		if (!inode) {
285			/* the unlink almost completed, it just did not manage to remove
286			   "save" link and release objectid */
287			reiserfs_warning(s, "vs-2180", "iget failed for %K",
288					 &obj_key);
289			retval = remove_save_link_only(s, &save_link_key, 1);
290			continue;
291		}
292
293		if (!truncate && inode->i_nlink) {
294			/* file is not unlinked */
295			reiserfs_warning(s, "vs-2185",
296					 "file %K is not unlinked",
297					 &obj_key);
298			retval = remove_save_link_only(s, &save_link_key, 0);
299			continue;
300		}
301		reiserfs_write_unlock(s);
302		dquot_initialize(inode);
303		reiserfs_write_lock(s);
304
305		if (truncate && S_ISDIR(inode->i_mode)) {
306			/* We got a truncate request for a dir which is impossible.
307			   The only imaginable way is to execute unfinished truncate request
308			   then boot into old kernel, remove the file and create dir with
309			   the same key. */
310			reiserfs_warning(s, "green-2101",
311					 "impossible truncate on a "
312					 "directory %k. Please report",
313					 INODE_PKEY(inode));
314			retval = remove_save_link_only(s, &save_link_key, 0);
315			truncate = 0;
316			iput(inode);
317			continue;
318		}
319
320		if (truncate) {
321			REISERFS_I(inode)->i_flags |=
322			    i_link_saved_truncate_mask;
323			/* not completed truncate found. New size was committed together
324			   with "save" link */
325			reiserfs_info(s, "Truncating %k to %Ld ..",
326				      INODE_PKEY(inode), inode->i_size);
327			reiserfs_truncate_file(inode,
328					       0
329					       /*don't update modification time */
330					       );
331			retval = remove_save_link(inode, truncate);
332		} else {
333			REISERFS_I(inode)->i_flags |= i_link_saved_unlink_mask;
334			/* not completed unlink (rmdir) found */
335			reiserfs_info(s, "Removing %k..", INODE_PKEY(inode));
336			if (memcmp(&last_inode_key, INODE_PKEY(inode),
337					sizeof(last_inode_key))){
338				last_inode_key = *INODE_PKEY(inode);
339				/* removal gets completed in iput */
340				retval = 0;
341			} else {
342				reiserfs_warning(s, "super-2189", "Dead loop "
343						 "in finish_unfinished "
344						 "detected, just remove "
345						 "save link\n");
346				retval = remove_save_link_only(s,
347							&save_link_key, 0);
348			}
349		}
350
351		iput(inode);
352		printk("done\n");
353		done++;
354	}
355	REISERFS_SB(s)->s_is_unlinked_ok = 0;
356
357#ifdef CONFIG_QUOTA
358	/* Turn quotas off */
359	for (i = 0; i < MAXQUOTAS; i++) {
360		if (sb_dqopt(s)->files[i] && quota_enabled[i])
361			dquot_quota_off(s, i);
362	}
363	if (ms_active_set)
364		/* Restore the flag back */
365		s->s_flags &= ~MS_ACTIVE;
366#endif
367	pathrelse(&path);
368	if (done)
369		reiserfs_info(s, "There were %d uncompleted unlinks/truncates. "
370			      "Completed\n", done);
371	return retval;
372}
373
374/* to protect file being unlinked from getting lost we "safe" link files
375   being unlinked. This link will be deleted in the same transaction with last
376   item of file. mounting the filesystem we scan all these links and remove
377   files which almost got lost */
378void add_save_link(struct reiserfs_transaction_handle *th,
379		   struct inode *inode, int truncate)
380{
381	INITIALIZE_PATH(path);
382	int retval;
383	struct cpu_key key;
384	struct item_head ih;
385	__le32 link;
386
387	BUG_ON(!th->t_trans_id);
388
389	/* file can only get one "save link" of each kind */
390	RFALSE(truncate &&
391	       (REISERFS_I(inode)->i_flags & i_link_saved_truncate_mask),
392	       "saved link already exists for truncated inode %lx",
393	       (long)inode->i_ino);
394	RFALSE(!truncate &&
395	       (REISERFS_I(inode)->i_flags & i_link_saved_unlink_mask),
396	       "saved link already exists for unlinked inode %lx",
397	       (long)inode->i_ino);
398
399	/* setup key of "save" link */
400	key.version = KEY_FORMAT_3_5;
401	key.on_disk_key.k_dir_id = MAX_KEY_OBJECTID;
402	key.on_disk_key.k_objectid = inode->i_ino;
403	if (!truncate) {
404		/* unlink, rmdir, rename */
405		set_cpu_key_k_offset(&key, 1 + inode->i_sb->s_blocksize);
406		set_cpu_key_k_type(&key, TYPE_DIRECT);
407
408		/* item head of "safe" link */
409		make_le_item_head(&ih, &key, key.version,
410				  1 + inode->i_sb->s_blocksize, TYPE_DIRECT,
411				  4 /*length */ , 0xffff /*free space */ );
412	} else {
413		/* truncate */
414		if (S_ISDIR(inode->i_mode))
415			reiserfs_warning(inode->i_sb, "green-2102",
416					 "Adding a truncate savelink for "
417					 "a directory %k! Please report",
418					 INODE_PKEY(inode));
419		set_cpu_key_k_offset(&key, 1);
420		set_cpu_key_k_type(&key, TYPE_INDIRECT);
421
422		/* item head of "safe" link */
423		make_le_item_head(&ih, &key, key.version, 1, TYPE_INDIRECT,
424				  4 /*length */ , 0 /*free space */ );
425	}
426	key.key_length = 3;
427
428	/* look for its place in the tree */
429	retval = search_item(inode->i_sb, &key, &path);
430	if (retval != ITEM_NOT_FOUND) {
431		if (retval != -ENOSPC)
432			reiserfs_error(inode->i_sb, "vs-2100",
433				       "search_by_key (%K) returned %d", &key,
434				       retval);
435		pathrelse(&path);
436		return;
437	}
438
439	/* body of "save" link */
440	link = INODE_PKEY(inode)->k_dir_id;
441
442	/* put "save" link into tree, don't charge quota to anyone */
443	retval =
444	    reiserfs_insert_item(th, &path, &key, &ih, NULL, (char *)&link);
445	if (retval) {
446		if (retval != -ENOSPC)
447			reiserfs_error(inode->i_sb, "vs-2120",
448				       "insert_item returned %d", retval);
449	} else {
450		if (truncate)
451			REISERFS_I(inode)->i_flags |=
452			    i_link_saved_truncate_mask;
453		else
454			REISERFS_I(inode)->i_flags |= i_link_saved_unlink_mask;
455	}
456}
457
458/* this opens transaction unlike add_save_link */
459int remove_save_link(struct inode *inode, int truncate)
460{
461	struct reiserfs_transaction_handle th;
462	struct reiserfs_key key;
463	int err;
464
465	/* we are going to do one balancing only */
466	err = journal_begin(&th, inode->i_sb, JOURNAL_PER_BALANCE_CNT);
467	if (err)
468		return err;
469
470	/* setup key of "save" link */
471	key.k_dir_id = cpu_to_le32(MAX_KEY_OBJECTID);
472	key.k_objectid = INODE_PKEY(inode)->k_objectid;
473	if (!truncate) {
474		/* unlink, rmdir, rename */
475		set_le_key_k_offset(KEY_FORMAT_3_5, &key,
476				    1 + inode->i_sb->s_blocksize);
477		set_le_key_k_type(KEY_FORMAT_3_5, &key, TYPE_DIRECT);
478	} else {
479		/* truncate */
480		set_le_key_k_offset(KEY_FORMAT_3_5, &key, 1);
481		set_le_key_k_type(KEY_FORMAT_3_5, &key, TYPE_INDIRECT);
482	}
483
484	if ((truncate &&
485	     (REISERFS_I(inode)->i_flags & i_link_saved_truncate_mask)) ||
486	    (!truncate &&
487	     (REISERFS_I(inode)->i_flags & i_link_saved_unlink_mask)))
488		/* don't take quota bytes from anywhere */
489		reiserfs_delete_solid_item(&th, NULL, &key);
490	if (!truncate) {
491		reiserfs_release_objectid(&th, inode->i_ino);
492		REISERFS_I(inode)->i_flags &= ~i_link_saved_unlink_mask;
493	} else
494		REISERFS_I(inode)->i_flags &= ~i_link_saved_truncate_mask;
495
496	return journal_end(&th, inode->i_sb, JOURNAL_PER_BALANCE_CNT);
497}
498
499static void reiserfs_kill_sb(struct super_block *s)
500{
501	if (REISERFS_SB(s)) {
502		/*
503		 * Force any pending inode evictions to occur now. Any
504		 * inodes to be removed that have extended attributes
505		 * associated with them need to clean them up before
506		 * we can release the extended attribute root dentries.
507		 * shrink_dcache_for_umount will BUG if we don't release
508		 * those before it's called so ->put_super is too late.
509		 */
510		shrink_dcache_sb(s);
511
512		dput(REISERFS_SB(s)->xattr_root);
513		REISERFS_SB(s)->xattr_root = NULL;
514		dput(REISERFS_SB(s)->priv_root);
515		REISERFS_SB(s)->priv_root = NULL;
516	}
517
518	kill_block_super(s);
519}
520
521static void reiserfs_put_super(struct super_block *s)
522{
523	struct reiserfs_transaction_handle th;
524	th.t_trans_id = 0;
525
526	dquot_disable(s, -1, DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED);
527
528	reiserfs_write_lock(s);
529
530	/* change file system state to current state if it was mounted with read-write permissions */
531	if (!(s->s_flags & MS_RDONLY)) {
532		if (!journal_begin(&th, s, 10)) {
533			reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s),
534						     1);
535			set_sb_umount_state(SB_DISK_SUPER_BLOCK(s),
536					    REISERFS_SB(s)->s_mount_state);
537			journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB(s));
538		}
539	}
540
541	/* note, journal_release checks for readonly mount, and can decide not
542	 ** to do a journal_end
543	 */
544	journal_release(&th, s);
545
546	reiserfs_free_bitmap_cache(s);
547
548	brelse(SB_BUFFER_WITH_SB(s));
549
550	print_statistics(s);
551
552	if (REISERFS_SB(s)->reserved_blocks != 0) {
553		reiserfs_warning(s, "green-2005", "reserved blocks left %d",
554				 REISERFS_SB(s)->reserved_blocks);
555	}
556
557	reiserfs_proc_info_done(s);
558
559	reiserfs_write_unlock(s);
560	mutex_destroy(&REISERFS_SB(s)->lock);
561	kfree(s->s_fs_info);
562	s->s_fs_info = NULL;
563}
564
565static struct kmem_cache *reiserfs_inode_cachep;
566
567static struct inode *reiserfs_alloc_inode(struct super_block *sb)
568{
569	struct reiserfs_inode_info *ei;
570	ei = (struct reiserfs_inode_info *)
571	    kmem_cache_alloc(reiserfs_inode_cachep, GFP_KERNEL);
572	if (!ei)
573		return NULL;
574	atomic_set(&ei->openers, 0);
575	mutex_init(&ei->tailpack);
576	return &ei->vfs_inode;
577}
578
579static void reiserfs_i_callback(struct rcu_head *head)
580{
581	struct inode *inode = container_of(head, struct inode, i_rcu);
582	kmem_cache_free(reiserfs_inode_cachep, REISERFS_I(inode));
583}
584
585static void reiserfs_destroy_inode(struct inode *inode)
586{
587	call_rcu(&inode->i_rcu, reiserfs_i_callback);
588}
589
590static void init_once(void *foo)
591{
592	struct reiserfs_inode_info *ei = (struct reiserfs_inode_info *)foo;
593
594	INIT_LIST_HEAD(&ei->i_prealloc_list);
595	inode_init_once(&ei->vfs_inode);
596}
597
598static int init_inodecache(void)
599{
600	reiserfs_inode_cachep = kmem_cache_create("reiser_inode_cache",
601						  sizeof(struct
602							 reiserfs_inode_info),
603						  0, (SLAB_RECLAIM_ACCOUNT|
604							SLAB_MEM_SPREAD),
605						  init_once);
606	if (reiserfs_inode_cachep == NULL)
607		return -ENOMEM;
608	return 0;
609}
610
611static void destroy_inodecache(void)
612{
613	/*
614	 * Make sure all delayed rcu free inodes are flushed before we
615	 * destroy cache.
616	 */
617	rcu_barrier();
618	kmem_cache_destroy(reiserfs_inode_cachep);
619}
620
621/* we don't mark inodes dirty, we just log them */
622static void reiserfs_dirty_inode(struct inode *inode, int flags)
623{
624	struct reiserfs_transaction_handle th;
625
626	int err = 0;
627	int lock_depth;
628
629	if (inode->i_sb->s_flags & MS_RDONLY) {
630		reiserfs_warning(inode->i_sb, "clm-6006",
631				 "writing inode %lu on readonly FS",
632				 inode->i_ino);
633		return;
634	}
635	lock_depth = reiserfs_write_lock_once(inode->i_sb);
636
637	/* this is really only used for atime updates, so they don't have
638	 ** to be included in O_SYNC or fsync
639	 */
640	err = journal_begin(&th, inode->i_sb, 1);
641	if (err)
642		goto out;
643
644	reiserfs_update_sd(&th, inode);
645	journal_end(&th, inode->i_sb, 1);
646
647out:
648	reiserfs_write_unlock_once(inode->i_sb, lock_depth);
649}
650
651static int reiserfs_show_options(struct seq_file *seq, struct dentry *root)
652{
653	struct super_block *s = root->d_sb;
654	struct reiserfs_journal *journal = SB_JOURNAL(s);
655	long opts = REISERFS_SB(s)->s_mount_opt;
656
657	if (opts & (1 << REISERFS_LARGETAIL))
658		seq_puts(seq, ",tails=on");
659	else if (!(opts & (1 << REISERFS_SMALLTAIL)))
660		seq_puts(seq, ",notail");
661	/* tails=small is default so we don't show it */
662
663	if (!(opts & (1 << REISERFS_BARRIER_FLUSH)))
664		seq_puts(seq, ",barrier=none");
665	/* barrier=flush is default so we don't show it */
666
667	if (opts & (1 << REISERFS_ERROR_CONTINUE))
668		seq_puts(seq, ",errors=continue");
669	else if (opts & (1 << REISERFS_ERROR_PANIC))
670		seq_puts(seq, ",errors=panic");
671	/* errors=ro is default so we don't show it */
672
673	if (opts & (1 << REISERFS_DATA_LOG))
674		seq_puts(seq, ",data=journal");
675	else if (opts & (1 << REISERFS_DATA_WRITEBACK))
676		seq_puts(seq, ",data=writeback");
677	/* data=ordered is default so we don't show it */
678
679	if (opts & (1 << REISERFS_ATTRS))
680		seq_puts(seq, ",attrs");
681
682	if (opts & (1 << REISERFS_XATTRS_USER))
683		seq_puts(seq, ",user_xattr");
684
685	if (opts & (1 << REISERFS_EXPOSE_PRIVROOT))
686		seq_puts(seq, ",expose_privroot");
687
688	if (opts & (1 << REISERFS_POSIXACL))
689		seq_puts(seq, ",acl");
690
691	if (REISERFS_SB(s)->s_jdev)
692		seq_printf(seq, ",jdev=%s", REISERFS_SB(s)->s_jdev);
693
694	if (journal->j_max_commit_age != journal->j_default_max_commit_age)
695		seq_printf(seq, ",commit=%d", journal->j_max_commit_age);
696
697#ifdef CONFIG_QUOTA
698	if (REISERFS_SB(s)->s_qf_names[USRQUOTA])
699		seq_printf(seq, ",usrjquota=%s", REISERFS_SB(s)->s_qf_names[USRQUOTA]);
700	else if (opts & (1 << REISERFS_USRQUOTA))
701		seq_puts(seq, ",usrquota");
702	if (REISERFS_SB(s)->s_qf_names[GRPQUOTA])
703		seq_printf(seq, ",grpjquota=%s", REISERFS_SB(s)->s_qf_names[GRPQUOTA]);
704	else if (opts & (1 << REISERFS_GRPQUOTA))
705		seq_puts(seq, ",grpquota");
706	if (REISERFS_SB(s)->s_jquota_fmt) {
707		if (REISERFS_SB(s)->s_jquota_fmt == QFMT_VFS_OLD)
708			seq_puts(seq, ",jqfmt=vfsold");
709		else if (REISERFS_SB(s)->s_jquota_fmt == QFMT_VFS_V0)
710			seq_puts(seq, ",jqfmt=vfsv0");
711	}
712#endif
713
714	/* Block allocator options */
715	if (opts & (1 << REISERFS_NO_BORDER))
716		seq_puts(seq, ",block-allocator=noborder");
717	if (opts & (1 << REISERFS_NO_UNHASHED_RELOCATION))
718		seq_puts(seq, ",block-allocator=no_unhashed_relocation");
719	if (opts & (1 << REISERFS_HASHED_RELOCATION))
720		seq_puts(seq, ",block-allocator=hashed_relocation");
721	if (opts & (1 << REISERFS_TEST4))
722		seq_puts(seq, ",block-allocator=test4");
723	show_alloc_options(seq, s);
724	return 0;
725}
726
727#ifdef CONFIG_QUOTA
728static ssize_t reiserfs_quota_write(struct super_block *, int, const char *,
729				    size_t, loff_t);
730static ssize_t reiserfs_quota_read(struct super_block *, int, char *, size_t,
731				   loff_t);
732#endif
733
734static const struct super_operations reiserfs_sops = {
735	.alloc_inode = reiserfs_alloc_inode,
736	.destroy_inode = reiserfs_destroy_inode,
737	.write_inode = reiserfs_write_inode,
738	.dirty_inode = reiserfs_dirty_inode,
739	.evict_inode = reiserfs_evict_inode,
740	.put_super = reiserfs_put_super,
741	.sync_fs = reiserfs_sync_fs,
742	.freeze_fs = reiserfs_freeze,
743	.unfreeze_fs = reiserfs_unfreeze,
744	.statfs = reiserfs_statfs,
745	.remount_fs = reiserfs_remount,
746	.show_options = reiserfs_show_options,
747#ifdef CONFIG_QUOTA
748	.quota_read = reiserfs_quota_read,
749	.quota_write = reiserfs_quota_write,
750#endif
751};
752
753#ifdef CONFIG_QUOTA
754#define QTYPE2NAME(t) ((t)==USRQUOTA?"user":"group")
755
756static int reiserfs_write_dquot(struct dquot *);
757static int reiserfs_acquire_dquot(struct dquot *);
758static int reiserfs_release_dquot(struct dquot *);
759static int reiserfs_mark_dquot_dirty(struct dquot *);
760static int reiserfs_write_info(struct super_block *, int);
761static int reiserfs_quota_on(struct super_block *, int, int, struct path *);
762
763static const struct dquot_operations reiserfs_quota_operations = {
764	.write_dquot = reiserfs_write_dquot,
765	.acquire_dquot = reiserfs_acquire_dquot,
766	.release_dquot = reiserfs_release_dquot,
767	.mark_dirty = reiserfs_mark_dquot_dirty,
768	.write_info = reiserfs_write_info,
769	.alloc_dquot	= dquot_alloc,
770	.destroy_dquot	= dquot_destroy,
771};
772
773static const struct quotactl_ops reiserfs_qctl_operations = {
774	.quota_on = reiserfs_quota_on,
775	.quota_off = dquot_quota_off,
776	.quota_sync = dquot_quota_sync,
777	.get_info = dquot_get_dqinfo,
778	.set_info = dquot_set_dqinfo,
779	.get_dqblk = dquot_get_dqblk,
780	.set_dqblk = dquot_set_dqblk,
781};
782#endif
783
784static const struct export_operations reiserfs_export_ops = {
785	.encode_fh = reiserfs_encode_fh,
786	.fh_to_dentry = reiserfs_fh_to_dentry,
787	.fh_to_parent = reiserfs_fh_to_parent,
788	.get_parent = reiserfs_get_parent,
789};
790
/*
 * Used by reiserfs_getopt() to describe one accepted value of a mount
 * option that takes a value rather than being a toggle.
 */
typedef struct {
	/* textual value as it appears after "option=" */
	char *value;
	/*
	 * bitmask to set in the mount_options bitmask when this value is
	 * found, 0 if no bits are to be changed
	 */
	int setmask;
	/*
	 * bitmask to clear in the mount_options bitmask when this value is
	 * found, 0 if no bits are to be changed. This is applied BEFORE
	 * setmask
	 */
	int clrmask;
} arg_desc_t;
801
802/* Set this bit in arg_required to allow empty arguments */
803#define REISERFS_OPT_ALLOWEMPTY 31
804
805/* this struct is used in reiserfs_getopt() for describing the set of reiserfs
806   mount options */
807typedef struct {
808	char *option_name;
809	int arg_required;	/* 0 if argument is not required, not 0 otherwise */
810	const arg_desc_t *values;	/* list of values accepted by an option */
811	int setmask;		/* bitmask which is to set on mount_options bitmask when this
812				   value is found, 0 is no bits are to be changed. */
813	int clrmask;		/* bitmask which is to clear on mount_options bitmask when  this
814				   value is found, 0 is no bits are to be changed. This is
815				   applied BEFORE setmask */
816} opt_desc_t;
817
818/* possible values for -o data= */
819static const arg_desc_t logging_mode[] = {
820	{"ordered", 1 << REISERFS_DATA_ORDERED,
821	 (1 << REISERFS_DATA_LOG | 1 << REISERFS_DATA_WRITEBACK)},
822	{"journal", 1 << REISERFS_DATA_LOG,
823	 (1 << REISERFS_DATA_ORDERED | 1 << REISERFS_DATA_WRITEBACK)},
824	{"writeback", 1 << REISERFS_DATA_WRITEBACK,
825	 (1 << REISERFS_DATA_ORDERED | 1 << REISERFS_DATA_LOG)},
826	{.value = NULL}
827};
828
829/* possible values for -o barrier= */
830static const arg_desc_t barrier_mode[] = {
831	{"none", 1 << REISERFS_BARRIER_NONE, 1 << REISERFS_BARRIER_FLUSH},
832	{"flush", 1 << REISERFS_BARRIER_FLUSH, 1 << REISERFS_BARRIER_NONE},
833	{.value = NULL}
834};
835
836/* possible values for "-o block-allocator=" and bits which are to be set in
837   s_mount_opt of reiserfs specific part of in-core super block */
838static const arg_desc_t balloc[] = {
839	{"noborder", 1 << REISERFS_NO_BORDER, 0},
840	{"border", 0, 1 << REISERFS_NO_BORDER},
841	{"no_unhashed_relocation", 1 << REISERFS_NO_UNHASHED_RELOCATION, 0},
842	{"hashed_relocation", 1 << REISERFS_HASHED_RELOCATION, 0},
843	{"test4", 1 << REISERFS_TEST4, 0},
844	{"notest4", 0, 1 << REISERFS_TEST4},
845	{NULL, 0, 0}
846};
847
848static const arg_desc_t tails[] = {
849	{"on", 1 << REISERFS_LARGETAIL, 1 << REISERFS_SMALLTAIL},
850	{"off", 0, (1 << REISERFS_LARGETAIL) | (1 << REISERFS_SMALLTAIL)},
851	{"small", 1 << REISERFS_SMALLTAIL, 1 << REISERFS_LARGETAIL},
852	{NULL, 0, 0}
853};
854
855static const arg_desc_t error_actions[] = {
856	{"panic", 1 << REISERFS_ERROR_PANIC,
857	 (1 << REISERFS_ERROR_RO | 1 << REISERFS_ERROR_CONTINUE)},
858	{"ro-remount", 1 << REISERFS_ERROR_RO,
859	 (1 << REISERFS_ERROR_PANIC | 1 << REISERFS_ERROR_CONTINUE)},
860#ifdef REISERFS_JOURNAL_ERROR_ALLOWS_NO_LOG
861	{"continue", 1 << REISERFS_ERROR_CONTINUE,
862	 (1 << REISERFS_ERROR_PANIC | 1 << REISERFS_ERROR_RO)},
863#endif
864	{NULL, 0, 0},
865};
866
867/* proceed only one option from a list *cur - string containing of mount options
868   opts - array of options which are accepted
869   opt_arg - if option is found and requires an argument and if it is specifed
870   in the input - pointer to the argument is stored here
871   bit_flags - if option requires to set a certain bit - it is set here
872   return -1 if unknown option is found, opt->arg_required otherwise */
873static int reiserfs_getopt(struct super_block *s, char **cur, opt_desc_t * opts,
874			   char **opt_arg, unsigned long *bit_flags)
875{
876	char *p;
877	/* foo=bar,
878	   ^   ^  ^
879	   |   |  +-- option_end
880	   |   +-- arg_start
881	   +-- option_start
882	 */
883	const opt_desc_t *opt;
884	const arg_desc_t *arg;
885
886	p = *cur;
887
888	/* assume argument cannot contain commas */
889	*cur = strchr(p, ',');
890	if (*cur) {
891		*(*cur) = '\0';
892		(*cur)++;
893	}
894
895	if (!strncmp(p, "alloc=", 6)) {
896		/* Ugly special case, probably we should redo options parser so that
897		   it can understand several arguments for some options, also so that
898		   it can fill several bitfields with option values. */
899		if (reiserfs_parse_alloc_options(s, p + 6)) {
900			return -1;
901		} else {
902			return 0;
903		}
904	}
905
906	/* for every option in the list */
907	for (opt = opts; opt->option_name; opt++) {
908		if (!strncmp(p, opt->option_name, strlen(opt->option_name))) {
909			if (bit_flags) {
910				if (opt->clrmask ==
911				    (1 << REISERFS_UNSUPPORTED_OPT))
912					reiserfs_warning(s, "super-6500",
913							 "%s not supported.\n",
914							 p);
915				else
916					*bit_flags &= ~opt->clrmask;
917				if (opt->setmask ==
918				    (1 << REISERFS_UNSUPPORTED_OPT))
919					reiserfs_warning(s, "super-6501",
920							 "%s not supported.\n",
921							 p);
922				else
923					*bit_flags |= opt->setmask;
924			}
925			break;
926		}
927	}
928	if (!opt->option_name) {
929		reiserfs_warning(s, "super-6502",
930				 "unknown mount option \"%s\"", p);
931		return -1;
932	}
933
934	p += strlen(opt->option_name);
935	switch (*p) {
936	case '=':
937		if (!opt->arg_required) {
938			reiserfs_warning(s, "super-6503",
939					 "the option \"%s\" does not "
940					 "require an argument\n",
941					 opt->option_name);
942			return -1;
943		}
944		break;
945
946	case 0:
947		if (opt->arg_required) {
948			reiserfs_warning(s, "super-6504",
949					 "the option \"%s\" requires an "
950					 "argument\n", opt->option_name);
951			return -1;
952		}
953		break;
954	default:
955		reiserfs_warning(s, "super-6505",
956				 "head of option \"%s\" is only correct\n",
957				 opt->option_name);
958		return -1;
959	}
960
961	/* move to the argument, or to next option if argument is not required */
962	p++;
963
964	if (opt->arg_required
965	    && !(opt->arg_required & (1 << REISERFS_OPT_ALLOWEMPTY))
966	    && !strlen(p)) {
967		/* this catches "option=," if not allowed */
968		reiserfs_warning(s, "super-6506",
969				 "empty argument for \"%s\"\n",
970				 opt->option_name);
971		return -1;
972	}
973
974	if (!opt->values) {
975		/* *=NULLopt_arg contains pointer to argument */
976		*opt_arg = p;
977		return opt->arg_required & ~(1 << REISERFS_OPT_ALLOWEMPTY);
978	}
979
980	/* values possible for this option are listed in opt->values */
981	for (arg = opt->values; arg->value; arg++) {
982		if (!strcmp(p, arg->value)) {
983			if (bit_flags) {
984				*bit_flags &= ~arg->clrmask;
985				*bit_flags |= arg->setmask;
986			}
987			return opt->arg_required;
988		}
989	}
990
991	reiserfs_warning(s, "super-6506",
992			 "bad value \"%s\" for option \"%s\"\n", p,
993			 opt->option_name);
994	return -1;
995}
996
997/* returns 0 if something is wrong in option string, 1 - otherwise */
998static int reiserfs_parse_options(struct super_block *s, char *options,	/* string given via mount's -o */
999				  unsigned long *mount_options,
1000				  /* after the parsing phase, contains the
1001				     collection of bitflags defining what
1002				     mount options were selected. */
1003				  unsigned long *blocks,	/* strtol-ed from NNN of resize=NNN */
1004				  char **jdev_name,
1005				  unsigned int *commit_max_age,
1006				  char **qf_names,
1007				  unsigned int *qfmt)
1008{
1009	int c;
1010	char *arg = NULL;
1011	char *pos;
1012	opt_desc_t opts[] = {
1013		/* Compatibility stuff, so that -o notail for old setups still work */
1014		{"tails",.arg_required = 't',.values = tails},
1015		{"notail",.clrmask =
1016		 (1 << REISERFS_LARGETAIL) | (1 << REISERFS_SMALLTAIL)},
1017		{"conv",.setmask = 1 << REISERFS_CONVERT},
1018		{"attrs",.setmask = 1 << REISERFS_ATTRS},
1019		{"noattrs",.clrmask = 1 << REISERFS_ATTRS},
1020		{"expose_privroot", .setmask = 1 << REISERFS_EXPOSE_PRIVROOT},
1021#ifdef CONFIG_REISERFS_FS_XATTR
1022		{"user_xattr",.setmask = 1 << REISERFS_XATTRS_USER},
1023		{"nouser_xattr",.clrmask = 1 << REISERFS_XATTRS_USER},
1024#else
1025		{"user_xattr",.setmask = 1 << REISERFS_UNSUPPORTED_OPT},
1026		{"nouser_xattr",.clrmask = 1 << REISERFS_UNSUPPORTED_OPT},
1027#endif
1028#ifdef CONFIG_REISERFS_FS_POSIX_ACL
1029		{"acl",.setmask = 1 << REISERFS_POSIXACL},
1030		{"noacl",.clrmask = 1 << REISERFS_POSIXACL},
1031#else
1032		{"acl",.setmask = 1 << REISERFS_UNSUPPORTED_OPT},
1033		{"noacl",.clrmask = 1 << REISERFS_UNSUPPORTED_OPT},
1034#endif
1035		{.option_name = "nolog"},
1036		{"replayonly",.setmask = 1 << REPLAYONLY},
1037		{"block-allocator",.arg_required = 'a',.values = balloc},
1038		{"data",.arg_required = 'd',.values = logging_mode},
1039		{"barrier",.arg_required = 'b',.values = barrier_mode},
1040		{"resize",.arg_required = 'r',.values = NULL},
1041		{"jdev",.arg_required = 'j',.values = NULL},
1042		{"nolargeio",.arg_required = 'w',.values = NULL},
1043		{"commit",.arg_required = 'c',.values = NULL},
1044		{"usrquota",.setmask = 1 << REISERFS_USRQUOTA},
1045		{"grpquota",.setmask = 1 << REISERFS_GRPQUOTA},
1046		{"noquota",.clrmask = 1 << REISERFS_USRQUOTA | 1 << REISERFS_GRPQUOTA},
1047		{"errors",.arg_required = 'e',.values = error_actions},
1048		{"usrjquota",.arg_required =
1049		 'u' | (1 << REISERFS_OPT_ALLOWEMPTY),.values = NULL},
1050		{"grpjquota",.arg_required =
1051		 'g' | (1 << REISERFS_OPT_ALLOWEMPTY),.values = NULL},
1052		{"jqfmt",.arg_required = 'f',.values = NULL},
1053		{.option_name = NULL}
1054	};
1055
1056	*blocks = 0;
1057	if (!options || !*options)
1058		/* use default configuration: create tails, journaling on, no
1059		   conversion to newest format */
1060		return 1;
1061
1062	for (pos = options; pos;) {
1063		c = reiserfs_getopt(s, &pos, opts, &arg, mount_options);
1064		if (c == -1)
1065			/* wrong option is given */
1066			return 0;
1067
1068		if (c == 'r') {
1069			char *p;
1070
1071			p = NULL;
1072			/* "resize=NNN" or "resize=auto" */
1073
1074			if (!strcmp(arg, "auto")) {
1075				/* From JFS code, to auto-get the size. */
1076				*blocks =
1077				    s->s_bdev->bd_inode->i_size >> s->
1078				    s_blocksize_bits;
1079			} else {
1080				*blocks = simple_strtoul(arg, &p, 0);
1081				if (*p != '\0') {
1082					/* NNN does not look like a number */
1083					reiserfs_warning(s, "super-6507",
1084							 "bad value %s for "
1085							 "-oresize\n", arg);
1086					return 0;
1087				}
1088			}
1089		}
1090
1091		if (c == 'c') {
1092			char *p = NULL;
1093			unsigned long val = simple_strtoul(arg, &p, 0);
1094			/* commit=NNN (time in seconds) */
1095			if (*p != '\0' || val >= (unsigned int)-1) {
1096				reiserfs_warning(s, "super-6508",
1097						 "bad value %s for -ocommit\n",
1098						 arg);
1099				return 0;
1100			}
1101			*commit_max_age = (unsigned int)val;
1102		}
1103
1104		if (c == 'w') {
1105			reiserfs_warning(s, "super-6509", "nolargeio option "
1106					 "is no longer supported");
1107			return 0;
1108		}
1109
1110		if (c == 'j') {
1111			if (arg && *arg && jdev_name) {
1112				if (*jdev_name) {	//Hm, already assigned?
1113					reiserfs_warning(s, "super-6510",
1114							 "journal device was "
1115							 "already specified to "
1116							 "be %s", *jdev_name);
1117					return 0;
1118				}
1119				*jdev_name = arg;
1120			}
1121		}
1122#ifdef CONFIG_QUOTA
1123		if (c == 'u' || c == 'g') {
1124			int qtype = c == 'u' ? USRQUOTA : GRPQUOTA;
1125
1126			if (sb_any_quota_loaded(s) &&
1127			    (!*arg != !REISERFS_SB(s)->s_qf_names[qtype])) {
1128				reiserfs_warning(s, "super-6511",
1129						 "cannot change journaled "
1130						 "quota options when quota "
1131						 "turned on.");
1132				return 0;
1133			}
1134			if (*arg) {	/* Some filename specified? */
1135				if (REISERFS_SB(s)->s_qf_names[qtype]
1136				    && strcmp(REISERFS_SB(s)->s_qf_names[qtype],
1137					      arg)) {
1138					reiserfs_warning(s, "super-6512",
1139							 "%s quota file "
1140							 "already specified.",
1141							 QTYPE2NAME(qtype));
1142					return 0;
1143				}
1144				if (strchr(arg, '/')) {
1145					reiserfs_warning(s, "super-6513",
1146							 "quotafile must be "
1147							 "on filesystem root.");
1148					return 0;
1149				}
1150				qf_names[qtype] = kstrdup(arg, GFP_KERNEL);
1151				if (!qf_names[qtype]) {
1152					reiserfs_warning(s, "reiserfs-2502",
1153							 "not enough memory "
1154							 "for storing "
1155							 "quotafile name.");
1156					return 0;
1157				}
1158				if (qtype == USRQUOTA)
1159					*mount_options |= 1 << REISERFS_USRQUOTA;
1160				else
1161					*mount_options |= 1 << REISERFS_GRPQUOTA;
1162			} else {
1163				if (qf_names[qtype] !=
1164				    REISERFS_SB(s)->s_qf_names[qtype])
1165					kfree(qf_names[qtype]);
1166				qf_names[qtype] = NULL;
1167				if (qtype == USRQUOTA)
1168					*mount_options &= ~(1 << REISERFS_USRQUOTA);
1169				else
1170					*mount_options &= ~(1 << REISERFS_GRPQUOTA);
1171			}
1172		}
1173		if (c == 'f') {
1174			if (!strcmp(arg, "vfsold"))
1175				*qfmt = QFMT_VFS_OLD;
1176			else if (!strcmp(arg, "vfsv0"))
1177				*qfmt = QFMT_VFS_V0;
1178			else {
1179				reiserfs_warning(s, "super-6514",
1180						 "unknown quota format "
1181						 "specified.");
1182				return 0;
1183			}
1184			if (sb_any_quota_loaded(s) &&
1185			    *qfmt != REISERFS_SB(s)->s_jquota_fmt) {
1186				reiserfs_warning(s, "super-6515",
1187						 "cannot change journaled "
1188						 "quota options when quota "
1189						 "turned on.");
1190				return 0;
1191			}
1192		}
1193#else
1194		if (c == 'u' || c == 'g' || c == 'f') {
1195			reiserfs_warning(s, "reiserfs-2503", "journaled "
1196					 "quota options not supported.");
1197			return 0;
1198		}
1199#endif
1200	}
1201
1202#ifdef CONFIG_QUOTA
1203	if (!REISERFS_SB(s)->s_jquota_fmt && !*qfmt
1204	    && (qf_names[USRQUOTA] || qf_names[GRPQUOTA])) {
1205		reiserfs_warning(s, "super-6515",
1206				 "journaled quota format not specified.");
1207		return 0;
1208	}
1209	if ((!(*mount_options & (1 << REISERFS_USRQUOTA)) &&
1210	       sb_has_quota_loaded(s, USRQUOTA)) ||
1211	    (!(*mount_options & (1 << REISERFS_GRPQUOTA)) &&
1212	       sb_has_quota_loaded(s, GRPQUOTA))) {
1213		reiserfs_warning(s, "super-6516", "quota options must "
1214				 "be present when quota is turned on.");
1215		return 0;
1216	}
1217#endif
1218
1219	return 1;
1220}
1221
1222static void switch_data_mode(struct super_block *s, unsigned long mode)
1223{
1224	REISERFS_SB(s)->s_mount_opt &= ~((1 << REISERFS_DATA_LOG) |
1225					 (1 << REISERFS_DATA_ORDERED) |
1226					 (1 << REISERFS_DATA_WRITEBACK));
1227	REISERFS_SB(s)->s_mount_opt |= (1 << mode);
1228}
1229
1230static void handle_data_mode(struct super_block *s, unsigned long mount_options)
1231{
1232	if (mount_options & (1 << REISERFS_DATA_LOG)) {
1233		if (!reiserfs_data_log(s)) {
1234			switch_data_mode(s, REISERFS_DATA_LOG);
1235			reiserfs_info(s, "switching to journaled data mode\n");
1236		}
1237	} else if (mount_options & (1 << REISERFS_DATA_ORDERED)) {
1238		if (!reiserfs_data_ordered(s)) {
1239			switch_data_mode(s, REISERFS_DATA_ORDERED);
1240			reiserfs_info(s, "switching to ordered data mode\n");
1241		}
1242	} else if (mount_options & (1 << REISERFS_DATA_WRITEBACK)) {
1243		if (!reiserfs_data_writeback(s)) {
1244			switch_data_mode(s, REISERFS_DATA_WRITEBACK);
1245			reiserfs_info(s, "switching to writeback data mode\n");
1246		}
1247	}
1248}
1249
1250static void handle_barrier_mode(struct super_block *s, unsigned long bits)
1251{
1252	int flush = (1 << REISERFS_BARRIER_FLUSH);
1253	int none = (1 << REISERFS_BARRIER_NONE);
1254	int all_barrier = flush | none;
1255
1256	if (bits & all_barrier) {
1257		REISERFS_SB(s)->s_mount_opt &= ~all_barrier;
1258		if (bits & flush) {
1259			REISERFS_SB(s)->s_mount_opt |= flush;
1260			printk("reiserfs: enabling write barrier flush mode\n");
1261		} else if (bits & none) {
1262			REISERFS_SB(s)->s_mount_opt |= none;
1263			printk("reiserfs: write barriers turned off\n");
1264		}
1265	}
1266}
1267
1268static void handle_attrs(struct super_block *s)
1269{
1270	struct reiserfs_super_block *rs = SB_DISK_SUPER_BLOCK(s);
1271
1272	if (reiserfs_attrs(s)) {
1273		if (old_format_only(s)) {
1274			reiserfs_warning(s, "super-6517", "cannot support "
1275					 "attributes on 3.5.x disk format");
1276			REISERFS_SB(s)->s_mount_opt &= ~(1 << REISERFS_ATTRS);
1277			return;
1278		}
1279		if (!(le32_to_cpu(rs->s_flags) & reiserfs_attrs_cleared)) {
1280			reiserfs_warning(s, "super-6518", "cannot support "
1281					 "attributes until flag is set in "
1282					 "super-block");
1283			REISERFS_SB(s)->s_mount_opt &= ~(1 << REISERFS_ATTRS);
1284		}
1285	}
1286}
1287
#ifdef CONFIG_QUOTA
/*
 * Install the parsed journaled quota file names and format in the super
 * block info.  A name currently stored there is freed when it is replaced
 * by a different pointer; afterwards the super block info holds the
 * pointers from @qf_names.  The quota format is only overwritten when
 * *@qfmt is non-zero.
 */
static void handle_quota_files(struct super_block *s, char **qf_names,
			       unsigned int *qfmt)
{
	struct reiserfs_sb_info *sbi = REISERFS_SB(s);
	int type;

	for (type = 0; type < MAXQUOTAS; type++) {
		char *old_name = sbi->s_qf_names[type];

		if (old_name != qf_names[type])
			kfree(old_name);
		sbi->s_qf_names[type] = qf_names[type];
	}

	if (*qfmt != 0)
		sbi->s_jquota_fmt = *qfmt;
}
#endif
1303
1304static int reiserfs_remount(struct super_block *s, int *mount_flags, char *arg)
1305{
1306	struct reiserfs_super_block *rs;
1307	struct reiserfs_transaction_handle th;
1308	unsigned long blocks;
1309	unsigned long mount_options = REISERFS_SB(s)->s_mount_opt;
1310	unsigned long safe_mask = 0;
1311	unsigned int commit_max_age = (unsigned int)-1;
1312	struct reiserfs_journal *journal = SB_JOURNAL(s);
1313	char *new_opts = kstrdup(arg, GFP_KERNEL);
1314	int err;
1315	char *qf_names[MAXQUOTAS];
1316	unsigned int qfmt = 0;
1317#ifdef CONFIG_QUOTA
1318	int i;
1319#endif
1320
1321	reiserfs_write_lock(s);
1322
1323#ifdef CONFIG_QUOTA
1324	memcpy(qf_names, REISERFS_SB(s)->s_qf_names, sizeof(qf_names));
1325#endif
1326
1327	rs = SB_DISK_SUPER_BLOCK(s);
1328
1329	if (!reiserfs_parse_options
1330	    (s, arg, &mount_options, &blocks, NULL, &commit_max_age,
1331	    qf_names, &qfmt)) {
1332#ifdef CONFIG_QUOTA
1333		for (i = 0; i < MAXQUOTAS; i++)
1334			if (qf_names[i] != REISERFS_SB(s)->s_qf_names[i])
1335				kfree(qf_names[i]);
1336#endif
1337		err = -EINVAL;
1338		goto out_err_unlock;
1339	}
1340#ifdef CONFIG_QUOTA
1341	handle_quota_files(s, qf_names, &qfmt);
1342#endif
1343
1344	handle_attrs(s);
1345
1346	/* Add options that are safe here */
1347	safe_mask |= 1 << REISERFS_SMALLTAIL;
1348	safe_mask |= 1 << REISERFS_LARGETAIL;
1349	safe_mask |= 1 << REISERFS_NO_BORDER;
1350	safe_mask |= 1 << REISERFS_NO_UNHASHED_RELOCATION;
1351	safe_mask |= 1 << REISERFS_HASHED_RELOCATION;
1352	safe_mask |= 1 << REISERFS_TEST4;
1353	safe_mask |= 1 << REISERFS_ATTRS;
1354	safe_mask |= 1 << REISERFS_XATTRS_USER;
1355	safe_mask |= 1 << REISERFS_POSIXACL;
1356	safe_mask |= 1 << REISERFS_BARRIER_FLUSH;
1357	safe_mask |= 1 << REISERFS_BARRIER_NONE;
1358	safe_mask |= 1 << REISERFS_ERROR_RO;
1359	safe_mask |= 1 << REISERFS_ERROR_CONTINUE;
1360	safe_mask |= 1 << REISERFS_ERROR_PANIC;
1361	safe_mask |= 1 << REISERFS_USRQUOTA;
1362	safe_mask |= 1 << REISERFS_GRPQUOTA;
1363
1364	/* Update the bitmask, taking care to keep
1365	 * the bits we're not allowed to change here */
1366	REISERFS_SB(s)->s_mount_opt =
1367	    (REISERFS_SB(s)->
1368	     s_mount_opt & ~safe_mask) | (mount_options & safe_mask);
1369
1370	if (commit_max_age != 0 && commit_max_age != (unsigned int)-1) {
1371		journal->j_max_commit_age = commit_max_age;
1372		journal->j_max_trans_age = commit_max_age;
1373	} else if (commit_max_age == 0) {
1374		/* 0 means restore defaults. */
1375		journal->j_max_commit_age = journal->j_default_max_commit_age;
1376		journal->j_max_trans_age = JOURNAL_MAX_TRANS_AGE;
1377	}
1378
1379	if (blocks) {
1380		err = reiserfs_resize(s, blocks);
1381		if (err != 0)
1382			goto out_err_unlock;
1383	}
1384
1385	if (*mount_flags & MS_RDONLY) {
1386		reiserfs_write_unlock(s);
1387		reiserfs_xattr_init(s, *mount_flags);
1388		/* remount read-only */
1389		if (s->s_flags & MS_RDONLY)
1390			/* it is read-only already */
1391			goto out_ok_unlocked;
1392
1393		err = dquot_suspend(s, -1);
1394		if (err < 0)
1395			goto out_err;
1396
1397		/* try to remount file system with read-only permissions */
1398		if (sb_umount_state(rs) == REISERFS_VALID_FS
1399		    || REISERFS_SB(s)->s_mount_state != REISERFS_VALID_FS) {
1400			goto out_ok_unlocked;
1401		}
1402
1403		reiserfs_write_lock(s);
1404
1405		err = journal_begin(&th, s, 10);
1406		if (err)
1407			goto out_err_unlock;
1408
1409		/* Mounting a rw partition read-only. */
1410		reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1);
1411		set_sb_umount_state(rs, REISERFS_SB(s)->s_mount_state);
1412		journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB(s));
1413	} else {
1414		/* remount read-write */
1415		if (!(s->s_flags & MS_RDONLY)) {
1416			reiserfs_write_unlock(s);
1417			reiserfs_xattr_init(s, *mount_flags);
1418			goto out_ok_unlocked;	/* We are read-write already */
1419		}
1420
1421		if (reiserfs_is_journal_aborted(journal)) {
1422			err = journal->j_errno;
1423			goto out_err_unlock;
1424		}
1425
1426		handle_data_mode(s, mount_options);
1427		handle_barrier_mode(s, mount_options);
1428		REISERFS_SB(s)->s_mount_state = sb_umount_state(rs);
1429		s->s_flags &= ~MS_RDONLY;	/* now it is safe to call journal_begin */
1430		err = journal_begin(&th, s, 10);
1431		if (err)
1432			goto out_err_unlock;
1433
1434		/* Mount a partition which is read-only, read-write */
1435		reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1);
1436		REISERFS_SB(s)->s_mount_state = sb_umount_state(rs);
1437		s->s_flags &= ~MS_RDONLY;
1438		set_sb_umount_state(rs, REISERFS_ERROR_FS);
1439		if (!old_format_only(s))
1440			set_sb_mnt_count(rs, sb_mnt_count(rs) + 1);
1441		/* mark_buffer_dirty (SB_BUFFER_WITH_SB (s), 1); */
1442		journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB(s));
1443		REISERFS_SB(s)->s_mount_state = REISERFS_VALID_FS;
1444	}
1445	/* this will force a full flush of all journal lists */
1446	SB_JOURNAL(s)->j_must_wait = 1;
1447	err = journal_end(&th, s, 10);
1448	if (err)
1449		goto out_err_unlock;
1450
1451	reiserfs_write_unlock(s);
1452	if (!(*mount_flags & MS_RDONLY)) {
1453		dquot_resume(s, -1);
1454		reiserfs_write_lock(s);
1455		finish_unfinished(s);
1456		reiserfs_write_unlock(s);
1457		reiserfs_xattr_init(s, *mount_flags);
1458	}
1459
1460out_ok_unlocked:
1461	replace_mount_options(s, new_opts);
1462	return 0;
1463
1464out_err_unlock:
1465	reiserfs_write_unlock(s);
1466out_err:
1467	kfree(new_opts);
1468	return err;
1469}
1470
1471static int read_super_block(struct super_block *s, int offset)
1472{
1473	struct buffer_head *bh;
1474	struct reiserfs_super_block *rs;
1475	int fs_blocksize;
1476
1477	bh = sb_bread(s, offset / s->s_blocksize);
1478	if (!bh) {
1479		reiserfs_warning(s, "sh-2006",
1480				 "bread failed (dev %s, block %lu, size %lu)",
1481				 reiserfs_bdevname(s), offset / s->s_blocksize,
1482				 s->s_blocksize);
1483		return 1;
1484	}
1485
1486	rs = (struct reiserfs_super_block *)bh->b_data;
1487	if (!is_any_reiserfs_magic_string(rs)) {
1488		brelse(bh);
1489		return 1;
1490	}
1491	//
1492	// ok, reiserfs signature (old or new) found in at the given offset
1493	//
1494	fs_blocksize = sb_blocksize(rs);
1495	brelse(bh);
1496	sb_set_blocksize(s, fs_blocksize);
1497
1498	bh = sb_bread(s, offset / s->s_blocksize);
1499	if (!bh) {
1500		reiserfs_warning(s, "sh-2007",
1501				 "bread failed (dev %s, block %lu, size %lu)",
1502				 reiserfs_bdevname(s), offset / s->s_blocksize,
1503				 s->s_blocksize);
1504		return 1;
1505	}
1506
1507	rs = (struct reiserfs_super_block *)bh->b_data;
1508	if (sb_blocksize(rs) != s->s_blocksize) {
1509		reiserfs_warning(s, "sh-2011", "can't find a reiserfs "
1510				 "filesystem on (dev %s, block %Lu, size %lu)",
1511				 reiserfs_bdevname(s),
1512				 (unsigned long long)bh->b_blocknr,
1513				 s->s_blocksize);
1514		brelse(bh);
1515		return 1;
1516	}
1517
1518	if (rs->s_v1.s_root_block == cpu_to_le32(-1)) {
1519		brelse(bh);
1520		reiserfs_warning(s, "super-6519", "Unfinished reiserfsck "
1521				 "--rebuild-tree run detected. Please run\n"
1522				 "reiserfsck --rebuild-tree and wait for a "
1523				 "completion. If that fails\n"
1524				 "get newer reiserfsprogs package");
1525		return 1;
1526	}
1527
1528	SB_BUFFER_WITH_SB(s) = bh;
1529	SB_DISK_SUPER_BLOCK(s) = rs;
1530
1531	if (is_reiserfs_jr(rs)) {
1532		/* magic is of non-standard journal filesystem, look at s_version to
1533		   find which format is in use */
1534		if (sb_version(rs) == REISERFS_VERSION_2)
1535			reiserfs_info(s, "found reiserfs format \"3.6\""
1536				      " with non-standard journal\n");
1537		else if (sb_version(rs) == REISERFS_VERSION_1)
1538			reiserfs_info(s, "found reiserfs format \"3.5\""
1539				      " with non-standard journal\n");
1540		else {
1541			reiserfs_warning(s, "sh-2012", "found unknown "
1542					 "format \"%u\" of reiserfs with "
1543					 "non-standard magic", sb_version(rs));
1544			return 1;
1545		}
1546	} else
1547		/* s_version of standard format may contain incorrect information,
1548		   so we just look at the magic string */
1549		reiserfs_info(s,
1550			      "found reiserfs format \"%s\" with standard journal\n",
1551			      is_reiserfs_3_5(rs) ? "3.5" : "3.6");
1552
1553	s->s_op = &reiserfs_sops;
1554	s->s_export_op = &reiserfs_export_ops;
1555#ifdef CONFIG_QUOTA
1556	s->s_qcop = &reiserfs_qctl_operations;
1557	s->dq_op = &reiserfs_quota_operations;
1558#endif
1559
1560	/* new format is limited by the 32 bit wide i_blocks field, want to
1561	 ** be one full block below that.
1562	 */
1563	s->s_maxbytes = (512LL << 32) - s->s_blocksize;
1564	return 0;
1565}
1566
1567/* after journal replay, reread all bitmap and super blocks */
1568static int reread_meta_blocks(struct super_block *s)
1569{
1570	ll_rw_block(READ, 1, &(SB_BUFFER_WITH_SB(s)));
1571	wait_on_buffer(SB_BUFFER_WITH_SB(s));
1572	if (!buffer_uptodate(SB_BUFFER_WITH_SB(s))) {
1573		reiserfs_warning(s, "reiserfs-2504", "error reading the super");
1574		return 1;
1575	}
1576
1577	return 0;
1578}
1579
1580/////////////////////////////////////////////////////
1581// hash detection stuff
1582
1583// if root directory is empty - we set default - Yura's - hash and
1584// warn about it
1585// FIXME: we look for only one name in a directory. If tea and yura
1586// bith have the same value - we ask user to send report to the
1587// mailing list
1588static __u32 find_hash_out(struct super_block *s)
1589{
1590	int retval;
1591	struct inode *inode;
1592	struct cpu_key key;
1593	INITIALIZE_PATH(path);
1594	struct reiserfs_dir_entry de;
1595	__u32 hash = DEFAULT_HASH;
1596
1597	inode = s->s_root->d_inode;
1598
1599	do {			// Some serious "goto"-hater was there ;)
1600		u32 teahash, r5hash, yurahash;
1601
1602		make_cpu_key(&key, inode, ~0, TYPE_DIRENTRY, 3);
1603		retval = search_by_entry_key(s, &key, &path, &de);
1604		if (retval == IO_ERROR) {
1605			pathrelse(&path);
1606			return UNSET_HASH;
1607		}
1608		if (retval == NAME_NOT_FOUND)
1609			de.de_entry_num--;
1610		set_de_name_and_namelen(&de);
1611		if (deh_offset(&(de.de_deh[de.de_entry_num])) == DOT_DOT_OFFSET) {
1612			/* allow override in this case */
1613			if (reiserfs_rupasov_hash(s)) {
1614				hash = YURA_HASH;
1615			}
1616			reiserfs_info(s, "FS seems to be empty, autodetect "
1617					 "is using the default hash\n");
1618			break;
1619		}
1620		r5hash = GET_HASH_VALUE(r5_hash(de.de_name, de.de_namelen));
1621		teahash = GET_HASH_VALUE(keyed_hash(de.de_name, de.de_namelen));
1622		yurahash = GET_HASH_VALUE(yura_hash(de.de_name, de.de_namelen));
1623		if (((teahash == r5hash)
1624		     &&
1625		     (GET_HASH_VALUE(deh_offset(&(de.de_deh[de.de_entry_num])))
1626		      == r5hash)) || ((teahash == yurahash)
1627				      && (yurahash ==
1628					  GET_HASH_VALUE(deh_offset
1629							 (&
1630							  (de.
1631							   de_deh[de.
1632								  de_entry_num])))))
1633		    || ((r5hash == yurahash)
1634			&& (yurahash ==
1635			    GET_HASH_VALUE(deh_offset
1636					   (&(de.de_deh[de.de_entry_num])))))) {
1637			reiserfs_warning(s, "reiserfs-2506", "Unable to "
1638					 "automatically detect hash function. "
1639					 "Please mount with -o "
1640					 "hash={tea,rupasov,r5}");
1641			hash = UNSET_HASH;
1642			break;
1643		}
1644		if (GET_HASH_VALUE(deh_offset(&(de.de_deh[de.de_entry_num]))) ==
1645		    yurahash)
1646			hash = YURA_HASH;
1647		else if (GET_HASH_VALUE
1648			 (deh_offset(&(de.de_deh[de.de_entry_num]))) == teahash)
1649			hash = TEA_HASH;
1650		else if (GET_HASH_VALUE
1651			 (deh_offset(&(de.de_deh[de.de_entry_num]))) == r5hash)
1652			hash = R5_HASH;
1653		else {
1654			reiserfs_warning(s, "reiserfs-2506",
1655					 "Unrecognised hash function");
1656			hash = UNSET_HASH;
1657		}
1658	} while (0);
1659
1660	pathrelse(&path);
1661	return hash;
1662}
1663
1664// finds out which hash names are sorted with
1665static int what_hash(struct super_block *s)
1666{
1667	__u32 code;
1668
1669	code = sb_hash_function_code(SB_DISK_SUPER_BLOCK(s));
1670
1671	/* reiserfs_hash_detect() == true if any of the hash mount options
1672	 ** were used.  We must check them to make sure the user isn't
1673	 ** using a bad hash value
1674	 */
1675	if (code == UNSET_HASH || reiserfs_hash_detect(s))
1676		code = find_hash_out(s);
1677
1678	if (code != UNSET_HASH && reiserfs_hash_detect(s)) {
1679		/* detection has found the hash, and we must check against the
1680		 ** mount options
1681		 */
1682		if (reiserfs_rupasov_hash(s) && code != YURA_HASH) {
1683			reiserfs_warning(s, "reiserfs-2507",
1684					 "Error, %s hash detected, "
1685					 "unable to force rupasov hash",
1686					 reiserfs_hashname(code));
1687			code = UNSET_HASH;
1688		} else if (reiserfs_tea_hash(s) && code != TEA_HASH) {
1689			reiserfs_warning(s, "reiserfs-2508",
1690					 "Error, %s hash detected, "
1691					 "unable to force tea hash",
1692					 reiserfs_hashname(code));
1693			code = UNSET_HASH;
1694		} else if (reiserfs_r5_hash(s) && code != R5_HASH) {
1695			reiserfs_warning(s, "reiserfs-2509",
1696					 "Error, %s hash detected, "
1697					 "unable to force r5 hash",
1698					 reiserfs_hashname(code));
1699			code = UNSET_HASH;
1700		}
1701	} else {
1702		/* find_hash_out was not called or could not determine the hash */
1703		if (reiserfs_rupasov_hash(s)) {
1704			code = YURA_HASH;
1705		} else if (reiserfs_tea_hash(s)) {
1706			code = TEA_HASH;
1707		} else if (reiserfs_r5_hash(s)) {
1708			code = R5_HASH;
1709		}
1710	}
1711
1712	/* if we are mounted RW, and we have a new valid hash code, update
1713	 ** the super
1714	 */
1715	if (code != UNSET_HASH &&
1716	    !(s->s_flags & MS_RDONLY) &&
1717	    code != sb_hash_function_code(SB_DISK_SUPER_BLOCK(s))) {
1718		set_sb_hash_function_code(SB_DISK_SUPER_BLOCK(s), code);
1719	}
1720	return code;
1721}
1722
1723// return pointer to appropriate function
1724static hashf_t hash_function(struct super_block *s)
1725{
1726	switch (what_hash(s)) {
1727	case TEA_HASH:
1728		reiserfs_info(s, "Using tea hash to sort names\n");
1729		return keyed_hash;
1730	case YURA_HASH:
1731		reiserfs_info(s, "Using rupasov hash to sort names\n");
1732		return yura_hash;
1733	case R5_HASH:
1734		reiserfs_info(s, "Using r5 hash to sort names\n");
1735		return r5_hash;
1736	}
1737	return NULL;
1738}
1739
1740// this is used to set up correct value for old partitions
1741static int function2code(hashf_t func)
1742{
1743	if (func == keyed_hash)
1744		return TEA_HASH;
1745	if (func == yura_hash)
1746		return YURA_HASH;
1747	if (func == r5_hash)
1748		return R5_HASH;
1749
1750	BUG();			// should never happen
1751
1752	return 0;
1753}
1754
/*
 * Issue reiserfs_warning(s, id, ...) unless @silent is non-zero.
 *
 * Wrapped in do { } while (0) so the macro expands to exactly one statement:
 * with a bare "if" inside, an "else" following "if (x) SWARN(...);" would
 * attach to the macro's hidden "if" instead of the caller's.
 */
#define SWARN(silent, s, id, ...)				\
	do {							\
		if (!(silent))					\
			reiserfs_warning(s, id, __VA_ARGS__);	\
	} while (0)
1758
1759static int reiserfs_fill_super(struct super_block *s, void *data, int silent)
1760{
1761	struct inode *root_inode;
1762	struct reiserfs_transaction_handle th;
1763	int old_format = 0;
1764	unsigned long blocks;
1765	unsigned int commit_max_age = 0;
1766	int jinit_done = 0;
1767	struct reiserfs_iget_args args;
1768	struct reiserfs_super_block *rs;
1769	char *jdev_name;
1770	struct reiserfs_sb_info *sbi;
1771	int errval = -EINVAL;
1772	char *qf_names[MAXQUOTAS] = {};
1773	unsigned int qfmt = 0;
1774
1775	save_mount_options(s, data);
1776
1777	sbi = kzalloc(sizeof(struct reiserfs_sb_info), GFP_KERNEL);
1778	if (!sbi)
1779		return -ENOMEM;
1780	s->s_fs_info = sbi;
1781	/* Set default values for options: non-aggressive tails, RO on errors */
1782	sbi->s_mount_opt |= (1 << REISERFS_SMALLTAIL);
1783	sbi->s_mount_opt |= (1 << REISERFS_ERROR_RO);
1784	sbi->s_mount_opt |= (1 << REISERFS_BARRIER_FLUSH);
1785	/* no preallocation minimum, be smart in
1786	   reiserfs_file_write instead */
1787	sbi->s_alloc_options.preallocmin = 0;
1788	/* Preallocate by 16 blocks (17-1) at once */
1789	sbi->s_alloc_options.preallocsize = 17;
1790	/* setup default block allocator options */
1791	reiserfs_init_alloc_options(s);
1792
1793	spin_lock_init(&sbi->old_work_lock);
1794	INIT_DELAYED_WORK(&sbi->old_work, flush_old_commits);
1795	mutex_init(&sbi->lock);
1796	sbi->lock_depth = -1;
1797
1798	jdev_name = NULL;
1799	if (reiserfs_parse_options
1800	    (s, (char *)data, &(sbi->s_mount_opt), &blocks, &jdev_name,
1801	     &commit_max_age, qf_names, &qfmt) == 0) {
1802		goto error_unlocked;
1803	}
1804	if (jdev_name && jdev_name[0]) {
1805		sbi->s_jdev = kstrdup(jdev_name, GFP_KERNEL);
1806		if (!sbi->s_jdev) {
1807			SWARN(silent, s, "", "Cannot allocate memory for "
1808				"journal device name");
1809			goto error;
1810		}
1811	}
1812#ifdef CONFIG_QUOTA
1813	handle_quota_files(s, qf_names, &qfmt);
1814#endif
1815
1816	if (blocks) {
1817		SWARN(silent, s, "jmacd-7", "resize option for remount only");
1818		goto error_unlocked;
1819	}
1820
1821	/* try old format (undistributed bitmap, super block in 8-th 1k block of a device) */
1822	if (!read_super_block(s, REISERFS_OLD_DISK_OFFSET_IN_BYTES))
1823		old_format = 1;
1824	/* try new format (64-th 1k block), which can contain reiserfs super block */
1825	else if (read_super_block(s, REISERFS_DISK_OFFSET_IN_BYTES)) {
1826		SWARN(silent, s, "sh-2021", "can not find reiserfs on %s",
1827		      reiserfs_bdevname(s));
1828		goto error_unlocked;
1829	}
1830
1831	rs = SB_DISK_SUPER_BLOCK(s);
1832	/* Let's do basic sanity check to verify that underlying device is not
1833	   smaller than the filesystem. If the check fails then abort and scream,
1834	   because bad stuff will happen otherwise. */
1835	if (s->s_bdev && s->s_bdev->bd_inode
1836	    && i_size_read(s->s_bdev->bd_inode) <
1837	    sb_block_count(rs) * sb_blocksize(rs)) {
1838		SWARN(silent, s, "", "Filesystem cannot be "
1839		      "mounted because it is bigger than the device");
1840		SWARN(silent, s, "", "You may need to run fsck "
1841		      "or increase size of your LVM partition");
1842		SWARN(silent, s, "", "Or may be you forgot to "
1843		      "reboot after fdisk when it told you to");
1844		goto error_unlocked;
1845	}
1846
1847	sbi->s_mount_state = SB_REISERFS_STATE(s);
1848	sbi->s_mount_state = REISERFS_VALID_FS;
1849
1850	if ((errval = reiserfs_init_bitmap_cache(s))) {
1851		SWARN(silent, s, "jmacd-8", "unable to read bitmap");
1852		goto error_unlocked;
1853	}
1854
1855	errval = -EINVAL;
1856#ifdef CONFIG_REISERFS_CHECK
1857	SWARN(silent, s, "", "CONFIG_REISERFS_CHECK is set ON");
1858	SWARN(silent, s, "", "- it is slow mode for debugging.");
1859#endif
1860
1861	/* make data=ordered the default */
1862	if (!reiserfs_data_log(s) && !reiserfs_data_ordered(s) &&
1863	    !reiserfs_data_writeback(s)) {
1864		sbi->s_mount_opt |= (1 << REISERFS_DATA_ORDERED);
1865	}
1866
1867	if (reiserfs_data_log(s)) {
1868		reiserfs_info(s, "using journaled data mode\n");
1869	} else if (reiserfs_data_ordered(s)) {
1870		reiserfs_info(s, "using ordered data mode\n");
1871	} else {
1872		reiserfs_info(s, "using writeback data mode\n");
1873	}
1874	if (reiserfs_barrier_flush(s)) {
1875		printk("reiserfs: using flush barriers\n");
1876	}
1877
1878	// set_device_ro(s->s_dev, 1) ;
1879	if (journal_init(s, jdev_name, old_format, commit_max_age)) {
1880		SWARN(silent, s, "sh-2022",
1881		      "unable to initialize journal space");
1882		goto error_unlocked;
1883	} else {
1884		jinit_done = 1;	/* once this is set, journal_release must be called
1885				 ** if we error out of the mount
1886				 */
1887	}
1888
1889	if (reread_meta_blocks(s)) {
1890		SWARN(silent, s, "jmacd-9",
1891		      "unable to reread meta blocks after journal init");
1892		goto error_unlocked;
1893	}
1894
1895	if (replay_only(s))
1896		goto error_unlocked;
1897
1898	if (bdev_read_only(s->s_bdev) && !(s->s_flags & MS_RDONLY)) {
1899		SWARN(silent, s, "clm-7000",
1900		      "Detected readonly device, marking FS readonly");
1901		s->s_flags |= MS_RDONLY;
1902	}
1903	args.objectid = REISERFS_ROOT_OBJECTID;
1904	args.dirid = REISERFS_ROOT_PARENT_OBJECTID;
1905	root_inode =
1906	    iget5_locked(s, REISERFS_ROOT_OBJECTID, reiserfs_find_actor,
1907			 reiserfs_init_locked_inode, (void *)(&args));
1908	if (!root_inode) {
1909		SWARN(silent, s, "jmacd-10", "get root inode failed");
1910		goto error_unlocked;
1911	}
1912
1913	/*
1914	 * This path assumed to be called with the BKL in the old times.
1915	 * Now we have inherited the big reiserfs lock from it and many
1916	 * reiserfs helpers called in the mount path and elsewhere require
1917	 * this lock to be held even if it's not always necessary. Let's be
1918	 * conservative and hold it early. The window can be reduced after
1919	 * careful review of the code.
1920	 */
1921	reiserfs_write_lock(s);
1922
1923	if (root_inode->i_state & I_NEW) {
1924		reiserfs_read_locked_inode(root_inode, &args);
1925		unlock_new_inode(root_inode);
1926	}
1927
1928	s->s_root = d_make_root(root_inode);
1929	if (!s->s_root)
1930		goto error;
1931	// define and initialize hash function
1932	sbi->s_hash_function = hash_function(s);
1933	if (sbi->s_hash_function == NULL) {
1934		dput(s->s_root);
1935		s->s_root = NULL;
1936		goto error;
1937	}
1938
1939	if (is_reiserfs_3_5(rs)
1940	    || (is_reiserfs_jr(rs) && SB_VERSION(s) == REISERFS_VERSION_1))
1941		set_bit(REISERFS_3_5, &(sbi->s_properties));
1942	else if (old_format)
1943		set_bit(REISERFS_OLD_FORMAT, &(sbi->s_properties));
1944	else
1945		set_bit(REISERFS_3_6, &(sbi->s_properties));
1946
1947	if (!(s->s_flags & MS_RDONLY)) {
1948
1949		errval = journal_begin(&th, s, 1);
1950		if (errval) {
1951			dput(s->s_root);
1952			s->s_root = NULL;
1953			goto error;
1954		}
1955		reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1);
1956
1957		set_sb_umount_state(rs, REISERFS_ERROR_FS);
1958		set_sb_fs_state(rs, 0);
1959
1960		/* Clear out s_bmap_nr if it would wrap. We can handle this
1961		 * case, but older revisions can't. This will cause the
1962		 * file system to fail mount on those older implementations,
1963		 * avoiding corruption. -jeffm */
1964		if (bmap_would_wrap(reiserfs_bmap_count(s)) &&
1965		    sb_bmap_nr(rs) != 0) {
1966			reiserfs_warning(s, "super-2030", "This file system "
1967					"claims to use %u bitmap blocks in "
1968					"its super block, but requires %u. "
1969					"Clearing to zero.", sb_bmap_nr(rs),
1970					reiserfs_bmap_count(s));
1971
1972			set_sb_bmap_nr(rs, 0);
1973		}
1974
1975		if (old_format_only(s)) {
1976			/* filesystem of format 3.5 either with standard or non-standard
1977			   journal */
1978			if (convert_reiserfs(s)) {
1979				/* and -o conv is given */
1980				if (!silent)
1981					reiserfs_info(s,
1982						      "converting 3.5 filesystem to the 3.6 format");
1983
1984				if (is_reiserfs_3_5(rs))
1985					/* put magic string of 3.6 format. 2.2 will not be able to
1986					   mount this filesystem anymore */
1987					memcpy(rs->s_v1.s_magic,
1988					       reiserfs_3_6_magic_string,
1989					       sizeof
1990					       (reiserfs_3_6_magic_string));
1991
1992				set_sb_version(rs, REISERFS_VERSION_2);
1993				reiserfs_convert_objectid_map_v1(s);
1994				set_bit(REISERFS_3_6, &(sbi->s_properties));
1995				clear_bit(REISERFS_3_5, &(sbi->s_properties));
1996			} else if (!silent) {
1997				reiserfs_info(s, "using 3.5.x disk format\n");
1998			}
1999		} else
2000			set_sb_mnt_count(rs, sb_mnt_count(rs) + 1);
2001
2002
2003		journal_mark_dirty(&th, s, SB_BUFFER_WITH_SB(s));
2004		errval = journal_end(&th, s, 1);
2005		if (errval) {
2006			dput(s->s_root);
2007			s->s_root = NULL;
2008			goto error;
2009		}
2010
2011		reiserfs_write_unlock(s);
2012		if ((errval = reiserfs_lookup_privroot(s)) ||
2013		    (errval = reiserfs_xattr_init(s, s->s_flags))) {
2014			dput(s->s_root);
2015			s->s_root = NULL;
2016			goto error_unlocked;
2017		}
2018		reiserfs_write_lock(s);
2019
2020		/* look for files which were to be removed in previous session */
2021		finish_unfinished(s);
2022	} else {
2023		if (old_format_only(s) && !silent) {
2024			reiserfs_info(s, "using 3.5.x disk format\n");
2025		}
2026
2027		reiserfs_write_unlock(s);
2028		if ((errval = reiserfs_lookup_privroot(s)) ||
2029		    (errval = reiserfs_xattr_init(s, s->s_flags))) {
2030			dput(s->s_root);
2031			s->s_root = NULL;
2032			goto error_unlocked;
2033		}
2034		reiserfs_write_lock(s);
2035	}
2036	// mark hash in super block: it could be unset. overwrite should be ok
2037	set_sb_hash_function_code(rs, function2code(sbi->s_hash_function));
2038
2039	handle_attrs(s);
2040
2041	reiserfs_proc_info_init(s);
2042
2043	init_waitqueue_head(&(sbi->s_wait));
2044	spin_lock_init(&sbi->bitmap_lock);
2045
2046	reiserfs_write_unlock(s);
2047
2048	return (0);
2049
2050error:
2051	reiserfs_write_unlock(s);
2052
2053error_unlocked:
2054	/* kill the commit thread, free journal ram */
2055	if (jinit_done) {
2056		reiserfs_write_lock(s);
2057		journal_release_error(NULL, s);
2058		reiserfs_write_unlock(s);
2059	}
2060
2061	cancel_delayed_work_sync(&REISERFS_SB(s)->old_work);
2062
2063	reiserfs_free_bitmap_cache(s);
2064	if (SB_BUFFER_WITH_SB(s))
2065		brelse(SB_BUFFER_WITH_SB(s));
2066#ifdef CONFIG_QUOTA
2067	{
2068		int j;
2069		for (j = 0; j < MAXQUOTAS; j++)
2070			kfree(qf_names[j]);
2071	}
2072#endif
2073	kfree(sbi);
2074
2075	s->s_fs_info = NULL;
2076	return errval;
2077}
2078
2079static int reiserfs_statfs(struct dentry *dentry, struct kstatfs *buf)
2080{
2081	struct reiserfs_super_block *rs = SB_DISK_SUPER_BLOCK(dentry->d_sb);
2082
2083	buf->f_namelen = (REISERFS_MAX_NAME(s->s_blocksize));
2084	buf->f_bfree = sb_free_blocks(rs);
2085	buf->f_bavail = buf->f_bfree;
2086	buf->f_blocks = sb_block_count(rs) - sb_bmap_nr(rs) - 1;
2087	buf->f_bsize = dentry->d_sb->s_blocksize;
2088	/* changed to accommodate gcc folks. */
2089	buf->f_type = REISERFS_SUPER_MAGIC;
2090	buf->f_fsid.val[0] = (u32)crc32_le(0, rs->s_uuid, sizeof(rs->s_uuid)/2);
2091	buf->f_fsid.val[1] = (u32)crc32_le(0, rs->s_uuid + sizeof(rs->s_uuid)/2,
2092				sizeof(rs->s_uuid)/2);
2093
2094	return 0;
2095}
2096
2097#ifdef CONFIG_QUOTA
2098static int reiserfs_write_dquot(struct dquot *dquot)
2099{
2100	struct reiserfs_transaction_handle th;
2101	int ret, err;
2102
2103	reiserfs_write_lock(dquot->dq_sb);
2104	ret =
2105	    journal_begin(&th, dquot->dq_sb,
2106			  REISERFS_QUOTA_TRANS_BLOCKS(dquot->dq_sb));
2107	if (ret)
2108		goto out;
2109	reiserfs_write_unlock(dquot->dq_sb);
2110	ret = dquot_commit(dquot);
2111	reiserfs_write_lock(dquot->dq_sb);
2112	err =
2113	    journal_end(&th, dquot->dq_sb,
2114			REISERFS_QUOTA_TRANS_BLOCKS(dquot->dq_sb));
2115	if (!ret && err)
2116		ret = err;
2117out:
2118	reiserfs_write_unlock(dquot->dq_sb);
2119	return ret;
2120}
2121
2122static int reiserfs_acquire_dquot(struct dquot *dquot)
2123{
2124	struct reiserfs_transaction_handle th;
2125	int ret, err;
2126
2127	reiserfs_write_lock(dquot->dq_sb);
2128	ret =
2129	    journal_begin(&th, dquot->dq_sb,
2130			  REISERFS_QUOTA_INIT_BLOCKS(dquot->dq_sb));
2131	if (ret)
2132		goto out;
2133	reiserfs_write_unlock(dquot->dq_sb);
2134	ret = dquot_acquire(dquot);
2135	reiserfs_write_lock(dquot->dq_sb);
2136	err =
2137	    journal_end(&th, dquot->dq_sb,
2138			REISERFS_QUOTA_INIT_BLOCKS(dquot->dq_sb));
2139	if (!ret && err)
2140		ret = err;
2141out:
2142	reiserfs_write_unlock(dquot->dq_sb);
2143	return ret;
2144}
2145
2146static int reiserfs_release_dquot(struct dquot *dquot)
2147{
2148	struct reiserfs_transaction_handle th;
2149	int ret, err;
2150
2151	reiserfs_write_lock(dquot->dq_sb);
2152	ret =
2153	    journal_begin(&th, dquot->dq_sb,
2154			  REISERFS_QUOTA_DEL_BLOCKS(dquot->dq_sb));
2155	reiserfs_write_unlock(dquot->dq_sb);
2156	if (ret) {
2157		/* Release dquot anyway to avoid endless cycle in dqput() */
2158		dquot_release(dquot);
2159		goto out;
2160	}
2161	ret = dquot_release(dquot);
2162	reiserfs_write_lock(dquot->dq_sb);
2163	err =
2164	    journal_end(&th, dquot->dq_sb,
2165			REISERFS_QUOTA_DEL_BLOCKS(dquot->dq_sb));
2166	if (!ret && err)
2167		ret = err;
2168	reiserfs_write_unlock(dquot->dq_sb);
2169out:
2170	return ret;
2171}
2172
2173static int reiserfs_mark_dquot_dirty(struct dquot *dquot)
2174{
2175	/* Are we journaling quotas? */
2176	if (REISERFS_SB(dquot->dq_sb)->s_qf_names[USRQUOTA] ||
2177	    REISERFS_SB(dquot->dq_sb)->s_qf_names[GRPQUOTA]) {
2178		dquot_mark_dquot_dirty(dquot);
2179		return reiserfs_write_dquot(dquot);
2180	} else
2181		return dquot_mark_dquot_dirty(dquot);
2182}
2183
2184static int reiserfs_write_info(struct super_block *sb, int type)
2185{
2186	struct reiserfs_transaction_handle th;
2187	int ret, err;
2188
2189	/* Data block + inode block */
2190	reiserfs_write_lock(sb);
2191	ret = journal_begin(&th, sb, 2);
2192	if (ret)
2193		goto out;
2194	reiserfs_write_unlock(sb);
2195	ret = dquot_commit_info(sb, type);
2196	reiserfs_write_lock(sb);
2197	err = journal_end(&th, sb, 2);
2198	if (!ret && err)
2199		ret = err;
2200out:
2201	reiserfs_write_unlock(sb);
2202	return ret;
2203}
2204
2205/*
2206 * Turn on quotas during mount time - we need to find the quota file and such...
2207 */
2208static int reiserfs_quota_on_mount(struct super_block *sb, int type)
2209{
2210	return dquot_quota_on_mount(sb, REISERFS_SB(sb)->s_qf_names[type],
2211					REISERFS_SB(sb)->s_jquota_fmt, type);
2212}
2213
2214/*
2215 * Standard function to be called on quota_on
2216 */
2217static int reiserfs_quota_on(struct super_block *sb, int type, int format_id,
2218			     struct path *path)
2219{
2220	int err;
2221	struct inode *inode;
2222	struct reiserfs_transaction_handle th;
2223	int opt = type == USRQUOTA ? REISERFS_USRQUOTA : REISERFS_GRPQUOTA;
2224
2225	reiserfs_write_lock(sb);
2226	if (!(REISERFS_SB(sb)->s_mount_opt & (1 << opt))) {
2227		err = -EINVAL;
2228		goto out;
2229	}
2230
2231	/* Quotafile not on the same filesystem? */
2232	if (path->dentry->d_sb != sb) {
2233		err = -EXDEV;
2234		goto out;
2235	}
2236	inode = path->dentry->d_inode;
2237	/* We must not pack tails for quota files on reiserfs for quota IO to work */
2238	if (!(REISERFS_I(inode)->i_flags & i_nopack_mask)) {
2239		err = reiserfs_unpack(inode, NULL);
2240		if (err) {
2241			reiserfs_warning(sb, "super-6520",
2242				"Unpacking tail of quota file failed"
2243				" (%d). Cannot turn on quotas.", err);
2244			err = -EINVAL;
2245			goto out;
2246		}
2247		mark_inode_dirty(inode);
2248	}
2249	/* Journaling quota? */
2250	if (REISERFS_SB(sb)->s_qf_names[type]) {
2251		/* Quotafile not of fs root? */
2252		if (path->dentry->d_parent != sb->s_root)
2253			reiserfs_warning(sb, "super-6521",
2254				 "Quota file not on filesystem root. "
2255				 "Journalled quota will not work.");
2256	}
2257
2258	/*
2259	 * When we journal data on quota file, we have to flush journal to see
2260	 * all updates to the file when we bypass pagecache...
2261	 */
2262	if (reiserfs_file_data_log(inode)) {
2263		/* Just start temporary transaction and finish it */
2264		err = journal_begin(&th, sb, 1);
2265		if (err)
2266			goto out;
2267		err = journal_end_sync(&th, sb, 1);
2268		if (err)
2269			goto out;
2270	}
2271	reiserfs_write_unlock(sb);
2272	return dquot_quota_on(sb, type, format_id, path);
2273out:
2274	reiserfs_write_unlock(sb);
2275	return err;
2276}
2277
2278/* Read data from quotafile - avoid pagecache and such because we cannot afford
2279 * acquiring the locks... As quota files are never truncated and quota code
2280 * itself serializes the operations (and no one else should touch the files)
2281 * we don't have to be afraid of races */
2282static ssize_t reiserfs_quota_read(struct super_block *sb, int type, char *data,
2283				   size_t len, loff_t off)
2284{
2285	struct inode *inode = sb_dqopt(sb)->files[type];
2286	unsigned long blk = off >> sb->s_blocksize_bits;
2287	int err = 0, offset = off & (sb->s_blocksize - 1), tocopy;
2288	size_t toread;
2289	struct buffer_head tmp_bh, *bh;
2290	loff_t i_size = i_size_read(inode);
2291
2292	if (off > i_size)
2293		return 0;
2294	if (off + len > i_size)
2295		len = i_size - off;
2296	toread = len;
2297	while (toread > 0) {
2298		tocopy =
2299		    sb->s_blocksize - offset <
2300		    toread ? sb->s_blocksize - offset : toread;
2301		tmp_bh.b_state = 0;
2302		/* Quota files are without tails so we can safely use this function */
2303		reiserfs_write_lock(sb);
2304		err = reiserfs_get_block(inode, blk, &tmp_bh, 0);
2305		reiserfs_write_unlock(sb);
2306		if (err)
2307			return err;
2308		if (!buffer_mapped(&tmp_bh))	/* A hole? */
2309			memset(data, 0, tocopy);
2310		else {
2311			bh = sb_bread(sb, tmp_bh.b_blocknr);
2312			if (!bh)
2313				return -EIO;
2314			memcpy(data, bh->b_data + offset, tocopy);
2315			brelse(bh);
2316		}
2317		offset = 0;
2318		toread -= tocopy;
2319		data += tocopy;
2320		blk++;
2321	}
2322	return len;
2323}
2324
2325/* Write to quotafile (we know the transaction is already started and has
2326 * enough credits) */
2327static ssize_t reiserfs_quota_write(struct super_block *sb, int type,
2328				    const char *data, size_t len, loff_t off)
2329{
2330	struct inode *inode = sb_dqopt(sb)->files[type];
2331	unsigned long blk = off >> sb->s_blocksize_bits;
2332	int err = 0, offset = off & (sb->s_blocksize - 1), tocopy;
2333	int journal_quota = REISERFS_SB(sb)->s_qf_names[type] != NULL;
2334	size_t towrite = len;
2335	struct buffer_head tmp_bh, *bh;
2336
2337	if (!current->journal_info) {
2338		printk(KERN_WARNING "reiserfs: Quota write (off=%Lu, len=%Lu)"
2339			" cancelled because transaction is not started.\n",
2340			(unsigned long long)off, (unsigned long long)len);
2341		return -EIO;
2342	}
2343	while (towrite > 0) {
2344		tocopy = sb->s_blocksize - offset < towrite ?
2345		    sb->s_blocksize - offset : towrite;
2346		tmp_bh.b_state = 0;
2347		reiserfs_write_lock(sb);
2348		err = reiserfs_get_block(inode, blk, &tmp_bh, GET_BLOCK_CREATE);
2349		reiserfs_write_unlock(sb);
2350		if (err)
2351			goto out;
2352		if (offset || tocopy != sb->s_blocksize)
2353			bh = sb_bread(sb, tmp_bh.b_blocknr);
2354		else
2355			bh = sb_getblk(sb, tmp_bh.b_blocknr);
2356		if (!bh) {
2357			err = -EIO;
2358			goto out;
2359		}
2360		lock_buffer(bh);
2361		memcpy(bh->b_data + offset, data, tocopy);
2362		flush_dcache_page(bh->b_page);
2363		set_buffer_uptodate(bh);
2364		unlock_buffer(bh);
2365		reiserfs_write_lock(sb);
2366		reiserfs_prepare_for_journal(sb, bh, 1);
2367		journal_mark_dirty(current->journal_info, sb, bh);
2368		if (!journal_quota)
2369			reiserfs_add_ordered_list(inode, bh);
2370		reiserfs_write_unlock(sb);
2371		brelse(bh);
2372		offset = 0;
2373		towrite -= tocopy;
2374		data += tocopy;
2375		blk++;
2376	}
2377out:
2378	if (len == towrite)
2379		return err;
2380	if (inode->i_size < off + len - towrite)
2381		i_size_write(inode, off + len - towrite);
2382	inode->i_version++;
2383	inode->i_mtime = inode->i_ctime = CURRENT_TIME;
2384	mark_inode_dirty(inode);
2385	return len - towrite;
2386}
2387
2388#endif
2389
/*
 * Mount callback referenced by reiserfs_fs_type.mount.  Forwards all of its
 * arguments to mount_bdev(), passing reiserfs_fill_super as the callback,
 * and returns whatever mount_bdev() returns.
 */
static struct dentry *get_super_block(struct file_system_type *fs_type,
			   int flags, const char *dev_name,
			   void *data)
{
	return mount_bdev(fs_type, flags, dev_name, data, reiserfs_fill_super);
}
2396
2397static int __init init_reiserfs_fs(void)
2398{
2399	int ret;
2400
2401	if ((ret = init_inodecache())) {
2402		return ret;
2403	}
2404
2405	reiserfs_proc_info_global_init();
2406
2407	ret = register_filesystem(&reiserfs_fs_type);
2408
2409	if (ret == 0) {
2410		return 0;
2411	}
2412
2413	reiserfs_proc_info_global_done();
2414	destroy_inodecache();
2415
2416	return ret;
2417}
2418
/*
 * Module exit hook: undoes what init_reiserfs_fs() set up -- the global
 * proc info, the registration of reiserfs_fs_type and the inode cache.
 */
static void __exit exit_reiserfs_fs(void)
{
	reiserfs_proc_info_global_done();
	unregister_filesystem(&reiserfs_fs_type);
	destroy_inodecache();
}
2425
/*
 * Filesystem type descriptor for reiserfs.  It is passed to
 * register_filesystem() in init_reiserfs_fs() and to
 * unregister_filesystem() in exit_reiserfs_fs().
 */
struct file_system_type reiserfs_fs_type = {
	.owner = THIS_MODULE,
	.name = "reiserfs",
	/* get_super_block() mounts through mount_bdev() */
	.mount = get_super_block,
	.kill_sb = reiserfs_kill_sb,
	.fs_flags = FS_REQUIRES_DEV,
};
/* Module alias, description, author and license declarations. */
MODULE_ALIAS_FS("reiserfs");

MODULE_DESCRIPTION("ReiserFS journaled filesystem");
MODULE_AUTHOR("Hans Reiser <reiser@namesys.com>");
MODULE_LICENSE("GPL");

/* Hook the init and exit functions defined above into the module. */
module_init(init_reiserfs_fs);
module_exit(exit_reiserfs_fs);
2441