zram: fix unbalanced idr management at hot removal
[linux/fpc-iii.git] / fs / reiserfs / super.c
blob0a6ad4e71e88dd0c2a7a3b3c4eaaa1671ba6dcad
1 /*
2 * Copyright 2000 by Hans Reiser, licensing governed by reiserfs/README
4 * Trivial changes by Alan Cox to add the LFS fixes
6 * Trivial Changes:
7 * Rights granted to Hans Reiser to redistribute under other terms providing
8 * he accepts all liability including but not limited to patent, fitness
9 * for purpose, and direct or indirect claims arising from failure to perform.
11 * NO WARRANTY
14 #include <linux/module.h>
15 #include <linux/slab.h>
16 #include <linux/vmalloc.h>
17 #include <linux/time.h>
18 #include <linux/uaccess.h>
19 #include "reiserfs.h"
20 #include "acl.h"
21 #include "xattr.h"
22 #include <linux/init.h>
23 #include <linux/blkdev.h>
24 #include <linux/backing-dev.h>
25 #include <linux/buffer_head.h>
26 #include <linux/exportfs.h>
27 #include <linux/quotaops.h>
28 #include <linux/vfs.h>
29 #include <linux/mount.h>
30 #include <linux/namei.h>
31 #include <linux/crc32.h>
32 #include <linux/seq_file.h>
34 struct file_system_type reiserfs_fs_type;
36 static const char reiserfs_3_5_magic_string[] = REISERFS_SUPER_MAGIC_STRING;
37 static const char reiserfs_3_6_magic_string[] = REISER2FS_SUPER_MAGIC_STRING;
38 static const char reiserfs_jr_magic_string[] = REISER2FS_JR_SUPER_MAGIC_STRING;
40 int is_reiserfs_3_5(struct reiserfs_super_block *rs)
42 return !strncmp(rs->s_v1.s_magic, reiserfs_3_5_magic_string,
43 strlen(reiserfs_3_5_magic_string));
46 int is_reiserfs_3_6(struct reiserfs_super_block *rs)
48 return !strncmp(rs->s_v1.s_magic, reiserfs_3_6_magic_string,
49 strlen(reiserfs_3_6_magic_string));
52 int is_reiserfs_jr(struct reiserfs_super_block *rs)
54 return !strncmp(rs->s_v1.s_magic, reiserfs_jr_magic_string,
55 strlen(reiserfs_jr_magic_string));
/* Return 1 if @rs carries any of the three known magic strings, else 0. */
static int is_any_reiserfs_magic_string(struct reiserfs_super_block *rs)
{
	if (is_reiserfs_3_5(rs))
		return 1;
	if (is_reiserfs_3_6(rs))
		return 1;
	return is_reiserfs_jr(rs) != 0;
}
64 static int reiserfs_remount(struct super_block *s, int *flags, char *data);
65 static int reiserfs_statfs(struct dentry *dentry, struct kstatfs *buf);
67 static int reiserfs_sync_fs(struct super_block *s, int wait)
69 struct reiserfs_transaction_handle th;
72 * Writeback quota in non-journalled quota case - journalled quota has
73 * no dirty dquots
75 dquot_writeback_dquots(s, -1);
76 reiserfs_write_lock(s);
77 if (!journal_begin(&th, s, 1))
78 if (!journal_end_sync(&th))
79 reiserfs_flush_old_commits(s);
80 reiserfs_write_unlock(s);
81 return 0;
84 static void flush_old_commits(struct work_struct *work)
86 struct reiserfs_sb_info *sbi;
87 struct super_block *s;
89 sbi = container_of(work, struct reiserfs_sb_info, old_work.work);
90 s = sbi->s_journal->j_work_sb;
92 spin_lock(&sbi->old_work_lock);
93 sbi->work_queued = 0;
94 spin_unlock(&sbi->old_work_lock);
96 reiserfs_sync_fs(s, 1);
99 void reiserfs_schedule_old_flush(struct super_block *s)
101 struct reiserfs_sb_info *sbi = REISERFS_SB(s);
102 unsigned long delay;
105 * Avoid scheduling flush when sb is being shut down. It can race
106 * with journal shutdown and free still queued delayed work.
108 if (s->s_flags & MS_RDONLY || !(s->s_flags & MS_ACTIVE))
109 return;
111 spin_lock(&sbi->old_work_lock);
112 if (!sbi->work_queued) {
113 delay = msecs_to_jiffies(dirty_writeback_interval * 10);
114 queue_delayed_work(system_long_wq, &sbi->old_work, delay);
115 sbi->work_queued = 1;
117 spin_unlock(&sbi->old_work_lock);
120 static void cancel_old_flush(struct super_block *s)
122 struct reiserfs_sb_info *sbi = REISERFS_SB(s);
124 cancel_delayed_work_sync(&REISERFS_SB(s)->old_work);
125 spin_lock(&sbi->old_work_lock);
126 sbi->work_queued = 0;
127 spin_unlock(&sbi->old_work_lock);
130 static int reiserfs_freeze(struct super_block *s)
132 struct reiserfs_transaction_handle th;
134 cancel_old_flush(s);
136 reiserfs_write_lock(s);
137 if (!(s->s_flags & MS_RDONLY)) {
138 int err = journal_begin(&th, s, 1);
139 if (err) {
140 reiserfs_block_writes(&th);
141 } else {
142 reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s),
144 journal_mark_dirty(&th, SB_BUFFER_WITH_SB(s));
145 reiserfs_block_writes(&th);
146 journal_end_sync(&th);
149 reiserfs_write_unlock(s);
150 return 0;
/* ->unfreeze_fs: re-enable writes on @s.  Always returns 0. */
static int reiserfs_unfreeze(struct super_block *s)
{
	reiserfs_allow_writes(s);

	return 0;
}
159 extern const struct in_core_key MAX_IN_CORE_KEY;
162 * this is used to delete "save link" when there are no items of a
163 * file it points to. It can either happen if unlink is completed but
164 * "save unlink" removal, or if file has both unlink and truncate
165 * pending and as unlink completes first (because key of "save link"
166 * protecting unlink is bigger that a key lf "save link" which
167 * protects truncate), so there left no items to make truncate
168 * completion on
170 static int remove_save_link_only(struct super_block *s,
171 struct reiserfs_key *key, int oid_free)
173 struct reiserfs_transaction_handle th;
174 int err;
176 /* we are going to do one balancing */
177 err = journal_begin(&th, s, JOURNAL_PER_BALANCE_CNT);
178 if (err)
179 return err;
181 reiserfs_delete_solid_item(&th, NULL, key);
182 if (oid_free)
183 /* removals are protected by direct items */
184 reiserfs_release_objectid(&th, le32_to_cpu(key->k_objectid));
186 return journal_end(&th);
189 #ifdef CONFIG_QUOTA
190 static int reiserfs_quota_on_mount(struct super_block *, int);
191 #endif
194 * Look for uncompleted unlinks and truncates and complete them
196 * Called with superblock write locked. If quotas are enabled, we have to
197 * release/retake lest we call dquot_quota_on_mount(), proceed to
198 * schedule_on_each_cpu() in invalidate_bdev() and deadlock waiting for the per
199 * cpu worklets to complete flush_async_commits() that in turn wait for the
200 * superblock write lock.
202 static int finish_unfinished(struct super_block *s)
204 INITIALIZE_PATH(path);
205 struct cpu_key max_cpu_key, obj_key;
206 struct reiserfs_key save_link_key, last_inode_key;
207 int retval = 0;
208 struct item_head *ih;
209 struct buffer_head *bh;
210 int item_pos;
211 char *item;
212 int done;
213 struct inode *inode;
214 int truncate;
215 #ifdef CONFIG_QUOTA
216 int i;
217 int ms_active_set;
218 int quota_enabled[REISERFS_MAXQUOTAS];
219 #endif
221 /* compose key to look for "save" links */
222 max_cpu_key.version = KEY_FORMAT_3_5;
223 max_cpu_key.on_disk_key.k_dir_id = ~0U;
224 max_cpu_key.on_disk_key.k_objectid = ~0U;
225 set_cpu_key_k_offset(&max_cpu_key, ~0U);
226 max_cpu_key.key_length = 3;
228 memset(&last_inode_key, 0, sizeof(last_inode_key));
230 #ifdef CONFIG_QUOTA
231 /* Needed for iput() to work correctly and not trash data */
232 if (s->s_flags & MS_ACTIVE) {
233 ms_active_set = 0;
234 } else {
235 ms_active_set = 1;
236 s->s_flags |= MS_ACTIVE;
238 /* Turn on quotas so that they are updated correctly */
239 for (i = 0; i < REISERFS_MAXQUOTAS; i++) {
240 quota_enabled[i] = 1;
241 if (REISERFS_SB(s)->s_qf_names[i]) {
242 int ret;
244 if (sb_has_quota_active(s, i)) {
245 quota_enabled[i] = 0;
246 continue;
248 reiserfs_write_unlock(s);
249 ret = reiserfs_quota_on_mount(s, i);
250 reiserfs_write_lock(s);
251 if (ret < 0)
252 reiserfs_warning(s, "reiserfs-2500",
253 "cannot turn on journaled "
254 "quota: error %d", ret);
257 #endif
259 done = 0;
260 REISERFS_SB(s)->s_is_unlinked_ok = 1;
261 while (!retval) {
262 int depth;
263 retval = search_item(s, &max_cpu_key, &path);
264 if (retval != ITEM_NOT_FOUND) {
265 reiserfs_error(s, "vs-2140",
266 "search_by_key returned %d", retval);
267 break;
270 bh = get_last_bh(&path);
271 item_pos = get_item_pos(&path);
272 if (item_pos != B_NR_ITEMS(bh)) {
273 reiserfs_warning(s, "vs-2060",
274 "wrong position found");
275 break;
277 item_pos--;
278 ih = item_head(bh, item_pos);
280 if (le32_to_cpu(ih->ih_key.k_dir_id) != MAX_KEY_OBJECTID)
281 /* there are no "save" links anymore */
282 break;
284 save_link_key = ih->ih_key;
285 if (is_indirect_le_ih(ih))
286 truncate = 1;
287 else
288 truncate = 0;
290 /* reiserfs_iget needs k_dirid and k_objectid only */
291 item = ih_item_body(bh, ih);
292 obj_key.on_disk_key.k_dir_id = le32_to_cpu(*(__le32 *) item);
293 obj_key.on_disk_key.k_objectid =
294 le32_to_cpu(ih->ih_key.k_objectid);
295 obj_key.on_disk_key.k_offset = 0;
296 obj_key.on_disk_key.k_type = 0;
298 pathrelse(&path);
300 inode = reiserfs_iget(s, &obj_key);
301 if (IS_ERR_OR_NULL(inode)) {
303 * the unlink almost completed, it just did not
304 * manage to remove "save" link and release objectid
306 reiserfs_warning(s, "vs-2180", "iget failed for %K",
307 &obj_key);
308 retval = remove_save_link_only(s, &save_link_key, 1);
309 continue;
312 if (!truncate && inode->i_nlink) {
313 /* file is not unlinked */
314 reiserfs_warning(s, "vs-2185",
315 "file %K is not unlinked",
316 &obj_key);
317 retval = remove_save_link_only(s, &save_link_key, 0);
318 continue;
320 depth = reiserfs_write_unlock_nested(inode->i_sb);
321 dquot_initialize(inode);
322 reiserfs_write_lock_nested(inode->i_sb, depth);
324 if (truncate && S_ISDIR(inode->i_mode)) {
326 * We got a truncate request for a dir which
327 * is impossible. The only imaginable way is to
328 * execute unfinished truncate request then boot
329 * into old kernel, remove the file and create dir
330 * with the same key.
332 reiserfs_warning(s, "green-2101",
333 "impossible truncate on a "
334 "directory %k. Please report",
335 INODE_PKEY(inode));
336 retval = remove_save_link_only(s, &save_link_key, 0);
337 truncate = 0;
338 iput(inode);
339 continue;
342 if (truncate) {
343 REISERFS_I(inode)->i_flags |=
344 i_link_saved_truncate_mask;
346 * not completed truncate found. New size was
347 * committed together with "save" link
349 reiserfs_info(s, "Truncating %k to %lld ..",
350 INODE_PKEY(inode), inode->i_size);
352 /* don't update modification time */
353 reiserfs_truncate_file(inode, 0);
355 retval = remove_save_link(inode, truncate);
356 } else {
357 REISERFS_I(inode)->i_flags |= i_link_saved_unlink_mask;
358 /* not completed unlink (rmdir) found */
359 reiserfs_info(s, "Removing %k..", INODE_PKEY(inode));
360 if (memcmp(&last_inode_key, INODE_PKEY(inode),
361 sizeof(last_inode_key))){
362 last_inode_key = *INODE_PKEY(inode);
363 /* removal gets completed in iput */
364 retval = 0;
365 } else {
366 reiserfs_warning(s, "super-2189", "Dead loop "
367 "in finish_unfinished "
368 "detected, just remove "
369 "save link\n");
370 retval = remove_save_link_only(s,
371 &save_link_key, 0);
375 iput(inode);
376 printk("done\n");
377 done++;
379 REISERFS_SB(s)->s_is_unlinked_ok = 0;
381 #ifdef CONFIG_QUOTA
382 /* Turn quotas off */
383 reiserfs_write_unlock(s);
384 for (i = 0; i < REISERFS_MAXQUOTAS; i++) {
385 if (sb_dqopt(s)->files[i] && quota_enabled[i])
386 dquot_quota_off(s, i);
388 reiserfs_write_lock(s);
389 if (ms_active_set)
390 /* Restore the flag back */
391 s->s_flags &= ~MS_ACTIVE;
392 #endif
393 pathrelse(&path);
394 if (done)
395 reiserfs_info(s, "There were %d uncompleted unlinks/truncates. "
396 "Completed\n", done);
397 return retval;
401 * to protect file being unlinked from getting lost we "safe" link files
402 * being unlinked. This link will be deleted in the same transaction with last
403 * item of file. mounting the filesystem we scan all these links and remove
404 * files which almost got lost
406 void add_save_link(struct reiserfs_transaction_handle *th,
407 struct inode *inode, int truncate)
409 INITIALIZE_PATH(path);
410 int retval;
411 struct cpu_key key;
412 struct item_head ih;
413 __le32 link;
415 BUG_ON(!th->t_trans_id);
417 /* file can only get one "save link" of each kind */
418 RFALSE(truncate &&
419 (REISERFS_I(inode)->i_flags & i_link_saved_truncate_mask),
420 "saved link already exists for truncated inode %lx",
421 (long)inode->i_ino);
422 RFALSE(!truncate &&
423 (REISERFS_I(inode)->i_flags & i_link_saved_unlink_mask),
424 "saved link already exists for unlinked inode %lx",
425 (long)inode->i_ino);
427 /* setup key of "save" link */
428 key.version = KEY_FORMAT_3_5;
429 key.on_disk_key.k_dir_id = MAX_KEY_OBJECTID;
430 key.on_disk_key.k_objectid = inode->i_ino;
431 if (!truncate) {
432 /* unlink, rmdir, rename */
433 set_cpu_key_k_offset(&key, 1 + inode->i_sb->s_blocksize);
434 set_cpu_key_k_type(&key, TYPE_DIRECT);
436 /* item head of "safe" link */
437 make_le_item_head(&ih, &key, key.version,
438 1 + inode->i_sb->s_blocksize, TYPE_DIRECT,
439 4 /*length */ , 0xffff /*free space */ );
440 } else {
441 /* truncate */
442 if (S_ISDIR(inode->i_mode))
443 reiserfs_warning(inode->i_sb, "green-2102",
444 "Adding a truncate savelink for "
445 "a directory %k! Please report",
446 INODE_PKEY(inode));
447 set_cpu_key_k_offset(&key, 1);
448 set_cpu_key_k_type(&key, TYPE_INDIRECT);
450 /* item head of "safe" link */
451 make_le_item_head(&ih, &key, key.version, 1, TYPE_INDIRECT,
452 4 /*length */ , 0 /*free space */ );
454 key.key_length = 3;
456 /* look for its place in the tree */
457 retval = search_item(inode->i_sb, &key, &path);
458 if (retval != ITEM_NOT_FOUND) {
459 if (retval != -ENOSPC)
460 reiserfs_error(inode->i_sb, "vs-2100",
461 "search_by_key (%K) returned %d", &key,
462 retval);
463 pathrelse(&path);
464 return;
467 /* body of "save" link */
468 link = INODE_PKEY(inode)->k_dir_id;
470 /* put "save" link into tree, don't charge quota to anyone */
471 retval =
472 reiserfs_insert_item(th, &path, &key, &ih, NULL, (char *)&link);
473 if (retval) {
474 if (retval != -ENOSPC)
475 reiserfs_error(inode->i_sb, "vs-2120",
476 "insert_item returned %d", retval);
477 } else {
478 if (truncate)
479 REISERFS_I(inode)->i_flags |=
480 i_link_saved_truncate_mask;
481 else
482 REISERFS_I(inode)->i_flags |= i_link_saved_unlink_mask;
486 /* this opens transaction unlike add_save_link */
487 int remove_save_link(struct inode *inode, int truncate)
489 struct reiserfs_transaction_handle th;
490 struct reiserfs_key key;
491 int err;
493 /* we are going to do one balancing only */
494 err = journal_begin(&th, inode->i_sb, JOURNAL_PER_BALANCE_CNT);
495 if (err)
496 return err;
498 /* setup key of "save" link */
499 key.k_dir_id = cpu_to_le32(MAX_KEY_OBJECTID);
500 key.k_objectid = INODE_PKEY(inode)->k_objectid;
501 if (!truncate) {
502 /* unlink, rmdir, rename */
503 set_le_key_k_offset(KEY_FORMAT_3_5, &key,
504 1 + inode->i_sb->s_blocksize);
505 set_le_key_k_type(KEY_FORMAT_3_5, &key, TYPE_DIRECT);
506 } else {
507 /* truncate */
508 set_le_key_k_offset(KEY_FORMAT_3_5, &key, 1);
509 set_le_key_k_type(KEY_FORMAT_3_5, &key, TYPE_INDIRECT);
512 if ((truncate &&
513 (REISERFS_I(inode)->i_flags & i_link_saved_truncate_mask)) ||
514 (!truncate &&
515 (REISERFS_I(inode)->i_flags & i_link_saved_unlink_mask)))
516 /* don't take quota bytes from anywhere */
517 reiserfs_delete_solid_item(&th, NULL, &key);
518 if (!truncate) {
519 reiserfs_release_objectid(&th, inode->i_ino);
520 REISERFS_I(inode)->i_flags &= ~i_link_saved_unlink_mask;
521 } else
522 REISERFS_I(inode)->i_flags &= ~i_link_saved_truncate_mask;
524 return journal_end(&th);
527 static void reiserfs_kill_sb(struct super_block *s)
529 if (REISERFS_SB(s)) {
530 reiserfs_proc_info_done(s);
532 * Force any pending inode evictions to occur now. Any
533 * inodes to be removed that have extended attributes
534 * associated with them need to clean them up before
535 * we can release the extended attribute root dentries.
536 * shrink_dcache_for_umount will BUG if we don't release
537 * those before it's called so ->put_super is too late.
539 shrink_dcache_sb(s);
541 dput(REISERFS_SB(s)->xattr_root);
542 REISERFS_SB(s)->xattr_root = NULL;
543 dput(REISERFS_SB(s)->priv_root);
544 REISERFS_SB(s)->priv_root = NULL;
547 kill_block_super(s);
550 static void reiserfs_put_super(struct super_block *s)
552 struct reiserfs_transaction_handle th;
553 th.t_trans_id = 0;
555 dquot_disable(s, -1, DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED);
557 reiserfs_write_lock(s);
560 * change file system state to current state if it was mounted
561 * with read-write permissions
563 if (!(s->s_flags & MS_RDONLY)) {
564 if (!journal_begin(&th, s, 10)) {
565 reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s),
567 set_sb_umount_state(SB_DISK_SUPER_BLOCK(s),
568 REISERFS_SB(s)->s_mount_state);
569 journal_mark_dirty(&th, SB_BUFFER_WITH_SB(s));
574 * note, journal_release checks for readonly mount, and can
575 * decide not to do a journal_end
577 journal_release(&th, s);
579 reiserfs_free_bitmap_cache(s);
581 brelse(SB_BUFFER_WITH_SB(s));
583 print_statistics(s);
585 if (REISERFS_SB(s)->reserved_blocks != 0) {
586 reiserfs_warning(s, "green-2005", "reserved blocks left %d",
587 REISERFS_SB(s)->reserved_blocks);
590 reiserfs_write_unlock(s);
591 mutex_destroy(&REISERFS_SB(s)->lock);
592 destroy_workqueue(REISERFS_SB(s)->commit_wq);
593 kfree(s->s_fs_info);
594 s->s_fs_info = NULL;
597 static struct kmem_cache *reiserfs_inode_cachep;
599 static struct inode *reiserfs_alloc_inode(struct super_block *sb)
601 struct reiserfs_inode_info *ei;
602 ei = kmem_cache_alloc(reiserfs_inode_cachep, GFP_KERNEL);
603 if (!ei)
604 return NULL;
605 atomic_set(&ei->openers, 0);
606 mutex_init(&ei->tailpack);
607 #ifdef CONFIG_QUOTA
608 memset(&ei->i_dquot, 0, sizeof(ei->i_dquot));
609 #endif
611 return &ei->vfs_inode;
614 static void reiserfs_i_callback(struct rcu_head *head)
616 struct inode *inode = container_of(head, struct inode, i_rcu);
617 kmem_cache_free(reiserfs_inode_cachep, REISERFS_I(inode));
620 static void reiserfs_destroy_inode(struct inode *inode)
622 call_rcu(&inode->i_rcu, reiserfs_i_callback);
625 static void init_once(void *foo)
627 struct reiserfs_inode_info *ei = (struct reiserfs_inode_info *)foo;
629 INIT_LIST_HEAD(&ei->i_prealloc_list);
630 inode_init_once(&ei->vfs_inode);
633 static int __init init_inodecache(void)
635 reiserfs_inode_cachep = kmem_cache_create("reiser_inode_cache",
636 sizeof(struct
637 reiserfs_inode_info),
638 0, (SLAB_RECLAIM_ACCOUNT|
639 SLAB_MEM_SPREAD|
640 SLAB_ACCOUNT),
641 init_once);
642 if (reiserfs_inode_cachep == NULL)
643 return -ENOMEM;
644 return 0;
647 static void destroy_inodecache(void)
650 * Make sure all delayed rcu free inodes are flushed before we
651 * destroy cache.
653 rcu_barrier();
654 kmem_cache_destroy(reiserfs_inode_cachep);
657 /* we don't mark inodes dirty, we just log them */
658 static void reiserfs_dirty_inode(struct inode *inode, int flags)
660 struct reiserfs_transaction_handle th;
662 int err = 0;
664 if (inode->i_sb->s_flags & MS_RDONLY) {
665 reiserfs_warning(inode->i_sb, "clm-6006",
666 "writing inode %lu on readonly FS",
667 inode->i_ino);
668 return;
670 reiserfs_write_lock(inode->i_sb);
673 * this is really only used for atime updates, so they don't have
674 * to be included in O_SYNC or fsync
676 err = journal_begin(&th, inode->i_sb, 1);
677 if (err)
678 goto out;
680 reiserfs_update_sd(&th, inode);
681 journal_end(&th);
683 out:
684 reiserfs_write_unlock(inode->i_sb);
687 static int reiserfs_show_options(struct seq_file *seq, struct dentry *root)
689 struct super_block *s = root->d_sb;
690 struct reiserfs_journal *journal = SB_JOURNAL(s);
691 long opts = REISERFS_SB(s)->s_mount_opt;
693 if (opts & (1 << REISERFS_LARGETAIL))
694 seq_puts(seq, ",tails=on");
695 else if (!(opts & (1 << REISERFS_SMALLTAIL)))
696 seq_puts(seq, ",notail");
697 /* tails=small is default so we don't show it */
699 if (!(opts & (1 << REISERFS_BARRIER_FLUSH)))
700 seq_puts(seq, ",barrier=none");
701 /* barrier=flush is default so we don't show it */
703 if (opts & (1 << REISERFS_ERROR_CONTINUE))
704 seq_puts(seq, ",errors=continue");
705 else if (opts & (1 << REISERFS_ERROR_PANIC))
706 seq_puts(seq, ",errors=panic");
707 /* errors=ro is default so we don't show it */
709 if (opts & (1 << REISERFS_DATA_LOG))
710 seq_puts(seq, ",data=journal");
711 else if (opts & (1 << REISERFS_DATA_WRITEBACK))
712 seq_puts(seq, ",data=writeback");
713 /* data=ordered is default so we don't show it */
715 if (opts & (1 << REISERFS_ATTRS))
716 seq_puts(seq, ",attrs");
718 if (opts & (1 << REISERFS_XATTRS_USER))
719 seq_puts(seq, ",user_xattr");
721 if (opts & (1 << REISERFS_EXPOSE_PRIVROOT))
722 seq_puts(seq, ",expose_privroot");
724 if (opts & (1 << REISERFS_POSIXACL))
725 seq_puts(seq, ",acl");
727 if (REISERFS_SB(s)->s_jdev)
728 seq_show_option(seq, "jdev", REISERFS_SB(s)->s_jdev);
730 if (journal->j_max_commit_age != journal->j_default_max_commit_age)
731 seq_printf(seq, ",commit=%d", journal->j_max_commit_age);
733 #ifdef CONFIG_QUOTA
734 if (REISERFS_SB(s)->s_qf_names[USRQUOTA])
735 seq_show_option(seq, "usrjquota",
736 REISERFS_SB(s)->s_qf_names[USRQUOTA]);
737 else if (opts & (1 << REISERFS_USRQUOTA))
738 seq_puts(seq, ",usrquota");
739 if (REISERFS_SB(s)->s_qf_names[GRPQUOTA])
740 seq_show_option(seq, "grpjquota",
741 REISERFS_SB(s)->s_qf_names[GRPQUOTA]);
742 else if (opts & (1 << REISERFS_GRPQUOTA))
743 seq_puts(seq, ",grpquota");
744 if (REISERFS_SB(s)->s_jquota_fmt) {
745 if (REISERFS_SB(s)->s_jquota_fmt == QFMT_VFS_OLD)
746 seq_puts(seq, ",jqfmt=vfsold");
747 else if (REISERFS_SB(s)->s_jquota_fmt == QFMT_VFS_V0)
748 seq_puts(seq, ",jqfmt=vfsv0");
750 #endif
752 /* Block allocator options */
753 if (opts & (1 << REISERFS_NO_BORDER))
754 seq_puts(seq, ",block-allocator=noborder");
755 if (opts & (1 << REISERFS_NO_UNHASHED_RELOCATION))
756 seq_puts(seq, ",block-allocator=no_unhashed_relocation");
757 if (opts & (1 << REISERFS_HASHED_RELOCATION))
758 seq_puts(seq, ",block-allocator=hashed_relocation");
759 if (opts & (1 << REISERFS_TEST4))
760 seq_puts(seq, ",block-allocator=test4");
761 show_alloc_options(seq, s);
762 return 0;
765 #ifdef CONFIG_QUOTA
766 static ssize_t reiserfs_quota_write(struct super_block *, int, const char *,
767 size_t, loff_t);
768 static ssize_t reiserfs_quota_read(struct super_block *, int, char *, size_t,
769 loff_t);
771 static struct dquot **reiserfs_get_dquots(struct inode *inode)
773 return REISERFS_I(inode)->i_dquot;
775 #endif
777 static const struct super_operations reiserfs_sops = {
778 .alloc_inode = reiserfs_alloc_inode,
779 .destroy_inode = reiserfs_destroy_inode,
780 .write_inode = reiserfs_write_inode,
781 .dirty_inode = reiserfs_dirty_inode,
782 .evict_inode = reiserfs_evict_inode,
783 .put_super = reiserfs_put_super,
784 .sync_fs = reiserfs_sync_fs,
785 .freeze_fs = reiserfs_freeze,
786 .unfreeze_fs = reiserfs_unfreeze,
787 .statfs = reiserfs_statfs,
788 .remount_fs = reiserfs_remount,
789 .show_options = reiserfs_show_options,
790 #ifdef CONFIG_QUOTA
791 .quota_read = reiserfs_quota_read,
792 .quota_write = reiserfs_quota_write,
793 .get_dquots = reiserfs_get_dquots,
794 #endif
797 #ifdef CONFIG_QUOTA
798 #define QTYPE2NAME(t) ((t)==USRQUOTA?"user":"group")
800 static int reiserfs_write_dquot(struct dquot *);
801 static int reiserfs_acquire_dquot(struct dquot *);
802 static int reiserfs_release_dquot(struct dquot *);
803 static int reiserfs_mark_dquot_dirty(struct dquot *);
804 static int reiserfs_write_info(struct super_block *, int);
805 static int reiserfs_quota_on(struct super_block *, int, int, struct path *);
807 static const struct dquot_operations reiserfs_quota_operations = {
808 .write_dquot = reiserfs_write_dquot,
809 .acquire_dquot = reiserfs_acquire_dquot,
810 .release_dquot = reiserfs_release_dquot,
811 .mark_dirty = reiserfs_mark_dquot_dirty,
812 .write_info = reiserfs_write_info,
813 .alloc_dquot = dquot_alloc,
814 .destroy_dquot = dquot_destroy,
815 .get_next_id = dquot_get_next_id,
818 static const struct quotactl_ops reiserfs_qctl_operations = {
819 .quota_on = reiserfs_quota_on,
820 .quota_off = dquot_quota_off,
821 .quota_sync = dquot_quota_sync,
822 .get_state = dquot_get_state,
823 .set_info = dquot_set_dqinfo,
824 .get_dqblk = dquot_get_dqblk,
825 .set_dqblk = dquot_set_dqblk,
827 #endif
829 static const struct export_operations reiserfs_export_ops = {
830 .encode_fh = reiserfs_encode_fh,
831 .fh_to_dentry = reiserfs_fh_to_dentry,
832 .fh_to_parent = reiserfs_fh_to_parent,
833 .get_parent = reiserfs_get_parent,
/*
 * Describes one accepted value of a mount option that takes a value
 * (as opposed to a plain toggle).  Used by reiserfs_getopt().
 */
typedef struct {
	/* textual value, compared against the option argument */
	char *value;

	/*
	 * bits to set in the mount_options bitmask when this value is
	 * found; 0 means no bits are to be changed
	 */
	int setmask;

	/*
	 * bits to clear in the mount_options bitmask when this value is
	 * found; 0 means no bits are to be changed.
	 * This is applied BEFORE setmask
	 */
	int clrmask;
} arg_desc_t;
855 /* Set this bit in arg_required to allow empty arguments */
856 #define REISERFS_OPT_ALLOWEMPTY 31
859 * this struct is used in reiserfs_getopt() for describing the
860 * set of reiserfs mount options
862 typedef struct {
863 char *option_name;
865 /* 0 if argument is not required, not 0 otherwise */
866 int arg_required;
868 /* list of values accepted by an option */
869 const arg_desc_t *values;
872 * bitmask which is to set on mount_options bitmask
873 * when this value is found, 0 is no bits are to be changed.
875 int setmask;
878 * bitmask which is to clear on mount_options bitmask
879 * when this value is found, 0 is no bits are to be changed.
880 * This is applied BEFORE setmask
882 int clrmask;
883 } opt_desc_t;
885 /* possible values for -o data= */
886 static const arg_desc_t logging_mode[] = {
887 {"ordered", 1 << REISERFS_DATA_ORDERED,
888 (1 << REISERFS_DATA_LOG | 1 << REISERFS_DATA_WRITEBACK)},
889 {"journal", 1 << REISERFS_DATA_LOG,
890 (1 << REISERFS_DATA_ORDERED | 1 << REISERFS_DATA_WRITEBACK)},
891 {"writeback", 1 << REISERFS_DATA_WRITEBACK,
892 (1 << REISERFS_DATA_ORDERED | 1 << REISERFS_DATA_LOG)},
893 {.value = NULL}
896 /* possible values for -o barrier= */
897 static const arg_desc_t barrier_mode[] = {
898 {"none", 1 << REISERFS_BARRIER_NONE, 1 << REISERFS_BARRIER_FLUSH},
899 {"flush", 1 << REISERFS_BARRIER_FLUSH, 1 << REISERFS_BARRIER_NONE},
900 {.value = NULL}
904 * possible values for "-o block-allocator=" and bits which are to be set in
905 * s_mount_opt of reiserfs specific part of in-core super block
907 static const arg_desc_t balloc[] = {
908 {"noborder", 1 << REISERFS_NO_BORDER, 0},
909 {"border", 0, 1 << REISERFS_NO_BORDER},
910 {"no_unhashed_relocation", 1 << REISERFS_NO_UNHASHED_RELOCATION, 0},
911 {"hashed_relocation", 1 << REISERFS_HASHED_RELOCATION, 0},
912 {"test4", 1 << REISERFS_TEST4, 0},
913 {"notest4", 0, 1 << REISERFS_TEST4},
914 {NULL, 0, 0}
917 static const arg_desc_t tails[] = {
918 {"on", 1 << REISERFS_LARGETAIL, 1 << REISERFS_SMALLTAIL},
919 {"off", 0, (1 << REISERFS_LARGETAIL) | (1 << REISERFS_SMALLTAIL)},
920 {"small", 1 << REISERFS_SMALLTAIL, 1 << REISERFS_LARGETAIL},
921 {NULL, 0, 0}
924 static const arg_desc_t error_actions[] = {
925 {"panic", 1 << REISERFS_ERROR_PANIC,
926 (1 << REISERFS_ERROR_RO | 1 << REISERFS_ERROR_CONTINUE)},
927 {"ro-remount", 1 << REISERFS_ERROR_RO,
928 (1 << REISERFS_ERROR_PANIC | 1 << REISERFS_ERROR_CONTINUE)},
929 #ifdef REISERFS_JOURNAL_ERROR_ALLOWS_NO_LOG
930 {"continue", 1 << REISERFS_ERROR_CONTINUE,
931 (1 << REISERFS_ERROR_PANIC | 1 << REISERFS_ERROR_RO)},
932 #endif
933 {NULL, 0, 0},
937 * proceed only one option from a list *cur - string containing of mount
938 * options
939 * opts - array of options which are accepted
940 * opt_arg - if option is found and requires an argument and if it is specifed
941 * in the input - pointer to the argument is stored here
942 * bit_flags - if option requires to set a certain bit - it is set here
943 * return -1 if unknown option is found, opt->arg_required otherwise
945 static int reiserfs_getopt(struct super_block *s, char **cur, opt_desc_t * opts,
946 char **opt_arg, unsigned long *bit_flags)
948 char *p;
950 * foo=bar,
951 * ^ ^ ^
952 * | | +-- option_end
953 * | +-- arg_start
954 * +-- option_start
956 const opt_desc_t *opt;
957 const arg_desc_t *arg;
959 p = *cur;
961 /* assume argument cannot contain commas */
962 *cur = strchr(p, ',');
963 if (*cur) {
964 *(*cur) = '\0';
965 (*cur)++;
968 if (!strncmp(p, "alloc=", 6)) {
970 * Ugly special case, probably we should redo options
971 * parser so that it can understand several arguments for
972 * some options, also so that it can fill several bitfields
973 * with option values.
975 if (reiserfs_parse_alloc_options(s, p + 6)) {
976 return -1;
977 } else {
978 return 0;
982 /* for every option in the list */
983 for (opt = opts; opt->option_name; opt++) {
984 if (!strncmp(p, opt->option_name, strlen(opt->option_name))) {
985 if (bit_flags) {
986 if (opt->clrmask ==
987 (1 << REISERFS_UNSUPPORTED_OPT))
988 reiserfs_warning(s, "super-6500",
989 "%s not supported.\n",
991 else
992 *bit_flags &= ~opt->clrmask;
993 if (opt->setmask ==
994 (1 << REISERFS_UNSUPPORTED_OPT))
995 reiserfs_warning(s, "super-6501",
996 "%s not supported.\n",
998 else
999 *bit_flags |= opt->setmask;
1001 break;
1004 if (!opt->option_name) {
1005 reiserfs_warning(s, "super-6502",
1006 "unknown mount option \"%s\"", p);
1007 return -1;
1010 p += strlen(opt->option_name);
1011 switch (*p) {
1012 case '=':
1013 if (!opt->arg_required) {
1014 reiserfs_warning(s, "super-6503",
1015 "the option \"%s\" does not "
1016 "require an argument\n",
1017 opt->option_name);
1018 return -1;
1020 break;
1022 case 0:
1023 if (opt->arg_required) {
1024 reiserfs_warning(s, "super-6504",
1025 "the option \"%s\" requires an "
1026 "argument\n", opt->option_name);
1027 return -1;
1029 break;
1030 default:
1031 reiserfs_warning(s, "super-6505",
1032 "head of option \"%s\" is only correct\n",
1033 opt->option_name);
1034 return -1;
1038 * move to the argument, or to next option if argument is not
1039 * required
1041 p++;
1043 if (opt->arg_required
1044 && !(opt->arg_required & (1 << REISERFS_OPT_ALLOWEMPTY))
1045 && !strlen(p)) {
1046 /* this catches "option=," if not allowed */
1047 reiserfs_warning(s, "super-6506",
1048 "empty argument for \"%s\"\n",
1049 opt->option_name);
1050 return -1;
1053 if (!opt->values) {
1054 /* *=NULLopt_arg contains pointer to argument */
1055 *opt_arg = p;
1056 return opt->arg_required & ~(1 << REISERFS_OPT_ALLOWEMPTY);
1059 /* values possible for this option are listed in opt->values */
1060 for (arg = opt->values; arg->value; arg++) {
1061 if (!strcmp(p, arg->value)) {
1062 if (bit_flags) {
1063 *bit_flags &= ~arg->clrmask;
1064 *bit_flags |= arg->setmask;
1066 return opt->arg_required;
1070 reiserfs_warning(s, "super-6506",
1071 "bad value \"%s\" for option \"%s\"\n", p,
1072 opt->option_name);
1073 return -1;
1076 /* returns 0 if something is wrong in option string, 1 - otherwise */
1077 static int reiserfs_parse_options(struct super_block *s,
1079 /* string given via mount's -o */
1080 char *options,
1083 * after the parsing phase, contains the
1084 * collection of bitflags defining what
1085 * mount options were selected.
1087 unsigned long *mount_options,
1089 /* strtol-ed from NNN of resize=NNN */
1090 unsigned long *blocks,
1091 char **jdev_name,
1092 unsigned int *commit_max_age,
1093 char **qf_names,
1094 unsigned int *qfmt)
1096 int c;
1097 char *arg = NULL;
1098 char *pos;
1099 opt_desc_t opts[] = {
1101 * Compatibility stuff, so that -o notail for old
1102 * setups still work
1104 {"tails",.arg_required = 't',.values = tails},
1105 {"notail",.clrmask =
1106 (1 << REISERFS_LARGETAIL) | (1 << REISERFS_SMALLTAIL)},
1107 {"conv",.setmask = 1 << REISERFS_CONVERT},
1108 {"attrs",.setmask = 1 << REISERFS_ATTRS},
1109 {"noattrs",.clrmask = 1 << REISERFS_ATTRS},
1110 {"expose_privroot", .setmask = 1 << REISERFS_EXPOSE_PRIVROOT},
1111 #ifdef CONFIG_REISERFS_FS_XATTR
1112 {"user_xattr",.setmask = 1 << REISERFS_XATTRS_USER},
1113 {"nouser_xattr",.clrmask = 1 << REISERFS_XATTRS_USER},
1114 #else
1115 {"user_xattr",.setmask = 1 << REISERFS_UNSUPPORTED_OPT},
1116 {"nouser_xattr",.clrmask = 1 << REISERFS_UNSUPPORTED_OPT},
1117 #endif
1118 #ifdef CONFIG_REISERFS_FS_POSIX_ACL
1119 {"acl",.setmask = 1 << REISERFS_POSIXACL},
1120 {"noacl",.clrmask = 1 << REISERFS_POSIXACL},
1121 #else
1122 {"acl",.setmask = 1 << REISERFS_UNSUPPORTED_OPT},
1123 {"noacl",.clrmask = 1 << REISERFS_UNSUPPORTED_OPT},
1124 #endif
1125 {.option_name = "nolog"},
1126 {"replayonly",.setmask = 1 << REPLAYONLY},
1127 {"block-allocator",.arg_required = 'a',.values = balloc},
1128 {"data",.arg_required = 'd',.values = logging_mode},
1129 {"barrier",.arg_required = 'b',.values = barrier_mode},
1130 {"resize",.arg_required = 'r',.values = NULL},
1131 {"jdev",.arg_required = 'j',.values = NULL},
1132 {"nolargeio",.arg_required = 'w',.values = NULL},
1133 {"commit",.arg_required = 'c',.values = NULL},
1134 {"usrquota",.setmask = 1 << REISERFS_USRQUOTA},
1135 {"grpquota",.setmask = 1 << REISERFS_GRPQUOTA},
1136 {"noquota",.clrmask = 1 << REISERFS_USRQUOTA | 1 << REISERFS_GRPQUOTA},
1137 {"errors",.arg_required = 'e',.values = error_actions},
1138 {"usrjquota",.arg_required =
1139 'u' | (1 << REISERFS_OPT_ALLOWEMPTY),.values = NULL},
1140 {"grpjquota",.arg_required =
1141 'g' | (1 << REISERFS_OPT_ALLOWEMPTY),.values = NULL},
1142 {"jqfmt",.arg_required = 'f',.values = NULL},
1143 {.option_name = NULL}
1146 *blocks = 0;
1147 if (!options || !*options)
1149 * use default configuration: create tails, journaling on, no
1150 * conversion to newest format
1152 return 1;
1154 for (pos = options; pos;) {
1155 c = reiserfs_getopt(s, &pos, opts, &arg, mount_options);
1156 if (c == -1)
1157 /* wrong option is given */
1158 return 0;
1160 if (c == 'r') {
1161 char *p;
1163 p = NULL;
1164 /* "resize=NNN" or "resize=auto" */
1166 if (!strcmp(arg, "auto")) {
1167 /* From JFS code, to auto-get the size. */
1168 *blocks =
1169 s->s_bdev->bd_inode->i_size >> s->
1170 s_blocksize_bits;
1171 } else {
1172 *blocks = simple_strtoul(arg, &p, 0);
1173 if (*p != '\0') {
1174 /* NNN does not look like a number */
1175 reiserfs_warning(s, "super-6507",
1176 "bad value %s for "
1177 "-oresize\n", arg);
1178 return 0;
1183 if (c == 'c') {
1184 char *p = NULL;
1185 unsigned long val = simple_strtoul(arg, &p, 0);
1186 /* commit=NNN (time in seconds) */
1187 if (*p != '\0' || val >= (unsigned int)-1) {
1188 reiserfs_warning(s, "super-6508",
1189 "bad value %s for -ocommit\n",
1190 arg);
1191 return 0;
1193 *commit_max_age = (unsigned int)val;
1196 if (c == 'w') {
1197 reiserfs_warning(s, "super-6509", "nolargeio option "
1198 "is no longer supported");
1199 return 0;
1202 if (c == 'j') {
1203 if (arg && *arg && jdev_name) {
1204 /* Hm, already assigned? */
1205 if (*jdev_name) {
1206 reiserfs_warning(s, "super-6510",
1207 "journal device was "
1208 "already specified to "
1209 "be %s", *jdev_name);
1210 return 0;
1212 *jdev_name = arg;
1215 #ifdef CONFIG_QUOTA
1216 if (c == 'u' || c == 'g') {
1217 int qtype = c == 'u' ? USRQUOTA : GRPQUOTA;
1219 if (sb_any_quota_loaded(s) &&
1220 (!*arg != !REISERFS_SB(s)->s_qf_names[qtype])) {
1221 reiserfs_warning(s, "super-6511",
1222 "cannot change journaled "
1223 "quota options when quota "
1224 "turned on.");
1225 return 0;
1227 if (*arg) { /* Some filename specified? */
1228 if (REISERFS_SB(s)->s_qf_names[qtype]
1229 && strcmp(REISERFS_SB(s)->s_qf_names[qtype],
1230 arg)) {
1231 reiserfs_warning(s, "super-6512",
1232 "%s quota file "
1233 "already specified.",
1234 QTYPE2NAME(qtype));
1235 return 0;
1237 if (strchr(arg, '/')) {
1238 reiserfs_warning(s, "super-6513",
1239 "quotafile must be "
1240 "on filesystem root.");
1241 return 0;
1243 qf_names[qtype] = kstrdup(arg, GFP_KERNEL);
1244 if (!qf_names[qtype]) {
1245 reiserfs_warning(s, "reiserfs-2502",
1246 "not enough memory "
1247 "for storing "
1248 "quotafile name.");
1249 return 0;
1251 if (qtype == USRQUOTA)
1252 *mount_options |= 1 << REISERFS_USRQUOTA;
1253 else
1254 *mount_options |= 1 << REISERFS_GRPQUOTA;
1255 } else {
1256 if (qf_names[qtype] !=
1257 REISERFS_SB(s)->s_qf_names[qtype])
1258 kfree(qf_names[qtype]);
1259 qf_names[qtype] = NULL;
1260 if (qtype == USRQUOTA)
1261 *mount_options &= ~(1 << REISERFS_USRQUOTA);
1262 else
1263 *mount_options &= ~(1 << REISERFS_GRPQUOTA);
1266 if (c == 'f') {
1267 if (!strcmp(arg, "vfsold"))
1268 *qfmt = QFMT_VFS_OLD;
1269 else if (!strcmp(arg, "vfsv0"))
1270 *qfmt = QFMT_VFS_V0;
1271 else {
1272 reiserfs_warning(s, "super-6514",
1273 "unknown quota format "
1274 "specified.");
1275 return 0;
1277 if (sb_any_quota_loaded(s) &&
1278 *qfmt != REISERFS_SB(s)->s_jquota_fmt) {
1279 reiserfs_warning(s, "super-6515",
1280 "cannot change journaled "
1281 "quota options when quota "
1282 "turned on.");
1283 return 0;
1286 #else
1287 if (c == 'u' || c == 'g' || c == 'f') {
1288 reiserfs_warning(s, "reiserfs-2503", "journaled "
1289 "quota options not supported.");
1290 return 0;
1292 #endif
1295 #ifdef CONFIG_QUOTA
1296 if (!REISERFS_SB(s)->s_jquota_fmt && !*qfmt
1297 && (qf_names[USRQUOTA] || qf_names[GRPQUOTA])) {
1298 reiserfs_warning(s, "super-6515",
1299 "journaled quota format not specified.");
1300 return 0;
1302 if ((!(*mount_options & (1 << REISERFS_USRQUOTA)) &&
1303 sb_has_quota_loaded(s, USRQUOTA)) ||
1304 (!(*mount_options & (1 << REISERFS_GRPQUOTA)) &&
1305 sb_has_quota_loaded(s, GRPQUOTA))) {
1306 reiserfs_warning(s, "super-6516", "quota options must "
1307 "be present when quota is turned on.");
1308 return 0;
1310 #endif
1312 return 1;
1315 static void switch_data_mode(struct super_block *s, unsigned long mode)
1317 REISERFS_SB(s)->s_mount_opt &= ~((1 << REISERFS_DATA_LOG) |
1318 (1 << REISERFS_DATA_ORDERED) |
1319 (1 << REISERFS_DATA_WRITEBACK));
1320 REISERFS_SB(s)->s_mount_opt |= (1 << mode);
1323 static void handle_data_mode(struct super_block *s, unsigned long mount_options)
1325 if (mount_options & (1 << REISERFS_DATA_LOG)) {
1326 if (!reiserfs_data_log(s)) {
1327 switch_data_mode(s, REISERFS_DATA_LOG);
1328 reiserfs_info(s, "switching to journaled data mode\n");
1330 } else if (mount_options & (1 << REISERFS_DATA_ORDERED)) {
1331 if (!reiserfs_data_ordered(s)) {
1332 switch_data_mode(s, REISERFS_DATA_ORDERED);
1333 reiserfs_info(s, "switching to ordered data mode\n");
1335 } else if (mount_options & (1 << REISERFS_DATA_WRITEBACK)) {
1336 if (!reiserfs_data_writeback(s)) {
1337 switch_data_mode(s, REISERFS_DATA_WRITEBACK);
1338 reiserfs_info(s, "switching to writeback data mode\n");
1343 static void handle_barrier_mode(struct super_block *s, unsigned long bits)
1345 int flush = (1 << REISERFS_BARRIER_FLUSH);
1346 int none = (1 << REISERFS_BARRIER_NONE);
1347 int all_barrier = flush | none;
1349 if (bits & all_barrier) {
1350 REISERFS_SB(s)->s_mount_opt &= ~all_barrier;
1351 if (bits & flush) {
1352 REISERFS_SB(s)->s_mount_opt |= flush;
1353 printk("reiserfs: enabling write barrier flush mode\n");
1354 } else if (bits & none) {
1355 REISERFS_SB(s)->s_mount_opt |= none;
1356 printk("reiserfs: write barriers turned off\n");
1361 static void handle_attrs(struct super_block *s)
1363 struct reiserfs_super_block *rs = SB_DISK_SUPER_BLOCK(s);
1365 if (reiserfs_attrs(s)) {
1366 if (old_format_only(s)) {
1367 reiserfs_warning(s, "super-6517", "cannot support "
1368 "attributes on 3.5.x disk format");
1369 REISERFS_SB(s)->s_mount_opt &= ~(1 << REISERFS_ATTRS);
1370 return;
1372 if (!(le32_to_cpu(rs->s_flags) & reiserfs_attrs_cleared)) {
1373 reiserfs_warning(s, "super-6518", "cannot support "
1374 "attributes until flag is set in "
1375 "super-block");
1376 REISERFS_SB(s)->s_mount_opt &= ~(1 << REISERFS_ATTRS);
#ifdef CONFIG_QUOTA
/*
 * Install the parsed journaled quota file names and format into the super
 * block info. A name previously held by the super block is freed when it
 * is being replaced by a different pointer; a zero *qfmt leaves the stored
 * format untouched.
 */
static void handle_quota_files(struct super_block *s, char **qf_names,
			       unsigned int *qfmt)
{
	struct reiserfs_sb_info *sbi = REISERFS_SB(s);
	int type = 0;

	while (type < REISERFS_MAXQUOTAS) {
		char **slot = &sbi->s_qf_names[type];

		if (*slot != qf_names[type])
			kfree(*slot);
		*slot = qf_names[type];
		type++;
	}

	if (*qfmt)
		sbi->s_jquota_fmt = *qfmt;
}
#endif
/*
 * Handle a remount request.
 *
 * Re-parses the option string @arg, applies the option bits that are
 * listed in safe_mask, updates the journal commit ages, optionally resizes
 * the filesystem (resize=) and finally switches between read-only and
 * read-write according to *@mount_flags, updating the on-disk umount state
 * inside a journal transaction.
 *
 * Returns 0 on success, in which case the saved mount options are replaced
 * by a copy of @arg, or a negative error code.
 *
 * Locking: the reiserfs write lock is taken right after sync_filesystem()
 * and is dropped around reiserfs_xattr_init(), dquot_suspend() and
 * dquot_resume(). The label names say whether the lock is still held when
 * jumping to them.
 */
static int reiserfs_remount(struct super_block *s, int *mount_flags, char *arg)
{
	struct reiserfs_super_block *rs;
	struct reiserfs_transaction_handle th;
	unsigned long blocks;
	unsigned long mount_options = REISERFS_SB(s)->s_mount_opt;
	unsigned long safe_mask = 0;
	unsigned int commit_max_age = (unsigned int)-1;
	struct reiserfs_journal *journal = SB_JOURNAL(s);
	char *new_opts;
	int err;
	char *qf_names[REISERFS_MAXQUOTAS];
	unsigned int qfmt = 0;
#ifdef CONFIG_QUOTA
	int i;
#endif

	/*
	 * Keep a private copy of the option string for
	 * replace_mount_options().
	 * NOTE(review): presumably needed because option parsing modifies
	 * @arg in place - confirm against reiserfs_getopt().
	 */
	new_opts = kstrdup(arg, GFP_KERNEL);
	if (arg && !new_opts)
		return -ENOMEM;

	sync_filesystem(s);
	reiserfs_write_lock(s);

#ifdef CONFIG_QUOTA
	/* start from the names the super block currently owns */
	memcpy(qf_names, REISERFS_SB(s)->s_qf_names, sizeof(qf_names));
#endif

	rs = SB_DISK_SUPER_BLOCK(s);

	if (!reiserfs_parse_options
	    (s, arg, &mount_options, &blocks, NULL, &commit_max_age,
	    qf_names, &qfmt)) {
#ifdef CONFIG_QUOTA
		/* free only the names allocated by the failed parse */
		for (i = 0; i < REISERFS_MAXQUOTAS; i++)
			if (qf_names[i] != REISERFS_SB(s)->s_qf_names[i])
				kfree(qf_names[i]);
#endif
		err = -EINVAL;
		goto out_err_unlock;
	}
#ifdef CONFIG_QUOTA
	handle_quota_files(s, qf_names, &qfmt);
#endif

	handle_attrs(s);

	/* Add options that are safe here */
	safe_mask |= 1 << REISERFS_SMALLTAIL;
	safe_mask |= 1 << REISERFS_LARGETAIL;
	safe_mask |= 1 << REISERFS_NO_BORDER;
	safe_mask |= 1 << REISERFS_NO_UNHASHED_RELOCATION;
	safe_mask |= 1 << REISERFS_HASHED_RELOCATION;
	safe_mask |= 1 << REISERFS_TEST4;
	safe_mask |= 1 << REISERFS_ATTRS;
	safe_mask |= 1 << REISERFS_XATTRS_USER;
	safe_mask |= 1 << REISERFS_POSIXACL;
	safe_mask |= 1 << REISERFS_BARRIER_FLUSH;
	safe_mask |= 1 << REISERFS_BARRIER_NONE;
	safe_mask |= 1 << REISERFS_ERROR_RO;
	safe_mask |= 1 << REISERFS_ERROR_CONTINUE;
	safe_mask |= 1 << REISERFS_ERROR_PANIC;
	safe_mask |= 1 << REISERFS_USRQUOTA;
	safe_mask |= 1 << REISERFS_GRPQUOTA;

	/*
	 * Update the bitmask, taking care to keep
	 * the bits we're not allowed to change here
	 */
	REISERFS_SB(s)->s_mount_opt =
	    (REISERFS_SB(s)->
	     s_mount_opt & ~safe_mask) | (mount_options & safe_mask);

	/* (unsigned int)-1 is the "commit= was not given" marker set above */
	if (commit_max_age != 0 && commit_max_age != (unsigned int)-1) {
		journal->j_max_commit_age = commit_max_age;
		journal->j_max_trans_age = commit_max_age;
	} else if (commit_max_age == 0) {
		/* 0 means restore defaults. */
		journal->j_max_commit_age = journal->j_default_max_commit_age;
		journal->j_max_trans_age = JOURNAL_MAX_TRANS_AGE;
	}

	if (blocks) {
		err = reiserfs_resize(s, blocks);
		if (err != 0)
			goto out_err_unlock;
	}

	if (*mount_flags & MS_RDONLY) {
		reiserfs_write_unlock(s);
		reiserfs_xattr_init(s, *mount_flags);
		/* remount read-only */
		if (s->s_flags & MS_RDONLY)
			/* it is read-only already */
			goto out_ok_unlocked;

		err = dquot_suspend(s, -1);
		if (err < 0)
			goto out_err;

		/* try to remount file system with read-only permissions */
		if (sb_umount_state(rs) == REISERFS_VALID_FS
		    || REISERFS_SB(s)->s_mount_state != REISERFS_VALID_FS) {
			goto out_ok_unlocked;
		}

		reiserfs_write_lock(s);

		err = journal_begin(&th, s, 10);
		if (err)
			goto out_err_unlock;

		/* Mounting a rw partition read-only. */
		reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1);
		set_sb_umount_state(rs, REISERFS_SB(s)->s_mount_state);
		journal_mark_dirty(&th, SB_BUFFER_WITH_SB(s));
	} else {
		/* remount read-write */
		if (!(s->s_flags & MS_RDONLY)) {
			reiserfs_write_unlock(s);
			reiserfs_xattr_init(s, *mount_flags);
			goto out_ok_unlocked;	/* We are read-write already */
		}

		if (reiserfs_is_journal_aborted(journal)) {
			err = journal->j_errno;
			goto out_err_unlock;
		}

		handle_data_mode(s, mount_options);
		handle_barrier_mode(s, mount_options);
		REISERFS_SB(s)->s_mount_state = sb_umount_state(rs);

		/* now it is safe to call journal_begin */
		s->s_flags &= ~MS_RDONLY;
		err = journal_begin(&th, s, 10);
		if (err)
			goto out_err_unlock;

		/* Mount a partition which is read-only, read-write */
		reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1);
		REISERFS_SB(s)->s_mount_state = sb_umount_state(rs);
		s->s_flags &= ~MS_RDONLY;
		/* on disk the fs counts as not cleanly unmounted while rw */
		set_sb_umount_state(rs, REISERFS_ERROR_FS);
		if (!old_format_only(s))
			set_sb_mnt_count(rs, sb_mnt_count(rs) + 1);
		/* mark_buffer_dirty (SB_BUFFER_WITH_SB (s), 1); */
		journal_mark_dirty(&th, SB_BUFFER_WITH_SB(s));
		REISERFS_SB(s)->s_mount_state = REISERFS_VALID_FS;
	}
	/* this will force a full flush of all journal lists */
	SB_JOURNAL(s)->j_must_wait = 1;
	err = journal_end(&th);
	if (err)
		goto out_err_unlock;

	reiserfs_write_unlock(s);
	if (!(*mount_flags & MS_RDONLY)) {
		/* we just became read-write */
		dquot_resume(s, -1);
		reiserfs_write_lock(s);
		finish_unfinished(s);
		reiserfs_write_unlock(s);
		reiserfs_xattr_init(s, *mount_flags);
	}

out_ok_unlocked:
	if (new_opts)
		replace_mount_options(s, new_opts);
	return 0;

out_err_unlock:
	reiserfs_write_unlock(s);
out_err:
	kfree(new_opts);
	return err;
}
1574 static int read_super_block(struct super_block *s, int offset)
1576 struct buffer_head *bh;
1577 struct reiserfs_super_block *rs;
1578 int fs_blocksize;
1580 bh = sb_bread(s, offset / s->s_blocksize);
1581 if (!bh) {
1582 reiserfs_warning(s, "sh-2006",
1583 "bread failed (dev %s, block %lu, size %lu)",
1584 s->s_id, offset / s->s_blocksize,
1585 s->s_blocksize);
1586 return 1;
1589 rs = (struct reiserfs_super_block *)bh->b_data;
1590 if (!is_any_reiserfs_magic_string(rs)) {
1591 brelse(bh);
1592 return 1;
1595 * ok, reiserfs signature (old or new) found in at the given offset
1597 fs_blocksize = sb_blocksize(rs);
1598 brelse(bh);
1599 sb_set_blocksize(s, fs_blocksize);
1601 bh = sb_bread(s, offset / s->s_blocksize);
1602 if (!bh) {
1603 reiserfs_warning(s, "sh-2007",
1604 "bread failed (dev %s, block %lu, size %lu)",
1605 s->s_id, offset / s->s_blocksize,
1606 s->s_blocksize);
1607 return 1;
1610 rs = (struct reiserfs_super_block *)bh->b_data;
1611 if (sb_blocksize(rs) != s->s_blocksize) {
1612 reiserfs_warning(s, "sh-2011", "can't find a reiserfs "
1613 "filesystem on (dev %s, block %llu, size %lu)",
1614 s->s_id,
1615 (unsigned long long)bh->b_blocknr,
1616 s->s_blocksize);
1617 brelse(bh);
1618 return 1;
1621 if (rs->s_v1.s_root_block == cpu_to_le32(-1)) {
1622 brelse(bh);
1623 reiserfs_warning(s, "super-6519", "Unfinished reiserfsck "
1624 "--rebuild-tree run detected. Please run\n"
1625 "reiserfsck --rebuild-tree and wait for a "
1626 "completion. If that fails\n"
1627 "get newer reiserfsprogs package");
1628 return 1;
1631 SB_BUFFER_WITH_SB(s) = bh;
1632 SB_DISK_SUPER_BLOCK(s) = rs;
1635 * magic is of non-standard journal filesystem, look at s_version to
1636 * find which format is in use
1638 if (is_reiserfs_jr(rs)) {
1639 if (sb_version(rs) == REISERFS_VERSION_2)
1640 reiserfs_info(s, "found reiserfs format \"3.6\""
1641 " with non-standard journal\n");
1642 else if (sb_version(rs) == REISERFS_VERSION_1)
1643 reiserfs_info(s, "found reiserfs format \"3.5\""
1644 " with non-standard journal\n");
1645 else {
1646 reiserfs_warning(s, "sh-2012", "found unknown "
1647 "format \"%u\" of reiserfs with "
1648 "non-standard magic", sb_version(rs));
1649 return 1;
1651 } else
1653 * s_version of standard format may contain incorrect
1654 * information, so we just look at the magic string
1656 reiserfs_info(s,
1657 "found reiserfs format \"%s\" with standard journal\n",
1658 is_reiserfs_3_5(rs) ? "3.5" : "3.6");
1660 s->s_op = &reiserfs_sops;
1661 s->s_export_op = &reiserfs_export_ops;
1662 #ifdef CONFIG_QUOTA
1663 s->s_qcop = &reiserfs_qctl_operations;
1664 s->dq_op = &reiserfs_quota_operations;
1665 s->s_quota_types = QTYPE_MASK_USR | QTYPE_MASK_GRP;
1666 #endif
1669 * new format is limited by the 32 bit wide i_blocks field, want to
1670 * be one full block below that.
1672 s->s_maxbytes = (512LL << 32) - s->s_blocksize;
1673 return 0;
1676 /* after journal replay, reread all bitmap and super blocks */
1677 static int reread_meta_blocks(struct super_block *s)
1679 ll_rw_block(REQ_OP_READ, 0, 1, &SB_BUFFER_WITH_SB(s));
1680 wait_on_buffer(SB_BUFFER_WITH_SB(s));
1681 if (!buffer_uptodate(SB_BUFFER_WITH_SB(s))) {
1682 reiserfs_warning(s, "reiserfs-2504", "error reading the super");
1683 return 1;
1686 return 0;
1689 /* hash detection stuff */
1692 * if root directory is empty - we set default - Yura's - hash and
1693 * warn about it
1694 * FIXME: we look for only one name in a directory. If tea and yura
1695 * both have the same value - we ask user to send report to the
1696 * mailing list
1698 static __u32 find_hash_out(struct super_block *s)
1700 int retval;
1701 struct inode *inode;
1702 struct cpu_key key;
1703 INITIALIZE_PATH(path);
1704 struct reiserfs_dir_entry de;
1705 struct reiserfs_de_head *deh;
1706 __u32 hash = DEFAULT_HASH;
1707 __u32 deh_hashval, teahash, r5hash, yurahash;
1709 inode = d_inode(s->s_root);
1711 make_cpu_key(&key, inode, ~0, TYPE_DIRENTRY, 3);
1712 retval = search_by_entry_key(s, &key, &path, &de);
1713 if (retval == IO_ERROR) {
1714 pathrelse(&path);
1715 return UNSET_HASH;
1717 if (retval == NAME_NOT_FOUND)
1718 de.de_entry_num--;
1720 set_de_name_and_namelen(&de);
1721 deh = de.de_deh + de.de_entry_num;
1723 if (deh_offset(deh) == DOT_DOT_OFFSET) {
1724 /* allow override in this case */
1725 if (reiserfs_rupasov_hash(s))
1726 hash = YURA_HASH;
1727 reiserfs_info(s, "FS seems to be empty, autodetect is using the default hash\n");
1728 goto out;
1731 deh_hashval = GET_HASH_VALUE(deh_offset(deh));
1732 r5hash = GET_HASH_VALUE(r5_hash(de.de_name, de.de_namelen));
1733 teahash = GET_HASH_VALUE(keyed_hash(de.de_name, de.de_namelen));
1734 yurahash = GET_HASH_VALUE(yura_hash(de.de_name, de.de_namelen));
1736 if ((teahash == r5hash && deh_hashval == r5hash) ||
1737 (teahash == yurahash && deh_hashval == yurahash) ||
1738 (r5hash == yurahash && deh_hashval == yurahash)) {
1739 reiserfs_warning(s, "reiserfs-2506",
1740 "Unable to automatically detect hash "
1741 "function. Please mount with -o "
1742 "hash={tea,rupasov,r5}");
1743 hash = UNSET_HASH;
1744 goto out;
1747 if (deh_hashval == yurahash)
1748 hash = YURA_HASH;
1749 else if (deh_hashval == teahash)
1750 hash = TEA_HASH;
1751 else if (deh_hashval == r5hash)
1752 hash = R5_HASH;
1753 else {
1754 reiserfs_warning(s, "reiserfs-2506",
1755 "Unrecognised hash function");
1756 hash = UNSET_HASH;
1758 out:
1759 pathrelse(&path);
1760 return hash;
1763 /* finds out which hash names are sorted with */
1764 static int what_hash(struct super_block *s)
1766 __u32 code;
1768 code = sb_hash_function_code(SB_DISK_SUPER_BLOCK(s));
1771 * reiserfs_hash_detect() == true if any of the hash mount options
1772 * were used. We must check them to make sure the user isn't
1773 * using a bad hash value
1775 if (code == UNSET_HASH || reiserfs_hash_detect(s))
1776 code = find_hash_out(s);
1778 if (code != UNSET_HASH && reiserfs_hash_detect(s)) {
1780 * detection has found the hash, and we must check against the
1781 * mount options
1783 if (reiserfs_rupasov_hash(s) && code != YURA_HASH) {
1784 reiserfs_warning(s, "reiserfs-2507",
1785 "Error, %s hash detected, "
1786 "unable to force rupasov hash",
1787 reiserfs_hashname(code));
1788 code = UNSET_HASH;
1789 } else if (reiserfs_tea_hash(s) && code != TEA_HASH) {
1790 reiserfs_warning(s, "reiserfs-2508",
1791 "Error, %s hash detected, "
1792 "unable to force tea hash",
1793 reiserfs_hashname(code));
1794 code = UNSET_HASH;
1795 } else if (reiserfs_r5_hash(s) && code != R5_HASH) {
1796 reiserfs_warning(s, "reiserfs-2509",
1797 "Error, %s hash detected, "
1798 "unable to force r5 hash",
1799 reiserfs_hashname(code));
1800 code = UNSET_HASH;
1802 } else {
1804 * find_hash_out was not called or
1805 * could not determine the hash
1807 if (reiserfs_rupasov_hash(s)) {
1808 code = YURA_HASH;
1809 } else if (reiserfs_tea_hash(s)) {
1810 code = TEA_HASH;
1811 } else if (reiserfs_r5_hash(s)) {
1812 code = R5_HASH;
1817 * if we are mounted RW, and we have a new valid hash code, update
1818 * the super
1820 if (code != UNSET_HASH &&
1821 !(s->s_flags & MS_RDONLY) &&
1822 code != sb_hash_function_code(SB_DISK_SUPER_BLOCK(s))) {
1823 set_sb_hash_function_code(SB_DISK_SUPER_BLOCK(s), code);
1825 return code;
1828 /* return pointer to appropriate function */
1829 static hashf_t hash_function(struct super_block *s)
1831 switch (what_hash(s)) {
1832 case TEA_HASH:
1833 reiserfs_info(s, "Using tea hash to sort names\n");
1834 return keyed_hash;
1835 case YURA_HASH:
1836 reiserfs_info(s, "Using rupasov hash to sort names\n");
1837 return yura_hash;
1838 case R5_HASH:
1839 reiserfs_info(s, "Using r5 hash to sort names\n");
1840 return r5_hash;
1842 return NULL;
1845 /* this is used to set up correct value for old partitions */
1846 static int function2code(hashf_t func)
1848 if (func == keyed_hash)
1849 return TEA_HASH;
1850 if (func == yura_hash)
1851 return YURA_HASH;
1852 if (func == r5_hash)
1853 return R5_HASH;
1855 BUG(); /* should never happen */
1857 return 0;
/*
 * Emit a reiserfs warning unless @silent is set.
 *
 * Wrapped in do { } while (0) so that the macro behaves like a single
 * statement: a bare "if" here would capture the "else" of an enclosing
 * unbraced if/else at the call site.
 */
#define SWARN(silent, s, id, ...)				\
	do {							\
		if (!(silent))					\
			reiserfs_warning(s, id, __VA_ARGS__);	\
	} while (0)
1864 static int reiserfs_fill_super(struct super_block *s, void *data, int silent)
1866 struct inode *root_inode;
1867 struct reiserfs_transaction_handle th;
1868 int old_format = 0;
1869 unsigned long blocks;
1870 unsigned int commit_max_age = 0;
1871 int jinit_done = 0;
1872 struct reiserfs_iget_args args;
1873 struct reiserfs_super_block *rs;
1874 char *jdev_name;
1875 struct reiserfs_sb_info *sbi;
1876 int errval = -EINVAL;
1877 char *qf_names[REISERFS_MAXQUOTAS] = {};
1878 unsigned int qfmt = 0;
1880 save_mount_options(s, data);
1882 sbi = kzalloc(sizeof(struct reiserfs_sb_info), GFP_KERNEL);
1883 if (!sbi)
1884 return -ENOMEM;
1885 s->s_fs_info = sbi;
1886 /* Set default values for options: non-aggressive tails, RO on errors */
1887 sbi->s_mount_opt |= (1 << REISERFS_SMALLTAIL);
1888 sbi->s_mount_opt |= (1 << REISERFS_ERROR_RO);
1889 sbi->s_mount_opt |= (1 << REISERFS_BARRIER_FLUSH);
1890 /* no preallocation minimum, be smart in reiserfs_file_write instead */
1891 sbi->s_alloc_options.preallocmin = 0;
1892 /* Preallocate by 16 blocks (17-1) at once */
1893 sbi->s_alloc_options.preallocsize = 17;
1894 /* setup default block allocator options */
1895 reiserfs_init_alloc_options(s);
1897 spin_lock_init(&sbi->old_work_lock);
1898 INIT_DELAYED_WORK(&sbi->old_work, flush_old_commits);
1899 mutex_init(&sbi->lock);
1900 sbi->lock_depth = -1;
1902 sbi->commit_wq = alloc_workqueue("reiserfs/%s", WQ_MEM_RECLAIM, 0,
1903 s->s_id);
1904 if (!sbi->commit_wq) {
1905 SWARN(silent, s, "", "Cannot allocate commit workqueue");
1906 errval = -ENOMEM;
1907 goto error_unlocked;
1910 jdev_name = NULL;
1911 if (reiserfs_parse_options
1912 (s, (char *)data, &sbi->s_mount_opt, &blocks, &jdev_name,
1913 &commit_max_age, qf_names, &qfmt) == 0) {
1914 goto error_unlocked;
1916 if (jdev_name && jdev_name[0]) {
1917 sbi->s_jdev = kstrdup(jdev_name, GFP_KERNEL);
1918 if (!sbi->s_jdev) {
1919 SWARN(silent, s, "", "Cannot allocate memory for "
1920 "journal device name");
1921 goto error;
1924 #ifdef CONFIG_QUOTA
1925 handle_quota_files(s, qf_names, &qfmt);
1926 #endif
1928 if (blocks) {
1929 SWARN(silent, s, "jmacd-7", "resize option for remount only");
1930 goto error_unlocked;
1934 * try old format (undistributed bitmap, super block in 8-th 1k
1935 * block of a device)
1937 if (!read_super_block(s, REISERFS_OLD_DISK_OFFSET_IN_BYTES))
1938 old_format = 1;
1941 * try new format (64-th 1k block), which can contain reiserfs
1942 * super block
1944 else if (read_super_block(s, REISERFS_DISK_OFFSET_IN_BYTES)) {
1945 SWARN(silent, s, "sh-2021", "can not find reiserfs on %s",
1946 s->s_id);
1947 goto error_unlocked;
1950 rs = SB_DISK_SUPER_BLOCK(s);
1952 * Let's do basic sanity check to verify that underlying device is not
1953 * smaller than the filesystem. If the check fails then abort and
1954 * scream, because bad stuff will happen otherwise.
1956 if (s->s_bdev && s->s_bdev->bd_inode
1957 && i_size_read(s->s_bdev->bd_inode) <
1958 sb_block_count(rs) * sb_blocksize(rs)) {
1959 SWARN(silent, s, "", "Filesystem cannot be "
1960 "mounted because it is bigger than the device");
1961 SWARN(silent, s, "", "You may need to run fsck "
1962 "or increase size of your LVM partition");
1963 SWARN(silent, s, "", "Or may be you forgot to "
1964 "reboot after fdisk when it told you to");
1965 goto error_unlocked;
1968 sbi->s_mount_state = SB_REISERFS_STATE(s);
1969 sbi->s_mount_state = REISERFS_VALID_FS;
1971 if ((errval = reiserfs_init_bitmap_cache(s))) {
1972 SWARN(silent, s, "jmacd-8", "unable to read bitmap");
1973 goto error_unlocked;
1976 errval = -EINVAL;
1977 #ifdef CONFIG_REISERFS_CHECK
1978 SWARN(silent, s, "", "CONFIG_REISERFS_CHECK is set ON");
1979 SWARN(silent, s, "", "- it is slow mode for debugging.");
1980 #endif
1982 /* make data=ordered the default */
1983 if (!reiserfs_data_log(s) && !reiserfs_data_ordered(s) &&
1984 !reiserfs_data_writeback(s)) {
1985 sbi->s_mount_opt |= (1 << REISERFS_DATA_ORDERED);
1988 if (reiserfs_data_log(s)) {
1989 reiserfs_info(s, "using journaled data mode\n");
1990 } else if (reiserfs_data_ordered(s)) {
1991 reiserfs_info(s, "using ordered data mode\n");
1992 } else {
1993 reiserfs_info(s, "using writeback data mode\n");
1995 if (reiserfs_barrier_flush(s)) {
1996 printk("reiserfs: using flush barriers\n");
1999 if (journal_init(s, jdev_name, old_format, commit_max_age)) {
2000 SWARN(silent, s, "sh-2022",
2001 "unable to initialize journal space");
2002 goto error_unlocked;
2003 } else {
2005 * once this is set, journal_release must be called
2006 * if we error out of the mount
2008 jinit_done = 1;
2011 if (reread_meta_blocks(s)) {
2012 SWARN(silent, s, "jmacd-9",
2013 "unable to reread meta blocks after journal init");
2014 goto error_unlocked;
2017 if (replay_only(s))
2018 goto error_unlocked;
2020 if (bdev_read_only(s->s_bdev) && !(s->s_flags & MS_RDONLY)) {
2021 SWARN(silent, s, "clm-7000",
2022 "Detected readonly device, marking FS readonly");
2023 s->s_flags |= MS_RDONLY;
2025 args.objectid = REISERFS_ROOT_OBJECTID;
2026 args.dirid = REISERFS_ROOT_PARENT_OBJECTID;
2027 root_inode =
2028 iget5_locked(s, REISERFS_ROOT_OBJECTID, reiserfs_find_actor,
2029 reiserfs_init_locked_inode, (void *)&args);
2030 if (!root_inode) {
2031 SWARN(silent, s, "jmacd-10", "get root inode failed");
2032 goto error_unlocked;
2036 * This path assumed to be called with the BKL in the old times.
2037 * Now we have inherited the big reiserfs lock from it and many
2038 * reiserfs helpers called in the mount path and elsewhere require
2039 * this lock to be held even if it's not always necessary. Let's be
2040 * conservative and hold it early. The window can be reduced after
2041 * careful review of the code.
2043 reiserfs_write_lock(s);
2045 if (root_inode->i_state & I_NEW) {
2046 reiserfs_read_locked_inode(root_inode, &args);
2047 unlock_new_inode(root_inode);
2050 s->s_root = d_make_root(root_inode);
2051 if (!s->s_root)
2052 goto error;
2053 /* define and initialize hash function */
2054 sbi->s_hash_function = hash_function(s);
2055 if (sbi->s_hash_function == NULL) {
2056 dput(s->s_root);
2057 s->s_root = NULL;
2058 goto error;
2061 if (is_reiserfs_3_5(rs)
2062 || (is_reiserfs_jr(rs) && SB_VERSION(s) == REISERFS_VERSION_1))
2063 set_bit(REISERFS_3_5, &sbi->s_properties);
2064 else if (old_format)
2065 set_bit(REISERFS_OLD_FORMAT, &sbi->s_properties);
2066 else
2067 set_bit(REISERFS_3_6, &sbi->s_properties);
2069 if (!(s->s_flags & MS_RDONLY)) {
2071 errval = journal_begin(&th, s, 1);
2072 if (errval) {
2073 dput(s->s_root);
2074 s->s_root = NULL;
2075 goto error;
2077 reiserfs_prepare_for_journal(s, SB_BUFFER_WITH_SB(s), 1);
2079 set_sb_umount_state(rs, REISERFS_ERROR_FS);
2080 set_sb_fs_state(rs, 0);
2083 * Clear out s_bmap_nr if it would wrap. We can handle this
2084 * case, but older revisions can't. This will cause the
2085 * file system to fail mount on those older implementations,
2086 * avoiding corruption. -jeffm
2088 if (bmap_would_wrap(reiserfs_bmap_count(s)) &&
2089 sb_bmap_nr(rs) != 0) {
2090 reiserfs_warning(s, "super-2030", "This file system "
2091 "claims to use %u bitmap blocks in "
2092 "its super block, but requires %u. "
2093 "Clearing to zero.", sb_bmap_nr(rs),
2094 reiserfs_bmap_count(s));
2096 set_sb_bmap_nr(rs, 0);
2099 if (old_format_only(s)) {
2101 * filesystem of format 3.5 either with standard
2102 * or non-standard journal
2104 if (convert_reiserfs(s)) {
2105 /* and -o conv is given */
2106 if (!silent)
2107 reiserfs_info(s,
2108 "converting 3.5 filesystem to the 3.6 format");
2110 if (is_reiserfs_3_5(rs))
2112 * put magic string of 3.6 format.
2113 * 2.2 will not be able to
2114 * mount this filesystem anymore
2116 memcpy(rs->s_v1.s_magic,
2117 reiserfs_3_6_magic_string,
2118 sizeof
2119 (reiserfs_3_6_magic_string));
2121 set_sb_version(rs, REISERFS_VERSION_2);
2122 reiserfs_convert_objectid_map_v1(s);
2123 set_bit(REISERFS_3_6, &sbi->s_properties);
2124 clear_bit(REISERFS_3_5, &sbi->s_properties);
2125 } else if (!silent) {
2126 reiserfs_info(s, "using 3.5.x disk format\n");
2128 } else
2129 set_sb_mnt_count(rs, sb_mnt_count(rs) + 1);
2132 journal_mark_dirty(&th, SB_BUFFER_WITH_SB(s));
2133 errval = journal_end(&th);
2134 if (errval) {
2135 dput(s->s_root);
2136 s->s_root = NULL;
2137 goto error;
2140 reiserfs_write_unlock(s);
2141 if ((errval = reiserfs_lookup_privroot(s)) ||
2142 (errval = reiserfs_xattr_init(s, s->s_flags))) {
2143 dput(s->s_root);
2144 s->s_root = NULL;
2145 goto error_unlocked;
2147 reiserfs_write_lock(s);
2150 * look for files which were to be removed in previous session
2152 finish_unfinished(s);
2153 } else {
2154 if (old_format_only(s) && !silent) {
2155 reiserfs_info(s, "using 3.5.x disk format\n");
2158 reiserfs_write_unlock(s);
2159 if ((errval = reiserfs_lookup_privroot(s)) ||
2160 (errval = reiserfs_xattr_init(s, s->s_flags))) {
2161 dput(s->s_root);
2162 s->s_root = NULL;
2163 goto error_unlocked;
2165 reiserfs_write_lock(s);
2168 * mark hash in super block: it could be unset. overwrite should be ok
2170 set_sb_hash_function_code(rs, function2code(sbi->s_hash_function));
2172 handle_attrs(s);
2174 reiserfs_proc_info_init(s);
2176 init_waitqueue_head(&(sbi->s_wait));
2177 spin_lock_init(&sbi->bitmap_lock);
2179 reiserfs_write_unlock(s);
2181 return (0);
2183 error:
2184 reiserfs_write_unlock(s);
2186 error_unlocked:
2187 /* kill the commit thread, free journal ram */
2188 if (jinit_done) {
2189 reiserfs_write_lock(s);
2190 journal_release_error(NULL, s);
2191 reiserfs_write_unlock(s);
2194 if (sbi->commit_wq)
2195 destroy_workqueue(sbi->commit_wq);
2197 cancel_delayed_work_sync(&REISERFS_SB(s)->old_work);
2199 reiserfs_free_bitmap_cache(s);
2200 if (SB_BUFFER_WITH_SB(s))
2201 brelse(SB_BUFFER_WITH_SB(s));
2202 #ifdef CONFIG_QUOTA
2204 int j;
2205 for (j = 0; j < REISERFS_MAXQUOTAS; j++)
2206 kfree(qf_names[j]);
2208 #endif
2209 kfree(sbi);
2211 s->s_fs_info = NULL;
2212 return errval;
2215 static int reiserfs_statfs(struct dentry *dentry, struct kstatfs *buf)
2217 struct reiserfs_super_block *rs = SB_DISK_SUPER_BLOCK(dentry->d_sb);
2219 buf->f_namelen = (REISERFS_MAX_NAME(s->s_blocksize));
2220 buf->f_bfree = sb_free_blocks(rs);
2221 buf->f_bavail = buf->f_bfree;
2222 buf->f_blocks = sb_block_count(rs) - sb_bmap_nr(rs) - 1;
2223 buf->f_bsize = dentry->d_sb->s_blocksize;
2224 /* changed to accommodate gcc folks. */
2225 buf->f_type = REISERFS_SUPER_MAGIC;
2226 buf->f_fsid.val[0] = (u32)crc32_le(0, rs->s_uuid, sizeof(rs->s_uuid)/2);
2227 buf->f_fsid.val[1] = (u32)crc32_le(0, rs->s_uuid + sizeof(rs->s_uuid)/2,
2228 sizeof(rs->s_uuid)/2);
2230 return 0;
2233 #ifdef CONFIG_QUOTA
2234 static int reiserfs_write_dquot(struct dquot *dquot)
2236 struct reiserfs_transaction_handle th;
2237 int ret, err;
2238 int depth;
2240 reiserfs_write_lock(dquot->dq_sb);
2241 ret =
2242 journal_begin(&th, dquot->dq_sb,
2243 REISERFS_QUOTA_TRANS_BLOCKS(dquot->dq_sb));
2244 if (ret)
2245 goto out;
2246 depth = reiserfs_write_unlock_nested(dquot->dq_sb);
2247 ret = dquot_commit(dquot);
2248 reiserfs_write_lock_nested(dquot->dq_sb, depth);
2249 err = journal_end(&th);
2250 if (!ret && err)
2251 ret = err;
2252 out:
2253 reiserfs_write_unlock(dquot->dq_sb);
2254 return ret;
2257 static int reiserfs_acquire_dquot(struct dquot *dquot)
2259 struct reiserfs_transaction_handle th;
2260 int ret, err;
2261 int depth;
2263 reiserfs_write_lock(dquot->dq_sb);
2264 ret =
2265 journal_begin(&th, dquot->dq_sb,
2266 REISERFS_QUOTA_INIT_BLOCKS(dquot->dq_sb));
2267 if (ret)
2268 goto out;
2269 depth = reiserfs_write_unlock_nested(dquot->dq_sb);
2270 ret = dquot_acquire(dquot);
2271 reiserfs_write_lock_nested(dquot->dq_sb, depth);
2272 err = journal_end(&th);
2273 if (!ret && err)
2274 ret = err;
2275 out:
2276 reiserfs_write_unlock(dquot->dq_sb);
2277 return ret;
2280 static int reiserfs_release_dquot(struct dquot *dquot)
2282 struct reiserfs_transaction_handle th;
2283 int ret, err;
2285 reiserfs_write_lock(dquot->dq_sb);
2286 ret =
2287 journal_begin(&th, dquot->dq_sb,
2288 REISERFS_QUOTA_DEL_BLOCKS(dquot->dq_sb));
2289 reiserfs_write_unlock(dquot->dq_sb);
2290 if (ret) {
2291 /* Release dquot anyway to avoid endless cycle in dqput() */
2292 dquot_release(dquot);
2293 goto out;
2295 ret = dquot_release(dquot);
2296 reiserfs_write_lock(dquot->dq_sb);
2297 err = journal_end(&th);
2298 if (!ret && err)
2299 ret = err;
2300 reiserfs_write_unlock(dquot->dq_sb);
2301 out:
2302 return ret;
2305 static int reiserfs_mark_dquot_dirty(struct dquot *dquot)
2307 /* Are we journaling quotas? */
2308 if (REISERFS_SB(dquot->dq_sb)->s_qf_names[USRQUOTA] ||
2309 REISERFS_SB(dquot->dq_sb)->s_qf_names[GRPQUOTA]) {
2310 dquot_mark_dquot_dirty(dquot);
2311 return reiserfs_write_dquot(dquot);
2312 } else
2313 return dquot_mark_dquot_dirty(dquot);
2316 static int reiserfs_write_info(struct super_block *sb, int type)
2318 struct reiserfs_transaction_handle th;
2319 int ret, err;
2320 int depth;
2322 /* Data block + inode block */
2323 reiserfs_write_lock(sb);
2324 ret = journal_begin(&th, sb, 2);
2325 if (ret)
2326 goto out;
2327 depth = reiserfs_write_unlock_nested(sb);
2328 ret = dquot_commit_info(sb, type);
2329 reiserfs_write_lock_nested(sb, depth);
2330 err = journal_end(&th);
2331 if (!ret && err)
2332 ret = err;
2333 out:
2334 reiserfs_write_unlock(sb);
2335 return ret;
2339 * Turn on quotas during mount time - we need to find the quota file and such...
2341 static int reiserfs_quota_on_mount(struct super_block *sb, int type)
2343 return dquot_quota_on_mount(sb, REISERFS_SB(sb)->s_qf_names[type],
2344 REISERFS_SB(sb)->s_jquota_fmt, type);
2348 * Standard function to be called on quota_on
2350 static int reiserfs_quota_on(struct super_block *sb, int type, int format_id,
2351 struct path *path)
2353 int err;
2354 struct inode *inode;
2355 struct reiserfs_transaction_handle th;
2356 int opt = type == USRQUOTA ? REISERFS_USRQUOTA : REISERFS_GRPQUOTA;
2358 reiserfs_write_lock(sb);
2359 if (!(REISERFS_SB(sb)->s_mount_opt & (1 << opt))) {
2360 err = -EINVAL;
2361 goto out;
2364 /* Quotafile not on the same filesystem? */
2365 if (path->dentry->d_sb != sb) {
2366 err = -EXDEV;
2367 goto out;
2369 inode = d_inode(path->dentry);
2371 * We must not pack tails for quota files on reiserfs for quota
2372 * IO to work
2374 if (!(REISERFS_I(inode)->i_flags & i_nopack_mask)) {
2375 err = reiserfs_unpack(inode, NULL);
2376 if (err) {
2377 reiserfs_warning(sb, "super-6520",
2378 "Unpacking tail of quota file failed"
2379 " (%d). Cannot turn on quotas.", err);
2380 err = -EINVAL;
2381 goto out;
2383 mark_inode_dirty(inode);
2385 /* Journaling quota? */
2386 if (REISERFS_SB(sb)->s_qf_names[type]) {
2387 /* Quotafile not of fs root? */
2388 if (path->dentry->d_parent != sb->s_root)
2389 reiserfs_warning(sb, "super-6521",
2390 "Quota file not on filesystem root. "
2391 "Journalled quota will not work.");
2395 * When we journal data on quota file, we have to flush journal to see
2396 * all updates to the file when we bypass pagecache...
2398 if (reiserfs_file_data_log(inode)) {
2399 /* Just start temporary transaction and finish it */
2400 err = journal_begin(&th, sb, 1);
2401 if (err)
2402 goto out;
2403 err = journal_end_sync(&th);
2404 if (err)
2405 goto out;
2407 reiserfs_write_unlock(sb);
2408 return dquot_quota_on(sb, type, format_id, path);
2409 out:
2410 reiserfs_write_unlock(sb);
2411 return err;
2415 * Read data from quotafile - avoid pagecache and such because we cannot afford
2416 * acquiring the locks... As quota files are never truncated and quota code
2417 * itself serializes the operations (and no one else should touch the files)
2418 * we don't have to be afraid of races
2420 static ssize_t reiserfs_quota_read(struct super_block *sb, int type, char *data,
2421 size_t len, loff_t off)
2423 struct inode *inode = sb_dqopt(sb)->files[type];
2424 unsigned long blk = off >> sb->s_blocksize_bits;
2425 int err = 0, offset = off & (sb->s_blocksize - 1), tocopy;
2426 size_t toread;
2427 struct buffer_head tmp_bh, *bh;
2428 loff_t i_size = i_size_read(inode);
2430 if (off > i_size)
2431 return 0;
2432 if (off + len > i_size)
2433 len = i_size - off;
2434 toread = len;
2435 while (toread > 0) {
2436 tocopy =
2437 sb->s_blocksize - offset <
2438 toread ? sb->s_blocksize - offset : toread;
2439 tmp_bh.b_state = 0;
2441 * Quota files are without tails so we can safely
2442 * use this function
2444 reiserfs_write_lock(sb);
2445 err = reiserfs_get_block(inode, blk, &tmp_bh, 0);
2446 reiserfs_write_unlock(sb);
2447 if (err)
2448 return err;
2449 if (!buffer_mapped(&tmp_bh)) /* A hole? */
2450 memset(data, 0, tocopy);
2451 else {
2452 bh = sb_bread(sb, tmp_bh.b_blocknr);
2453 if (!bh)
2454 return -EIO;
2455 memcpy(data, bh->b_data + offset, tocopy);
2456 brelse(bh);
2458 offset = 0;
2459 toread -= tocopy;
2460 data += tocopy;
2461 blk++;
2463 return len;
2467 * Write to quotafile (we know the transaction is already started and has
2468 * enough credits)
2470 static ssize_t reiserfs_quota_write(struct super_block *sb, int type,
2471 const char *data, size_t len, loff_t off)
2473 struct inode *inode = sb_dqopt(sb)->files[type];
2474 unsigned long blk = off >> sb->s_blocksize_bits;
2475 int err = 0, offset = off & (sb->s_blocksize - 1), tocopy;
2476 int journal_quota = REISERFS_SB(sb)->s_qf_names[type] != NULL;
2477 size_t towrite = len;
2478 struct buffer_head tmp_bh, *bh;
2480 if (!current->journal_info) {
2481 printk(KERN_WARNING "reiserfs: Quota write (off=%llu, len=%llu) cancelled because transaction is not started.\n",
2482 (unsigned long long)off, (unsigned long long)len);
2483 return -EIO;
2485 while (towrite > 0) {
2486 tocopy = sb->s_blocksize - offset < towrite ?
2487 sb->s_blocksize - offset : towrite;
2488 tmp_bh.b_state = 0;
2489 reiserfs_write_lock(sb);
2490 err = reiserfs_get_block(inode, blk, &tmp_bh, GET_BLOCK_CREATE);
2491 reiserfs_write_unlock(sb);
2492 if (err)
2493 goto out;
2494 if (offset || tocopy != sb->s_blocksize)
2495 bh = sb_bread(sb, tmp_bh.b_blocknr);
2496 else
2497 bh = sb_getblk(sb, tmp_bh.b_blocknr);
2498 if (!bh) {
2499 err = -EIO;
2500 goto out;
2502 lock_buffer(bh);
2503 memcpy(bh->b_data + offset, data, tocopy);
2504 flush_dcache_page(bh->b_page);
2505 set_buffer_uptodate(bh);
2506 unlock_buffer(bh);
2507 reiserfs_write_lock(sb);
2508 reiserfs_prepare_for_journal(sb, bh, 1);
2509 journal_mark_dirty(current->journal_info, bh);
2510 if (!journal_quota)
2511 reiserfs_add_ordered_list(inode, bh);
2512 reiserfs_write_unlock(sb);
2513 brelse(bh);
2514 offset = 0;
2515 towrite -= tocopy;
2516 data += tocopy;
2517 blk++;
2519 out:
2520 if (len == towrite)
2521 return err;
2522 if (inode->i_size < off + len - towrite)
2523 i_size_write(inode, off + len - towrite);
2524 inode->i_version++;
2525 inode->i_mtime = inode->i_ctime = current_time(inode);
2526 mark_inode_dirty(inode);
2527 return len - towrite;
2530 #endif
2532 static struct dentry *get_super_block(struct file_system_type *fs_type,
2533 int flags, const char *dev_name,
2534 void *data)
2536 return mount_bdev(fs_type, flags, dev_name, data, reiserfs_fill_super);
2539 static int __init init_reiserfs_fs(void)
2541 int ret;
2543 ret = init_inodecache();
2544 if (ret)
2545 return ret;
2547 reiserfs_proc_info_global_init();
2549 ret = register_filesystem(&reiserfs_fs_type);
2550 if (ret)
2551 goto out;
2553 return 0;
2554 out:
2555 reiserfs_proc_info_global_done();
2556 destroy_inodecache();
2558 return ret;
2561 static void __exit exit_reiserfs_fs(void)
2563 reiserfs_proc_info_global_done();
2564 unregister_filesystem(&reiserfs_fs_type);
2565 destroy_inodecache();
2568 struct file_system_type reiserfs_fs_type = {
2569 .owner = THIS_MODULE,
2570 .name = "reiserfs",
2571 .mount = get_super_block,
2572 .kill_sb = reiserfs_kill_sb,
2573 .fs_flags = FS_REQUIRES_DEV,
2575 MODULE_ALIAS_FS("reiserfs");
2577 MODULE_DESCRIPTION("ReiserFS journaled filesystem");
2578 MODULE_AUTHOR("Hans Reiser <reiser@namesys.com>");
2579 MODULE_LICENSE("GPL");
2581 module_init(init_reiserfs_fs);
2582 module_exit(exit_reiserfs_fs);