libceph: redo callbacks and factor out MOSDOpReply decoding
[linux/fpc-iii.git] / fs / ubifs / dir.c
blob795992a8321e9e0c9531c92f97c91cc10835cc02
1 /* * This file is part of UBIFS.
3 * Copyright (C) 2006-2008 Nokia Corporation.
4 * Copyright (C) 2006, 2007 University of Szeged, Hungary
6 * This program is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU General Public License version 2 as published by
8 * the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but WITHOUT
11 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
12 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
13 * more details.
15 * You should have received a copy of the GNU General Public License along with
16 * this program; if not, write to the Free Software Foundation, Inc., 51
17 * Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
19 * Authors: Artem Bityutskiy (Битюцкий Артём)
20 * Adrian Hunter
21 * Zoltan Sogor
25 * This file implements directory operations.
27 * All FS operations in this file allocate budget before writing anything to the
28 * media. If they fail to allocate it, the error is returned. The only
29 * exceptions are 'ubifs_unlink()' and 'ubifs_rmdir()' which keep working even
30 * if they unable to allocate the budget, because deletion %-ENOSPC failure is
31 * not what users are usually ready to get. UBIFS budgeting subsystem has some
32 * space reserved for these purposes.
34 * All operations in this file write all inodes which they change straight
35 * away, instead of marking them dirty. For example, 'ubifs_link()' changes
36 * @i_size of the parent inode and writes the parent inode together with the
37 * target inode. This was done to simplify file-system recovery which would
38 * otherwise be very difficult to do. The only exception is rename which marks
39 * the re-named inode dirty (because its @i_ctime is updated) but does not
40 * write it, but just marks it as dirty.
43 #include "ubifs.h"
45 /**
46 * inherit_flags - inherit flags of the parent inode.
47 * @dir: parent inode
48 * @mode: new inode mode flags
50 * This is a helper function for 'ubifs_new_inode()' which inherits flag of the
51 * parent directory inode @dir. UBIFS inodes inherit the following flags:
52 * o %UBIFS_COMPR_FL, which is useful to switch compression on/of on
53 * sub-directory basis;
54 * o %UBIFS_SYNC_FL - useful for the same reasons;
55 * o %UBIFS_DIRSYNC_FL - similar, but relevant only to directories.
57 * This function returns the inherited flags.
59 static int inherit_flags(const struct inode *dir, umode_t mode)
61 int flags;
62 const struct ubifs_inode *ui = ubifs_inode(dir);
64 if (!S_ISDIR(dir->i_mode))
66 * The parent is not a directory, which means that an extended
67 * attribute inode is being created. No flags.
69 return 0;
71 flags = ui->flags & (UBIFS_COMPR_FL | UBIFS_SYNC_FL | UBIFS_DIRSYNC_FL);
72 if (!S_ISDIR(mode))
73 /* The "DIRSYNC" flag only applies to directories */
74 flags &= ~UBIFS_DIRSYNC_FL;
75 return flags;
78 /**
79 * ubifs_new_inode - allocate new UBIFS inode object.
80 * @c: UBIFS file-system description object
81 * @dir: parent directory inode
82 * @mode: inode mode flags
84 * This function finds an unused inode number, allocates new inode and
85 * initializes it. Returns new inode in case of success and an error code in
86 * case of failure.
88 struct inode *ubifs_new_inode(struct ubifs_info *c, const struct inode *dir,
89 umode_t mode)
91 struct inode *inode;
92 struct ubifs_inode *ui;
94 inode = new_inode(c->vfs_sb);
95 ui = ubifs_inode(inode);
96 if (!inode)
97 return ERR_PTR(-ENOMEM);
100 * Set 'S_NOCMTIME' to prevent VFS form updating [mc]time of inodes and
101 * marking them dirty in file write path (see 'file_update_time()').
102 * UBIFS has to fully control "clean <-> dirty" transitions of inodes
103 * to make budgeting work.
105 inode->i_flags |= S_NOCMTIME;
107 inode_init_owner(inode, dir, mode);
108 inode->i_mtime = inode->i_atime = inode->i_ctime =
109 ubifs_current_time(inode);
110 inode->i_mapping->nrpages = 0;
112 switch (mode & S_IFMT) {
113 case S_IFREG:
114 inode->i_mapping->a_ops = &ubifs_file_address_operations;
115 inode->i_op = &ubifs_file_inode_operations;
116 inode->i_fop = &ubifs_file_operations;
117 break;
118 case S_IFDIR:
119 inode->i_op = &ubifs_dir_inode_operations;
120 inode->i_fop = &ubifs_dir_operations;
121 inode->i_size = ui->ui_size = UBIFS_INO_NODE_SZ;
122 break;
123 case S_IFLNK:
124 inode->i_op = &ubifs_symlink_inode_operations;
125 break;
126 case S_IFSOCK:
127 case S_IFIFO:
128 case S_IFBLK:
129 case S_IFCHR:
130 inode->i_op = &ubifs_file_inode_operations;
131 break;
132 default:
133 BUG();
136 ui->flags = inherit_flags(dir, mode);
137 ubifs_set_inode_flags(inode);
138 if (S_ISREG(mode))
139 ui->compr_type = c->default_compr;
140 else
141 ui->compr_type = UBIFS_COMPR_NONE;
142 ui->synced_i_size = 0;
144 spin_lock(&c->cnt_lock);
145 /* Inode number overflow is currently not supported */
146 if (c->highest_inum >= INUM_WARN_WATERMARK) {
147 if (c->highest_inum >= INUM_WATERMARK) {
148 spin_unlock(&c->cnt_lock);
149 ubifs_err(c, "out of inode numbers");
150 make_bad_inode(inode);
151 iput(inode);
152 return ERR_PTR(-EINVAL);
154 ubifs_warn(c, "running out of inode numbers (current %lu, max %u)",
155 (unsigned long)c->highest_inum, INUM_WATERMARK);
158 inode->i_ino = ++c->highest_inum;
160 * The creation sequence number remains with this inode for its
161 * lifetime. All nodes for this inode have a greater sequence number,
162 * and so it is possible to distinguish obsolete nodes belonging to a
163 * previous incarnation of the same inode number - for example, for the
164 * purpose of rebuilding the index.
166 ui->creat_sqnum = ++c->max_sqnum;
167 spin_unlock(&c->cnt_lock);
168 return inode;
171 static int dbg_check_name(const struct ubifs_info *c,
172 const struct ubifs_dent_node *dent,
173 const struct qstr *nm)
175 if (!dbg_is_chk_gen(c))
176 return 0;
177 if (le16_to_cpu(dent->nlen) != nm->len)
178 return -EINVAL;
179 if (memcmp(dent->name, nm->name, nm->len))
180 return -EINVAL;
181 return 0;
184 static struct dentry *ubifs_lookup(struct inode *dir, struct dentry *dentry,
185 unsigned int flags)
187 int err;
188 union ubifs_key key;
189 struct inode *inode = NULL;
190 struct ubifs_dent_node *dent;
191 struct ubifs_info *c = dir->i_sb->s_fs_info;
193 dbg_gen("'%pd' in dir ino %lu", dentry, dir->i_ino);
195 if (dentry->d_name.len > UBIFS_MAX_NLEN)
196 return ERR_PTR(-ENAMETOOLONG);
198 dent = kmalloc(UBIFS_MAX_DENT_NODE_SZ, GFP_NOFS);
199 if (!dent)
200 return ERR_PTR(-ENOMEM);
202 dent_key_init(c, &key, dir->i_ino, &dentry->d_name);
204 err = ubifs_tnc_lookup_nm(c, &key, dent, &dentry->d_name);
205 if (err) {
206 if (err == -ENOENT) {
207 dbg_gen("not found");
208 goto done;
210 goto out;
213 if (dbg_check_name(c, dent, &dentry->d_name)) {
214 err = -EINVAL;
215 goto out;
218 inode = ubifs_iget(dir->i_sb, le64_to_cpu(dent->inum));
219 if (IS_ERR(inode)) {
221 * This should not happen. Probably the file-system needs
222 * checking.
224 err = PTR_ERR(inode);
225 ubifs_err(c, "dead directory entry '%pd', error %d",
226 dentry, err);
227 ubifs_ro_mode(c, err);
228 goto out;
231 done:
232 kfree(dent);
234 * Note, d_splice_alias() would be required instead if we supported
235 * NFS.
237 d_add(dentry, inode);
238 return NULL;
240 out:
241 kfree(dent);
242 return ERR_PTR(err);
245 static int ubifs_create(struct inode *dir, struct dentry *dentry, umode_t mode,
246 bool excl)
248 struct inode *inode;
249 struct ubifs_info *c = dir->i_sb->s_fs_info;
250 int err, sz_change = CALC_DENT_SIZE(dentry->d_name.len);
251 struct ubifs_budget_req req = { .new_ino = 1, .new_dent = 1,
252 .dirtied_ino = 1 };
253 struct ubifs_inode *dir_ui = ubifs_inode(dir);
256 * Budget request settings: new inode, new direntry, changing the
257 * parent directory inode.
260 dbg_gen("dent '%pd', mode %#hx in dir ino %lu",
261 dentry, mode, dir->i_ino);
263 err = ubifs_budget_space(c, &req);
264 if (err)
265 return err;
267 inode = ubifs_new_inode(c, dir, mode);
268 if (IS_ERR(inode)) {
269 err = PTR_ERR(inode);
270 goto out_budg;
273 err = ubifs_init_security(dir, inode, &dentry->d_name);
274 if (err)
275 goto out_inode;
277 mutex_lock(&dir_ui->ui_mutex);
278 dir->i_size += sz_change;
279 dir_ui->ui_size = dir->i_size;
280 dir->i_mtime = dir->i_ctime = inode->i_ctime;
281 err = ubifs_jnl_update(c, dir, &dentry->d_name, inode, 0, 0);
282 if (err)
283 goto out_cancel;
284 mutex_unlock(&dir_ui->ui_mutex);
286 ubifs_release_budget(c, &req);
287 insert_inode_hash(inode);
288 d_instantiate(dentry, inode);
289 return 0;
291 out_cancel:
292 dir->i_size -= sz_change;
293 dir_ui->ui_size = dir->i_size;
294 mutex_unlock(&dir_ui->ui_mutex);
295 out_inode:
296 make_bad_inode(inode);
297 iput(inode);
298 out_budg:
299 ubifs_release_budget(c, &req);
300 ubifs_err(c, "cannot create regular file, error %d", err);
301 return err;
305 * vfs_dent_type - get VFS directory entry type.
306 * @type: UBIFS directory entry type
308 * This function converts UBIFS directory entry type into VFS directory entry
309 * type.
311 static unsigned int vfs_dent_type(uint8_t type)
313 switch (type) {
314 case UBIFS_ITYPE_REG:
315 return DT_REG;
316 case UBIFS_ITYPE_DIR:
317 return DT_DIR;
318 case UBIFS_ITYPE_LNK:
319 return DT_LNK;
320 case UBIFS_ITYPE_BLK:
321 return DT_BLK;
322 case UBIFS_ITYPE_CHR:
323 return DT_CHR;
324 case UBIFS_ITYPE_FIFO:
325 return DT_FIFO;
326 case UBIFS_ITYPE_SOCK:
327 return DT_SOCK;
328 default:
329 BUG();
331 return 0;
335 * The classical Unix view for directory is that it is a linear array of
336 * (name, inode number) entries. Linux/VFS assumes this model as well.
337 * Particularly, 'readdir()' call wants us to return a directory entry offset
338 * which later may be used to continue 'readdir()'ing the directory or to
339 * 'seek()' to that specific direntry. Obviously UBIFS does not really fit this
340 * model because directory entries are identified by keys, which may collide.
342 * UBIFS uses directory entry hash value for directory offsets, so
343 * 'seekdir()'/'telldir()' may not always work because of possible key
344 * collisions. But UBIFS guarantees that consecutive 'readdir()' calls work
345 * properly by means of saving full directory entry name in the private field
346 * of the file description object.
348 * This means that UBIFS cannot support NFS which requires full
349 * 'seekdir()'/'telldir()' support.
351 static int ubifs_readdir(struct file *file, struct dir_context *ctx)
353 int err;
354 struct qstr nm;
355 union ubifs_key key;
356 struct ubifs_dent_node *dent;
357 struct inode *dir = file_inode(file);
358 struct ubifs_info *c = dir->i_sb->s_fs_info;
360 dbg_gen("dir ino %lu, f_pos %#llx", dir->i_ino, ctx->pos);
362 if (ctx->pos > UBIFS_S_KEY_HASH_MASK || ctx->pos == 2)
364 * The directory was seek'ed to a senseless position or there
365 * are no more entries.
367 return 0;
369 if (file->f_version == 0) {
371 * The file was seek'ed, which means that @file->private_data
372 * is now invalid. This may also be just the first
373 * 'ubifs_readdir()' invocation, in which case
374 * @file->private_data is NULL, and the below code is
375 * basically a no-op.
377 kfree(file->private_data);
378 file->private_data = NULL;
382 * 'generic_file_llseek()' unconditionally sets @file->f_version to
383 * zero, and we use this for detecting whether the file was seek'ed.
385 file->f_version = 1;
387 /* File positions 0 and 1 correspond to "." and ".." */
388 if (ctx->pos < 2) {
389 ubifs_assert(!file->private_data);
390 if (!dir_emit_dots(file, ctx))
391 return 0;
393 /* Find the first entry in TNC and save it */
394 lowest_dent_key(c, &key, dir->i_ino);
395 nm.name = NULL;
396 dent = ubifs_tnc_next_ent(c, &key, &nm);
397 if (IS_ERR(dent)) {
398 err = PTR_ERR(dent);
399 goto out;
402 ctx->pos = key_hash_flash(c, &dent->key);
403 file->private_data = dent;
406 dent = file->private_data;
407 if (!dent) {
409 * The directory was seek'ed to and is now readdir'ed.
410 * Find the entry corresponding to @ctx->pos or the closest one.
412 dent_key_init_hash(c, &key, dir->i_ino, ctx->pos);
413 nm.name = NULL;
414 dent = ubifs_tnc_next_ent(c, &key, &nm);
415 if (IS_ERR(dent)) {
416 err = PTR_ERR(dent);
417 goto out;
419 ctx->pos = key_hash_flash(c, &dent->key);
420 file->private_data = dent;
423 while (1) {
424 dbg_gen("feed '%s', ino %llu, new f_pos %#x",
425 dent->name, (unsigned long long)le64_to_cpu(dent->inum),
426 key_hash_flash(c, &dent->key));
427 ubifs_assert(le64_to_cpu(dent->ch.sqnum) >
428 ubifs_inode(dir)->creat_sqnum);
430 nm.len = le16_to_cpu(dent->nlen);
431 if (!dir_emit(ctx, dent->name, nm.len,
432 le64_to_cpu(dent->inum),
433 vfs_dent_type(dent->type)))
434 return 0;
436 /* Switch to the next entry */
437 key_read(c, &dent->key, &key);
438 nm.name = dent->name;
439 dent = ubifs_tnc_next_ent(c, &key, &nm);
440 if (IS_ERR(dent)) {
441 err = PTR_ERR(dent);
442 goto out;
445 kfree(file->private_data);
446 ctx->pos = key_hash_flash(c, &dent->key);
447 file->private_data = dent;
448 cond_resched();
451 out:
452 kfree(file->private_data);
453 file->private_data = NULL;
455 if (err != -ENOENT) {
456 ubifs_err(c, "cannot find next direntry, error %d", err);
457 return err;
460 /* 2 is a special value indicating that there are no more direntries */
461 ctx->pos = 2;
462 return 0;
465 /* Free saved readdir() state when the directory is closed */
466 static int ubifs_dir_release(struct inode *dir, struct file *file)
468 kfree(file->private_data);
469 file->private_data = NULL;
470 return 0;
474 * lock_2_inodes - a wrapper for locking two UBIFS inodes.
475 * @inode1: first inode
476 * @inode2: second inode
478 * We do not implement any tricks to guarantee strict lock ordering, because
479 * VFS has already done it for us on the @i_mutex. So this is just a simple
480 * wrapper function.
482 static void lock_2_inodes(struct inode *inode1, struct inode *inode2)
484 mutex_lock_nested(&ubifs_inode(inode1)->ui_mutex, WB_MUTEX_1);
485 mutex_lock_nested(&ubifs_inode(inode2)->ui_mutex, WB_MUTEX_2);
489 * unlock_2_inodes - a wrapper for unlocking two UBIFS inodes.
490 * @inode1: first inode
491 * @inode2: second inode
493 static void unlock_2_inodes(struct inode *inode1, struct inode *inode2)
495 mutex_unlock(&ubifs_inode(inode2)->ui_mutex);
496 mutex_unlock(&ubifs_inode(inode1)->ui_mutex);
499 static int ubifs_link(struct dentry *old_dentry, struct inode *dir,
500 struct dentry *dentry)
502 struct ubifs_info *c = dir->i_sb->s_fs_info;
503 struct inode *inode = d_inode(old_dentry);
504 struct ubifs_inode *ui = ubifs_inode(inode);
505 struct ubifs_inode *dir_ui = ubifs_inode(dir);
506 int err, sz_change = CALC_DENT_SIZE(dentry->d_name.len);
507 struct ubifs_budget_req req = { .new_dent = 1, .dirtied_ino = 2,
508 .dirtied_ino_d = ALIGN(ui->data_len, 8) };
511 * Budget request settings: new direntry, changing the target inode,
512 * changing the parent inode.
515 dbg_gen("dent '%pd' to ino %lu (nlink %d) in dir ino %lu",
516 dentry, inode->i_ino,
517 inode->i_nlink, dir->i_ino);
518 ubifs_assert(inode_is_locked(dir));
519 ubifs_assert(inode_is_locked(inode));
521 err = dbg_check_synced_i_size(c, inode);
522 if (err)
523 return err;
525 err = ubifs_budget_space(c, &req);
526 if (err)
527 return err;
529 lock_2_inodes(dir, inode);
530 inc_nlink(inode);
531 ihold(inode);
532 inode->i_ctime = ubifs_current_time(inode);
533 dir->i_size += sz_change;
534 dir_ui->ui_size = dir->i_size;
535 dir->i_mtime = dir->i_ctime = inode->i_ctime;
536 err = ubifs_jnl_update(c, dir, &dentry->d_name, inode, 0, 0);
537 if (err)
538 goto out_cancel;
539 unlock_2_inodes(dir, inode);
541 ubifs_release_budget(c, &req);
542 d_instantiate(dentry, inode);
543 return 0;
545 out_cancel:
546 dir->i_size -= sz_change;
547 dir_ui->ui_size = dir->i_size;
548 drop_nlink(inode);
549 unlock_2_inodes(dir, inode);
550 ubifs_release_budget(c, &req);
551 iput(inode);
552 return err;
555 static int ubifs_unlink(struct inode *dir, struct dentry *dentry)
557 struct ubifs_info *c = dir->i_sb->s_fs_info;
558 struct inode *inode = d_inode(dentry);
559 struct ubifs_inode *dir_ui = ubifs_inode(dir);
560 int sz_change = CALC_DENT_SIZE(dentry->d_name.len);
561 int err, budgeted = 1;
562 struct ubifs_budget_req req = { .mod_dent = 1, .dirtied_ino = 2 };
563 unsigned int saved_nlink = inode->i_nlink;
566 * Budget request settings: deletion direntry, deletion inode (+1 for
567 * @dirtied_ino), changing the parent directory inode. If budgeting
568 * fails, go ahead anyway because we have extra space reserved for
569 * deletions.
572 dbg_gen("dent '%pd' from ino %lu (nlink %d) in dir ino %lu",
573 dentry, inode->i_ino,
574 inode->i_nlink, dir->i_ino);
575 ubifs_assert(inode_is_locked(dir));
576 ubifs_assert(inode_is_locked(inode));
577 err = dbg_check_synced_i_size(c, inode);
578 if (err)
579 return err;
581 err = ubifs_budget_space(c, &req);
582 if (err) {
583 if (err != -ENOSPC)
584 return err;
585 budgeted = 0;
588 lock_2_inodes(dir, inode);
589 inode->i_ctime = ubifs_current_time(dir);
590 drop_nlink(inode);
591 dir->i_size -= sz_change;
592 dir_ui->ui_size = dir->i_size;
593 dir->i_mtime = dir->i_ctime = inode->i_ctime;
594 err = ubifs_jnl_update(c, dir, &dentry->d_name, inode, 1, 0);
595 if (err)
596 goto out_cancel;
597 unlock_2_inodes(dir, inode);
599 if (budgeted)
600 ubifs_release_budget(c, &req);
601 else {
602 /* We've deleted something - clean the "no space" flags */
603 c->bi.nospace = c->bi.nospace_rp = 0;
604 smp_wmb();
606 return 0;
608 out_cancel:
609 dir->i_size += sz_change;
610 dir_ui->ui_size = dir->i_size;
611 set_nlink(inode, saved_nlink);
612 unlock_2_inodes(dir, inode);
613 if (budgeted)
614 ubifs_release_budget(c, &req);
615 return err;
619 * check_dir_empty - check if a directory is empty or not.
620 * @c: UBIFS file-system description object
621 * @dir: VFS inode object of the directory to check
623 * This function checks if directory @dir is empty. Returns zero if the
624 * directory is empty, %-ENOTEMPTY if it is not, and other negative error codes
625 * in case of of errors.
627 static int check_dir_empty(struct ubifs_info *c, struct inode *dir)
629 struct qstr nm = { .name = NULL };
630 struct ubifs_dent_node *dent;
631 union ubifs_key key;
632 int err;
634 lowest_dent_key(c, &key, dir->i_ino);
635 dent = ubifs_tnc_next_ent(c, &key, &nm);
636 if (IS_ERR(dent)) {
637 err = PTR_ERR(dent);
638 if (err == -ENOENT)
639 err = 0;
640 } else {
641 kfree(dent);
642 err = -ENOTEMPTY;
644 return err;
647 static int ubifs_rmdir(struct inode *dir, struct dentry *dentry)
649 struct ubifs_info *c = dir->i_sb->s_fs_info;
650 struct inode *inode = d_inode(dentry);
651 int sz_change = CALC_DENT_SIZE(dentry->d_name.len);
652 int err, budgeted = 1;
653 struct ubifs_inode *dir_ui = ubifs_inode(dir);
654 struct ubifs_budget_req req = { .mod_dent = 1, .dirtied_ino = 2 };
657 * Budget request settings: deletion direntry, deletion inode and
658 * changing the parent inode. If budgeting fails, go ahead anyway
659 * because we have extra space reserved for deletions.
662 dbg_gen("directory '%pd', ino %lu in dir ino %lu", dentry,
663 inode->i_ino, dir->i_ino);
664 ubifs_assert(inode_is_locked(dir));
665 ubifs_assert(inode_is_locked(inode));
666 err = check_dir_empty(c, d_inode(dentry));
667 if (err)
668 return err;
670 err = ubifs_budget_space(c, &req);
671 if (err) {
672 if (err != -ENOSPC)
673 return err;
674 budgeted = 0;
677 lock_2_inodes(dir, inode);
678 inode->i_ctime = ubifs_current_time(dir);
679 clear_nlink(inode);
680 drop_nlink(dir);
681 dir->i_size -= sz_change;
682 dir_ui->ui_size = dir->i_size;
683 dir->i_mtime = dir->i_ctime = inode->i_ctime;
684 err = ubifs_jnl_update(c, dir, &dentry->d_name, inode, 1, 0);
685 if (err)
686 goto out_cancel;
687 unlock_2_inodes(dir, inode);
689 if (budgeted)
690 ubifs_release_budget(c, &req);
691 else {
692 /* We've deleted something - clean the "no space" flags */
693 c->bi.nospace = c->bi.nospace_rp = 0;
694 smp_wmb();
696 return 0;
698 out_cancel:
699 dir->i_size += sz_change;
700 dir_ui->ui_size = dir->i_size;
701 inc_nlink(dir);
702 set_nlink(inode, 2);
703 unlock_2_inodes(dir, inode);
704 if (budgeted)
705 ubifs_release_budget(c, &req);
706 return err;
709 static int ubifs_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode)
711 struct inode *inode;
712 struct ubifs_inode *dir_ui = ubifs_inode(dir);
713 struct ubifs_info *c = dir->i_sb->s_fs_info;
714 int err, sz_change = CALC_DENT_SIZE(dentry->d_name.len);
715 struct ubifs_budget_req req = { .new_ino = 1, .new_dent = 1 };
718 * Budget request settings: new inode, new direntry and changing parent
719 * directory inode.
722 dbg_gen("dent '%pd', mode %#hx in dir ino %lu",
723 dentry, mode, dir->i_ino);
725 err = ubifs_budget_space(c, &req);
726 if (err)
727 return err;
729 inode = ubifs_new_inode(c, dir, S_IFDIR | mode);
730 if (IS_ERR(inode)) {
731 err = PTR_ERR(inode);
732 goto out_budg;
735 err = ubifs_init_security(dir, inode, &dentry->d_name);
736 if (err)
737 goto out_inode;
739 mutex_lock(&dir_ui->ui_mutex);
740 insert_inode_hash(inode);
741 inc_nlink(inode);
742 inc_nlink(dir);
743 dir->i_size += sz_change;
744 dir_ui->ui_size = dir->i_size;
745 dir->i_mtime = dir->i_ctime = inode->i_ctime;
746 err = ubifs_jnl_update(c, dir, &dentry->d_name, inode, 0, 0);
747 if (err) {
748 ubifs_err(c, "cannot create directory, error %d", err);
749 goto out_cancel;
751 mutex_unlock(&dir_ui->ui_mutex);
753 ubifs_release_budget(c, &req);
754 d_instantiate(dentry, inode);
755 return 0;
757 out_cancel:
758 dir->i_size -= sz_change;
759 dir_ui->ui_size = dir->i_size;
760 drop_nlink(dir);
761 mutex_unlock(&dir_ui->ui_mutex);
762 out_inode:
763 make_bad_inode(inode);
764 iput(inode);
765 out_budg:
766 ubifs_release_budget(c, &req);
767 return err;
770 static int ubifs_mknod(struct inode *dir, struct dentry *dentry,
771 umode_t mode, dev_t rdev)
773 struct inode *inode;
774 struct ubifs_inode *ui;
775 struct ubifs_inode *dir_ui = ubifs_inode(dir);
776 struct ubifs_info *c = dir->i_sb->s_fs_info;
777 union ubifs_dev_desc *dev = NULL;
778 int sz_change = CALC_DENT_SIZE(dentry->d_name.len);
779 int err, devlen = 0;
780 struct ubifs_budget_req req = { .new_ino = 1, .new_dent = 1,
781 .new_ino_d = ALIGN(devlen, 8),
782 .dirtied_ino = 1 };
785 * Budget request settings: new inode, new direntry and changing parent
786 * directory inode.
789 dbg_gen("dent '%pd' in dir ino %lu", dentry, dir->i_ino);
791 if (S_ISBLK(mode) || S_ISCHR(mode)) {
792 dev = kmalloc(sizeof(union ubifs_dev_desc), GFP_NOFS);
793 if (!dev)
794 return -ENOMEM;
795 devlen = ubifs_encode_dev(dev, rdev);
798 err = ubifs_budget_space(c, &req);
799 if (err) {
800 kfree(dev);
801 return err;
804 inode = ubifs_new_inode(c, dir, mode);
805 if (IS_ERR(inode)) {
806 kfree(dev);
807 err = PTR_ERR(inode);
808 goto out_budg;
811 init_special_inode(inode, inode->i_mode, rdev);
812 inode->i_size = ubifs_inode(inode)->ui_size = devlen;
813 ui = ubifs_inode(inode);
814 ui->data = dev;
815 ui->data_len = devlen;
817 err = ubifs_init_security(dir, inode, &dentry->d_name);
818 if (err)
819 goto out_inode;
821 mutex_lock(&dir_ui->ui_mutex);
822 dir->i_size += sz_change;
823 dir_ui->ui_size = dir->i_size;
824 dir->i_mtime = dir->i_ctime = inode->i_ctime;
825 err = ubifs_jnl_update(c, dir, &dentry->d_name, inode, 0, 0);
826 if (err)
827 goto out_cancel;
828 mutex_unlock(&dir_ui->ui_mutex);
830 ubifs_release_budget(c, &req);
831 insert_inode_hash(inode);
832 d_instantiate(dentry, inode);
833 return 0;
835 out_cancel:
836 dir->i_size -= sz_change;
837 dir_ui->ui_size = dir->i_size;
838 mutex_unlock(&dir_ui->ui_mutex);
839 out_inode:
840 make_bad_inode(inode);
841 iput(inode);
842 out_budg:
843 ubifs_release_budget(c, &req);
844 return err;
847 static int ubifs_symlink(struct inode *dir, struct dentry *dentry,
848 const char *symname)
850 struct inode *inode;
851 struct ubifs_inode *ui;
852 struct ubifs_inode *dir_ui = ubifs_inode(dir);
853 struct ubifs_info *c = dir->i_sb->s_fs_info;
854 int err, len = strlen(symname);
855 int sz_change = CALC_DENT_SIZE(dentry->d_name.len);
856 struct ubifs_budget_req req = { .new_ino = 1, .new_dent = 1,
857 .new_ino_d = ALIGN(len, 8),
858 .dirtied_ino = 1 };
861 * Budget request settings: new inode, new direntry and changing parent
862 * directory inode.
865 dbg_gen("dent '%pd', target '%s' in dir ino %lu", dentry,
866 symname, dir->i_ino);
868 if (len > UBIFS_MAX_INO_DATA)
869 return -ENAMETOOLONG;
871 err = ubifs_budget_space(c, &req);
872 if (err)
873 return err;
875 inode = ubifs_new_inode(c, dir, S_IFLNK | S_IRWXUGO);
876 if (IS_ERR(inode)) {
877 err = PTR_ERR(inode);
878 goto out_budg;
881 ui = ubifs_inode(inode);
882 ui->data = kmalloc(len + 1, GFP_NOFS);
883 if (!ui->data) {
884 err = -ENOMEM;
885 goto out_inode;
888 memcpy(ui->data, symname, len);
889 ((char *)ui->data)[len] = '\0';
890 inode->i_link = ui->data;
892 * The terminating zero byte is not written to the flash media and it
893 * is put just to make later in-memory string processing simpler. Thus,
894 * data length is @len, not @len + %1.
896 ui->data_len = len;
897 inode->i_size = ubifs_inode(inode)->ui_size = len;
899 err = ubifs_init_security(dir, inode, &dentry->d_name);
900 if (err)
901 goto out_inode;
903 mutex_lock(&dir_ui->ui_mutex);
904 dir->i_size += sz_change;
905 dir_ui->ui_size = dir->i_size;
906 dir->i_mtime = dir->i_ctime = inode->i_ctime;
907 err = ubifs_jnl_update(c, dir, &dentry->d_name, inode, 0, 0);
908 if (err)
909 goto out_cancel;
910 mutex_unlock(&dir_ui->ui_mutex);
912 ubifs_release_budget(c, &req);
913 insert_inode_hash(inode);
914 d_instantiate(dentry, inode);
915 return 0;
917 out_cancel:
918 dir->i_size -= sz_change;
919 dir_ui->ui_size = dir->i_size;
920 mutex_unlock(&dir_ui->ui_mutex);
921 out_inode:
922 make_bad_inode(inode);
923 iput(inode);
924 out_budg:
925 ubifs_release_budget(c, &req);
926 return err;
930 * lock_3_inodes - a wrapper for locking three UBIFS inodes.
931 * @inode1: first inode
932 * @inode2: second inode
933 * @inode3: third inode
935 * This function is used for 'ubifs_rename()' and @inode1 may be the same as
936 * @inode2 whereas @inode3 may be %NULL.
938 * We do not implement any tricks to guarantee strict lock ordering, because
939 * VFS has already done it for us on the @i_mutex. So this is just a simple
940 * wrapper function.
942 static void lock_3_inodes(struct inode *inode1, struct inode *inode2,
943 struct inode *inode3)
945 mutex_lock_nested(&ubifs_inode(inode1)->ui_mutex, WB_MUTEX_1);
946 if (inode2 != inode1)
947 mutex_lock_nested(&ubifs_inode(inode2)->ui_mutex, WB_MUTEX_2);
948 if (inode3)
949 mutex_lock_nested(&ubifs_inode(inode3)->ui_mutex, WB_MUTEX_3);
953 * unlock_3_inodes - a wrapper for unlocking three UBIFS inodes for rename.
954 * @inode1: first inode
955 * @inode2: second inode
956 * @inode3: third inode
958 static void unlock_3_inodes(struct inode *inode1, struct inode *inode2,
959 struct inode *inode3)
961 if (inode3)
962 mutex_unlock(&ubifs_inode(inode3)->ui_mutex);
963 if (inode1 != inode2)
964 mutex_unlock(&ubifs_inode(inode2)->ui_mutex);
965 mutex_unlock(&ubifs_inode(inode1)->ui_mutex);
968 static int ubifs_rename(struct inode *old_dir, struct dentry *old_dentry,
969 struct inode *new_dir, struct dentry *new_dentry)
971 struct ubifs_info *c = old_dir->i_sb->s_fs_info;
972 struct inode *old_inode = d_inode(old_dentry);
973 struct inode *new_inode = d_inode(new_dentry);
974 struct ubifs_inode *old_inode_ui = ubifs_inode(old_inode);
975 int err, release, sync = 0, move = (new_dir != old_dir);
976 int is_dir = S_ISDIR(old_inode->i_mode);
977 int unlink = !!new_inode;
978 int new_sz = CALC_DENT_SIZE(new_dentry->d_name.len);
979 int old_sz = CALC_DENT_SIZE(old_dentry->d_name.len);
980 struct ubifs_budget_req req = { .new_dent = 1, .mod_dent = 1,
981 .dirtied_ino = 3 };
982 struct ubifs_budget_req ino_req = { .dirtied_ino = 1,
983 .dirtied_ino_d = ALIGN(old_inode_ui->data_len, 8) };
984 struct timespec time;
985 unsigned int uninitialized_var(saved_nlink);
988 * Budget request settings: deletion direntry, new direntry, removing
989 * the old inode, and changing old and new parent directory inodes.
991 * However, this operation also marks the target inode as dirty and
992 * does not write it, so we allocate budget for the target inode
993 * separately.
996 dbg_gen("dent '%pd' ino %lu in dir ino %lu to dent '%pd' in dir ino %lu",
997 old_dentry, old_inode->i_ino, old_dir->i_ino,
998 new_dentry, new_dir->i_ino);
999 ubifs_assert(inode_is_locked(old_dir));
1000 ubifs_assert(inode_is_locked(new_dir));
1001 if (unlink)
1002 ubifs_assert(inode_is_locked(new_inode));
1005 if (unlink && is_dir) {
1006 err = check_dir_empty(c, new_inode);
1007 if (err)
1008 return err;
1011 err = ubifs_budget_space(c, &req);
1012 if (err)
1013 return err;
1014 err = ubifs_budget_space(c, &ino_req);
1015 if (err) {
1016 ubifs_release_budget(c, &req);
1017 return err;
1020 lock_3_inodes(old_dir, new_dir, new_inode);
1023 * Like most other Unix systems, set the @i_ctime for inodes on a
1024 * rename.
1026 time = ubifs_current_time(old_dir);
1027 old_inode->i_ctime = time;
1029 /* We must adjust parent link count when renaming directories */
1030 if (is_dir) {
1031 if (move) {
1033 * @old_dir loses a link because we are moving
1034 * @old_inode to a different directory.
1036 drop_nlink(old_dir);
1038 * @new_dir only gains a link if we are not also
1039 * overwriting an existing directory.
1041 if (!unlink)
1042 inc_nlink(new_dir);
1043 } else {
1045 * @old_inode is not moving to a different directory,
1046 * but @old_dir still loses a link if we are
1047 * overwriting an existing directory.
1049 if (unlink)
1050 drop_nlink(old_dir);
1054 old_dir->i_size -= old_sz;
1055 ubifs_inode(old_dir)->ui_size = old_dir->i_size;
1056 old_dir->i_mtime = old_dir->i_ctime = time;
1057 new_dir->i_mtime = new_dir->i_ctime = time;
1060 * And finally, if we unlinked a direntry which happened to have the
1061 * same name as the moved direntry, we have to decrement @i_nlink of
1062 * the unlinked inode and change its ctime.
1064 if (unlink) {
1066 * Directories cannot have hard-links, so if this is a
1067 * directory, just clear @i_nlink.
1069 saved_nlink = new_inode->i_nlink;
1070 if (is_dir)
1071 clear_nlink(new_inode);
1072 else
1073 drop_nlink(new_inode);
1074 new_inode->i_ctime = time;
1075 } else {
1076 new_dir->i_size += new_sz;
1077 ubifs_inode(new_dir)->ui_size = new_dir->i_size;
1081 * Do not ask 'ubifs_jnl_rename()' to flush write-buffer if @old_inode
1082 * is dirty, because this will be done later on at the end of
1083 * 'ubifs_rename()'.
1085 if (IS_SYNC(old_inode)) {
1086 sync = IS_DIRSYNC(old_dir) || IS_DIRSYNC(new_dir);
1087 if (unlink && IS_SYNC(new_inode))
1088 sync = 1;
1090 err = ubifs_jnl_rename(c, old_dir, old_dentry, new_dir, new_dentry,
1091 sync);
1092 if (err)
1093 goto out_cancel;
1095 unlock_3_inodes(old_dir, new_dir, new_inode);
1096 ubifs_release_budget(c, &req);
1098 mutex_lock(&old_inode_ui->ui_mutex);
1099 release = old_inode_ui->dirty;
1100 mark_inode_dirty_sync(old_inode);
1101 mutex_unlock(&old_inode_ui->ui_mutex);
1103 if (release)
1104 ubifs_release_budget(c, &ino_req);
1105 if (IS_SYNC(old_inode))
1106 err = old_inode->i_sb->s_op->write_inode(old_inode, NULL);
1107 return err;
1109 out_cancel:
1110 if (unlink) {
1111 set_nlink(new_inode, saved_nlink);
1112 } else {
1113 new_dir->i_size -= new_sz;
1114 ubifs_inode(new_dir)->ui_size = new_dir->i_size;
1116 old_dir->i_size += old_sz;
1117 ubifs_inode(old_dir)->ui_size = old_dir->i_size;
1118 if (is_dir) {
1119 if (move) {
1120 inc_nlink(old_dir);
1121 if (!unlink)
1122 drop_nlink(new_dir);
1123 } else {
1124 if (unlink)
1125 inc_nlink(old_dir);
1128 unlock_3_inodes(old_dir, new_dir, new_inode);
1129 ubifs_release_budget(c, &ino_req);
1130 ubifs_release_budget(c, &req);
1131 return err;
1134 int ubifs_getattr(struct vfsmount *mnt, struct dentry *dentry,
1135 struct kstat *stat)
1137 loff_t size;
1138 struct inode *inode = d_inode(dentry);
1139 struct ubifs_inode *ui = ubifs_inode(inode);
1141 mutex_lock(&ui->ui_mutex);
1142 generic_fillattr(inode, stat);
1143 stat->blksize = UBIFS_BLOCK_SIZE;
1144 stat->size = ui->ui_size;
1147 * Unfortunately, the 'stat()' system call was designed for block
1148 * device based file systems, and it is not appropriate for UBIFS,
1149 * because UBIFS does not have notion of "block". For example, it is
1150 * difficult to tell how many block a directory takes - it actually
1151 * takes less than 300 bytes, but we have to round it to block size,
1152 * which introduces large mistake. This makes utilities like 'du' to
1153 * report completely senseless numbers. This is the reason why UBIFS
1154 * goes the same way as JFFS2 - it reports zero blocks for everything
1155 * but regular files, which makes more sense than reporting completely
1156 * wrong sizes.
1158 if (S_ISREG(inode->i_mode)) {
1159 size = ui->xattr_size;
1160 size += stat->size;
1161 size = ALIGN(size, UBIFS_BLOCK_SIZE);
1163 * Note, user-space expects 512-byte blocks count irrespectively
1164 * of what was reported in @stat->size.
1166 stat->blocks = size >> 9;
1167 } else
1168 stat->blocks = 0;
1169 mutex_unlock(&ui->ui_mutex);
1170 return 0;
1173 const struct inode_operations ubifs_dir_inode_operations = {
1174 .lookup = ubifs_lookup,
1175 .create = ubifs_create,
1176 .link = ubifs_link,
1177 .symlink = ubifs_symlink,
1178 .unlink = ubifs_unlink,
1179 .mkdir = ubifs_mkdir,
1180 .rmdir = ubifs_rmdir,
1181 .mknod = ubifs_mknod,
1182 .rename = ubifs_rename,
1183 .setattr = ubifs_setattr,
1184 .getattr = ubifs_getattr,
1185 .setxattr = ubifs_setxattr,
1186 .getxattr = ubifs_getxattr,
1187 .listxattr = ubifs_listxattr,
1188 .removexattr = ubifs_removexattr,
1189 #ifdef CONFIG_UBIFS_ATIME_SUPPORT
1190 .update_time = ubifs_update_time,
1191 #endif
1194 const struct file_operations ubifs_dir_operations = {
1195 .llseek = generic_file_llseek,
1196 .release = ubifs_dir_release,
1197 .read = generic_read_dir,
1198 .iterate = ubifs_readdir,
1199 .fsync = ubifs_fsync,
1200 .unlocked_ioctl = ubifs_ioctl,
1201 #ifdef CONFIG_COMPAT
1202 .compat_ioctl = ubifs_compat_ioctl,
1203 #endif