sched: retune wake granularity
[wrt350n-kernel.git] / fs / xfs / xfs_utils.c
blob45d740df53b73d2166fe92490e68ea004ec83a7e
/*
 * Copyright (c) 2000-2002,2005 Silicon Graphics, Inc.
 * All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it would be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write the Free Software Foundation,
 * Inc.,  51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
18 #include "xfs.h"
19 #include "xfs_fs.h"
20 #include "xfs_types.h"
21 #include "xfs_bit.h"
22 #include "xfs_log.h"
23 #include "xfs_inum.h"
24 #include "xfs_trans.h"
25 #include "xfs_sb.h"
26 #include "xfs_ag.h"
27 #include "xfs_dir2.h"
28 #include "xfs_dmapi.h"
29 #include "xfs_mount.h"
30 #include "xfs_bmap_btree.h"
31 #include "xfs_dir2_sf.h"
32 #include "xfs_attr_sf.h"
33 #include "xfs_dinode.h"
34 #include "xfs_inode.h"
35 #include "xfs_inode_item.h"
36 #include "xfs_bmap.h"
37 #include "xfs_error.h"
38 #include "xfs_quota.h"
39 #include "xfs_rw.h"
40 #include "xfs_itable.h"
41 #include "xfs_utils.h"
44 * xfs_get_dir_entry is used to get a reference to an inode given
45 * its parent directory inode and the name of the file. It does
46 * not lock the child inode, and it unlocks the directory before
47 * returning. The directory's generation number is returned for
48 * use by a later call to xfs_lock_dir_and_entry.
50 int
51 xfs_get_dir_entry(
52 bhv_vname_t *dentry,
53 xfs_inode_t **ipp)
55 bhv_vnode_t *vp;
57 vp = VNAME_TO_VNODE(dentry);
59 *ipp = xfs_vtoi(vp);
60 if (!*ipp)
61 return XFS_ERROR(ENOENT);
62 VN_HOLD(vp);
63 return 0;
66 int
67 xfs_dir_lookup_int(
68 xfs_inode_t *dp,
69 uint lock_mode,
70 bhv_vname_t *dentry,
71 xfs_ino_t *inum,
72 xfs_inode_t **ipp)
74 int error;
76 xfs_itrace_entry(dp);
78 error = xfs_dir_lookup(NULL, dp, VNAME(dentry), VNAMELEN(dentry), inum);
79 if (!error) {
81 * Unlock the directory. We do this because we can't
82 * hold the directory lock while doing the vn_get()
83 * in xfs_iget(). Doing so could cause us to hold
84 * a lock while waiting for the inode to finish
85 * being inactive while it's waiting for a log
86 * reservation in the inactive routine.
88 xfs_iunlock(dp, lock_mode);
89 error = xfs_iget(dp->i_mount, NULL, *inum, 0, 0, ipp, 0);
90 xfs_ilock(dp, lock_mode);
92 if (error) {
93 *ipp = NULL;
94 } else if ((*ipp)->i_d.di_mode == 0) {
96 * The inode has been freed. Something is
97 * wrong so just get out of here.
99 xfs_iunlock(dp, lock_mode);
100 xfs_iput_new(*ipp, 0);
101 *ipp = NULL;
102 xfs_ilock(dp, lock_mode);
103 error = XFS_ERROR(ENOENT);
106 return error;
110 * Allocates a new inode from disk and return a pointer to the
111 * incore copy. This routine will internally commit the current
112 * transaction and allocate a new one if the Space Manager needed
113 * to do an allocation to replenish the inode free-list.
115 * This routine is designed to be called from xfs_create and
116 * xfs_create_dir.
120 xfs_dir_ialloc(
121 xfs_trans_t **tpp, /* input: current transaction;
122 output: may be a new transaction. */
123 xfs_inode_t *dp, /* directory within whose allocate
124 the inode. */
125 mode_t mode,
126 xfs_nlink_t nlink,
127 xfs_dev_t rdev,
128 cred_t *credp,
129 prid_t prid, /* project id */
130 int okalloc, /* ok to allocate new space */
131 xfs_inode_t **ipp, /* pointer to inode; it will be
132 locked. */
133 int *committed)
136 xfs_trans_t *tp;
137 xfs_trans_t *ntp;
138 xfs_inode_t *ip;
139 xfs_buf_t *ialloc_context = NULL;
140 boolean_t call_again = B_FALSE;
141 int code;
142 uint log_res;
143 uint log_count;
144 void *dqinfo;
145 uint tflags;
147 tp = *tpp;
148 ASSERT(tp->t_flags & XFS_TRANS_PERM_LOG_RES);
151 * xfs_ialloc will return a pointer to an incore inode if
152 * the Space Manager has an available inode on the free
153 * list. Otherwise, it will do an allocation and replenish
154 * the freelist. Since we can only do one allocation per
155 * transaction without deadlocks, we will need to commit the
156 * current transaction and start a new one. We will then
157 * need to call xfs_ialloc again to get the inode.
159 * If xfs_ialloc did an allocation to replenish the freelist,
160 * it returns the bp containing the head of the freelist as
161 * ialloc_context. We will hold a lock on it across the
162 * transaction commit so that no other process can steal
163 * the inode(s) that we've just allocated.
165 code = xfs_ialloc(tp, dp, mode, nlink, rdev, credp, prid, okalloc,
166 &ialloc_context, &call_again, &ip);
169 * Return an error if we were unable to allocate a new inode.
170 * This should only happen if we run out of space on disk or
171 * encounter a disk error.
173 if (code) {
174 *ipp = NULL;
175 return code;
177 if (!call_again && (ip == NULL)) {
178 *ipp = NULL;
179 return XFS_ERROR(ENOSPC);
183 * If call_again is set, then we were unable to get an
184 * inode in one operation. We need to commit the current
185 * transaction and call xfs_ialloc() again. It is guaranteed
186 * to succeed the second time.
188 if (call_again) {
191 * Normally, xfs_trans_commit releases all the locks.
192 * We call bhold to hang on to the ialloc_context across
193 * the commit. Holding this buffer prevents any other
194 * processes from doing any allocations in this
195 * allocation group.
197 xfs_trans_bhold(tp, ialloc_context);
199 * Save the log reservation so we can use
200 * them in the next transaction.
202 log_res = xfs_trans_get_log_res(tp);
203 log_count = xfs_trans_get_log_count(tp);
206 * We want the quota changes to be associated with the next
207 * transaction, NOT this one. So, detach the dqinfo from this
208 * and attach it to the next transaction.
210 dqinfo = NULL;
211 tflags = 0;
212 if (tp->t_dqinfo) {
213 dqinfo = (void *)tp->t_dqinfo;
214 tp->t_dqinfo = NULL;
215 tflags = tp->t_flags & XFS_TRANS_DQ_DIRTY;
216 tp->t_flags &= ~(XFS_TRANS_DQ_DIRTY);
219 ntp = xfs_trans_dup(tp);
220 code = xfs_trans_commit(tp, 0);
221 tp = ntp;
222 if (committed != NULL) {
223 *committed = 1;
226 * If we get an error during the commit processing,
227 * release the buffer that is still held and return
228 * to the caller.
230 if (code) {
231 xfs_buf_relse(ialloc_context);
232 if (dqinfo) {
233 tp->t_dqinfo = dqinfo;
234 XFS_TRANS_FREE_DQINFO(tp->t_mountp, tp);
236 *tpp = ntp;
237 *ipp = NULL;
238 return code;
240 code = xfs_trans_reserve(tp, 0, log_res, 0,
241 XFS_TRANS_PERM_LOG_RES, log_count);
243 * Re-attach the quota info that we detached from prev trx.
245 if (dqinfo) {
246 tp->t_dqinfo = dqinfo;
247 tp->t_flags |= tflags;
250 if (code) {
251 xfs_buf_relse(ialloc_context);
252 *tpp = ntp;
253 *ipp = NULL;
254 return code;
256 xfs_trans_bjoin(tp, ialloc_context);
259 * Call ialloc again. Since we've locked out all
260 * other allocations in this allocation group,
261 * this call should always succeed.
263 code = xfs_ialloc(tp, dp, mode, nlink, rdev, credp, prid,
264 okalloc, &ialloc_context, &call_again, &ip);
267 * If we get an error at this point, return to the caller
268 * so that the current transaction can be aborted.
270 if (code) {
271 *tpp = tp;
272 *ipp = NULL;
273 return code;
275 ASSERT ((!call_again) && (ip != NULL));
277 } else {
278 if (committed != NULL) {
279 *committed = 0;
283 *ipp = ip;
284 *tpp = tp;
286 return 0;
290 * Decrement the link count on an inode & log the change.
291 * If this causes the link count to go to zero, initiate the
292 * logging activity required to truncate a file.
294 int /* error */
295 xfs_droplink(
296 xfs_trans_t *tp,
297 xfs_inode_t *ip)
299 int error;
301 xfs_ichgtime(ip, XFS_ICHGTIME_CHG);
303 ASSERT (ip->i_d.di_nlink > 0);
304 ip->i_d.di_nlink--;
305 drop_nlink(ip->i_vnode);
306 xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
308 error = 0;
309 if (ip->i_d.di_nlink == 0) {
311 * We're dropping the last link to this file.
312 * Move the on-disk inode to the AGI unlinked list.
313 * From xfs_inactive() we will pull the inode from
314 * the list and free it.
316 error = xfs_iunlink(tp, ip);
318 return error;
322 * This gets called when the inode's version needs to be changed from 1 to 2.
323 * Currently this happens when the nlink field overflows the old 16-bit value
324 * or when chproj is called to change the project for the first time.
325 * As a side effect the superblock version will also get rev'd
326 * to contain the NLINK bit.
328 void
329 xfs_bump_ino_vers2(
330 xfs_trans_t *tp,
331 xfs_inode_t *ip)
333 xfs_mount_t *mp;
335 ASSERT(ismrlocked (&ip->i_lock, MR_UPDATE));
336 ASSERT(ip->i_d.di_version == XFS_DINODE_VERSION_1);
338 ip->i_d.di_version = XFS_DINODE_VERSION_2;
339 ip->i_d.di_onlink = 0;
340 memset(&(ip->i_d.di_pad[0]), 0, sizeof(ip->i_d.di_pad));
341 mp = tp->t_mountp;
342 if (!XFS_SB_VERSION_HASNLINK(&mp->m_sb)) {
343 spin_lock(&mp->m_sb_lock);
344 if (!XFS_SB_VERSION_HASNLINK(&mp->m_sb)) {
345 XFS_SB_VERSION_ADDNLINK(&mp->m_sb);
346 spin_unlock(&mp->m_sb_lock);
347 xfs_mod_sb(tp, XFS_SB_VERSIONNUM);
348 } else {
349 spin_unlock(&mp->m_sb_lock);
352 /* Caller must log the inode */
356 * Increment the link count on an inode & log the change.
359 xfs_bumplink(
360 xfs_trans_t *tp,
361 xfs_inode_t *ip)
363 if (ip->i_d.di_nlink >= XFS_MAXLINK)
364 return XFS_ERROR(EMLINK);
365 xfs_ichgtime(ip, XFS_ICHGTIME_CHG);
367 ASSERT(ip->i_d.di_nlink > 0);
368 ip->i_d.di_nlink++;
369 inc_nlink(ip->i_vnode);
370 if ((ip->i_d.di_version == XFS_DINODE_VERSION_1) &&
371 (ip->i_d.di_nlink > XFS_MAXLINK_1)) {
373 * The inode has increased its number of links beyond
374 * what can fit in an old format inode. It now needs
375 * to be converted to a version 2 inode with a 32 bit
376 * link count. If this is the first inode in the file
377 * system to do this, then we need to bump the superblock
378 * version number as well.
380 xfs_bump_ino_vers2(tp, ip);
383 xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
384 return 0;
388 * Try to truncate the given file to 0 length. Currently called
389 * only out of xfs_remove when it has to truncate a file to free
390 * up space for the remove to proceed.
393 xfs_truncate_file(
394 xfs_mount_t *mp,
395 xfs_inode_t *ip)
397 xfs_trans_t *tp;
398 int error;
400 #ifdef QUOTADEBUG
402 * This is called to truncate the quotainodes too.
404 if (XFS_IS_UQUOTA_ON(mp)) {
405 if (ip->i_ino != mp->m_sb.sb_uquotino)
406 ASSERT(ip->i_udquot);
408 if (XFS_IS_OQUOTA_ON(mp)) {
409 if (ip->i_ino != mp->m_sb.sb_gquotino)
410 ASSERT(ip->i_gdquot);
412 #endif
414 * Make the call to xfs_itruncate_start before starting the
415 * transaction, because we cannot make the call while we're
416 * in a transaction.
418 xfs_ilock(ip, XFS_IOLOCK_EXCL);
419 error = xfs_itruncate_start(ip, XFS_ITRUNC_DEFINITE, (xfs_fsize_t)0);
420 if (error) {
421 xfs_iunlock(ip, XFS_IOLOCK_EXCL);
422 return error;
425 tp = xfs_trans_alloc(mp, XFS_TRANS_TRUNCATE_FILE);
426 if ((error = xfs_trans_reserve(tp, 0, XFS_ITRUNCATE_LOG_RES(mp), 0,
427 XFS_TRANS_PERM_LOG_RES,
428 XFS_ITRUNCATE_LOG_COUNT))) {
429 xfs_trans_cancel(tp, 0);
430 xfs_iunlock(ip, XFS_IOLOCK_EXCL);
431 return error;
435 * Follow the normal truncate locking protocol. Since we
436 * hold the inode in the transaction, we know that it's number
437 * of references will stay constant.
439 xfs_ilock(ip, XFS_ILOCK_EXCL);
440 xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL | XFS_IOLOCK_EXCL);
441 xfs_trans_ihold(tp, ip);
443 * Signal a sync xaction. The only case where that isn't
444 * the case is if we're truncating an already unlinked file
445 * on a wsync fs. In that case, we know the blocks can't
446 * reappear in the file because the links to file are
447 * permanently toast. Currently, we're always going to
448 * want a sync transaction because this code is being
449 * called from places where nlink is guaranteed to be 1
450 * but I'm leaving the tests in to protect against future
451 * changes -- rcc.
453 error = xfs_itruncate_finish(&tp, ip, (xfs_fsize_t)0,
454 XFS_DATA_FORK,
455 ((ip->i_d.di_nlink != 0 ||
456 !(mp->m_flags & XFS_MOUNT_WSYNC))
457 ? 1 : 0));
458 if (error) {
459 xfs_trans_cancel(tp, XFS_TRANS_RELEASE_LOG_RES |
460 XFS_TRANS_ABORT);
461 } else {
462 xfs_ichgtime(ip, XFS_ICHGTIME_MOD | XFS_ICHGTIME_CHG);
463 error = xfs_trans_commit(tp, XFS_TRANS_RELEASE_LOG_RES);
465 xfs_iunlock(ip, XFS_ILOCK_EXCL | XFS_IOLOCK_EXCL);
467 return error;