2 * Copyright (C) International Business Machines Corp., 2000-2004
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
12 * the GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 #include <linux/quotaops.h>
21 #include "jfs_incore.h"
22 #include "jfs_inode.h"
23 #include "jfs_superblock.h"
25 #include "jfs_extent.h"
26 #include "jfs_debug.h"
31 static int extBalloc(struct inode
*, s64
, s64
*, s64
*);
33 static int extBrealloc(struct inode
*, s64
, s64
, s64
*, s64
*);
35 static s64
extRoundDown(s64 nb
);
37 #define DPD(a) (printk("(a): %d\n",(a)))
38 #define DPC(a) (printk("(a): %c\n",(a)))
42 printk("(a): %x%08x ",(a)); \
44 printk("(a): %x ",(a) << 32); \
49 printk("(a): %x%08x\n",(a)); \
51 printk("(a): %x\n",(a) << 32); \
54 #define DPD1(a) (printk("(a): %d ",(a)))
55 #define DPX(a) (printk("(a): %08x\n",(a)))
56 #define DPX1(a) (printk("(a): %08x ",(a)))
57 #define DPS(a) (printk("%s\n",(a)))
58 #define DPE(a) (printk("\nENTERING: %s\n",(a)))
59 #define DPE1(a) (printk("\nENTERING: %s",(a)))
60 #define DPS1(a) (printk(" %s ",(a)))
66 * FUNCTION: allocate an extent for a specified page range within a
70 * ip - the inode of the file.
71 * xlen - requested extent length.
72 * pno - the starting page number with the file.
73 * xp - pointer to an xad. on entry, xad describes an
74 * extent that is used as an allocation hint if the
75 * xaddr of the xad is non-zero. on successful exit,
76 * the xad describes the newly allocated extent.
77 * abnr - bool indicating whether the newly allocated extent
78 * should be marked as allocated but not recorded.
83 * -ENOSPC - insufficient disk resources.
86 extAlloc(struct inode
*ip
, s64 xlen
, s64 pno
, xad_t
* xp
, bool abnr
)
88 struct jfs_sb_info
*sbi
= JFS_SBI(ip
->i_sb
);
89 s64 nxlen
, nxaddr
, xoff
, hint
, xaddr
= 0;
93 /* This blocks if we are low on resources */
94 txBeginAnon(ip
->i_sb
);
96 /* Avoid race with jfs_commit_inode() */
97 mutex_lock(&JFS_IP(ip
)->commit_mutex
);
99 /* validate extent length */
103 /* get the page's starting extent offset */
104 xoff
= pno
<< sbi
->l2nbperpage
;
106 /* check if an allocation hint was provided */
107 if ((hint
= addressXAD(xp
))) {
108 /* get the size of the extent described by the hint */
109 nxlen
= lengthXAD(xp
);
111 /* check if the hint is for the portion of the file
112 * immediately previous to the current allocation
113 * request and if hint extent has the same abnr
114 * value as the current request. if so, we can
115 * extend the hint extent to include the current
116 * extent if we can allocate the blocks immediately
117 * following the hint extent.
119 if (offsetXAD(xp
) + nxlen
== xoff
&&
120 abnr
== ((xp
->flag
& XAD_NOTRECORDED
) ? true : false))
121 xaddr
= hint
+ nxlen
;
123 /* adjust the hint to the last block of the extent */
127 /* allocate the disk blocks for the extent. initially, extBalloc()
128 * will try to allocate disk blocks for the requested size (xlen).
129 * if this fails (xlen contiguous free blocks not available), it'll
130 * try to allocate a smaller number of blocks (producing a smaller
131 * extent), with this smaller number of blocks consisting of the
132 * requested number of blocks rounded down to the next smaller
133 * power of 2 number (i.e. 16 -> 8). it'll continue to round down
134 * and retry the allocation until the number of blocks to allocate
135 * is smaller than the number of blocks per page.
138 if ((rc
= extBalloc(ip
, hint
? hint
: INOHINT(ip
), &nxlen
, &nxaddr
))) {
139 mutex_unlock(&JFS_IP(ip
)->commit_mutex
);
143 /* Allocate blocks to quota. */
144 rc
= dquot_alloc_block(ip
, nxlen
);
146 dbFree(ip
, nxaddr
, (s64
) nxlen
);
147 mutex_unlock(&JFS_IP(ip
)->commit_mutex
);
151 /* determine the value of the extent flag */
152 xflag
= abnr
? XAD_NOTRECORDED
: 0;
154 /* if we can extend the hint extent to cover the current request,
155 * extend it. otherwise, insert a new extent to
156 * cover the current request.
158 if (xaddr
&& xaddr
== nxaddr
)
159 rc
= xtExtend(0, ip
, xoff
, (int) nxlen
, 0);
161 rc
= xtInsert(0, ip
, xflag
, xoff
, (int) nxlen
, &nxaddr
, 0);
163 /* if the extend or insert failed,
164 * free the newly allocated blocks and return the error.
167 dbFree(ip
, nxaddr
, nxlen
);
168 dquot_free_block(ip
, nxlen
);
169 mutex_unlock(&JFS_IP(ip
)->commit_mutex
);
173 /* set the results of the extent allocation */
174 XADaddress(xp
, nxaddr
);
175 XADlength(xp
, nxlen
);
179 mark_inode_dirty(ip
);
181 mutex_unlock(&JFS_IP(ip
)->commit_mutex
);
183 * COMMIT_SyncList flags an anonymous tlock on page that is on
185 * We need to commit the inode to get the page written disk.
187 if (test_and_clear_cflag(COMMIT_Synclist
,ip
))
188 jfs_commit_inode(ip
, 0);
198 * FUNCTION: extend the allocation of a file extent containing a
199 * partial back last page.
202 * ip - the inode of the file.
203 * cp - cbuf for the partial backed last page.
204 * xlen - request size of the resulting extent.
205 * xp - pointer to an xad. on successful exit, the xad
206 * describes the newly allocated extent.
207 * abnr - bool indicating whether the newly allocated extent
208 * should be marked as allocated but not recorded.
213 * -ENOSPC - insufficient disk resources.
215 int extRealloc(struct inode
*ip
, s64 nxlen
, xad_t
* xp
, bool abnr
)
217 struct super_block
*sb
= ip
->i_sb
;
218 s64 xaddr
, xlen
, nxaddr
, delta
, xoff
;
219 s64 ntail
, nextend
, ninsert
;
220 int rc
, nbperpage
= JFS_SBI(sb
)->nbperpage
;
223 /* This blocks if we are low on resources */
224 txBeginAnon(ip
->i_sb
);
226 mutex_lock(&JFS_IP(ip
)->commit_mutex
);
227 /* validate extent length */
231 /* get the extend (partial) page's disk block address and
234 xaddr
= addressXAD(xp
);
235 xlen
= lengthXAD(xp
);
236 xoff
= offsetXAD(xp
);
238 /* if the extend page is abnr and if the request is for
239 * the extent to be allocated and recorded,
240 * make the page allocated and recorded.
242 if ((xp
->flag
& XAD_NOTRECORDED
) && !abnr
) {
244 if ((rc
= xtUpdate(0, ip
, xp
)))
248 /* try to allocated the request number of blocks for the
249 * extent. dbRealloc() first tries to satisfy the request
250 * by extending the allocation in place. otherwise, it will
251 * try to allocate a new set of blocks large enough for the
252 * request. in satisfying a request, dbReAlloc() may allocate
253 * less than what was request but will always allocate enough
254 * space as to satisfy the extend page.
256 if ((rc
= extBrealloc(ip
, xaddr
, xlen
, &nxlen
, &nxaddr
)))
259 /* Allocat blocks to quota. */
260 rc
= dquot_alloc_block(ip
, nxlen
);
262 dbFree(ip
, nxaddr
, (s64
) nxlen
);
263 mutex_unlock(&JFS_IP(ip
)->commit_mutex
);
267 delta
= nxlen
- xlen
;
269 /* check if the extend page is not abnr but the request is abnr
270 * and the allocated disk space is for more than one page. if this
271 * is the case, there is a miss match of abnr between the extend page
272 * and the one or more pages following the extend page. as a result,
273 * two extents will have to be manipulated. the first will be that
274 * of the extent of the extend page and will be manipulated thru
275 * an xtExtend() or an xtTailgate(), depending upon whether the
276 * disk allocation occurred as an inplace extension. the second
277 * extent will be manipulated (created) through an xtInsert() and
278 * will be for the pages following the extend page.
280 if (abnr
&& (!(xp
->flag
& XAD_NOTRECORDED
)) && (nxlen
> nbperpage
)) {
282 nextend
= ntail
- xlen
;
283 ninsert
= nxlen
- nbperpage
;
285 xflag
= XAD_NOTRECORDED
;
294 /* if we were able to extend the disk allocation in place,
295 * extend the extent. otherwise, move the extent to a
298 if (xaddr
== nxaddr
) {
299 /* extend the extent */
300 if ((rc
= xtExtend(0, ip
, xoff
+ xlen
, (int) nextend
, 0))) {
301 dbFree(ip
, xaddr
+ xlen
, delta
);
302 dquot_free_block(ip
, nxlen
);
307 * move the extent to a new location:
309 * xtTailgate() accounts for relocated tail extent;
311 if ((rc
= xtTailgate(0, ip
, xoff
, (int) ntail
, nxaddr
, 0))) {
312 dbFree(ip
, nxaddr
, nxlen
);
313 dquot_free_block(ip
, nxlen
);
319 /* check if we need to also insert a new extent */
321 /* perform the insert. if it fails, free the blocks
322 * to be inserted and make it appear that we only did
323 * the xtExtend() or xtTailgate() above.
325 xaddr
= nxaddr
+ ntail
;
326 if (xtInsert (0, ip
, xflag
, xoff
+ ntail
, (int) ninsert
,
328 dbFree(ip
, xaddr
, (s64
) ninsert
);
335 /* set the return results */
336 XADaddress(xp
, nxaddr
);
337 XADlength(xp
, nxlen
);
341 mark_inode_dirty(ip
);
343 mutex_unlock(&JFS_IP(ip
)->commit_mutex
);
352 * FUNCTION: produce an extent allocation hint for a file offset.
355 * ip - the inode of the file.
356 * offset - file offset for which the hint is needed.
357 * xp - pointer to the xad that is to be filled in with
364 int extHint(struct inode
*ip
, s64 offset
, xad_t
* xp
)
366 struct super_block
*sb
= ip
->i_sb
;
367 int nbperpage
= JFS_SBI(sb
)->nbperpage
;
374 /* init the hint as "no hint provided" */
377 /* determine the starting extent offset of the page previous
378 * to the page containing the offset.
380 prev
= ((offset
& ~POFFSET
) >> JFS_SBI(sb
)->l2bsize
) - nbperpage
;
382 /* if the offset is in the first page of the file, no hint provided.
387 rc
= xtLookup(ip
, prev
, nbperpage
, &xflag
, &xaddr
, &xlen
, 0);
389 if ((rc
== 0) && xlen
) {
390 if (xlen
!= nbperpage
) {
391 jfs_error(ip
->i_sb
, "corrupt xtree\n");
394 XADaddress(xp
, xaddr
);
398 * only preserve the abnr flag within the xad flags
399 * of the returned hint.
401 xp
->flag
= xflag
& XAD_NOTRECORDED
;
413 * FUNCTION: change a page with a file from not recorded to recorded.
416 * ip - inode of the file.
417 * cp - cbuf of the file page.
422 * -ENOSPC - insufficient disk resources.
424 int extRecord(struct inode
*ip
, xad_t
* xp
)
428 txBeginAnon(ip
->i_sb
);
430 mutex_lock(&JFS_IP(ip
)->commit_mutex
);
432 /* update the extent */
433 rc
= xtUpdate(0, ip
, xp
);
435 mutex_unlock(&JFS_IP(ip
)->commit_mutex
);
444 * FUNCTION: allocate disk space for a file page that represents
448 * ip - the inode of the file.
449 * cp - cbuf of the file page represent the hole.
454 * -ENOSPC - insufficient disk resources.
456 int extFill(struct inode
*ip
, xad_t
* xp
)
458 int rc
, nbperpage
= JFS_SBI(ip
->i_sb
)->nbperpage
;
459 s64 blkno
= offsetXAD(xp
) >> ip
->i_blkbits
;
461 // assert(ISSPARSE(ip));
463 /* initialize the extent allocation hint */
466 /* allocate an extent to fill the hole */
467 if ((rc
= extAlloc(ip
, nbperpage
, blkno
, xp
, false)))
470 assert(lengthPXD(xp
) == nbperpage
);
480 * FUNCTION: allocate disk blocks to form an extent.
482 * initially, we will try to allocate disk blocks for the
483 * requested size (nblocks). if this fails (nblocks
484 * contiguous free blocks not available), we'll try to allocate
485 * a smaller number of blocks (producing a smaller extent), with
486 * this smaller number of blocks consisting of the requested
487 * number of blocks rounded down to the next smaller power of 2
488 * number (i.e. 16 -> 8). we'll continue to round down and
489 * retry the allocation until the number of blocks to allocate
490 * is smaller than the number of blocks per page.
493 * ip - the inode of the file.
494 * hint - disk block number to be used as an allocation hint.
495 * *nblocks - pointer to an s64 value. on entry, this value specifies
496 * the desired number of block to be allocated. on successful
497 * exit, this value is set to the number of blocks actually
499 * blkno - pointer to a block address that is filled in on successful
500 * return with the starting block number of the newly
501 * allocated block range.
506 * -ENOSPC - insufficient disk resources.
509 extBalloc(struct inode
*ip
, s64 hint
, s64
* nblocks
, s64
* blkno
)
511 struct jfs_inode_info
*ji
= JFS_IP(ip
);
512 struct jfs_sb_info
*sbi
= JFS_SBI(ip
->i_sb
);
513 s64 nb
, nblks
, daddr
, max
;
514 int rc
, nbperpage
= sbi
->nbperpage
;
515 struct bmap
*bmp
= sbi
->bmap
;
518 /* get the number of blocks to initially attempt to allocate.
519 * we'll first try the number of blocks requested unless this
520 * number is greater than the maximum number of contiguous free
521 * blocks in the map. in that case, we'll start off with the
524 max
= (s64
) 1 << bmp
->db_maxfreebud
;
525 if (*nblocks
>= max
&& *nblocks
> nbperpage
)
526 nb
= nblks
= (max
> nbperpage
) ? max
: nbperpage
;
528 nb
= nblks
= *nblocks
;
530 /* try to allocate blocks */
531 while ((rc
= dbAlloc(ip
, hint
, nb
, &daddr
)) != 0) {
532 /* if something other than an out of space error,
533 * stop and return this error.
538 /* decrease the allocation request size */
539 nb
= min(nblks
, extRoundDown(nb
));
541 /* give up if we cannot cover a page */
549 if (S_ISREG(ip
->i_mode
) && (ji
->fileset
== FILESYSTEM_I
)) {
550 ag
= BLKTOAG(daddr
, sbi
);
551 spin_lock_irq(&ji
->ag_lock
);
552 if (ji
->active_ag
== -1) {
553 atomic_inc(&bmp
->db_active
[ag
]);
555 } else if (ji
->active_ag
!= ag
) {
556 atomic_dec(&bmp
->db_active
[ji
->active_ag
]);
557 atomic_inc(&bmp
->db_active
[ag
]);
560 spin_unlock_irq(&ji
->ag_lock
);
569 * NAME: extBrealloc()
571 * FUNCTION: attempt to extend an extent's allocation.
573 * Initially, we will try to extend the extent's allocation
574 * in place. If this fails, we'll try to move the extent
575 * to a new set of blocks. If moving the extent, we initially
576 * will try to allocate disk blocks for the requested size
577 * (newnblks). if this fails (new contiguous free blocks not
578 * available), we'll try to allocate a smaller number of
579 * blocks (producing a smaller extent), with this smaller
580 * number of blocks consisting of the requested number of
581 * blocks rounded down to the next smaller power of 2
582 * number (i.e. 16 -> 8). We'll continue to round down and
583 * retry the allocation until the number of blocks to allocate
584 * is smaller than the number of blocks per page.
587 * ip - the inode of the file.
588 * blkno - starting block number of the extents current allocation.
589 * nblks - number of blocks within the extents current allocation.
590 * newnblks - pointer to a s64 value. on entry, this value is the
591 * the new desired extent size (number of blocks). on
592 * successful exit, this value is set to the extent's actual
593 * new size (new number of blocks).
594 * newblkno - the starting block number of the extents new allocation.
599 * -ENOSPC - insufficient disk resources.
602 extBrealloc(struct inode
*ip
,
603 s64 blkno
, s64 nblks
, s64
* newnblks
, s64
* newblkno
)
607 /* try to extend in place */
608 if ((rc
= dbExtend(ip
, blkno
, nblks
, *newnblks
- nblks
)) == 0) {
616 /* in place extension not possible.
617 * try to move the extent to a new set of blocks.
619 return (extBalloc(ip
, blkno
, newnblks
, newblkno
));
625 * NAME: extRoundDown()
627 * FUNCTION: round down a specified number of blocks to the next
628 * smallest power of 2 number.
631 * nb - the inode of the file.
634 * next smallest power of 2 number.
636 static s64
extRoundDown(s64 nb
)
641 for (i
= 0, m
= (u64
) 1 << 63; i
< 64; i
++, m
>>= 1) {
648 k
= ((k
- 1) & nb
) ? k
: k
>> 1;