1 /* $NetBSD: uvm_vnode.c,v 1.92 2009/08/04 23:31:57 pooka Exp $ */
4 * Copyright (c) 1997 Charles D. Cranor and Washington University.
5 * Copyright (c) 1991, 1993
6 * The Regents of the University of California.
7 * Copyright (c) 1990 University of Utah.
11 * This code is derived from software contributed to Berkeley by
12 * the Systems Programming Group of the University of Utah Computer
15 * Redistribution and use in source and binary forms, with or without
16 * modification, are permitted provided that the following conditions
18 * 1. Redistributions of source code must retain the above copyright
19 * notice, this list of conditions and the following disclaimer.
20 * 2. Redistributions in binary form must reproduce the above copyright
21 * notice, this list of conditions and the following disclaimer in the
22 * documentation and/or other materials provided with the distribution.
23 * 3. All advertising materials mentioning features or use of this software
24 * must display the following acknowledgement:
25 * This product includes software developed by Charles D. Cranor,
26 * Washington University, the University of California, Berkeley and
28 * 4. Neither the name of the University nor the names of its contributors
29 * may be used to endorse or promote products derived from this software
30 * without specific prior written permission.
32 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
33 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
34 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
35 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
36 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
37 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
38 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
39 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
40 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
41 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
44 * @(#)vnode_pager.c 8.8 (Berkeley) 2/13/94
45 * from: Id: uvm_vnode.c,v 1.1.2.26 1998/02/02 20:38:07 chuck Exp
49 * uvm_vnode.c: the vnode pager.
52 #include <sys/cdefs.h>
53 __KERNEL_RCSID(0, "$NetBSD: uvm_vnode.c,v 1.92 2009/08/04 23:31:57 pooka Exp $");
55 #include "opt_uvmhist.h"
57 #include <sys/param.h>
58 #include <sys/systm.h>
59 #include <sys/kernel.h>
61 #include <sys/malloc.h>
62 #include <sys/vnode.h>
63 #include <sys/disklabel.h>
64 #include <sys/ioctl.h>
65 #include <sys/fcntl.h>
68 #include <sys/mount.h>
70 #include <miscfs/specfs/specdev.h>
73 #include <uvm/uvm_readahead.h>
/*
 * Forward declarations for the file-local vnode pager routines.
 * uvn_reference and uvn_detach are installed in uvm_vnodeops below;
 * uvn_get, uvn_put and uvn_findpage are defined later in this file.
 * NOTE(review): the uvn_findpage prototype is cut off in this listing
 * (its final parameter and terminator are not visible).
 */
79 static void uvn_detach(struct uvm_object
*);
80 static int uvn_get(struct uvm_object
*, voff_t
, struct vm_page
**, int *,
81 int, vm_prot_t
, int, int);
82 static int uvn_put(struct uvm_object
*, voff_t
, voff_t
, int);
83 static void uvn_reference(struct uvm_object
*);
85 static int uvn_findpage(struct uvm_object
*, voff_t
, struct vm_page
**,
89 * master pager structure
/*
 * uvm_vnodeops: pager operations table for vnode-backed objects.
 * The entries visible here route pgo_reference to uvn_reference and
 * pgo_detach to uvn_detach.
 * NOTE(review): any further initializers and the closing brace are not
 * visible in this listing.
 */
92 const struct uvm_pagerops uvm_vnodeops
= {
93 .pgo_reference
= uvn_reference
,
94 .pgo_detach
= uvn_detach
,
106 * duplicate a reference to a VM object. Note that the reference
107 * count must already be at least one (the passed in reference) so
108 * there is no chance of the uvn being killed or locked out here.
110 * => caller must call with object unlocked.
111 * => caller must be using the same accessprot as was used at attach time
/*
 * uvn_reference: pager "reference" hook for vnode objects.
 * Declared "static void" by the prototype near the top of the file.
 * The uvm_object pointer is cast to a struct vnode pointer and passed
 * to vref(); nothing else is done here.
 */
115 uvn_reference(struct uvm_object
*uobj
)
117 vref((struct vnode
*)uobj
);
124 * remove a reference to a VM object.
126 * => caller must call with object unlocked and map locked.
/*
 * uvn_detach: pager "detach" hook for vnode objects.
 * Declared "static void" by the prototype near the top of the file.
 * The uvm_object pointer is cast to a struct vnode pointer and passed
 * to vrele(); nothing else is done here.
 */
130 uvn_detach(struct uvm_object
*uobj
)
132 vrele((struct vnode
*)uobj
);
136 * uvn_put: flush page data to backing store.
138 * => object must be locked on entry! VOP_PUTPAGES must unlock it.
139 * => flags: PGO_SYNCIO -- use sync. I/O
140 * => note: caller must set PG_CLEAN and pmap_clear_modify (if needed)
/*
 * uvn_put: pass a put request for [offlo, offhi) on uobj to the vnode.
 *
 *   uobj   object to flush; treated as a struct vnode via a cast
 *   offlo  start offset handed to VOP_PUTPAGES
 *   offhi  end offset handed to VOP_PUTPAGES
 *   flags  PGO_* flags, forwarded unchanged
 *
 * NOTE(review): the declaration of "error" and the return statement are
 * not visible in this listing; presumably the VOP_PUTPAGES result is
 * returned -- confirm against the full file.
 */
144 uvn_put(struct uvm_object
*uobj
, voff_t offlo
, voff_t offhi
, int flags
)
146 struct vnode
*vp
= (struct vnode
*)uobj
;
/* the caller must already hold the vnode's interlock */
149 KASSERT(mutex_owned(&vp
->v_interlock
));
/* range and flags go to the vnode op exactly as received */
150 error
= VOP_PUTPAGES(vp
, offlo
, offhi
, flags
);
157 * uvn_get: get pages (synchronously) from backing store
159 * => prefer map unlocked (not required)
160 * => object must be locked! we will _unlock_ it before starting any I/O.
161 * => flags: PGO_ALLPAGES: get all of the pages
162 * PGO_LOCKED: fault data structures are locked
163 * => NOTE: offset is the offset of pps[0], _NOT_ pps[centeridx]
164 * => NOTE: caller must check for released pages!!
/*
 * uvn_get: fetch pages for uobj by calling VOP_GETPAGES on the vnode.
 *
 *   uobj         object to read from; treated as a struct vnode via a cast
 *   offset       object offset forwarded to VOP_GETPAGES
 *   pps          page array (IN/OUT)
 *   npagesp      page count (IN; OUT if PGO_LOCKED)
 *   centeridx, access_type, advice, flags
 *                forwarded unchanged to VOP_GETPAGES
 *
 * NOTE(review): some lines of this function (local declarations, part of
 * the "if" body, the return) are not visible in this listing.
 */
168 uvn_get(struct uvm_object
*uobj
, voff_t offset
,
169 struct vm_page
**pps
/* IN/OUT */,
170 int *npagesp
/* IN (OUT if PGO_LOCKED)*/,
171 int centeridx
, vm_prot_t access_type
, int advice
, int flags
)
173 struct vnode
*vp
= (struct vnode
*)uobj
;
176 UVMHIST_FUNC("uvn_get"); UVMHIST_CALLED(ubchist
);
178 UVMHIST_LOG(ubchist
, "vp %p off 0x%x", vp
, (int)offset
, 0,0);
/*
 * Read-ahead is requested only when the access does not include
 * VM_PROT_WRITE and the caller did not pass PGO_LOCKED.  The length
 * argument is *npagesp pages converted to bytes (<< PAGE_SHIFT).
 */
180 if ((access_type
& VM_PROT_WRITE
) == 0 && (flags
& PGO_LOCKED
) == 0) {
182 uvm_ra_request(vp
->v_ractx
, advice
, uobj
, offset
,
183 *npagesp
<< PAGE_SHIFT
);
186 error
= VOP_GETPAGES(vp
, offset
, pps
, npagesp
, centeridx
,
187 access_type
, advice
, flags
);
/*
 * If PGO_LOCKED was requested, the interlock must still be held once
 * VOP_GETPAGES has returned; without PGO_LOCKED nothing is asserted.
 */
189 KASSERT(((flags
& PGO_LOCKED
) != 0 && mutex_owned(&vp
->v_interlock
)) ||
190 (flags
& PGO_LOCKED
) == 0);
197 * return the page for the uobj and offset requested, allocating if needed.
198 * => uobj must be locked.
199 * => returned pages will be BUSY.
/*
 * uvn_findpages: run uvn_findpage() over a run of consecutive pages.
 *
 *   uobj     object to search
 *   offset   offset of the first page visited; stepped by PAGE_SIZE
 *   npagesp  pointer to the page count
 *   pgs      array of page slots; &pgs[i] is passed to uvn_findpage()
 *   flags    UFP_* flags, forwarded to uvn_findpage()
 *
 * NOTE(review): the initialisation of "npages" (presumably from *npagesp),
 * the handling of "rv"/"count"/"found", the bodies of the UFP_DIRTYONLY
 * tests and the return are not visible in this listing.
 */
203 uvn_findpages(struct uvm_object
*uobj
, voff_t offset
, int *npagesp
,
204 struct vm_page
**pgs
, int flags
)
206 int i
, count
, found
, npages
, rv
;
/*
 * UFP_BACKWARD: fill slots from pgs[npages - 1] down to pgs[0] while
 * offset decreases by one page per step.
 */
210 if (flags
& UFP_BACKWARD
) {
211 for (i
= npages
- 1; i
>= 0; i
--, offset
-= PAGE_SIZE
) {
212 rv
= uvn_findpage(uobj
, offset
, &pgs
[i
], flags
);
214 if (flags
& UFP_DIRTYONLY
)
/*
 * Forward walk: fill slots from pgs[0] up to pgs[npages - 1] while
 * offset increases by one page per step.
 */
221 for (i
= 0; i
< npages
; i
++, offset
+= PAGE_SIZE
) {
222 rv
= uvn_findpage(uobj
, offset
, &pgs
[i
], flags
);
224 if (flags
& UFP_DIRTYONLY
)
/*
 * uvn_findpage: look up (or allocate) the page of uobj at offset.
 * Declared "static int" by the prototype near the top of the file.
 *
 * UFP_* flags tested in the visible code:
 *   UFP_NOALLOC    tested right after the lookup, before uvm_pagealloc()
 *   UFP_NOWAIT     tested before each place the code would block
 *   UFP_NOCACHE    tested in the "else" arm of the allocation path
 *   UFP_NORDONLY   pages with PG_RDONLY set are rejected
 *   UFP_DIRTYONLY  the page's dirty state is computed and PG_CLEAN is set
 *
 * A page that passes every test gets PG_BUSY set.
 *
 * NOTE(review): the surrounding loop/branch structure, the "flags"
 * parameter line, the local declarations and every return statement are
 * missing from this listing, so what each rejection path returns cannot
 * be stated from here.
 */
236 uvn_findpage(struct uvm_object
*uobj
, voff_t offset
, struct vm_page
**pgp
,
241 UVMHIST_FUNC("uvn_findpage"); UVMHIST_CALLED(ubchist
);
242 UVMHIST_LOG(ubchist
, "vp %p off 0x%lx", uobj
, offset
,0,0);
245 UVMHIST_LOG(ubchist
, "dontcare", 0,0,0,0);
249 /* look for an existing page */
250 pg
= uvm_pagelookup(uobj
, offset
);
252 /* nope? allocate one now */
254 if (flags
& UFP_NOALLOC
) {
255 UVMHIST_LOG(ubchist
, "noalloc", 0,0,0,0);
258 pg
= uvm_pagealloc(uobj
, offset
, NULL
, 0);
260 if (flags
& UFP_NOWAIT
) {
261 UVMHIST_LOG(ubchist
, "nowait",0,0,0,0);
/*
 * The object lock is released and then taken again here.
 * NOTE(review): the statement between the two calls is not visible;
 * presumably it waits for free memory -- confirm.
 */
264 mutex_exit(&uobj
->vmobjlock
);
266 mutex_enter(&uobj
->vmobjlock
);
269 UVMHIST_LOG(ubchist
, "alloced %p", pg
,0,0,0);
271 } else if (flags
& UFP_NOCACHE
) {
272 UVMHIST_LOG(ubchist
, "nocache",0,0,0,0);
276 /* page is there, see if we need to wait on it */
277 if ((pg
->flags
& PG_BUSY
) != 0) {
278 if (flags
& UFP_NOWAIT
) {
279 UVMHIST_LOG(ubchist
, "nowait",0,0,0,0);
/*
 * Mark the busy page as wanted before sleeping on it.
 * UVM_UNLOCK_AND_WAIT is handed the object lock, and the lock is
 * taken again right after it.
 */
282 pg
->flags
|= PG_WANTED
;
283 UVMHIST_LOG(ubchist
, "wait %p", pg
,0,0,0);
284 UVM_UNLOCK_AND_WAIT(pg
, &uobj
->vmobjlock
, 0,
286 mutex_enter(&uobj
->vmobjlock
);
290 /* skip PG_RDONLY pages if requested */
291 if ((flags
& UFP_NORDONLY
) && (pg
->flags
& PG_RDONLY
)) {
292 UVMHIST_LOG(ubchist
, "nordonly",0,0,0,0);
296 /* stop on clean pages if requested */
297 if (flags
& UFP_DIRTYONLY
) {
/*
 * pmap_clear_modify() is the left operand of "||", so it is always
 * called.  The page counts as dirty if that call returns true or if
 * PG_CLEAN was not already set.  PG_CLEAN is then set unconditionally.
 */
298 dirty
= pmap_clear_modify(pg
) ||
299 (pg
->flags
& PG_CLEAN
) == 0;
300 pg
->flags
|= PG_CLEAN
;
302 UVMHIST_LOG(ubchist
, "dirtonly", 0,0,0,0);
307 /* mark the page BUSY and we're done. */
308 pg
->flags
|= PG_BUSY
;
309 UVM_PAGE_OWN(pg
, "uvn_findpage");
310 UVMHIST_LOG(ubchist
, "found %p", pg
,0,0,0);
318 * uvm_vnp_setsize: grow or shrink a vnode uobj
320 * grow => just update size value
321 * shrink => toss un-needed pages
323 * => we assume that the caller has a reference of some sort to the
324 * vnode in question so that it will not be yanked out from under us.
/*
 * uvm_vnp_setsize: record a new size for the vnode's uvm object.
 *
 *   vp       vnode whose embedded object (vp->v_uobj) is resized
 *   newsize  new size; must not be VSIZENOTSET
 *
 * Runs with the object's vmobjlock held.  If the previous v_writesize
 * lies beyond the page-rounded new size, uvn_put() is called with
 * PGO_FREE | PGO_SYNCIO starting at that rounded offset.  Both v_size and
 * v_writesize are then set to newsize and the lock is released.
 *
 * NOTE(review): the return type, braces and the declaration of "oldsize"
 * are not visible in this listing.
 */
329 uvm_vnp_setsize(struct vnode
*vp
, voff_t newsize
)
331 struct uvm_object
*uobj
= &vp
->v_uobj
;
/* new size rounded with round_page(); used as the start of the flush */
332 voff_t pgend
= round_page(newsize
);
334 UVMHIST_FUNC("uvm_vnp_setsize"); UVMHIST_CALLED(ubchist
);
336 mutex_enter(&uobj
->vmobjlock
);
337 UVMHIST_LOG(ubchist
, "vp %p old 0x%x new 0x%x",
338 vp
, vp
->v_size
, newsize
, 0);
341 * now check if the size has changed: if we shrink we had better
345 KASSERT(newsize
!= VSIZENOTSET
);
346 KASSERT(vp
->v_size
<= vp
->v_writesize
);
347 KASSERT(vp
->v_size
== vp
->v_writesize
||
348 newsize
== vp
->v_writesize
|| newsize
<= vp
->v_size
);
/* the shrink test below is made against v_writesize, not v_size */
350 oldsize
= vp
->v_writesize
;
351 KASSERT(oldsize
!= VSIZENOTSET
|| pgend
> oldsize
);
/*
 * uvn_put()'s result is discarded.  The lock is taken again afterwards;
 * per uvn_put's own header comment, VOP_PUTPAGES unlocks the object.
 */
353 if (oldsize
> pgend
) {
354 (void) uvn_put(uobj
, pgend
, 0, PGO_FREE
| PGO_SYNCIO
);
355 mutex_enter(&uobj
->vmobjlock
);
357 vp
->v_size
= vp
->v_writesize
= newsize
;
358 mutex_exit(&uobj
->vmobjlock
);
/*
 * uvm_vnp_setwritesize: set vp->v_writesize to newsize.
 *
 *   vp       vnode to update
 *   newsize  new write size; must not be VSIZENOTSET and must be at
 *            least vp->v_size
 *
 * The update is made with vp->v_interlock held.  The assertions also
 * require that v_size and v_writesize have both been set already and
 * that v_size <= v_writesize on entry.  v_size itself is not modified.
 *
 * NOTE(review): the return type and braces are not visible in this listing.
 */
362 uvm_vnp_setwritesize(struct vnode
*vp
, voff_t newsize
)
365 mutex_enter(&vp
->v_interlock
);
366 KASSERT(newsize
!= VSIZENOTSET
);
367 KASSERT(vp
->v_size
!= VSIZENOTSET
);
368 KASSERT(vp
->v_writesize
!= VSIZENOTSET
);
369 KASSERT(vp
->v_size
<= vp
->v_writesize
);
370 KASSERT(vp
->v_size
<= newsize
);
371 vp
->v_writesize
= newsize
;
372 mutex_exit(&vp
->v_interlock
);
/*
 * uvn_text_p: predicate on the vnode behind uobj.
 * Returns non-zero when VI_EXECMAP is set in the vnode's v_iflag.
 * No lock is taken in the visible code.
 * NOTE(review): the return type line is not visible in this listing.
 */
376 uvn_text_p(struct uvm_object
*uobj
)
378 struct vnode
*vp
= (struct vnode
*)uobj
;
380 return (vp
->v_iflag
& VI_EXECMAP
) != 0;
/*
 * uvn_clean_p: predicate on the vnode behind uobj.
 * Returns non-zero when VI_ONWORKLST is NOT set in the vnode's v_iflag.
 * No lock is taken in the visible code.
 * NOTE(review): the return type line is not visible in this listing.
 */
384 uvn_clean_p(struct uvm_object
*uobj
)
386 struct vnode
*vp
= (struct vnode
*)uobj
;
388 return (vp
->v_iflag
& VI_ONWORKLST
) == 0;
/*
 * uvn_needs_writefault_p: predicate on the vnode behind uobj.
 * Returns non-zero when either
 *   - uvn_clean_p(uobj) is true, or
 *   - VI_WRMAP is set and VI_WRMAPDIRTY is clear in v_iflag (the masked
 *     value equals VI_WRMAP exactly).
 * NOTE(review): the return type line is not visible in this listing.
 */
392 uvn_needs_writefault_p(struct uvm_object
*uobj
)
394 struct vnode
*vp
= (struct vnode
*)uobj
;
396 return uvn_clean_p(uobj
) ||
397 (vp
->v_iflag
& (VI_WRMAP
|VI_WRMAPDIRTY
)) == VI_WRMAP
;