// SPDX-License-Identifier: GPL-2.0-only
/*
 * kvm asynchronous fault support
 *
 * Copyright 2010 Red Hat, Inc.
 *
 * Author:
 *      Gleb Natapov <gleb@redhat.com>
 */

#include <linux/kvm_host.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/mmu_context.h>
#include <linux/sched/mm.h>

#include "async_pf.h"
#include <trace/events/kvm.h>

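/*
 * These two wrappers select where kvm_arch_async_page_present() runs:
 * with CONFIG_KVM_ASYNC_PF_SYNC it is called synchronously from the
 * workqueue worker, otherwise it is deferred to the vCPU's completion
 * check in kvm_check_async_pf_completion().
 */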
static inline void kvm_async_page_present_sync(struct kvm_vcpu *vcpu,
                                               struct kvm_async_pf *work)
{
#ifdef CONFIG_KVM_ASYNC_PF_SYNC
        kvm_arch_async_page_present(vcpu, work);
#endif
}

static inline void kvm_async_page_present_async(struct kvm_vcpu *vcpu,
                                                struct kvm_async_pf *work)
{
#ifndef CONFIG_KVM_ASYNC_PF_SYNC
        kvm_arch_async_page_present(vcpu, work);
#endif
}

static struct kmem_cache *async_pf_cache;

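/* Create the slab cache backing struct kvm_async_pf allocations. */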
int kvm_async_pf_init(void)
{
        async_pf_cache = KMEM_CACHE(kvm_async_pf, 0);

        if (!async_pf_cache)
                return -ENOMEM;

        return 0;
}

void kvm_async_pf_deinit(void)
{
        kmem_cache_destroy(async_pf_cache);
        async_pf_cache = NULL;
}

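/* Initialize the per-vCPU async page fault lists and their lock. */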
void kvm_async_pf_vcpu_init(struct kvm_vcpu *vcpu)
{
        INIT_LIST_HEAD(&vcpu->async_pf.done);
        INIT_LIST_HEAD(&vcpu->async_pf.queue);
        spin_lock_init(&vcpu->async_pf.lock);
}

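/*
 * Workqueue callback: fault the page in on behalf of the guest, move the
 * request onto vcpu->async_pf.done, and wake the vCPU if it is blocked
 * waiting for this page. The mm and kvm references taken at setup time
 * are dropped here.
 */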
static void async_pf_execute(struct work_struct *work)
{
        struct kvm_async_pf *apf =
                container_of(work, struct kvm_async_pf, work);
        struct mm_struct *mm = apf->mm;
        struct kvm_vcpu *vcpu = apf->vcpu;
        unsigned long addr = apf->addr;
        gva_t gva = apf->gva;
        int locked = 1;

        might_sleep();

        /*
         * This work is run asynchronously to the task which owns
         * mm and might be done in another context, so we must
         * access remotely.
         */
        down_read(&mm->mmap_sem);
        get_user_pages_remote(NULL, mm, addr, 1, FOLL_WRITE, NULL, NULL,
                        &locked);
        if (locked)
                up_read(&mm->mmap_sem);

        kvm_async_page_present_sync(vcpu, apf);

        spin_lock(&vcpu->async_pf.lock);
        list_add_tail(&apf->link, &vcpu->async_pf.done);
        apf->vcpu = NULL;
        spin_unlock(&vcpu->async_pf.lock);

        /*
         * apf may be freed by kvm_check_async_pf_completion() after
         * this point
         */

        trace_kvm_async_pf_completed(addr, gva);

        if (swq_has_sleeper(&vcpu->wq))
                swake_up_one(&vcpu->wq);

        mmput(mm);
        kvm_put_kvm(vcpu->kvm);
}

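/*
 * Tear down all outstanding async page faults for a vCPU: flush or cancel
 * every queued work item, free everything already on the done list, and
 * drop the references held by cancelled items.
 */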
void kvm_clear_async_pf_completion_queue(struct kvm_vcpu *vcpu)
{
        spin_lock(&vcpu->async_pf.lock);

        /* cancel outstanding work queue item */
        while (!list_empty(&vcpu->async_pf.queue)) {
                struct kvm_async_pf *work =
                        list_first_entry(&vcpu->async_pf.queue,
                                         typeof(*work), queue);
                list_del(&work->queue);

                /*
                 * We know it's present in vcpu->async_pf.done, do
                 * nothing here.
                 */
                if (!work->vcpu)
                        continue;

                spin_unlock(&vcpu->async_pf.lock);
#ifdef CONFIG_KVM_ASYNC_PF_SYNC
                flush_work(&work->work);
#else
                if (cancel_work_sync(&work->work)) {
                        mmput(work->mm);
                        kvm_put_kvm(vcpu->kvm); /* == work->vcpu->kvm */
                        kmem_cache_free(async_pf_cache, work);
                }
#endif
                spin_lock(&vcpu->async_pf.lock);
        }

        while (!list_empty(&vcpu->async_pf.done)) {
                struct kvm_async_pf *work =
                        list_first_entry(&vcpu->async_pf.done,
                                         typeof(*work), link);
                list_del(&work->link);
                kmem_cache_free(async_pf_cache, work);
        }
        spin_unlock(&vcpu->async_pf.lock);

        vcpu->async_pf.queued = 0;
}

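/*
 * Called from the vCPU loop: while completed faults are pending and the
 * architecture allows injection, hand each completed request to the arch
 * code and release it.
 */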
void kvm_check_async_pf_completion(struct kvm_vcpu *vcpu)
{
        struct kvm_async_pf *work;

        while (!list_empty_careful(&vcpu->async_pf.done) &&
              kvm_arch_can_inject_async_page_present(vcpu)) {
                spin_lock(&vcpu->async_pf.lock);
                work = list_first_entry(&vcpu->async_pf.done, typeof(*work),
                                              link);
                list_del(&work->link);
                spin_unlock(&vcpu->async_pf.lock);

                kvm_arch_async_page_ready(vcpu, work);
                kvm_async_page_present_async(vcpu, work);

                list_del(&work->queue);
                vcpu->async_pf.queued--;
                kmem_cache_free(async_pf_cache, work);
        }
}

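/*
 * Queue an async page fault: allocate a request, take references on the
 * faulting task's mm and on the VM, and schedule async_pf_execute() to
 * fault the page in. Returns 1 if the work was queued, 0 otherwise.
 */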
int kvm_setup_async_pf(struct kvm_vcpu *vcpu, gva_t gva, unsigned long hva,
                       struct kvm_arch_async_pf *arch)
{
        struct kvm_async_pf *work;

        if (vcpu->async_pf.queued >= ASYNC_PF_PER_VCPU)
                return 0;

        /* setup delayed work */

        /*
         * do alloc nowait since if we are going to sleep anyway we
         * may as well sleep faulting in page
         */
        work = kmem_cache_zalloc(async_pf_cache, GFP_NOWAIT | __GFP_NOWARN);
        if (!work)
                return 0;

        work->wakeup_all = false;
        work->vcpu = vcpu;
        work->gva = gva;
        work->addr = hva;
        work->arch = *arch;
        work->mm = current->mm;
        mmget(work->mm);
        kvm_get_kvm(work->vcpu->kvm);

        /* this can't really happen otherwise gfn_to_pfn_async
           would succeed */
        if (unlikely(kvm_is_error_hva(work->addr)))
                goto retry_sync;

        INIT_WORK(&work->work, async_pf_execute);
        if (!schedule_work(&work->work))
                goto retry_sync;

        list_add_tail(&work->queue, &vcpu->async_pf.queue);
        vcpu->async_pf.queued++;
        kvm_arch_async_page_not_present(vcpu, work);
        return 1;
retry_sync:
        kvm_put_kvm(work->vcpu->kvm);
        mmput(work->mm);
        kmem_cache_free(async_pf_cache, work);
        return 0;
}

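/*
 * Put a synthetic wakeup_all request on the done list so the guest is
 * told to wake every task waiting on an async page fault, e.g. when
 * async page faults are being disabled for this vCPU.
 */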
int kvm_async_pf_wakeup_all(struct kvm_vcpu *vcpu)
{
        struct kvm_async_pf *work;

        if (!list_empty_careful(&vcpu->async_pf.done))
                return 0;

        work = kmem_cache_zalloc(async_pf_cache, GFP_ATOMIC);
        if (!work)
                return -ENOMEM;

        work->wakeup_all = true;
        INIT_LIST_HEAD(&work->queue); /* for list_del to work */

        spin_lock(&vcpu->async_pf.lock);
        list_add_tail(&work->link, &vcpu->async_pf.done);
        spin_unlock(&vcpu->async_pf.lock);

        vcpu->async_pf.queued++;

        return 0;
}