// SPDX-License-Identifier: GPL-2.0-only
/*
 * kvm asynchronous fault support
 *
 * Copyright 2010 Red Hat, Inc.
 *
 * Author:
 *      Gleb Natapov <gleb@redhat.com>
 */

#include <linux/kvm_host.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/mmu_context.h>
#include <linux/sched/mm.h>

#include "async_pf.h"
#include <trace/events/kvm.h>

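/*
 * The "page present" notification is delivered either synchronously from
 * the workqueue context (CONFIG_KVM_ASYNC_PF_SYNC, selected by
 * architectures such as s390 that can inject the event from a host task)
 * or later from vCPU context; exactly one of these helpers is a no-op in
 * any given build.
 */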
static inline void kvm_async_page_present_sync(struct kvm_vcpu *vcpu,
					       struct kvm_async_pf *work)
{
#ifdef CONFIG_KVM_ASYNC_PF_SYNC
	kvm_arch_async_page_present(vcpu, work);
#endif
}

static inline void kvm_async_page_present_async(struct kvm_vcpu *vcpu,
						struct kvm_async_pf *work)
{
#ifndef CONFIG_KVM_ASYNC_PF_SYNC
	kvm_arch_async_page_present(vcpu, work);
#endif
}

static struct kmem_cache *async_pf_cache;

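/*
 * Create/destroy the slab cache backing all async #PF work items; called
 * once from KVM module init and exit respectively.
 */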
int kvm_async_pf_init(void)
{
	async_pf_cache = KMEM_CACHE(kvm_async_pf, 0);

	if (!async_pf_cache)
		return -ENOMEM;

	return 0;
}

void kvm_async_pf_deinit(void)
{
	kmem_cache_destroy(async_pf_cache);
	async_pf_cache = NULL;
}

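/* Prepare the per-vCPU queues and their lock; called during vCPU creation. */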
void kvm_async_pf_vcpu_init(struct kvm_vcpu *vcpu)
{
	INIT_LIST_HEAD(&vcpu->async_pf.done);
	INIT_LIST_HEAD(&vcpu->async_pf.queue);
	spin_lock_init(&vcpu->async_pf.lock);
}

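/*
 * Workqueue callback: fault the page in on behalf of the guest, then move
 * the work item onto the per-vCPU "done" list and wake the vCPU so it can
 * inject the "page ready" event.
 */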
static void async_pf_execute(struct work_struct *work)
{
	struct kvm_async_pf *apf =
		container_of(work, struct kvm_async_pf, work);
	struct mm_struct *mm = apf->mm;
	struct kvm_vcpu *vcpu = apf->vcpu;
	unsigned long addr = apf->addr;
	gpa_t cr2_or_gpa = apf->cr2_or_gpa;
	int locked = 1;

	might_sleep();

	/*
	 * This work runs asynchronously to the task that owns the mm and
	 * may execute in a different process context, so the mm must be
	 * accessed via the remote variant of the GUP API.
	 */
	down_read(&mm->mmap_sem);
	get_user_pages_remote(NULL, mm, addr, 1, FOLL_WRITE, NULL, NULL,
			      &locked);
	if (locked)
		up_read(&mm->mmap_sem);

	kvm_async_page_present_sync(vcpu, apf);

	spin_lock(&vcpu->async_pf.lock);
	list_add_tail(&apf->link, &vcpu->async_pf.done);
	apf->vcpu = NULL;
	spin_unlock(&vcpu->async_pf.lock);

	/*
	 * apf may be freed by kvm_check_async_pf_completion() after
	 * this point.
	 */

	trace_kvm_async_pf_completed(addr, cr2_or_gpa);

	if (swq_has_sleeper(&vcpu->wq))
		swake_up_one(&vcpu->wq);

	mmput(mm);
}

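/*
 * Wait for a completed item's callback to finish (if it ever ran) and
 * release the item; see the comment inside for why the flush is required.
 */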
static void kvm_flush_and_free_async_pf_work(struct kvm_async_pf *work)
{
	/*
	 * The async #PF is "done", but KVM must wait for the work item itself,
	 * i.e. async_pf_execute(), to run to completion.  If KVM is a module,
	 * KVM must ensure *no* code owned by KVM (the module) can be run after
	 * the last call to module_put().  Note, flushing the work item is
	 * always required when the item is taken off the completion queue.
	 * E.g. even if the vCPU handles the item in the "normal" path, the VM
	 * could be terminated before async_pf_execute() completes.
	 *
	 * Wake-all events skip the queue and go straight to the done list,
	 * i.e. they don't need to be flushed (but sanity check that the work
	 * was never queued).
	 */
	if (work->wakeup_all)
		WARN_ON_ONCE(work->work.func);
	else
		flush_work(&work->work);
	kmem_cache_free(async_pf_cache, work);
}

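/*
 * Tear down all outstanding async #PF work for @vcpu, e.g. when the vCPU
 * is destroyed: cancel or flush everything still on the queue, then drain
 * and free the completed items.
 */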
void kvm_clear_async_pf_completion_queue(struct kvm_vcpu *vcpu)
{
	spin_lock(&vcpu->async_pf.lock);

	/* cancel outstanding work queue item */
	while (!list_empty(&vcpu->async_pf.queue)) {
		struct kvm_async_pf *work =
			list_first_entry(&vcpu->async_pf.queue,
					 typeof(*work), queue);
		list_del(&work->queue);

		/*
		 * The work item has already completed: async_pf_execute()
		 * cleared work->vcpu and moved the item to the done list,
		 * where the loop below will free it.
		 */
		if (!work->vcpu)
			continue;

		spin_unlock(&vcpu->async_pf.lock);
#ifdef CONFIG_KVM_ASYNC_PF_SYNC
		flush_work(&work->work);
#else
		if (cancel_work_sync(&work->work)) {
			mmput(work->mm);
			kmem_cache_free(async_pf_cache, work);
		}
#endif
		spin_lock(&vcpu->async_pf.lock);
	}

	while (!list_empty(&vcpu->async_pf.done)) {
		struct kvm_async_pf *work =
			list_first_entry(&vcpu->async_pf.done,
					 typeof(*work), link);
		list_del(&work->link);

		spin_unlock(&vcpu->async_pf.lock);
		kvm_flush_and_free_async_pf_work(work);
		spin_lock(&vcpu->async_pf.lock);
	}
	spin_unlock(&vcpu->async_pf.lock);

	vcpu->async_pf.queued = 0;
}

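/*
 * Called from the vCPU run loop: for each completed work item, let the
 * arch update its page tables and, if the guest can currently accept one,
 * inject a "page ready" notification.
 */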
void kvm_check_async_pf_completion(struct kvm_vcpu *vcpu)
{
	struct kvm_async_pf *work;

	while (!list_empty_careful(&vcpu->async_pf.done) &&
	       kvm_arch_can_inject_async_page_present(vcpu)) {
		spin_lock(&vcpu->async_pf.lock);
		work = list_first_entry(&vcpu->async_pf.done, typeof(*work),
					link);
		list_del(&work->link);
		spin_unlock(&vcpu->async_pf.lock);

		kvm_arch_async_page_ready(vcpu, work);
		kvm_async_page_present_async(vcpu, work);

		list_del(&work->queue);
		vcpu->async_pf.queued--;
		kvm_flush_and_free_async_pf_work(work);
	}
}

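/*
 * Queue an async page fault for the (@cr2_or_gpa, @hva) pair: notify the
 * guest that the page is not present, then fault it in from a workqueue.
 * Returns 1 if the work was queued, 0 if the caller must instead handle
 * the fault synchronously (queue full, error hva, or allocation failure).
 */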
int kvm_setup_async_pf(struct kvm_vcpu *vcpu, gpa_t cr2_or_gpa,
		       unsigned long hva, struct kvm_arch_async_pf *arch)
{
	struct kvm_async_pf *work;

	if (vcpu->async_pf.queued >= ASYNC_PF_PER_VCPU)
		return 0;

	/* Arch-specific code should not do async PF in this case. */
	if (unlikely(kvm_is_error_hva(hva)))
		return 0;

	/*
	 * Allocate without waiting: if the allocation would have to sleep,
	 * the caller may as well sleep faulting the page in synchronously.
	 */
	work = kmem_cache_zalloc(async_pf_cache, GFP_NOWAIT | __GFP_NOWARN);
	if (!work)
		return 0;

	work->wakeup_all = false;
	work->vcpu = vcpu;
	work->cr2_or_gpa = cr2_or_gpa;
	work->addr = hva;
	work->arch = *arch;
	work->mm = current->mm;
	mmget(work->mm);

	INIT_WORK(&work->work, async_pf_execute);

	list_add_tail(&work->queue, &vcpu->async_pf.queue);
	vcpu->async_pf.queued++;
	kvm_arch_async_page_not_present(vcpu, work);

	schedule_work(&work->work);

	return 1;
}
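
/*
 * Illustrative sketch only (not part of this file): arch code is expected
 * to drive kvm_setup_async_pf() roughly as follows from its guest page
 * fault path, with can_do_async_pf() standing in for a hypothetical
 * arch-specific policy check:
 *
 *	if (can_do_async_pf(vcpu) &&
 *	    kvm_setup_async_pf(vcpu, cr2_or_gpa, hva, &arch_data))
 *		return;		// resume the guest; fault completes async
 *	handle_fault_synchronously(vcpu, hva);
 */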
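/*
 * Inject a "wakeup all" pseudo-completion that bypasses the work queue and
 * goes straight to the done list, releasing every guest task waiting on an
 * async #PF even though no page was faulted in.
 */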
int kvm_async_pf_wakeup_all(struct kvm_vcpu *vcpu)
{
	struct kvm_async_pf *work;

	if (!list_empty_careful(&vcpu->async_pf.done))
		return 0;

	work = kmem_cache_zalloc(async_pf_cache, GFP_ATOMIC);
	if (!work)
		return -ENOMEM;

	work->wakeup_all = true;
	INIT_LIST_HEAD(&work->queue); /* for list_del to work */

	spin_lock(&vcpu->async_pf.lock);
	list_add_tail(&work->link, &vcpu->async_pf.done);
	spin_unlock(&vcpu->async_pf.lock);

	vcpu->async_pf.queued++;
	return 0;
}