virt/kvm/async_pf.c

/*
 * kvm asynchronous fault support
 *
 * Copyright 2010 Red Hat, Inc.
 *
 * Author:
 *      Gleb Natapov <gleb@redhat.com>
 *
 * This file is free software; you can redistribute it and/or modify
 * it under the terms of version 2 of the GNU General Public License
 * as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA.
 */
*af585b92SGleb Natapov
*af585b92SGleb Natapov#include <linux/kvm_host.h>
*af585b92SGleb Natapov#include <linux/slab.h>
*af585b92SGleb Natapov#include <linux/module.h>
*af585b92SGleb Natapov#include <linux/mmu_context.h>
*af585b92SGleb Natapov
*af585b92SGleb Natapov#include "async_pf.h"
*af585b92SGleb Natapov#include <trace/events/kvm.h>
*af585b92SGleb Natapov
*af585b92SGleb Natapovstatic struct kmem_cache *async_pf_cache;
*af585b92SGleb Natapov
*af585b92SGleb Natapovint kvm_async_pf_init(void)
*af585b92SGleb Natapov{
*af585b92SGleb Natapov	async_pf_cache = KMEM_CACHE(kvm_async_pf, 0);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	if (!async_pf_cache)
*af585b92SGleb Natapov		return -ENOMEM;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	return 0;
*af585b92SGleb Natapov}
*af585b92SGleb Natapov
*af585b92SGleb Natapovvoid kvm_async_pf_deinit(void)
*af585b92SGleb Natapov{
*af585b92SGleb Natapov	if (async_pf_cache)
*af585b92SGleb Natapov		kmem_cache_destroy(async_pf_cache);
*af585b92SGleb Natapov	async_pf_cache = NULL;
*af585b92SGleb Natapov}
*af585b92SGleb Natapov
*af585b92SGleb Natapovvoid kvm_async_pf_vcpu_init(struct kvm_vcpu *vcpu)
*af585b92SGleb Natapov{
*af585b92SGleb Natapov	INIT_LIST_HEAD(&vcpu->async_pf.done);
*af585b92SGleb Natapov	INIT_LIST_HEAD(&vcpu->async_pf.queue);
*af585b92SGleb Natapov	spin_lock_init(&vcpu->async_pf.lock);
*af585b92SGleb Natapov}
*af585b92SGleb Natapov
*af585b92SGleb Natapovstatic void async_pf_execute(struct work_struct *work)
*af585b92SGleb Natapov{
*af585b92SGleb Natapov	struct page *page = NULL;
*af585b92SGleb Natapov	struct kvm_async_pf *apf =
*af585b92SGleb Natapov		container_of(work, struct kvm_async_pf, work);
*af585b92SGleb Natapov	struct mm_struct *mm = apf->mm;
*af585b92SGleb Natapov	struct kvm_vcpu *vcpu = apf->vcpu;
*af585b92SGleb Natapov	unsigned long addr = apf->addr;
*af585b92SGleb Natapov	gva_t gva = apf->gva;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	might_sleep();
*af585b92SGleb Natapov
*af585b92SGleb Natapov	use_mm(mm);
*af585b92SGleb Natapov	down_read(&mm->mmap_sem);
*af585b92SGleb Natapov	get_user_pages(current, mm, addr, 1, 1, 0, &page, NULL);
*af585b92SGleb Natapov	up_read(&mm->mmap_sem);
*af585b92SGleb Natapov	unuse_mm(mm);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	spin_lock(&vcpu->async_pf.lock);
*af585b92SGleb Natapov	list_add_tail(&apf->link, &vcpu->async_pf.done);
*af585b92SGleb Natapov	apf->page = page;
*af585b92SGleb Natapov	apf->done = true;
*af585b92SGleb Natapov	spin_unlock(&vcpu->async_pf.lock);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	/*
*af585b92SGleb Natapov	 * apf may be freed by kvm_check_async_pf_completion() after
*af585b92SGleb Natapov	 * this point
*af585b92SGleb Natapov	 */
*af585b92SGleb Natapov
*af585b92SGleb Natapov	trace_kvm_async_pf_completed(addr, page, gva);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	if (waitqueue_active(&vcpu->wq))
*af585b92SGleb Natapov		wake_up_interruptible(&vcpu->wq);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	mmdrop(mm);
*af585b92SGleb Natapov	kvm_put_kvm(vcpu->kvm);
*af585b92SGleb Natapov}
*af585b92SGleb Natapov
*af585b92SGleb Natapovvoid kvm_clear_async_pf_completion_queue(struct kvm_vcpu *vcpu)
*af585b92SGleb Natapov{
*af585b92SGleb Natapov	/* cancel outstanding work queue item */
*af585b92SGleb Natapov	while (!list_empty(&vcpu->async_pf.queue)) {
*af585b92SGleb Natapov		struct kvm_async_pf *work =
*af585b92SGleb Natapov			list_entry(vcpu->async_pf.queue.next,
*af585b92SGleb Natapov				   typeof(*work), queue);
*af585b92SGleb Natapov		cancel_work_sync(&work->work);
*af585b92SGleb Natapov		list_del(&work->queue);
*af585b92SGleb Natapov		if (!work->done) /* work was canceled */
*af585b92SGleb Natapov			kmem_cache_free(async_pf_cache, work);
*af585b92SGleb Natapov	}
*af585b92SGleb Natapov
*af585b92SGleb Natapov	spin_lock(&vcpu->async_pf.lock);
*af585b92SGleb Natapov	while (!list_empty(&vcpu->async_pf.done)) {
*af585b92SGleb Natapov		struct kvm_async_pf *work =
*af585b92SGleb Natapov			list_entry(vcpu->async_pf.done.next,
*af585b92SGleb Natapov				   typeof(*work), link);
*af585b92SGleb Natapov		list_del(&work->link);
*af585b92SGleb Natapov		if (work->page)
*af585b92SGleb Natapov			put_page(work->page);
*af585b92SGleb Natapov		kmem_cache_free(async_pf_cache, work);
*af585b92SGleb Natapov	}
*af585b92SGleb Natapov	spin_unlock(&vcpu->async_pf.lock);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	vcpu->async_pf.queued = 0;
*af585b92SGleb Natapov}
*af585b92SGleb Natapov
*af585b92SGleb Natapovvoid kvm_check_async_pf_completion(struct kvm_vcpu *vcpu)
*af585b92SGleb Natapov{
*af585b92SGleb Natapov	struct kvm_async_pf *work;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	if (list_empty_careful(&vcpu->async_pf.done))
*af585b92SGleb Natapov		return;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	spin_lock(&vcpu->async_pf.lock);
*af585b92SGleb Natapov	work = list_first_entry(&vcpu->async_pf.done, typeof(*work), link);
*af585b92SGleb Natapov	list_del(&work->link);
*af585b92SGleb Natapov	spin_unlock(&vcpu->async_pf.lock);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	kvm_arch_async_page_present(vcpu, work);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	list_del(&work->queue);
*af585b92SGleb Natapov	vcpu->async_pf.queued--;
*af585b92SGleb Natapov	if (work->page)
*af585b92SGleb Natapov		put_page(work->page);
*af585b92SGleb Natapov	kmem_cache_free(async_pf_cache, work);
*af585b92SGleb Natapov}
*af585b92SGleb Natapov
*af585b92SGleb Natapovint kvm_setup_async_pf(struct kvm_vcpu *vcpu, gva_t gva, gfn_t gfn,
*af585b92SGleb Natapov		       struct kvm_arch_async_pf *arch)
*af585b92SGleb Natapov{
*af585b92SGleb Natapov	struct kvm_async_pf *work;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	if (vcpu->async_pf.queued >= ASYNC_PF_PER_VCPU)
*af585b92SGleb Natapov		return 0;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	/* setup delayed work */
*af585b92SGleb Natapov
*af585b92SGleb Natapov	/*
*af585b92SGleb Natapov	 * do alloc nowait since if we are going to sleep anyway we
*af585b92SGleb Natapov	 * may as well sleep faulting in page
*af585b92SGleb Natapov	 */
*af585b92SGleb Natapov	work = kmem_cache_zalloc(async_pf_cache, GFP_NOWAIT);
*af585b92SGleb Natapov	if (!work)
*af585b92SGleb Natapov		return 0;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	work->page = NULL;
*af585b92SGleb Natapov	work->done = false;
*af585b92SGleb Natapov	work->vcpu = vcpu;
*af585b92SGleb Natapov	work->gva = gva;
*af585b92SGleb Natapov	work->addr = gfn_to_hva(vcpu->kvm, gfn);
*af585b92SGleb Natapov	work->arch = *arch;
*af585b92SGleb Natapov	work->mm = current->mm;
*af585b92SGleb Natapov	atomic_inc(&work->mm->mm_count);
*af585b92SGleb Natapov	kvm_get_kvm(work->vcpu->kvm);
*af585b92SGleb Natapov
*af585b92SGleb Natapov	/* this can't really happen otherwise gfn_to_pfn_async
*af585b92SGleb Natapov	   would succeed */
*af585b92SGleb Natapov	if (unlikely(kvm_is_error_hva(work->addr)))
*af585b92SGleb Natapov		goto retry_sync;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	INIT_WORK(&work->work, async_pf_execute);
*af585b92SGleb Natapov	if (!schedule_work(&work->work))
*af585b92SGleb Natapov		goto retry_sync;
*af585b92SGleb Natapov
*af585b92SGleb Natapov	list_add_tail(&work->queue, &vcpu->async_pf.queue);
*af585b92SGleb Natapov	vcpu->async_pf.queued++;
*af585b92SGleb Natapov	kvm_arch_async_page_not_present(vcpu, work);
*af585b92SGleb Natapov	return 1;
*af585b92SGleb Natapovretry_sync:
*af585b92SGleb Natapov	kvm_put_kvm(work->vcpu->kvm);
*af585b92SGleb Natapov	mmdrop(work->mm);
*af585b92SGleb Natapov	kmem_cache_free(async_pf_cache, work);
*af585b92SGleb Natapov	return 0;
*af585b92SGleb Natapov}