2009-10-30 08:47:10 +03:00
/*
* Copyright ( C ) 2009. SUSE Linux Products GmbH . All rights reserved .
*
* Authors :
* Alexander Graf < agraf @ suse . de >
* Kevin Wolf < mail @ kevin - wolf . de >
*
* Description :
* This file is derived from arch / powerpc / kvm / 44 x . c ,
* by Hollis Blanchard < hollisb @ us . ibm . com > .
*
* This program is free software ; you can redistribute it and / or modify
* it under the terms of the GNU General Public License , version 2 , as
* published by the Free Software Foundation .
*/
# include <linux/kvm_host.h>
# include <linux/err.h>
2011-05-27 18:46:24 +04:00
# include <linux/export.h>
2010-04-27 09:49:17 +04:00
# include <linux/slab.h>
2013-12-09 16:53:42 +04:00
# include <linux/module.h>
# include <linux/miscdevice.h>
2009-10-30 08:47:10 +03:00
# include <asm/reg.h>
# include <asm/cputable.h>
# include <asm/cacheflush.h>
# include <asm/tlbflush.h>
# include <asm/uaccess.h>
# include <asm/io.h>
# include <asm/kvm_ppc.h>
# include <asm/kvm_book3s.h>
# include <asm/mmu_context.h>
2011-06-29 04:16:42 +04:00
# include <asm/page.h>
include cleanup: Update gfp.h and slab.h includes to prepare for breaking implicit slab.h inclusion from percpu.h
percpu.h is included by sched.h and module.h and thus ends up being
included when building most .c files. percpu.h includes slab.h which
in turn includes gfp.h making everything defined by the two files
universally available and complicating inclusion dependencies.
percpu.h -> slab.h dependency is about to be removed. Prepare for
this change by updating users of gfp and slab facilities include those
headers directly instead of assuming availability. As this conversion
needs to touch large number of source files, the following script is
used as the basis of conversion.
http://userweb.kernel.org/~tj/misc/slabh-sweep.py
The script does the followings.
* Scan files for gfp and slab usages and update includes such that
only the necessary includes are there. ie. if only gfp is used,
gfp.h, if slab is used, slab.h.
* When the script inserts a new include, it looks at the include
blocks and try to put the new include such that its order conforms
to its surrounding. It's put in the include block which contains
core kernel includes, in the same order that the rest are ordered -
alphabetical, Christmas tree, rev-Xmas-tree or at the end if there
doesn't seem to be any matching order.
* If the script can't find a place to put a new include (mostly
because the file doesn't have fitting include block), it prints out
an error message indicating which .h file needs to be added to the
file.
The conversion was done in the following steps.
1. The initial automatic conversion of all .c files updated slightly
over 4000 files, deleting around 700 includes and adding ~480 gfp.h
and ~3000 slab.h inclusions. The script emitted errors for ~400
files.
2. Each error was manually checked. Some didn't need the inclusion,
some needed manual addition while adding it to implementation .h or
embedding .c file was more appropriate for others. This step added
inclusions to around 150 files.
3. The script was run again and the output was compared to the edits
from #2 to make sure no file was left behind.
4. Several build tests were done and a couple of problems were fixed.
e.g. lib/decompress_*.c used malloc/free() wrappers around slab
APIs requiring slab.h to be added manually.
5. The script was run on all .h files but without automatically
editing them as sprinkling gfp.h and slab.h inclusions around .h
files could easily lead to inclusion dependency hell. Most gfp.h
inclusion directives were ignored as stuff from gfp.h was usually
wildly available and often used in preprocessor macros. Each
slab.h inclusion directive was examined and added manually as
necessary.
6. percpu.h was updated not to include slab.h.
7. Build test were done on the following configurations and failures
were fixed. CONFIG_GCOV_KERNEL was turned off for all tests (as my
distributed build env didn't work with gcov compiles) and a few
more options had to be turned off depending on archs to make things
build (like ipr on powerpc/64 which failed due to missing writeq).
* x86 and x86_64 UP and SMP allmodconfig and a custom test config.
* powerpc and powerpc64 SMP allmodconfig
* sparc and sparc64 SMP allmodconfig
* ia64 SMP allmodconfig
* s390 SMP allmodconfig
* alpha SMP allmodconfig
* um on x86_64 SMP allmodconfig
8. percpu.h modifications were reverted so that it could be applied as
a separate patch and serve as bisection point.
Given the fact that I had only a couple of failures from tests on step
6, I'm fairly confident about the coverage of this conversion patch.
If there is a breakage, it's likely to be something in one of the arch
headers which should be easily discoverable easily on most builds of
the specific arch.
Signed-off-by: Tejun Heo <tj@kernel.org>
Guess-its-ok-by: Christoph Lameter <cl@linux-foundation.org>
Cc: Ingo Molnar <mingo@redhat.com>
Cc: Lee Schermerhorn <Lee.Schermerhorn@hp.com>
2010-03-24 11:04:11 +03:00
# include <linux/gfp.h>
2009-10-30 08:47:10 +03:00
# include <linux/sched.h>
# include <linux/vmalloc.h>
2010-03-24 23:48:32 +03:00
# include <linux/highmem.h>
2009-10-30 08:47:10 +03:00
2013-10-07 20:48:01 +04:00
# include "book3s.h"
2011-06-29 04:17:33 +04:00
# include "trace.h"
2009-10-30 08:47:10 +03:00
# define VCPU_STAT(x) offsetof(struct kvm_vcpu, stat.x), KVM_STAT_VCPU
/* #define EXIT_DEBUG */
2010-04-16 02:11:53 +04:00
2009-10-30 08:47:10 +03:00
struct kvm_stats_debugfs_item debugfs_entries [ ] = {
{ " exits " , VCPU_STAT ( sum_exits ) } ,
{ " mmio " , VCPU_STAT ( mmio_exits ) } ,
{ " sig " , VCPU_STAT ( signal_exits ) } ,
{ " sysc " , VCPU_STAT ( syscall_exits ) } ,
{ " inst_emu " , VCPU_STAT ( emulated_inst_exits ) } ,
{ " dec " , VCPU_STAT ( dec_exits ) } ,
{ " ext_intr " , VCPU_STAT ( ext_intr_exits ) } ,
{ " queue_intr " , VCPU_STAT ( queue_intr ) } ,
{ " halt_wakeup " , VCPU_STAT ( halt_wakeup ) } ,
{ " pf_storage " , VCPU_STAT ( pf_storage ) } ,
{ " sp_storage " , VCPU_STAT ( sp_storage ) } ,
{ " pf_instruc " , VCPU_STAT ( pf_instruc ) } ,
{ " sp_instruc " , VCPU_STAT ( sp_instruc ) } ,
{ " ld " , VCPU_STAT ( ld ) } ,
{ " ld_slow " , VCPU_STAT ( ld_slow ) } ,
{ " st " , VCPU_STAT ( st ) } ,
{ " st_slow " , VCPU_STAT ( st_slow ) } ,
{ NULL }
} ;
void kvmppc_core_load_host_debugstate ( struct kvm_vcpu * vcpu )
{
}
void kvmppc_core_load_guest_debugstate ( struct kvm_vcpu * vcpu )
{
}
2013-10-07 20:47:56 +04:00
static inline unsigned long kvmppc_interrupt_offset ( struct kvm_vcpu * vcpu )
{
2013-10-07 20:48:02 +04:00
if ( ! is_kvmppc_hv_enabled ( vcpu - > kvm ) )
2013-10-07 20:47:56 +04:00
return to_book3s ( vcpu ) - > hior ;
return 0 ;
}
static inline void kvmppc_update_int_pending ( struct kvm_vcpu * vcpu ,
unsigned long pending_now , unsigned long old_pending )
{
2013-10-07 20:48:02 +04:00
if ( is_kvmppc_hv_enabled ( vcpu - > kvm ) )
2013-10-07 20:47:56 +04:00
return ;
if ( pending_now )
vcpu - > arch . shared - > int_pending = 1 ;
else if ( old_pending )
vcpu - > arch . shared - > int_pending = 0 ;
}
static inline bool kvmppc_critical_section ( struct kvm_vcpu * vcpu )
{
ulong crit_raw ;
ulong crit_r1 ;
bool crit ;
2013-10-07 20:48:02 +04:00
if ( is_kvmppc_hv_enabled ( vcpu - > kvm ) )
2013-10-07 20:47:56 +04:00
return false ;
crit_raw = vcpu - > arch . shared - > critical ;
crit_r1 = kvmppc_get_gpr ( vcpu , 1 ) ;
/* Truncate crit indicators in 32 bit mode */
if ( ! ( vcpu - > arch . shared - > msr & MSR_SF ) ) {
crit_raw & = 0xffffffff ;
crit_r1 & = 0xffffffff ;
}
/* Critical section when crit == r1 */
crit = ( crit_raw = = crit_r1 ) ;
/* ... and we're in supervisor mode */
crit = crit & & ! ( vcpu - > arch . shared - > msr & MSR_PR ) ;
return crit ;
}
2009-10-30 08:47:10 +03:00
void kvmppc_inject_interrupt ( struct kvm_vcpu * vcpu , int vec , u64 flags )
{
2010-07-29 16:47:46 +04:00
vcpu - > arch . shared - > srr0 = kvmppc_get_pc ( vcpu ) ;
vcpu - > arch . shared - > srr1 = vcpu - > arch . shared - > msr | flags ;
2011-06-29 04:17:58 +04:00
kvmppc_set_pc ( vcpu , kvmppc_interrupt_offset ( vcpu ) + vec ) ;
2009-10-30 08:47:10 +03:00
vcpu - > arch . mmu . reset_msr ( vcpu ) ;
}
2009-12-21 22:21:23 +03:00
static int kvmppc_book3s_vec2irqprio ( unsigned int vec )
2009-10-30 08:47:10 +03:00
{
unsigned int prio ;
switch ( vec ) {
case 0x100 : prio = BOOK3S_IRQPRIO_SYSTEM_RESET ; break ;
case 0x200 : prio = BOOK3S_IRQPRIO_MACHINE_CHECK ; break ;
case 0x300 : prio = BOOK3S_IRQPRIO_DATA_STORAGE ; break ;
case 0x380 : prio = BOOK3S_IRQPRIO_DATA_SEGMENT ; break ;
case 0x400 : prio = BOOK3S_IRQPRIO_INST_STORAGE ; break ;
case 0x480 : prio = BOOK3S_IRQPRIO_INST_SEGMENT ; break ;
case 0x500 : prio = BOOK3S_IRQPRIO_EXTERNAL ; break ;
2010-08-30 12:44:15 +04:00
case 0x501 : prio = BOOK3S_IRQPRIO_EXTERNAL_LEVEL ; break ;
2009-10-30 08:47:10 +03:00
case 0x600 : prio = BOOK3S_IRQPRIO_ALIGNMENT ; break ;
case 0x700 : prio = BOOK3S_IRQPRIO_PROGRAM ; break ;
case 0x800 : prio = BOOK3S_IRQPRIO_FP_UNAVAIL ; break ;
case 0x900 : prio = BOOK3S_IRQPRIO_DECREMENTER ; break ;
case 0xc00 : prio = BOOK3S_IRQPRIO_SYSCALL ; break ;
case 0xd00 : prio = BOOK3S_IRQPRIO_DEBUG ; break ;
case 0xf20 : prio = BOOK3S_IRQPRIO_ALTIVEC ; break ;
case 0xf40 : prio = BOOK3S_IRQPRIO_VSX ; break ;
default : prio = BOOK3S_IRQPRIO_MAX ; break ;
}
2009-12-21 22:21:23 +03:00
return prio ;
}
2013-04-18 00:30:26 +04:00
void kvmppc_book3s_dequeue_irqprio ( struct kvm_vcpu * vcpu ,
2009-12-21 22:21:24 +03:00
unsigned int vec )
{
2011-06-29 04:17:58 +04:00
unsigned long old_pending = vcpu - > arch . pending_exceptions ;
2009-12-21 22:21:24 +03:00
clear_bit ( kvmppc_book3s_vec2irqprio ( vec ) ,
& vcpu - > arch . pending_exceptions ) ;
2010-08-05 14:24:40 +04:00
2011-06-29 04:17:58 +04:00
kvmppc_update_int_pending ( vcpu , vcpu - > arch . pending_exceptions ,
old_pending ) ;
2009-12-21 22:21:24 +03:00
}
2009-12-21 22:21:23 +03:00
void kvmppc_book3s_queue_irqprio ( struct kvm_vcpu * vcpu , unsigned int vec )
{
vcpu - > stat . queue_intr + + ;
set_bit ( kvmppc_book3s_vec2irqprio ( vec ) ,
& vcpu - > arch . pending_exceptions ) ;
2009-10-30 08:47:10 +03:00
# ifdef EXIT_DEBUG
printk ( KERN_INFO " Queueing interrupt %x \n " , vec ) ;
# endif
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_book3s_queue_irqprio ) ;
2009-10-30 08:47:10 +03:00
2010-01-08 04:58:07 +03:00
void kvmppc_core_queue_program ( struct kvm_vcpu * vcpu , ulong flags )
2009-10-30 08:47:10 +03:00
{
2011-06-29 04:18:52 +04:00
/* might as well deliver this straight away */
kvmppc_inject_interrupt ( vcpu , BOOK3S_INTERRUPT_PROGRAM , flags ) ;
2009-10-30 08:47:10 +03:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_core_queue_program ) ;
2009-10-30 08:47:10 +03:00
void kvmppc_core_queue_dec ( struct kvm_vcpu * vcpu )
{
kvmppc_book3s_queue_irqprio ( vcpu , BOOK3S_INTERRUPT_DECREMENTER ) ;
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_core_queue_dec ) ;
2009-10-30 08:47:10 +03:00
int kvmppc_core_pending_dec ( struct kvm_vcpu * vcpu )
{
2011-05-11 04:38:50 +04:00
return test_bit ( BOOK3S_IRQPRIO_DECREMENTER , & vcpu - > arch . pending_exceptions ) ;
2009-10-30 08:47:10 +03:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_core_pending_dec ) ;
2009-10-30 08:47:10 +03:00
2009-12-21 22:21:24 +03:00
void kvmppc_core_dequeue_dec ( struct kvm_vcpu * vcpu )
{
kvmppc_book3s_dequeue_irqprio ( vcpu , BOOK3S_INTERRUPT_DECREMENTER ) ;
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_core_dequeue_dec ) ;
2009-12-21 22:21:24 +03:00
2009-10-30 08:47:10 +03:00
void kvmppc_core_queue_external ( struct kvm_vcpu * vcpu ,
struct kvm_interrupt * irq )
{
2010-08-30 12:44:15 +04:00
unsigned int vec = BOOK3S_INTERRUPT_EXTERNAL ;
if ( irq - > irq = = KVM_INTERRUPT_SET_LEVEL )
vec = BOOK3S_INTERRUPT_EXTERNAL_LEVEL ;
kvmppc_book3s_queue_irqprio ( vcpu , vec ) ;
2009-10-30 08:47:10 +03:00
}
2013-02-14 18:00:25 +04:00
void kvmppc_core_dequeue_external ( struct kvm_vcpu * vcpu )
2010-03-24 23:48:18 +03:00
{
kvmppc_book3s_dequeue_irqprio ( vcpu , BOOK3S_INTERRUPT_EXTERNAL ) ;
2010-08-30 12:44:15 +04:00
kvmppc_book3s_dequeue_irqprio ( vcpu , BOOK3S_INTERRUPT_EXTERNAL_LEVEL ) ;
2010-03-24 23:48:18 +03:00
}
2009-10-30 08:47:10 +03:00
int kvmppc_book3s_irqprio_deliver ( struct kvm_vcpu * vcpu , unsigned int priority )
{
int deliver = 1 ;
int vec = 0 ;
2011-06-29 04:17:58 +04:00
bool crit = kvmppc_critical_section ( vcpu ) ;
2009-10-30 08:47:10 +03:00
switch ( priority ) {
case BOOK3S_IRQPRIO_DECREMENTER :
2010-07-29 16:47:49 +04:00
deliver = ( vcpu - > arch . shared - > msr & MSR_EE ) & & ! crit ;
2009-10-30 08:47:10 +03:00
vec = BOOK3S_INTERRUPT_DECREMENTER ;
break ;
case BOOK3S_IRQPRIO_EXTERNAL :
2010-08-30 12:44:15 +04:00
case BOOK3S_IRQPRIO_EXTERNAL_LEVEL :
2010-07-29 16:47:49 +04:00
deliver = ( vcpu - > arch . shared - > msr & MSR_EE ) & & ! crit ;
2009-10-30 08:47:10 +03:00
vec = BOOK3S_INTERRUPT_EXTERNAL ;
break ;
case BOOK3S_IRQPRIO_SYSTEM_RESET :
vec = BOOK3S_INTERRUPT_SYSTEM_RESET ;
break ;
case BOOK3S_IRQPRIO_MACHINE_CHECK :
vec = BOOK3S_INTERRUPT_MACHINE_CHECK ;
break ;
case BOOK3S_IRQPRIO_DATA_STORAGE :
vec = BOOK3S_INTERRUPT_DATA_STORAGE ;
break ;
case BOOK3S_IRQPRIO_INST_STORAGE :
vec = BOOK3S_INTERRUPT_INST_STORAGE ;
break ;
case BOOK3S_IRQPRIO_DATA_SEGMENT :
vec = BOOK3S_INTERRUPT_DATA_SEGMENT ;
break ;
case BOOK3S_IRQPRIO_INST_SEGMENT :
vec = BOOK3S_INTERRUPT_INST_SEGMENT ;
break ;
case BOOK3S_IRQPRIO_ALIGNMENT :
vec = BOOK3S_INTERRUPT_ALIGNMENT ;
break ;
case BOOK3S_IRQPRIO_PROGRAM :
vec = BOOK3S_INTERRUPT_PROGRAM ;
break ;
case BOOK3S_IRQPRIO_VSX :
vec = BOOK3S_INTERRUPT_VSX ;
break ;
case BOOK3S_IRQPRIO_ALTIVEC :
vec = BOOK3S_INTERRUPT_ALTIVEC ;
break ;
case BOOK3S_IRQPRIO_FP_UNAVAIL :
vec = BOOK3S_INTERRUPT_FP_UNAVAIL ;
break ;
case BOOK3S_IRQPRIO_SYSCALL :
vec = BOOK3S_INTERRUPT_SYSCALL ;
break ;
case BOOK3S_IRQPRIO_DEBUG :
vec = BOOK3S_INTERRUPT_TRACE ;
break ;
case BOOK3S_IRQPRIO_PERFORMANCE_MONITOR :
vec = BOOK3S_INTERRUPT_PERFMON ;
break ;
default :
deliver = 0 ;
printk ( KERN_ERR " KVM: Unknown interrupt: 0x%x \n " , priority ) ;
break ;
}
#if 0
printk ( KERN_INFO " Deliver interrupt 0x%x? %x \n " , vec , deliver ) ;
# endif
if ( deliver )
2011-06-29 04:18:52 +04:00
kvmppc_inject_interrupt ( vcpu , vec , 0 ) ;
2009-10-30 08:47:10 +03:00
return deliver ;
}
2010-08-30 12:44:15 +04:00
/*
* This function determines if an irqprio should be cleared once issued .
*/
static bool clear_irqprio ( struct kvm_vcpu * vcpu , unsigned int priority )
{
switch ( priority ) {
case BOOK3S_IRQPRIO_DECREMENTER :
/* DEC interrupts get cleared by mtdec */
return false ;
case BOOK3S_IRQPRIO_EXTERNAL_LEVEL :
/* External interrupts get cleared by userspace */
return false ;
}
return true ;
}
2012-02-16 18:07:37 +04:00
int kvmppc_core_prepare_to_enter ( struct kvm_vcpu * vcpu )
2009-10-30 08:47:10 +03:00
{
unsigned long * pending = & vcpu - > arch . pending_exceptions ;
2010-07-29 16:47:51 +04:00
unsigned long old_pending = vcpu - > arch . pending_exceptions ;
2009-10-30 08:47:10 +03:00
unsigned int priority ;
# ifdef EXIT_DEBUG
if ( vcpu - > arch . pending_exceptions )
printk ( KERN_EMERG " KVM: Check pending: %lx \n " , vcpu - > arch . pending_exceptions ) ;
# endif
priority = __ffs ( * pending ) ;
2010-04-16 02:11:56 +04:00
while ( priority < BOOK3S_IRQPRIO_MAX ) {
2009-12-21 22:21:24 +03:00
if ( kvmppc_book3s_irqprio_deliver ( vcpu , priority ) & &
2010-08-30 12:44:15 +04:00
clear_irqprio ( vcpu , priority ) ) {
2009-10-30 08:47:10 +03:00
clear_bit ( priority , & vcpu - > arch . pending_exceptions ) ;
break ;
}
priority = find_next_bit ( pending ,
BITS_PER_BYTE * sizeof ( * pending ) ,
priority + 1 ) ;
}
2010-07-29 16:47:51 +04:00
/* Tell the guest about our interrupt status */
2011-06-29 04:17:58 +04:00
kvmppc_update_int_pending ( vcpu , * pending , old_pending ) ;
2012-02-16 18:07:37 +04:00
return 0 ;
2009-10-30 08:47:10 +03:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_core_prepare_to_enter ) ;
2009-10-30 08:47:10 +03:00
KVM: PPC: Book3S PR: Better handling of host-side read-only pages
Currently we request write access to all pages that get mapped into the
guest, even if the guest is only loading from the page. This reduces
the effectiveness of KSM because it means that we unshare every page we
access. Also, we always set the changed (C) bit in the guest HPTE if
it allows writing, even for a guest load.
This fixes both these problems. We pass an 'iswrite' flag to the
mmu.xlate() functions and to kvmppc_mmu_map_page() to indicate whether
the access is a load or a store. The mmu.xlate() functions now only
set C for stores. kvmppc_gfn_to_pfn() now calls gfn_to_pfn_prot()
instead of gfn_to_pfn() so that it can indicate whether we need write
access to the page, and get back a 'writable' flag to indicate whether
the page is writable or not. If that 'writable' flag is clear, we then
make the host HPTE read-only even if the guest HPTE allowed writing.
This means that we can get a protection fault when the guest writes to a
page that it has mapped read-write but which is read-only on the host
side (perhaps due to KSM having merged the page). Thus we now call
kvmppc_handle_pagefault() for protection faults as well as HPTE not found
faults. In kvmppc_handle_pagefault(), if the access was allowed by the
guest HPTE and we thus need to install a new host HPTE, we then need to
remove the old host HPTE if there is one. This is done with a new
function, kvmppc_mmu_unmap_page(), which uses kvmppc_mmu_pte_vflush() to
find and remove the old host HPTE.
Since the memslot-related functions require the KVM SRCU read lock to
be held, this adds srcu_read_lock/unlock pairs around the calls to
kvmppc_handle_pagefault().
Finally, this changes kvmppc_mmu_book3s_32_xlate_pte() to not ignore
guest HPTEs that don't permit access, and to return -EPERM for accesses
that are not permitted by the page protections.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2013-09-20 08:52:51 +04:00
pfn_t kvmppc_gfn_to_pfn ( struct kvm_vcpu * vcpu , gfn_t gfn , bool writing ,
bool * writable )
2010-07-29 16:47:54 +04:00
{
ulong mp_pa = vcpu - > arch . magic_page_pa ;
2012-03-14 01:52:44 +04:00
if ( ! ( vcpu - > arch . shared - > msr & MSR_SF ) )
mp_pa = ( uint32_t ) mp_pa ;
2010-07-29 16:47:54 +04:00
/* Magic page override */
if ( unlikely ( mp_pa ) & &
unlikely ( ( ( gfn < < PAGE_SHIFT ) & KVM_PAM ) = =
( ( mp_pa & PAGE_MASK ) & KVM_PAM ) ) ) {
ulong shared_page = ( ( ulong ) vcpu - > arch . shared ) & PAGE_MASK ;
pfn_t pfn ;
pfn = ( pfn_t ) virt_to_phys ( ( void * ) shared_page ) > > PAGE_SHIFT ;
get_page ( pfn_to_page ( pfn ) ) ;
KVM: PPC: Book3S PR: Better handling of host-side read-only pages
Currently we request write access to all pages that get mapped into the
guest, even if the guest is only loading from the page. This reduces
the effectiveness of KSM because it means that we unshare every page we
access. Also, we always set the changed (C) bit in the guest HPTE if
it allows writing, even for a guest load.
This fixes both these problems. We pass an 'iswrite' flag to the
mmu.xlate() functions and to kvmppc_mmu_map_page() to indicate whether
the access is a load or a store. The mmu.xlate() functions now only
set C for stores. kvmppc_gfn_to_pfn() now calls gfn_to_pfn_prot()
instead of gfn_to_pfn() so that it can indicate whether we need write
access to the page, and get back a 'writable' flag to indicate whether
the page is writable or not. If that 'writable' flag is clear, we then
make the host HPTE read-only even if the guest HPTE allowed writing.
This means that we can get a protection fault when the guest writes to a
page that it has mapped read-write but which is read-only on the host
side (perhaps due to KSM having merged the page). Thus we now call
kvmppc_handle_pagefault() for protection faults as well as HPTE not found
faults. In kvmppc_handle_pagefault(), if the access was allowed by the
guest HPTE and we thus need to install a new host HPTE, we then need to
remove the old host HPTE if there is one. This is done with a new
function, kvmppc_mmu_unmap_page(), which uses kvmppc_mmu_pte_vflush() to
find and remove the old host HPTE.
Since the memslot-related functions require the KVM SRCU read lock to
be held, this adds srcu_read_lock/unlock pairs around the calls to
kvmppc_handle_pagefault().
Finally, this changes kvmppc_mmu_book3s_32_xlate_pte() to not ignore
guest HPTEs that don't permit access, and to return -EPERM for accesses
that are not permitted by the page protections.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2013-09-20 08:52:51 +04:00
if ( writable )
* writable = true ;
2010-07-29 16:47:54 +04:00
return pfn ;
}
KVM: PPC: Book3S PR: Better handling of host-side read-only pages
Currently we request write access to all pages that get mapped into the
guest, even if the guest is only loading from the page. This reduces
the effectiveness of KSM because it means that we unshare every page we
access. Also, we always set the changed (C) bit in the guest HPTE if
it allows writing, even for a guest load.
This fixes both these problems. We pass an 'iswrite' flag to the
mmu.xlate() functions and to kvmppc_mmu_map_page() to indicate whether
the access is a load or a store. The mmu.xlate() functions now only
set C for stores. kvmppc_gfn_to_pfn() now calls gfn_to_pfn_prot()
instead of gfn_to_pfn() so that it can indicate whether we need write
access to the page, and get back a 'writable' flag to indicate whether
the page is writable or not. If that 'writable' flag is clear, we then
make the host HPTE read-only even if the guest HPTE allowed writing.
This means that we can get a protection fault when the guest writes to a
page that it has mapped read-write but which is read-only on the host
side (perhaps due to KSM having merged the page). Thus we now call
kvmppc_handle_pagefault() for protection faults as well as HPTE not found
faults. In kvmppc_handle_pagefault(), if the access was allowed by the
guest HPTE and we thus need to install a new host HPTE, we then need to
remove the old host HPTE if there is one. This is done with a new
function, kvmppc_mmu_unmap_page(), which uses kvmppc_mmu_pte_vflush() to
find and remove the old host HPTE.
Since the memslot-related functions require the KVM SRCU read lock to
be held, this adds srcu_read_lock/unlock pairs around the calls to
kvmppc_handle_pagefault().
Finally, this changes kvmppc_mmu_book3s_32_xlate_pte() to not ignore
guest HPTEs that don't permit access, and to return -EPERM for accesses
that are not permitted by the page protections.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2013-09-20 08:52:51 +04:00
return gfn_to_pfn_prot ( vcpu - > kvm , gfn , writing , writable ) ;
2010-07-29 16:47:54 +04:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_gfn_to_pfn ) ;
2010-07-29 16:47:54 +04:00
2009-10-30 08:47:10 +03:00
static int kvmppc_xlate ( struct kvm_vcpu * vcpu , ulong eaddr , bool data ,
KVM: PPC: Book3S PR: Better handling of host-side read-only pages
Currently we request write access to all pages that get mapped into the
guest, even if the guest is only loading from the page. This reduces
the effectiveness of KSM because it means that we unshare every page we
access. Also, we always set the changed (C) bit in the guest HPTE if
it allows writing, even for a guest load.
This fixes both these problems. We pass an 'iswrite' flag to the
mmu.xlate() functions and to kvmppc_mmu_map_page() to indicate whether
the access is a load or a store. The mmu.xlate() functions now only
set C for stores. kvmppc_gfn_to_pfn() now calls gfn_to_pfn_prot()
instead of gfn_to_pfn() so that it can indicate whether we need write
access to the page, and get back a 'writable' flag to indicate whether
the page is writable or not. If that 'writable' flag is clear, we then
make the host HPTE read-only even if the guest HPTE allowed writing.
This means that we can get a protection fault when the guest writes to a
page that it has mapped read-write but which is read-only on the host
side (perhaps due to KSM having merged the page). Thus we now call
kvmppc_handle_pagefault() for protection faults as well as HPTE not found
faults. In kvmppc_handle_pagefault(), if the access was allowed by the
guest HPTE and we thus need to install a new host HPTE, we then need to
remove the old host HPTE if there is one. This is done with a new
function, kvmppc_mmu_unmap_page(), which uses kvmppc_mmu_pte_vflush() to
find and remove the old host HPTE.
Since the memslot-related functions require the KVM SRCU read lock to
be held, this adds srcu_read_lock/unlock pairs around the calls to
kvmppc_handle_pagefault().
Finally, this changes kvmppc_mmu_book3s_32_xlate_pte() to not ignore
guest HPTEs that don't permit access, and to return -EPERM for accesses
that are not permitted by the page protections.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2013-09-20 08:52:51 +04:00
bool iswrite , struct kvmppc_pte * pte )
2009-10-30 08:47:10 +03:00
{
2010-07-29 16:47:43 +04:00
int relocated = ( vcpu - > arch . shared - > msr & ( data ? MSR_DR : MSR_IR ) ) ;
2009-10-30 08:47:10 +03:00
int r ;
if ( relocated ) {
KVM: PPC: Book3S PR: Better handling of host-side read-only pages
Currently we request write access to all pages that get mapped into the
guest, even if the guest is only loading from the page. This reduces
the effectiveness of KSM because it means that we unshare every page we
access. Also, we always set the changed (C) bit in the guest HPTE if
it allows writing, even for a guest load.
This fixes both these problems. We pass an 'iswrite' flag to the
mmu.xlate() functions and to kvmppc_mmu_map_page() to indicate whether
the access is a load or a store. The mmu.xlate() functions now only
set C for stores. kvmppc_gfn_to_pfn() now calls gfn_to_pfn_prot()
instead of gfn_to_pfn() so that it can indicate whether we need write
access to the page, and get back a 'writable' flag to indicate whether
the page is writable or not. If that 'writable' flag is clear, we then
make the host HPTE read-only even if the guest HPTE allowed writing.
This means that we can get a protection fault when the guest writes to a
page that it has mapped read-write but which is read-only on the host
side (perhaps due to KSM having merged the page). Thus we now call
kvmppc_handle_pagefault() for protection faults as well as HPTE not found
faults. In kvmppc_handle_pagefault(), if the access was allowed by the
guest HPTE and we thus need to install a new host HPTE, we then need to
remove the old host HPTE if there is one. This is done with a new
function, kvmppc_mmu_unmap_page(), which uses kvmppc_mmu_pte_vflush() to
find and remove the old host HPTE.
Since the memslot-related functions require the KVM SRCU read lock to
be held, this adds srcu_read_lock/unlock pairs around the calls to
kvmppc_handle_pagefault().
Finally, this changes kvmppc_mmu_book3s_32_xlate_pte() to not ignore
guest HPTEs that don't permit access, and to return -EPERM for accesses
that are not permitted by the page protections.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2013-09-20 08:52:51 +04:00
r = vcpu - > arch . mmu . xlate ( vcpu , eaddr , pte , data , iswrite ) ;
2009-10-30 08:47:10 +03:00
} else {
pte - > eaddr = eaddr ;
2010-07-29 16:47:52 +04:00
pte - > raddr = eaddr & KVM_PAM ;
2010-03-24 23:48:17 +03:00
pte - > vpage = VSID_REAL | eaddr > > 12 ;
2009-10-30 08:47:10 +03:00
pte - > may_read = true ;
pte - > may_write = true ;
pte - > may_execute = true ;
r = 0 ;
}
return r ;
}
static hva_t kvmppc_bad_hva ( void )
{
return PAGE_OFFSET ;
}
static hva_t kvmppc_pte_to_hva ( struct kvm_vcpu * vcpu , struct kvmppc_pte * pte ,
bool read )
{
hva_t hpage ;
if ( read & & ! pte - > may_read )
goto err ;
if ( ! read & & ! pte - > may_write )
goto err ;
hpage = gfn_to_hva ( vcpu - > kvm , pte - > raddr > > PAGE_SHIFT ) ;
if ( kvm_is_error_hva ( hpage ) )
goto err ;
return hpage | ( pte - > raddr & ~ PAGE_MASK ) ;
err :
return kvmppc_bad_hva ( ) ;
}
2010-02-19 13:00:38 +03:00
int kvmppc_st ( struct kvm_vcpu * vcpu , ulong * eaddr , int size , void * ptr ,
bool data )
2009-10-30 08:47:10 +03:00
{
struct kvmppc_pte pte ;
vcpu - > stat . st + + ;
KVM: PPC: Book3S PR: Better handling of host-side read-only pages
Currently we request write access to all pages that get mapped into the
guest, even if the guest is only loading from the page. This reduces
the effectiveness of KSM because it means that we unshare every page we
access. Also, we always set the changed (C) bit in the guest HPTE if
it allows writing, even for a guest load.
This fixes both these problems. We pass an 'iswrite' flag to the
mmu.xlate() functions and to kvmppc_mmu_map_page() to indicate whether
the access is a load or a store. The mmu.xlate() functions now only
set C for stores. kvmppc_gfn_to_pfn() now calls gfn_to_pfn_prot()
instead of gfn_to_pfn() so that it can indicate whether we need write
access to the page, and get back a 'writable' flag to indicate whether
the page is writable or not. If that 'writable' flag is clear, we then
make the host HPTE read-only even if the guest HPTE allowed writing.
This means that we can get a protection fault when the guest writes to a
page that it has mapped read-write but which is read-only on the host
side (perhaps due to KSM having merged the page). Thus we now call
kvmppc_handle_pagefault() for protection faults as well as HPTE not found
faults. In kvmppc_handle_pagefault(), if the access was allowed by the
guest HPTE and we thus need to install a new host HPTE, we then need to
remove the old host HPTE if there is one. This is done with a new
function, kvmppc_mmu_unmap_page(), which uses kvmppc_mmu_pte_vflush() to
find and remove the old host HPTE.
Since the memslot-related functions require the KVM SRCU read lock to
be held, this adds srcu_read_lock/unlock pairs around the calls to
kvmppc_handle_pagefault().
Finally, this changes kvmppc_mmu_book3s_32_xlate_pte() to not ignore
guest HPTEs that don't permit access, and to return -EPERM for accesses
that are not permitted by the page protections.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2013-09-20 08:52:51 +04:00
if ( kvmppc_xlate ( vcpu , * eaddr , data , true , & pte ) )
2010-03-24 23:48:32 +03:00
return - ENOENT ;
2010-02-19 13:00:38 +03:00
* eaddr = pte . raddr ;
2009-10-30 08:47:10 +03:00
2010-03-24 23:48:32 +03:00
if ( ! pte . may_write )
return - EPERM ;
2009-10-30 08:47:10 +03:00
2010-03-24 23:48:32 +03:00
if ( kvm_write_guest ( vcpu - > kvm , pte . raddr , ptr , size ) )
return EMULATE_DO_MMIO ;
2009-10-30 08:47:10 +03:00
2010-02-19 13:00:38 +03:00
return EMULATE_DONE ;
2009-10-30 08:47:10 +03:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_st ) ;
2009-10-30 08:47:10 +03:00
2010-02-19 13:00:38 +03:00
int kvmppc_ld ( struct kvm_vcpu * vcpu , ulong * eaddr , int size , void * ptr ,
2009-10-30 08:47:10 +03:00
bool data )
{
struct kvmppc_pte pte ;
2010-02-19 13:00:38 +03:00
hva_t hva = * eaddr ;
2009-10-30 08:47:10 +03:00
vcpu - > stat . ld + + ;
KVM: PPC: Book3S PR: Better handling of host-side read-only pages
Currently we request write access to all pages that get mapped into the
guest, even if the guest is only loading from the page. This reduces
the effectiveness of KSM because it means that we unshare every page we
access. Also, we always set the changed (C) bit in the guest HPTE if
it allows writing, even for a guest load.
This fixes both these problems. We pass an 'iswrite' flag to the
mmu.xlate() functions and to kvmppc_mmu_map_page() to indicate whether
the access is a load or a store. The mmu.xlate() functions now only
set C for stores. kvmppc_gfn_to_pfn() now calls gfn_to_pfn_prot()
instead of gfn_to_pfn() so that it can indicate whether we need write
access to the page, and get back a 'writable' flag to indicate whether
the page is writable or not. If that 'writable' flag is clear, we then
make the host HPTE read-only even if the guest HPTE allowed writing.
This means that we can get a protection fault when the guest writes to a
page that it has mapped read-write but which is read-only on the host
side (perhaps due to KSM having merged the page). Thus we now call
kvmppc_handle_pagefault() for protection faults as well as HPTE not found
faults. In kvmppc_handle_pagefault(), if the access was allowed by the
guest HPTE and we thus need to install a new host HPTE, we then need to
remove the old host HPTE if there is one. This is done with a new
function, kvmppc_mmu_unmap_page(), which uses kvmppc_mmu_pte_vflush() to
find and remove the old host HPTE.
Since the memslot-related functions require the KVM SRCU read lock to
be held, this adds srcu_read_lock/unlock pairs around the calls to
kvmppc_handle_pagefault().
Finally, this changes kvmppc_mmu_book3s_32_xlate_pte() to not ignore
guest HPTEs that don't permit access, and to return -EPERM for accesses
that are not permitted by the page protections.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2013-09-20 08:52:51 +04:00
if ( kvmppc_xlate ( vcpu , * eaddr , data , false , & pte ) )
2010-02-19 13:00:38 +03:00
goto nopte ;
* eaddr = pte . raddr ;
2009-10-30 08:47:10 +03:00
hva = kvmppc_pte_to_hva ( vcpu , & pte , true ) ;
if ( kvm_is_error_hva ( hva ) )
2010-02-19 13:00:38 +03:00
goto mmio ;
2009-10-30 08:47:10 +03:00
if ( copy_from_user ( ptr , ( void __user * ) hva , size ) ) {
printk ( KERN_INFO " kvmppc_ld at 0x%lx failed \n " , hva ) ;
2010-02-19 13:00:38 +03:00
goto mmio ;
2009-10-30 08:47:10 +03:00
}
2010-02-19 13:00:38 +03:00
return EMULATE_DONE ;
2009-10-30 08:47:10 +03:00
2010-02-19 13:00:38 +03:00
nopte :
2009-10-30 08:47:10 +03:00
return - ENOENT ;
2010-02-19 13:00:38 +03:00
mmio :
return EMULATE_DO_MMIO ;
2009-10-30 08:47:10 +03:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_ld ) ;
2009-10-30 08:47:10 +03:00
int kvm_arch_vcpu_setup ( struct kvm_vcpu * vcpu )
{
return 0 ;
}
2012-08-09 00:38:19 +04:00
int kvmppc_subarch_vcpu_init ( struct kvm_vcpu * vcpu )
{
return 0 ;
}
void kvmppc_subarch_vcpu_uninit ( struct kvm_vcpu * vcpu )
{
}
2013-10-07 20:47:53 +04:00
int kvm_arch_vcpu_ioctl_get_sregs ( struct kvm_vcpu * vcpu ,
struct kvm_sregs * sregs )
{
2013-10-07 20:48:01 +04:00
return vcpu - > kvm - > arch . kvm_ops - > get_sregs ( vcpu , sregs ) ;
2013-10-07 20:47:53 +04:00
}
int kvm_arch_vcpu_ioctl_set_sregs ( struct kvm_vcpu * vcpu ,
struct kvm_sregs * sregs )
{
2013-10-07 20:48:01 +04:00
return vcpu - > kvm - > arch . kvm_ops - > set_sregs ( vcpu , sregs ) ;
2013-10-07 20:47:53 +04:00
}
2009-10-30 08:47:10 +03:00
int kvm_arch_vcpu_ioctl_get_regs ( struct kvm_vcpu * vcpu , struct kvm_regs * regs )
{
int i ;
2010-04-16 02:11:40 +04:00
regs - > pc = kvmppc_get_pc ( vcpu ) ;
2010-01-08 04:58:02 +03:00
regs - > cr = kvmppc_get_cr ( vcpu ) ;
2010-04-16 02:11:40 +04:00
regs - > ctr = kvmppc_get_ctr ( vcpu ) ;
regs - > lr = kvmppc_get_lr ( vcpu ) ;
2010-01-08 04:58:02 +03:00
regs - > xer = kvmppc_get_xer ( vcpu ) ;
2010-07-29 16:47:43 +04:00
regs - > msr = vcpu - > arch . shared - > msr ;
2010-07-29 16:47:46 +04:00
regs - > srr0 = vcpu - > arch . shared - > srr0 ;
regs - > srr1 = vcpu - > arch . shared - > srr1 ;
2009-10-30 08:47:10 +03:00
regs - > pid = vcpu - > arch . pid ;
2010-07-29 16:47:47 +04:00
regs - > sprg0 = vcpu - > arch . shared - > sprg0 ;
regs - > sprg1 = vcpu - > arch . shared - > sprg1 ;
regs - > sprg2 = vcpu - > arch . shared - > sprg2 ;
regs - > sprg3 = vcpu - > arch . shared - > sprg3 ;
KVM: PPC: Paravirtualize SPRG4-7, ESR, PIR, MASn
This allows additional registers to be accessed by the guest
in PR-mode KVM without trapping.
SPRG4-7 are readable from userspace. On booke, KVM will sync
these registers when it enters the guest, so that accesses from
guest userspace will work. The guest kernel, OTOH, must consistently
use either the real registers or the shared area between exits. This
also applies to the already-paravirted SPRG3.
On non-booke, it's not clear to what extent SPRG4-7 are supported
(they're not architected for book3s, but exist on at least some classic
chips). They are copied in the get/set regs ioctls, but I do not see any
non-booke emulation. I also do not see any syncing with real registers
(in PR-mode) including the user-readable SPRG3. This patch should not
make that situation any worse.
Signed-off-by: Scott Wood <scottwood@freescale.com>
Signed-off-by: Alexander Graf <agraf@suse.de>
Signed-off-by: Avi Kivity <avi@redhat.com>
2011-11-09 04:23:30 +04:00
regs - > sprg4 = vcpu - > arch . shared - > sprg4 ;
regs - > sprg5 = vcpu - > arch . shared - > sprg5 ;
regs - > sprg6 = vcpu - > arch . shared - > sprg6 ;
regs - > sprg7 = vcpu - > arch . shared - > sprg7 ;
2009-10-30 08:47:10 +03:00
for ( i = 0 ; i < ARRAY_SIZE ( regs - > gpr ) ; i + + )
2010-01-08 04:58:01 +03:00
regs - > gpr [ i ] = kvmppc_get_gpr ( vcpu , i ) ;
2009-10-30 08:47:10 +03:00
return 0 ;
}
int kvm_arch_vcpu_ioctl_set_regs ( struct kvm_vcpu * vcpu , struct kvm_regs * regs )
{
int i ;
2010-04-16 02:11:40 +04:00
kvmppc_set_pc ( vcpu , regs - > pc ) ;
2010-01-08 04:58:02 +03:00
kvmppc_set_cr ( vcpu , regs - > cr ) ;
2010-04-16 02:11:40 +04:00
kvmppc_set_ctr ( vcpu , regs - > ctr ) ;
kvmppc_set_lr ( vcpu , regs - > lr ) ;
2010-01-08 04:58:02 +03:00
kvmppc_set_xer ( vcpu , regs - > xer ) ;
2009-10-30 08:47:10 +03:00
kvmppc_set_msr ( vcpu , regs - > msr ) ;
2010-07-29 16:47:46 +04:00
vcpu - > arch . shared - > srr0 = regs - > srr0 ;
vcpu - > arch . shared - > srr1 = regs - > srr1 ;
2010-07-29 16:47:47 +04:00
vcpu - > arch . shared - > sprg0 = regs - > sprg0 ;
vcpu - > arch . shared - > sprg1 = regs - > sprg1 ;
vcpu - > arch . shared - > sprg2 = regs - > sprg2 ;
vcpu - > arch . shared - > sprg3 = regs - > sprg3 ;
KVM: PPC: Paravirtualize SPRG4-7, ESR, PIR, MASn
This allows additional registers to be accessed by the guest
in PR-mode KVM without trapping.
SPRG4-7 are readable from userspace. On booke, KVM will sync
these registers when it enters the guest, so that accesses from
guest userspace will work. The guest kernel, OTOH, must consistently
use either the real registers or the shared area between exits. This
also applies to the already-paravirted SPRG3.
On non-booke, it's not clear to what extent SPRG4-7 are supported
(they're not architected for book3s, but exist on at least some classic
chips). They are copied in the get/set regs ioctls, but I do not see any
non-booke emulation. I also do not see any syncing with real registers
(in PR-mode) including the user-readable SPRG3. This patch should not
make that situation any worse.
Signed-off-by: Scott Wood <scottwood@freescale.com>
Signed-off-by: Alexander Graf <agraf@suse.de>
Signed-off-by: Avi Kivity <avi@redhat.com>
2011-11-09 04:23:30 +04:00
vcpu - > arch . shared - > sprg4 = regs - > sprg4 ;
vcpu - > arch . shared - > sprg5 = regs - > sprg5 ;
vcpu - > arch . shared - > sprg6 = regs - > sprg6 ;
vcpu - > arch . shared - > sprg7 = regs - > sprg7 ;
2009-10-30 08:47:10 +03:00
2010-01-08 04:58:01 +03:00
for ( i = 0 ; i < ARRAY_SIZE ( regs - > gpr ) ; i + + )
kvmppc_set_gpr ( vcpu , i , regs - > gpr [ i ] ) ;
2009-10-30 08:47:10 +03:00
return 0 ;
}
int kvm_arch_vcpu_ioctl_get_fpu ( struct kvm_vcpu * vcpu , struct kvm_fpu * fpu )
{
return - ENOTSUPP ;
}
int kvm_arch_vcpu_ioctl_set_fpu ( struct kvm_vcpu * vcpu , struct kvm_fpu * fpu )
{
return - ENOTSUPP ;
}
2012-09-26 00:31:56 +04:00
int kvm_vcpu_ioctl_get_one_reg ( struct kvm_vcpu * vcpu , struct kvm_one_reg * reg )
{
int r ;
union kvmppc_one_reg val ;
int size ;
2012-09-26 00:32:30 +04:00
long int i ;
2012-09-26 00:31:56 +04:00
size = one_reg_size ( reg - > id ) ;
if ( size > sizeof ( val ) )
return - EINVAL ;
2013-10-07 20:48:01 +04:00
r = vcpu - > kvm - > arch . kvm_ops - > get_one_reg ( vcpu , reg - > id , & val ) ;
2012-09-26 00:31:56 +04:00
if ( r = = - EINVAL ) {
r = 0 ;
switch ( reg - > id ) {
case KVM_REG_PPC_DAR :
val = get_reg_val ( reg - > id , vcpu - > arch . shared - > dar ) ;
break ;
case KVM_REG_PPC_DSISR :
val = get_reg_val ( reg - > id , vcpu - > arch . shared - > dsisr ) ;
break ;
2012-09-26 00:32:30 +04:00
case KVM_REG_PPC_FPR0 . . . KVM_REG_PPC_FPR31 :
i = reg - > id - KVM_REG_PPC_FPR0 ;
2013-10-15 13:43:02 +04:00
val = get_reg_val ( reg - > id , VCPU_FPR ( vcpu , i ) ) ;
2012-09-26 00:32:30 +04:00
break ;
case KVM_REG_PPC_FPSCR :
2013-10-15 13:43:02 +04:00
val = get_reg_val ( reg - > id , vcpu - > arch . fp . fpscr ) ;
2012-09-26 00:32:30 +04:00
break ;
# ifdef CONFIG_ALTIVEC
case KVM_REG_PPC_VR0 . . . KVM_REG_PPC_VR31 :
if ( ! cpu_has_feature ( CPU_FTR_ALTIVEC ) ) {
r = - ENXIO ;
break ;
}
2013-10-15 13:43:02 +04:00
val . vval = vcpu - > arch . vr . vr [ reg - > id - KVM_REG_PPC_VR0 ] ;
2012-09-26 00:32:30 +04:00
break ;
case KVM_REG_PPC_VSCR :
if ( ! cpu_has_feature ( CPU_FTR_ALTIVEC ) ) {
r = - ENXIO ;
break ;
}
2013-10-15 13:43:02 +04:00
val = get_reg_val ( reg - > id , vcpu - > arch . vr . vscr . u [ 3 ] ) ;
2012-09-26 00:32:30 +04:00
break ;
2013-09-06 07:18:32 +04:00
case KVM_REG_PPC_VRSAVE :
val = get_reg_val ( reg - > id , vcpu - > arch . vrsave ) ;
break ;
2012-09-26 00:32:30 +04:00
# endif /* CONFIG_ALTIVEC */
2013-10-15 13:43:02 +04:00
# ifdef CONFIG_VSX
case KVM_REG_PPC_VSR0 . . . KVM_REG_PPC_VSR31 :
if ( cpu_has_feature ( CPU_FTR_VSX ) ) {
long int i = reg - > id - KVM_REG_PPC_VSR0 ;
val . vsxval [ 0 ] = vcpu - > arch . fp . fpr [ i ] [ 0 ] ;
val . vsxval [ 1 ] = vcpu - > arch . fp . fpr [ i ] [ 1 ] ;
} else {
r = - ENXIO ;
}
break ;
# endif /* CONFIG_VSX */
2013-03-21 00:24:58 +04:00
case KVM_REG_PPC_DEBUG_INST : {
u32 opcode = INS_TW ;
r = copy_to_user ( ( u32 __user * ) ( long ) reg - > addr ,
& opcode , sizeof ( u32 ) ) ;
break ;
}
2013-04-18 00:32:26 +04:00
# ifdef CONFIG_KVM_XICS
case KVM_REG_PPC_ICP_STATE :
if ( ! vcpu - > arch . icp ) {
r = - ENXIO ;
break ;
}
val = get_reg_val ( reg - > id , kvmppc_xics_get_icp ( vcpu ) ) ;
break ;
# endif /* CONFIG_KVM_XICS */
2012-09-26 00:31:56 +04:00
default :
r = - EINVAL ;
break ;
}
}
if ( r )
return r ;
if ( copy_to_user ( ( char __user * ) ( unsigned long ) reg - > addr , & val , size ) )
r = - EFAULT ;
return r ;
}
int kvm_vcpu_ioctl_set_one_reg ( struct kvm_vcpu * vcpu , struct kvm_one_reg * reg )
{
int r ;
union kvmppc_one_reg val ;
int size ;
2012-09-26 00:32:30 +04:00
long int i ;
2012-09-26 00:31:56 +04:00
size = one_reg_size ( reg - > id ) ;
if ( size > sizeof ( val ) )
return - EINVAL ;
if ( copy_from_user ( & val , ( char __user * ) ( unsigned long ) reg - > addr , size ) )
return - EFAULT ;
2013-10-07 20:48:01 +04:00
r = vcpu - > kvm - > arch . kvm_ops - > set_one_reg ( vcpu , reg - > id , & val ) ;
2012-09-26 00:31:56 +04:00
if ( r = = - EINVAL ) {
r = 0 ;
switch ( reg - > id ) {
case KVM_REG_PPC_DAR :
vcpu - > arch . shared - > dar = set_reg_val ( reg - > id , val ) ;
break ;
case KVM_REG_PPC_DSISR :
vcpu - > arch . shared - > dsisr = set_reg_val ( reg - > id , val ) ;
break ;
2012-09-26 00:32:30 +04:00
case KVM_REG_PPC_FPR0 . . . KVM_REG_PPC_FPR31 :
i = reg - > id - KVM_REG_PPC_FPR0 ;
2013-10-15 13:43:02 +04:00
VCPU_FPR ( vcpu , i ) = set_reg_val ( reg - > id , val ) ;
2012-09-26 00:32:30 +04:00
break ;
case KVM_REG_PPC_FPSCR :
2013-10-15 13:43:02 +04:00
vcpu - > arch . fp . fpscr = set_reg_val ( reg - > id , val ) ;
2012-09-26 00:32:30 +04:00
break ;
# ifdef CONFIG_ALTIVEC
case KVM_REG_PPC_VR0 . . . KVM_REG_PPC_VR31 :
if ( ! cpu_has_feature ( CPU_FTR_ALTIVEC ) ) {
r = - ENXIO ;
break ;
}
2013-10-15 13:43:02 +04:00
vcpu - > arch . vr . vr [ reg - > id - KVM_REG_PPC_VR0 ] = val . vval ;
2012-09-26 00:32:30 +04:00
break ;
case KVM_REG_PPC_VSCR :
if ( ! cpu_has_feature ( CPU_FTR_ALTIVEC ) ) {
r = - ENXIO ;
break ;
}
2013-10-15 13:43:02 +04:00
vcpu - > arch . vr . vscr . u [ 3 ] = set_reg_val ( reg - > id , val ) ;
2012-09-26 00:32:30 +04:00
break ;
2013-09-06 07:18:32 +04:00
case KVM_REG_PPC_VRSAVE :
if ( ! cpu_has_feature ( CPU_FTR_ALTIVEC ) ) {
r = - ENXIO ;
break ;
}
vcpu - > arch . vrsave = set_reg_val ( reg - > id , val ) ;
break ;
2012-09-26 00:32:30 +04:00
# endif /* CONFIG_ALTIVEC */
2013-10-15 13:43:02 +04:00
# ifdef CONFIG_VSX
case KVM_REG_PPC_VSR0 . . . KVM_REG_PPC_VSR31 :
if ( cpu_has_feature ( CPU_FTR_VSX ) ) {
long int i = reg - > id - KVM_REG_PPC_VSR0 ;
vcpu - > arch . fp . fpr [ i ] [ 0 ] = val . vsxval [ 0 ] ;
vcpu - > arch . fp . fpr [ i ] [ 1 ] = val . vsxval [ 1 ] ;
} else {
r = - ENXIO ;
}
break ;
# endif /* CONFIG_VSX */
2013-04-18 00:32:26 +04:00
# ifdef CONFIG_KVM_XICS
case KVM_REG_PPC_ICP_STATE :
if ( ! vcpu - > arch . icp ) {
r = - ENXIO ;
break ;
}
r = kvmppc_xics_set_icp ( vcpu ,
set_reg_val ( reg - > id , val ) ) ;
break ;
# endif /* CONFIG_KVM_XICS */
2012-09-26 00:31:56 +04:00
default :
r = - EINVAL ;
break ;
}
}
return r ;
}
2013-10-07 20:47:53 +04:00
void kvmppc_core_vcpu_load ( struct kvm_vcpu * vcpu , int cpu )
{
2013-10-07 20:48:01 +04:00
vcpu - > kvm - > arch . kvm_ops - > vcpu_load ( vcpu , cpu ) ;
2013-10-07 20:47:53 +04:00
}
void kvmppc_core_vcpu_put ( struct kvm_vcpu * vcpu )
{
2013-10-07 20:48:01 +04:00
vcpu - > kvm - > arch . kvm_ops - > vcpu_put ( vcpu ) ;
2013-10-07 20:47:53 +04:00
}
void kvmppc_set_msr ( struct kvm_vcpu * vcpu , u64 msr )
{
2013-10-07 20:48:01 +04:00
vcpu - > kvm - > arch . kvm_ops - > set_msr ( vcpu , msr ) ;
2013-10-07 20:47:53 +04:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvmppc_set_msr ) ;
2013-10-07 20:47:53 +04:00
int kvmppc_vcpu_run ( struct kvm_run * kvm_run , struct kvm_vcpu * vcpu )
{
2013-10-07 20:48:01 +04:00
return vcpu - > kvm - > arch . kvm_ops - > vcpu_run ( kvm_run , vcpu ) ;
2013-10-07 20:47:53 +04:00
}
2009-10-30 08:47:10 +03:00
int kvm_arch_vcpu_ioctl_translate ( struct kvm_vcpu * vcpu ,
struct kvm_translation * tr )
{
return 0 ;
}
2013-04-08 04:32:12 +04:00
int kvm_arch_vcpu_ioctl_set_guest_debug ( struct kvm_vcpu * vcpu ,
struct kvm_guest_debug * dbg )
{
return - EINVAL ;
}
2011-11-17 16:39:59 +04:00
void kvmppc_decrementer_func ( unsigned long data )
{
struct kvm_vcpu * vcpu = ( struct kvm_vcpu * ) data ;
kvmppc_core_queue_dec ( vcpu ) ;
kvm_vcpu_kick ( vcpu ) ;
}
2013-10-07 20:47:53 +04:00
struct kvm_vcpu * kvmppc_core_vcpu_create ( struct kvm * kvm , unsigned int id )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > vcpu_create ( kvm , id ) ;
2013-10-07 20:47:53 +04:00
}
void kvmppc_core_vcpu_free ( struct kvm_vcpu * vcpu )
{
2013-10-07 20:48:01 +04:00
vcpu - > kvm - > arch . kvm_ops - > vcpu_free ( vcpu ) ;
2013-10-07 20:47:53 +04:00
}
int kvmppc_core_check_requests ( struct kvm_vcpu * vcpu )
{
2013-10-07 20:48:01 +04:00
return vcpu - > kvm - > arch . kvm_ops - > check_requests ( vcpu ) ;
2013-10-07 20:47:53 +04:00
}
int kvm_vm_ioctl_get_dirty_log ( struct kvm * kvm , struct kvm_dirty_log * log )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > get_dirty_log ( kvm , log ) ;
2013-10-07 20:47:53 +04:00
}
2013-10-07 20:48:00 +04:00
void kvmppc_core_free_memslot ( struct kvm * kvm , struct kvm_memory_slot * free ,
2013-10-07 20:47:53 +04:00
struct kvm_memory_slot * dont )
{
2013-10-07 20:48:01 +04:00
kvm - > arch . kvm_ops - > free_memslot ( free , dont ) ;
2013-10-07 20:47:53 +04:00
}
2013-10-07 20:48:00 +04:00
int kvmppc_core_create_memslot ( struct kvm * kvm , struct kvm_memory_slot * slot ,
2013-10-07 20:47:53 +04:00
unsigned long npages )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > create_memslot ( slot , npages ) ;
2013-10-07 20:47:53 +04:00
}
void kvmppc_core_flush_memslot ( struct kvm * kvm , struct kvm_memory_slot * memslot )
{
2013-10-07 20:48:01 +04:00
kvm - > arch . kvm_ops - > flush_memslot ( kvm , memslot ) ;
2013-10-07 20:47:53 +04:00
}
int kvmppc_core_prepare_memory_region ( struct kvm * kvm ,
struct kvm_memory_slot * memslot ,
struct kvm_userspace_memory_region * mem )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > prepare_memory_region ( kvm , memslot , mem ) ;
2013-10-07 20:47:53 +04:00
}
void kvmppc_core_commit_memory_region ( struct kvm * kvm ,
struct kvm_userspace_memory_region * mem ,
const struct kvm_memory_slot * old )
{
2013-10-07 20:48:01 +04:00
kvm - > arch . kvm_ops - > commit_memory_region ( kvm , mem , old ) ;
2013-10-07 20:47:53 +04:00
}
int kvm_unmap_hva ( struct kvm * kvm , unsigned long hva )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > unmap_hva ( kvm , hva ) ;
2013-10-07 20:47:53 +04:00
}
2013-10-07 20:47:59 +04:00
EXPORT_SYMBOL_GPL ( kvm_unmap_hva ) ;
2013-10-07 20:47:53 +04:00
int kvm_unmap_hva_range ( struct kvm * kvm , unsigned long start , unsigned long end )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > unmap_hva_range ( kvm , start , end ) ;
2013-10-07 20:47:53 +04:00
}
int kvm_age_hva ( struct kvm * kvm , unsigned long hva )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > age_hva ( kvm , hva ) ;
2013-10-07 20:47:53 +04:00
}
int kvm_test_age_hva ( struct kvm * kvm , unsigned long hva )
{
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > test_age_hva ( kvm , hva ) ;
2013-10-07 20:47:53 +04:00
}
void kvm_set_spte_hva ( struct kvm * kvm , unsigned long hva , pte_t pte )
{
2013-10-07 20:48:01 +04:00
kvm - > arch . kvm_ops - > set_spte_hva ( kvm , hva , pte ) ;
2013-10-07 20:47:53 +04:00
}
void kvmppc_mmu_destroy ( struct kvm_vcpu * vcpu )
{
2013-10-07 20:48:01 +04:00
vcpu - > kvm - > arch . kvm_ops - > mmu_destroy ( vcpu ) ;
2013-10-07 20:47:53 +04:00
}
int kvmppc_core_init_vm ( struct kvm * kvm )
{
# ifdef CONFIG_PPC64
INIT_LIST_HEAD ( & kvm - > arch . spapr_tce_tables ) ;
INIT_LIST_HEAD ( & kvm - > arch . rtas_tokens ) ;
# endif
2013-10-07 20:48:01 +04:00
return kvm - > arch . kvm_ops - > init_vm ( kvm ) ;
2013-10-07 20:47:53 +04:00
}
void kvmppc_core_destroy_vm ( struct kvm * kvm )
{
2013-10-07 20:48:01 +04:00
kvm - > arch . kvm_ops - > destroy_vm ( kvm ) ;
2013-10-07 20:47:53 +04:00
# ifdef CONFIG_PPC64
kvmppc_rtas_tokens_free ( kvm ) ;
WARN_ON ( ! list_empty ( & kvm - > arch . spapr_tce_tables ) ) ;
# endif
}
int kvmppc_core_check_processor_compat ( void )
{
2013-10-07 20:48:01 +04:00
/*
* We always return 0 for book3s . We check
* for compatability while loading the HV
* or PR module
*/
return 0 ;
}
static int kvmppc_book3s_init ( void )
{
int r ;
r = kvm_init ( NULL , sizeof ( struct kvm_vcpu ) , 0 , THIS_MODULE ) ;
if ( r )
return r ;
# ifdef CONFIG_KVM_BOOK3S_32
r = kvmppc_book3s_init_pr ( ) ;
# endif
return r ;
}
static void kvmppc_book3s_exit ( void )
{
# ifdef CONFIG_KVM_BOOK3S_32
kvmppc_book3s_exit_pr ( ) ;
# endif
kvm_exit ( ) ;
2013-10-07 20:47:53 +04:00
}
2013-10-07 20:48:01 +04:00
module_init ( kvmppc_book3s_init ) ;
module_exit ( kvmppc_book3s_exit ) ;
2013-12-09 16:53:42 +04:00
/* On 32bit this is our one and only kernel module */
# ifdef CONFIG_KVM_BOOK3S_32
MODULE_ALIAS_MISCDEV ( KVM_MINOR ) ;
MODULE_ALIAS ( " devname:kvm " ) ;
# endif