2020-02-18 13:07:33 -08:00
// SPDX-License-Identifier: GPL-2.0
# define _GNU_SOURCE /* for program_invocation_short_name */
# include <fcntl.h>
# include <pthread.h>
# include <sched.h>
2020-04-10 16:17:02 -07:00
# include <semaphore.h>
2020-02-18 13:07:33 -08:00
# include <signal.h>
# include <stdio.h>
# include <stdlib.h>
# include <string.h>
# include <sys/ioctl.h>
2020-04-10 16:17:07 -07:00
# include <sys/mman.h>
2020-02-18 13:07:33 -08:00
# include <linux/compiler.h>
# include <test_util.h>
# include <kvm_util.h>
# include <processor.h>
# define VCPU_ID 0
2020-04-10 16:17:07 -07:00
/*
* s390x needs at least 1 MB alignment , and the x86_64 MOVE / DELETE tests need a
* 2 MB sized and aligned region so that the initial region corresponds to
* exactly one large page .
*/
# define MEM_REGION_SIZE 0x200000
2020-04-10 16:17:06 -07:00
# ifdef __x86_64__
2020-02-18 13:07:33 -08:00
/*
2020-04-10 16:17:07 -07:00
* Somewhat arbitrary location and slot , intended to not overlap anything .
2020-02-18 13:07:33 -08:00
*/
# define MEM_REGION_GPA 0xc0000000
# define MEM_REGION_SLOT 10
2020-04-10 16:17:02 -07:00
static const uint64_t MMIO_VAL = 0xbeefull ;
2020-04-10 16:17:03 -07:00
extern const uint64_t final_rip_start ;
extern const uint64_t final_rip_end ;
2020-04-10 16:17:02 -07:00
static sem_t vcpu_ready ;
static inline uint64_t guest_spin_on_val ( uint64_t spin_val )
2020-02-18 13:07:33 -08:00
{
uint64_t val ;
do {
val = READ_ONCE ( * ( ( uint64_t * ) MEM_REGION_GPA ) ) ;
2020-04-10 16:17:02 -07:00
} while ( val = = spin_val ) ;
2020-02-18 13:07:33 -08:00
2020-04-10 16:17:02 -07:00
GUEST_SYNC ( 0 ) ;
return val ;
2020-02-18 13:07:33 -08:00
}
static void * vcpu_worker ( void * data )
{
struct kvm_vm * vm = data ;
struct kvm_run * run ;
struct ucall uc ;
uint64_t cmd ;
/*
* Loop until the guest is done . Re - enter the guest on all MMIO exits ,
2020-04-10 16:17:02 -07:00
* which will occur if the guest attempts to access a memslot after it
* has been deleted or while it is being moved .
2020-02-18 13:07:33 -08:00
*/
run = vcpu_state ( vm , VCPU_ID ) ;
2020-04-10 16:17:02 -07:00
while ( 1 ) {
2020-02-18 13:07:33 -08:00
vcpu_run ( vm , VCPU_ID ) ;
2020-04-10 16:17:02 -07:00
if ( run - > exit_reason = = KVM_EXIT_IO ) {
cmd = get_ucall ( vm , VCPU_ID , & uc ) ;
if ( cmd ! = UCALL_SYNC )
break ;
sem_post ( & vcpu_ready ) ;
continue ;
}
if ( run - > exit_reason ! = KVM_EXIT_MMIO )
break ;
TEST_ASSERT ( ! run - > mmio . is_write , " Unexpected exit mmio write " ) ;
TEST_ASSERT ( run - > mmio . len = = 8 ,
" Unexpected exit mmio size = %u " , run - > mmio . len ) ;
TEST_ASSERT ( run - > mmio . phys_addr = = MEM_REGION_GPA ,
" Unexpected exit mmio address = 0x%llx " ,
run - > mmio . phys_addr ) ;
memcpy ( run - > mmio . data , & MMIO_VAL , 8 ) ;
}
if ( run - > exit_reason = = KVM_EXIT_IO & & cmd = = UCALL_ABORT )
TEST_FAIL ( " %s at %s:%ld, val = %lu " , ( const char * ) uc . args [ 0 ] ,
__FILE__ , uc . args [ 1 ] , uc . args [ 2 ] ) ;
2020-02-18 13:07:33 -08:00
return NULL ;
}
2020-04-10 16:17:02 -07:00
static void wait_for_vcpu ( void )
{
struct timespec ts ;
TEST_ASSERT ( ! clock_gettime ( CLOCK_REALTIME , & ts ) ,
" clock_gettime() failed: %d \n " , errno ) ;
ts . tv_sec + = 2 ;
TEST_ASSERT ( ! sem_timedwait ( & vcpu_ready , & ts ) ,
" sem_timedwait() failed: %d \n " , errno ) ;
/* Wait for the vCPU thread to reenter the guest. */
usleep ( 100000 ) ;
}
static struct kvm_vm * spawn_vm ( pthread_t * vcpu_thread , void * guest_code )
2020-02-18 13:07:33 -08:00
{
struct kvm_vm * vm ;
uint64_t * hva ;
uint64_t gpa ;
vm = vm_create_default ( VCPU_ID , 0 , guest_code ) ;
vm_userspace_mem_region_add ( vm , VM_MEM_SRC_ANONYMOUS_THP ,
MEM_REGION_GPA , MEM_REGION_SLOT ,
MEM_REGION_SIZE / getpagesize ( ) , 0 ) ;
/*
* Allocate and map two pages so that the GPA accessed by guest_code ( )
* stays valid across the memslot move .
*/
gpa = vm_phy_pages_alloc ( vm , 2 , MEM_REGION_GPA , MEM_REGION_SLOT ) ;
TEST_ASSERT ( gpa = = MEM_REGION_GPA , " Failed vm_phy_pages_alloc \n " ) ;
2021-06-22 13:05:22 -07:00
virt_map ( vm , MEM_REGION_GPA , MEM_REGION_GPA , 2 ) ;
2020-02-18 13:07:33 -08:00
/* Ditto for the host mapping so that both pages can be zeroed. */
hva = addr_gpa2hva ( vm , MEM_REGION_GPA ) ;
memset ( hva , 0 , 2 * 4096 ) ;
2020-04-10 16:17:02 -07:00
pthread_create ( vcpu_thread , NULL , vcpu_worker , vm ) ;
2020-02-18 13:07:33 -08:00
/* Ensure the guest thread is spun up. */
2020-04-10 16:17:02 -07:00
wait_for_vcpu ( ) ;
return vm ;
}
static void guest_code_move_memory_region ( void )
{
uint64_t val ;
GUEST_SYNC ( 0 ) ;
/*
2020-12-02 21:35:36 +01:00
* Spin until the memory region starts getting moved to a
* misaligned address .
* Every region move may or may not trigger MMIO , as the
* window where the memslot is invalid is usually quite small .
2020-04-10 16:17:02 -07:00
*/
val = guest_spin_on_val ( 0 ) ;
GUEST_ASSERT_1 ( val = = 1 | | val = = MMIO_VAL , val ) ;
2020-12-02 21:35:36 +01:00
/* Spin until the misaligning memory region move completes. */
val = guest_spin_on_val ( MMIO_VAL ) ;
GUEST_ASSERT_1 ( val = = 1 | | val = = 0 , val ) ;
/* Spin until the memory region starts to get re-aligned. */
val = guest_spin_on_val ( 0 ) ;
GUEST_ASSERT_1 ( val = = 1 | | val = = MMIO_VAL , val ) ;
/* Spin until the re-aligning memory region move completes. */
2020-04-10 16:17:02 -07:00
val = guest_spin_on_val ( MMIO_VAL ) ;
GUEST_ASSERT_1 ( val = = 1 , val ) ;
GUEST_DONE ( ) ;
}
static void test_move_memory_region ( void )
{
pthread_t vcpu_thread ;
struct kvm_vm * vm ;
uint64_t * hva ;
vm = spawn_vm ( & vcpu_thread , guest_code_move_memory_region ) ;
hva = addr_gpa2hva ( vm , MEM_REGION_GPA ) ;
2020-02-18 13:07:33 -08:00
/*
* Shift the region ' s base GPA . The guest should not see " 2 " as the
* hva - > gpa translation is misaligned , i . e . the guest is accessing a
* different host pfn .
*/
vm_mem_region_move ( vm , MEM_REGION_SLOT , MEM_REGION_GPA - 4096 ) ;
WRITE_ONCE ( * hva , 2 ) ;
2020-04-10 16:17:02 -07:00
/*
* The guest _might_ see an invalid memslot and trigger MMIO , but it ' s
* a tiny window . Spin and defer the sync until the memslot is
* restored and guest behavior is once again deterministic .
*/
2020-02-18 13:07:33 -08:00
usleep ( 100000 ) ;
/*
* Note , value in memory needs to be changed * before * restoring the
* memslot , else the guest could race the update and see " 2 " .
*/
WRITE_ONCE ( * hva , 1 ) ;
/* Restore the original base, the guest should see "1". */
vm_mem_region_move ( vm , MEM_REGION_SLOT , MEM_REGION_GPA ) ;
2020-04-10 16:17:02 -07:00
wait_for_vcpu ( ) ;
/* Defered sync from when the memslot was misaligned (above). */
wait_for_vcpu ( ) ;
2020-02-18 13:07:33 -08:00
pthread_join ( vcpu_thread , NULL ) ;
kvm_vm_free ( vm ) ;
}
2020-04-10 16:17:03 -07:00
static void guest_code_delete_memory_region ( void )
{
uint64_t val ;
GUEST_SYNC ( 0 ) ;
/* Spin until the memory region is deleted. */
val = guest_spin_on_val ( 0 ) ;
GUEST_ASSERT_1 ( val = = MMIO_VAL , val ) ;
/* Spin until the memory region is recreated. */
val = guest_spin_on_val ( MMIO_VAL ) ;
GUEST_ASSERT_1 ( val = = 0 , val ) ;
/* Spin until the memory region is deleted. */
val = guest_spin_on_val ( 0 ) ;
GUEST_ASSERT_1 ( val = = MMIO_VAL , val ) ;
asm ( " 1: \n \t "
" .pushsection .rodata \n \t "
" .global final_rip_start \n \t "
" final_rip_start: .quad 1b \n \t "
" .popsection " ) ;
/* Spin indefinitely (until the code memslot is deleted). */
guest_spin_on_val ( MMIO_VAL ) ;
asm ( " 1: \n \t "
" .pushsection .rodata \n \t "
" .global final_rip_end \n \t "
" final_rip_end: .quad 1b \n \t "
" .popsection " ) ;
GUEST_ASSERT_1 ( 0 , 0 ) ;
}
static void test_delete_memory_region ( void )
{
pthread_t vcpu_thread ;
struct kvm_regs regs ;
struct kvm_run * run ;
struct kvm_vm * vm ;
vm = spawn_vm ( & vcpu_thread , guest_code_delete_memory_region ) ;
/* Delete the memory region, the guest should not die. */
vm_mem_region_delete ( vm , MEM_REGION_SLOT ) ;
wait_for_vcpu ( ) ;
/* Recreate the memory region. The guest should see "0". */
vm_userspace_mem_region_add ( vm , VM_MEM_SRC_ANONYMOUS_THP ,
MEM_REGION_GPA , MEM_REGION_SLOT ,
MEM_REGION_SIZE / getpagesize ( ) , 0 ) ;
wait_for_vcpu ( ) ;
/* Delete the region again so that there's only one memslot left. */
vm_mem_region_delete ( vm , MEM_REGION_SLOT ) ;
wait_for_vcpu ( ) ;
/*
* Delete the primary memslot . This should cause an emulation error or
* shutdown due to the page tables getting nuked .
*/
vm_mem_region_delete ( vm , 0 ) ;
pthread_join ( vcpu_thread , NULL ) ;
run = vcpu_state ( vm , VCPU_ID ) ;
TEST_ASSERT ( run - > exit_reason = = KVM_EXIT_SHUTDOWN | |
run - > exit_reason = = KVM_EXIT_INTERNAL_ERROR ,
" Unexpected exit reason = %d " , run - > exit_reason ) ;
vcpu_regs_get ( vm , VCPU_ID , & regs ) ;
2020-04-17 12:35:38 -04:00
/*
* On AMD , after KVM_EXIT_SHUTDOWN the VMCB has been reinitialized already ,
* so the instruction pointer would point to the reset vector .
*/
if ( run - > exit_reason = = KVM_EXIT_INTERNAL_ERROR )
TEST_ASSERT ( regs . rip > = final_rip_start & &
regs . rip < final_rip_end ,
" Bad rip, expected 0x%lx - 0x%lx, got 0x%llx \n " ,
final_rip_start , final_rip_end , regs . rip ) ;
2020-04-10 16:17:03 -07:00
kvm_vm_free ( vm ) ;
}
2020-04-10 16:17:05 -07:00
static void test_zero_memory_regions ( void )
{
struct kvm_run * run ;
struct kvm_vm * vm ;
pr_info ( " Testing KVM_RUN with zero added memory regions \n " ) ;
2022-04-18 16:26:06 -07:00
vm = vm_create_barebones ( ) ;
2020-04-10 16:17:05 -07:00
vm_vcpu_add ( vm , VCPU_ID ) ;
2022-02-15 12:09:56 -08:00
vm_ioctl ( vm , KVM_SET_NR_MMU_PAGES , ( void * ) 64ul ) ;
2020-04-10 16:17:05 -07:00
vcpu_run ( vm , VCPU_ID ) ;
run = vcpu_state ( vm , VCPU_ID ) ;
TEST_ASSERT ( run - > exit_reason = = KVM_EXIT_INTERNAL_ERROR ,
" Unexpected exit_reason = %u \n " , run - > exit_reason ) ;
kvm_vm_free ( vm ) ;
}
2020-04-10 16:17:06 -07:00
# endif /* __x86_64__ */
2020-04-10 16:17:05 -07:00
2020-04-10 16:17:07 -07:00
/*
* Test it can be added memory slots up to KVM_CAP_NR_MEMSLOTS , then any
* tentative to add further slots should fail .
*/
static void test_add_max_memory_regions ( void )
{
int ret ;
struct kvm_vm * vm ;
uint32_t max_mem_slots ;
uint32_t slot ;
2021-04-26 15:01:21 +02:00
void * mem , * mem_aligned , * mem_extra ;
size_t alignment ;
# ifdef __s390x__
/* On s390x, the host address must be aligned to 1M (due to PGSTEs) */
alignment = 0x100000 ;
# else
alignment = 1 ;
# endif
2020-04-10 16:17:07 -07:00
max_mem_slots = kvm_check_cap ( KVM_CAP_NR_MEMSLOTS ) ;
TEST_ASSERT ( max_mem_slots > 0 ,
" KVM_CAP_NR_MEMSLOTS should be greater than 0 " ) ;
pr_info ( " Allowed number of memory slots: %i \n " , max_mem_slots ) ;
2022-04-18 16:26:06 -07:00
vm = vm_create_barebones ( ) ;
2020-04-10 16:17:07 -07:00
/* Check it can be added memory slots up to the maximum allowed */
pr_info ( " Adding slots 0..%i, each memory region with %dK size \n " ,
( max_mem_slots - 1 ) , MEM_REGION_SIZE > > 10 ) ;
2021-04-26 15:01:21 +02:00
2021-06-24 15:09:31 +08:00
mem = mmap ( NULL , ( size_t ) max_mem_slots * MEM_REGION_SIZE + alignment ,
2021-07-01 17:42:24 +02:00
PROT_READ | PROT_WRITE ,
MAP_PRIVATE | MAP_ANONYMOUS | MAP_NORESERVE , - 1 , 0 ) ;
2021-04-26 15:01:21 +02:00
TEST_ASSERT ( mem ! = MAP_FAILED , " Failed to mmap() host " ) ;
mem_aligned = ( void * ) ( ( ( size_t ) mem + alignment - 1 ) & ~ ( alignment - 1 ) ) ;
2022-02-26 00:15:43 +00:00
for ( slot = 0 ; slot < max_mem_slots ; slot + + )
vm_set_user_memory_region ( vm , slot , 0 ,
( ( uint64_t ) slot * MEM_REGION_SIZE ) ,
MEM_REGION_SIZE ,
mem_aligned + ( uint64_t ) slot * MEM_REGION_SIZE ) ;
2020-04-10 16:17:07 -07:00
/* Check it cannot be added memory slots beyond the limit */
2021-04-26 15:01:21 +02:00
mem_extra = mmap ( NULL , MEM_REGION_SIZE , PROT_READ | PROT_WRITE ,
MAP_PRIVATE | MAP_ANONYMOUS , - 1 , 0 ) ;
TEST_ASSERT ( mem_extra ! = MAP_FAILED , " Failed to mmap() host " ) ;
2020-04-10 16:17:07 -07:00
2022-02-26 00:15:43 +00:00
ret = __vm_set_user_memory_region ( vm , max_mem_slots , 0 ,
( uint64_t ) max_mem_slots * MEM_REGION_SIZE ,
MEM_REGION_SIZE , mem_extra ) ;
2020-04-10 16:17:07 -07:00
TEST_ASSERT ( ret = = - 1 & & errno = = EINVAL ,
" Adding one more memory slot should fail with EINVAL " ) ;
2021-06-24 15:09:31 +08:00
munmap ( mem , ( size_t ) max_mem_slots * MEM_REGION_SIZE + alignment ) ;
2021-04-26 15:01:21 +02:00
munmap ( mem_extra , MEM_REGION_SIZE ) ;
2020-04-10 16:17:07 -07:00
kvm_vm_free ( vm ) ;
}
2020-02-18 13:07:33 -08:00
int main ( int argc , char * argv [ ] )
{
2020-04-10 16:17:06 -07:00
# ifdef __x86_64__
2020-02-18 13:07:33 -08:00
int i , loops ;
2020-04-10 16:17:06 -07:00
# endif
2020-02-18 13:07:33 -08:00
/* Tell stdout not to buffer its content */
setbuf ( stdout , NULL ) ;
2020-04-10 16:17:06 -07:00
# ifdef __x86_64__
/*
* FIXME : the zero - memslot test fails on aarch64 and s390x because
* KVM_RUN fails with ENOEXEC or EFAULT .
*/
2020-04-10 16:17:05 -07:00
test_zero_memory_regions ( ) ;
2020-04-10 16:17:07 -07:00
# endif
test_add_max_memory_regions ( ) ;
2020-04-10 16:17:05 -07:00
2020-04-10 16:17:07 -07:00
# ifdef __x86_64__
2020-02-18 13:07:33 -08:00
if ( argc > 1 )
loops = atoi ( argv [ 1 ] ) ;
else
loops = 10 ;
2020-04-10 16:17:03 -07:00
pr_info ( " Testing MOVE of in-use region, %d loops \n " , loops ) ;
2020-02-18 13:07:33 -08:00
for ( i = 0 ; i < loops ; i + + )
test_move_memory_region ( ) ;
2020-04-10 16:17:03 -07:00
pr_info ( " Testing DELETE of in-use region, %d loops \n " , loops ) ;
for ( i = 0 ; i < loops ; i + + )
test_delete_memory_region ( ) ;
2020-04-10 16:17:06 -07:00
# endif
2020-04-10 16:17:03 -07:00
2020-02-18 13:07:33 -08:00
return 0 ;
}