2008-07-29 10:29:19 -07:00
/*
* xsave / xrstor support .
*
* Author : Suresh Siddha < suresh . b . siddha @ intel . com >
*/
# include <linux/bootmem.h>
# include <linux/compat.h>
# include <asm/i387.h>
2008-07-29 10:29:25 -07:00
# ifdef CONFIG_IA32_EMULATION
# include <asm/sigcontext32.h>
# endif
2008-07-29 17:23:16 -07:00
# include <asm/xcr.h>
2008-07-29 10:29:19 -07:00
/*
* Supported feature mask by the CPU and the kernel .
*/
2008-07-29 17:23:16 -07:00
u64 pcntxt_mask ;
2008-07-29 10:29:19 -07:00
2010-07-21 19:03:55 +02:00
/*
* Represents init state for the supported extended state .
*/
static struct xsave_struct * init_xstate_buf ;
2008-07-29 10:29:25 -07:00
struct _fpx_sw_bytes fx_sw_reserved ;
# ifdef CONFIG_IA32_EMULATION
struct _fpx_sw_bytes fx_sw_reserved_ia32 ;
# endif
2010-07-19 16:05:48 -07:00
static unsigned int * xstate_offsets , * xstate_sizes , xstate_features ;
2010-07-19 16:05:49 -07:00
/*
* If a processor implementation discern that a processor state component is
* in its initialized state it may modify the corresponding bit in the
* xsave_hdr . xstate_bv as ' 0 ' , with out modifying the corresponding memory
* layout in the case of xsaveopt . While presenting the xstate information to
* the user , we always ensure that the memory layout of a feature will be in
* the init state if the corresponding header bit is zero . This is to ensure
* that the user doesn ' t see some stale state in the memory layout during
* signal handling , debugging etc .
*/
void __sanitize_i387_state ( struct task_struct * tsk )
{
u64 xstate_bv ;
int feature_bit = 0x2 ;
struct i387_fxsave_struct * fx = & tsk - > thread . fpu . state - > fxsave ;
if ( ! fx )
return ;
BUG_ON ( task_thread_info ( tsk ) - > status & TS_USEDFPU ) ;
xstate_bv = tsk - > thread . fpu . state - > xsave . xsave_hdr . xstate_bv ;
/*
* None of the feature bits are in init state . So nothing else
* to do for us , as the memory layout is upto date .
*/
if ( ( xstate_bv & pcntxt_mask ) = = pcntxt_mask )
return ;
/*
* FP is in init state
*/
if ( ! ( xstate_bv & XSTATE_FP ) ) {
fx - > cwd = 0x37f ;
fx - > swd = 0 ;
fx - > twd = 0 ;
fx - > fop = 0 ;
fx - > rip = 0 ;
fx - > rdp = 0 ;
memset ( & fx - > st_space [ 0 ] , 0 , 128 ) ;
}
/*
* SSE is in init state
*/
if ( ! ( xstate_bv & XSTATE_SSE ) )
memset ( & fx - > xmm_space [ 0 ] , 0 , 256 ) ;
xstate_bv = ( pcntxt_mask & ~ xstate_bv ) > > 2 ;
/*
* Update all the other memory layouts for which the corresponding
* header bit is in the init state .
*/
while ( xstate_bv ) {
if ( xstate_bv & 0x1 ) {
int offset = xstate_offsets [ feature_bit ] ;
int size = xstate_sizes [ feature_bit ] ;
memcpy ( ( ( void * ) fx ) + offset ,
( ( void * ) init_xstate_buf ) + offset ,
size ) ;
}
xstate_bv > > = 1 ;
feature_bit + + ;
}
}
2008-07-29 10:29:25 -07:00
/*
* Check for the presence of extended state information in the
* user fpstate pointer in the sigcontext .
*/
int check_for_xstate ( struct i387_fxsave_struct __user * buf ,
void __user * fpstate ,
struct _fpx_sw_bytes * fx_sw_user )
{
int min_xstate_size = sizeof ( struct i387_fxsave_struct ) +
sizeof ( struct xsave_hdr_struct ) ;
unsigned int magic2 ;
int err ;
err = __copy_from_user ( fx_sw_user , & buf - > sw_reserved [ 0 ] ,
sizeof ( struct _fpx_sw_bytes ) ) ;
if ( err )
2010-06-03 12:07:46 +02:00
return - EFAULT ;
2008-07-29 10:29:25 -07:00
/*
* First Magic check failed .
*/
if ( fx_sw_user - > magic1 ! = FP_XSTATE_MAGIC1 )
2010-06-03 12:07:46 +02:00
return - EINVAL ;
2008-07-29 10:29:25 -07:00
/*
* Check for error scenarios .
*/
if ( fx_sw_user - > xstate_size < min_xstate_size | |
fx_sw_user - > xstate_size > xstate_size | |
fx_sw_user - > xstate_size > fx_sw_user - > extended_size )
2010-06-03 12:07:46 +02:00
return - EINVAL ;
2008-07-29 10:29:25 -07:00
err = __get_user ( magic2 , ( __u32 * ) ( ( ( void * ) fpstate ) +
fx_sw_user - > extended_size -
FP_XSTATE_MAGIC2_SIZE ) ) ;
2010-06-03 12:07:46 +02:00
if ( err )
return err ;
2008-07-29 10:29:25 -07:00
/*
* Check for the presence of second magic word at the end of memory
* layout . This detects the case where the user just copied the legacy
* fpstate layout with out copying the extended state information
* in the memory layout .
*/
2010-06-03 12:07:46 +02:00
if ( magic2 ! = FP_XSTATE_MAGIC2 )
return - EFAULT ;
2008-07-29 10:29:25 -07:00
return 0 ;
}
2008-07-29 10:29:22 -07:00
# ifdef CONFIG_X86_64
/*
* Signal frame handlers .
*/
int save_i387_xstate ( void __user * buf )
{
struct task_struct * tsk = current ;
int err = 0 ;
if ( ! access_ok ( VERIFY_WRITE , buf , sig_xstate_size ) )
return - EACCES ;
2008-08-13 11:38:15 -07:00
BUG_ON ( sig_xstate_size < xstate_size ) ;
2008-07-29 10:29:22 -07:00
2008-07-29 10:29:25 -07:00
if ( ( unsigned long ) buf % 64 )
2008-07-29 10:29:22 -07:00
printk ( " save_i387_xstate: bad fpstate %p \n " , buf ) ;
if ( ! used_math ( ) )
return 0 ;
2009-04-09 15:24:34 -07:00
2008-07-29 10:29:22 -07:00
if ( task_thread_info ( tsk ) - > status & TS_USEDFPU ) {
2010-05-06 11:45:45 +03:00
if ( use_xsave ( ) )
2008-07-29 10:29:25 -07:00
err = xsave_user ( buf ) ;
else
err = fxsave_user ( buf ) ;
2008-07-29 10:29:22 -07:00
if ( err )
return err ;
task_thread_info ( tsk ) - > status & = ~ TS_USEDFPU ;
stts ( ) ;
} else {
2010-07-19 16:05:49 -07:00
sanitize_i387_state ( tsk ) ;
2010-05-06 11:45:46 +03:00
if ( __copy_to_user ( buf , & tsk - > thread . fpu . state - > fxsave ,
2008-07-29 10:29:22 -07:00
xstate_size ) )
return - 1 ;
}
2008-07-29 10:29:25 -07:00
2009-04-09 15:24:34 -07:00
clear_used_math ( ) ; /* trigger finit */
2010-05-06 11:45:45 +03:00
if ( use_xsave ( ) ) {
2008-07-29 10:29:25 -07:00
struct _fpstate __user * fx = buf ;
2008-10-07 14:04:28 -07:00
struct _xstate __user * x = buf ;
u64 xstate_bv ;
2008-07-29 10:29:25 -07:00
err = __copy_to_user ( & fx - > sw_reserved , & fx_sw_reserved ,
sizeof ( struct _fpx_sw_bytes ) ) ;
err | = __put_user ( FP_XSTATE_MAGIC2 ,
( __u32 __user * ) ( buf + sig_xstate_size
- FP_XSTATE_MAGIC2_SIZE ) ) ;
2008-10-07 14:04:28 -07:00
/*
* Read the xstate_bv which we copied ( directly from the cpu or
* from the state in task struct ) to the user buffers and
* set the FP / SSE bits .
*/
err | = __get_user ( xstate_bv , & x - > xstate_hdr . xstate_bv ) ;
/*
* For legacy compatible , we always set FP / SSE bits in the bit
* vector while saving the state to the user context . This will
* enable us capturing any changes ( during sigreturn ) to
* the FP / SSE bits by the legacy applications which don ' t touch
* xstate_bv in the xsave header .
*
* xsave aware apps can change the xstate_bv in the xsave
* header as well as change any contents in the memory layout .
* xrestore as part of sigreturn will capture all the changes .
*/
xstate_bv | = XSTATE_FPSSE ;
err | = __put_user ( xstate_bv , & x - > xstate_hdr . xstate_bv ) ;
2008-10-07 14:04:27 -07:00
if ( err )
return err ;
2008-07-29 10:29:25 -07:00
}
2008-07-29 10:29:22 -07:00
return 1 ;
}
2008-07-29 10:29:25 -07:00
/*
* Restore the extended state if present . Otherwise , restore the FP / SSE
* state .
*/
2008-12-30 22:05:55 +05:30
static int restore_user_xstate ( void __user * buf )
2008-07-29 10:29:25 -07:00
{
struct _fpx_sw_bytes fx_sw_user ;
2008-07-29 17:23:16 -07:00
u64 mask ;
2008-07-29 10:29:25 -07:00
int err ;
if ( ( ( unsigned long ) buf % 64 ) | |
check_for_xstate ( buf , buf , & fx_sw_user ) )
goto fx_only ;
2008-07-29 17:23:16 -07:00
mask = fx_sw_user . xstate_bv ;
2008-07-29 10:29:25 -07:00
/*
* restore the state passed by the user .
*/
2008-07-29 17:23:16 -07:00
err = xrestore_user ( buf , mask ) ;
2008-07-29 10:29:25 -07:00
if ( err )
return err ;
/*
* init the state skipped by the user .
*/
2008-07-29 17:23:16 -07:00
mask = pcntxt_mask & ~ mask ;
2010-06-22 16:23:37 -07:00
if ( unlikely ( mask ) )
xrstor_state ( init_xstate_buf , mask ) ;
2008-07-29 10:29:25 -07:00
return 0 ;
fx_only :
/*
* couldn ' t find the extended state information in the
* memory layout . Restore just the FP / SSE and init all
* the other extended state .
*/
2008-07-29 17:23:16 -07:00
xrstor_state ( init_xstate_buf , pcntxt_mask & ~ XSTATE_FPSSE ) ;
2008-07-29 10:29:25 -07:00
return fxrstor_checking ( ( __force struct i387_fxsave_struct * ) buf ) ;
}
2008-07-29 10:29:22 -07:00
/*
* This restores directly out of user space . Exceptions are handled .
*/
int restore_i387_xstate ( void __user * buf )
{
struct task_struct * tsk = current ;
2008-07-29 10:29:25 -07:00
int err = 0 ;
2008-07-29 10:29:22 -07:00
if ( ! buf ) {
2008-07-29 10:29:25 -07:00
if ( used_math ( ) )
goto clear ;
2008-07-29 10:29:22 -07:00
return 0 ;
} else
if ( ! access_ok ( VERIFY_READ , buf , sig_xstate_size ) )
return - EACCES ;
if ( ! used_math ( ) ) {
err = init_fpu ( tsk ) ;
if ( err )
return err ;
}
if ( ! ( task_thread_info ( current ) - > status & TS_USEDFPU ) ) {
clts ( ) ;
task_thread_info ( current ) - > status | = TS_USEDFPU ;
}
2010-05-06 11:45:45 +03:00
if ( use_xsave ( ) )
2008-07-29 10:29:25 -07:00
err = restore_user_xstate ( buf ) ;
else
err = fxrstor_checking ( ( __force struct i387_fxsave_struct * )
buf ) ;
2008-07-29 10:29:22 -07:00
if ( unlikely ( err ) ) {
/*
* Encountered an error while doing the restore from the
* user buffer , clear the fpu state .
*/
2008-07-29 10:29:25 -07:00
clear :
2008-07-29 10:29:22 -07:00
clear_fpu ( tsk ) ;
clear_used_math ( ) ;
}
return err ;
}
# endif
2008-07-29 10:29:25 -07:00
/*
* Prepare the SW reserved portion of the fxsave memory layout , indicating
* the presence of the extended state information in the memory layout
* pointed by the fpstate pointer in the sigcontext .
* This will be saved when ever the FP and extended state context is
* saved on the user stack during the signal handler delivery to the user .
*/
2008-10-21 19:49:09 -04:00
static void prepare_fx_sw_frame ( void )
2008-07-29 10:29:25 -07:00
{
int size_extended = ( xstate_size - sizeof ( struct i387_fxsave_struct ) ) +
FP_XSTATE_MAGIC2_SIZE ;
sig_xstate_size = sizeof ( struct _fpstate ) + size_extended ;
# ifdef CONFIG_IA32_EMULATION
sig_xstate_ia32_size = sizeof ( struct _fpstate_ia32 ) + size_extended ;
# endif
memset ( & fx_sw_reserved , 0 , sizeof ( fx_sw_reserved ) ) ;
fx_sw_reserved . magic1 = FP_XSTATE_MAGIC1 ;
fx_sw_reserved . extended_size = sig_xstate_size ;
2008-07-29 17:23:16 -07:00
fx_sw_reserved . xstate_bv = pcntxt_mask ;
2008-07-29 10:29:25 -07:00
fx_sw_reserved . xstate_size = xstate_size ;
# ifdef CONFIG_IA32_EMULATION
memcpy ( & fx_sw_reserved_ia32 , & fx_sw_reserved ,
sizeof ( struct _fpx_sw_bytes ) ) ;
fx_sw_reserved_ia32 . extended_size = sig_xstate_ia32_size ;
# endif
}
2008-07-29 10:29:21 -07:00
# ifdef CONFIG_X86_64
unsigned int sig_xstate_size = sizeof ( struct _fpstate ) ;
# endif
2008-07-29 10:29:19 -07:00
/*
* Enable the extended processor state save / restore feature
*/
2010-07-21 14:23:10 -07:00
static inline void xstate_enable ( void )
2008-07-29 10:29:19 -07:00
{
set_in_cr4 ( X86_CR4_OSXSAVE ) ;
2008-07-29 17:23:16 -07:00
xsetbv ( XCR_XFEATURE_ENABLED_MASK , pcntxt_mask ) ;
2008-07-29 10:29:19 -07:00
}
2010-07-19 16:05:48 -07:00
/*
* Record the offsets and sizes of different state managed by the xsave
* memory layout .
*/
2010-07-21 19:03:56 +02:00
static void __init setup_xstate_features ( void )
2010-07-19 16:05:48 -07:00
{
int eax , ebx , ecx , edx , leaf = 0x2 ;
xstate_features = fls64 ( pcntxt_mask ) ;
xstate_offsets = alloc_bootmem ( xstate_features * sizeof ( int ) ) ;
xstate_sizes = alloc_bootmem ( xstate_features * sizeof ( int ) ) ;
do {
2010-07-21 19:03:54 +02:00
cpuid_count ( XSTATE_CPUID , leaf , & eax , & ebx , & ecx , & edx ) ;
2010-07-19 16:05:48 -07:00
if ( eax = = 0 )
break ;
xstate_offsets [ leaf ] = ebx ;
xstate_sizes [ leaf ] = eax ;
leaf + + ;
} while ( 1 ) ;
}
2008-07-29 10:29:19 -07:00
/*
* setup the xstate image representing the init state
*/
2008-08-30 06:03:34 +04:00
static void __init setup_xstate_init ( void )
2008-07-29 10:29:19 -07:00
{
2010-07-19 16:05:49 -07:00
setup_xstate_features ( ) ;
/*
* Setup init_xstate_buf to represent the init state of
* all the features managed by the xsave
*/
2010-11-16 13:23:51 -08:00
init_xstate_buf = alloc_bootmem_align ( xstate_size ,
__alignof__ ( struct xsave_struct ) ) ;
2008-07-29 10:29:19 -07:00
init_xstate_buf - > i387 . mxcsr = MXCSR_DEFAULT ;
2010-07-19 16:05:48 -07:00
2010-07-19 16:05:49 -07:00
clts ( ) ;
/*
* Init all the features state with header_bv being 0x0
*/
xrstor_state ( init_xstate_buf , - 1 ) ;
/*
* Dump the init state again . This is to identify the init state
* of any feature which is not represented by all zero ' s .
*/
xsave_state ( init_xstate_buf , - 1 ) ;
stts ( ) ;
2008-07-29 10:29:19 -07:00
}
/*
* Enable and initialize the xsave feature .
*/
2010-07-21 14:23:10 -07:00
static void __init xstate_enable_boot_cpu ( void )
2008-07-29 10:29:19 -07:00
{
unsigned int eax , ebx , ecx , edx ;
2010-07-21 19:03:54 +02:00
if ( boot_cpu_data . cpuid_level < XSTATE_CPUID ) {
WARN ( 1 , KERN_ERR " XSTATE_CPUID missing \n " ) ;
return ;
}
cpuid_count ( XSTATE_CPUID , 0 , & eax , & ebx , & ecx , & edx ) ;
2008-07-29 17:23:16 -07:00
pcntxt_mask = eax + ( ( u64 ) edx < < 32 ) ;
2008-07-29 10:29:19 -07:00
2008-07-29 17:23:16 -07:00
if ( ( pcntxt_mask & XSTATE_FPSSE ) ! = XSTATE_FPSSE ) {
printk ( KERN_ERR " FP/SSE not shown under xsave features 0x%llx \n " ,
pcntxt_mask ) ;
2008-07-29 10:29:19 -07:00
BUG ( ) ;
}
/*
2009-04-10 15:21:24 -07:00
* Support only the state known to OS .
2008-07-29 10:29:19 -07:00
*/
2008-07-29 17:23:16 -07:00
pcntxt_mask = pcntxt_mask & XCNTXT_MASK ;
2010-07-21 19:03:53 +02:00
2010-07-21 14:23:10 -07:00
xstate_enable ( ) ;
2008-07-29 10:29:19 -07:00
/*
* Recompute the context size for enabled features
*/
2010-07-21 19:03:54 +02:00
cpuid_count ( XSTATE_CPUID , 0 , & eax , & ebx , & ecx , & edx ) ;
2008-07-29 10:29:19 -07:00
xstate_size = ebx ;
2010-02-11 11:50:59 -08:00
update_regset_xstate_info ( xstate_size , pcntxt_mask ) ;
2008-07-29 10:29:25 -07:00
prepare_fx_sw_frame ( ) ;
2008-07-29 10:29:19 -07:00
setup_xstate_init ( ) ;
2008-07-29 17:23:16 -07:00
printk ( KERN_INFO " xsave/xrstor: enabled xstate_bv 0x%llx, "
2008-07-29 10:29:19 -07:00
" cntxt size 0x%x \n " ,
2008-07-29 17:23:16 -07:00
pcntxt_mask , xstate_size ) ;
2008-07-29 10:29:19 -07:00
}
2010-07-20 20:50:51 +02:00
2010-07-21 14:23:10 -07:00
/*
* For the very first instance , this calls xstate_enable_boot_cpu ( ) ;
* for all subsequent instances , this calls xstate_enable ( ) .
*
* This is somewhat obfuscated due to the lack of powerful enough
* overrides for the section checks .
*/
2010-07-20 20:50:51 +02:00
void __cpuinit xsave_init ( void )
{
2010-07-21 14:23:10 -07:00
static __refdata void ( * next_func ) ( void ) = xstate_enable_boot_cpu ;
void ( * this_func ) ( void ) ;
2010-07-21 19:03:52 +02:00
if ( ! cpu_has_xsave )
return ;
2010-07-21 14:23:10 -07:00
this_func = next_func ;
next_func = xstate_enable ;
this_func ( ) ;
2010-07-20 20:50:51 +02:00
}