2008-06-24 05:32:36 +04:00
/*
 *  Copyright (C) 2001 Ben. Herrenschmidt (benh@kernel.crashing.org)
 *
 *  Modifications for ppc64:
 *      Copyright (C) 2003 Dave Engebretsen <engebret@us.ibm.com>
 *
 *  Copyright 2008 Michael Ellerman, IBM Corporation.
 *
 *  This program is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU General Public License
 *  as published by the Free Software Foundation; either version
 *  2 of the License, or (at your option) any later version.
 */
2010-06-29 01:08:29 +04:00
# include <linux/types.h>
2016-07-23 12:12:38 +03:00
# include <linux/jump_label.h>
2008-06-24 05:32:36 +04:00
# include <linux/kernel.h>
2008-06-24 05:33:03 +04:00
# include <linux/string.h>
# include <linux/init.h>
2008-06-24 05:32:36 +04:00
# include <asm/cputable.h>
# include <asm/code-patching.h>
2011-11-14 16:54:47 +04:00
# include <asm/page.h>
# include <asm/sections.h>
2016-07-05 08:03:41 +03:00
# include <asm/setup.h>
# include <asm/firmware.h>
2008-06-24 05:32:36 +04:00
/*
 * One entry of a feature fixup table.
 *
 * A section is left untouched when (features & mask) == value; otherwise
 * the default code is overwritten with the alternative code and any
 * remaining space is filled with nops.
 *
 * All four *_off members are byte offsets relative to the address of the
 * entry itself; calc_addr() converts them back into pointers.
 *
 * The alternative ("else") case must not be larger than the default case.
 * An empty alternative (alt_start_off == alt_end_off) gives the classic
 * behaviour of simply nop'ing out the default code.
 */
struct fixup_entry {
	unsigned long	mask;		/* feature bits examined for this section */
	unsigned long	value;		/* value of the masked bits that keeps the default code */
	long		start_off;	/* start of the default code */
	long		end_off;	/* end (exclusive) of the default code */
	long		alt_start_off;	/* start of the alternative code */
	long		alt_end_off;	/* end (exclusive) of the alternative code */
};
2008-06-24 05:33:02 +04:00
/*
 * Convert an offset stored in a fixup entry back into a code address.
 *
 * Offsets are recorded relative to the entry itself (as a negative offset
 * from the start of the entry, which is what lets the VDSO use the same
 * scheme), so the real address is simply the entry's address plus the
 * stored offset.
 */
static unsigned int *calc_addr(struct fixup_entry *fcur, long offset)
{
	unsigned long base = (unsigned long)fcur;

	return (unsigned int *)(base + offset);
}
/*
 * Copy one instruction of an alternative section to its final location.
 *
 * @src:       instruction inside the alternative section
 * @dest:      slot in the default section that receives it
 * @alt_start: first instruction of the alternative section
 * @alt_end:   one past the last instruction of the alternative section
 *
 * A relative branch whose target lies outside [alt_start, alt_end) is
 * re-encoded for its new address with translate_branch(); a branch that
 * stays inside the section is copied verbatim.
 *
 * Returns 0 on success, 1 if translate_branch() could not produce an
 * instruction (it returned 0), in which case nothing is written.
 */
static int patch_alt_instruction(unsigned int *src, unsigned int *dest,
				 unsigned int *alt_start, unsigned int *alt_end)
{
	unsigned int insn = *src;

	if (instr_is_relative_branch(insn)) {
		unsigned int *target = (unsigned int *)branch_target(src);
		int stays_inside = target >= alt_start && target < alt_end;

		/* Only branches leaving the section need translating */
		if (!stays_inside) {
			insn = translate_branch(dest, src);
			if (!insn)
				return 1;
		}
	}

	patch_instruction(dest, insn);

	return 0;
}
static int patch_feature_section ( unsigned long value , struct fixup_entry * fcur )
{
unsigned int * start , * end , * alt_start , * alt_end , * src , * dest ;
start = calc_addr ( fcur , fcur - > start_off ) ;
end = calc_addr ( fcur , fcur - > end_off ) ;
alt_start = calc_addr ( fcur , fcur - > alt_start_off ) ;
alt_end = calc_addr ( fcur , fcur - > alt_end_off ) ;
if ( ( alt_end - alt_start ) > ( end - start ) )
return 1 ;
2008-06-24 05:32:36 +04:00
if ( ( value & fcur - > mask ) = = fcur - > value )
2008-06-24 05:33:02 +04:00
return 0 ;
2008-06-24 05:32:36 +04:00
2008-06-24 05:33:02 +04:00
src = alt_start ;
dest = start ;
2008-06-24 05:32:36 +04:00
2008-06-24 05:33:02 +04:00
for ( ; src < alt_end ; src + + , dest + + ) {
if ( patch_alt_instruction ( src , dest , alt_start , alt_end ) )
return 1 ;
2008-06-24 05:32:36 +04:00
}
2008-06-24 05:33:02 +04:00
for ( ; dest < end ; dest + + )
2009-02-10 23:10:44 +03:00
patch_instruction ( dest , PPC_INST_NOP ) ;
2008-06-24 05:33:02 +04:00
return 0 ;
2008-06-24 05:32:36 +04:00
}
void do_feature_fixups ( unsigned long value , void * fixup_start , void * fixup_end )
{
struct fixup_entry * fcur , * fend ;
fcur = fixup_start ;
fend = fixup_end ;
2008-06-24 05:33:02 +04:00
for ( ; fcur < fend ; fcur + + ) {
if ( patch_feature_section ( value , fcur ) ) {
2008-07-17 08:46:00 +04:00
WARN_ON ( 1 ) ;
2008-06-24 05:33:02 +04:00
printk ( " Unable to patch feature section at %p - %p " \
" with %p - %p \n " ,
calc_addr ( fcur , fcur - > start_off ) ,
calc_addr ( fcur , fcur - > end_off ) ,
calc_addr ( fcur , fcur - > alt_start_off ) ,
calc_addr ( fcur , fcur - > alt_end_off ) ) ;
}
}
2008-06-24 05:32:36 +04:00
}
2008-06-24 05:33:03 +04:00
2008-07-01 19:16:40 +04:00
void do_lwsync_fixups ( unsigned long value , void * fixup_start , void * fixup_end )
{
2010-02-26 10:29:17 +03:00
long * start , * end ;
unsigned int * dest ;
2008-07-01 19:16:40 +04:00
if ( ! ( value & CPU_FTR_LWSYNC ) )
return ;
start = fixup_start ;
end = fixup_end ;
for ( ; start < end ; start + + ) {
dest = ( void * ) start + * start ;
2009-02-10 23:10:44 +03:00
patch_instruction ( dest , PPC_INST_LWSYNC ) ;
2008-07-01 19:16:40 +04:00
}
}
2016-07-05 08:03:41 +03:00
/*
 * On a relocatable 64-bit kernel that is not running at physical address
 * zero, copy the code between _stext and __end_interrupts, word by word,
 * from KERNELBASE + PHYSICAL_START down to KERNELBASE.
 *
 * NOTE(review): presumably this keeps the low copy of the interrupt
 * vectors in sync with the patched running kernel - confirm.
 *
 * Does nothing on other configurations.
 */
static void do_final_fixups(void)
{
#if defined(CONFIG_PPC64) && defined(CONFIG_RELOCATABLE)
	unsigned long remaining;
	int *from, *to;

	if (PHYSICAL_START == 0)
		return;

	from = (int *)(KERNELBASE + PHYSICAL_START);
	to = (int *)KERNELBASE;

	for (remaining = (__end_interrupts - _stext) / sizeof(int);
	     remaining > 0; remaining--) {
		patch_instruction(to, *from);
		from++;
		to++;
	}
#endif
}
2016-07-26 15:29:18 +03:00
/*
 * Feature words as they were when apply_feature_fixups() patched the
 * kernel. check_features() compares them with the current values and
 * warns if anything changed after patching.
 */
static unsigned long __initdata saved_cpu_features ;
static unsigned int __initdata saved_mmu_features ;
# ifdef CONFIG_PPC64
static unsigned long __initdata saved_firmware_features ;
# endif
/*
 * Patch the kernel according to the CPU, MMU and firmware features in
 * effect, then initialise the jump-label based feature checks.
 *
 * The feature words used for patching are remembered so that
 * check_features() can later detect changes made after this point.
 */
void __init apply_feature_fixups(void)
{
	struct cpu_spec *spec = PTRRELOC(*PTRRELOC(&cur_cpu_spec));

	/* Remember what we patched with */
	*PTRRELOC(&saved_cpu_features) = spec->cpu_features;
	*PTRRELOC(&saved_mmu_features) = spec->mmu_features;

	/*
	 * Apply the CPU-specific and firmware specific fixups to kernel text
	 * (nop out sections not relevant to this CPU or this firmware).
	 */
	do_feature_fixups(spec->cpu_features,
			  PTRRELOC(&__start___ftr_fixup),
			  PTRRELOC(&__stop___ftr_fixup));

	do_feature_fixups(spec->mmu_features,
			  PTRRELOC(&__start___mmu_ftr_fixup),
			  PTRRELOC(&__stop___mmu_ftr_fixup));

	do_lwsync_fixups(spec->cpu_features,
			 PTRRELOC(&__start___lwsync_fixup),
			 PTRRELOC(&__stop___lwsync_fixup));

#ifdef CONFIG_PPC64
	saved_firmware_features = powerpc_firmware_features;
	do_feature_fixups(powerpc_firmware_features,
			  &__start___fw_ftr_fixup, &__stop___fw_ftr_fixup);
#endif
	do_final_fixups();

	/*
	 * Initialise jump label. This causes all the cpu/mmu_has_feature()
	 * checks to take on their correct polarity based on the current set of
	 * CPU/MMU features.
	 */
	jump_label_init();

	/*
	 * NOTE(review): presumably these set up the jump-label keys that let
	 * cpu_has_feature()/mmu_has_feature() checks in C code be patched
	 * into a single nop or branch - confirm against their definitions.
	 */
	cpu_feature_keys_init();
	mmu_feature_keys_init();
}
2016-07-26 15:29:18 +03:00
/*
 * Late sanity check: warn if any feature word differs from the value
 * that was saved when the feature sections were patched.
 *
 * Always returns 0.
 */
static int __init check_features(void)
{
	WARN(cur_cpu_spec->cpu_features != saved_cpu_features,
	     " CPU features changed after feature patching! \n ");

	WARN(cur_cpu_spec->mmu_features != saved_mmu_features,
	     " MMU features changed after feature patching! \n ");

#ifdef CONFIG_PPC64
	WARN(powerpc_firmware_features != saved_firmware_features,
	     " Firmware features changed after feature patching! \n ");
#endif

	return 0;
}
late_initcall(check_features);
2008-06-24 05:33:03 +04:00
# ifdef CONFIG_FTR_FIXUP_SELFTEST
/*
 * Report a failed self-test expectation together with the source line.
 *
 * Wrapped in do { } while (0) so that "check(...);" is exactly one
 * statement and can be used safely in an unbraced if/else.
 */
#define check(x)							\
	do {								\
		if (!(x))						\
			printk(" feature-fixups: test failed at line %d \n ", \
			       __LINE__);				\
	} while (0)
/*
 * Scratch fixup entry that the self-tests below fill in by hand.
 *
 * This must be after the text it fixes up, vmlinux.lds.S enforces that atm
 */
static struct fixup_entry fixup ;
/*
 * Inverse of calc_addr(): the byte offset of @p relative to @entry, in
 * the form stored in a fixup entry's *_off members.
 */
static long calc_offset(struct fixup_entry *entry, unsigned int *p)
{
	unsigned long base = (unsigned long)entry;
	unsigned long addr = (unsigned long)p;

	return addr - base;
}
2014-08-20 02:55:18 +04:00
static void test_basic_patching ( void )
2008-06-24 05:33:03 +04:00
{
extern unsigned int ftr_fixup_test1 ;
extern unsigned int end_ftr_fixup_test1 ;
extern unsigned int ftr_fixup_test1_orig ;
extern unsigned int ftr_fixup_test1_expected ;
int size = & end_ftr_fixup_test1 - & ftr_fixup_test1 ;
fixup . value = fixup . mask = 8 ;
fixup . start_off = calc_offset ( & fixup , & ftr_fixup_test1 + 1 ) ;
fixup . end_off = calc_offset ( & fixup , & ftr_fixup_test1 + 2 ) ;
fixup . alt_start_off = fixup . alt_end_off = 0 ;
/* Sanity check */
check ( memcmp ( & ftr_fixup_test1 , & ftr_fixup_test1_orig , size ) = = 0 ) ;
/* Check we don't patch if the value matches */
patch_feature_section ( 8 , & fixup ) ;
check ( memcmp ( & ftr_fixup_test1 , & ftr_fixup_test1_orig , size ) = = 0 ) ;
/* Check we do patch if the value doesn't match */
patch_feature_section ( 0 , & fixup ) ;
check ( memcmp ( & ftr_fixup_test1 , & ftr_fixup_test1_expected , size ) = = 0 ) ;
/* Check we do patch if the mask doesn't match */
memcpy ( & ftr_fixup_test1 , & ftr_fixup_test1_orig , size ) ;
check ( memcmp ( & ftr_fixup_test1 , & ftr_fixup_test1_orig , size ) = = 0 ) ;
patch_feature_section ( ~ 8 , & fixup ) ;
check ( memcmp ( & ftr_fixup_test1 , & ftr_fixup_test1_expected , size ) = = 0 ) ;
}
/*
 * Self-test: a one-instruction section is replaced by its
 * one-instruction alternative when the feature value does not match.
 */
static void test_alternative_patching(void)
{
	extern unsigned int ftr_fixup_test2;
	extern unsigned int end_ftr_fixup_test2;
	extern unsigned int ftr_fixup_test2_orig;
	extern unsigned int ftr_fixup_test2_alt;
	extern unsigned int ftr_fixup_test2_expected;
	/*
	 * The pointer difference counts instructions, but memcmp()/memcpy()
	 * want a byte count - scale it so the whole region is covered.
	 */
	int size = (&end_ftr_fixup_test2 - &ftr_fixup_test2) *
		   sizeof(unsigned int);

	fixup.value = fixup.mask = 0xF;
	fixup.start_off = calc_offset(&fixup, &ftr_fixup_test2 + 1);
	fixup.end_off = calc_offset(&fixup, &ftr_fixup_test2 + 2);
	fixup.alt_start_off = calc_offset(&fixup, &ftr_fixup_test2_alt);
	fixup.alt_end_off = calc_offset(&fixup, &ftr_fixup_test2_alt + 1);

	/* Sanity check */
	check(memcmp(&ftr_fixup_test2, &ftr_fixup_test2_orig, size) == 0);

	/* Check we don't patch if the value matches */
	patch_feature_section(0xF, &fixup);
	check(memcmp(&ftr_fixup_test2, &ftr_fixup_test2_orig, size) == 0);

	/* Check we do patch if the value doesn't match */
	patch_feature_section(0, &fixup);
	check(memcmp(&ftr_fixup_test2, &ftr_fixup_test2_expected, size) == 0);

	/* Check we do patch if the mask doesn't match */
	memcpy(&ftr_fixup_test2, &ftr_fixup_test2_orig, size);
	check(memcmp(&ftr_fixup_test2, &ftr_fixup_test2_orig, size) == 0);
	patch_feature_section(~0xF, &fixup);
	check(memcmp(&ftr_fixup_test2, &ftr_fixup_test2_expected, size) == 0);
}
/*
 * Self-test: an alternative that is larger than the default section is
 * rejected with an error and nothing is patched.
 */
static void test_alternative_case_too_big(void)
{
	extern unsigned int ftr_fixup_test3;
	extern unsigned int end_ftr_fixup_test3;
	extern unsigned int ftr_fixup_test3_orig;
	extern unsigned int ftr_fixup_test3_alt;
	/*
	 * The pointer difference counts instructions, but memcmp() wants a
	 * byte count - scale it so the whole region is covered.
	 */
	int size = (&end_ftr_fixup_test3 - &ftr_fixup_test3) *
		   sizeof(unsigned int);

	fixup.value = fixup.mask = 0xC;
	fixup.start_off = calc_offset(&fixup, &ftr_fixup_test3 + 1);
	fixup.end_off = calc_offset(&fixup, &ftr_fixup_test3 + 2);
	fixup.alt_start_off = calc_offset(&fixup, &ftr_fixup_test3_alt);
	fixup.alt_end_off = calc_offset(&fixup, &ftr_fixup_test3_alt + 2);

	/* Sanity check */
	check(memcmp(&ftr_fixup_test3, &ftr_fixup_test3_orig, size) == 0);

	/* Expect nothing to be patched, and the error returned to us */
	check(patch_feature_section(0xF, &fixup) == 1);
	check(memcmp(&ftr_fixup_test3, &ftr_fixup_test3_orig, size) == 0);
	check(patch_feature_section(0, &fixup) == 1);
	check(memcmp(&ftr_fixup_test3, &ftr_fixup_test3_orig, size) == 0);
	check(patch_feature_section(~0xF, &fixup) == 1);
	check(memcmp(&ftr_fixup_test3, &ftr_fixup_test3_orig, size) == 0);
}
/*
 * Self-test: an alternative that is shorter than the default section is
 * patched in and the remainder padded with nops. Uses a flag in the top
 * byte of the feature word to exercise high bits as well.
 */
static void test_alternative_case_too_small(void)
{
	extern unsigned int ftr_fixup_test4;
	extern unsigned int end_ftr_fixup_test4;
	extern unsigned int ftr_fixup_test4_orig;
	extern unsigned int ftr_fixup_test4_alt;
	extern unsigned int ftr_fixup_test4_expected;
	/*
	 * The pointer difference counts instructions, but memcmp()/memcpy()
	 * want a byte count - scale it so the whole region is covered.
	 */
	int size = (&end_ftr_fixup_test4 - &ftr_fixup_test4) *
		   sizeof(unsigned int);
	unsigned long flag;

	/* Check a high-bit flag */
	flag = 1UL << ((sizeof(unsigned long) - 1) * 8);
	fixup.value = fixup.mask = flag;
	fixup.start_off = calc_offset(&fixup, &ftr_fixup_test4 + 1);
	fixup.end_off = calc_offset(&fixup, &ftr_fixup_test4 + 5);
	fixup.alt_start_off = calc_offset(&fixup, &ftr_fixup_test4_alt);
	fixup.alt_end_off = calc_offset(&fixup, &ftr_fixup_test4_alt + 2);

	/* Sanity check */
	check(memcmp(&ftr_fixup_test4, &ftr_fixup_test4_orig, size) == 0);

	/* Check we don't patch if the value matches */
	patch_feature_section(flag, &fixup);
	check(memcmp(&ftr_fixup_test4, &ftr_fixup_test4_orig, size) == 0);

	/* Check we do patch if the value doesn't match */
	patch_feature_section(0, &fixup);
	check(memcmp(&ftr_fixup_test4, &ftr_fixup_test4_expected, size) == 0);

	/* Check we do patch if the mask doesn't match */
	memcpy(&ftr_fixup_test4, &ftr_fixup_test4_orig, size);
	check(memcmp(&ftr_fixup_test4, &ftr_fixup_test4_orig, size) == 0);
	patch_feature_section(~flag, &fixup);
	check(memcmp(&ftr_fixup_test4, &ftr_fixup_test4_expected, size) == 0);
}
/*
 * Self-test: compare the ftr_fixup_test5 region with its expected
 * contents. No patching is done here; the region is only compared.
 */
static void test_alternative_case_with_branch(void)
{
	extern unsigned int ftr_fixup_test5;
	extern unsigned int end_ftr_fixup_test5;
	extern unsigned int ftr_fixup_test5_expected;
	/*
	 * The pointer difference counts instructions, but memcmp() wants a
	 * byte count - scale it so the whole region is covered.
	 */
	int size = (&end_ftr_fixup_test5 - &ftr_fixup_test5) *
		   sizeof(unsigned int);

	check(memcmp(&ftr_fixup_test5, &ftr_fixup_test5_expected, size) == 0);
}
/*
 * Self-test: compare the ftr_fixup_test6 region with its expected
 * contents. No patching is done here; the region is only compared.
 */
static void test_alternative_case_with_external_branch(void)
{
	extern unsigned int ftr_fixup_test6;
	extern unsigned int end_ftr_fixup_test6;
	extern unsigned int ftr_fixup_test6_expected;
	/*
	 * The pointer difference counts instructions, but memcmp() wants a
	 * byte count - scale it so the whole region is covered.
	 */
	int size = (&end_ftr_fixup_test6 - &ftr_fixup_test6) *
		   sizeof(unsigned int);

	check(memcmp(&ftr_fixup_test6, &ftr_fixup_test6_expected, size) == 0);
}
/*
 * Self-test: compare the ftr_fixup_test_FTR_macros region with the
 * expected contents that follow it.
 */
static void test_cpu_macros(void)
{
	extern u8 ftr_fixup_test_FTR_macros;
	extern u8 ftr_fixup_test_FTR_macros_expected;
	u8 *actual = &ftr_fixup_test_FTR_macros;
	u8 *expected = &ftr_fixup_test_FTR_macros_expected;
	/* u8 pointers, so this is already a byte count */
	unsigned long size = expected - actual;

	/* The fixups have already been done for us during boot */
	check(memcmp(actual, expected, size) == 0);
}
/*
 * Self-test: compare the ftr_fixup_test_FW_FTR_macros region with the
 * expected contents that follow it. Only built for CONFIG_PPC64;
 * otherwise this is a no-op.
 */
static void test_fw_macros(void)
{
#ifdef CONFIG_PPC64
	extern u8 ftr_fixup_test_FW_FTR_macros;
	extern u8 ftr_fixup_test_FW_FTR_macros_expected;
	u8 *actual = &ftr_fixup_test_FW_FTR_macros;
	u8 *expected = &ftr_fixup_test_FW_FTR_macros_expected;
	/* u8 pointers, so this is already a byte count */
	unsigned long size = expected - actual;

	/* The fixups have already been done for us during boot */
	check(memcmp(actual, expected, size) == 0);
#endif
}
2008-07-01 19:16:40 +04:00
static void test_lwsync_macros ( void )
{
2010-06-29 01:08:29 +04:00
extern u8 lwsync_fixup_test ;
extern u8 end_lwsync_fixup_test ;
extern u8 lwsync_fixup_test_expected_LWSYNC ;
extern u8 lwsync_fixup_test_expected_SYNC ;
2008-07-01 19:16:40 +04:00
unsigned long size = & end_lwsync_fixup_test -
& lwsync_fixup_test ;
/* The fixups have already been done for us during boot */
if ( cur_cpu_spec - > cpu_features & CPU_FTR_LWSYNC ) {
check ( memcmp ( & lwsync_fixup_test ,
& lwsync_fixup_test_expected_LWSYNC , size ) = = 0 ) ;
} else {
check ( memcmp ( & lwsync_fixup_test ,
& lwsync_fixup_test_expected_SYNC , size ) = = 0 ) ;
}
}
2008-06-24 05:33:03 +04:00
/*
 * Run all feature fixup self-tests, in order, as a late initcall.
 * Failures are reported by the individual tests; this always returns 0.
 */
static int __init test_feature_fixups(void)
{
	void (*const tests[])(void) = {
		test_basic_patching,
		test_alternative_patching,
		test_alternative_case_too_big,
		test_alternative_case_too_small,
		test_alternative_case_with_branch,
		test_alternative_case_with_external_branch,
		test_cpu_macros,
		test_fw_macros,
		test_lwsync_macros,
	};
	unsigned int i;

	printk(KERN_DEBUG " Running feature fixup self-tests ... \n ");

	for (i = 0; i < sizeof(tests) / sizeof(tests[0]); i++)
		tests[i]();

	return 0;
}
late_initcall(test_feature_fixups);
# endif /* CONFIG_FTR_FIXUP_SELFTEST */