2005-04-17 02:20:36 +04:00
/*
* c 2001 PPC 64 Team , IBM Corp
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation ; either version
* 2 of the License , or ( at your option ) any later version .
*/
2011-05-10 23:28:52 +04:00
# include <linux/smp.h>
2011-07-23 02:24:23 +04:00
# include <linux/export.h>
2010-07-12 08:36:09 +04:00
# include <linux/memblock.h>
2005-04-17 02:20:36 +04:00
# include <asm/lppaca.h>
# include <asm/paca.h>
powerpc: Make the 64-bit kernel as a position-independent executable
This implements CONFIG_RELOCATABLE for 64-bit by making the kernel as
a position-independent executable (PIE) when it is set. This involves
processing the dynamic relocations in the image in the early stages of
booting, even if the kernel is being run at the address it is linked at,
since the linker does not necessarily fill in words in the image for
which there are dynamic relocations. (In fact the linker does fill in
such words for 64-bit executables, though not for 32-bit executables,
so in principle we could avoid calling relocate() entirely when we're
running a 64-bit kernel at the linked address.)
The dynamic relocations are processed by a new function relocate(addr),
where the addr parameter is the virtual address where the image will be
run. In fact we call it twice; once before calling prom_init, and again
when starting the main kernel. This means that reloc_offset() returns
0 in prom_init (since it has been relocated to the address it is running
at), which necessitated a few adjustments.
This also changes __va and __pa to use an equivalent definition that is
simpler. With the relocatable kernel, PAGE_OFFSET and MEMORY_START are
constants (for 64-bit) whereas PHYSICAL_START is a variable (and
KERNELBASE ideally should be too, but isn't yet).
With this, relocatable kernels still copy themselves down to physical
address 0 and run there.
Signed-off-by: Paul Mackerras <paulus@samba.org>
2008-08-30 05:43:47 +04:00
# include <asm/sections.h>
2009-07-24 03:15:42 +04:00
# include <asm/pgtable.h>
2010-05-13 23:40:11 +04:00
# include <asm/kexec.h>
2005-04-17 02:20:36 +04:00
/* This symbol is provided by the linker - let it fill in the paca
* field correctly */
extern unsigned long __toc_start ;
2009-06-03 01:17:41 +04:00
# ifdef CONFIG_PPC_BOOK3S
2006-01-13 02:26:42 +03:00
/*
2008-04-10 10:43:47 +04:00
* The structure which the hypervisor knows about - this structure
2006-01-13 02:26:42 +03:00
* should not cross a page boundary . The vpa_init / register_vpa call
* is now known to fail if the lppaca structure crosses a page
2012-03-15 22:18:00 +04:00
* boundary . The lppaca is also used on POWER5 pSeries boxes .
* The lppaca is 640 bytes long , and cannot readily
2008-04-10 10:43:47 +04:00
* change since the hypervisor knows its layout , so a 1 kB alignment
* will suffice to ensure that it doesn ' t cross a page boundary .
2006-01-13 02:26:42 +03:00
*/
struct lppaca lppaca [ ] = {
2010-08-13 00:18:48 +04:00
[ 0 . . . ( NR_LPPACAS - 1 ) ] = {
2013-08-06 20:01:46 +04:00
. desc = cpu_to_be32 ( 0xd397d781 ) , /* "LpPa" */
. size = cpu_to_be16 ( sizeof ( struct lppaca ) ) ,
2006-01-13 02:26:42 +03:00
. fpregs_in_use = 1 ,
2013-08-06 20:01:46 +04:00
. slb_count = cpu_to_be16 ( 64 ) ,
2006-01-13 02:26:42 +03:00
. vmxregs_in_use = 0 ,
2008-10-22 09:53:45 +04:00
. page_ins = 0 ,
2006-01-13 02:26:42 +03:00
} ,
} ;
2010-08-13 00:18:48 +04:00
/* Dynamically allocated lppacas for CPU numbers at or above NR_LPPACAS. */
static struct lppaca * extra_lppacas ;
/* Size in bytes of the extra_lppacas area; stays zero when none was allocated. */
static long __initdata lppaca_size ;
2013-09-29 16:41:18 +04:00
/*
 * Reserve memory for the lppacas that do not fit in the static lppaca[]
 * array.
 *
 * @nr_cpus: number of CPUs that need an lppaca
 * @limit:   upper bound handed to memblock_alloc_base()
 *
 * Does nothing when nr_cpus is covered by the static array.  Otherwise the
 * page-aligned size is recorded in lppaca_size and the kernel virtual
 * address of the new area in extra_lppacas.
 */
static void __init allocate_lppacas(int nr_cpus, unsigned long limit)
{
	int nr_extra;

	/* The static array is large enough: nothing to allocate. */
	if (nr_cpus <= NR_LPPACAS)
		return;

	nr_extra = nr_cpus - NR_LPPACAS;
	lppaca_size = PAGE_ALIGN(sizeof(struct lppaca) * nr_extra);

	extra_lppacas = __va(memblock_alloc_base(lppaca_size, PAGE_SIZE,
						 limit));
}
2013-09-29 16:41:18 +04:00
/*
 * Return the lppaca belonging to @cpu.
 *
 * CPUs below NR_LPPACAS use their slot in the static lppaca[] array.  Any
 * other CPU gets a slot in extra_lppacas, which is first initialised as a
 * copy of lppaca[0].
 */
static struct lppaca * __init new_lppaca(int cpu)
{
	struct lppaca *extra;

	if (cpu >= NR_LPPACAS) {
		extra = &extra_lppacas[cpu - NR_LPPACAS];
		/* Seed the dynamic entry from the static template. */
		*extra = lppaca[0];
		return extra;
	}

	return &lppaca[cpu];
}
2013-09-29 16:41:18 +04:00
/*
 * Give back the tail of the extra_lppacas area that is no longer needed.
 *
 * The extra lppacas are indexed by CPU number (see new_lppaca()), so the
 * part that must be kept is sized by nr_cpu_ids, the same bound
 * free_unused_pacas() uses for the paca array.  Sizing it by the number of
 * possible CPUs would free an lppaca that is still referenced by a paca
 * whenever the possible CPU numbers are not contiguous.
 *
 * Does nothing if no extra lppacas were allocated or if nothing can be
 * trimmed.  On a successful trim lppaca_size is updated to the new size.
 */
static void __init free_lppacas(void)
{
	long nr_extra;
	long new_size = 0;

	if (!lppaca_size)
		return;

	/*
	 * Do the subtraction in signed arithmetic so that a CPU count below
	 * NR_LPPACAS yields a negative value (keep nothing) rather than
	 * wrapping around to a huge positive one.
	 */
	nr_extra = (long)nr_cpu_ids - NR_LPPACAS;
	if (nr_extra > 0)
		new_size = PAGE_ALIGN(nr_extra * sizeof(struct lppaca));

	/* Nothing to trim. */
	if (new_size >= lppaca_size)
		return;

	memblock_free(__pa(extra_lppacas) + new_size, lppaca_size - new_size);
	lppaca_size = new_size;
}
# else
2010-10-08 02:05:08 +04:00
/* Without CONFIG_PPC_BOOK3S there are no lppacas, so there is nothing to allocate. */
static inline void allocate_lppacas ( int nr_cpus , unsigned long limit ) { }
2010-08-13 00:18:48 +04:00
/* Without CONFIG_PPC_BOOK3S there are no lppacas, so there is nothing to free. */
static inline void free_lppacas ( void ) { }
2009-06-03 01:17:41 +04:00
# endif /* CONFIG_PPC_BOOK3S */
# ifdef CONFIG_PPC_STD_MMU_64
2006-08-07 10:19:19 +04:00
/*
* 3 persistent SLBs are registered here . The buffer will be zero
* initially , hence they will all be invalid until we actually write them .
*/
2013-12-05 07:42:40 +04:00
/* Array of SLB shadow buffers indexed by CPU number; allocated and zeroed by allocate_slb_shadows(). */
static struct slb_shadow * slb_shadow ;
/*
 * Allocate and zero one SLB shadow buffer per CPU.
 *
 * @nr_cpus: number of buffers to allocate
 * @limit:   upper bound handed to memblock_alloc_base()
 *
 * The page-aligned area is cleared and its kernel virtual address is
 * stored in slb_shadow.
 */
static void __init allocate_slb_shadows(int nr_cpus, int limit)
{
	int bytes;
	void *area;

	bytes = PAGE_ALIGN(sizeof(struct slb_shadow) * nr_cpus);
	area = __va(memblock_alloc_base(bytes, PAGE_SIZE, limit));

	memset(area, 0, bytes);
	slb_shadow = area;
}
/*
 * Fill in the header fields of @cpu's SLB shadow buffer and return it.
 *
 * The persistent count is set to SLB_NUM_BOLTED and the buffer length to
 * the size of one struct slb_shadow, both stored via cpu_to_be32().
 */
static struct slb_shadow * __init init_slb_shadow(int cpu)
{
	struct slb_shadow *shadow = slb_shadow + cpu;

	shadow->buffer_length = cpu_to_be32(sizeof(*shadow));
	shadow->persistent = cpu_to_be32(SLB_NUM_BOLTED);

	return shadow;
}
# else /* CONFIG_PPC_STD_MMU_64 */
/* Without CONFIG_PPC_STD_MMU_64 there are no SLB shadow buffers to allocate. */
static void __init allocate_slb_shadows ( int nr_cpus , int limit ) { }
2006-08-07 10:19:19 +04:00
2009-06-03 01:17:41 +04:00
# endif /* CONFIG_PPC_STD_MMU_64 */
2005-11-09 05:38:01 +03:00
/* The Paca is an array with one entry per processor. Each contains an
2005-04-17 02:20:36 +04:00
* lppaca , which contains the information shared between the
2005-11-24 08:34:45 +03:00
* hypervisor and Linux .
2005-04-17 02:20:36 +04:00
* On systems with hardware multi - threading , there are two threads
* per processor . The Paca array must contain an entry for each thread .
* The VPD Areas will give a max logical processors = 2 * max physical
* processors . The processor VPD array needs one entry per physical
* processor ( not thread ) .
*/
2010-01-28 16:23:22 +03:00
/* Base of the paca array; allocated by allocate_pacas() and indexed by CPU number. */
struct paca_struct * paca ;
2005-04-17 02:20:36 +04:00
/* Export the paca pointer so that modules can reference it. */
EXPORT_SYMBOL ( paca ) ;
2008-04-24 07:43:49 +04:00
2010-01-28 16:23:22 +03:00
/*
 * Fill in the boot-time fields of one paca.
 *
 * @new_paca: paca to initialise
 * @cpu:      CPU number the paca belongs to; stored as paca_index and used
 *            to pick the matching lppaca and SLB shadow buffer
 */
void __init initialise_paca(struct paca_struct *new_paca, int cpu)
{
#ifdef CONFIG_PPC_BOOK3S
	new_paca->lppaca_ptr = new_lppaca(cpu);
#else
	new_paca->kernel_pgd = swapper_pg_dir;
#endif
	new_paca->lock_token = 0x8000;
	new_paca->paca_index = cpu;

	/*
	 * The TOC register (GPR2) points 32kB into the TOC, so that 64kB of
	 * the TOC can be addressed using a single machine instruction.
	 */
	new_paca->kernel_toc = (unsigned long)(&__toc_start) + 0x8000UL;

	new_paca->kernelbase = (unsigned long)_stext;
	new_paca->kernel_msr = MSR_KERNEL;
	new_paca->hw_cpu_id = 0xffff;
	new_paca->kexec_state = KEXEC_STATE_NONE;
	new_paca->__current = &init_task;
	new_paca->data_offset = 0xfeeeeeeeeeeeeeeeULL;
#ifdef CONFIG_PPC_STD_MMU_64
	new_paca->slb_shadow_ptr = init_slb_shadow(cpu);
#endif /* CONFIG_PPC_STD_MMU_64 */
}
2010-07-08 01:55:37 +04:00
/* Put the paca pointer into r13 and SPRG_PACA */
/*
 * Install new_paca: assign it to local_paca and write it to the SPRG
 * register(s) selected by the configuration below.
 *
 * @new_paca: paca to install
 */
void setup_paca ( struct paca_struct * new_paca )
{
2011-01-20 09:50:21 +03:00
/* Setup r13 */
2010-07-08 01:55:37 +04:00
local_paca = new_paca ;
2011-01-20 09:50:21 +03:00
2010-07-08 01:55:37 +04:00
# ifdef CONFIG_PPC_BOOK3E
2011-01-20 09:50:21 +03:00
/* On Book3E, initialize the TLB miss exception frames */
2010-07-08 01:55:37 +04:00
mtspr ( SPRN_SPRG_TLB_EXFRAME , local_paca - > extlb ) ;
2011-01-20 09:50:21 +03:00
# else
/* In HV mode, we setup both HPACA and PACA to avoid problems
* if we do a GET_PACA ( ) before the feature fixups have been
* applied
*/
powerpc, KVM: Split HVMODE_206 cpu feature bit into separate HV and architecture bits
This replaces the single CPU_FTR_HVMODE_206 bit with two bits, one to
indicate that we have a usable hypervisor mode, and another to indicate
that the processor conforms to PowerISA version 2.06. We also add
another bit to indicate that the processor conforms to ISA version 2.01
and set that for PPC970 and derivatives.
Some PPC970 chips (specifically those in Apple machines) have a
hypervisor mode in that MSR[HV] is always 1, but the hypervisor mode
is not useful in the sense that there is no way to run any code in
supervisor mode (HV=0 PR=0). On these processors, the LPES0 and LPES1
bits in HID4 are always 0, and we use that as a way of detecting that
hypervisor mode is not useful.
Where we have a feature section in assembly code around code that
only applies on POWER7 in hypervisor mode, we use a construct like
END_FTR_SECTION_IFSET(CPU_FTR_HVMODE | CPU_FTR_ARCH_206)
The definition of END_FTR_SECTION_IFSET is such that the code will
be enabled (not overwritten with nops) only if all bits in the
provided mask are set.
Note that the CPU feature check in __tlbie() only needs to check the
ARCH_206 bit, not the HVMODE bit, because __tlbie() can only get called
if we are running bare-metal, i.e. in hypervisor mode.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2011-06-29 04:26:11 +04:00
if ( cpu_has_feature ( CPU_FTR_HVMODE ) )
2011-01-20 09:50:21 +03:00
mtspr ( SPRN_SPRG_HPACA , local_paca ) ;
2010-07-08 01:55:37 +04:00
# endif
2011-01-20 09:50:21 +03:00
/* SPRG_PACA is written unconditionally, in both the Book3E and the non-Book3E build */
mtspr ( SPRN_SPRG_PACA , local_paca ) ;
2010-07-08 01:55:37 +04:00
}
2010-01-28 16:23:22 +03:00
/* Page-aligned size in bytes of the paca array; set by allocate_pacas() and reduced by free_unused_pacas(). */
static int __initdata paca_size ;
/*
 * Allocate and initialise the paca array together with the per-CPU
 * structures that hang off it (lppacas and SLB shadow buffers).
 *
 * One paca is set up for every CPU number below nr_cpu_ids.
 */
void __init allocate_pacas(void)
{
	int limit, i;

	/*
	 * We can't take SLB misses on the paca, and we want to access them
	 * in real mode, so keep the allocations within the RMA and also
	 * within the first segment.
	 */
	limit = min(0x10000000ULL, ppc64_rma_size);

	paca_size = PAGE_ALIGN(sizeof(struct paca_struct) * nr_cpu_ids);
	paca = __va(memblock_alloc_base(paca_size, PAGE_SIZE, limit));
	memset(paca, 0, paca_size);

	printk(KERN_DEBUG " Allocated %u bytes for %d pacas at %p \n ",
	       paca_size, nr_cpu_ids, paca);

	allocate_lppacas(nr_cpu_ids, limit);
	allocate_slb_shadows(nr_cpu_ids, limit);

	/* Can't use for_each_*_cpu, as they aren't functional yet */
	for (i = 0; i < nr_cpu_ids; i++)
		initialise_paca(paca + i, i);
}
/*
 * Release the tail of the paca array that is not needed for the current
 * value of nr_cpu_ids, then let free_lppacas() trim the extra lppacas.
 *
 * If the array cannot shrink, nothing is freed and free_lppacas() is not
 * called.
 */
void __init free_unused_pacas(void)
{
	int needed = PAGE_ALIGN(sizeof(struct paca_struct) * nr_cpu_ids);

	if (needed < paca_size) {
		memblock_free(__pa(paca) + needed, paca_size - needed);

		printk(KERN_DEBUG " Freed %u bytes for unused pacas \n ",
		       paca_size - needed);

		paca_size = needed;

		free_lppacas();
	}
}