2019-05-27 09:55:01 +03:00
// SPDX-License-Identifier: GPL-2.0-or-later
2005-10-26 11:11:18 +04:00
/*
* Common boot and setup code for both 32 - bit and 64 - bit .
* Extracted from arch / powerpc / kernel / setup_64 . c .
*
* Copyright ( C ) 2001 PPC64 Team , IBM Corp
*/
2006-03-28 16:15:54 +04:00
# undef DEBUG
2011-07-23 02:24:23 +04:00
# include <linux/export.h>
2005-10-26 11:11:18 +04:00
# include <linux/string.h>
# include <linux/sched.h>
# include <linux/init.h>
# include <linux/kernel.h>
# include <linux/reboot.h>
# include <linux/delay.h>
# include <linux/initrd.h>
2006-03-14 08:11:50 +03:00
# include <linux/platform_device.h>
2005-10-26 11:11:18 +04:00
# include <linux/seq_file.h>
# include <linux/ioport.h>
# include <linux/console.h>
2006-07-10 15:44:13 +04:00
# include <linux/screen_info.h>
2005-10-26 11:11:18 +04:00
# include <linux/root_dev.h>
# include <linux/notifier.h>
# include <linux/cpu.h>
# include <linux/unistd.h>
# include <linux/serial.h>
# include <linux/serial_8250.h>
2007-10-25 09:27:44 +04:00
# include <linux/percpu.h>
2010-07-12 08:36:09 +04:00
# include <linux/memblock.h>
2009-03-19 06:40:51 +03:00
# include <linux/of_platform.h>
2016-07-05 08:07:51 +03:00
# include <linux/hugetlb.h>
2017-02-10 04:04:56 +03:00
# include <asm/debugfs.h>
2005-10-26 11:11:18 +04:00
# include <asm/io.h>
2010-01-28 16:23:22 +03:00
# include <asm/paca.h>
2005-10-26 11:11:18 +04:00
# include <asm/prom.h>
# include <asm/processor.h>
2005-11-11 13:15:21 +03:00
# include <asm/vdso_datapage.h>
2005-10-26 11:11:18 +04:00
# include <asm/pgtable.h>
# include <asm/smp.h>
# include <asm/elf.h>
# include <asm/machdep.h>
# include <asm/time.h>
# include <asm/cputable.h>
# include <asm/sections.h>
2006-03-28 16:15:54 +04:00
# include <asm/firmware.h>
2005-10-26 11:11:18 +04:00
# include <asm/btext.h>
# include <asm/nvram.h>
# include <asm/setup.h>
# include <asm/rtas.h>
# include <asm/iommu.h>
# include <asm/serial.h>
# include <asm/cache.h>
# include <asm/page.h>
# include <asm/mmu.h>
2005-11-08 14:55:08 +03:00
# include <asm/xmon.h>
2007-10-25 09:27:44 +04:00
# include <asm/cputhreads.h>
2008-10-15 12:25:28 +04:00
# include <mm/mmu_decl.h>
2012-02-16 05:14:45 +04:00
# include <asm/fadump.h>
2016-07-05 08:07:51 +03:00
# include <asm/udbg.h>
# include <asm/hugetlb.h>
# include <asm/livepatch.h>
# include <asm/mmu_context.h>
2016-07-23 12:12:40 +03:00
# include <asm/cpu_has_feature.h>
2019-04-26 19:23:34 +03:00
# include <asm/kasan.h>
2016-07-05 08:07:51 +03:00
# include "setup.h"
2005-10-26 11:11:18 +04:00
# ifdef DEBUG
2005-11-15 07:16:38 +03:00
# include <asm/udbg.h>
2005-10-26 11:11:18 +04:00
# define DBG(fmt...) udbg_printf(fmt)
# else
# define DBG(fmt...)
# endif
2006-03-28 16:15:54 +04:00
/* The main machine-dep calls structure
*/
struct machdep_calls ppc_md ;
EXPORT_SYMBOL ( ppc_md ) ;
struct machdep_calls * machine_id ;
EXPORT_SYMBOL ( machine_id ) ;
2005-11-10 05:37:51 +03:00
2014-03-28 06:36:27 +04:00
int boot_cpuid = - 1 ;
EXPORT_SYMBOL_GPL ( boot_cpuid ) ;
2017-01-09 02:31:43 +03:00
/*
* These are used in binfmt_elf . c to put aux entries on the stack
* for each elf executable being started .
*/
int dcache_bsize ;
int icache_bsize ;
int ucache_bsize ;
2005-11-10 07:53:40 +03:00
unsigned long klimit = ( unsigned long ) _end ;
2005-10-26 11:11:18 +04:00
/*
* This still seems to be needed . . . - - paulus
*/
struct screen_info screen_info = {
. orig_x = 0 ,
. orig_y = 25 ,
. orig_video_cols = 80 ,
. orig_video_lines = 25 ,
. orig_video_isVGA = 1 ,
. orig_video_points = 16
} ;
2014-08-20 02:00:02 +04:00
# if defined(CONFIG_FB_VGA16_MODULE)
EXPORT_SYMBOL ( screen_info ) ;
# endif
2005-10-26 11:11:18 +04:00
2010-05-25 02:09:16 +04:00
/* Variables required to store legacy IO irq routing */
int of_i8042_kbd_irq ;
2010-08-07 06:49:20 +04:00
EXPORT_SYMBOL_GPL ( of_i8042_kbd_irq ) ;
2010-05-25 02:09:16 +04:00
int of_i8042_aux_irq ;
2010-08-07 06:49:20 +04:00
EXPORT_SYMBOL_GPL ( of_i8042_aux_irq ) ;
2010-05-25 02:09:16 +04:00
2005-10-26 11:11:18 +04:00
# ifdef __DO_IRQ_CANON
/* XXX should go elsewhere eventually */
int ppc_do_canonicalize_irqs ;
EXPORT_SYMBOL ( ppc_do_canonicalize_irqs ) ;
# endif
2017-05-09 01:56:24 +03:00
# ifdef CONFIG_CRASH_CORE
/* This keeps a track of which one is the crashing cpu. */
int crashing_cpu = - 1 ;
# endif
2005-10-26 11:11:18 +04:00
/* also used by kexec */
void machine_shutdown ( void )
{
2012-02-16 05:15:15 +04:00
/*
* if fadump is active , cleanup the fadump registration before we
* shutdown .
*/
fadump_cleanup ( ) ;
[PATCH] powerpc: Merge kexec
This patch merges, to some extent, the PPC32 and PPC64 kexec implementations.
We adopt the PPC32 approach of having ppc_md callbacks for the kexec functions.
The current PPC64 implementation becomes the "default" implementation for PPC64
which platforms can select if they need no special treatment.
I've added these default callbacks to pseries/maple/cell/powermac, this means
iSeries no longer supports kexec - but it never worked anyway.
I've renamed PPC32's machine_kexec_simple to default_machine_kexec, inline with
PPC64. Judging by the comments it might be better named machine_kexec_non_of,
or something, but at the moment it's the only implementation for PPC32 so it's
the "default".
Kexec requires machine_shutdown(), which is in machine_kexec.c on PPC32, but we
already have in setup-common.c on powerpc. All this does is call
ppc_md.nvram_sync, which only powermac implements, so instead make
machine_shutdown a ppc_md member and have it call core99_nvram_sync directly
on powermac.
I've also stuck relocate_kernel.S into misc_32.S for powerpc.
Built for ARCH=ppc, and 32 & 64 bit ARCH=powerpc, with KEXEC=y/n. Booted on
P5 LPAR and successfully kexec'ed.
Should apply on top of 493f25ef4087395891c99fcfe2c72e62e293e89f.
Signed-off-by: Michael Ellerman <michael@ellerman.id.au>
Signed-off-by: Paul Mackerras <paulus@samba.org>
2005-11-14 15:35:00 +03:00
if ( ppc_md . machine_shutdown )
ppc_md . machine_shutdown ( ) ;
2005-10-26 11:11:18 +04:00
}
2016-07-29 02:07:16 +03:00
static void machine_hang ( void )
{
pr_emerg ( " System Halted, OK to turn off power \n " ) ;
local_irq_disable ( ) ;
while ( 1 )
;
}
2005-10-26 11:11:18 +04:00
void machine_restart ( char * cmd )
{
machine_shutdown ( ) ;
2006-01-13 19:15:17 +03:00
if ( ppc_md . restart )
ppc_md . restart ( cmd ) ;
2016-07-29 02:07:16 +03:00
2005-10-26 11:11:18 +04:00
smp_send_stop ( ) ;
2016-07-29 02:07:17 +03:00
do_kernel_restart ( cmd ) ;
mdelay ( 1000 ) ;
2016-07-29 02:07:16 +03:00
machine_hang ( ) ;
2005-10-26 11:11:18 +04:00
}
void machine_power_off ( void )
{
machine_shutdown ( ) ;
2014-10-13 18:01:09 +04:00
if ( pm_power_off )
pm_power_off ( ) ;
2016-07-29 02:07:16 +03:00
2005-10-26 11:11:18 +04:00
smp_send_stop ( ) ;
2016-07-29 02:07:16 +03:00
machine_hang ( ) ;
2005-10-26 11:11:18 +04:00
}
/* Used by the G5 thermal driver */
EXPORT_SYMBOL_GPL ( machine_power_off ) ;
2014-10-13 18:01:09 +04:00
void ( * pm_power_off ) ( void ) ;
2005-10-26 11:11:18 +04:00
EXPORT_SYMBOL_GPL ( pm_power_off ) ;
void machine_halt ( void )
{
machine_shutdown ( ) ;
2006-01-13 19:15:17 +03:00
if ( ppc_md . halt )
ppc_md . halt ( ) ;
2016-07-29 02:07:16 +03:00
2005-10-26 11:11:18 +04:00
smp_send_stop ( ) ;
2016-07-29 02:07:16 +03:00
machine_hang ( ) ;
2005-10-26 11:11:18 +04:00
}
# ifdef CONFIG_SMP
2009-10-29 16:34:14 +03:00
DEFINE_PER_CPU ( unsigned int , cpu_pvr ) ;
2005-10-26 11:11:18 +04:00
# endif
2010-04-26 19:32:39 +04:00
static void show_cpuinfo_summary ( struct seq_file * m )
{
struct device_node * root ;
const char * model = NULL ;
unsigned long bogosum = 0 ;
int i ;
2019-03-22 11:08:45 +03:00
if ( IS_ENABLED ( CONFIG_SMP ) & & IS_ENABLED ( CONFIG_PPC32 ) ) {
for_each_online_cpu ( i )
bogosum + = loops_per_jiffy ;
seq_printf ( m , " total bogomips \t : %lu.%02lu \n " ,
bogosum / ( 500000 / HZ ) , bogosum / ( 5000 / HZ ) % 100 ) ;
}
2010-04-26 19:32:39 +04:00
seq_printf ( m , " timebase \t : %lu \n " , ppc_tb_freq ) ;
if ( ppc_md . name )
seq_printf ( m , " platform \t : %s \n " , ppc_md . name ) ;
root = of_find_node_by_path ( " / " ) ;
if ( root )
model = of_get_property ( root , " model " , NULL ) ;
if ( model )
seq_printf ( m , " model \t \t : %s \n " , model ) ;
of_node_put ( root ) ;
if ( ppc_md . show_cpuinfo ! = NULL )
ppc_md . show_cpuinfo ( m ) ;
/* Display the amount of memory */
2019-03-22 11:08:45 +03:00
if ( IS_ENABLED ( CONFIG_PPC32 ) )
seq_printf ( m , " Memory \t \t : %d MB \n " ,
( unsigned int ) ( total_memory / ( 1024 * 1024 ) ) ) ;
2010-04-26 19:32:39 +04:00
}
2005-10-26 11:11:18 +04:00
static int show_cpuinfo ( struct seq_file * m , void * v )
{
unsigned long cpu_id = ( unsigned long ) v - 1 ;
unsigned int pvr ;
2014-03-11 15:31:18 +04:00
unsigned long proc_freq ;
2005-10-26 11:11:18 +04:00
unsigned short maj ;
unsigned short min ;
# ifdef CONFIG_SMP
2009-10-29 16:34:14 +03:00
pvr = per_cpu ( cpu_pvr , cpu_id ) ;
2005-10-26 11:11:18 +04:00
# else
pvr = mfspr ( SPRN_PVR ) ;
# endif
maj = ( pvr > > 8 ) & 0xFF ;
min = pvr & 0xFF ;
seq_printf ( m , " processor \t : %lu \n " , cpu_id ) ;
seq_printf ( m , " cpu \t \t : " ) ;
2017-05-09 06:17:08 +03:00
if ( cur_cpu_spec - > pvr_mask & & cur_cpu_spec - > cpu_name )
2005-10-26 11:11:18 +04:00
seq_printf ( m , " %s " , cur_cpu_spec - > cpu_name ) ;
else
seq_printf ( m , " unknown (%08x) " , pvr ) ;
if ( cpu_has_feature ( CPU_FTR_ALTIVEC ) )
seq_printf ( m , " , altivec supported " ) ;
seq_printf ( m , " \n " ) ;
# ifdef CONFIG_TAU
2019-03-22 11:08:44 +03:00
if ( cpu_has_feature ( CPU_FTR_TAU ) ) {
if ( IS_ENABLED ( CONFIG_TAU_AVERAGE ) ) {
/* more straightforward, but potentially misleading */
seq_printf ( m , " temperature \t : %u C (uncalibrated) \n " ,
cpu_temp ( cpu_id ) ) ;
} else {
/* show the actual temp sensor range */
u32 temp ;
temp = cpu_temp_both ( cpu_id ) ;
seq_printf ( m , " temperature \t : %u-%u C (uncalibrated) \n " ,
temp & 0xff , temp > > 16 ) ;
}
2005-10-26 11:11:18 +04:00
}
# endif /* CONFIG_TAU */
/*
2014-03-11 15:31:18 +04:00
* Platforms that have variable clock rates , should implement
* the method ppc_md . get_proc_freq ( ) that reports the clock
* rate of a given cpu . The rest can use ppc_proc_freq to
* report the clock rate that is same across all cpus .
2005-10-26 11:11:18 +04:00
*/
2014-03-11 15:31:18 +04:00
if ( ppc_md . get_proc_freq )
proc_freq = ppc_md . get_proc_freq ( cpu_id ) ;
else
proc_freq = ppc_proc_freq ;
if ( proc_freq )
2005-10-26 11:11:18 +04:00
seq_printf ( m , " clock \t \t : %lu.%06luMHz \n " ,
2014-03-11 15:31:18 +04:00
proc_freq / 1000000 , proc_freq % 1000000 ) ;
2005-10-26 11:11:18 +04:00
if ( ppc_md . show_percpuinfo ! = NULL )
ppc_md . show_percpuinfo ( m , cpu_id ) ;
/* If we are a Freescale core do a simple check so
* we dont have to keep adding cases in the future */
if ( PVR_VER ( pvr ) & 0x8000 ) {
2008-09-07 11:51:32 +04:00
switch ( PVR_VER ( pvr ) ) {
case 0x8000 : /* 7441/7450/7451, Voyager */
case 0x8001 : /* 7445/7455, Apollo 6 */
case 0x8002 : /* 7447/7457, Apollo 7 */
case 0x8003 : /* 7447A, Apollo 7 PM */
case 0x8004 : /* 7448, Apollo 8 */
case 0x800c : /* 7410, Nitro */
maj = ( ( pvr > > 8 ) & 0xF ) ;
min = PVR_MIN ( pvr ) ;
break ;
default : /* e500/book-e */
maj = PVR_MAJ ( pvr ) ;
min = PVR_MIN ( pvr ) ;
break ;
}
2005-10-26 11:11:18 +04:00
} else {
switch ( PVR_VER ( pvr ) ) {
case 0x0020 : /* 403 family */
maj = PVR_MAJ ( pvr ) + 1 ;
min = PVR_MIN ( pvr ) ;
break ;
case 0x1008 : /* 740P/750P ?? */
maj = ( ( pvr > > 8 ) & 0xFF ) - 1 ;
min = pvr & 0xFF ;
break ;
2017-06-15 04:53:16 +03:00
case 0x004e : /* POWER9 bits 12-15 give chip type */
maj = ( pvr > > 8 ) & 0x0F ;
min = pvr & 0xFF ;
break ;
2005-10-26 11:11:18 +04:00
default :
maj = ( pvr > > 8 ) & 0xFF ;
min = pvr & 0xFF ;
break ;
}
}
seq_printf ( m , " revision \t : %hd.%hd (pvr %04x %04x) \n " ,
maj , min , PVR_VER ( pvr ) , PVR_REV ( pvr ) ) ;
2019-03-22 11:08:45 +03:00
if ( IS_ENABLED ( CONFIG_PPC32 ) )
seq_printf ( m , " bogomips \t : %lu.%02lu \n " , loops_per_jiffy / ( 500000 / HZ ) ,
( loops_per_jiffy / ( 5000 / HZ ) ) % 100 ) ;
2005-10-26 11:11:18 +04:00
seq_printf ( m , " \n " ) ;
2010-04-26 19:32:40 +04:00
/* If this is the last cpu, print the summary */
if ( cpumask_next ( cpu_id , cpu_online_mask ) > = nr_cpu_ids )
show_cpuinfo_summary ( m ) ;
2005-10-26 11:11:18 +04:00
return 0 ;
}
static void * c_start ( struct seq_file * m , loff_t * pos )
{
2010-04-26 19:32:40 +04:00
if ( * pos = = 0 ) /* just in case, cpu 0 is not the first */
* pos = cpumask_first ( cpu_online_mask ) ;
else
* pos = cpumask_next ( * pos - 1 , cpu_online_mask ) ;
if ( ( * pos ) < nr_cpu_ids )
return ( void * ) ( unsigned long ) ( * pos + 1 ) ;
return NULL ;
2005-10-26 11:11:18 +04:00
}
static void * c_next ( struct seq_file * m , void * v , loff_t * pos )
{
2010-04-26 19:32:40 +04:00
( * pos ) + + ;
2005-10-26 11:11:18 +04:00
return c_start ( m , pos ) ;
}
static void c_stop ( struct seq_file * m , void * v )
{
}
2009-09-23 03:43:43 +04:00
const struct seq_operations cpuinfo_op = {
2018-01-10 09:10:14 +03:00
. start = c_start ,
. next = c_next ,
. stop = c_stop ,
. show = show_cpuinfo ,
2005-10-26 11:11:18 +04:00
} ;
2005-11-03 01:34:20 +03:00
void __init check_for_initrd ( void )
{
# ifdef CONFIG_BLK_DEV_INITRD
2007-02-28 06:12:29 +03:00
DBG ( " -> check_for_initrd() initrd_start=0x%lx initrd_end=0x%lx \n " ,
initrd_start , initrd_end ) ;
2005-11-03 01:34:20 +03:00
/* If we were passed an initrd, set the ROOT_DEV properly if the values
* look sensible . If not , clear initrd reference .
*/
2005-12-04 10:39:15 +03:00
if ( is_kernel_addr ( initrd_start ) & & is_kernel_addr ( initrd_end ) & &
2005-11-03 01:34:20 +03:00
initrd_end > initrd_start )
ROOT_DEV = Root_RAM0 ;
2005-11-11 11:07:11 +03:00
else
2005-11-03 01:34:20 +03:00
initrd_start = initrd_end = 0 ;
if ( initrd_start )
2014-09-17 08:39:39 +04:00
pr_info ( " Found initrd at 0x%lx:0x%lx \n " , initrd_start , initrd_end ) ;
2005-11-03 01:34:20 +03:00
DBG ( " <- check_for_initrd() \n " ) ;
# endif /* CONFIG_BLK_DEV_INITRD */
}
2005-11-05 02:33:55 +03:00
# ifdef CONFIG_SMP
powerpc/64s: Reimplement book3s idle code in C
Reimplement Book3S idle code in C, moving POWER7/8/9 implementation
speific HV idle code to the powernv platform code.
Book3S assembly stubs are kept in common code and used only to save
the stack frame and non-volatile GPRs before executing architected
idle instructions, and restoring the stack and reloading GPRs then
returning to C after waking from idle.
The complex logic dealing with threads and subcores, locking, SPRs,
HMIs, timebase resync, etc., is all done in C which makes it more
maintainable.
This is not a strict translation to C code, there are some
significant differences:
- Idle wakeup no longer uses the ->cpu_restore call to reinit SPRs,
but saves and restores them itself.
- The optimisation where EC=ESL=0 idle modes did not have to save GPRs
or change MSR is restored, because it's now simple to do. ESL=1
sleeps that do not lose GPRs can use this optimization too.
- KVM secondary entry and cede is now more of a call/return style
rather than branchy. nap_state_lost is not required because KVM
always returns via NVGPR restoring path.
- KVM secondary wakeup from offline sequence is moved entirely into
the offline wakeup, which avoids a hwsync in the normal idle wakeup
path.
Performance measured with context switch ping-pong on different
threads or cores, is possibly improved a small amount, 1-3% depending
on stop state and core vs thread test for shallow states. Deep states
it's in the noise compared with other latencies.
KVM improvements:
- Idle sleepers now always return to caller rather than branch out
to KVM first.
- This allows optimisations like very fast return to caller when no
state has been lost.
- KVM no longer requires nap_state_lost because it controls NVGPR
save/restore itself on the way in and out.
- The heavy idle wakeup KVM request check can be moved out of the
normal host idle code and into the not-performance-critical offline
code.
- KVM nap code now returns from where it is called, which makes the
flow a bit easier to follow.
Reviewed-by: Gautham R. Shenoy <ego@linux.vnet.ibm.com>
Signed-off-by: Nicholas Piggin <npiggin@gmail.com>
[mpe: Squash the KVM changes in]
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
2019-04-12 17:30:52 +03:00
int threads_per_core , threads_per_subcore , threads_shift __read_mostly ;
cpumask_t threads_core_mask __read_mostly ;
KVM: PPC: Add support for Book3S processors in hypervisor mode
This adds support for KVM running on 64-bit Book 3S processors,
specifically POWER7, in hypervisor mode. Using hypervisor mode means
that the guest can use the processor's supervisor mode. That means
that the guest can execute privileged instructions and access privileged
registers itself without trapping to the host. This gives excellent
performance, but does mean that KVM cannot emulate a processor
architecture other than the one that the hardware implements.
This code assumes that the guest is running paravirtualized using the
PAPR (Power Architecture Platform Requirements) interface, which is the
interface that IBM's PowerVM hypervisor uses. That means that existing
Linux distributions that run on IBM pSeries machines will also run
under KVM without modification. In order to communicate the PAPR
hypercalls to qemu, this adds a new KVM_EXIT_PAPR_HCALL exit code
to include/linux/kvm.h.
Currently the choice between book3s_hv support and book3s_pr support
(i.e. the existing code, which runs the guest in user mode) has to be
made at kernel configuration time, so a given kernel binary can only
do one or the other.
This new book3s_hv code doesn't support MMIO emulation at present.
Since we are running paravirtualized guests, this isn't a serious
restriction.
With the guest running in supervisor mode, most exceptions go straight
to the guest. We will never get data or instruction storage or segment
interrupts, alignment interrupts, decrementer interrupts, program
interrupts, single-step interrupts, etc., coming to the hypervisor from
the guest. Therefore this introduces a new KVMTEST_NONHV macro for the
exception entry path so that we don't have to do the KVM test on entry
to those exception handlers.
We do however get hypervisor decrementer, hypervisor data storage,
hypervisor instruction storage, and hypervisor emulation assist
interrupts, so we have to handle those.
In hypervisor mode, real-mode accesses can access all of RAM, not just
a limited amount. Therefore we put all the guest state in the vcpu.arch
and use the shadow_vcpu in the PACA only for temporary scratch space.
We allocate the vcpu with kzalloc rather than vzalloc, and we don't use
anything in the kvmppc_vcpu_book3s struct, so we don't allocate it.
We don't have a shared page with the guest, but we still need a
kvm_vcpu_arch_shared struct to store the values of various registers,
so we include one in the vcpu_arch struct.
The POWER7 processor has a restriction that all threads in a core have
to be in the same partition. MMU-on kernel code counts as a partition
(partition 0), so we have to do a partition switch on every entry to and
exit from the guest. At present we require the host and guest to run
in single-thread mode because of this hardware restriction.
This code allocates a hashed page table for the guest and initializes
it with HPTEs for the guest's Virtual Real Memory Area (VRMA). We
require that the guest memory is allocated using 16MB huge pages, in
order to simplify the low-level memory management. This also means that
we can get away without tracking paging activity in the host for now,
since huge pages can't be paged or swapped.
This also adds a few new exports needed by the book3s_hv code.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2011-06-29 04:21:34 +04:00
EXPORT_SYMBOL_GPL ( threads_per_core ) ;
2014-05-23 12:15:27 +04:00
EXPORT_SYMBOL_GPL ( threads_per_subcore ) ;
KVM: PPC: Add support for Book3S processors in hypervisor mode
This adds support for KVM running on 64-bit Book 3S processors,
specifically POWER7, in hypervisor mode. Using hypervisor mode means
that the guest can use the processor's supervisor mode. That means
that the guest can execute privileged instructions and access privileged
registers itself without trapping to the host. This gives excellent
performance, but does mean that KVM cannot emulate a processor
architecture other than the one that the hardware implements.
This code assumes that the guest is running paravirtualized using the
PAPR (Power Architecture Platform Requirements) interface, which is the
interface that IBM's PowerVM hypervisor uses. That means that existing
Linux distributions that run on IBM pSeries machines will also run
under KVM without modification. In order to communicate the PAPR
hypercalls to qemu, this adds a new KVM_EXIT_PAPR_HCALL exit code
to include/linux/kvm.h.
Currently the choice between book3s_hv support and book3s_pr support
(i.e. the existing code, which runs the guest in user mode) has to be
made at kernel configuration time, so a given kernel binary can only
do one or the other.
This new book3s_hv code doesn't support MMIO emulation at present.
Since we are running paravirtualized guests, this isn't a serious
restriction.
With the guest running in supervisor mode, most exceptions go straight
to the guest. We will never get data or instruction storage or segment
interrupts, alignment interrupts, decrementer interrupts, program
interrupts, single-step interrupts, etc., coming to the hypervisor from
the guest. Therefore this introduces a new KVMTEST_NONHV macro for the
exception entry path so that we don't have to do the KVM test on entry
to those exception handlers.
We do however get hypervisor decrementer, hypervisor data storage,
hypervisor instruction storage, and hypervisor emulation assist
interrupts, so we have to handle those.
In hypervisor mode, real-mode accesses can access all of RAM, not just
a limited amount. Therefore we put all the guest state in the vcpu.arch
and use the shadow_vcpu in the PACA only for temporary scratch space.
We allocate the vcpu with kzalloc rather than vzalloc, and we don't use
anything in the kvmppc_vcpu_book3s struct, so we don't allocate it.
We don't have a shared page with the guest, but we still need a
kvm_vcpu_arch_shared struct to store the values of various registers,
so we include one in the vcpu_arch struct.
The POWER7 processor has a restriction that all threads in a core have
to be in the same partition. MMU-on kernel code counts as a partition
(partition 0), so we have to do a partition switch on every entry to and
exit from the guest. At present we require the host and guest to run
in single-thread mode because of this hardware restriction.
This code allocates a hashed page table for the guest and initializes
it with HPTEs for the guest's Virtual Real Memory Area (VRMA). We
require that the guest memory is allocated using 16MB huge pages, in
order to simplify the low-level memory management. This also means that
we can get away without tracking paging activity in the host for now,
since huge pages can't be paged or swapped.
This also adds a few new exports needed by the book3s_hv code.
Signed-off-by: Paul Mackerras <paulus@samba.org>
Signed-off-by: Alexander Graf <agraf@suse.de>
2011-06-29 04:21:34 +04:00
EXPORT_SYMBOL_GPL ( threads_shift ) ;
EXPORT_SYMBOL_GPL ( threads_core_mask ) ;
2007-10-25 09:27:44 +04:00
static void __init cpu_init_thread_core_maps ( int tpc )
{
int i ;
threads_per_core = tpc ;
2014-05-23 12:15:27 +04:00
threads_per_subcore = tpc ;
2011-04-28 09:07:23 +04:00
cpumask_clear ( & threads_core_mask ) ;
2007-10-25 09:27:44 +04:00
/* This implementation only supports power of 2 number of threads
* for simplicity and performance
*/
threads_shift = ilog2 ( tpc ) ;
BUG_ON ( tpc ! = ( 1 < < threads_shift ) ) ;
for ( i = 0 ; i < tpc ; i + + )
2011-04-28 09:07:23 +04:00
cpumask_set_cpu ( i , & threads_core_mask ) ;
2007-10-25 09:27:44 +04:00
printk ( KERN_INFO " CPU maps initialized for %d thread%s per core \n " ,
tpc , tpc > 1 ? " s " : " " ) ;
printk ( KERN_DEBUG " (thread shift is %d) \n " , threads_shift ) ;
}
2018-02-13 18:08:18 +03:00
u32 * cpu_to_phys_id = NULL ;
2005-11-05 02:33:55 +03:00
/**
* setup_cpu_maps - initialize the following cpu maps :
2010-04-26 19:32:44 +04:00
* cpu_possible_mask
* cpu_present_mask
2005-11-05 02:33:55 +03:00
*
* Having the possible map set up early allows us to restrict allocations
2011-05-10 23:28:48 +04:00
* of things like irqstacks to nr_cpu_ids rather than NR_CPUS .
2005-11-05 02:33:55 +03:00
*
* We do not initialize the online map here ; cpus set their own bits in
2010-04-26 19:32:44 +04:00
* cpu_online_mask as they come up .
2005-11-05 02:33:55 +03:00
*
* This function is valid only for Open Firmware systems . finish_device_tree
* must be called before using this .
*
* While we ' re here , we may as well set the " physical " cpu ids in the paca .
2006-03-25 09:25:17 +03:00
*
* NOTE : This must match the parsing done in early_init_dt_scan_cpus .
2005-11-05 02:33:55 +03:00
*/
void __init smp_setup_cpu_maps ( void )
{
2017-02-01 04:54:38 +03:00
struct device_node * dn ;
2005-11-05 02:33:55 +03:00
int cpu = 0 ;
2007-10-25 09:27:44 +04:00
int nthreads = 1 ;
DBG ( " smp_setup_cpu_maps() \n " ) ;
2005-11-05 02:33:55 +03:00
2019-03-08 03:31:06 +03:00
cpu_to_phys_id = memblock_alloc ( nr_cpu_ids * sizeof ( u32 ) ,
__alignof__ ( u32 ) ) ;
2019-03-12 09:30:31 +03:00
if ( ! cpu_to_phys_id )
panic ( " %s: Failed to allocate %zu bytes align=0x%zx \n " ,
__func__ , nr_cpu_ids * sizeof ( u32 ) , __alignof__ ( u32 ) ) ;
2018-02-13 18:08:18 +03:00
2017-02-01 04:54:38 +03:00
for_each_node_by_type ( dn , " cpu " ) {
2013-08-06 20:01:32 +04:00
const __be32 * intserv ;
2013-08-06 20:01:33 +04:00
__be32 cpu_be ;
2007-10-25 09:27:44 +04:00
int j , len ;
2017-08-21 18:16:47 +03:00
DBG ( " * %pOF... \n " , dn ) ;
2005-11-05 02:33:55 +03:00
2007-04-03 16:26:41 +04:00
intserv = of_get_property ( dn , " ibm,ppc-interrupt-server#s " ,
& len ) ;
2007-10-25 09:27:44 +04:00
if ( intserv ) {
DBG ( " ibm,ppc-interrupt-server#s -> %d threads \n " ,
nthreads ) ;
} else {
DBG ( " no ibm,ppc-interrupt-server#s -> 1 thread \n " ) ;
2011-12-08 11:20:27 +04:00
intserv = of_get_property ( dn , " reg " , & len ) ;
2013-08-06 20:01:33 +04:00
if ( ! intserv ) {
cpu_be = cpu_to_be32 ( cpu ) ;
2018-02-13 18:08:18 +03:00
/* XXX: what is this? uninitialized?? */
2013-08-06 20:01:33 +04:00
intserv = & cpu_be ; /* assume logical == phys */
2011-12-08 11:20:27 +04:00
len = 4 ;
2013-08-06 20:01:33 +04:00
}
2005-11-05 02:33:55 +03:00
}
2011-12-08 11:20:27 +04:00
nthreads = len / sizeof ( int ) ;
2011-05-10 23:28:48 +04:00
for ( j = 0 ; j < nthreads & & cpu < nr_cpu_ids ; j + + ) {
2014-06-25 05:15:51 +04:00
bool avail ;
2007-10-25 09:27:44 +04:00
DBG ( " thread %d -> cpu %d (hard id %d) \n " ,
2013-08-06 20:01:32 +04:00
j , cpu , be32_to_cpu ( intserv [ j ] ) ) ;
2014-06-25 05:15:51 +04:00
avail = of_device_is_available ( dn ) ;
if ( ! avail )
avail = ! of_property_match_string ( dn ,
" enable-method " , " spin-table " ) ;
set_cpu_present ( cpu , avail ) ;
2009-09-24 19:34:48 +04:00
set_cpu_possible ( cpu , true ) ;
2018-02-13 18:08:18 +03:00
cpu_to_phys_id [ cpu ] = be32_to_cpu ( intserv [ j ] ) ;
2005-11-05 02:33:55 +03:00
cpu + + ;
}
2017-02-01 04:54:38 +03:00
if ( cpu > = nr_cpu_ids ) {
of_node_put ( dn ) ;
break ;
}
2005-11-05 02:33:55 +03:00
}
2007-10-25 09:27:44 +04:00
/* If no SMT supported, nthreads is forced to 1 */
if ( ! cpu_has_feature ( CPU_FTR_SMT ) ) {
DBG ( " SMT disabled ! nthreads forced to 1 \n " ) ;
nthreads = 1 ;
}
2005-11-05 02:33:55 +03:00
# ifdef CONFIG_PPC64
/*
* On pSeries LPAR , we need to know how many cpus
* could possibly be added to this partition .
*/
2016-07-05 08:03:55 +03:00
if ( firmware_has_feature ( FW_FEATURE_LPAR ) & &
2005-11-10 05:37:51 +03:00
( dn = of_find_node_by_path ( " /rtas " ) ) ) {
2005-11-05 02:33:55 +03:00
int num_addr_cell , num_size_cell , maxcpus ;
2013-12-12 08:59:35 +04:00
const __be32 * ireg ;
2005-11-05 02:33:55 +03:00
2007-04-03 04:56:50 +04:00
num_addr_cell = of_n_addr_cells ( dn ) ;
2007-04-03 04:57:48 +04:00
num_size_cell = of_n_size_cells ( dn ) ;
2005-11-05 02:33:55 +03:00
2007-04-03 16:26:41 +04:00
ireg = of_get_property ( dn , " ibm,lrdr-capacity " , NULL ) ;
2005-11-05 02:33:55 +03:00
if ( ! ireg )
goto out ;
2013-12-12 08:59:35 +04:00
maxcpus = be32_to_cpup ( ireg + num_addr_cell + num_size_cell ) ;
2005-11-05 02:33:55 +03:00
/* Double maxcpus for processors which have SMT capability */
if ( cpu_has_feature ( CPU_FTR_SMT ) )
2007-10-25 09:27:44 +04:00
maxcpus * = nthreads ;
2005-11-05 02:33:55 +03:00
2011-05-10 23:28:48 +04:00
if ( maxcpus > nr_cpu_ids ) {
2005-11-05 02:33:55 +03:00
printk ( KERN_WARNING
" Partition configured for %d cpus, "
2017-09-09 02:14:18 +03:00
" operating system maximum is %u. \n " ,
2011-05-10 23:28:48 +04:00
maxcpus , nr_cpu_ids ) ;
maxcpus = nr_cpu_ids ;
2005-11-05 02:33:55 +03:00
} else
printk ( KERN_INFO " Partition configured for %d cpus. \n " ,
maxcpus ) ;
for ( cpu = 0 ; cpu < maxcpus ; cpu + + )
2009-09-24 19:34:48 +04:00
set_cpu_possible ( cpu , true ) ;
2005-11-05 02:33:55 +03:00
out :
of_node_put ( dn ) ;
}
2007-10-16 12:24:05 +04:00
vdso_data - > processorCount = num_present_cpus ( ) ;
# endif /* CONFIG_PPC64 */
2007-10-25 09:27:44 +04:00
/* Initialize CPU <=> thread mapping/
*
* WARNING : We assume that the number of threads is the same for
* every CPU in the system . If that is not the case , then some code
* here will have to be reworked
*/
cpu_init_thread_core_maps ( nthreads ) ;
2010-01-28 16:23:22 +03:00
2011-03-31 23:33:02 +04:00
/* Now that possible cpus are set, set nr_cpu_ids for later use */
2011-05-10 23:28:55 +04:00
setup_nr_cpu_ids ( ) ;
2011-03-31 23:33:02 +04:00
2010-01-28 16:23:22 +03:00
free_unused_pacas ( ) ;
2007-10-16 12:24:05 +04:00
}
2005-11-05 02:33:55 +03:00
# endif /* CONFIG_SMP */
2005-11-08 14:55:08 +03:00
2008-05-23 02:40:16 +04:00
# ifdef CONFIG_PCSPKR_PLATFORM
2006-03-14 08:11:50 +03:00
static __init int add_pcspkr ( void )
{
struct device_node * np ;
struct platform_device * pd ;
int ret ;
np = of_find_compatible_node ( NULL , NULL , " pnpPNP,100 " ) ;
of_node_put ( np ) ;
if ( ! np )
return - ENODEV ;
pd = platform_device_alloc ( " pcspkr " , - 1 ) ;
if ( ! pd )
return - ENOMEM ;
ret = platform_device_add ( pd ) ;
if ( ret )
platform_device_put ( pd ) ;
return ret ;
}
device_initcall ( add_pcspkr ) ;
2008-05-23 02:40:16 +04:00
# endif /* CONFIG_PCSPKR_PLATFORM */
2006-04-02 09:08:05 +04:00
2006-03-28 16:15:54 +04:00
void probe_machine ( void )
{
extern struct machdep_calls __machine_desc_start ;
extern struct machdep_calls __machine_desc_end ;
2016-07-05 08:03:59 +03:00
unsigned int i ;
2006-03-28 16:15:54 +04:00
/*
* Iterate all ppc_md structures until we find the proper
* one for the current machine type
*/
DBG ( " Probing machine type ... \n " ) ;
2016-07-05 08:03:59 +03:00
/*
* Check ppc_md is empty , if not we have a bug , ie , we setup an
* entry before probe_machine ( ) which will be overwritten
*/
for ( i = 0 ; i < ( sizeof ( ppc_md ) / sizeof ( void * ) ) ; i + + ) {
if ( ( ( void * * ) & ppc_md ) [ i ] ) {
printk ( KERN_ERR " Entry %d in ppc_md non empty before "
" machine probe ! \n " , i ) ;
}
}
2006-03-28 16:15:54 +04:00
for ( machine_id = & __machine_desc_start ;
machine_id < & __machine_desc_end ;
machine_id + + ) {
DBG ( " %s ... " , machine_id - > name ) ;
memcpy ( & ppc_md , machine_id , sizeof ( struct machdep_calls ) ) ;
if ( ppc_md . probe ( ) ) {
DBG ( " match ! \n " ) ;
break ;
}
DBG ( " \n " ) ;
}
/* What can we do if we didn't find ? */
if ( machine_id > = & __machine_desc_end ) {
2018-12-18 09:53:41 +03:00
pr_err ( " No suitable machine description found ! \n " ) ;
2006-03-28 16:15:54 +04:00
for ( ; ; ) ;
}
printk ( KERN_INFO " Using %s machine description \n " , ppc_md . name ) ;
}
2006-04-25 02:22:17 +04:00
2007-04-26 00:36:56 +04:00
/* Match a class of boards, not a specific device configuration. */
2006-04-25 02:22:17 +04:00
int check_legacy_ioport ( unsigned long base_port )
{
2007-04-26 00:36:56 +04:00
struct device_node * parent , * np = NULL ;
int ret = - ENODEV ;
switch ( base_port ) {
case I8042_DATA_REG :
2007-06-20 04:15:10 +04:00
if ( ! ( np = of_find_compatible_node ( NULL , NULL , " pnpPNP,303 " ) ) )
np = of_find_compatible_node ( NULL , NULL , " pnpPNP,f03 " ) ;
if ( np ) {
parent = of_get_parent ( np ) ;
2010-05-25 02:09:16 +04:00
of_i8042_kbd_irq = irq_of_parse_and_map ( parent , 0 ) ;
if ( ! of_i8042_kbd_irq )
of_i8042_kbd_irq = 1 ;
of_i8042_aux_irq = irq_of_parse_and_map ( parent , 1 ) ;
if ( ! of_i8042_aux_irq )
of_i8042_aux_irq = 12 ;
2007-06-20 04:15:10 +04:00
of_node_put ( np ) ;
np = parent ;
break ;
}
2007-04-26 00:36:56 +04:00
np = of_find_node_by_type ( NULL , " 8042 " ) ;
2007-07-25 05:28:32 +04:00
/* Pegasos has no device_type on its 8042 node, look for the
* name instead */
if ( ! np )
np = of_find_node_by_name ( NULL , " 8042 " ) ;
2011-05-13 05:03:13 +04:00
if ( np ) {
of_i8042_kbd_irq = 1 ;
of_i8042_aux_irq = 12 ;
}
2007-04-26 00:36:56 +04:00
break ;
case FDC_BASE : /* FDC1 */
np = of_find_node_by_type ( NULL , " fdc " ) ;
break ;
default :
/* ipmi is supposed to fail here */
break ;
}
if ( ! np )
return ret ;
parent = of_get_parent ( np ) ;
if ( parent ) {
2018-11-17 01:11:00 +03:00
if ( of_node_is_type ( parent , " isa " ) )
2007-04-26 00:36:56 +04:00
ret = 0 ;
of_node_put ( parent ) ;
}
of_node_put ( np ) ;
return ret ;
2006-04-25 02:22:17 +04:00
}
EXPORT_SYMBOL ( check_legacy_ioport ) ;
2006-05-05 09:02:08 +04:00
2017-12-04 08:27:25 +03:00
static int ppc_panic_event ( struct notifier_block * this ,
unsigned long event , void * ptr )
{
2018-05-19 07:35:54 +03:00
/*
* panic does a local_irq_disable , but we really
* want interrupts to be hard disabled .
*/
hard_irq_disable ( ) ;
2017-12-04 08:27:25 +03:00
/*
* If firmware - assisted dump has been registered then trigger
* firmware - assisted dump and let firmware handle everything else .
*/
crash_fadump ( NULL , ptr ) ;
2018-05-19 07:35:54 +03:00
if ( ppc_md . panic )
ppc_md . panic ( ptr ) ; /* May not return */
2017-12-04 08:27:25 +03:00
return NOTIFY_DONE ;
}
static struct notifier_block ppc_panic_block = {
. notifier_call = ppc_panic_event ,
. priority = INT_MIN /* may not return; must be done last */
} ;
void __init setup_panic ( void )
{
2018-05-19 07:35:54 +03:00
/* PPC64 always does a hard irq disable in its panic handler */
if ( ! IS_ENABLED ( CONFIG_PPC64 ) & & ! ppc_md . panic )
2017-12-04 08:27:25 +03:00
return ;
atomic_notifier_chain_register ( & panic_notifier_list , & ppc_panic_block ) ;
}
2007-05-12 04:57:35 +04:00
# ifdef CONFIG_CHECK_CACHE_COHERENCY
/*
* For platforms that have configurable cache - coherency . This function
* checks that the cache coherency setting of the kernel matches the setting
* left by the firmware , as indicated in the device tree . Since a mismatch
* will eventually result in DMA failures , we print * and error and call
* BUG ( ) in that case .
*/
2019-03-22 11:08:43 +03:00
# define KERNEL_COHERENCY (!IS_ENABLED(CONFIG_NOT_COHERENT_CACHE))
2007-05-12 04:57:35 +04:00
static int __init check_cache_coherency ( void )
{
struct device_node * np ;
const void * prop ;
2019-03-22 11:08:43 +03:00
bool devtree_coherency ;
2007-05-12 04:57:35 +04:00
np = of_find_node_by_path ( " / " ) ;
prop = of_get_property ( np , " coherency-off " , NULL ) ;
of_node_put ( np ) ;
2019-03-22 11:08:43 +03:00
devtree_coherency = prop ? false : true ;
2007-05-12 04:57:35 +04:00
if ( devtree_coherency ! = KERNEL_COHERENCY ) {
printk ( KERN_ERR
" kernel coherency:%s != device tree_coherency:%s \n " ,
KERNEL_COHERENCY ? " on " : " off " ,
devtree_coherency ? " on " : " off " ) ;
BUG ( ) ;
}
return 0 ;
}
late_initcall ( check_cache_coherency ) ;
# endif /* CONFIG_CHECK_CACHE_COHERENCY */
2007-06-20 04:54:19 +04:00
# ifdef CONFIG_DEBUG_FS
struct dentry * powerpc_debugfs_root ;
2009-10-26 21:52:24 +03:00
EXPORT_SYMBOL ( powerpc_debugfs_root ) ;
2007-06-20 04:54:19 +04:00
static int powerpc_debugfs_init ( void )
{
powerpc_debugfs_root = debugfs_create_dir ( " powerpc " , NULL ) ;
return powerpc_debugfs_root = = NULL ;
}
arch_initcall ( powerpc_debugfs_init ) ;
# endif
2009-03-19 06:40:51 +03:00
2011-06-18 11:36:40 +04:00
void ppc_printk_progress ( char * s , unsigned short hex )
2009-03-19 06:40:51 +03:00
{
2011-06-18 11:36:40 +04:00
pr_info ( " %s \n " , s ) ;
2009-03-19 06:40:51 +03:00
}
2011-07-08 09:17:27 +04:00
void arch_setup_pdev_archdata ( struct platform_device * pdev )
2009-03-19 06:40:51 +03:00
{
2011-07-08 09:17:27 +04:00
pdev - > archdata . dma_mask = DMA_BIT_MASK ( 32 ) ;
pdev - > dev . dma_mask = & pdev - > archdata . dma_mask ;
2009-03-19 06:40:51 +03:00
}
2016-07-05 08:07:51 +03:00
static __init void print_system_info ( void )
{
pr_info ( " ----------------------------------------------------- \n " ) ;
pr_info ( " phys_mem_size = 0x%llx \n " ,
( unsigned long long ) memblock_phys_mem_size ( ) ) ;
pr_info ( " dcache_bsize = 0x%x \n " , dcache_bsize ) ;
pr_info ( " icache_bsize = 0x%x \n " , icache_bsize ) ;
if ( ucache_bsize ! = 0 )
pr_info ( " ucache_bsize = 0x%x \n " , ucache_bsize ) ;
pr_info ( " cpu_features = 0x%016lx \n " , cur_cpu_spec - > cpu_features ) ;
pr_info ( " possible = 0x%016lx \n " ,
( unsigned long ) CPU_FTRS_POSSIBLE ) ;
pr_info ( " always = 0x%016lx \n " ,
( unsigned long ) CPU_FTRS_ALWAYS ) ;
pr_info ( " cpu_user_features = 0x%08x 0x%08x \n " ,
cur_cpu_spec - > cpu_user_features ,
cur_cpu_spec - > cpu_user_features2 ) ;
pr_info ( " mmu_features = 0x%08x \n " , cur_cpu_spec - > mmu_features ) ;
# ifdef CONFIG_PPC64
pr_info ( " firmware_features = 0x%016lx \n " , powerpc_firmware_features ) ;
2019-05-16 05:04:37 +03:00
# ifdef CONFIG_PPC_BOOK3S
pr_info ( " vmalloc start = 0x%lx \n " , KERN_VIRT_START ) ;
pr_info ( " IO start = 0x%lx \n " , KERN_IO_START ) ;
pr_info ( " vmemmap start = 0x%lx \n " , ( unsigned long ) vmemmap ) ;
# endif
2016-07-05 08:07:51 +03:00
# endif
2019-05-16 05:04:37 +03:00
if ( ! early_radix_enabled ( ) )
print_system_hash_info ( ) ;
2016-07-05 08:07:51 +03:00
if ( PHYSICAL_START > 0 )
pr_info ( " physical_start = 0x%llx \n " ,
( unsigned long long ) PHYSICAL_START ) ;
pr_info ( " ----------------------------------------------------- \n " ) ;
}
2018-02-13 18:08:19 +03:00
# ifdef CONFIG_SMP
static void smp_setup_pacas ( void )
{
int cpu ;
for_each_possible_cpu ( cpu ) {
if ( cpu = = smp_processor_id ( ) )
continue ;
allocate_paca ( cpu ) ;
set_hard_smp_processor_id ( cpu , cpu_to_phys_id [ cpu ] ) ;
}
memblock_free ( __pa ( cpu_to_phys_id ) , nr_cpu_ids * sizeof ( u32 ) ) ;
cpu_to_phys_id = NULL ;
}
# endif
2016-07-05 08:07:51 +03:00
/*
* Called into from start_kernel this initializes memblock , which is used
* to manage page allocation until mem_init is called .
*/
void __init setup_arch ( char * * cmdline_p )
{
2019-04-26 19:23:34 +03:00
kasan_init ( ) ;
2016-07-05 08:07:51 +03:00
* cmdline_p = boot_command_line ;
/* Set a half-reasonable default so udelay does something sensible */
loops_per_jiffy = 500000000 / HZ ;
/* Unflatten the device-tree passed by prom_init or kexec */
unflatten_device_tree ( ) ;
/*
* Initialize cache line / block info from device - tree ( on ppc64 ) or
* just cputable ( on ppc32 ) .
*/
initialize_cache_info ( ) ;
/* Initialize RTAS if available. */
rtas_initialize ( ) ;
/* Check if we have an initrd provided via the device-tree. */
check_for_initrd ( ) ;
/* Probe the machine type, establish ppc_md. */
probe_machine ( ) ;
2017-12-04 08:27:25 +03:00
/* Setup panic notifier if requested by the platform. */
setup_panic ( ) ;
2016-07-05 08:07:51 +03:00
/*
* Configure ppc_md . power_save ( ppc32 only , 64 - bit machines do
* it from their respective probe ( ) function .
*/
setup_power_save ( ) ;
/* Discover standard serial ports. */
find_legacy_serial_ports ( ) ;
/* Register early console with the printk subsystem. */
register_early_udbg_console ( ) ;
/* Setup the various CPU maps based on the device-tree. */
smp_setup_cpu_maps ( ) ;
/* Initialize xmon. */
xmon_setup ( ) ;
/* Check the SMT related command line arguments (ppc64). */
check_smt_enabled ( ) ;
2018-02-13 18:08:16 +03:00
/* Parse memory topology */
mem_topology_setup ( ) ;
2016-07-05 08:07:51 +03:00
/*
* Release secondary cpus out of their spinloops at 0x60 now that
* we can map physical - > logical CPU ids .
*
* Freescale Book3e parts spin in a loop provided by firmware ,
* so smp_release_cpus ( ) does nothing for them .
*/
# ifdef CONFIG_SMP
2018-02-13 18:08:19 +03:00
smp_setup_pacas ( ) ;
2018-03-31 12:57:10 +03:00
/* On BookE, setup per-core TLB data structures. */
setup_tlb_core_data ( ) ;
2016-07-05 08:07:51 +03:00
smp_release_cpus ( ) ;
# endif
/* Print various info about the machine that has been gathered so far. */
print_system_info ( ) ;
/* Reserve large chunks of memory for use by CMA for KVM. */
kvm_cma_reserve ( ) ;
2019-01-31 13:08:58 +03:00
klp_init_thread_info ( & init_task ) ;
2016-07-05 08:07:51 +03:00
init_mm . start_code = ( unsigned long ) _stext ;
init_mm . end_code = ( unsigned long ) _etext ;
init_mm . end_data = ( unsigned long ) _edata ;
init_mm . brk = klimit ;
2017-03-22 06:36:58 +03:00
2016-11-30 09:51:59 +03:00
mm_iommu_init ( & init_mm ) ;
2016-07-05 08:07:51 +03:00
irqstack_early_init ( ) ;
exc_lvl_early_init ( ) ;
emergency_stack_init ( ) ;
initmem_init ( ) ;
2018-09-28 18:39:20 +03:00
early_memtest ( min_low_pfn < < PAGE_SHIFT , max_low_pfn < < PAGE_SHIFT ) ;
2019-03-22 11:08:45 +03:00
if ( IS_ENABLED ( CONFIG_DUMMY_CONSOLE ) )
conswitchp = & dummy_con ;
2016-07-05 08:07:51 +03:00
if ( ppc_md . setup_arch )
ppc_md . setup_arch ( ) ;
2018-07-28 02:06:35 +03:00
setup_barrier_nospec ( ) ;
2018-12-12 17:03:08 +03:00
setup_spectre_v2 ( ) ;
2018-07-28 02:06:35 +03:00
2016-07-05 08:07:51 +03:00
paging_init ( ) ;
/* Initialize the MMU context management stuff. */
mmu_context_init ( ) ;
/* Interrupt code needs to be 64K-aligned. */
2019-03-22 11:08:45 +03:00
if ( IS_ENABLED ( CONFIG_PPC64 ) & & ( unsigned long ) _stext & 0xffff )
2016-07-05 08:07:51 +03:00
panic ( " Kernelbase not 64K-aligned (0x%lx)! \n " ,
( unsigned long ) _stext ) ;
}