2006-12-05 09:52:36 +03:00
/*
* pseries CPU Hotplug infrastructure .
*
2006-12-05 09:52:38 +03:00
* Split out from arch / powerpc / platforms / pseries / setup . c
* arch / powerpc / kernel / rtas . c , and arch / powerpc / platforms / pseries / smp . c
2006-12-05 09:52:36 +03:00
*
* Peter Bergner , IBM March 2001.
* Copyright ( C ) 2001 IBM .
2006-12-05 09:52:38 +03:00
* Dave Engebretsen , Peter Bergner , and
* Mike Corrigan { engebret | bergner | mikec } @ us . ibm . com
* Plus various changes from other IBM teams . . .
2006-12-05 09:52:36 +03:00
*
* Copyright ( C ) 2006 Michael Ellerman , IBM Corporation
*
* This program is free software ; you can redistribute it and / or
* modify it under the terms of the GNU General Public License
* as published by the Free Software Foundation ; either version
* 2 of the License , or ( at your option ) any later version .
*/
# include <linux/kernel.h>
# include <linux/delay.h>
# include <linux/cpu.h>
# include <asm/system.h>
# include <asm/prom.h>
# include <asm/rtas.h>
# include <asm/firmware.h>
# include <asm/machdep.h>
# include <asm/vdso_datapage.h>
# include <asm/pSeries_reconfig.h>
# include "xics.h"
2008-01-11 06:02:47 +03:00
# include "plpar_wrappers.h"
2009-10-29 22:22:53 +03:00
# include "offline_states.h"
2006-12-05 09:52:36 +03:00
/* This version can't take the spinlock, because it never returns */
static struct rtas_args rtas_stop_self_args = {
. token = RTAS_UNKNOWN_SERVICE ,
. nargs = 0 ,
. nret = 1 ,
. rets = & rtas_stop_self_args . args [ 0 ] ,
} ;
2009-10-29 22:22:53 +03:00
static DEFINE_PER_CPU ( enum cpu_state_vals , preferred_offline_state ) =
CPU_STATE_OFFLINE ;
static DEFINE_PER_CPU ( enum cpu_state_vals , current_state ) = CPU_STATE_OFFLINE ;
static enum cpu_state_vals default_offline_state = CPU_STATE_OFFLINE ;
static int cede_offline_enabled __read_mostly = 1 ;
/*
* Enable / disable cede_offline when available .
*/
static int __init setup_cede_offline ( char * str )
{
if ( ! strcmp ( str , " off " ) )
cede_offline_enabled = 0 ;
else if ( ! strcmp ( str , " on " ) )
cede_offline_enabled = 1 ;
else
return 0 ;
return 1 ;
}
__setup ( " cede_offline= " , setup_cede_offline ) ;
enum cpu_state_vals get_cpu_current_state ( int cpu )
{
return per_cpu ( current_state , cpu ) ;
}
void set_cpu_current_state ( int cpu , enum cpu_state_vals state )
{
per_cpu ( current_state , cpu ) = state ;
}
enum cpu_state_vals get_preferred_offline_state ( int cpu )
{
return per_cpu ( preferred_offline_state , cpu ) ;
}
void set_preferred_offline_state ( int cpu , enum cpu_state_vals state )
{
per_cpu ( preferred_offline_state , cpu ) = state ;
}
void set_default_offline_state ( int cpu )
{
per_cpu ( preferred_offline_state , cpu ) = default_offline_state ;
}
2006-12-05 09:52:37 +03:00
static void rtas_stop_self ( void )
2006-12-05 09:52:36 +03:00
{
struct rtas_args * args = & rtas_stop_self_args ;
local_irq_disable ( ) ;
BUG_ON ( args - > token = = RTAS_UNKNOWN_SERVICE ) ;
printk ( " cpu %u (hwid %u) Ready to die... \n " ,
smp_processor_id ( ) , hard_smp_processor_id ( ) ) ;
enter_rtas ( __pa ( args ) ) ;
panic ( " Alas, I survived. \n " ) ;
}
2006-12-05 09:52:39 +03:00
static void pseries_mach_cpu_die ( void )
2006-12-05 09:52:37 +03:00
{
2009-10-29 22:22:53 +03:00
unsigned int cpu = smp_processor_id ( ) ;
unsigned int hwcpu = hard_smp_processor_id ( ) ;
u8 cede_latency_hint = 0 ;
2006-12-05 09:52:37 +03:00
local_irq_disable ( ) ;
idle_task_exit ( ) ;
2008-02-06 23:37:31 +03:00
xics_teardown_cpu ( ) ;
2009-10-29 22:22:53 +03:00
if ( get_preferred_offline_state ( cpu ) = = CPU_STATE_INACTIVE ) {
set_cpu_current_state ( cpu , CPU_STATE_INACTIVE ) ;
2010-07-07 16:31:02 +04:00
if ( ppc_md . suspend_disable_cpu )
ppc_md . suspend_disable_cpu ( ) ;
2009-10-29 22:22:53 +03:00
cede_latency_hint = 2 ;
get_lppaca ( ) - > idle = 1 ;
if ( ! get_lppaca ( ) - > shared_proc )
get_lppaca ( ) - > donate_dedicated_cpu = 1 ;
while ( get_preferred_offline_state ( cpu ) = = CPU_STATE_INACTIVE ) {
extended_cede_processor ( cede_latency_hint ) ;
}
if ( ! get_lppaca ( ) - > shared_proc )
get_lppaca ( ) - > donate_dedicated_cpu = 0 ;
get_lppaca ( ) - > idle = 0 ;
2010-03-01 05:58:16 +03:00
if ( get_preferred_offline_state ( cpu ) = = CPU_STATE_ONLINE ) {
unregister_slb_shadow ( hwcpu , __pa ( get_slb_shadow ( ) ) ) ;
2009-10-29 22:22:53 +03:00
2010-03-01 05:58:16 +03:00
/*
* Call to start_secondary_resume ( ) will not return .
* Kernel stack will be reset and start_secondary ( )
* will be called to continue the online operation .
*/
start_secondary_resume ( ) ;
}
}
2009-10-29 22:22:53 +03:00
2010-03-01 05:58:16 +03:00
/* Requested state is CPU_STATE_OFFLINE at this point */
WARN_ON ( get_preferred_offline_state ( cpu ) ! = CPU_STATE_OFFLINE ) ;
2009-10-29 22:22:53 +03:00
2010-03-01 05:58:16 +03:00
set_cpu_current_state ( cpu , CPU_STATE_OFFLINE ) ;
unregister_slb_shadow ( hwcpu , __pa ( get_slb_shadow ( ) ) ) ;
rtas_stop_self ( ) ;
2009-10-29 22:22:53 +03:00
2006-12-05 09:52:37 +03:00
/* Should never get here... */
BUG ( ) ;
for ( ; ; ) ;
}
2006-12-05 09:52:39 +03:00
static int pseries_cpu_disable ( void )
2006-12-05 09:52:38 +03:00
{
int cpu = smp_processor_id ( ) ;
2009-09-24 19:34:48 +04:00
set_cpu_online ( cpu , false ) ;
2006-12-05 09:52:38 +03:00
vdso_data - > processorCount - - ;
/*fix boot_cpuid here*/
if ( cpu = = boot_cpuid )
2010-04-26 19:32:42 +04:00
boot_cpuid = cpumask_any ( cpu_online_mask ) ;
2006-12-05 09:52:38 +03:00
/* FIXME: abstract this to not be platform specific later on */
xics_migrate_irqs_away ( ) ;
return 0 ;
}
2009-10-29 22:22:53 +03:00
/*
* pseries_cpu_die : Wait for the cpu to die .
* @ cpu : logical processor id of the CPU whose death we ' re awaiting .
*
* This function is called from the context of the thread which is performing
* the cpu - offline . Here we wait for long enough to allow the cpu in question
* to self - destroy so that the cpu - offline thread can send the CPU_DEAD
* notifications .
*
* OTOH , pseries_mach_cpu_die ( ) is called by the @ cpu when it wants to
* self - destruct .
*/
2006-12-05 09:52:39 +03:00
static void pseries_cpu_die ( unsigned int cpu )
2006-12-05 09:52:38 +03:00
{
int tries ;
2009-10-29 22:22:53 +03:00
int cpu_status = 1 ;
2006-12-05 09:52:38 +03:00
unsigned int pcpu = get_hard_smp_processor_id ( cpu ) ;
2009-10-29 22:22:53 +03:00
if ( get_preferred_offline_state ( cpu ) = = CPU_STATE_INACTIVE ) {
cpu_status = 1 ;
for ( tries = 0 ; tries < 1000 ; tries + + ) {
if ( get_cpu_current_state ( cpu ) = = CPU_STATE_INACTIVE ) {
cpu_status = 0 ;
break ;
}
cpu_relax ( ) ;
}
} else if ( get_preferred_offline_state ( cpu ) = = CPU_STATE_OFFLINE ) {
for ( tries = 0 ; tries < 25 ; tries + + ) {
2010-04-28 17:39:41 +04:00
cpu_status = smp_query_cpu_stopped ( pcpu ) ;
if ( cpu_status = = QCSS_STOPPED | |
cpu_status = = QCSS_HARDWARE_ERROR )
2009-10-29 22:22:53 +03:00
break ;
cpu_relax ( ) ;
}
2006-12-05 09:52:38 +03:00
}
2009-10-29 22:22:53 +03:00
2006-12-05 09:52:38 +03:00
if ( cpu_status ! = 0 ) {
printk ( " Querying DEAD? cpu %i (%i) shows %i \n " ,
cpu , pcpu , cpu_status ) ;
}
/* Isolation and deallocation are definatly done by
* drslot_chrp_cpu . If they were not they would be
* done here . Change isolate state to Isolate and
* change allocation - state to Unusable .
*/
paca [ cpu ] . cpu_start = 0 ;
}
/*
2010-04-26 19:32:44 +04:00
* Update cpu_present_mask and paca ( s ) for a new cpu node . The wrinkle
2006-12-05 09:52:38 +03:00
* here is that a cpu device node may represent up to two logical cpus
* in the SMT case . We must honor the assumption in other code that
* the logical ids for sibling SMT threads x and y are adjacent , such
* that x ^ 1 = = y and y ^ 1 = = x .
*/
2006-12-05 09:52:39 +03:00
static int pseries_add_processor ( struct device_node * np )
2006-12-05 09:52:38 +03:00
{
unsigned int cpu ;
2010-04-26 19:32:42 +04:00
cpumask_var_t candidate_mask , tmp ;
2006-12-05 09:52:38 +03:00
int err = - ENOSPC , len , nthreads , i ;
const u32 * intserv ;
2007-04-03 16:26:41 +04:00
intserv = of_get_property ( np , " ibm,ppc-interrupt-server#s " , & len ) ;
2006-12-05 09:52:38 +03:00
if ( ! intserv )
return 0 ;
2010-04-26 19:32:42 +04:00
zalloc_cpumask_var ( & candidate_mask , GFP_KERNEL ) ;
zalloc_cpumask_var ( & tmp , GFP_KERNEL ) ;
2006-12-05 09:52:38 +03:00
nthreads = len / sizeof ( u32 ) ;
for ( i = 0 ; i < nthreads ; i + + )
2010-04-26 19:32:42 +04:00
cpumask_set_cpu ( i , tmp ) ;
2006-12-05 09:52:38 +03:00
2008-01-25 23:08:02 +03:00
cpu_maps_update_begin ( ) ;
2006-12-05 09:52:38 +03:00
2010-04-26 19:32:42 +04:00
BUG_ON ( ! cpumask_subset ( cpu_present_mask , cpu_possible_mask ) ) ;
2006-12-05 09:52:38 +03:00
/* Get a bitmap of unoccupied slots. */
2010-04-26 19:32:42 +04:00
cpumask_xor ( candidate_mask , cpu_possible_mask , cpu_present_mask ) ;
if ( cpumask_empty ( candidate_mask ) ) {
2006-12-05 09:52:38 +03:00
/* If we get here, it most likely means that NR_CPUS is
* less than the partition ' s max processors setting .
*/
printk ( KERN_ERR " Cannot add cpu %s; this system configuration "
" supports %d logical cpus. \n " , np - > full_name ,
2010-04-26 19:32:42 +04:00
cpumask_weight ( cpu_possible_mask ) ) ;
2006-12-05 09:52:38 +03:00
goto out_unlock ;
}
2010-04-26 19:32:42 +04:00
while ( ! cpumask_empty ( tmp ) )
if ( cpumask_subset ( tmp , candidate_mask ) )
2006-12-05 09:52:38 +03:00
/* Found a range where we can insert the new cpu(s) */
break ;
else
2010-04-26 19:32:42 +04:00
cpumask_shift_left ( tmp , tmp , nthreads ) ;
2006-12-05 09:52:38 +03:00
2010-04-26 19:32:42 +04:00
if ( cpumask_empty ( tmp ) ) {
2010-04-26 19:32:44 +04:00
printk ( KERN_ERR " Unable to find space in cpu_present_mask for "
2006-12-05 09:52:38 +03:00
" processor %s with %d thread(s) \n " , np - > name ,
nthreads ) ;
goto out_unlock ;
}
2010-04-26 19:32:42 +04:00
for_each_cpu ( cpu , tmp ) {
BUG_ON ( cpumask_test_cpu ( cpu , cpu_present_mask ) ) ;
2009-09-24 19:34:48 +04:00
set_cpu_present ( cpu , true ) ;
2006-12-05 09:52:38 +03:00
set_hard_smp_processor_id ( cpu , * intserv + + ) ;
}
err = 0 ;
out_unlock :
2008-01-25 23:08:02 +03:00
cpu_maps_update_done ( ) ;
2010-04-26 19:32:42 +04:00
free_cpumask_var ( candidate_mask ) ;
free_cpumask_var ( tmp ) ;
2006-12-05 09:52:38 +03:00
return err ;
}
/*
* Update the present map for a cpu node which is going away , and set
* the hard id in the paca ( s ) to - 1 to be consistent with boot time
* convention for non - present cpus .
*/
2006-12-05 09:52:39 +03:00
static void pseries_remove_processor ( struct device_node * np )
2006-12-05 09:52:38 +03:00
{
unsigned int cpu ;
int len , nthreads , i ;
const u32 * intserv ;
2007-04-03 16:26:41 +04:00
intserv = of_get_property ( np , " ibm,ppc-interrupt-server#s " , & len ) ;
2006-12-05 09:52:38 +03:00
if ( ! intserv )
return ;
nthreads = len / sizeof ( u32 ) ;
2008-01-25 23:08:02 +03:00
cpu_maps_update_begin ( ) ;
2006-12-05 09:52:38 +03:00
for ( i = 0 ; i < nthreads ; i + + ) {
for_each_present_cpu ( cpu ) {
if ( get_hard_smp_processor_id ( cpu ) ! = intserv [ i ] )
continue ;
BUG_ON ( cpu_online ( cpu ) ) ;
2009-09-24 19:34:48 +04:00
set_cpu_present ( cpu , false ) ;
2006-12-05 09:52:38 +03:00
set_hard_smp_processor_id ( cpu , - 1 ) ;
break ;
}
2010-04-26 19:32:42 +04:00
if ( cpu > = nr_cpu_ids )
2006-12-05 09:52:38 +03:00
printk ( KERN_WARNING " Could not find cpu to remove "
" with physical id 0x%x \n " , intserv [ i ] ) ;
}
2008-01-25 23:08:02 +03:00
cpu_maps_update_done ( ) ;
2006-12-05 09:52:38 +03:00
}
2006-12-05 09:52:39 +03:00
static int pseries_smp_notifier ( struct notifier_block * nb ,
unsigned long action , void * node )
2006-12-05 09:52:38 +03:00
{
int err = NOTIFY_OK ;
switch ( action ) {
case PSERIES_RECONFIG_ADD :
2006-12-05 09:52:39 +03:00
if ( pseries_add_processor ( node ) )
2006-12-05 09:52:38 +03:00
err = NOTIFY_BAD ;
break ;
case PSERIES_RECONFIG_REMOVE :
2006-12-05 09:52:39 +03:00
pseries_remove_processor ( node ) ;
2006-12-05 09:52:38 +03:00
break ;
default :
err = NOTIFY_DONE ;
break ;
}
return err ;
}
2006-12-05 09:52:39 +03:00
static struct notifier_block pseries_smp_nb = {
. notifier_call = pseries_smp_notifier ,
2006-12-05 09:52:38 +03:00
} ;
2009-10-29 22:22:53 +03:00
# define MAX_CEDE_LATENCY_LEVELS 4
# define CEDE_LATENCY_PARAM_LENGTH 10
# define CEDE_LATENCY_PARAM_MAX_LENGTH \
( MAX_CEDE_LATENCY_LEVELS * CEDE_LATENCY_PARAM_LENGTH * sizeof ( char ) )
# define CEDE_LATENCY_TOKEN 45
static char cede_parameters [ CEDE_LATENCY_PARAM_MAX_LENGTH ] ;
static int parse_cede_parameters ( void )
{
memset ( cede_parameters , 0 , CEDE_LATENCY_PARAM_MAX_LENGTH ) ;
2010-02-07 16:52:05 +03:00
return rtas_call ( rtas_token ( " ibm,get-system-parameter " ) , 3 , 1 ,
NULL ,
CEDE_LATENCY_TOKEN ,
__pa ( cede_parameters ) ,
CEDE_LATENCY_PARAM_MAX_LENGTH ) ;
2009-10-29 22:22:53 +03:00
}
2006-12-05 09:52:36 +03:00
static int __init pseries_cpu_hotplug_init ( void )
{
2007-10-10 04:38:24 +04:00
struct device_node * np ;
const char * typep ;
2009-10-29 22:22:53 +03:00
int cpu ;
2010-04-28 17:39:41 +04:00
int qcss_tok ;
2007-10-10 04:38:24 +04:00
for_each_node_by_name ( np , " interrupt-controller " ) {
typep = of_get_property ( np , " compatible " , NULL ) ;
if ( strstr ( typep , " open-pic " ) ) {
of_node_put ( np ) ;
printk ( KERN_INFO " CPU Hotplug not supported on "
" systems using MPIC \n " ) ;
return 0 ;
}
}
2006-12-05 09:52:36 +03:00
rtas_stop_self_args . token = rtas_token ( " stop-self " ) ;
2006-12-05 09:52:38 +03:00
qcss_tok = rtas_token ( " query-cpu-stopped-state " ) ;
2006-12-05 09:52:36 +03:00
2006-12-05 09:52:38 +03:00
if ( rtas_stop_self_args . token = = RTAS_UNKNOWN_SERVICE | |
qcss_tok = = RTAS_UNKNOWN_SERVICE ) {
printk ( KERN_INFO " CPU Hotplug not supported by firmware "
" - disabling. \n " ) ;
return 0 ;
}
2006-12-05 09:52:37 +03:00
2006-12-05 09:52:39 +03:00
ppc_md . cpu_die = pseries_mach_cpu_die ;
smp_ops - > cpu_disable = pseries_cpu_disable ;
smp_ops - > cpu_die = pseries_cpu_die ;
2006-12-05 09:52:38 +03:00
/* Processors can be added/removed only on LPAR */
2009-10-29 22:22:53 +03:00
if ( firmware_has_feature ( FW_FEATURE_LPAR ) ) {
2006-12-05 09:52:39 +03:00
pSeries_reconfig_notifier_register ( & pseries_smp_nb ) ;
2009-10-29 22:22:53 +03:00
cpu_maps_update_begin ( ) ;
if ( cede_offline_enabled & & parse_cede_parameters ( ) = = 0 ) {
default_offline_state = CPU_STATE_INACTIVE ;
for_each_online_cpu ( cpu )
set_default_offline_state ( cpu ) ;
}
cpu_maps_update_done ( ) ;
}
2006-12-05 09:52:38 +03:00
2006-12-05 09:52:36 +03:00
return 0 ;
}
arch_initcall ( pseries_cpu_hotplug_init ) ;