2008-05-03 18:29:28 +02:00
/*
* sched_clock for unstable cpu clocks
*
* Copyright ( C ) 2008 Red Hat , Inc . , Peter Zijlstra < pzijlstr @ redhat . com >
*
2008-07-09 00:15:33 -04:00
* Updates and enhancements :
* Copyright ( C ) 2008 Red Hat , Inc . Steven Rostedt < srostedt @ redhat . com >
*
2008-05-03 18:29:28 +02:00
* Based on code by :
* Ingo Molnar < mingo @ redhat . com >
* Guillaume Chazarain < guichaz @ gmail . com >
*
* Create a semi stable clock from a mixture of other events , including :
* - gtod
* - sched_clock ( )
* - explicit idle events
*
* We use gtod as base and the unstable clock deltas . The deltas are filtered ,
2008-08-25 17:15:34 +02:00
* making it monotonic and keeping it within an expected window .
2008-05-03 18:29:28 +02:00
*
* Furthermore , explicit sleep and wakeup hooks allow us to account for time
* that is otherwise invisible ( TSC gets stopped ) .
*
* The clock : sched_clock_cpu ( ) is monotonic per cpu , and should be somewhat
2008-08-25 17:15:34 +02:00
* consistent between cpus ( never more than 2 jiffies difference ) .
2008-05-03 18:29:28 +02:00
*/
# include <linux/spinlock.h>
2008-05-12 21:21:14 +02:00
# include <linux/hardirq.h>
2008-05-03 18:29:28 +02:00
# include <linux/module.h>
2009-02-26 20:20:29 +01:00
# include <linux/percpu.h>
# include <linux/ktime.h>
# include <linux/sched.h>
2008-05-03 18:29:28 +02:00
2008-07-25 19:45:00 +01:00
/*
* Scheduler clock - returns current time in nanosec units .
* This is default implementation .
* Architectures and sub - architectures can override this .
*/
unsigned long long __attribute__ ( ( weak ) ) sched_clock ( void )
{
2009-05-08 22:54:49 +09:30
return ( unsigned long long ) ( jiffies - INITIAL_JIFFIES )
* ( NSEC_PER_SEC / HZ ) ;
2008-07-25 19:45:00 +01:00
}
2008-05-03 18:29:28 +02:00
2008-08-11 08:59:03 +02:00
static __read_mostly int sched_clock_running ;
2008-05-03 18:29:28 +02:00
# ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
2009-02-26 20:20:29 +01:00
__read_mostly int sched_clock_stable ;
2008-05-03 18:29:28 +02:00
struct sched_clock_data {
/*
* Raw spinlock - this is a special case : this might be called
* from within instrumentation code so we dont want to do any
* instrumentation ourselves .
*/
raw_spinlock_t lock ;
u64 tick_raw ;
u64 tick_gtod ;
u64 clock ;
} ;
static DEFINE_PER_CPU_SHARED_ALIGNED ( struct sched_clock_data , sched_clock_data ) ;
static inline struct sched_clock_data * this_scd ( void )
{
return & __get_cpu_var ( sched_clock_data ) ;
}
static inline struct sched_clock_data * cpu_sdc ( int cpu )
{
return & per_cpu ( sched_clock_data , cpu ) ;
}
void sched_clock_init ( void )
{
u64 ktime_now = ktime_to_ns ( ktime_get ( ) ) ;
int cpu ;
for_each_possible_cpu ( cpu ) {
struct sched_clock_data * scd = cpu_sdc ( cpu ) ;
scd - > lock = ( raw_spinlock_t ) __RAW_SPIN_LOCK_UNLOCKED ;
2008-05-29 10:07:15 +02:00
scd - > tick_raw = 0 ;
2008-05-03 18:29:28 +02:00
scd - > tick_gtod = ktime_now ;
scd - > clock = ktime_now ;
}
2008-05-29 10:07:15 +02:00
sched_clock_running = 1 ;
2008-05-03 18:29:28 +02:00
}
2008-08-25 17:15:34 +02:00
/*
2009-02-26 20:20:29 +01:00
* min , max except they take wrapping into account
2008-08-25 17:15:34 +02:00
*/
static inline u64 wrap_min ( u64 x , u64 y )
{
return ( s64 ) ( x - y ) < 0 ? x : y ;
}
static inline u64 wrap_max ( u64 x , u64 y )
{
return ( s64 ) ( x - y ) > 0 ? x : y ;
}
2008-05-03 18:29:28 +02:00
/*
* update the percpu scd from the raw @ now value
*
* - filter out backward motion
2008-08-25 17:15:34 +02:00
* - use the GTOD tick value to create a window to filter crazy TSC values
2008-05-03 18:29:28 +02:00
*/
2008-07-30 10:15:55 +02:00
static u64 __update_sched_clock ( struct sched_clock_data * scd , u64 now )
2008-05-03 18:29:28 +02:00
{
2008-07-30 10:13:35 +02:00
s64 delta = now - scd - > tick_raw ;
2008-08-25 17:15:34 +02:00
u64 clock , min_clock , max_clock ;
2008-05-03 18:29:28 +02:00
2008-08-25 17:15:34 +02:00
if ( unlikely ( delta < 0 ) )
delta = 0 ;
2008-05-03 18:29:28 +02:00
2008-08-25 17:15:34 +02:00
/*
* scd - > clock = clamp ( scd - > tick_gtod + delta ,
2009-02-26 20:20:29 +01:00
* max ( scd - > tick_gtod , scd - > clock ) ,
* scd - > tick_gtod + TICK_NSEC ) ;
2008-08-25 17:15:34 +02:00
*/
2008-05-03 18:29:28 +02:00
2008-08-25 17:15:34 +02:00
clock = scd - > tick_gtod + delta ;
min_clock = wrap_max ( scd - > tick_gtod , scd - > clock ) ;
2008-12-22 23:05:28 +01:00
max_clock = wrap_max ( scd - > clock , scd - > tick_gtod + TICK_NSEC ) ;
2008-05-03 18:29:28 +02:00
2008-08-25 17:15:34 +02:00
clock = wrap_max ( clock , min_clock ) ;
clock = wrap_min ( clock , max_clock ) ;
2008-05-03 18:29:28 +02:00
2008-04-14 08:50:02 +02:00
scd - > clock = clock ;
2008-07-30 10:15:55 +02:00
2008-08-25 17:15:34 +02:00
return scd - > clock ;
2008-05-03 18:29:28 +02:00
}
static void lock_double_clock ( struct sched_clock_data * data1 ,
struct sched_clock_data * data2 )
{
if ( data1 < data2 ) {
__raw_spin_lock ( & data1 - > lock ) ;
__raw_spin_lock ( & data2 - > lock ) ;
} else {
__raw_spin_lock ( & data2 - > lock ) ;
__raw_spin_lock ( & data1 - > lock ) ;
}
}
u64 sched_clock_cpu ( int cpu )
{
2008-07-30 10:22:07 +02:00
u64 now , clock , this_clock , remote_clock ;
2009-02-26 20:20:29 +01:00
struct sched_clock_data * scd ;
2008-05-03 18:29:28 +02:00
2009-02-26 20:20:29 +01:00
if ( sched_clock_stable )
return sched_clock ( ) ;
2008-05-29 10:07:15 +02:00
2009-02-26 20:20:29 +01:00
scd = cpu_sdc ( cpu ) ;
2008-05-03 18:29:28 +02:00
2008-05-12 21:21:14 +02:00
/*
* Normally this is not called in NMI context - but if it is ,
* trying to do any locking here is totally lethal .
*/
if ( unlikely ( in_nmi ( ) ) )
return scd - > clock ;
2008-05-29 10:07:15 +02:00
if ( unlikely ( ! sched_clock_running ) )
return 0ull ;
2008-05-03 18:29:28 +02:00
WARN_ON_ONCE ( ! irqs_disabled ( ) ) ;
now = sched_clock ( ) ;
if ( cpu ! = raw_smp_processor_id ( ) ) {
struct sched_clock_data * my_scd = this_scd ( ) ;
lock_double_clock ( scd , my_scd ) ;
2008-07-30 10:22:07 +02:00
this_clock = __update_sched_clock ( my_scd , now ) ;
remote_clock = scd - > clock ;
/*
* Use the opportunity that we have both locks
* taken to couple the two clocks : we take the
* larger time as the latest time for both
* runqueues . ( this creates monotonic movement )
*/
2008-08-25 17:15:34 +02:00
if ( likely ( ( s64 ) ( remote_clock - this_clock ) < 0 ) ) {
2008-07-30 10:22:07 +02:00
clock = this_clock ;
scd - > clock = clock ;
} else {
/*
* Should be rare , but possible :
*/
clock = remote_clock ;
my_scd - > clock = remote_clock ;
}
2008-05-03 18:29:28 +02:00
__raw_spin_unlock ( & my_scd - > lock ) ;
} else {
__raw_spin_lock ( & scd - > lock ) ;
2008-07-30 10:22:07 +02:00
clock = __update_sched_clock ( scd , now ) ;
2008-05-03 18:29:28 +02:00
}
2008-04-14 08:50:02 +02:00
__raw_spin_unlock ( & scd - > lock ) ;
2008-05-03 18:29:28 +02:00
return clock ;
}
void sched_clock_tick ( void )
{
2009-02-26 21:40:16 +01:00
struct sched_clock_data * scd ;
2008-05-03 18:29:28 +02:00
u64 now , now_gtod ;
2009-02-26 21:40:16 +01:00
if ( sched_clock_stable )
return ;
2008-05-29 10:07:15 +02:00
if ( unlikely ( ! sched_clock_running ) )
return ;
2008-05-03 18:29:28 +02:00
WARN_ON_ONCE ( ! irqs_disabled ( ) ) ;
2009-02-26 21:40:16 +01:00
scd = this_scd ( ) ;
2008-05-03 18:29:28 +02:00
now_gtod = ktime_to_ns ( ktime_get ( ) ) ;
2008-07-09 00:15:32 -04:00
now = sched_clock ( ) ;
2008-05-03 18:29:28 +02:00
__raw_spin_lock ( & scd - > lock ) ;
scd - > tick_raw = now ;
scd - > tick_gtod = now_gtod ;
2008-08-25 17:15:34 +02:00
__update_sched_clock ( scd , now ) ;
2008-05-03 18:29:28 +02:00
__raw_spin_unlock ( & scd - > lock ) ;
}
/*
* We are going deep - idle ( irqs are disabled ) :
*/
void sched_clock_idle_sleep_event ( void )
{
sched_clock_cpu ( smp_processor_id ( ) ) ;
}
EXPORT_SYMBOL_GPL ( sched_clock_idle_sleep_event ) ;
/*
* We just idled delta nanoseconds ( called with irqs disabled ) :
*/
void sched_clock_idle_wakeup_event ( u64 delta_ns )
{
2008-12-22 23:05:28 +01:00
if ( timekeeping_suspended )
return ;
2008-08-25 17:15:34 +02:00
sched_clock_tick ( ) ;
2008-05-03 18:29:28 +02:00
touch_softlockup_watchdog ( ) ;
}
EXPORT_SYMBOL_GPL ( sched_clock_idle_wakeup_event ) ;
2009-02-26 21:40:16 +01:00
# else /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */
void sched_clock_init ( void )
{
sched_clock_running = 1 ;
}
u64 sched_clock_cpu ( int cpu )
{
if ( unlikely ( ! sched_clock_running ) )
return 0 ;
return sched_clock ( ) ;
}
2009-02-26 20:20:29 +01:00
# endif /* CONFIG_HAVE_UNSTABLE_SCHED_CLOCK */
2008-05-03 18:29:28 +02:00
2008-06-27 13:41:15 +02:00
unsigned long long cpu_clock ( int cpu )
{
unsigned long long clock ;
unsigned long flags ;
2008-06-29 15:01:59 +02:00
local_irq_save ( flags ) ;
2008-06-27 13:41:15 +02:00
clock = sched_clock_cpu ( cpu ) ;
2008-06-29 15:01:59 +02:00
local_irq_restore ( flags ) ;
2008-06-27 13:41:15 +02:00
return clock ;
}
2008-06-27 14:49:35 +02:00
EXPORT_SYMBOL_GPL ( cpu_clock ) ;