2019-05-27 08:55:01 +02:00
/* SPDX-License-Identifier: GPL-2.0-or-later */
2005-09-26 16:04:21 +10:00
/ *
* PowerPC v e r s i o n
* Copyright ( C ) 1 9 9 5 - 1 9 9 6 G a r y T h o m a s ( g d t @linuxppc.org)
* Rewritten b y C o r t D o u g a n ( c o r t @cs.nmt.edu) for PReP
* Copyright ( C ) 1 9 9 6 C o r t D o u g a n < c o r t @cs.nmt.edu>
* Low- l e v e l e x c e p t i o n h a n d l e r s a n d M M U s u p p o r t
* rewritten b y P a u l M a c k e r r a s .
* Copyright ( C ) 1 9 9 6 P a u l M a c k e r r a s .
* MPC8 x x m o d i f i c a t i o n s b y D a n M a l e k
* Copyright ( C ) 1 9 9 7 D a n M a l e k ( d m a l e k @jlc.net).
*
* This f i l e c o n t a i n s l o w - l e v e l s u p p o r t a n d s e t u p f o r P o w e r P C 8 x x
* embedded p r o c e s s o r s , i n c l u d i n g t r a p a n d i n t e r r u p t d i s p a t c h .
* /
2009-04-25 22:11:05 -04:00
# include < l i n u x / i n i t . h >
2019-08-21 10:20:51 +00:00
# include < l i n u x / m a g i c . h >
2020-06-08 21:32:42 -07:00
# include < l i n u x / p g t a b l e . h >
powerpc/8xx: Add function to set pinned TLBs
Pinned TLBs cannot be modified when the MMU is enabled.
Create a function to rewrite the pinned TLB entries with MMU off.
To set pinned TLB, we have to turn off MMU, disable pinning,
do a TLB flush (Either with tlbie and tlbia) then reprogam
the TLB entries, enable pinning and turn on MMU.
If using tlbie, it cleared entries in both instruction and data
TLB regardless whether pinning is disabled or not.
If using tlbia, it clears all entries of the TLB which has
disabled pinning.
To make it easy, just clear all entries in both TLBs, and
reprogram them.
The function takes two arguments, the top of the memory to
consider and whether data is RO under _sinittext.
When DEBUG_PAGEALLOC is set, the top is the end of kernel rodata.
Otherwise, that's the top of physical RAM.
Everything below _sinittext is set RX, over _sinittext that's RW.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/c17806014bb1c06513ad1e1d510faea31984b177.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:13 +00:00
# include < l i n u x / s i z e s . h >
2005-09-26 16:04:21 +10:00
# include < a s m / p r o c e s s o r . h >
# include < a s m / p a g e . h >
# include < a s m / m m u . h >
# include < a s m / c a c h e . h >
# include < a s m / c p u t a b l e . h >
# include < a s m / t h r e a d _ i n f o . h >
# include < a s m / p p c _ a s m . h >
# include < a s m / a s m - o f f s e t s . h >
2010-11-18 15:06:17 +00:00
# include < a s m / p t r a c e . h >
2016-01-13 23:33:46 -05:00
# include < a s m / e x p o r t . h >
2018-10-19 06:55:06 +00:00
# include < a s m / c o d e - p a t c h i n g - a s m . h >
2021-04-19 15:48:09 +00:00
# include < a s m / i n t e r r u p t . h >
2005-09-26 16:04:21 +10:00
2021-03-12 12:50:23 +00:00
/ *
* Value f o r t h e b i t s t h a t h a v e f i x e d v a l u e i n R P N e n t r i e s .
* Also u s e d f o r t a g g i n g D A R f o r D T L B e r r o r .
* /
# define R P N _ P A T T E R N 0 x00 f0
2019-04-30 12:38:50 +00:00
# include " h e a d _ 3 2 . h "
2020-05-19 05:49:20 +00:00
.macro compare_to_kernel_boundary scratch, a d d r
2015-04-20 07:54:46 +02:00
# if C O N F I G _ T A S K _ S I Z E < = 0 x80 0 0 0 0 0 0 & & C O N F I G _ P A G E _ O F F S E T > = 0 x80 0 0 0 0 0 0
2017-07-12 12:08:47 +02:00
/* By simply checking Address >= 0x80000000, we know if its a kernel address */
2020-05-19 05:49:20 +00:00
not. \ s c r a t c h , \ a d d r
# else
rlwinm \ s c r a t c h , \ a d d r , 1 6 , 0 x f f f8
cmpli c r0 , \ s c r a t c h , P A G E _ O F F S E T @h
2015-04-20 07:54:46 +02:00
# endif
2020-05-19 05:49:20 +00:00
.endm
2015-04-20 07:54:46 +02:00
2016-12-07 08:47:28 +01:00
# define P A G E _ S H I F T _ 5 1 2 K 1 9
# define P A G E _ S H I F T _ 8 M 2 3
2009-04-25 22:11:05 -04:00
_ _ HEAD
2007-09-13 15:42:35 -05:00
_ ENTRY( _ s t e x t ) ;
_ ENTRY( _ s t a r t ) ;
2005-09-26 16:04:21 +10:00
/ * MPC8 x x
* This p o r t w a s d o n e o n a n M B X b o a r d w i t h a n 8 6 0 . R i g h t n o w I o n l y
* support a n E L F c o m p r e s s e d ( z I m a g e ) b o o t f r o m E P P C - B u g b e c a u s e t h e
* code t h e r e l o a d s u p s o m e r e g i s t e r s b e f o r e c a l l i n g u s :
* r3 : ptr t o b o a r d i n f o d a t a
* r4 : initrd_ s t a r t o r i f n o i n i t r d t h e n 0
* r5 : initrd_ e n d - u n u s e d i f r4 i s 0
* r6 : Start o f c o m m a n d l i n e s t r i n g
* r7 : End o f c o m m a n d l i n e s t r i n g
*
* I d e c i d e d t o u s e c o n d i t i o n a l c o m p i l a t i o n i n s t e a d o f c h e c k i n g P V R a n d
* adding m o r e p r o c e s s o r s p e c i f i c b r a n c h e s a r o u n d c o d e I d o n ' t n e e d .
* Since t h i s i s a n e m b e d d e d p r o c e s s o r , I a l s o a p p r e c i a t e a n y m e m o r y
* savings I c a n g e t .
*
* The M P C 8 x x d o e s n o t h a v e a n y B A T s , b u t i t s u p p o r t s l a r g e p a g e s i z e s .
* We f i r s t i n i t i a l i z e t h e M M U t o s u p p o r t 8 M b y t e p a g e s , t h e n l o a d o n e
* entry i n t o e a c h o f t h e i n s t r u c t i o n a n d d a t a T L B s t o m a p t h e f i r s t
* 8 M 1 : 1 . I a l s o m a p p e d a n a d d i t i o n a l I / O s p a c e 1 : 1 s o w e c a n g e t t o
* the " i n t e r n a l " p r o c e s s o r r e g i s t e r s b e f o r e M M U _ i n i t i s c a l l e d .
*
* - - Dan
* /
.globl __start
__start :
2011-07-25 11:29:33 +00:00
mr r31 ,r3 / * s a v e d e v i c e t r e e p t r * /
2005-09-26 16:04:21 +10:00
/ * We h a v e t o t u r n o n t h e M M U r i g h t a w a y s o w e g e t c a c h e m o d e s
* set c o r r e c t l y .
* /
bl i n i t i a l _ m m u
/ * We n o w h a v e t h e l o w e r 8 M e g m a p p e d i n t o T L B e n t r i e s , a n d t h e c a c h e s
* ready t o w o r k .
* /
turn_on_mmu :
mfmsr r0
ori r0 ,r0 ,M S R _ D R | M S R _ I R
mtspr S P R N _ S R R 1 ,r0
lis r0 ,s t a r t _ h e r e @h
ori r0 ,r0 ,s t a r t _ h e r e @l
mtspr S P R N _ S R R 0 ,r0
rfi / * e n a b l e s M M U * /
2018-11-29 14:07:11 +00:00
# ifdef C O N F I G _ P E R F _ E V E N T S
.align 4
.globl itlb_miss_counter
itlb_miss_counter :
.space 4
.globl dtlb_miss_counter
dtlb_miss_counter :
.space 4
.globl instruction_counter
instruction_counter :
.space 4
# endif
2005-09-26 16:04:21 +10:00
/* System reset */
2021-04-19 15:48:09 +00:00
EXCEPTION( I N T E R R U P T _ S Y S T E M _ R E S E T , R e s e t , s y s t e m _ r e s e t _ e x c e p t i o n )
2005-09-26 16:04:21 +10:00
/* Machine check */
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ M A C H I N E _ C H E C K , M a c h i n e C h e c k )
EXCEPTION_ P R O L O G I N T E R R U P T _ M A C H I N E _ C H E C K M a c h i n e C h e c k h a n d l e _ d a r _ d s i s r =1
2021-03-12 12:50:41 +00:00
prepare_ t r a n s f e r _ t o _ h a n d l e r
bl m a c h i n e _ c h e c k _ e x c e p t i o n
b i n t e r r u p t _ r e t u r n
2005-09-26 16:04:21 +10:00
/* External interrupt */
2021-04-19 15:48:09 +00:00
EXCEPTION( I N T E R R U P T _ E X T E R N A L , H a r d w a r e I n t e r r u p t , d o _ I R Q )
2005-09-26 16:04:21 +10:00
/* Alignment exception */
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ A L I G N M E N T , A l i g n m e n t )
EXCEPTION_ P R O L O G I N T E R R U P T _ A L I G N M E N T A l i g n m e n t h a n d l e _ d a r _ d s i s r =1
2021-03-12 12:50:40 +00:00
prepare_ t r a n s f e r _ t o _ h a n d l e r
bl a l i g n m e n t _ e x c e p t i o n
REST_ N V G P R S ( r1 )
b i n t e r r u p t _ r e t u r n
2005-09-26 16:04:21 +10:00
/* Program check exception */
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ P R O G R A M , P r o g r a m C h e c k )
EXCEPTION_ P R O L O G I N T E R R U P T _ P R O G R A M P r o g r a m C h e c k
2021-03-12 12:50:40 +00:00
prepare_ t r a n s f e r _ t o _ h a n d l e r
bl p r o g r a m _ c h e c k _ e x c e p t i o n
REST_ N V G P R S ( r1 )
b i n t e r r u p t _ r e t u r n
2005-09-26 16:04:21 +10:00
/* Decrementer */
2021-04-19 15:48:09 +00:00
EXCEPTION( I N T E R R U P T _ D E C R E M E N T E R , D e c r e m e n t e r , t i m e r _ i n t e r r u p t )
2005-09-26 16:04:21 +10:00
/* System call */
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ S Y S C A L L , S y s t e m C a l l )
SYSCALL_ E N T R Y I N T E R R U P T _ S Y S C A L L
2005-09-26 16:04:21 +10:00
/* Single step - not used on 601 */
2021-04-19 15:48:09 +00:00
EXCEPTION( I N T E R R U P T _ T R A C E , S i n g l e S t e p , s i n g l e _ s t e p _ e x c e p t i o n )
2005-09-26 16:04:21 +10:00
/ * On t h e M P C 8 x x , t h i s i s a s o f t w a r e e m u l a t i o n i n t e r r u p t . I t o c c u r s
* for a l l u n i m p l e m e n t e d a n d i l l e g a l i n s t r u c t i o n s .
* /
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ S O F T _ E M U _ 8 x x , S o f t E m u )
EXCEPTION_ P R O L O G I N T E R R U P T _ S O F T _ E M U _ 8 x x S o f t E m u
2021-03-12 12:50:40 +00:00
prepare_ t r a n s f e r _ t o _ h a n d l e r
bl e m u l a t i o n _ a s s i s t _ i n t e r r u p t
REST_ N V G P R S ( r1 )
b i n t e r r u p t _ r e t u r n
2005-09-26 16:04:21 +10:00
/ *
* For t h e M P C 8 x x , t h i s i s a s o f t w a r e t a b l e w a l k t o l o a d t h e i n s t r u c t i o n
2018-11-29 14:07:15 +00:00
* TLB. T h e t a s k s w i t c h l o a d s t h e M _ T W B r e g i s t e r w i t h t h e p o i n t e r t o t h e f i r s t
2014-09-19 10:36:08 +02:00
* level t a b l e .
2005-09-26 16:04:21 +10:00
* If w e d i s c o v e r t h e r e i s n o s e c o n d l e v e l t a b l e ( v a l u e i s z e r o ) o r i f t h e r e
* is a n i n v a l i d p t e , w e l o a d t h a t i n t o t h e T L B , w h i c h c a u s e s a n o t h e r f a u l t
* into t h e T L B E r r o r i n t e r r u p t w h e r e w e c a n h a n d l e s u c h p r o b l e m s .
* We h a v e t o u s e t h e M D _ x x x r e g i s t e r s f o r t h e t a b l e w a l k b e c a u s e t h e
* equivalent M I _ x x x r e g i s t e r s o n l y p e r f o r m t h e a t t r i b u t e f u n c t i o n s .
* /
2015-04-20 07:54:38 +02:00
# ifdef C O N F I G _ 8 x x _ C P U 1 5
2020-11-24 15:24:56 +00:00
# define I N V A L I D A T E _ A D J A C E N T _ P A G E S _ C P U 1 5 ( a d d r , t m p ) \
addi t m p , a d d r , P A G E _ S I Z E ; \
tlbie t m p ; \
addi t m p , a d d r , - P A G E _ S I Z E ; \
tlbie t m p
2015-04-20 07:54:38 +02:00
# else
2020-11-24 15:24:56 +00:00
# define I N V A L I D A T E _ A D J A C E N T _ P A G E S _ C P U 1 5 ( a d d r , t m p )
2015-04-20 07:54:38 +02:00
# endif
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ I N S T _ T L B _ M I S S _ 8 x x , I n s t r u c t i o n T L B M i s s )
2020-11-24 15:24:57 +00:00
mtspr S P R N _ S P R G _ S C R A T C H 2 , r10
mtspr S P R N _ M _ T W , r11
2005-09-26 16:04:21 +10:00
/ * If w e a r e f a u l t i n g a k e r n e l a d d r e s s , w e h a v e t o u s e t h e
* kernel p a g e t a b l e s .
* /
2016-09-16 08:42:04 +02:00
mfspr r10 , S P R N _ S R R 0 / * G e t e f f e c t i v e a d d r e s s o f f a u l t * /
2020-11-24 15:24:56 +00:00
INVALIDATE_ A D J A C E N T _ P A G E S _ C P U 1 5 ( r10 , r11 )
2018-11-29 14:07:15 +00:00
mtspr S P R N _ M D _ E P N , r10
2020-11-24 15:24:55 +00:00
# ifdef C O N F I G _ M O D U L E S
2018-11-29 14:07:24 +00:00
mfcr r11
2020-05-19 05:49:20 +00:00
compare_ t o _ k e r n e l _ b o u n d a r y r10 , r10
2016-09-16 08:42:04 +02:00
# endif
2018-11-29 14:07:24 +00:00
mfspr r10 , S P R N _ M _ T W B / * G e t l e v e l 1 t a b l e * /
2020-11-24 15:24:55 +00:00
# ifdef C O N F I G _ M O D U L E S
2017-07-12 12:08:47 +02:00
blt+ 3 f
2018-11-29 14:07:24 +00:00
rlwinm r10 , r10 , 0 , 2 0 , 3 1
oris r10 , r10 , ( s w a p p e r _ p g _ d i r - P A G E _ O F F S E T ) @ha
2005-09-26 16:04:21 +10:00
3 :
2020-05-19 05:49:08 +00:00
mtcr r11
2010-03-02 05:37:10 +00:00
# endif
2020-05-19 05:49:08 +00:00
lwz r11 , ( s w a p p e r _ p g _ d i r - P A G E _ O F F S E T ) @l(r10) /* Get level 1 entry */
mtspr S P R N _ M D _ T W C , r11
2018-11-29 14:07:15 +00:00
mfspr r10 , S P R N _ M D _ T W C
2015-04-22 12:06:43 +02:00
lwz r10 , 0 ( r10 ) / * G e t t h e p t e * /
2020-10-12 08:54:33 +00:00
rlwimi r11 , r10 , 0 , _ P A G E _ G U A R D E D | _ P A G E _ A C C E S S E D
powerpc/8xx: Manage 512k huge pages as standard pages.
At the time being, 512k huge pages are handled through hugepd page
tables. The PMD entry is flagged as a hugepd pointer and it
means that only 512k hugepages can be managed in that 4M block.
However, the hugepd table has the same size as a normal page
table, and 512k entries can therefore be nested with normal pages.
On the 8xx, TLB loading is performed by software and allthough the
page tables are organised to match the L1 and L2 level defined by
the HW, all TLB entries have both L1 and L2 independent entries.
It means that even if two TLB entries are associated with the same
PMD entry, they can be loaded with different values in L1 part.
The L1 entry contains the page size (PS field):
- 00 for 4k and 16 pages
- 01 for 512k pages
- 11 for 8M pages
By adding a flag for hugepages in the PTE (_PAGE_HUGE) and copying it
into the lower bit of PS, we can then manage 512k pages with normal
page tables:
- PMD entry has PS=11 for 8M pages
- PMD entry has PS=00 for other pages.
As a PMD entry covers 4M areas, a PMD will either point to a hugepd
table having a single entry to an 8M page, or the PMD will point to
a standard page table which will have either entries to 4k or 16k or
512k pages. For 512k pages, as the L1 entry will not know it is a
512k page before the PTE is read, there will be 128 entries in the
PTE as if it was 4k pages. But when loading the TLB, it will be
flagged as a 512k page.
Note that we can't use pmd_ptr() in asm/nohash/32/pgtable.h because
it is not defined yet.
In ITLB miss, we keep the possibility to opt it out as when kernel
text is pinned and no user hugepages are used, we can save several
instruction by not using r11.
In DTLB miss, that's just one instruction so it's not worth bothering
with it.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/002819e8e166bf81d24b24782d98de7c40905d8f.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:09 +00:00
rlwimi r11 , r10 , 3 2 - 9 , _ P M D _ P A G E _ 5 1 2 K
mtspr S P R N _ M I _ T W C , r11
2005-09-26 16:04:21 +10:00
/ * The L i n u x P T E w o n ' t g o e x a c t l y i n t o t h e M M U T L B .
2018-01-12 13:45:31 +01:00
* Software i n d i c a t o r b i t s 2 0 a n d 2 3 m u s t b e c l e a r .
* Software i n d i c a t o r b i t s 2 2 , 2 4 , 2 5 , 2 6 , a n d 2 7 m u s t b e
2005-09-26 16:04:21 +10:00
* set. A l l o t h e r L i n u x P T E b i t s c o n t r o l t h e b e h a v i o r
* of t h e M M U .
* /
2020-02-09 18:14:42 +00:00
rlwinm r10 , r10 , 0 , ~ 0 x0 f00 / * C l e a r b i t s 2 0 - 2 3 * /
2018-11-29 14:07:24 +00:00
rlwimi r10 , r10 , 4 , 0 x04 0 0 / * C o p y _ P A G E _ E X E C i n t o b i t 2 1 * /
ori r10 , r10 , R P N _ P A T T E R N | 0 x20 0 / * S e t 2 2 a n d 2 4 - 2 7 * /
2018-01-12 13:45:19 +01:00
mtspr S P R N _ M I _ R P N , r10 / * U p d a t e T L B e n t r y * /
2005-09-26 16:04:21 +10:00
2010-03-02 05:37:12 +00:00
/* Restore registers */
2020-11-24 15:24:57 +00:00
0 : mfspr r10 , S P R N _ S P R G _ S C R A T C H 2
mfspr r11 , S P R N _ M _ T W
2018-01-12 13:45:23 +01:00
rfi
2018-10-19 06:55:08 +00:00
patch_ s i t e 0 b , p a t c h _ _ i t l b m i s s _ e x i t _ 1
2018-01-12 13:45:23 +01:00
# ifdef C O N F I G _ P E R F _ E V E N T S
2018-10-19 06:55:08 +00:00
patch_ s i t e 0 f , p a t c h _ _ i t l b m i s s _ p e r f
2018-11-29 14:07:11 +00:00
0 : lwz r10 , ( i t l b _ m i s s _ c o u n t e r - P A G E _ O F F S E T ) @l(0)
addi r10 , r10 , 1
stw r10 , ( i t l b _ m i s s _ c o u n t e r - P A G E _ O F F S E T ) @l(0)
2020-11-24 15:24:57 +00:00
mfspr r10 , S P R N _ S P R G _ S C R A T C H 2
mfspr r11 , S P R N _ M _ T W
2005-09-26 16:04:21 +10:00
rfi
2018-11-29 14:07:11 +00:00
# endif
2005-09-26 16:04:21 +10:00
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ D A T A _ T L B _ M I S S _ 8 x x , D a t a S t o r e T L B M i s s )
2020-11-24 15:24:58 +00:00
mtspr S P R N _ S P R G _ S C R A T C H 2 , r10
2019-12-21 08:32:31 +00:00
mtspr S P R N _ M _ T W , r11
2018-11-29 14:07:24 +00:00
mfcr r11
2005-09-26 16:04:21 +10:00
/ * If w e a r e f a u l t i n g a k e r n e l a d d r e s s , w e h a v e t o u s e t h e
* kernel p a g e t a b l e s .
* /
2016-09-16 08:42:08 +02:00
mfspr r10 , S P R N _ M D _ E P N
2020-05-19 05:49:20 +00:00
compare_ t o _ k e r n e l _ b o u n d a r y r10 , r10
2018-11-29 14:07:24 +00:00
mfspr r10 , S P R N _ M _ T W B / * G e t l e v e l 1 t a b l e * /
blt+ 3 f
rlwinm r10 , r10 , 0 , 2 0 , 3 1
oris r10 , r10 , ( s w a p p e r _ p g _ d i r - P A G E _ O F F S E T ) @ha
2005-09-26 16:04:21 +10:00
3 :
2018-11-29 14:07:24 +00:00
mtcr r11
lwz r11 , ( s w a p p e r _ p g _ d i r - P A G E _ O F F S E T ) @l(r10) /* Get level 1 entry */
2005-09-26 16:04:21 +10:00
2018-11-29 14:07:15 +00:00
mtspr S P R N _ M D _ T W C , r11
mfspr r10 , S P R N _ M D _ T W C
2005-09-26 16:04:21 +10:00
lwz r10 , 0 ( r10 ) / * G e t t h e p t e * /
2018-11-29 14:07:15 +00:00
2020-10-12 08:54:33 +00:00
/ * Insert G u a r d e d a n d A c c e s s e d f l a g s i n t o t h e T W C f r o m t h e L i n u x P T E .
2018-01-12 13:45:31 +01:00
* It i s b i t 2 7 o f b o t h t h e L i n u x P T E a n d t h e T W C ( a t l e a s t
2005-09-26 16:04:21 +10:00
* I g o t t h a t r i g h t : - ) . I t w i l l b e b e t t e r w h e n w e c a n p u t
* this i n t o t h e L i n u x p g d / p m d a n d l o a d i t i n t h e o p e r a t i o n
* above.
* /
2020-10-12 08:54:33 +00:00
rlwimi r11 , r10 , 0 , _ P A G E _ G U A R D E D | _ P A G E _ A C C E S S E D
powerpc/8xx: Manage 512k huge pages as standard pages.
At the time being, 512k huge pages are handled through hugepd page
tables. The PMD entry is flagged as a hugepd pointer and it
means that only 512k hugepages can be managed in that 4M block.
However, the hugepd table has the same size as a normal page
table, and 512k entries can therefore be nested with normal pages.
On the 8xx, TLB loading is performed by software and allthough the
page tables are organised to match the L1 and L2 level defined by
the HW, all TLB entries have both L1 and L2 independent entries.
It means that even if two TLB entries are associated with the same
PMD entry, they can be loaded with different values in L1 part.
The L1 entry contains the page size (PS field):
- 00 for 4k and 16 pages
- 01 for 512k pages
- 11 for 8M pages
By adding a flag for hugepages in the PTE (_PAGE_HUGE) and copying it
into the lower bit of PS, we can then manage 512k pages with normal
page tables:
- PMD entry has PS=11 for 8M pages
- PMD entry has PS=00 for other pages.
As a PMD entry covers 4M areas, a PMD will either point to a hugepd
table having a single entry to an 8M page, or the PMD will point to
a standard page table which will have either entries to 4k or 16k or
512k pages. For 512k pages, as the L1 entry will not know it is a
512k page before the PTE is read, there will be 128 entries in the
PTE as if it was 4k pages. But when loading the TLB, it will be
flagged as a 512k page.
Note that we can't use pmd_ptr() in asm/nohash/32/pgtable.h because
it is not defined yet.
In ITLB miss, we keep the possibility to opt it out as when kernel
text is pinned and no user hugepages are used, we can save several
instruction by not using r11.
In DTLB miss, that's just one instruction so it's not worth bothering
with it.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/002819e8e166bf81d24b24782d98de7c40905d8f.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:09 +00:00
rlwimi r11 , r10 , 3 2 - 9 , _ P M D _ P A G E _ 5 1 2 K
2018-01-12 13:45:33 +01:00
mtspr S P R N _ M D _ T W C , r11
2005-09-26 16:04:21 +10:00
/ * The L i n u x P T E w o n ' t g o e x a c t l y i n t o t h e M M U T L B .
* Software i n d i c a t o r b i t s 2 4 , 2 5 , 2 6 , a n d 2 7 m u s t b e
* set. A l l o t h e r L i n u x P T E b i t s c o n t r o l t h e b e h a v i o r
* of t h e M M U .
* /
2015-01-20 10:57:33 +01:00
li r11 , R P N _ P A T T E R N
2016-12-07 08:47:28 +01:00
rlwimi r10 , r11 , 0 , 2 4 , 2 7 / * S e t 2 4 - 2 7 * /
2018-01-12 13:45:19 +01:00
mtspr S P R N _ M D _ R P N , r10 / * U p d a t e T L B e n t r y * /
2020-11-24 15:24:58 +00:00
mtspr S P R N _ D A R , r11 / * T a g D A R * /
2005-09-26 16:04:21 +10:00
2010-03-02 05:37:12 +00:00
/* Restore registers */
2018-10-19 06:55:08 +00:00
2020-11-24 15:24:58 +00:00
0 : mfspr r10 , S P R N _ S P R G _ S C R A T C H 2
2019-12-21 08:32:31 +00:00
mfspr r11 , S P R N _ M _ T W
2018-01-12 13:45:23 +01:00
rfi
2018-10-19 06:55:08 +00:00
patch_ s i t e 0 b , p a t c h _ _ d t l b m i s s _ e x i t _ 1
2020-05-19 05:49:18 +00:00
# ifdef C O N F I G _ P E R F _ E V E N T S
patch_ s i t e 0 f , p a t c h _ _ d t l b m i s s _ p e r f
0 : lwz r10 , ( d t l b _ m i s s _ c o u n t e r - P A G E _ O F F S E T ) @l(0)
addi r10 , r10 , 1
stw r10 , ( d t l b _ m i s s _ c o u n t e r - P A G E _ O F F S E T ) @l(0)
2020-11-24 15:24:58 +00:00
mfspr r10 , S P R N _ S P R G _ S C R A T C H 2
2020-05-19 05:49:18 +00:00
mfspr r11 , S P R N _ M _ T W
rfi
# endif
2005-09-26 16:04:21 +10:00
/ * This i s a n i n s t r u c t i o n T L B e r r o r o n t h e M P C 8 x x . T h i s c o u l d b e d u e
* to m a n y r e a s o n s , s u c h a s e x e c u t i n g g u a r d e d m e m o r y o r i l l e g a l i n s t r u c t i o n
* addresses. T h e r e i s n o t h i n g t o d o b u t h a n d l e a b i g t i m e e r r o r f a u l t .
* /
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ I N S T _ T L B _ E R R O R _ 8 x x , I n s t r u c t i o n T L B E r r o r )
2021-03-12 12:50:38 +00:00
/* 0x400 is InstructionAccess exception, needed by bad_page_fault() */
2021-04-19 15:48:09 +00:00
EXCEPTION_ P R O L O G I N T E R R U P T _ I N S T _ S T O R A G E I n s t r u c t i o n T L B E r r o r
2017-07-19 14:49:28 +10:00
andis. r5 ,r9 ,D S I S R _ S R R 1 _ M A T C H _ 3 2 S @h /* Filter relevant SRR1 bits */
andis. r10 ,r9 ,S R R 1 _ I S I _ N O P T @h
powerpc/8xx: hide itlbie and dtlbie symbols
When disassembling InstructionTLBError we get the following messy code:
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <itlbie>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0 <itlbie>:
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
For a cleaner code dump, this patch replaces itlbie and dtlbie
symbols by local symbols.
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <InstructionTLBError+0xa0>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
2018-12-13 08:08:11 +00:00
beq+ . L i t l b i e
2021-01-30 23:08:16 +10:00
tlbie r12
powerpc/8xx: hide itlbie and dtlbie symbols
When disassembling InstructionTLBError we get the following messy code:
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <itlbie>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0 <itlbie>:
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
For a cleaner code dump, this patch replaces itlbie and dtlbie
symbols by local symbols.
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <InstructionTLBError+0xa0>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
2018-12-13 08:08:11 +00:00
.Litlbie :
2021-01-30 23:08:16 +10:00
stw r12 , _ D A R ( r11 )
stw r5 , _ D S I S R ( r11 )
2021-03-12 12:50:41 +00:00
prepare_ t r a n s f e r _ t o _ h a n d l e r
bl d o _ p a g e _ f a u l t
b i n t e r r u p t _ r e t u r n
2005-09-26 16:04:21 +10:00
/ * This i s t h e d a t a T L B e r r o r o n t h e M P C 8 x x . T h i s c o u l d b e d u e t o
2014-08-29 11:14:38 +02:00
* many r e a s o n s , i n c l u d i n g a d i r t y u p d a t e t o a p t e . W e b a i l o u t t o
* a h i g h e r l e v e l f u n c t i o n t h a t c a n h a n d l e i t .
2005-09-26 16:04:21 +10:00
* /
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ D A T A _ T L B _ E R R O R _ 8 x x , D a t a T L B E r r o r )
2019-12-21 08:32:35 +00:00
EXCEPTION_ P R O L O G _ 0 h a n d l e _ d a r _ d s i s r =1
2014-08-29 11:14:38 +02:00
mfspr r11 , S P R N _ D A R
2019-12-21 08:32:25 +00:00
cmpwi c r1 , r11 , R P N _ P A T T E R N
beq- c r1 , F i x u p D A R / * m u s t b e a b u g g y d c b X , i c b i i n s n . * /
2014-08-29 11:14:37 +02:00
DARFixed : /* Return from dcbx instruction bug workaround */
2014-09-19 10:36:08 +02:00
EXCEPTION_ P R O L O G _ 1
2021-03-12 12:50:38 +00:00
/* 0x300 is DataAccess exception, needed by bad_page_fault() */
2021-04-19 15:48:09 +00:00
EXCEPTION_ P R O L O G _ 2 I N T E R R U P T _ D A T A _ S T O R A G E D a t a T L B E r r o r h a n d l e _ d a r _ d s i s r =1
2021-03-12 12:50:22 +00:00
lwz r4 , _ D A R ( r11 )
lwz r5 , _ D S I S R ( r11 )
2017-08-08 13:59:00 +02:00
andis. r10 ,r5 ,D S I S R _ N O H P T E @h
powerpc/8xx: hide itlbie and dtlbie symbols
When disassembling InstructionTLBError we get the following messy code:
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <itlbie>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0 <itlbie>:
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
For a cleaner code dump, this patch replaces itlbie and dtlbie
symbols by local symbols.
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <InstructionTLBError+0xa0>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
2018-12-13 08:08:11 +00:00
beq+ . L d t l b i e
2014-09-19 10:36:10 +02:00
tlbie r4
powerpc/8xx: hide itlbie and dtlbie symbols
When disassembling InstructionTLBError we get the following messy code:
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <itlbie>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0 <itlbie>:
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
For a cleaner code dump, this patch replaces itlbie and dtlbie
symbols by local symbols.
c000138c: 7d 84 63 78 mr r4,r12
c0001390: 75 25 58 00 andis. r5,r9,22528
c0001394: 75 2a 40 00 andis. r10,r9,16384
c0001398: 41 a2 00 08 beq c00013a0 <InstructionTLBError+0xa0>
c000139c: 7c 00 22 64 tlbie r4,r0
c00013a0: 39 40 04 01 li r10,1025
c00013a4: 91 4b 00 b0 stw r10,176(r11)
c00013a8: 39 40 10 32 li r10,4146
c00013ac: 48 00 cc 59 bl c000e004 <transfer_to_handler>
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
2018-12-13 08:08:11 +00:00
.Ldtlbie :
2021-03-12 12:50:41 +00:00
prepare_ t r a n s f e r _ t o _ h a n d l e r
bl d o _ p a g e _ f a u l t
b i n t e r r u p t _ r e t u r n
2005-09-26 16:04:21 +10:00
2021-03-12 12:50:27 +00:00
# ifdef C O N F I G _ V M A P _ S T A C K
2019-12-21 08:32:35 +00:00
vmap_ s t a c k _ o v e r f l o w _ e x c e p t i o n
2021-03-12 12:50:27 +00:00
# endif
2019-12-21 08:32:35 +00:00
2005-09-26 16:04:21 +10:00
/ * On t h e M P C 8 x x , t h e s e n e x t f o u r t r a p s a r e u s e d f o r d e v e l o p m e n t
* support o f b r e a k p o i n t s a n d s u c h . S o m e d a y I w i l l g e t a r o u n d t o
* using t h e m .
* /
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ D A T A _ B R E A K P O I N T _ 8 x x , D a t a B r e a k p o i n t )
2019-12-21 08:32:35 +00:00
EXCEPTION_ P R O L O G _ 0 h a n d l e _ d a r _ d s i s r =1
2019-12-21 08:32:34 +00:00
mfspr r11 , S P R N _ S R R 0
cmplwi c r1 , r11 , ( . L d t l b i e - P A G E _ O F F S E T ) @l
cmplwi c r7 , r11 , ( . L i t l b i e - P A G E _ O F F S E T ) @l
cror 4 * c r1 + e q , 4 * c r1 + e q , 4 * c r7 + e q
2021-03-12 12:50:29 +00:00
bne c r1 , 1 f
powerpc/8xx: Implement hw_breakpoint
This patch implements HW breakpoint on the 8xx. The 8xx has
capability to manage HW breakpoints, which is slightly different
than BOOK3S:
1/ The breakpoint match doesn't trigger a DSI exception but a
dedicated data breakpoint exception.
2/ The breakpoint happens after the instruction has completed,
no need to single step or emulate the instruction,
3/ Matched address is not set in DAR but in BAR,
4/ DABR register doesn't exist, instead we have registers
LCTRL1, LCTRL2 and CMPx registers,
5/ The match on one comparator is not on a double word but
on a single word.
The patch does:
1/ Prepare the dedicated registers in call to __set_dabr(). In order
to emulate the double word handling of BOOK3S, comparator E is set to
DABR address value and comparator F to address + 4. Then breakpoint 1
is set to match comparator E or F,
2/ Skip the singlestepping stage when compiled for CONFIG_PPC_8xx,
3/ Implement the exception. In that exception, the matched address
is taken from SPRN_BAR and manage as if it was from SPRN_DAR.
4/ I/D TLB error exception routines perform a tlbie on bad TLBs. That
tlbie triggers the breakpoint exception when performed on the
breakpoint address. For this reason, the routine returns if the match
is from one of those two tlbie.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-11-29 09:52:15 +01:00
mtcr r10
2018-01-12 13:45:21 +01:00
mfspr r10 , S P R N _ S P R G _ S C R A T C H 0
mfspr r11 , S P R N _ S P R G _ S C R A T C H 1
powerpc/8xx: Implement hw_breakpoint
This patch implements HW breakpoint on the 8xx. The 8xx has
capability to manage HW breakpoints, which is slightly different
than BOOK3S:
1/ The breakpoint match doesn't trigger a DSI exception but a
dedicated data breakpoint exception.
2/ The breakpoint happens after the instruction has completed,
no need to single step or emulate the instruction,
3/ Matched address is not set in DAR but in BAR,
4/ DABR register doesn't exist, instead we have registers
LCTRL1, LCTRL2 and CMPx registers,
5/ The match on one comparator is not on a double word but
on a single word.
The patch does:
1/ Prepare the dedicated registers in call to __set_dabr(). In order
to emulate the double word handling of BOOK3S, comparator E is set to
DABR address value and comparator F to address + 4. Then breakpoint 1
is set to match comparator E or F,
2/ Skip the singlestepping stage when compiled for CONFIG_PPC_8xx,
3/ Implement the exception. In that exception, the matched address
is taken from SPRN_BAR and manage as if it was from SPRN_DAR.
4/ I/D TLB error exception routines perform a tlbie on bad TLBs. That
tlbie triggers the breakpoint exception when performed on the
breakpoint address. For this reason, the routine returns if the match
is from one of those two tlbie.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-11-29 09:52:15 +01:00
rfi
2021-03-12 12:50:29 +00:00
1 : EXCEPTION_ P R O L O G _ 1
2021-04-19 15:48:09 +00:00
EXCEPTION_ P R O L O G _ 2 I N T E R R U P T _ D A T A _ B R E A K P O I N T _ 8 x x D a t a B r e a k p o i n t h a n d l e _ d a r _ d s i s r =1
2021-03-12 12:50:29 +00:00
mfspr r4 ,S P R N _ B A R
stw r4 ,_ D A R ( r11 )
2021-03-12 12:50:40 +00:00
prepare_ t r a n s f e r _ t o _ h a n d l e r
bl d o _ b r e a k
REST_ N V G P R S ( r1 )
b i n t e r r u p t _ r e t u r n
2021-03-12 12:50:29 +00:00
2018-01-12 13:45:23 +01:00
# ifdef C O N F I G _ P E R F _ E V E N T S
2021-04-19 15:48:09 +00:00
START_ E X C E P T I O N ( I N T E R R U P T _ I N S T _ B R E A K P O I N T _ 8 x x , I n s t r u c t i o n B r e a k p o i n t )
2018-01-12 13:45:21 +01:00
mtspr S P R N _ S P R G _ S C R A T C H 0 , r10
2018-11-29 14:07:11 +00:00
lwz r10 , ( i n s t r u c t i o n _ c o u n t e r - P A G E _ O F F S E T ) @l(0)
addi r10 , r10 , - 1
stw r10 , ( i n s t r u c t i o n _ c o u n t e r - P A G E _ O F F S E T ) @l(0)
powerpc/8xx: Perf events on PPC 8xx
This patch has been reworked since RFC version. In the RFC, this patch
was preceded by a patch clearing MSR RI for all PPC32 at all time at
exception prologs. Now MSR RI clearing is done only when this 8xx perf
events functionality is compiled in, it is therefore limited to 8xx
and merged inside this patch.
Other main changes have been to take into account detailed review from
Peter Zijlstra. The instructions counter has been reworked to behave
as a free running counter like the three other counters.
The 8xx has no PMU, however some events can be emulated by other means.
This patch implements the following events (as reported by 'perf list'):
cpu-cycles OR cycles [Hardware event]
instructions [Hardware event]
dTLB-load-misses [Hardware cache event]
iTLB-load-misses [Hardware cache event]
'cycles' event is implemented using the timebase clock. Timebase clock
corresponds to CPU clock divided by 16, so number of cycles is
approximatly 16 times the number of TB ticks
On the 8xx, TLB misses are handled by software. It is therefore
easy to count all TLB misses each time the TLB miss exception is
called.
'instructions' is calculated by using instruction watchpoint counter.
This patch sets counter A to count instructions at address greater
than 0, hence we count all instructions executed while MSR RI bit is
set. The counter is set to the maximum which is 0xffff. Every 65535
instructions, debug instruction breakpoint exception fires. The
exception handler increments a counter in memory which then
represent the upper part of the instruction counter. We therefore
end up with a 48 bits counter. In order to avoid unnecessary overhead
while no perf event is active, this counter is started when the first
event referring to this counter is added, and the counter is stopped
when the last event referring to it is deleted. In order to properly
support breakpoint exceptions, MSR RI bit has to be unset in exception
epilogs in order to avoid breakpoint exceptions during critical
sections during changes to SRR0 and SRR1 would be problematic.
All counters are handled as free running counters.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-12-15 13:42:18 +01:00
lis r10 , 0 x f f f f
ori r10 , r10 , 0 x01
mtspr S P R N _ C O U N T A , r10
2018-01-12 13:45:21 +01:00
mfspr r10 , S P R N _ S P R G _ S C R A T C H 0
powerpc/8xx: Perf events on PPC 8xx
This patch has been reworked since RFC version. In the RFC, this patch
was preceded by a patch clearing MSR RI for all PPC32 at all time at
exception prologs. Now MSR RI clearing is done only when this 8xx perf
events functionality is compiled in, it is therefore limited to 8xx
and merged inside this patch.
Other main changes have been to take into account detailed review from
Peter Zijlstra. The instructions counter has been reworked to behave
as a free running counter like the three other counters.
The 8xx has no PMU, however some events can be emulated by other means.
This patch implements the following events (as reported by 'perf list'):
cpu-cycles OR cycles [Hardware event]
instructions [Hardware event]
dTLB-load-misses [Hardware cache event]
iTLB-load-misses [Hardware cache event]
'cycles' event is implemented using the timebase clock. Timebase clock
corresponds to CPU clock divided by 16, so number of cycles is
approximatly 16 times the number of TB ticks
On the 8xx, TLB misses are handled by software. It is therefore
easy to count all TLB misses each time the TLB miss exception is
called.
'instructions' is calculated by using instruction watchpoint counter.
This patch sets counter A to count instructions at address greater
than 0, hence we count all instructions executed while MSR RI bit is
set. The counter is set to the maximum which is 0xffff. Every 65535
instructions, debug instruction breakpoint exception fires. The
exception handler increments a counter in memory which then
represent the upper part of the instruction counter. We therefore
end up with a 48 bits counter. In order to avoid unnecessary overhead
while no perf event is active, this counter is started when the first
event referring to this counter is added, and the counter is stopped
when the last event referring to it is deleted. In order to properly
support breakpoint exceptions, MSR RI bit has to be unset in exception
epilogs in order to avoid breakpoint exceptions during critical
sections during changes to SRR0 and SRR1 would be problematic.
All counters are handled as free running counters.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-12-15 13:42:18 +01:00
rfi
# else
2021-04-19 15:48:09 +00:00
EXCEPTION( I N T E R R U P T _ I N S T _ B R E A K P O I N T _ 8 x x , T r a p _ 1 d , u n k n o w n _ e x c e p t i o n )
powerpc/8xx: Perf events on PPC 8xx
This patch has been reworked since RFC version. In the RFC, this patch
was preceded by a patch clearing MSR RI for all PPC32 at all time at
exception prologs. Now MSR RI clearing is done only when this 8xx perf
events functionality is compiled in, it is therefore limited to 8xx
and merged inside this patch.
Other main changes have been to take into account detailed review from
Peter Zijlstra. The instructions counter has been reworked to behave
as a free running counter like the three other counters.
The 8xx has no PMU, however some events can be emulated by other means.
This patch implements the following events (as reported by 'perf list'):
cpu-cycles OR cycles [Hardware event]
instructions [Hardware event]
dTLB-load-misses [Hardware cache event]
iTLB-load-misses [Hardware cache event]
'cycles' event is implemented using the timebase clock. Timebase clock
corresponds to CPU clock divided by 16, so number of cycles is
approximatly 16 times the number of TB ticks
On the 8xx, TLB misses are handled by software. It is therefore
easy to count all TLB misses each time the TLB miss exception is
called.
'instructions' is calculated by using instruction watchpoint counter.
This patch sets counter A to count instructions at address greater
than 0, hence we count all instructions executed while MSR RI bit is
set. The counter is set to the maximum which is 0xffff. Every 65535
instructions, debug instruction breakpoint exception fires. The
exception handler increments a counter in memory which then
represent the upper part of the instruction counter. We therefore
end up with a 48 bits counter. In order to avoid unnecessary overhead
while no perf event is active, this counter is started when the first
event referring to this counter is added, and the counter is stopped
when the last event referring to it is deleted. In order to properly
support breakpoint exceptions, MSR RI bit has to be unset in exception
epilogs in order to avoid breakpoint exceptions during critical
sections during changes to SRR0 and SRR1 would be problematic.
All counters are handled as free running counters.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-12-15 13:42:18 +01:00
# endif
2021-03-12 12:50:42 +00:00
EXCEPTION( 0 x1 e 0 0 , T r a p _ 1 e , u n k n o w n _ e x c e p t i o n )
EXCEPTION( 0 x1 f00 , T r a p _ 1 f , u n k n o w n _ e x c e p t i o n )
2005-09-26 16:04:21 +10:00
2021-03-12 12:50:29 +00:00
_ _ HEAD
2005-09-26 16:04:21 +10:00
. = 0 x2 0 0 0
2009-11-20 00:21:06 +00:00
/ * This i s t h e p r o c e d u r e t o c a l c u l a t e t h e d a t a E A f o r b u g g y d c b x ,d c b i i n s t r u c t i o n s
* by d e c o d i n g t h e r e g i s t e r s u s e d b y t h e d c b x i n s t r u c t i o n a n d a d d i n g t h e m .
2014-08-29 11:14:37 +02:00
* DAR i s s e t t o t h e c a l c u l a t e d a d d r e s s .
2009-11-20 00:21:06 +00:00
* /
FixupDAR : /* Entry point for dcbx workaround. */
2018-11-29 14:07:24 +00:00
mtspr S P R N _ M _ T W , r10
2009-11-20 00:21:06 +00:00
/* fetch instruction from memory. */
mfspr r10 , S P R N _ S R R 0
2018-11-29 14:07:15 +00:00
mtspr S P R N _ M D _ E P N , r10
2017-07-12 12:08:47 +02:00
rlwinm r11 , r10 , 1 6 , 0 x f f f8
2019-12-21 08:32:25 +00:00
cmpli c r1 , r11 , P A G E _ O F F S E T @h
2018-11-29 14:07:15 +00:00
mfspr r11 , S P R N _ M _ T W B / * G e t l e v e l 1 t a b l e * /
2019-12-21 08:32:25 +00:00
blt+ c r1 , 3 f
2018-10-19 06:55:06 +00:00
2016-09-16 08:42:08 +02:00
/* create physical page address from effective address */
tophys( r11 , r10 )
2018-11-29 14:07:15 +00:00
mfspr r11 , S P R N _ M _ T W B / * G e t l e v e l 1 t a b l e * /
rlwinm r11 , r11 , 0 , 2 0 , 3 1
oris r11 , r11 , ( s w a p p e r _ p g _ d i r - P A G E _ O F F S E T ) @ha
3 :
2015-01-20 10:57:34 +01:00
lwz r11 , ( s w a p p e r _ p g _ d i r - P A G E _ O F F S E T ) @l(r11) /* Get the level 1 entry */
2018-11-29 14:07:15 +00:00
mtspr S P R N _ M D _ T W C , r11
2019-12-21 08:32:25 +00:00
mtcrf 0 x01 , r11
2018-11-29 14:07:15 +00:00
mfspr r11 , S P R N _ M D _ T W C
lwz r11 , 0 ( r11 ) / * G e t t h e p t e * /
2016-12-07 08:47:28 +01:00
bt 2 8 ,2 0 0 f / * b i t 2 8 = L a r g e p a g e ( 8 M ) * /
2009-11-20 00:21:06 +00:00
/* concat physical page address(r11) and page offset(r10) */
2014-09-19 10:36:09 +02:00
rlwimi r11 , r10 , 0 , 3 2 - P A G E _ S H I F T , 3 1
powerpc/8xx: Map linear kernel RAM with 8M pages
On a live running system (VoIP gateway for Air Trafic Control), over
a 10 minutes period (with 277s idle), we get 87 millions DTLB misses
and approximatly 35 secondes are spent in DTLB handler.
This represents 5.8% of the overall time and even 10.8% of the
non-idle time.
Among those 87 millions DTLB misses, 15% are on user addresses and
85% are on kernel addresses. And within the kernel addresses, 93%
are on addresses from the linear address space and only 7% are on
addresses from the virtual address space.
MPC8xx has no BATs but it has 8Mb page size. This patch implements
mapping of kernel RAM using 8Mb pages, on the same model as what is
done on the 40x.
In 4k pages mode, each PGD entry maps a 4Mb area: we map every two
entries to the same 8Mb physical page. In each second entry, we add
4Mb to the page physical address to ease life of the FixupDAR
routine. This is just ignored by HW.
In 16k pages mode, each PGD entry maps a 64Mb area: each PGD entry
will point to the first page of the area. The DTLB handler adds
the 3 bits from EPN to map the correct page.
With this patch applied, we now get only 13 millions TLB misses
during the 10 minutes period. The idle time has increased to 313s
and the overall time spent in DTLB miss handler is 6.3s, which
represents 1% of the overall time and 2.2% of non-idle time.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-02-09 17:07:50 +01:00
201 : lwz r11 ,0 ( r11 )
2009-11-20 00:21:06 +00:00
/* Check if it really is a dcbx instruction. */
/ * dcbt a n d d c b t s t d o e s n o t g e n e r a t e D T L B M i s s e s / E r r o r s ,
* no n e e d t o i n c l u d e t h e m h e r e * /
2014-08-29 11:14:38 +02:00
xoris r10 , r11 , 0 x7 c00 / * c h e c k i f m a j o r O P c o d e i s 3 1 * /
rlwinm r10 , r10 , 0 , 2 1 , 5
2019-12-21 08:32:25 +00:00
cmpwi c r1 , r10 , 2 0 2 8 / * I s d c b z ? * /
beq+ c r1 , 1 4 2 f
cmpwi c r1 , r10 , 9 4 0 / * I s d c b i ? * /
beq+ c r1 , 1 4 2 f
cmpwi c r1 , r10 , 1 0 8 / * I s d c b s t ? * /
beq+ c r1 , 1 4 4 f / * F i x u p s t o r e b i t ! * /
cmpwi c r1 , r10 , 1 7 2 / * I s d c b f ? * /
beq+ c r1 , 1 4 2 f
cmpwi c r1 , r10 , 1 9 6 4 / * I s i c b i ? * /
beq+ c r1 , 1 4 2 f
2018-11-29 14:07:24 +00:00
141 : mfspr r10 ,S P R N _ M _ T W
2014-08-29 11:14:38 +02:00
b D A R F i x e d / * N o p e , g o b a c k t o n o r m a l T L B p r o c e s s i n g * /
2009-11-20 00:21:06 +00:00
2016-12-07 08:47:28 +01:00
200 :
/* concat physical page address(r11) and page offset(r10) */
rlwimi r11 , r10 , 0 , 3 2 - P A G E _ S H I F T _ 8 M , 3 1
b 2 0 1 b
2009-11-20 00:21:06 +00:00
144 : mfspr r10 , S P R N _ D S I S R
rlwinm r10 , r10 ,0 ,7 ,5 / * C l e a r s t o r e b i t f o r b u g g y d c b s t i n s n * /
mtspr S P R N _ D S I S R , r10
142 : /* continue, it was a dcbx, dcbi instruction. */
mfctr r10
mtdar r10 / * s a v e c t r r e g i n D A R * /
rlwinm r10 , r11 , 2 4 , 2 4 , 2 8 / * o f f s e t i n t o j u m p t a b l e f o r r e g R B * /
addi r10 , r10 , 1 5 0 f @l /* add start of table */
mtctr r10 / * l o a d c t r w i t h j u m p a d d r e s s * /
xor r10 , r10 , r10 / * s u m s t a r t s a t z e r o * /
bctr / * j u m p i n t o t a b l e * /
150 :
add r10 , r10 , r0 ;b 151f
add r10 , r10 , r1 ;b 151f
add r10 , r10 , r2 ;b 151f
add r10 , r10 , r3 ;b 151f
add r10 , r10 , r4 ;b 151f
add r10 , r10 , r5 ;b 151f
add r10 , r10 , r6 ;b 151f
add r10 , r10 , r7 ;b 151f
add r10 , r10 , r8 ;b 151f
add r10 , r10 , r9 ;b 151f
mtctr r11 ;b 154f /* r10 needs special handling */
mtctr r11 ;b 153f /* r11 needs special handling */
add r10 , r10 , r12 ;b 151f
add r10 , r10 , r13 ;b 151f
add r10 , r10 , r14 ;b 151f
add r10 , r10 , r15 ;b 151f
add r10 , r10 , r16 ;b 151f
add r10 , r10 , r17 ;b 151f
add r10 , r10 , r18 ;b 151f
add r10 , r10 , r19 ;b 151f
add r10 , r10 , r20 ;b 151f
add r10 , r10 , r21 ;b 151f
add r10 , r10 , r22 ;b 151f
add r10 , r10 , r23 ;b 151f
add r10 , r10 , r24 ;b 151f
add r10 , r10 , r25 ;b 151f
add r10 , r10 , r26 ;b 151f
add r10 , r10 , r27 ;b 151f
add r10 , r10 , r28 ;b 151f
add r10 , r10 , r29 ;b 151f
add r10 , r10 , r30 ;b 151f
add r10 , r10 , r31
151 :
2019-12-21 08:32:25 +00:00
rlwinm r11 ,r11 ,1 9 ,2 4 ,2 8 / * o f f s e t i n t o j u m p t a b l e f o r r e g R A * /
cmpwi c r1 , r11 , 0
beq c r1 , 1 5 2 f / * i f r e g R A i s z e r o , d o n ' t a d d i t * /
2009-11-20 00:21:06 +00:00
addi r11 , r11 , 1 5 0 b @l /* add start of table */
mtctr r11 / * l o a d c t r w i t h j u m p a d d r e s s * /
rlwinm r11 ,r11 ,0 ,1 6 ,1 0 / * m a k e s u r e w e d o n ' t e x e c u t e t h i s m o r e t h a n o n c e * /
bctr / * j u m p i n t o t a b l e * /
152 :
mfdar r11
mtctr r11 / * r e s t o r e c t r r e g f r o m D A R * /
2019-12-21 08:32:35 +00:00
mfspr r11 , S P R N _ S P R G _ T H R E A D
stw r10 , D A R ( r11 )
mfspr r10 , S P R N _ D S I S R
stw r10 , D S I S R ( r11 )
2018-11-29 14:07:24 +00:00
mfspr r10 ,S P R N _ M _ T W
2009-11-20 00:21:06 +00:00
b D A R F i x e d / * G o b a c k t o n o r m a l T L B h a n d l i n g * /
/* special handling for r10,r11 since these are modified already */
2014-08-29 11:14:37 +02:00
153 : mfspr r11 , S P R N _ S P R G _ S C R A T C H 1 / * l o a d r11 f r o m S P R N _ S P R G _ S C R A T C H 1 * /
2014-08-29 11:14:39 +02:00
add r10 , r10 , r11 / * a d d i t * /
mfctr r11 / * r e s t o r e r11 * /
b 1 5 1 b
2014-08-29 11:14:37 +02:00
154 : mfspr r11 , S P R N _ S P R G _ S C R A T C H 0 / * l o a d r10 f r o m S P R N _ S P R G _ S C R A T C H 0 * /
2014-08-29 11:14:39 +02:00
add r10 , r10 , r11 / * a d d i t * /
2009-11-20 00:21:06 +00:00
mfctr r11 / * r e s t o r e r11 * /
b 1 5 1 b
2005-09-26 16:04:21 +10:00
/ *
* This i s w h e r e t h e m a i n k e r n e l c o d e s t a r t s .
* /
start_here :
/* ptr to current */
lis r2 ,i n i t _ t a s k @h
ori r2 ,r2 ,i n i t _ t a s k @l
/* ptr to phys current thread */
tophys( r4 ,r2 )
addi r4 ,r4 ,T H R E A D / * i n i t t a s k ' s T H R E A D * /
2009-07-14 20:52:54 +00:00
mtspr S P R N _ S P R G _ T H R E A D ,r4
2005-09-26 16:04:21 +10:00
/* stack */
lis r1 ,i n i t _ t h r e a d _ u n i o n @ha
addi r1 ,r1 ,i n i t _ t h r e a d _ u n i o n @l
2019-08-21 10:20:51 +00:00
lis r0 , S T A C K _ E N D _ M A G I C @h
ori r0 , r0 , S T A C K _ E N D _ M A G I C @l
stw r0 , 0 ( r1 )
2005-09-26 16:04:21 +10:00
li r0 ,0
stwu r0 ,T H R E A D _ S I Z E - S T A C K _ F R A M E _ O V E R H E A D ( r1 )
2018-07-13 13:10:47 +00:00
lis r6 , s w a p p e r _ p g _ d i r @ha
tophys( r6 ,r6 )
2018-11-29 14:07:15 +00:00
mtspr S P R N _ M _ T W B , r6
2018-07-13 13:10:47 +00:00
2005-09-26 16:04:21 +10:00
bl e a r l y _ i n i t / * W e h a v e t o d o t h i s w i t h M M U o n * /
/ *
* Decide w h a t s o r t o f m a c h i n e t h i s i s a n d i n i t i a l i z e t h e M M U .
* /
2019-04-26 16:23:34 +00:00
# ifdef C O N F I G _ K A S A N
bl k a s a n _ e a r l y _ i n i t
# endif
2011-07-25 11:29:33 +00:00
li r3 ,0
mr r4 ,r31
2005-09-26 16:04:21 +10:00
bl m a c h i n e _ i n i t
bl M M U _ i n i t
/ *
* Go b a c k t o r u n n i n g u n m a p p e d s o w e c a n l o a d u p n e w v a l u e s
* and c h a n g e t o u s i n g o u r e x c e p t i o n v e c t o r s .
* On t h e 8 x x , a l l w e h a v e t o d o i s i n v a l i d a t e t h e T L B t o c l e a r
* the o l d 8 M b y t e T L B m a p p i n g s a n d l o a d t h e p a g e t a b l e b a s e r e g i s t e r .
* /
/ * The r i g h t w a y t o d o t h i s w o u l d b e t o t r a c k i t d o w n t h r o u g h
* init' s T H R E A D l i k e t h e c o n t e x t s w i t c h c o d e d o e s , b u t t h i s i s
* easier. . . . . . u n t i l s o m e o n e c h a n g e s i n i t ' s s t a t i c s t r u c t u r e s .
* /
lis r4 ,2 f @h
ori r4 ,r4 ,2 f @l
tophys( r4 ,r4 )
li r3 ,M S R _ K E R N E L & ~ ( M S R _ I R | M S R _ D R )
mtspr S P R N _ S R R 0 ,r4
mtspr S P R N _ S R R 1 ,r3
rfi
/* Load up the kernel context */
2 :
2020-05-19 05:49:14 +00:00
# ifdef C O N F I G _ P I N _ T L B _ I M M R
lis r0 , M D _ T W A M @h
oris r0 , r0 , 0 x1 f00
mtspr S P R N _ M D _ C T R , r0
LOAD_ R E G _ I M M E D I A T E ( r0 , V I R T _ I M M R _ B A S E | M D _ E V A L I D )
tlbie r0
mtspr S P R N _ M D _ E P N , r0
LOAD_ R E G _ I M M E D I A T E ( r0 , M D _ S V A L I D | M D _ P S 5 1 2 K | M D _ G U A R D E D )
mtspr S P R N _ M D _ T W C , r0
mfspr r0 , S P R N _ I M M R
rlwinm r0 , r0 , 0 , 0 x f f f80 0 0 0
ori r0 , r0 , 0 x f0 | _ P A G E _ D I R T Y | _ P A G E _ S P S | _ P A G E _ S H | \
_ PAGE_ N O _ C A C H E | _ P A G E _ P R E S E N T
mtspr S P R N _ M D _ R P N , r0
lis r0 , ( M D _ T W A M | M D _ R S V 4 I ) @h
mtspr S P R N _ M D _ C T R , r0
2020-05-19 05:49:15 +00:00
# endif
# if ! d e f i n e d ( C O N F I G _ P I N _ T L B _ D A T A ) & & ! d e f i n e d ( C O N F I G _ P I N _ T L B _ I M M R )
lis r0 , M D _ T W A M @h
mtspr S P R N _ M D _ C T R , r0
2020-05-19 05:49:14 +00:00
# endif
2005-09-26 16:04:21 +10:00
tlbia / * C l e a r a l l T L B e n t r i e s * /
sync / * w a i t f o r t l b i a / t l b i e t o f i n i s h * /
/ * set u p t h e P T E p o i n t e r s f o r t h e A b a t r o n b d i G D B .
* /
lis r5 , a b a t r o n _ p t e p t r s @h
ori r5 , r5 , a b a t r o n _ p t e p t r s @l
2018-05-24 11:02:06 +00:00
stw r5 , 0 x f0 ( 0 ) / * M u s t m a t c h y o u r A b a t r o n c o n f i g f i l e * /
2005-09-26 16:04:21 +10:00
tophys( r5 ,r5 )
2019-01-09 20:30:07 +00:00
lis r6 , s w a p p e r _ p g _ d i r @h
ori r6 , r6 , s w a p p e r _ p g _ d i r @l
2005-09-26 16:04:21 +10:00
stw r6 , 0 ( r5 )
/* Now turn on the MMU for real! */
li r4 ,M S R _ K E R N E L
lis r3 ,s t a r t _ k e r n e l @h
ori r3 ,r3 ,s t a r t _ k e r n e l @l
mtspr S P R N _ S R R 0 ,r3
mtspr S P R N _ S R R 1 ,r4
rfi / * e n a b l e M M U a n d j u m p t o s t a r t _ k e r n e l * /
/ * Set u p t h e i n i t i a l M M U s t a t e s o w e c a n d o t h e f i r s t l e v e l o f
* kernel i n i t i a l i z a t i o n . T h i s m a p s t h e f i r s t 8 M B y t e s o f m e m o r y 1 : 1
* virtual t o p h y s i c a l . A l s o , s e t t h e c a c h e m o d e s i n c e t h a t i s d e f i n e d
* by T L B e n t r i e s a n d p e r f o r m a n y a d d i t i o n a l m a p p i n g ( l i k e o f t h e I M M R ) .
* If c o n f i g u r e d t o p i n s o m e T L B s , w e p i n t h e f i r s t 8 M b y t e s o f k e r n e l ,
powerpc/8xx: Fix vaddr for IMMR early remap
Memory: 124428K/131072K available (3748K kernel code, 188K rwdata,
648K rodata, 508K init, 290K bss, 6644K reserved)
Kernel virtual memory layout:
* 0xfffdf000..0xfffff000 : fixmap
* 0xfde00000..0xfe000000 : consistent mem
* 0xfddf6000..0xfde00000 : early ioremap
* 0xc9000000..0xfddf6000 : vmalloc & ioremap
SLUB: HWalign=16, Order=0-3, MinObjects=0, CPUs=1, Nodes=1
Today, IMMR is mapped 1:1 at startup
Mapping IMMR 1:1 is just wrong because it may overlap with another
area. On most mpc8xx boards it is OK as IMMR is set to 0xff000000
but for instance on EP88xC board, IMMR is at 0xfa200000 which
overlaps with VM ioremap area
This patch fixes the virtual address for remapping IMMR with the fixmap
regardless of the value of IMMR.
The size of IMMR area is 256kbytes (CPM at offset 0, security engine
at offset 128k) so a 512k page is enough
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-05-17 09:02:43 +02:00
* 2 4 Mbytes o f d a t a , a n d t h e 5 1 2 k I M M R s p a c e . A n y t h i n g n o t c o v e r e d b y
2005-09-26 16:04:21 +10:00
* these m a p p i n g s i s m a p p e d b y p a g e t a b l e s .
* /
initial_mmu :
2016-05-17 09:02:49 +02:00
li r8 , 0
mtspr S P R N _ M I _ C T R , r8 / * r e m o v e P I N N E D I T L B e n t r i e s * /
2020-05-19 05:49:07 +00:00
lis r10 , M D _ T W A M @h
2016-05-17 09:02:49 +02:00
mtspr S P R N _ M D _ C T R , r10 / * r e m o v e P I N N E D D T L B e n t r i e s * /
2005-09-26 16:04:21 +10:00
tlbia / * I n v a l i d a t e a l l T L B e n t r i e s * /
2015-04-22 12:06:45 +02:00
lis r8 , M I _ A P G _ I N I T @h /* Set protection modes */
ori r8 , r8 , M I _ A P G _ I N I T @l
2005-09-26 16:04:21 +10:00
mtspr S P R N _ M I _ A P , r8
2015-04-22 12:06:45 +02:00
lis r8 , M D _ A P G _ I N I T @h
ori r8 , r8 , M D _ A P G _ I N I T @l
2005-09-26 16:04:21 +10:00
mtspr S P R N _ M D _ A P , r8
2020-05-19 05:49:15 +00:00
/* Map the lower RAM (up to 32 Mbytes) into the ITLB and DTLB */
2019-02-13 16:06:21 +00:00
lis r8 , M I _ R S V 4 I @h
ori r8 , r8 , 0 x1 c00
2020-05-19 05:49:15 +00:00
oris r12 , r10 , M D _ R S V 4 I @h
ori r12 , r12 , 0 x1 c00
2019-02-13 16:06:21 +00:00
li r9 , 4 / * u p t o 4 p a g e s o f 8 M * /
mtctr r9
lis r9 , K E R N E L B A S E @h /* Create vaddr for TLB */
2020-10-12 08:54:33 +00:00
li r10 , M I _ P S 8 M E G | _ P M D _ A C C E S S E D | M I _ S V A L I D
2019-02-13 16:06:21 +00:00
li r11 , M I _ B O O T I N I T / * C r e a t e R P N f o r a d d r e s s 0 * /
1 :
mtspr S P R N _ M I _ C T R , r8 / * S e t i n s t r u c t i o n M M U c o n t r o l * /
addi r8 , r8 , 0 x10 0
ori r0 , r9 , M I _ E V A L I D / * M a r k i t v a l i d * /
mtspr S P R N _ M I _ E P N , r0
mtspr S P R N _ M I _ T W C , r10
mtspr S P R N _ M I _ R P N , r11 / * S t o r e T L B e n t r y * /
2020-05-19 05:49:15 +00:00
mtspr S P R N _ M D _ C T R , r12
addi r12 , r12 , 0 x10 0
mtspr S P R N _ M D _ E P N , r0
mtspr S P R N _ M D _ T W C , r10
mtspr S P R N _ M D _ R P N , r11
2019-02-13 16:06:21 +00:00
addis r9 , r9 , 0 x80
addis r11 , r11 , 0 x80
2020-05-19 05:49:15 +00:00
bdnz 1 b
2019-02-13 16:06:21 +00:00
2005-09-26 16:04:21 +10:00
/ * Since t h e c a c h e i s e n a b l e d a c c o r d i n g t o t h e i n f o r m a t i o n w e
* just l o a d e d i n t o t h e T L B , i n v a l i d a t e a n d e n a b l e t h e c a c h e s h e r e .
* We s h o u l d p r o b a b l y c h e c k / s e t o t h e r m o d e s . . . . l a t e r .
* /
lis r8 , I D C _ I N V A L L @h
mtspr S P R N _ I C _ C S T , r8
mtspr S P R N _ D C _ C S T , r8
lis r8 , I D C _ E N A B L E @h
mtspr S P R N _ I C _ C S T , r8
mtspr S P R N _ D C _ C S T , r8
powerpc/8xx: Perf events on PPC 8xx
This patch has been reworked since RFC version. In the RFC, this patch
was preceded by a patch clearing MSR RI for all PPC32 at all time at
exception prologs. Now MSR RI clearing is done only when this 8xx perf
events functionality is compiled in, it is therefore limited to 8xx
and merged inside this patch.
Other main changes have been to take into account detailed review from
Peter Zijlstra. The instructions counter has been reworked to behave
as a free running counter like the three other counters.
The 8xx has no PMU, however some events can be emulated by other means.
This patch implements the following events (as reported by 'perf list'):
cpu-cycles OR cycles [Hardware event]
instructions [Hardware event]
dTLB-load-misses [Hardware cache event]
iTLB-load-misses [Hardware cache event]
'cycles' event is implemented using the timebase clock. Timebase clock
corresponds to CPU clock divided by 16, so number of cycles is
approximatly 16 times the number of TB ticks
On the 8xx, TLB misses are handled by software. It is therefore
easy to count all TLB misses each time the TLB miss exception is
called.
'instructions' is calculated by using instruction watchpoint counter.
This patch sets counter A to count instructions at address greater
than 0, hence we count all instructions executed while MSR RI bit is
set. The counter is set to the maximum which is 0xffff. Every 65535
instructions, debug instruction breakpoint exception fires. The
exception handler increments a counter in memory which then
represent the upper part of the instruction counter. We therefore
end up with a 48 bits counter. In order to avoid unnecessary overhead
while no perf event is active, this counter is started when the first
event referring to this counter is added, and the counter is stopped
when the last event referring to it is deleted. In order to properly
support breakpoint exceptions, MSR RI bit has to be unset in exception
epilogs in order to avoid breakpoint exceptions during critical
sections during changes to SRR0 and SRR1 would be problematic.
All counters are handled as free running counters.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-12-15 13:42:18 +01:00
/* Disable debug mode entry on breakpoints */
powerpc/8xx: Implement hw_breakpoint
This patch implements HW breakpoint on the 8xx. The 8xx has
capability to manage HW breakpoints, which is slightly different
than BOOK3S:
1/ The breakpoint match doesn't trigger a DSI exception but a
dedicated data breakpoint exception.
2/ The breakpoint happens after the instruction has completed,
no need to single step or emulate the instruction,
3/ Matched address is not set in DAR but in BAR,
4/ DABR register doesn't exist, instead we have registers
LCTRL1, LCTRL2 and CMPx registers,
5/ The match on one comparator is not on a double word but
on a single word.
The patch does:
1/ Prepare the dedicated registers in call to __set_dabr(). In order
to emulate the double word handling of BOOK3S, comparator E is set to
DABR address value and comparator F to address + 4. Then breakpoint 1
is set to match comparator E or F,
2/ Skip the singlestepping stage when compiled for CONFIG_PPC_8xx,
3/ Implement the exception. In that exception, the matched address
is taken from SPRN_BAR and manage as if it was from SPRN_DAR.
4/ I/D TLB error exception routines perform a tlbie on bad TLBs. That
tlbie triggers the breakpoint exception when performed on the
breakpoint address. For this reason, the routine returns if the match
is from one of those two tlbie.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-11-29 09:52:15 +01:00
mfspr r8 , S P R N _ D E R
2018-01-12 13:45:23 +01:00
# ifdef C O N F I G _ P E R F _ E V E N T S
powerpc/8xx: Perf events on PPC 8xx
This patch has been reworked since RFC version. In the RFC, this patch
was preceded by a patch clearing MSR RI for all PPC32 at all time at
exception prologs. Now MSR RI clearing is done only when this 8xx perf
events functionality is compiled in, it is therefore limited to 8xx
and merged inside this patch.
Other main changes have been to take into account detailed review from
Peter Zijlstra. The instructions counter has been reworked to behave
as a free running counter like the three other counters.
The 8xx has no PMU, however some events can be emulated by other means.
This patch implements the following events (as reported by 'perf list'):
cpu-cycles OR cycles [Hardware event]
instructions [Hardware event]
dTLB-load-misses [Hardware cache event]
iTLB-load-misses [Hardware cache event]
'cycles' event is implemented using the timebase clock. Timebase clock
corresponds to CPU clock divided by 16, so number of cycles is
approximatly 16 times the number of TB ticks
On the 8xx, TLB misses are handled by software. It is therefore
easy to count all TLB misses each time the TLB miss exception is
called.
'instructions' is calculated by using instruction watchpoint counter.
This patch sets counter A to count instructions at address greater
than 0, hence we count all instructions executed while MSR RI bit is
set. The counter is set to the maximum which is 0xffff. Every 65535
instructions, debug instruction breakpoint exception fires. The
exception handler increments a counter in memory which then
represent the upper part of the instruction counter. We therefore
end up with a 48 bits counter. In order to avoid unnecessary overhead
while no perf event is active, this counter is started when the first
event referring to this counter is added, and the counter is stopped
when the last event referring to it is deleted. In order to properly
support breakpoint exceptions, MSR RI bit has to be unset in exception
epilogs in order to avoid breakpoint exceptions during critical
sections during changes to SRR0 and SRR1 would be problematic.
All counters are handled as free running counters.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-12-15 13:42:18 +01:00
rlwinm r8 , r8 , 0 , ~ 0 x c
# else
powerpc/8xx: Implement hw_breakpoint
This patch implements HW breakpoint on the 8xx. The 8xx has
capability to manage HW breakpoints, which is slightly different
than BOOK3S:
1/ The breakpoint match doesn't trigger a DSI exception but a
dedicated data breakpoint exception.
2/ The breakpoint happens after the instruction has completed,
no need to single step or emulate the instruction,
3/ Matched address is not set in DAR but in BAR,
4/ DABR register doesn't exist, instead we have registers
LCTRL1, LCTRL2 and CMPx registers,
5/ The match on one comparator is not on a double word but
on a single word.
The patch does:
1/ Prepare the dedicated registers in call to __set_dabr(). In order
to emulate the double word handling of BOOK3S, comparator E is set to
DABR address value and comparator F to address + 4. Then breakpoint 1
is set to match comparator E or F,
2/ Skip the singlestepping stage when compiled for CONFIG_PPC_8xx,
3/ Implement the exception. In that exception, the matched address
is taken from SPRN_BAR and manage as if it was from SPRN_DAR.
4/ I/D TLB error exception routines perform a tlbie on bad TLBs. That
tlbie triggers the breakpoint exception when performed on the
breakpoint address. For this reason, the routine returns if the match
is from one of those two tlbie.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-11-29 09:52:15 +01:00
rlwinm r8 , r8 , 0 , ~ 0 x8
powerpc/8xx: Perf events on PPC 8xx
This patch has been reworked since RFC version. In the RFC, this patch
was preceded by a patch clearing MSR RI for all PPC32 at all time at
exception prologs. Now MSR RI clearing is done only when this 8xx perf
events functionality is compiled in, it is therefore limited to 8xx
and merged inside this patch.
Other main changes have been to take into account detailed review from
Peter Zijlstra. The instructions counter has been reworked to behave
as a free running counter like the three other counters.
The 8xx has no PMU, however some events can be emulated by other means.
This patch implements the following events (as reported by 'perf list'):
cpu-cycles OR cycles [Hardware event]
instructions [Hardware event]
dTLB-load-misses [Hardware cache event]
iTLB-load-misses [Hardware cache event]
'cycles' event is implemented using the timebase clock. Timebase clock
corresponds to CPU clock divided by 16, so number of cycles is
approximatly 16 times the number of TB ticks
On the 8xx, TLB misses are handled by software. It is therefore
easy to count all TLB misses each time the TLB miss exception is
called.
'instructions' is calculated by using instruction watchpoint counter.
This patch sets counter A to count instructions at address greater
than 0, hence we count all instructions executed while MSR RI bit is
set. The counter is set to the maximum which is 0xffff. Every 65535
instructions, debug instruction breakpoint exception fires. The
exception handler increments a counter in memory which then
represent the upper part of the instruction counter. We therefore
end up with a 48 bits counter. In order to avoid unnecessary overhead
while no perf event is active, this counter is started when the first
event referring to this counter is added, and the counter is stopped
when the last event referring to it is deleted. In order to properly
support breakpoint exceptions, MSR RI bit has to be unset in exception
epilogs in order to avoid breakpoint exceptions during critical
sections during changes to SRR0 and SRR1 would be problematic.
All counters are handled as free running counters.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-12-15 13:42:18 +01:00
# endif
powerpc/8xx: Implement hw_breakpoint
This patch implements HW breakpoint on the 8xx. The 8xx has
capability to manage HW breakpoints, which is slightly different
than BOOK3S:
1/ The breakpoint match doesn't trigger a DSI exception but a
dedicated data breakpoint exception.
2/ The breakpoint happens after the instruction has completed,
no need to single step or emulate the instruction,
3/ Matched address is not set in DAR but in BAR,
4/ DABR register doesn't exist, instead we have registers
LCTRL1, LCTRL2 and CMPx registers,
5/ The match on one comparator is not on a double word but
on a single word.
The patch does:
1/ Prepare the dedicated registers in call to __set_dabr(). In order
to emulate the double word handling of BOOK3S, comparator E is set to
DABR address value and comparator F to address + 4. Then breakpoint 1
is set to match comparator E or F,
2/ Skip the singlestepping stage when compiled for CONFIG_PPC_8xx,
3/ Implement the exception. In that exception, the matched address
is taken from SPRN_BAR and manage as if it was from SPRN_DAR.
4/ I/D TLB error exception routines perform a tlbie on bad TLBs. That
tlbie triggers the breakpoint exception when performed on the
breakpoint address. For this reason, the routine returns if the match
is from one of those two tlbie.
Signed-off-by: Christophe Leroy <christophe.leroy@c-s.fr>
Signed-off-by: Scott Wood <oss@buserror.net>
2016-11-29 09:52:15 +01:00
mtspr S P R N _ D E R , r8
2005-09-26 16:04:21 +10:00
blr
powerpc/8xx: Add function to set pinned TLBs
Pinned TLBs cannot be modified when the MMU is enabled.
Create a function to rewrite the pinned TLB entries with MMU off.
To set pinned TLB, we have to turn off MMU, disable pinning,
do a TLB flush (Either with tlbie and tlbia) then reprogam
the TLB entries, enable pinning and turn on MMU.
If using tlbie, it cleared entries in both instruction and data
TLB regardless whether pinning is disabled or not.
If using tlbia, it clears all entries of the TLB which has
disabled pinning.
To make it easy, just clear all entries in both TLBs, and
reprogram them.
The function takes two arguments, the top of the memory to
consider and whether data is RO under _sinittext.
When DEBUG_PAGEALLOC is set, the top is the end of kernel rodata.
Otherwise, that's the top of physical RAM.
Everything below _sinittext is set RX, over _sinittext that's RW.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/c17806014bb1c06513ad1e1d510faea31984b177.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:13 +00:00
_ GLOBAL( m m u _ p i n _ t l b )
lis r9 , ( 1 f - P A G E _ O F F S E T ) @h
ori r9 , r9 , ( 1 f - P A G E _ O F F S E T ) @l
mfmsr r10
mflr r11
li r12 , M S R _ K E R N E L & ~ ( M S R _ I R | M S R _ D R | M S R _ R I )
rlwinm r0 , r10 , 0 , ~ M S R _ R I
rlwinm r0 , r0 , 0 , ~ M S R _ E E
mtmsr r0
isync
.align 4
mtspr S P R N _ S R R 0 , r9
mtspr S P R N _ S R R 1 , r12
rfi
1 :
li r5 , 0
lis r6 , M D _ T W A M @h
mtspr S P R N _ M I _ C T R , r5
mtspr S P R N _ M D _ C T R , r6
tlbia
LOAD_ R E G _ I M M E D I A T E ( r5 , 2 8 < < 8 )
LOAD_ R E G _ I M M E D I A T E ( r6 , P A G E _ O F F S E T )
2020-10-12 08:54:33 +00:00
LOAD_ R E G _ I M M E D I A T E ( r7 , M I _ S V A L I D | M I _ P S 8 M E G | _ P M D _ A C C E S S E D )
powerpc/8xx: Add function to set pinned TLBs
Pinned TLBs cannot be modified when the MMU is enabled.
Create a function to rewrite the pinned TLB entries with MMU off.
To set pinned TLB, we have to turn off MMU, disable pinning,
do a TLB flush (Either with tlbie and tlbia) then reprogam
the TLB entries, enable pinning and turn on MMU.
If using tlbie, it cleared entries in both instruction and data
TLB regardless whether pinning is disabled or not.
If using tlbia, it clears all entries of the TLB which has
disabled pinning.
To make it easy, just clear all entries in both TLBs, and
reprogram them.
The function takes two arguments, the top of the memory to
consider and whether data is RO under _sinittext.
When DEBUG_PAGEALLOC is set, the top is the end of kernel rodata.
Otherwise, that's the top of physical RAM.
Everything below _sinittext is set RX, over _sinittext that's RW.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/c17806014bb1c06513ad1e1d510faea31984b177.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:13 +00:00
LOAD_ R E G _ I M M E D I A T E ( r8 , 0 x f0 | _ P A G E _ R O | _ P A G E _ S P S | _ P A G E _ S H | _ P A G E _ P R E S E N T )
LOAD_ R E G _ A D D R ( r9 , _ s i n i t t e x t )
li r0 , 4
mtctr r0
2 : ori r0 , r6 , M I _ E V A L I D
mtspr S P R N _ M I _ C T R , r5
mtspr S P R N _ M I _ E P N , r0
mtspr S P R N _ M I _ T W C , r7
mtspr S P R N _ M I _ R P N , r8
addi r5 , r5 , 0 x10 0
addis r6 , r6 , S Z _ 8 M @h
addis r8 , r8 , S Z _ 8 M @h
cmplw r6 , r9
bdnzt l t , 2 b
lis r0 , M I _ R S V 4 I @h
mtspr S P R N _ M I _ C T R , r0
2020-11-24 15:24:55 +00:00
powerpc/8xx: Add function to set pinned TLBs
Pinned TLBs cannot be modified when the MMU is enabled.
Create a function to rewrite the pinned TLB entries with MMU off.
To set pinned TLB, we have to turn off MMU, disable pinning,
do a TLB flush (Either with tlbie and tlbia) then reprogam
the TLB entries, enable pinning and turn on MMU.
If using tlbie, it cleared entries in both instruction and data
TLB regardless whether pinning is disabled or not.
If using tlbia, it clears all entries of the TLB which has
disabled pinning.
To make it easy, just clear all entries in both TLBs, and
reprogram them.
The function takes two arguments, the top of the memory to
consider and whether data is RO under _sinittext.
When DEBUG_PAGEALLOC is set, the top is the end of kernel rodata.
Otherwise, that's the top of physical RAM.
Everything below _sinittext is set RX, over _sinittext that's RW.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/c17806014bb1c06513ad1e1d510faea31984b177.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:13 +00:00
LOAD_ R E G _ I M M E D I A T E ( r5 , 2 8 < < 8 | M D _ T W A M )
# ifdef C O N F I G _ P I N _ T L B _ D A T A
LOAD_ R E G _ I M M E D I A T E ( r6 , P A G E _ O F F S E T )
2020-10-12 08:54:33 +00:00
LOAD_ R E G _ I M M E D I A T E ( r7 , M I _ S V A L I D | M I _ P S 8 M E G | _ P M D _ A C C E S S E D )
powerpc/8xx: Add function to set pinned TLBs
Pinned TLBs cannot be modified when the MMU is enabled.
Create a function to rewrite the pinned TLB entries with MMU off.
To set pinned TLB, we have to turn off MMU, disable pinning,
do a TLB flush (Either with tlbie and tlbia) then reprogam
the TLB entries, enable pinning and turn on MMU.
If using tlbie, it cleared entries in both instruction and data
TLB regardless whether pinning is disabled or not.
If using tlbia, it clears all entries of the TLB which has
disabled pinning.
To make it easy, just clear all entries in both TLBs, and
reprogram them.
The function takes two arguments, the top of the memory to
consider and whether data is RO under _sinittext.
When DEBUG_PAGEALLOC is set, the top is the end of kernel rodata.
Otherwise, that's the top of physical RAM.
Everything below _sinittext is set RX, over _sinittext that's RW.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/c17806014bb1c06513ad1e1d510faea31984b177.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:13 +00:00
# ifdef C O N F I G _ P I N _ T L B _ I M M R
li r0 , 3
# else
li r0 , 4
# endif
mtctr r0
cmpwi r4 , 0
beq 4 f
LOAD_ R E G _ I M M E D I A T E ( r8 , 0 x f0 | _ P A G E _ R O | _ P A G E _ S P S | _ P A G E _ S H | _ P A G E _ P R E S E N T )
LOAD_ R E G _ A D D R ( r9 , _ s i n i t t e x t )
2 : ori r0 , r6 , M D _ E V A L I D
mtspr S P R N _ M D _ C T R , r5
mtspr S P R N _ M D _ E P N , r0
mtspr S P R N _ M D _ T W C , r7
mtspr S P R N _ M D _ R P N , r8
addi r5 , r5 , 0 x10 0
addis r6 , r6 , S Z _ 8 M @h
addis r8 , r8 , S Z _ 8 M @h
cmplw r6 , r9
bdnzt l t , 2 b
4 : LOAD_ R E G _ I M M E D I A T E ( r8 , 0 x f0 | _ P A G E _ S P S | _ P A G E _ S H | _ P A G E _ P R E S E N T )
2 : ori r0 , r6 , M D _ E V A L I D
mtspr S P R N _ M D _ C T R , r5
mtspr S P R N _ M D _ E P N , r0
mtspr S P R N _ M D _ T W C , r7
mtspr S P R N _ M D _ R P N , r8
addi r5 , r5 , 0 x10 0
addis r6 , r6 , S Z _ 8 M @h
addis r8 , r8 , S Z _ 8 M @h
cmplw r6 , r3
bdnzt l t , 2 b
# endif
# ifdef C O N F I G _ P I N _ T L B _ I M M R
LOAD_ R E G _ I M M E D I A T E ( r0 , V I R T _ I M M R _ B A S E | M D _ E V A L I D )
2020-10-12 08:54:33 +00:00
LOAD_ R E G _ I M M E D I A T E ( r7 , M D _ S V A L I D | M D _ P S 5 1 2 K | M D _ G U A R D E D | _ P M D _ A C C E S S E D )
powerpc/8xx: Add function to set pinned TLBs
Pinned TLBs cannot be modified when the MMU is enabled.
Create a function to rewrite the pinned TLB entries with MMU off.
To set pinned TLB, we have to turn off MMU, disable pinning,
do a TLB flush (Either with tlbie and tlbia) then reprogam
the TLB entries, enable pinning and turn on MMU.
If using tlbie, it cleared entries in both instruction and data
TLB regardless whether pinning is disabled or not.
If using tlbia, it clears all entries of the TLB which has
disabled pinning.
To make it easy, just clear all entries in both TLBs, and
reprogram them.
The function takes two arguments, the top of the memory to
consider and whether data is RO under _sinittext.
When DEBUG_PAGEALLOC is set, the top is the end of kernel rodata.
Otherwise, that's the top of physical RAM.
Everything below _sinittext is set RX, over _sinittext that's RW.
Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
Link: https://lore.kernel.org/r/c17806014bb1c06513ad1e1d510faea31984b177.1589866984.git.christophe.leroy@csgroup.eu
2020-05-19 05:49:13 +00:00
mfspr r8 , S P R N _ I M M R
rlwinm r8 , r8 , 0 , 0 x f f f80 0 0 0
ori r8 , r8 , 0 x f0 | _ P A G E _ D I R T Y | _ P A G E _ S P S | _ P A G E _ S H | \
_ PAGE_ N O _ C A C H E | _ P A G E _ P R E S E N T
mtspr S P R N _ M D _ C T R , r5
mtspr S P R N _ M D _ E P N , r0
mtspr S P R N _ M D _ T W C , r7
mtspr S P R N _ M D _ R P N , r8
# endif
# if d e f i n e d ( C O N F I G _ P I N _ T L B _ I M M R ) | | d e f i n e d ( C O N F I G _ P I N _ T L B _ D A T A )
lis r0 , ( M D _ R S V 4 I | M D _ T W A M ) @h
mtspr S P R N _ M I _ C T R , r0
# endif
mtspr S P R N _ S R R 1 , r10
mtspr S P R N _ S R R 0 , r11
rfi
2005-09-26 16:04:21 +10:00
/ *
* We p u t a f e w t h i n g s h e r e t h a t h a v e t o b e p a g e - a l i g n e d .
* This s t u f f g o e s a t t h e b e g i n n i n g o f t h e d a t a s e g m e n t ,
* which i s p a g e - a l i g n e d .
* /
.data
.globl sdata
sdata :
.globl empty_zero_page
2014-09-19 10:36:09 +02:00
.align PAGE_SHIFT
2005-09-26 16:04:21 +10:00
empty_zero_page :
2014-09-19 10:36:09 +02:00
.space PAGE_SIZE
2016-01-13 23:33:46 -05:00
EXPORT_ S Y M B O L ( e m p t y _ z e r o _ p a g e )
2005-09-26 16:04:21 +10:00
.globl swapper_pg_dir
swapper_pg_dir :
2014-09-19 10:36:09 +02:00
.space PGD_TABLE_SIZE
2005-09-26 16:04:21 +10:00
2021-01-20 19:50:21 +05:30
/ * Room f o r t w o P T E t a b l e p o i n t e r s , u s u a l l y t h e k e r n e l a n d c u r r e n t u s e r
2005-09-26 16:04:21 +10:00
* pointer t o t h e i r r e s p e c t i v e r o o t p a g e t a b l e ( p g d i r ) .
* /
2019-02-21 10:37:53 +00:00
.globl abatron_pteptrs
2005-09-26 16:04:21 +10:00
abatron_pteptrs :
.space 8