arm64: support __int128 on gcc 5+
Versions of gcc prior to gcc 5 emitted a __multi3 function call when
dealing with TI types, resulting in failures when trying to link to
libgcc, and more generally, bad performance. However, since gcc 5,
the compiler supports actually emitting fast instructions, which means
we can at long last enable this option and receive the speedups.
The gcc commit that added proper Aarch64 support is:
https://gcc.gnu.org/git/?p=gcc.git;a=commitdiff;h=d1ae7bb994f49316f6f63e6173f2931e837a351d
This commit appears to be part of the gcc 5 release.
There are still a few helper routines, __ashlti3 and __ashrti3, which
the compiler expects libgcc to provide, which is fine. Rather than linking
to libgcc, we simply provide them ourselves, since they're not that
complicated.
Signed-off-by: Jason A. Donenfeld <Jason@zx2c4.com>
Signed-off-by: Will Deacon <will.deacon@arm.com>
2017-11-03 17:18:58 +03:00
/*
 * Copyright (C) 2017 Jason A. Donenfeld <Jason@zx2c4.com>. All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */
# include < l i n u x / l i n k a g e . h >
/*
 * __ashlti3 - left shift of a 128-bit quantity.
 *
 * In:   x1:x0 = value (x1 holds the upper 64 bits, x0 the lower 64 bits)
 *       x2    = shift count
 * Out:  x1:x0 = value << count
 *
 * When the count is non-zero, x2, x3 and the condition flags are used as
 * scratch.  A zero count returns immediately with every register untouched.
 */
ENTRY(__ashlti3)
	cbz	x2, .Lashlti3_done		// nothing to shift
	mov	x3, #64
	sub	x3, x3, x2			// x3 = 64 - count
	cmp	x3, #0
	b.le	.Lashlti3_cross			// 64 - count <= 0: result lives only in the upper half

	/* 64 - count is positive: both halves contribute to the result. */
	lsr	x3, x0, x3			// bits of the lower half that move into the upper half
	lsl	x1, x1, x2
	orr	x1, x1, x3			// upper = (upper << count) | carried bits
	lsl	x2, x0, x2
	mov	x0, x2				// lower = lower << count
.Lashlti3_done:
	ret

.Lashlti3_cross:
	neg	w1, w3				// w1 = -(64 - count) = count - 64
	lsl	x1, x0, x1			// upper = lower << (count - 64)
	mov	x2, #0
	mov	x0, x2				// lower half is all zeroes
	ret
ENDPROC(__ashlti3)
/*
 * __ashrti3 - arithmetic (sign-propagating) right shift of a 128-bit quantity.
 *
 * In:   x1:x0 = value (x1 holds the upper 64 bits, x0 the lower 64 bits)
 *       x2    = shift count
 * Out:  x1:x0 = value >> count, with copies of bit 63 of the original x1
 *               shifted in from the top
 *
 * When the count is non-zero, x2, x3 and the condition flags are used as
 * scratch.  A zero count returns immediately with every register untouched.
 */
ENTRY(__ashrti3)
	cbz	x2, .Lashrti3_done		// nothing to shift
	mov	x3, #64
	sub	x3, x3, x2			// x3 = 64 - count
	cmp	x3, #0
	b.le	.Lashrti3_cross			// 64 - count <= 0: result comes only from the upper half

	/* 64 - count is positive: both halves contribute to the result. */
	lsl	x3, x1, x3			// bits of the upper half that move into the lower half
	lsr	x0, x0, x2
	orr	x0, x0, x3			// lower = (lower >> count) | carried bits
	asr	x2, x1, x2
	mov	x1, x2				// upper = upper >> count (sign-filling)
.Lashrti3_done:
	ret

.Lashrti3_cross:
	neg	w0, w3				// w0 = -(64 - count) = count - 64
	asr	x0, x1, x0			// lower = upper >> (count - 64), sign-filling
	asr	x2, x1, #63			// every bit becomes a copy of the sign bit
	mov	x1, x2				// upper half is pure sign extension
	ret
ENDPROC(__ashrti3)
2017-11-07 04:49:54 +03:00
/*
 * __lshrti3 - logical (zero-filling) right shift of a 128-bit quantity.
 *
 * In:   x1:x0 = value (x1 holds the upper 64 bits, x0 the lower 64 bits)
 *       x2    = shift count
 * Out:  x1:x0 = value >> count, with zeroes shifted in from the top
 *
 * When the count is non-zero, x2, x3 and the condition flags are used as
 * scratch.  A zero count returns immediately with every register untouched.
 */
ENTRY(__lshrti3)
	cbz	x2, .Llshrti3_done		// nothing to shift
	mov	x3, #64
	sub	x3, x3, x2			// x3 = 64 - count
	cmp	x3, #0
	b.le	.Llshrti3_cross			// 64 - count <= 0: result comes only from the upper half

	/* 64 - count is positive: both halves contribute to the result. */
	lsl	x3, x1, x3			// bits of the upper half that move into the lower half
	lsr	x0, x0, x2
	orr	x0, x0, x3			// lower = (lower >> count) | carried bits
	lsr	x2, x1, x2
	mov	x1, x2				// upper = upper >> count (zero-filling)
.Llshrti3_done:
	ret

.Llshrti3_cross:
	neg	w0, w3				// w0 = -(64 - count) = count - 64
	lsr	x0, x1, x0			// lower = upper >> (count - 64)
	mov	x2, #0
	mov	x1, x2				// upper half is all zeroes
	ret
ENDPROC(__lshrti3)