Similar to commit a6c30873ee4a ("ARM: 8989/1: use .fpu assembler
directives instead of assembler arguments").
GCC and GNU binutils support setting the "sub arch" via -march=,
-Wa,-march, target function attribute, and .arch assembler directive.
Clang was missing support for -Wa,-march=, but this was implemented in
clang-13.
The behavior of both GCC and Clang is to
prefer -Wa,-march= over -march= for assembler and assembler-with-cpp
sources, but Clang will warn about the -march= being unused.
clang: warning: argument unused during compilation: '-march=armv6k'
[-Wunused-command-line-argument]
Since most assembler is unconditionally assembled with one sub arch
(modulo arch/arm/lib/delay-loop.S which conditionally is assembled as armv4
based on CONFIG_ARCH_RPC, and arch/arm/mach-at91/pm-suspend.S which is
conditionally assembled as armv7-a based on CONFIG_CPU_V7), prefer the
.arch assembler directive.
Add a few more instances found in compile testing by Arnd and
Nathan.
Link: https://github.com/llvm/llvm-project/commit/1d51c699b9
Link: https://bugs.llvm.org/show_bug.cgi?id=48894
Link: https://github.com/ClangBuiltLinux/linux/issues/1195
Link: https://github.com/ClangBuiltLinux/linux/issues/1315
Suggested-by: Arnd Bergmann <arnd@arndb.de>
Suggested-by: Nathan Chancellor <nathan@kernel.org>
Signed-off-by: Arnd Bergmann <arnd@arndb.de>
Tested-by: Nathan Chancellor <nathan@kernel.org>
Signed-off-by: Nick Desaulniers <ndesaulniers@google.com>
Signed-off-by: Russell King (Oracle) <rmk+kernel@armlinux.org.uk>
64 lines
1.1 KiB
ArmAsm
64 lines
1.1 KiB
ArmAsm
/* SPDX-License-Identifier: GPL-2.0-only */
/*
 *  linux/arch/arm/lib/delay.S
 *
 *  Copyright (C) 1995, 1996 Russell King
 */
#include <linux/linkage.h>
#include <asm/assembler.h>
#include <asm/delay.h>

/* Only CONFIG_ARCH_RPC builds select the armv4 sub-architecture here. */
#ifdef CONFIG_ARCH_RPC
	.arch	armv4
#endif

		.text

/* Constant words loaded PC-relative by the routines below. */
.LC0:		.word	loops_per_jiffy		@ address of loops_per_jiffy
.LC1:		.word	UDELAY_MULT		@ multiplier for the microsecond count

/*
 * loops = r0 * HZ * loops_per_jiffy / 1000000
 *
 * r0  <= 2000
 * HZ  <= 1000
 */

/*
 * __loop_udelay - busy-wait for a number of microseconds
 *
 *   In:    r0 = delay in microseconds
 *   Clobb: r0, r1, r2, flags
 *
 * Multiplies r0 by UDELAY_MULT and falls through into
 * __loop_const_udelay.
 */
ENTRY(__loop_udelay)
		ldr	r2, .LC1
		mul	r0, r2, r0		@ r0 = delay_us * UDELAY_MULT
/*
 * __loop_const_udelay - busy-wait for an already scaled delay value
 *
 *   In:    r0 = scaled delay (range noted on the entry line)
 *   Clobb: r0, r1, r2, flags
 *
 * Forms the 64-bit product r0 * loops_per_jiffy (r0 = high word,
 * r1 = low word).  The adds leaves carry set exactly when the low word
 * is non-zero, and the adcs then yields 2 * high + carry as the loop
 * count.  A zero count returns immediately; anything else falls through
 * into __loop_delay.
 */
ENTRY(__loop_const_udelay)			@ 0 <= r0 <= 0xfffffaf0
		ldr	r2, .LC0		@ r2 = &loops_per_jiffy
		ldr	r2, [r2]		@ r2 = loops_per_jiffy
		umull	r1, r0, r2, r0		@ r0-r1 = r0 * loops_per_jiffy
		adds	r1, r1, #0xffffffff	@ rounding up ...
		adcs	r0, r0, r0		@ and right shift by 31
		reteq	lr			@ zero loops requested: return now

		.align 3			@ start the loop on an 8-byte boundary

@ Delay routine
/*
 * __loop_delay - spin for r0 loop iterations
 *
 *   In:    r0 = iteration count
 *   Clobb: r0, flags
 *
 * Decrements r0 and branches back while the result is still above
 * zero.  With r0 = 0 on entry the subtraction borrows, bhi is not taken
 * and the routine returns after a single pass.
 */
ENTRY(__loop_delay)
		subs	r0, r0, #1
/* Compiled out: unrolled decrement / conditional-return sequence. */
#if 0
		retls	lr
		subs	r0, r0, #1
		retls	lr
		subs	r0, r0, #1
		retls	lr
		subs	r0, r0, #1
		retls	lr
		subs	r0, r0, #1
		retls	lr
		subs	r0, r0, #1
		retls	lr
		subs	r0, r0, #1
		retls	lr
		subs	r0, r0, #1
#endif
		bhi	__loop_delay		@ loop while no borrow and r0 != 0
		ret	lr
/*
 * The three entry points fall through into one another, so their
 * ENDPROC markers all follow the final return.
 */
ENDPROC(__loop_udelay)
ENDPROC(__loop_const_udelay)
ENDPROC(__loop_delay)