about | summary | refs | log | tree | commit | diff | stats | homepage
diff options
context:
space:
mode:
author: Eric Biggers <ebiggers@google.com> 2025-02-10 13:07:41 -0800
committer: Eric Biggers <ebiggers@google.com> 2025-02-12 12:08:56 -0800
commit: cf1ea3a7c1f63cba7d1dd313ee3accde0c0c8988 (patch)
tree: b2e673e8e0f67ece26cf5d2078dfaff3869f32ed
parent: x86/crc64: implement crc64_be and crc64_nvme using new template (diff)
download: wireguard-linux-cf1ea3a7c1f63cba7d1dd313ee3accde0c0c8988.tar.xz
download: wireguard-linux-cf1ea3a7c1f63cba7d1dd313ee3accde0c0c8988.zip
x86/crc32: improve crc32c_arch() code generation with clang
crc32c_arch() is affected by https://github.com/llvm/llvm-project/issues/20571 where clang unnecessarily spills the inputs to "rm"-constrained operands to the stack. Replace "rm" with ASM_INPUT_RM which partially works around this by expanding to "r" when the compiler is clang. This results in better code generation with clang, though still not optimal.

Link: https://lore.kernel.org/r/20250210210741.471725-1-ebiggers@kernel.org
Signed-off-by: Eric Biggers <ebiggers@google.com>
-rw-r--r-- arch/x86/lib/crc32-glue.c | 4
1 files changed, 2 insertions, 2 deletions
diff --git a/arch/x86/lib/crc32-glue.c b/arch/x86/lib/crc32-glue.c
index 9c3f9c1b7bb9..4b4721176799 100644
--- a/arch/x86/lib/crc32-glue.c
+++ b/arch/x86/lib/crc32-glue.c
@@ -55,10 +55,10 @@ u32 crc32c_arch(u32 crc, const u8 *p, size_t len)
for (num_longs = len / sizeof(unsigned long);
num_longs != 0; num_longs--, p += sizeof(unsigned long))
- asm(CRC32_INST : "+r" (crc) : "rm" (*(unsigned long *)p));
+ asm(CRC32_INST : "+r" (crc) : ASM_INPUT_RM (*(unsigned long *)p));
for (len %= sizeof(unsigned long); len; len--, p++)
- asm("crc32b %1, %0" : "+r" (crc) : "rm" (*p));
+ asm("crc32b %1, %0" : "+r" (crc) : ASM_INPUT_RM (*p));
return crc;
}