Commit 4c9a9380 authored by Alexey Dobriyan, committed by Ingo Molnar

x86/asm/64: Clean up memset16(), memset32(), memset64() assembly constraints in <asm/string_64.h>

- Use the "+" constraint modifier,
  simplify the input and output lists,
  delete dummy variables with meaningless names.

  "&" only makes sense in complex assembly, where it creates constraints
  on intermediate registers. But single-instruction assembly doesn't have
  an inner body, so to speak.

- Write "rep stos*" on one line:
  The rep prefix is an integral part of the x86 instruction.  I'm not sure
  why people separate "rep" from the instruction with a newline.

  Uros Bizjak adds context: "some archaic assemblers rejected 'rep
  insn' on one line. I have checked that the minimum required
  binutils-2.25 assembles this without problems."

- Use __auto_type for maximum copy pasta experience,

- Reformat a bit to make everything look nicer.

Note that "memory" clobber is too much if "n" is known at compile time.
However,

	"=m" (*(T(*)[n])s)

doesn't work because it triggers -Wvla even if "n" is a compile-time constant:

	if (BCP(n)) {
		rep stos
		: "=m" (*(T(*)[n])s)
	} else {
		rep stosw
		: "memory"
	}

The above doesn't work.
Signed-off-by: Alexey Dobriyan <adobriyan@gmail.com>
Signed-off-by: Ingo Molnar <mingo@kernel.org>
Reviewed-by: Uros Bizjak <ubizjak@gmail.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Andy Lutomirski <luto@kernel.org>
Cc: "H. Peter Anvin" <hpa@zytor.com>
Link: https://lore.kernel.org/r/20240314165715.31831-1-adobriyan@gmail.com
parent 64833714
...@@ -30,37 +30,40 @@ void *__memset(void *s, int c, size_t n); ...@@ -30,37 +30,40 @@ void *__memset(void *s, int c, size_t n);
#define __HAVE_ARCH_MEMSET16 #define __HAVE_ARCH_MEMSET16
static inline void *memset16(uint16_t *s, uint16_t v, size_t n) static inline void *memset16(uint16_t *s, uint16_t v, size_t n)
{ {
long d0, d1; const __auto_type s0 = s;
asm volatile("rep\n\t" asm volatile (
"stosw" "rep stosw"
: "=&c" (d0), "=&D" (d1) : "+D" (s), "+c" (n)
: "a" (v), "1" (s), "0" (n) : "a" (v)
: "memory"); : "memory"
return s; );
return s0;
} }
#define __HAVE_ARCH_MEMSET32 #define __HAVE_ARCH_MEMSET32
static inline void *memset32(uint32_t *s, uint32_t v, size_t n) static inline void *memset32(uint32_t *s, uint32_t v, size_t n)
{ {
long d0, d1; const __auto_type s0 = s;
asm volatile("rep\n\t" asm volatile (
"stosl" "rep stosl"
: "=&c" (d0), "=&D" (d1) : "+D" (s), "+c" (n)
: "a" (v), "1" (s), "0" (n) : "a" (v)
: "memory"); : "memory"
return s; );
return s0;
} }
#define __HAVE_ARCH_MEMSET64 #define __HAVE_ARCH_MEMSET64
static inline void *memset64(uint64_t *s, uint64_t v, size_t n) static inline void *memset64(uint64_t *s, uint64_t v, size_t n)
{ {
long d0, d1; const __auto_type s0 = s;
asm volatile("rep\n\t" asm volatile (
"stosq" "rep stosq"
: "=&c" (d0), "=&D" (d1) : "+D" (s), "+c" (n)
: "a" (v), "1" (s), "0" (n) : "a" (v)
: "memory"); : "memory"
return s; );
return s0;
} }
#endif #endif
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment