https://gcc.gnu.org/g:bf784936bc8be013db8b3e35002e76838f830f40
commit r13-8413-gbf784936bc8be013db8b3e35002e76838f830f40 Author: Lulu Cheng <chengl...@loongson.cn> Date: Tue Mar 5 14:43:04 2024 +0800 LoongArch: Fixed an issue with the implementation of the template atomic_compare_and_swapsi. If the hardware does not support LAMCAS, atomic_compare_and_swapsi needs to be implemented through "ll.w+sc.w". In the implementation of the instruction sequence, it is necessary to determine whether the two registers are equal. Since LoongArch's comparison instructions do not distinguish between 32-bit and 64-bit, the two operand registers that need to be compared are symbolically extended, and one of the operand registers is obtained from memory through the "ll.w" instruction, which can ensure that the symbolic expansion is carried out. However, the value of the other operand register is not guaranteed to be the value of the sign extension. gcc/ChangeLog: * config/loongarch/sync.md (atomic_cas_value_strong<mode>): In loongarch64, a sign extension operation is added when operands[2] is a register operand and the mode is SImode. gcc/testsuite/ChangeLog: * g++.target/loongarch/atomic-cas-int.C: New test. (cherry picked from commit 3a3fbec0a4d3f36de58df9ef0b3992a3ffb359c2) Diff: --- gcc/config/loongarch/sync.md | 46 ++++++++++++++++------ .../g++.target/loongarch/atomic-cas-int.C | 32 +++++++++++++++ 2 files changed, 67 insertions(+), 11 deletions(-) diff --git a/gcc/config/loongarch/sync.md b/gcc/config/loongarch/sync.md index db3a21690b8..89956e07c79 100644 --- a/gcc/config/loongarch/sync.md +++ b/gcc/config/loongarch/sync.md @@ -129,18 +129,42 @@ (clobber (match_scratch:GPR 6 "=&r"))] "" { - return "1:\\n\\t" - "ll.<amo>\\t%0,%1\\n\\t" - "bne\\t%0,%z2,2f\\n\\t" - "or%i3\\t%6,$zero,%3\\n\\t" - "sc.<amo>\\t%6,%1\\n\\t" - "beqz\\t%6,1b\\n\\t" - "b\\t3f\\n\\t" - "2:\\n\\t" - "%G5\\n\\t" - "3:\\n\\t"; + output_asm_insn ("1:", operands); + output_asm_insn ("ll.<amo>\t%0,%1", operands); + + /* Like the test case atomic-cas-int.C, in loongarch64, O1 and higher, the + return value of the val_without_const_folding will not be truncated and + will be passed directly to the function compare_exchange_strong. + However, the instruction 'bne' does not distinguish between 32-bit and + 64-bit operations. so if the upper 32 bits of the register are not + extended by the 32nd bit symbol, then the comparison may not be valid + here. This will affect the result of the operation. */ + + if (TARGET_64BIT && REG_P (operands[2]) + && GET_MODE (operands[2]) == SImode) + { + output_asm_insn ("addi.w\t%6,%2,0", operands); + output_asm_insn ("bne\t%0,%6,2f", operands); + } + else + output_asm_insn ("bne\t%0,%z2,2f", operands); + + output_asm_insn ("or%i3\t%6,$zero,%3", operands); + output_asm_insn ("sc.<amo>\t%6,%1", operands); + output_asm_insn ("beqz\t%6,1b", operands); + output_asm_insn ("b\t3f", operands); + output_asm_insn ("2:", operands); + output_asm_insn ("%G5", operands); + output_asm_insn ("3:", operands); + + return ""; } - [(set (attr "length") (const_int 28))]) + [(set (attr "length") + (if_then_else + (and (match_test "GET_MODE (operands[2]) == SImode") + (match_test "REG_P (operands[2])")) + (const_int 32) + (const_int 28)))]) (define_expand "atomic_compare_and_swap<mode>" [(match_operand:SI 0 "register_operand" "") ;; bool output diff --git a/gcc/testsuite/g++.target/loongarch/atomic-cas-int.C b/gcc/testsuite/g++.target/loongarch/atomic-cas-int.C new file mode 100644 index 00000000000..830ce48267a --- /dev/null +++ b/gcc/testsuite/g++.target/loongarch/atomic-cas-int.C @@ -0,0 +1,32 @@ +/* { dg-do run } */ +/* { dg-options "-O2" } */ + +#include <atomic> +#include <cstdio> + +__attribute__ ((noinline)) long +val_without_const_folding (long val) +{ + return val; +} + +int +main () +{ + int oldval = 0xaa; + int newval = 0xbb; + std::atomic<int> amo; + + amo.store (oldval); + + long longval = val_without_const_folding (0xff80000000000000 + oldval); + oldval = static_cast<int> (longval); + + amo.compare_exchange_strong (oldval, newval); + + if (newval != amo.load (std::memory_order_relaxed)) + __builtin_abort (); + + return 0; +} +