Add combine splitter to transform vpternlogd/vpcmpeqd/vpxor/vblendvps to vblendvps for ~op0
gcc/ChangeLog: PR target/100738 * config/i386/sse.md (*avx_cmp<mode>3_lt, *avx_cmp<mode>3_ltint): Remove MEM_P restriction and add force_reg for operands[2]. (*avx_cmp<mode>3_ltint_not): Add new define_insn_and_split. gcc/testsuite/ChangeLog: PR target/100738 * g++.target/i386/avx512vl-pr100738-1.C: New test.
This commit is contained in:
parent
79a89108dd
commit
456b53654a
2 changed files with 48 additions and 4 deletions
|
@ -3525,8 +3525,7 @@
|
|||
UNSPEC_PCMP)))]
|
||||
"TARGET_AVX512VL && ix86_pre_reload_split ()
|
||||
/* LT or GE 0 */
|
||||
&& ((INTVAL (operands[5]) == 1 && !MEM_P (operands[2]))
|
||||
|| (INTVAL (operands[5]) == 5 && !MEM_P (operands[1])))"
|
||||
&& ((INTVAL (operands[5]) == 1) || (INTVAL (operands[5]) == 5))"
|
||||
"#"
|
||||
"&& 1"
|
||||
[(set (match_dup 0)
|
||||
|
@ -3540,6 +3539,7 @@
|
|||
{
|
||||
if (INTVAL (operands[5]) == 5)
|
||||
std::swap (operands[1], operands[2]);
|
||||
operands[2] = force_reg (<MODE>mode, operands[2]);
|
||||
})
|
||||
|
||||
(define_insn_and_split "*avx_cmp<mode>3_ltint"
|
||||
|
@ -3554,8 +3554,7 @@
|
|||
UNSPEC_PCMP)))]
|
||||
"TARGET_AVX512VL && ix86_pre_reload_split ()
|
||||
/* LT or GE 0 */
|
||||
&& ((INTVAL (operands[5]) == 1 && !MEM_P (operands[2]))
|
||||
|| (INTVAL (operands[5]) == 5 && !MEM_P (operands[1])))"
|
||||
&& ((INTVAL (operands[5]) == 1) || (INTVAL (operands[5]) == 5))"
|
||||
"#"
|
||||
"&& 1"
|
||||
[(set (match_dup 0)
|
||||
|
@ -3572,7 +3571,44 @@
|
|||
std::swap (operands[1], operands[2]);
|
||||
operands[0] = gen_lowpart (<ssebytemode>mode, operands[0]);
|
||||
operands[1] = gen_lowpart (<ssebytemode>mode, operands[1]);
|
||||
operands[2] = force_reg (<ssebytemode>mode,
|
||||
gen_lowpart (<ssebytemode>mode, operands[2]));
|
||||
})
|
||||
|
||||
(define_insn_and_split "*avx_cmp<mode>3_ltint_not"
|
||||
[(set (match_operand:VI48_AVX 0 "register_operand")
|
||||
(vec_merge:VI48_AVX
|
||||
(match_operand:VI48_AVX 1 "vector_operand")
|
||||
(match_operand:VI48_AVX 2 "vector_operand")
|
||||
(unspec:<avx512fmaskmode>
|
||||
[(subreg:VI48_AVX
|
||||
(not:<ssebytemode>
|
||||
(match_operand:<ssebytemode> 3 "vector_operand")) 0)
|
||||
(match_operand:VI48_AVX 4 "const0_operand")
|
||||
(match_operand:SI 5 "const_0_to_7_operand")]
|
||||
UNSPEC_PCMP)))]
|
||||
"TARGET_AVX512VL && ix86_pre_reload_split ()
|
||||
/* not LT or GE 0 */
|
||||
&& ((INTVAL (operands[5]) == 1) || (INTVAL (operands[5]) == 5))"
|
||||
"#"
|
||||
"&& 1"
|
||||
[(set (match_dup 0)
|
||||
(unspec:<ssebytemode>
|
||||
[(match_dup 1)
|
||||
(match_dup 2)
|
||||
(subreg:<ssebytemode>
|
||||
(lt:VI48_AVX
|
||||
(match_dup 3)
|
||||
(match_dup 4)) 0)]
|
||||
UNSPEC_BLENDV))]
|
||||
{
|
||||
if (INTVAL (operands[5]) == 5)
|
||||
std::swap (operands[1], operands[2]);
|
||||
operands[0] = gen_lowpart (<ssebytemode>mode, operands[0]);
|
||||
operands[1] = force_reg (<ssebytemode>mode,
|
||||
gen_lowpart (<ssebytemode>mode, operands[1]));
|
||||
operands[2] = gen_lowpart (<ssebytemode>mode, operands[2]);
|
||||
operands[3] = lowpart_subreg (<MODE>mode, operands[3], <ssebytemode>mode);
|
||||
})
|
||||
|
||||
(define_insn "avx_vmcmp<mode>3"
|
||||
|
|
8
gcc/testsuite/g++.target/i386/avx512vl-pr100738-1.C
Executable file
8
gcc/testsuite/g++.target/i386/avx512vl-pr100738-1.C
Executable file
|
@ -0,0 +1,8 @@
|
|||
/* { dg-do compile } */
|
||||
/* { dg-options "-Ofast -march=cascadelake" } */
|
||||
/* { dg-final {scan-assembler-times "vblendvps\[ \\t\]" 2 } } */
|
||||
/* { dg-final {scan-assembler-not "vpcmpeqd\[ \\t\]" } } */
|
||||
/* { dg-final {scan-assembler-not "vpxor\[ \\t\]" } } */
|
||||
/* { dg-final {scan-assembler-not "vpternlogd\[ \\t\]" } } */
|
||||
|
||||
#include "pr100738-1.C"
|
Loading…
Add table
Reference in a new issue