aarch64: PR target/99037 Fix RTL represntation in move_lo_quad patterns
This patch fixes the RTL representation of the move_lo_quad patterns to use aarch64_simd_or_scalar_imm_zero for the zero part rather than a vec_duplicate of zero or a const_int 0. The expander that generates them is also adjusted so that we use and match the correct const_vector forms throughout. Co-Authored-By: Jakub Jelinek <jakub@redhat.com> gcc/ChangeLog: PR target/99037 * config/aarch64/aarch64-simd.md (move_lo_quad_internal_<mode>): Use aarch64_simd_or_scalar_imm_zero to match zeroes. Remove pattern matching const_int 0. (move_lo_quad_internal_be_<mode>): Likewise. (move_lo_quad_<mode>): Update for the above. * config/aarch64/iterators.md (VQ_2E): Delete. gcc/testsuite/ChangeLog: PR target/99808 * gcc.target/aarch64/pr99808.c: New test.
This commit is contained in:
parent
25e515d219
commit
37d9074e12
3 changed files with 24 additions and 42 deletions
|
@ -1586,25 +1586,10 @@
|
|||
;; On big-endian this is { zeroes, operand }
|
||||
|
||||
(define_insn "move_lo_quad_internal_<mode>"
|
||||
[(set (match_operand:VQMOV_NO2E 0 "register_operand" "=w,w,w")
|
||||
(vec_concat:VQMOV_NO2E
|
||||
[(set (match_operand:VQMOV 0 "register_operand" "=w,w,w")
|
||||
(vec_concat:VQMOV
|
||||
(match_operand:<VHALF> 1 "register_operand" "w,r,r")
|
||||
(vec_duplicate:<VHALF> (const_int 0))))]
|
||||
"TARGET_SIMD && !BYTES_BIG_ENDIAN"
|
||||
"@
|
||||
dup\\t%d0, %1.d[0]
|
||||
fmov\\t%d0, %1
|
||||
dup\\t%d0, %1"
|
||||
[(set_attr "type" "neon_dup<q>,f_mcr,neon_dup<q>")
|
||||
(set_attr "length" "4")
|
||||
(set_attr "arch" "simd,fp,simd")]
|
||||
)
|
||||
|
||||
(define_insn "move_lo_quad_internal_<mode>"
|
||||
[(set (match_operand:VQ_2E 0 "register_operand" "=w,w,w")
|
||||
(vec_concat:VQ_2E
|
||||
(match_operand:<VHALF> 1 "register_operand" "w,r,r")
|
||||
(const_int 0)))]
|
||||
(match_operand:<VHALF> 2 "aarch64_simd_or_scalar_imm_zero")))]
|
||||
"TARGET_SIMD && !BYTES_BIG_ENDIAN"
|
||||
"@
|
||||
dup\\t%d0, %1.d[0]
|
||||
|
@ -1616,24 +1601,9 @@
|
|||
)
|
||||
|
||||
(define_insn "move_lo_quad_internal_be_<mode>"
|
||||
[(set (match_operand:VQMOV_NO2E 0 "register_operand" "=w,w,w")
|
||||
(vec_concat:VQMOV_NO2E
|
||||
(vec_duplicate:<VHALF> (const_int 0))
|
||||
(match_operand:<VHALF> 1 "register_operand" "w,r,r")))]
|
||||
"TARGET_SIMD && BYTES_BIG_ENDIAN"
|
||||
"@
|
||||
dup\\t%d0, %1.d[0]
|
||||
fmov\\t%d0, %1
|
||||
dup\\t%d0, %1"
|
||||
[(set_attr "type" "neon_dup<q>,f_mcr,neon_dup<q>")
|
||||
(set_attr "length" "4")
|
||||
(set_attr "arch" "simd,fp,simd")]
|
||||
)
|
||||
|
||||
(define_insn "move_lo_quad_internal_be_<mode>"
|
||||
[(set (match_operand:VQ_2E 0 "register_operand" "=w,w,w")
|
||||
(vec_concat:VQ_2E
|
||||
(const_int 0)
|
||||
[(set (match_operand:VQMOV 0 "register_operand" "=w,w,w")
|
||||
(vec_concat:VQMOV
|
||||
(match_operand:<VHALF> 2 "aarch64_simd_or_scalar_imm_zero")
|
||||
(match_operand:<VHALF> 1 "register_operand" "w,r,r")))]
|
||||
"TARGET_SIMD && BYTES_BIG_ENDIAN"
|
||||
"@
|
||||
|
@ -1647,13 +1617,14 @@
|
|||
|
||||
(define_expand "move_lo_quad_<mode>"
|
||||
[(match_operand:VQMOV 0 "register_operand")
|
||||
(match_operand:VQMOV 1 "register_operand")]
|
||||
(match_operand:<VHALF> 1 "register_operand")]
|
||||
"TARGET_SIMD"
|
||||
{
|
||||
rtx zs = CONST0_RTX (<VHALF>mode);
|
||||
if (BYTES_BIG_ENDIAN)
|
||||
emit_insn (gen_move_lo_quad_internal_be_<mode> (operands[0], operands[1]));
|
||||
emit_insn (gen_move_lo_quad_internal_be_<mode> (operands[0], operands[1], zs));
|
||||
else
|
||||
emit_insn (gen_move_lo_quad_internal_<mode> (operands[0], operands[1]));
|
||||
emit_insn (gen_move_lo_quad_internal_<mode> (operands[0], operands[1], zs));
|
||||
DONE;
|
||||
}
|
||||
)
|
||||
|
|
|
@ -125,9 +125,6 @@
|
|||
;; VQ without 2 element modes.
|
||||
(define_mode_iterator VQ_NO2E [V16QI V8HI V4SI V8HF V4SF V8BF])
|
||||
|
||||
;; Quad vector with only 2 element modes.
|
||||
(define_mode_iterator VQ_2E [V2DI V2DF])
|
||||
|
||||
;; BFmode vector modes.
|
||||
(define_mode_iterator VBF [V4BF V8BF])
|
||||
|
||||
|
|
14
gcc/testsuite/gcc.target/aarch64/pr99808.c
Normal file
14
gcc/testsuite/gcc.target/aarch64/pr99808.c
Normal file
|
@ -0,0 +1,14 @@
|
|||
/* PR target/99808 */
|
||||
/* PR target/99037 */
|
||||
/* { dg-do compile } */
|
||||
/* { dg-options "-Og -fweb -fno-forward-propagate -g" } */
|
||||
|
||||
#include <arm_neon.h>
|
||||
|
||||
float32x4_t
|
||||
foo (void)
|
||||
{
|
||||
float64x2_t arg2 = vcombine_f64 ((float64x1_t) 0UL, (float64x1_t) 1UL);
|
||||
return vcvt_high_f32_f64 ((float32x2_t) 1UL, arg2);
|
||||
}
|
||||
|
Loading…
Add table
Reference in a new issue