diff --git a/gcc/ChangeLog b/gcc/ChangeLog index 67b39211811..ecf2b805d70 100644 --- a/gcc/ChangeLog +++ b/gcc/ChangeLog @@ -1,3 +1,12 @@ +2018-10-12 Wilco Dijkstra + + * config/aarch64/aarch64.md (zero_extendsidi2_aarch64): Add alternatives + to zero-extend between int and floating-point registers. + (load_pair_zero_extendsidi2_aarch64): Add alternative for zero-extended + ldp into floating-point registers. Add type and arch attributes. + (zero_extend2_aarch64): Add arch attribute. + Use f_loads for type attribute. + 2018-10-11 Martin Sebor * doc/extend.texi (attribute packed): Correct typos. diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md index b4a4315ff4b..58e9962ae24 100644 --- a/gcc/config/aarch64/aarch64.md +++ b/gcc/config/aarch64/aarch64.md @@ -1520,26 +1520,34 @@ ) (define_insn "*zero_extendsidi2_aarch64" - [(set (match_operand:DI 0 "register_operand" "=r,r") - (zero_extend:DI (match_operand:SI 1 "nonimmediate_operand" "r,m")))] + [(set (match_operand:DI 0 "register_operand" "=r,r,w,w,r,w") + (zero_extend:DI (match_operand:SI 1 "nonimmediate_operand" "r,m,r,m,w,w")))] "" "@ uxtw\t%0, %w1 - ldr\t%w0, %1" - [(set_attr "type" "extend,load_4")] + ldr\t%w0, %1 + fmov\t%s0, %w1 + ldr\t%s0, %1 + fmov\t%w0, %s1 + fmov\t%s0, %s1" + [(set_attr "type" "extend,load_4,f_mcr,f_loads,f_mrc,fmov") + (set_attr "arch" "*,*,fp,fp,fp,fp")] ) (define_insn "*load_pair_zero_extendsidi2_aarch64" - [(set (match_operand:DI 0 "register_operand" "=r") - (zero_extend:DI (match_operand:SI 1 "aarch64_mem_pair_operand" "Ump"))) - (set (match_operand:DI 2 "register_operand" "=r") - (zero_extend:DI (match_operand:SI 3 "memory_operand" "m")))] + [(set (match_operand:DI 0 "register_operand" "=r,w") + (zero_extend:DI (match_operand:SI 1 "aarch64_mem_pair_operand" "Ump,Ump"))) + (set (match_operand:DI 2 "register_operand" "=r,w") + (zero_extend:DI (match_operand:SI 3 "memory_operand" "m,m")))] "rtx_equal_p (XEXP (operands[3], 0), plus_constant (Pmode, XEXP (operands[1], 0), GET_MODE_SIZE (SImode)))" - "ldp\\t%w0, %w2, %1" - [(set_attr "type" "load_8")] + "@ + ldp\t%w0, %w2, %1 + ldp\t%s0, %s2, %1" + [(set_attr "type" "load_8,neon_load1_2reg") + (set_attr "arch" "*,fp")] ) (define_expand "2" @@ -1566,7 +1574,8 @@ and\t%0, %1, ldr\t%w0, %1 ldr\t%0, %1" - [(set_attr "type" "logic_imm,load_4,load_4")] + [(set_attr "type" "logic_imm,load_4,f_loads") + (set_attr "arch" "*,*,fp")] ) (define_expand "qihi2" diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog index edb680ec4a7..964f4ea4c11 100644 --- a/gcc/testsuite/ChangeLog +++ b/gcc/testsuite/ChangeLog @@ -1,3 +1,8 @@ +2018-10-12 Wilco Dijkstra + + * gcc.target/aarch64/popcnt.c: Test zero-extended popcount. + * gcc.target/aarch64/vec_zeroextend.c: Test zero-extended vectors. + 2018-10-11 Will Schmidt * gcc.target/powerpc/fold-vec-insert-char-p8.c: New. diff --git a/gcc/testsuite/gcc.target/aarch64/popcnt.c b/gcc/testsuite/gcc.target/aarch64/popcnt.c index 7e957966d8e..2b5e9f3e2c0 100644 --- a/gcc/testsuite/gcc.target/aarch64/popcnt.c +++ b/gcc/testsuite/gcc.target/aarch64/popcnt.c @@ -19,5 +19,16 @@ foo2 (long long x) return __builtin_popcountll (x); } -/* { dg-final { scan-assembler-not "popcount" } } */ -/* { dg-final { scan-assembler-times "cnt\t" 3 } } */ +int +foo3 (int *p) +{ + return __builtin_popcount (*p); +} + +/* { dg-final { scan-assembler-not {popcount} } } */ +/* { dg-final { scan-assembler-times {cnt\t} 4 } } */ +/* { dg-final { scan-assembler-times {fmov\ts} 1 {target lp64} } } */ +/* { dg-final { scan-assembler-times {fmov\td} 2 {target lp64} } } */ +/* { dg-final { scan-assembler-times {fmov\ts} 2 {target ilp32} } } */ +/* { dg-final { scan-assembler-times {fmov\td} 1 {target ilp32} } } */ +/* { dg-final { scan-assembler-times {ldr\ts} 1 } } */ diff --git a/gcc/testsuite/gcc.target/aarch64/vec_zeroextend.c b/gcc/testsuite/gcc.target/aarch64/vec_zeroextend.c new file mode 100644 index 00000000000..9c3971f036a --- /dev/null +++ b/gcc/testsuite/gcc.target/aarch64/vec_zeroextend.c @@ -0,0 +1,21 @@ +/* { dg-do compile } */ +/* { dg-options "-O2" } */ + +#define vector __attribute__((vector_size(16) )) + +vector unsigned long long +f1(vector unsigned long long b, vector unsigned int a) +{ + b[0] = a[0]; + return b; +} + +unsigned long long +f2(vector unsigned int a) +{ + return a[0]; +} + +/* { dg-final { scan-assembler-times {fmov} 2 } } */ +/* { dg-final { scan-assembler-not {umov} } } */ +/* { dg-final { scan-assembler-not {uxtw} } } */