[arm] PR target/83687: Fix invalid combination of VSUB + VABS into VABD
Backport from mailine 2018-01-15 Kyrylo Tkachov <kyrylo.tkachov@arm.com> PR target/83687 * config/arm/iterators.md (VF): New mode iterator. * config/arm/neon.md (neon_vabd<mode>_2): Use the above. Remove integer-related logic from pattern. (neon_vabd<mode>_3): Likewise. * gcc.target/arm/neon-combine-sub-abs-into-vabd.c: Delete integer tests. * gcc.target/arm/pr83687.c: New test. From-SVN: r256791
This commit is contained in:
parent
76bc6ce90f
commit
f743dd807b
|
@ -1,3 +1,14 @@
|
|||
2018-01-17 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
|
||||
|
||||
Backport from mailine
|
||||
2018-01-15 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
|
||||
|
||||
PR target/83687
|
||||
* config/arm/iterators.md (VF): New mode iterator.
|
||||
* config/arm/neon.md (neon_vabd<mode>_2): Use the above.
|
||||
Remove integer-related logic from pattern.
|
||||
(neon_vabd<mode>_3): Likewise.
|
||||
|
||||
2018-01-17 Martin Liska <mliska@suse.cz>
|
||||
|
||||
Backport from mainline
|
||||
|
|
|
@ -116,6 +116,10 @@
|
|||
;; All supported vector modes (except singleton DImode).
|
||||
(define_mode_iterator VDQ [V8QI V16QI V4HI V8HI V2SI V4SI V4HF V8HF V2SF V4SF V2DI])
|
||||
|
||||
;; All supported floating-point vector modes (except V2DF).
|
||||
(define_mode_iterator VF [(V4HF "TARGET_NEON_FP16INST")
|
||||
(V8HF "TARGET_NEON_FP16INST") V2SF V4SF])
|
||||
|
||||
;; All supported vector modes (except those with 64-bit integer elements).
|
||||
(define_mode_iterator VDQW [V8QI V16QI V4HI V8HI V2SI V4SI V2SF V4SF])
|
||||
|
||||
|
|
|
@ -6199,28 +6199,22 @@ if (BYTES_BIG_ENDIAN)
|
|||
})
|
||||
|
||||
(define_insn "neon_vabd<mode>_2"
|
||||
[(set (match_operand:VDQ 0 "s_register_operand" "=w")
|
||||
(abs:VDQ (minus:VDQ (match_operand:VDQ 1 "s_register_operand" "w")
|
||||
(match_operand:VDQ 2 "s_register_operand" "w"))))]
|
||||
"TARGET_NEON && (!<Is_float_mode> || flag_unsafe_math_optimizations)"
|
||||
[(set (match_operand:VF 0 "s_register_operand" "=w")
|
||||
(abs:VF (minus:VF (match_operand:VF 1 "s_register_operand" "w")
|
||||
(match_operand:VF 2 "s_register_operand" "w"))))]
|
||||
"TARGET_NEON && flag_unsafe_math_optimizations"
|
||||
"vabd.<V_s_elem> %<V_reg>0, %<V_reg>1, %<V_reg>2"
|
||||
[(set (attr "type")
|
||||
(if_then_else (ne (symbol_ref "<Is_float_mode>") (const_int 0))
|
||||
(const_string "neon_fp_abd_s<q>")
|
||||
(const_string "neon_abd<q>")))]
|
||||
[(set_attr "type" "neon_fp_abd_s<q>")]
|
||||
)
|
||||
|
||||
(define_insn "neon_vabd<mode>_3"
|
||||
[(set (match_operand:VDQ 0 "s_register_operand" "=w")
|
||||
(abs:VDQ (unspec:VDQ [(match_operand:VDQ 1 "s_register_operand" "w")
|
||||
(match_operand:VDQ 2 "s_register_operand" "w")]
|
||||
UNSPEC_VSUB)))]
|
||||
"TARGET_NEON && (!<Is_float_mode> || flag_unsafe_math_optimizations)"
|
||||
[(set (match_operand:VF 0 "s_register_operand" "=w")
|
||||
(abs:VF (unspec:VF [(match_operand:VF 1 "s_register_operand" "w")
|
||||
(match_operand:VF 2 "s_register_operand" "w")]
|
||||
UNSPEC_VSUB)))]
|
||||
"TARGET_NEON && flag_unsafe_math_optimizations"
|
||||
"vabd.<V_if_elem> %<V_reg>0, %<V_reg>1, %<V_reg>2"
|
||||
[(set (attr "type")
|
||||
(if_then_else (ne (symbol_ref "<Is_float_mode>") (const_int 0))
|
||||
(const_string "neon_fp_abd_s<q>")
|
||||
(const_string "neon_abd<q>")))]
|
||||
[(set_attr "type" "neon_fp_abd_s<q>")]
|
||||
)
|
||||
|
||||
;; Copy from core-to-neon regs, then extend, not vice-versa
|
||||
|
|
|
@ -1,3 +1,13 @@
|
|||
2018-01-17 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
|
||||
|
||||
Backport from mainline
|
||||
2018-01-15 Kyrylo Tkachov <kyrylo.tkachov@arm.com>
|
||||
|
||||
PR target/83687
|
||||
* gcc.target/arm/neon-combine-sub-abs-into-vabd.c: Delete integer
|
||||
tests.
|
||||
* gcc.target/arm/pr83687.c: New test.
|
||||
|
||||
2018-01-17 Martin Liska <mliska@suse.cz>
|
||||
|
||||
Backport from mainline
|
||||
|
|
|
@ -12,31 +12,3 @@ float32x2_t f_sub_abs_to_vabd_32(float32x2_t val1, float32x2_t val2)
|
|||
return res;
|
||||
}
|
||||
/* { dg-final { scan-assembler "vabd\.f32" } }*/
|
||||
|
||||
#include <arm_neon.h>
|
||||
int8x8_t sub_abs_to_vabd_8(int8x8_t val1, int8x8_t val2)
|
||||
{
|
||||
int8x8_t sres = vsub_s8(val1, val2);
|
||||
int8x8_t res = vabs_s8 (sres);
|
||||
|
||||
return res;
|
||||
}
|
||||
/* { dg-final { scan-assembler "vabd\.s8" } }*/
|
||||
|
||||
int16x4_t sub_abs_to_vabd_16(int16x4_t val1, int16x4_t val2)
|
||||
{
|
||||
int16x4_t sres = vsub_s16(val1, val2);
|
||||
int16x4_t res = vabs_s16 (sres);
|
||||
|
||||
return res;
|
||||
}
|
||||
/* { dg-final { scan-assembler "vabd\.s16" } }*/
|
||||
|
||||
int32x2_t sub_abs_to_vabd_32(int32x2_t val1, int32x2_t val2)
|
||||
{
|
||||
int32x2_t sres = vsub_s32(val1, val2);
|
||||
int32x2_t res = vabs_s32 (sres);
|
||||
|
||||
return res;
|
||||
}
|
||||
/* { dg-final { scan-assembler "vabd\.s32" } }*/
|
||||
|
|
|
@ -0,0 +1,31 @@
|
|||
/* { dg-do run } */
|
||||
/* { dg-require-effective-target arm_neon_hw } */
|
||||
/* { dg-options "-O2" } */
|
||||
/* { dg-add-options arm_neon } */
|
||||
|
||||
#include <arm_neon.h>
|
||||
|
||||
__attribute__ ((noinline)) int8_t
|
||||
testFunction1 (int8_t a, int8_t b)
|
||||
{
|
||||
volatile int8x16_t sub = vsubq_s8 (vdupq_n_s8 (a), vdupq_n_s8 (b));
|
||||
int8x16_t abs = vabsq_s8 (sub);
|
||||
return vgetq_lane_s8 (abs, 0);
|
||||
}
|
||||
|
||||
__attribute__ ((noinline)) int8_t
|
||||
testFunction2 (int8_t a, int8_t b)
|
||||
{
|
||||
int8x16_t sub = vsubq_s8 (vdupq_n_s8 (a), vdupq_n_s8 (b));
|
||||
int8x16_t abs = vabsq_s8 (sub);
|
||||
return vgetq_lane_s8 (abs, 0);
|
||||
}
|
||||
|
||||
int
|
||||
main (void)
|
||||
{
|
||||
if (testFunction1 (-100, 100) != testFunction2 (-100, 100))
|
||||
__builtin_abort ();
|
||||
|
||||
return 0;
|
||||
}
|
Loading…
Reference in New Issue