S/390: Fix vec_splat_* builtins.
gcc/testsuite/ChangeLog: 2015-12-02 Andreas Krebbel <krebbel@linux.vnet.ibm.com> * gcc.target/s390/zvector/vec-splat-2.c: New test. gcc/ChangeLog: 2015-12-02 Andreas Krebbel <krebbel@linux.vnet.ibm.com> * config/s390/s390-builtin-types.def: New builtin types added. * config/s390/s390-builtins.def: Add s390_vec_splat_* definitions. * config/s390/s390.c (s390_expand_builtin): Always truncate constants to the mode in the pattern. * config/s390/vecintrin.h: Let the vec_splat_* macros point to the respective builtin __builtin_s390_vec_splat_*. From-SVN: r231157
This commit is contained in:
parent
4f3ccd0859
commit
dfbe4dfd9d
|
@ -1,3 +1,12 @@
|
|||
2015-12-02 Andreas Krebbel <krebbel@linux.vnet.ibm.com>
|
||||
|
||||
* config/s390/s390-builtin-types.def: New builtin types added.
|
||||
* config/s390/s390-builtins.def: Add s390_vec_splat_* definitions.
|
||||
* config/s390/s390.c (s390_expand_builtin): Always truncate
|
||||
constants to the mode in the pattern.
|
||||
* config/s390/vecintrin.h: Let the vec_splat_* macros point to the
|
||||
respective builtin __builtin_s390_vec_splat_*.
|
||||
|
||||
2015-12-02 Andreas Krebbel <krebbel@linux.vnet.ibm.com>
|
||||
|
||||
* config/s390/s390-builtin-types.def: Sort builtin types.
|
||||
|
|
|
@ -139,16 +139,19 @@ DEF_FN_TYPE_2 (BT_FN_UV16QI_USHORT, B_VX, BT_UV16QI, BT_USHORT)
|
|||
DEF_FN_TYPE_2 (BT_FN_UV16QI_UV16QI, B_VX, BT_UV16QI, BT_UV16QI)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV2DI_ULONGLONG, B_VX, BT_UV2DI, BT_ULONGLONG)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV2DI_ULONGLONGCONSTPTR, B_VX, BT_UV2DI, BT_ULONGLONGCONSTPTR)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV2DI_USHORT, B_VX, BT_UV2DI, BT_USHORT)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV2DI_UV2DI, B_VX, BT_UV2DI, BT_UV2DI)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV2DI_UV4SI, B_VX, BT_UV2DI, BT_UV4SI)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV4SI_UINT, B_VX, BT_UV4SI, BT_UINT)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV4SI_UINTCONSTPTR, B_VX, BT_UV4SI, BT_UINTCONSTPTR)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV4SI_USHORT, B_VX, BT_UV4SI, BT_USHORT)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV4SI_UV4SI, B_VX, BT_UV4SI, BT_UV4SI)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV4SI_UV8HI, B_VX, BT_UV4SI, BT_UV8HI)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV8HI_USHORT, B_VX, BT_UV8HI, BT_USHORT)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV8HI_USHORTCONSTPTR, B_VX, BT_UV8HI, BT_USHORTCONSTPTR)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV8HI_UV16QI, B_VX, BT_UV8HI, BT_UV16QI)
|
||||
DEF_FN_TYPE_2 (BT_FN_UV8HI_UV8HI, B_VX, BT_UV8HI, BT_UV8HI)
|
||||
DEF_FN_TYPE_2 (BT_FN_V16QI_SCHAR, B_VX, BT_V16QI, BT_SCHAR)
|
||||
DEF_FN_TYPE_2 (BT_FN_V16QI_UCHAR, B_VX, BT_V16QI, BT_UCHAR)
|
||||
DEF_FN_TYPE_2 (BT_FN_V16QI_V16QI, B_VX, BT_V16QI, BT_V16QI)
|
||||
DEF_FN_TYPE_2 (BT_FN_V2DF_DBL, B_VX, BT_V2DF, BT_DBL)
|
||||
|
|
|
@ -362,6 +362,15 @@ B_DEF (s390_vrepih, vec_splatsv8hi, 0,
|
|||
B_DEF (s390_vrepif, vec_splatsv4si, 0, B_VX, O1_S16, BT_FN_V4SI_SHORT)
|
||||
B_DEF (s390_vrepig, vec_splatsv2di, 0, B_VX, O1_S16, BT_FN_V2DI_SHORT)
|
||||
|
||||
B_DEF (s390_vec_splat_u8, vec_splatsv16qi, 0, B_VX, O1_U8, BT_FN_UV16QI_UCHAR)
|
||||
B_DEF (s390_vec_splat_s8, vec_splatsv16qi, 0, B_VX, O1_S8, BT_FN_V16QI_SCHAR)
|
||||
B_DEF (s390_vec_splat_u16, vec_splatsv8hi, 0, B_VX, O1_U16, BT_FN_UV8HI_USHORT)
|
||||
B_DEF (s390_vec_splat_s16, vec_splatsv8hi, 0, B_VX, O1_S16, BT_FN_V8HI_SHORT)
|
||||
B_DEF (s390_vec_splat_u32, vec_splatsv4si, 0, B_VX, O1_U16, BT_FN_UV4SI_USHORT)
|
||||
B_DEF (s390_vec_splat_s32, vec_splatsv4si, 0, B_VX, O1_S16, BT_FN_V4SI_SHORT)
|
||||
B_DEF (s390_vec_splat_u64, vec_splatsv2di, 0, B_VX, O1_U16, BT_FN_UV2DI_USHORT)
|
||||
B_DEF (s390_vec_splat_s64, vec_splatsv2di, 0, B_VX, O1_S16, BT_FN_V2DI_SHORT)
|
||||
|
||||
OB_DEF (s390_vec_insert, s390_vec_insert_s8, s390_vec_insert_dbl,B_VX, BT_FN_OV4SI_INT_OV4SI_INT)
|
||||
OB_DEF_VAR (s390_vec_insert_s8, s390_vlvgb, O3_ELEM, BT_OV_V16QI_SCHAR_V16QI_INT)
|
||||
OB_DEF_VAR (s390_vec_insert_u8, s390_vlvgb, O3_ELEM, BT_OV_UV16QI_UCHAR_UV16QI_INT)
|
||||
|
|
|
@ -835,6 +835,15 @@ s390_expand_builtin (tree exp, rtx target, rtx subtarget ATTRIBUTE_UNUSED,
|
|||
insn_op = &insn_data[icode].operand[arity + nonvoid];
|
||||
op[arity] = expand_expr (arg, NULL_RTX, insn_op->mode, EXPAND_NORMAL);
|
||||
|
||||
/* expand_expr truncates constants to the target mode only if it
|
||||
is "convenient". However, our checks below rely on this
|
||||
being done. */
|
||||
if (CONST_INT_P (op[arity])
|
||||
&& SCALAR_INT_MODE_P (insn_op->mode)
|
||||
&& GET_MODE (op[arity]) != insn_op->mode)
|
||||
op[arity] = GEN_INT (trunc_int_for_mode (INTVAL (op[arity]),
|
||||
insn_op->mode));
|
||||
|
||||
/* Wrap the expanded RTX for pointer types into a MEM expr with
|
||||
the proper mode. This allows us to use e.g. (match_operand
|
||||
"memory_operand"..) in the insn patterns instead of (mem
|
||||
|
|
|
@ -67,14 +67,14 @@ __lcbb(const void *ptr, int bndry)
|
|||
#define vec_genmasks_16 __builtin_s390_vgmh
|
||||
#define vec_genmasks_32 __builtin_s390_vgmf
|
||||
#define vec_genmasks_64 __builtin_s390_vgmg
|
||||
#define vec_splat_u8 __builtin_s390_vlrepb
|
||||
#define vec_splat_s8 __builtin_s390_vlrepb
|
||||
#define vec_splat_u16 __builtin_s390_vlreph
|
||||
#define vec_splat_s16 __builtin_s390_vlreph
|
||||
#define vec_splat_u32 __builtin_s390_vlrepf
|
||||
#define vec_splat_s32 __builtin_s390_vlrepf
|
||||
#define vec_splat_u64 __builtin_s390_vlrepg
|
||||
#define vec_splat_s64 __builtin_s390_vlrepg
|
||||
#define vec_splat_u8 __builtin_s390_vec_splat_u8
|
||||
#define vec_splat_s8 __builtin_s390_vec_splat_s8
|
||||
#define vec_splat_u16 __builtin_s390_vec_splat_u16
|
||||
#define vec_splat_s16 __builtin_s390_vec_splat_s16
|
||||
#define vec_splat_u32 __builtin_s390_vec_splat_u32
|
||||
#define vec_splat_s32 __builtin_s390_vec_splat_s32
|
||||
#define vec_splat_u64 __builtin_s390_vec_splat_u64
|
||||
#define vec_splat_s64 __builtin_s390_vec_splat_s64
|
||||
#define vec_add_u128 __builtin_s390_vaq
|
||||
#define vec_addc_u128 __builtin_s390_vaccq
|
||||
#define vec_adde_u128 __builtin_s390_vacq
|
||||
|
|
|
@ -1,3 +1,7 @@
|
|||
2015-12-02 Andreas Krebbel <krebbel@linux.vnet.ibm.com>
|
||||
|
||||
* gcc.target/s390/zvector/vec-splat-2.c: New test.
|
||||
|
||||
2015-12-02 Andreas Krebbel <krebbel@linux.vnet.ibm.com>
|
||||
|
||||
* gcc.target/s390/vector/vec-vrepi-1.c: New test.
|
||||
|
|
|
@ -0,0 +1,42 @@
|
|||
/* { dg-do compile } */
|
||||
/* { dg-options "-O3 -mzarch -march=z13 -mzvector" } */
|
||||
|
||||
#include <vecintrin.h>
|
||||
|
||||
vector signed char v16qi;
|
||||
vector short v8hi;
|
||||
vector int v4si;
|
||||
vector long long v2di;
|
||||
|
||||
vector unsigned char uv16qi;
|
||||
vector unsigned short uv8hi;
|
||||
vector unsigned int uv4si;
|
||||
vector unsigned long long uv2di;
|
||||
|
||||
int
|
||||
foo ()
|
||||
{
|
||||
v16qi = vec_splat_s8 (-112);
|
||||
uv16qi = vec_splat_u8 (215);
|
||||
|
||||
v8hi = vec_splat_s16 (-32000);
|
||||
uv8hi = vec_splat_u16 (64000);
|
||||
|
||||
v4si = vec_splat_s32 (-32000);
|
||||
uv4si = vec_splat_u32 (64000);
|
||||
|
||||
v2di = vec_splat_s64 (-32000);
|
||||
uv2di = vec_splat_u64 (64000);
|
||||
}
|
||||
|
||||
/* { dg-final { scan-assembler-times "vrepib\t%v.*,-112" 1 } } */
|
||||
/* { dg-final { scan-assembler-times "vrepib\t%v.*,-41" 1 } } */
|
||||
|
||||
/* { dg-final { scan-assembler-times "vrepih\t%v.*,-32000" 1 } } */
|
||||
/* { dg-final { scan-assembler-times "vrepih\t%v.*,-1536" 1 } } */
|
||||
|
||||
/* { dg-final { scan-assembler-times "vrepif\t%v.*,-32000" 1 } } */
|
||||
/* { dg-final { scan-assembler-times "vrepif\t%v.*,-1536" 1 } } */
|
||||
|
||||
/* { dg-final { scan-assembler-times "vrepig\t%v.*,-32000" 1 } } */
|
||||
/* { dg-final { scan-assembler-times "vrepig\t%v.*,-1536" 1 } } */
|
Loading…
Reference in New Issue