i386: Add push insns for 4-byte vectors [PR100722]

2021-05-23  Uroš Bizjak  <ubizjak@gmail.com>

gcc/
	PR target/100722
	* config/i386/mmx.md (*push<VI_32:mode>2_rex64):
	New instruction pattern.
	(*push<VI_32:mode>2): Ditto.
	(push splitter for SSE registers): New splitter.

gcc/testsuite/

	PR target/100722
	* gcc.target/i386/pr100722.c: New test.
This commit is contained in:
Uros Bizjak 2021-05-23 22:14:21 +02:00
parent fe03f4fc95
commit c01c433111
2 changed files with 50 additions and 0 deletions

View File

@ -302,6 +302,39 @@
]
(symbol_ref "true")))])
;; Push of a VI_32-mode value, enabled when TARGET_SSE2 && TARGET_64BIT.
;; (VI_32 is a mode iterator defined outside this hunk; the commit message
;; describes these patterns as push insns for 4-byte vectors.)
;; For TARGET_64BIT we always round up to 8 bytes.
;;
;; Operand 1 has two constraint alternatives:
;;   0 ("rC") - output directly as push{q} of %q1; "type" attribute is push.
;;   1 ("*v") - the output template is "#", i.e. no assembly is written for
;;              this alternative and the insn has to be split instead;
;;              "type" attribute is multi.  Presumably this is the case the
;;              define_split on sse_reg_operand sources in this file
;;              handles -- confirm.
;; The "mode" attribute is DI for both alternatives.
(define_insn "*push<mode>2_rex64"
[(set (match_operand:VI_32 0 "push_operand" "=X,X")
(match_operand:VI_32 1 "nonmemory_no_elim_operand" "rC,*v"))]
"TARGET_SSE2 && TARGET_64BIT"
"@
push{q}\t%q1
#"
[(set_attr "type" "push,multi")
(set_attr "mode" "DI")])
;; Push of a VI_32-mode value, enabled when TARGET_SSE2 && !TARGET_64BIT.
;; (VI_32 is a mode iterator defined outside this hunk.)
;;
;; Operand 1 has two constraint alternatives:
;;   0 ("rC*m") - output directly as push{l} of %1; "type" attribute is push.
;;   1 ("*v")   - the output template is "#", i.e. no assembly is written
;;                for this alternative and the insn has to be split instead;
;;                "type" attribute is multi.  Presumably this is the case
;;                the define_split on sse_reg_operand sources in this file
;;                handles -- confirm.
;; The "mode" attribute is SI for both alternatives.
(define_insn "*push<mode>2"
[(set (match_operand:VI_32 0 "push_operand" "=<,<")
(match_operand:VI_32 1 "general_no_elim_operand" "rC*m,*v"))]
"TARGET_SSE2 && !TARGET_64BIT"
"@
push{l}\t%1
#"
[(set_attr "type" "push,multi")
(set_attr "mode" "SI")])
;; Splitter for a VI_32 push whose source satisfies sse_reg_operand.
;; It applies only when TARGET_SSE2 holds and reload has completed, and
;; replaces the single push set with two sets, in this order:
;;   1. SP_REG = SP_REG + operands[2], where the preparation code below sets
;;      operands[2] to the negated PUSH_ROUNDING of the mode's size;
;;   2. operand 0 = operand 1, where operand 0 has been rewritten so that
;;      its address is the stack pointer itself.
;; Both sets use the pointer mode iterator P for the stack pointer
;; arithmetic.
(define_split
[(set (match_operand:VI_32 0 "push_operand")
(match_operand:VI_32 1 "sse_reg_operand"))]
"TARGET_SSE2 && reload_completed"
[(set (reg:P SP_REG) (plus:P (reg:P SP_REG) (match_dup 2)))
(set (match_dup 0) (match_dup 1))]
{
operands[2] = GEN_INT (-PUSH_ROUNDING (GET_MODE_SIZE (<VI_32:MODE>mode)));
/* Preserve memory attributes. */
operands[0] = replace_equiv_address (operands[0], stack_pointer_rtx);
})
(define_expand "movmisalign<mode>"
[(set (match_operand:VI_32 0 "nonimmediate_operand")
(match_operand:VI_32 1 "nonimmediate_operand"))]

View File

@ -0,0 +1,17 @@
/* PR target/100722 */
/* { dg-do compile } */
/* { dg-options "-O -msse2" } */
/* Vector type with char elements and a total size of 4 bytes.  */
typedef char int8x4_t __attribute__((vector_size(4)));
/* External function taking seven int8x4_t arguments by value.  It is only
   declared in this test, not defined.  */
void stack_callee (int8x4_t, int8x4_t, int8x4_t, int8x4_t,
int8x4_t, int8x4_t, int8x4_t);
/* Global vector used as the value of every argument passed to
   stack_callee by stack_caller.  */
int8x4_t stack_caller_x1;
/* Calls stack_callee once, passing the global stack_caller_x1 for each of
   its seven parameters.
   NOTE(review): presumably seven arguments are used so that the 4-byte
   vector values must be pushed as outgoing stack arguments, exercising the
   push patterns this PR adds -- confirm against the target ABI.  */
void stack_caller (void)
{
stack_callee (stack_caller_x1, stack_caller_x1, stack_caller_x1,
stack_caller_x1, stack_caller_x1, stack_caller_x1,
stack_caller_x1);
}