Commit 1e021dc3 by Jakub Jelinek Committed by Jakub Jelinek

sse.md (*vec_concatv2si_sse4_1): Add avx512dq v=Yv,rm alternative.

	* config/i386/sse.md (*vec_concatv2si_sse4_1): Add avx512dq v=Yv,rm
	alternative.  Change x=x,x alternative to v=Yv,Yv and x=rm,C
	alternative to v=rm,C.

	* gcc.target/i386/avx512dq-concatv2si-1.c: New test.
	* gcc.target/i386/avx512vl-concatv2si-1.c: New test.

From-SVN: r237030
parent b93b1475
2016-06-02 Jakub Jelinek <jakub@redhat.com> 2016-06-02 Jakub Jelinek <jakub@redhat.com>
* config/i386/sse.md (*vec_concatv2si_sse4_1): Add avx512dq v=Yv,rm
alternative. Change x=x,x alternative to v=Yv,Yv and x=rm,C
alternative to v=rm,C.
* config/i386/sse.md (*vec_concatv2di): Add x86_avx512dq v=Yv,rm * config/i386/sse.md (*vec_concatv2di): Add x86_avx512dq v=Yv,rm
alternative. Change x=xm,C alternative to v=vm,C, x=x,x alternative alternative. Change x=xm,C alternative to v=vm,C, x=x,x alternative
to v=Yv,Yv and x=x,m to v=v,m. Use maybe_evex prefix attribute to v=Yv,Yv and x=x,m to v=v,m. Use maybe_evex prefix attribute
......
...@@ -13488,43 +13488,44 @@ ...@@ -13488,43 +13488,44 @@
(define_insn "*vec_concatv2si_sse4_1" (define_insn "*vec_concatv2si_sse4_1"
[(set (match_operand:V2SI 0 "register_operand" [(set (match_operand:V2SI 0 "register_operand"
"=Yr,*x,x, Yr,*x,x, x, *y,*y") "=Yr,*x, x, v,Yr,*x, v, v, *y,*y")
(vec_concat:V2SI (vec_concat:V2SI
(match_operand:SI 1 "nonimmediate_operand" (match_operand:SI 1 "nonimmediate_operand"
" 0, 0,x, 0,0, x,rm, 0,rm") " 0, 0, x,Yv, 0, 0,Yv,rm, 0,rm")
(match_operand:SI 2 "vector_move_operand" (match_operand:SI 2 "vector_move_operand"
" rm,rm,rm,Yr,*x,x, C,*ym, C")))] " rm,rm,rm,rm,Yr,*x,Yv, C,*ym, C")))]
"TARGET_SSE4_1 && !(MEM_P (operands[1]) && MEM_P (operands[2]))" "TARGET_SSE4_1 && !(MEM_P (operands[1]) && MEM_P (operands[2]))"
"@ "@
pinsrd\t{$1, %2, %0|%0, %2, 1} pinsrd\t{$1, %2, %0|%0, %2, 1}
pinsrd\t{$1, %2, %0|%0, %2, 1} pinsrd\t{$1, %2, %0|%0, %2, 1}
vpinsrd\t{$1, %2, %1, %0|%0, %1, %2, 1} vpinsrd\t{$1, %2, %1, %0|%0, %1, %2, 1}
vpinsrd\t{$1, %2, %1, %0|%0, %1, %2, 1}
punpckldq\t{%2, %0|%0, %2} punpckldq\t{%2, %0|%0, %2}
punpckldq\t{%2, %0|%0, %2} punpckldq\t{%2, %0|%0, %2}
vpunpckldq\t{%2, %1, %0|%0, %1, %2} vpunpckldq\t{%2, %1, %0|%0, %1, %2}
%vmovd\t{%1, %0|%0, %1} %vmovd\t{%1, %0|%0, %1}
punpckldq\t{%2, %0|%0, %2} punpckldq\t{%2, %0|%0, %2}
movd\t{%1, %0|%0, %1}" movd\t{%1, %0|%0, %1}"
[(set_attr "isa" "noavx,noavx,avx,noavx,noavx,avx,*,*,*") [(set_attr "isa" "noavx,noavx,avx,avx512dq,noavx,noavx,avx,*,*,*")
(set (attr "type") (set (attr "type")
(cond [(eq_attr "alternative" "6") (cond [(eq_attr "alternative" "7")
(const_string "ssemov") (const_string "ssemov")
(eq_attr "alternative" "7")
(const_string "mmxcvt")
(eq_attr "alternative" "8") (eq_attr "alternative" "8")
(const_string "mmxcvt")
(eq_attr "alternative" "9")
(const_string "mmxmov") (const_string "mmxmov")
] ]
(const_string "sselog"))) (const_string "sselog")))
(set (attr "prefix_extra") (set (attr "prefix_extra")
(if_then_else (eq_attr "alternative" "0,1,2") (if_then_else (eq_attr "alternative" "0,1,2,3")
(const_string "1") (const_string "1")
(const_string "*"))) (const_string "*")))
(set (attr "length_immediate") (set (attr "length_immediate")
(if_then_else (eq_attr "alternative" "0,1,2") (if_then_else (eq_attr "alternative" "0,1,2,3")
(const_string "1") (const_string "1")
(const_string "*"))) (const_string "*")))
(set_attr "prefix" "orig,orig,vex,orig,orig,vex,maybe_vex,orig,orig") (set_attr "prefix" "orig,orig,vex,evex,orig,orig,maybe_evex,maybe_vex,orig,orig")
(set_attr "mode" "TI,TI,TI,TI,TI,TI,TI,DI,DI")]) (set_attr "mode" "TI,TI,TI,TI,TI,TI,TI,TI,DI,DI")])
;; ??? In theory we can match memory for the MMX alternative, but allowing ;; ??? In theory we can match memory for the MMX alternative, but allowing
;; nonimmediate_operand for operand 2 and *not* allowing memory for the SSE ;; nonimmediate_operand for operand 2 and *not* allowing memory for the SSE
......
2016-06-02 Jakub Jelinek <jakub@redhat.com> 2016-06-02 Jakub Jelinek <jakub@redhat.com>
* gcc.target/i386/avx512dq-concatv2si-1.c: New test.
* gcc.target/i386/avx512vl-concatv2si-1.c: New test.
* gcc.target/i386/avx512dq-concatv2di-1.c: New test. * gcc.target/i386/avx512dq-concatv2di-1.c: New test.
* gcc.target/i386/avx512vl-concatv2di-1.c: New test. * gcc.target/i386/avx512vl-concatv2di-1.c: New test.
* gcc.target/i386/sse2-init-v2di-2.c: Adjust expected vec_concatv2di * gcc.target/i386/sse2-init-v2di-2.c: Adjust expected vec_concatv2di
......
/* { dg-do compile { target { ! ia32 } } } */
/* { dg-options "-O2 -mavx512vl -mavx512dq -masm=att" } */
typedef int V __attribute__((vector_size (8)));
void
f1 (int x, int y)
{
register int a __asm ("xmm16");
register int b __asm ("xmm17");
register V c __asm ("xmm3");
a = x;
b = y;
asm volatile ("" : "+v" (a), "+v" (b));
c = (V) { a, b };
asm volatile ("" : "+v" (c));
}
/* { dg-final { scan-assembler "vpunpckldq\[^\n\r]*%xmm17\[^\n\r]*%xmm16\[^\n\r]*%xmm3" } } */
void
f2 (int x, int y)
{
register int a __asm ("xmm16");
register V c __asm ("xmm3");
a = x;
asm volatile ("" : "+v" (a));
c = (V) { a, y };
asm volatile ("" : "+v" (c));
}
void
f3 (int x, int *y)
{
register int a __asm ("xmm16");
register V c __asm ("xmm3");
a = x;
asm volatile ("" : "+v" (a));
c = (V) { a, *y };
asm volatile ("" : "+v" (c));
}
/* { dg-final { scan-assembler-times "vpinsrd\[^\n\r]*\\\$1\[^\n\r]*%xmm16\[^\n\r]*%xmm3" 2 } } */
/* { dg-do compile { target { ! ia32 } } } */
/* { dg-options "-O2 -mavx512vl -mno-avx512dq -masm=att" } */
typedef int V __attribute__((vector_size (8)));
void
f1 (int x, int y)
{
register int a __asm ("xmm16");
register int b __asm ("xmm17");
register V c __asm ("xmm3");
a = x;
b = y;
asm volatile ("" : "+v" (a), "+v" (b));
c = (V) { a, b };
asm volatile ("" : "+v" (c));
}
/* { dg-final { scan-assembler "vpunpckldq\[^\n\r]*%xmm17\[^\n\r]*%xmm16\[^\n\r]*%xmm3" } } */
void
f2 (int x, int y)
{
register int a __asm ("xmm16");
register V c __asm ("xmm3");
a = x;
asm volatile ("" : "+v" (a));
c = (V) { a, y };
asm volatile ("" : "+v" (c));
}
void
f3 (int x, int *y)
{
register int a __asm ("xmm16");
register V c __asm ("xmm3");
a = x;
asm volatile ("" : "+v" (a));
c = (V) { a, *y };
asm volatile ("" : "+v" (c));
}
/* { dg-final { scan-assembler-not "vpinsrd\[^\n\r]*\\\$1\[^\n\r]*%xmm16\[^\n\r]*%xmm3" } } */
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment