Commit af120161 by Jakub Jelinek Committed by Jakub Jelinek

sse.md (vec_set_lo_<mode><mask_name>, [...]): Add && <mask_avx512dq_condition> condition.

	* config/i386/sse.md (vec_set_lo_<mode><mask_name>,
	vec_set_hi_<mode><mask_name>): Add && <mask_avx512dq_condition>
	condition.  For !TARGET_AVX512DQ, emit 32x4 instruction instead
	of 64x2.

	* gcc.target/i386/avx512dq-vinsert-1.c: New test.
	* gcc.target/i386/avx512vl-vinsert-1.c: New test.

From-SVN: r236569
parent 355023ce
2016-05-22 Jakub Jelinek <jakub@redhat.com>
* config/i386/sse.md (vec_set_lo_<mode><mask_name>,
vec_set_hi_<mode><mask_name>): Add && <mask_avx512dq_condition>
condition. For !TARGET_AVX512DQ, emit 32x4 instruction instead
of 64x2.
* config/i386/sse.md (vec_set_lo_v16hi, vec_set_hi_v16hi,
vec_set_lo_v32qi, vec_set_hi_v32qi): Add alternative with
v constraint instead of x and vinserti32x4 insn.
......
......@@ -17818,10 +17818,12 @@
(vec_select:<ssehalfvecmode>
(match_operand:VI8F_256 1 "register_operand" "v")
(parallel [(const_int 2) (const_int 3)]))))]
"TARGET_AVX"
"TARGET_AVX && <mask_avx512dq_condition>"
{
if (TARGET_AVX512VL)
if (TARGET_AVX512DQ)
return "vinsert<shuffletype>64x2\t{$0x0, %2, %1, %0<mask_operand3>|%0<mask_operand3>, %1, %2, 0x0}";
else if (TARGET_AVX512VL)
return "vinsert<shuffletype>32x4\t{$0x0, %2, %1, %0<mask_operand3>|%0<mask_operand3>, %1, %2, 0x0}";
else
return "vinsert<i128>\t{$0x0, %2, %1, %0|%0, %1, %2, 0x0}";
}
......@@ -17838,10 +17840,12 @@
(match_operand:VI8F_256 1 "register_operand" "v")
(parallel [(const_int 0) (const_int 1)]))
(match_operand:<ssehalfvecmode> 2 "nonimmediate_operand" "vm")))]
"TARGET_AVX"
"TARGET_AVX && <mask_avx512dq_condition>"
{
if (TARGET_AVX512VL)
if (TARGET_AVX512DQ)
return "vinsert<shuffletype>64x2\t{$0x1, %2, %1, %0<mask_operand3>|%0<mask_operand3>, %1, %2, 0x1}";
else if (TARGET_AVX512VL)
return "vinsert<shuffletype>32x4\t{$0x1, %2, %1, %0<mask_operand3>|%0<mask_operand3>, %1, %2, 0x1}";
else
return "vinsert<i128>\t{$0x1, %2, %1, %0|%0, %1, %2, 0x1}";
}
......
2016-05-22 Jakub Jelinek <jakub@redhat.com>
* gcc.target/i386/avx512dq-vinsert-1.c: New test.
* gcc.target/i386/avx512vl-vinsert-1.c: New test.
* gcc.target/i386/avx512vl-vinserti32x4-3.c: New test.
* gcc.target/i386/avx512dq-vbroadcast-2.c: New test.
......
/* { dg-do compile { target { ! ia32 } } } */
/* { dg-options "-O2 -mavx512vl -mavx512dq -masm=att" } */
/* 32-byte vector types, one per element type exercised by this test.
   Element counts follow from the element size: 8 lanes for V1/V3 and
   4 lanes for V2/V4, assuming 4-byte int/float and 8-byte long long/double
   on this target.  */
typedef int V1 __attribute__((vector_size (32)));
typedef long long V2 __attribute__((vector_size (32)));
typedef float V3 __attribute__((vector_size (32)));
typedef double V4 __attribute__((vector_size (32)));
/* Overwrite element 3 of an int vector that lives in a variable bound to
   xmm16.  With 8 int lanes (assuming 4-byte int) element 3 falls in the
   low 128-bit half of the vector.  Presumably this is one of the
   low-half (immediate 0x0) integer inserts counted by the scan-assembler
   checks at the end of this file.  */
void
f1 (V1 x, int y)
{
/* Bind the local to register name "xmm16".  */
register V1 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 6 of an int vector that lives in a variable bound to
   xmm16.  With 8 int lanes (assuming 4-byte int) element 6 falls in the
   high 128-bit half of the vector.  Presumably this is one of the
   high-half (immediate 0x1) integer extract/insert sequences counted by
   the scan-assembler checks at the end of this file.  */
void
f2 (V1 x, int y)
{
/* Bind the local to register name "xmm16".  */
register V1 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[6] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 1 of a long long vector that lives in a variable
   bound to xmm16.  With 4 lanes (assuming 8-byte long long) element 1
   falls in the low 128-bit half of the vector.  This file is compiled
   with -mavx512dq, and the checks at the end of the file expect a
   vinserti64x2 with immediate 0x0; presumably it comes from here.  */
void
f3 (V2 x, long long y)
{
/* Bind the local to register name "xmm16".  */
register V2 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[1] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 3 of a long long vector that lives in a variable
   bound to xmm16.  With 4 lanes (assuming 8-byte long long) element 3
   falls in the high 128-bit half of the vector.  This file is compiled
   with -mavx512dq, and the checks at the end of the file expect
   vextracti64x2/vinserti64x2 with immediate 0x1; presumably they come
   from here.  */
void
f4 (V2 x, long long y)
{
/* Bind the local to register name "xmm16".  */
register V2 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 3 of a float vector that lives in a variable bound
   to xmm16.  With 8 float lanes (assuming 4-byte float) element 3 falls
   in the low 128-bit half of the vector.  Presumably this is one of the
   low-half (immediate 0x0) floating-point inserts counted by the
   scan-assembler checks at the end of this file.  */
void
f5 (V3 x, float y)
{
/* Bind the local to register name "xmm16".  */
register V3 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 6 of a float vector that lives in a variable bound
   to xmm16.  With 8 float lanes (assuming 4-byte float) element 6 falls
   in the high 128-bit half of the vector.  Presumably this is one of the
   high-half (immediate 0x1) floating-point extract/insert sequences
   counted by the scan-assembler checks at the end of this file.  */
void
f6 (V3 x, float y)
{
/* Bind the local to register name "xmm16".  */
register V3 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[6] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 1 of a double vector that lives in a variable bound
   to xmm16.  With 4 lanes (assuming 8-byte double) element 1 falls in
   the low 128-bit half of the vector.  This file is compiled with
   -mavx512dq, and the checks at the end of the file expect a
   vinsertf64x2 with immediate 0x0; presumably it comes from here.  */
void
f7 (V4 x, double y)
{
/* Bind the local to register name "xmm16".  */
register V4 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[1] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 3 of a double vector that lives in a variable bound
   to xmm16.  With 4 lanes (assuming 8-byte double) element 3 falls in
   the high 128-bit half of the vector.  This file is compiled with
   -mavx512dq, and the checks at the end of the file expect
   vextractf64x2/vinsertf64x2 with immediate 0x1; presumably they come
   from here.  */
void
f8 (V4 x, double y)
{
/* Bind the local to register name "xmm16".  */
register V4 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* { dg-final { scan-assembler-times "vinserti32x4\[^\n\r]*0x0\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vinserti32x4\[^\n\r]*0x1\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vinsertf32x4\[^\n\r]*0x0\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vinsertf32x4\[^\n\r]*0x1\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vextracti32x4\[^\n\r]*0x1\[^\n\r]*%\[yz]mm16" 1 } } */
/* { dg-final { scan-assembler-times "vextractf32x4\[^\n\r]*0x1\[^\n\r]*%\[yz]mm16" 1 } } */
/* { dg-final { scan-assembler-times "vinserti64x2\[^\n\r]*0x0\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vinserti64x2\[^\n\r]*0x1\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vinsertf64x2\[^\n\r]*0x0\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vinsertf64x2\[^\n\r]*0x1\[^\n\r]*%ymm16" 1 } } */
/* { dg-final { scan-assembler-times "vextracti64x2\[^\n\r]*0x1\[^\n\r]*%\[yz]mm16" 1 } } */
/* { dg-final { scan-assembler-times "vextractf64x2\[^\n\r]*0x1\[^\n\r]*%\[yz]mm16" 1 } } */
/* { dg-do compile { target { ! ia32 } } } */
/* { dg-options "-O2 -mavx512vl -mno-avx512dq -masm=att" } */
/* 32-byte vector types, one per element type exercised by this test.
   Element counts follow from the element size: 8 lanes for V1/V3 and
   4 lanes for V2/V4, assuming 4-byte int/float and 8-byte long long/double
   on this target.  */
typedef int V1 __attribute__((vector_size (32)));
typedef long long V2 __attribute__((vector_size (32)));
typedef float V3 __attribute__((vector_size (32)));
typedef double V4 __attribute__((vector_size (32)));
/* Overwrite element 3 of an int vector that lives in a variable bound to
   xmm16.  With 8 int lanes (assuming 4-byte int) element 3 falls in the
   low 128-bit half of the vector.  Presumably this is one of the two
   low-half (immediate 0x0) vinserti32x4 matches expected by the
   scan-assembler checks at the end of this file.  */
void
f1 (V1 x, int y)
{
/* Bind the local to register name "xmm16".  */
register V1 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 6 of an int vector that lives in a variable bound to
   xmm16.  With 8 int lanes (assuming 4-byte int) element 6 falls in the
   high 128-bit half of the vector.  Presumably this is one of the two
   high-half (immediate 0x1) integer 32x4 extract/insert sequences
   expected by the scan-assembler checks at the end of this file.  */
void
f2 (V1 x, int y)
{
/* Bind the local to register name "xmm16".  */
register V1 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[6] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 1 of a long long vector that lives in a variable
   bound to xmm16.  With 4 lanes (assuming 8-byte long long) element 1
   falls in the low 128-bit half of the vector.  This file is compiled
   with -mno-avx512dq, and the checks at the end of the file require that
   no vinserti64x2 appears; presumably this insert is counted among the
   vinserti32x4 immediate-0x0 matches instead.  */
void
f3 (V2 x, long long y)
{
/* Bind the local to register name "xmm16".  */
register V2 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[1] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 3 of a long long vector that lives in a variable
   bound to xmm16.  With 4 lanes (assuming 8-byte long long) element 3
   falls in the high 128-bit half of the vector.  This file is compiled
   with -mno-avx512dq, and the checks at the end of the file require that
   no integer 64x2 insert/extract appears; presumably this sequence is
   counted among the 32x4 immediate-0x1 matches instead.  */
void
f4 (V2 x, long long y)
{
/* Bind the local to register name "xmm16".  */
register V2 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 3 of a float vector that lives in a variable bound
   to xmm16.  With 8 float lanes (assuming 4-byte float) element 3 falls
   in the low 128-bit half of the vector.  Presumably this is one of the
   two low-half (immediate 0x0) vinsertf32x4 matches expected by the
   scan-assembler checks at the end of this file.  */
void
f5 (V3 x, float y)
{
/* Bind the local to register name "xmm16".  */
register V3 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 6 of a float vector that lives in a variable bound
   to xmm16.  With 8 float lanes (assuming 4-byte float) element 6 falls
   in the high 128-bit half of the vector.  Presumably this is one of the
   two high-half (immediate 0x1) floating-point 32x4 extract/insert
   sequences expected by the scan-assembler checks at the end of this
   file.  */
void
f6 (V3 x, float y)
{
/* Bind the local to register name "xmm16".  */
register V3 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[6] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 1 of a double vector that lives in a variable bound
   to xmm16.  With 4 lanes (assuming 8-byte double) element 1 falls in
   the low 128-bit half of the vector.  This file is compiled with
   -mno-avx512dq, and the checks at the end of the file require that no
   vinsertf64x2 appears; presumably this insert is counted among the
   vinsertf32x4 immediate-0x0 matches instead.  */
void
f7 (V4 x, double y)
{
/* Bind the local to register name "xmm16".  */
register V4 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[1] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* Overwrite element 3 of a double vector that lives in a variable bound
   to xmm16.  With 4 lanes (assuming 8-byte double) element 3 falls in
   the high 128-bit half of the vector.  This file is compiled with
   -mno-avx512dq, and the checks at the end of the file require that no
   vinsertf64x2 appears; presumably this sequence is counted among the
   floating-point 32x4 immediate-0x1 matches instead.  */
void
f8 (V4 x, double y)
{
/* Bind the local to register name "xmm16".  */
register V4 a __asm ("xmm16");
a = x;
/* Empty asm with a read-write "+v" operand: tells the compiler that `a'
   is both used and modified here, separating the copy from the store.  */
asm volatile ("" : "+v" (a));
a[3] = y;
/* Second read-write use of `a', after the element store.  */
asm volatile ("" : "+v" (a));
}
/* { dg-final { scan-assembler-times "vinserti32x4\[^\n\r]*0x0\[^\n\r]*%ymm16" 2 } } */
/* { dg-final { scan-assembler-times "vinserti32x4\[^\n\r]*0x1\[^\n\r]*%ymm16" 2 } } */
/* { dg-final { scan-assembler-times "vinsertf32x4\[^\n\r]*0x0\[^\n\r]*%ymm16" 2 } } */
/* { dg-final { scan-assembler-times "vinsertf32x4\[^\n\r]*0x1\[^\n\r]*%ymm16" 2 } } */
/* { dg-final { scan-assembler-times "vextracti32x4\[^\n\r]*0x1\[^\n\r]*%\[yz]mm16" 2 } } */
/* { dg-final { scan-assembler-times "vextractf32x4\[^\n\r]*0x1\[^\n\r]*%\[yz]mm16" 2 } } */
/* { dg-final { scan-assembler-not "vinserti64x2" } } */
/* { dg-final { scan-assembler-not "vinsertf64x2" } } */
/* { dg-final { scan-assembler-not "vextracti64x2" } } */
/* { dg-final { scan-assembler-not "vextractf64x2" } } */
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment