122 lines
6.0 KiB
Diff
122 lines
6.0 KiB
Diff
|
2022-01-18 Jakub Jelinek <jakub@redhat.com>
|
||
|
|
||
|
PR target/104104
|
||
|
* config/i386/sse.md
|
||
|
(<avx512>_<complexopname>_<mode><maskc_name><round_name>,
|
||
|
avx512fp16_<complexopname>sh_v8hf<mask_scalarc_name><round_scalarcz_name>,
|
||
|
avx512dq_mul<mode>3<mask_name>, <avx2_avx512>_permvar<mode><mask_name>,
|
||
|
avx2_perm<mode>_1<mask_name>, avx512f_perm<mode>_1<mask_name>,
|
||
|
avx512dq_rangep<mode><mask_name><round_saeonly_name>,
|
||
|
avx512dq_ranges<mode><mask_scalar_name><round_saeonly_scalar_name>,
|
||
|
<avx512>_getmant<mode><mask_name><round_saeonly_name>,
|
||
|
avx512f_vgetmant<mode><mask_scalar_name><round_saeonly_scalar_name>):
|
||
|
Use vxorps\t%x0, %x0, %x0 instead of vxorps\t{%x0, %x0, %x0}.
|
||
|
|
||
|
* gcc.target/i386/pr104104.c: New test.
|
||
|
|
||
|
--- gcc/config/i386/sse.md.jj 2022-01-18 11:58:59.156988142 +0100
|
||
|
+++ gcc/config/i386/sse.md 2022-01-18 21:20:40.022477778 +0100
|
||
|
@@ -6539,7 +6539,7 @@ (define_insn "<avx512>_<complexopname>_<
|
||
|
{
|
||
|
if (TARGET_DEST_FALSE_DEP_FOR_GLC
|
||
|
&& <maskc_dest_false_dep_for_glc_cond>)
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "v<complexopname><ssemodesuffix>\t{<round_maskc_op3>%2, %1, %0<maskc_operand3>|%0<maskc_operand3>, %1, %2<round_maskc_op3>}";
|
||
|
}
|
||
|
[(set_attr "type" "ssemul")
|
||
|
@@ -6750,7 +6750,7 @@ (define_insn "avx512fp16_<complexopname>
|
||
|
{
|
||
|
if (TARGET_DEST_FALSE_DEP_FOR_GLC
|
||
|
&& <mask_scalarc_dest_false_dep_for_glc_cond>)
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "v<complexopname>sh\t{<round_scalarc_mask_op3>%2, %1, %0<mask_scalarc_operand3>|%0<mask_scalarc_operand3>, %1, %2<round_scalarc_mask_op3>}";
|
||
|
}
|
||
|
[(set_attr "type" "ssemul")
|
||
|
@@ -15222,7 +15222,7 @@ (define_insn "avx512dq_mul<mode>3<mask_n
|
||
|
&& <mask3_dest_false_dep_for_glc_cond>
|
||
|
&& !reg_mentioned_p (operands[0], operands[1])
|
||
|
&& !reg_mentioned_p (operands[0], operands[2]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vpmullq\t{%2, %1, %0<mask_operand3>|%0<mask_operand3>, %1, %2}";
|
||
|
}
|
||
|
[(set_attr "type" "sseimul")
|
||
|
@@ -24658,7 +24658,7 @@ (define_insn "<avx2_avx512>_permvar<mode
|
||
|
&& <mask3_dest_false_dep_for_glc_cond>
|
||
|
&& !reg_mentioned_p (operands[0], operands[1])
|
||
|
&& !reg_mentioned_p (operands[0], operands[2]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vperm<ssemodesuffix>\t{%1, %2, %0<mask_operand3>|%0<mask_operand3>, %2, %1}";
|
||
|
}
|
||
|
[(set_attr "type" "sselog")
|
||
|
@@ -24900,7 +24900,7 @@ (define_insn "avx2_perm<mode>_1<mask_nam
|
||
|
if (TARGET_DEST_FALSE_DEP_FOR_GLC
|
||
|
&& <mask6_dest_false_dep_for_glc_cond>
|
||
|
&& !reg_mentioned_p (operands[0], operands[1]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vperm<ssemodesuffix>\t{%2, %1, %0<mask_operand6>|%0<mask_operand6>, %1, %2}";
|
||
|
}
|
||
|
[(set_attr "type" "sselog")
|
||
|
@@ -24975,7 +24975,7 @@ (define_insn "avx512f_perm<mode>_1<mask_
|
||
|
if (TARGET_DEST_FALSE_DEP_FOR_GLC
|
||
|
&& <mask10_dest_false_dep_for_glc_cond>
|
||
|
&& !reg_mentioned_p (operands[0], operands[1]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vperm<ssemodesuffix>\t{%2, %1, %0<mask_operand10>|%0<mask_operand10>, %1, %2}";
|
||
|
}
|
||
|
[(set_attr "type" "sselog")
|
||
|
@@ -26880,7 +26880,7 @@ (define_insn "avx512dq_rangep<mode><mask
|
||
|
&& <mask4_dest_false_dep_for_glc_cond>
|
||
|
&& !reg_mentioned_p (operands[0], operands[1])
|
||
|
&& !reg_mentioned_p (operands[0], operands[2]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vrange<ssemodesuffix>\t{%3, <round_saeonly_mask_op4>%2, %1, %0<mask_operand4>|%0<mask_operand4>, %1, %2<round_saeonly_mask_op4>, %3}";
|
||
|
}
|
||
|
[(set_attr "type" "sse")
|
||
|
@@ -26903,7 +26903,7 @@ (define_insn "avx512dq_ranges<mode><mask
|
||
|
&& <mask_scalar4_dest_false_dep_for_glc_cond>
|
||
|
&& !reg_mentioned_p (operands[0], operands[1])
|
||
|
&& !reg_mentioned_p (operands[0], operands[2]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vrange<ssescalarmodesuffix>\t{%3, <round_saeonly_scalar_mask_op4>%2, %1, %0<mask_scalar_operand4>|%0<mask_scalar_operand4>, %1, %<iptr>2<round_saeonly_scalar_mask_op4>, %3}";
|
||
|
}
|
||
|
[(set_attr "type" "sse")
|
||
|
@@ -26949,7 +26949,7 @@ (define_insn "<avx512>_getmant<mode><mas
|
||
|
if (TARGET_DEST_FALSE_DEP_FOR_GLC
|
||
|
&& <mask3_dest_false_dep_for_glc_cond>
|
||
|
&& MEM_P (operands[1]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vgetmant<ssemodesuffix>\t{%2, <round_saeonly_mask_op3>%1, %0<mask_operand3>|%0<mask_operand3>, %1<round_saeonly_mask_op3>, %2}";
|
||
|
}
|
||
|
[(set_attr "prefix" "evex")
|
||
|
@@ -26971,7 +26971,7 @@ (define_insn "avx512f_vgetmant<mode><mas
|
||
|
&& <mask_scalar4_dest_false_dep_for_glc_cond>
|
||
|
&& !reg_mentioned_p (operands[0], operands[1])
|
||
|
&& !reg_mentioned_p (operands[0], operands[2]))
|
||
|
- output_asm_insn ("vxorps\t{%x0, %x0, %x0}", operands);
|
||
|
+ output_asm_insn ("vxorps\t%x0, %x0, %x0", operands);
|
||
|
return "vgetmant<ssescalarmodesuffix>\t{%3, <round_saeonly_scalar_mask_op4>%2, %1, %0<mask_scalar_operand4>|%0<mask_scalar_operand4>, %1, %<iptr>2<round_saeonly_scalar_mask_op4>, %3}";
|
||
|
}
|
||
|
[(set_attr "prefix" "evex")
|
||
|
--- gcc/testsuite/gcc.target/i386/pr104104.c.jj 2022-01-18 21:38:17.007906673 +0100
|
||
|
+++ gcc/testsuite/gcc.target/i386/pr104104.c 2022-01-18 21:36:10.475623148 +0100
|
||
|
@@ -0,0 +1,10 @@
|
||
|
+/* PR target/104104 */
|
||
|
+/* { dg-do assemble { target vect_simd_clones } } */
|
||
|
+/* { dg-require-effective-target masm_intel } */
|
||
|
+/* { dg-options "-march=alderlake -masm=intel -O1 -fallow-store-data-races -funroll-all-loops" } */
|
||
|
+
|
||
|
+__attribute__ ((simd)) short int
|
||
|
+foo (void)
|
||
|
+{
|
||
|
+ return 0;
|
||
|
+}
|