You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
268 lines
8.1 KiB
268 lines
8.1 KiB
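Description: Always use unaligned VMOV instructions (vmovu*/vmovdqu*) instead of selecting aligned variants (vmova*/vmovdqa*) based on operand alignment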
|
|
Author: Stephen Kitt <skitt@debian.org>
|
|
Bug-Debian: https://bugs.debian.org/939559
|
|
|
|
Based on a patch originally by Claude Heiland-Allen <claude@mathr.co.uk>
|
|
|
|
--- a/gcc/config/i386/sse.md
|
|
+++ b/gcc/config/i386/sse.md
|
|
@@ -1058,17 +1058,11 @@
|
|
{
|
|
if (FLOAT_MODE_P (GET_MODE_INNER (<MODE>mode)))
|
|
{
|
|
- if (misaligned_operand (operands[1], <MODE>mode))
|
|
- return "vmovu<ssemodesuffix>\t{%1, %0%{%3%}%N2|%0%{%3%}%N2, %1}";
|
|
- else
|
|
- return "vmova<ssemodesuffix>\t{%1, %0%{%3%}%N2|%0%{%3%}%N2, %1}";
|
|
+ return "vmovu<ssemodesuffix>\t{%1, %0%{%3%}%N2|%0%{%3%}%N2, %1}";
|
|
}
|
|
else
|
|
{
|
|
- if (misaligned_operand (operands[1], <MODE>mode))
|
|
- return "vmovdqu<ssescalarsize>\t{%1, %0%{%3%}%N2|%0%{%3%}%N2, %1}";
|
|
- else
|
|
- return "vmovdqa<ssescalarsize>\t{%1, %0%{%3%}%N2|%0%{%3%}%N2, %1}";
|
|
+ return "vmovdqu<ssescalarsize>\t{%1, %0%{%3%}%N2|%0%{%3%}%N2, %1}";
|
|
}
|
|
}
|
|
[(set_attr "type" "ssemov")
|
|
@@ -1184,17 +1178,11 @@
|
|
{
|
|
if (FLOAT_MODE_P (GET_MODE_INNER (<MODE>mode)))
|
|
{
|
|
- if (misaligned_operand (operands[0], <MODE>mode))
|
|
- return "vmovu<ssemodesuffix>\t{%1, %0%{%2%}|%0%{%2%}, %1}";
|
|
- else
|
|
- return "vmova<ssemodesuffix>\t{%1, %0%{%2%}|%0%{%2%}, %1}";
|
|
+ return "vmovu<ssemodesuffix>\t{%1, %0%{%2%}|%0%{%2%}, %1}";
|
|
}
|
|
else
|
|
{
|
|
- if (misaligned_operand (operands[0], <MODE>mode))
|
|
- return "vmovdqu<ssescalarsize>\t{%1, %0%{%2%}|%0%{%2%}, %1}";
|
|
- else
|
|
- return "vmovdqa<ssescalarsize>\t{%1, %0%{%2%}|%0%{%2%}, %1}";
|
|
+ return "vmovdqu<ssescalarsize>\t{%1, %0%{%2%}|%0%{%2%}, %1}";
|
|
}
|
|
}
|
|
[(set_attr "type" "ssemov")
|
|
@@ -7806,7 +7794,7 @@
|
|
"TARGET_SSE && !(MEM_P (operands[0]) && MEM_P (operands[1]))"
|
|
"@
|
|
%vmovlps\t{%1, %0|%q0, %1}
|
|
- %vmovaps\t{%1, %0|%0, %1}
|
|
+ %vmovups\t{%1, %0|%0, %1}
|
|
%vmovlps\t{%1, %d0|%d0, %q1}"
|
|
[(set_attr "type" "ssemov")
|
|
(set_attr "prefix" "maybe_vex")
|
|
@@ -13997,29 +13985,15 @@
|
|
switch (<MODE>mode)
|
|
{
|
|
case E_V8DFmode:
|
|
- if (misaligned_operand (operands[2], <ssequartermode>mode))
|
|
- return "vmovupd\t{%2, %x0|%x0, %2}";
|
|
- else
|
|
- return "vmovapd\t{%2, %x0|%x0, %2}";
|
|
+ return "vmovupd\t{%2, %x0|%x0, %2}";
|
|
case E_V16SFmode:
|
|
- if (misaligned_operand (operands[2], <ssequartermode>mode))
|
|
- return "vmovups\t{%2, %x0|%x0, %2}";
|
|
- else
|
|
- return "vmovaps\t{%2, %x0|%x0, %2}";
|
|
+ return "vmovups\t{%2, %x0|%x0, %2}";
|
|
case E_V8DImode:
|
|
- if (misaligned_operand (operands[2], <ssequartermode>mode))
|
|
- return which_alternative == 2 ? "vmovdqu64\t{%2, %x0|%x0, %2}"
|
|
+ return which_alternative == 2 ? "vmovdqu64\t{%2, %x0|%x0, %2}"
|
|
: "vmovdqu\t{%2, %x0|%x0, %2}";
|
|
- else
|
|
- return which_alternative == 2 ? "vmovdqa64\t{%2, %x0|%x0, %2}"
|
|
- : "vmovdqa\t{%2, %x0|%x0, %2}";
|
|
case E_V16SImode:
|
|
- if (misaligned_operand (operands[2], <ssequartermode>mode))
|
|
- return which_alternative == 2 ? "vmovdqu32\t{%2, %x0|%x0, %2}"
|
|
+ return which_alternative == 2 ? "vmovdqu32\t{%2, %x0|%x0, %2}"
|
|
: "vmovdqu\t{%2, %x0|%x0, %2}";
|
|
- else
|
|
- return which_alternative == 2 ? "vmovdqa32\t{%2, %x0|%x0, %2}"
|
|
- : "vmovdqa\t{%2, %x0|%x0, %2}";
|
|
default:
|
|
gcc_unreachable ();
|
|
}
|
|
@@ -21225,63 +21199,27 @@
|
|
switch (get_attr_mode (insn))
|
|
{
|
|
case MODE_V16SF:
|
|
- if (misaligned_operand (operands[1], <ssehalfvecmode>mode))
|
|
- return "vmovups\t{%1, %t0|%t0, %1}";
|
|
- else
|
|
- return "vmovaps\t{%1, %t0|%t0, %1}";
|
|
+ return "vmovups\t{%1, %t0|%t0, %1}";
|
|
case MODE_V8DF:
|
|
- if (misaligned_operand (operands[1], <ssehalfvecmode>mode))
|
|
- return "vmovupd\t{%1, %t0|%t0, %1}";
|
|
- else
|
|
- return "vmovapd\t{%1, %t0|%t0, %1}";
|
|
+ return "vmovupd\t{%1, %t0|%t0, %1}";
|
|
case MODE_V8SF:
|
|
- if (misaligned_operand (operands[1], <ssehalfvecmode>mode))
|
|
- return "vmovups\t{%1, %x0|%x0, %1}";
|
|
- else
|
|
- return "vmovaps\t{%1, %x0|%x0, %1}";
|
|
+ return "vmovups\t{%1, %x0|%x0, %1}";
|
|
case MODE_V4DF:
|
|
- if (misaligned_operand (operands[1], <ssehalfvecmode>mode))
|
|
- return "vmovupd\t{%1, %x0|%x0, %1}";
|
|
- else
|
|
- return "vmovapd\t{%1, %x0|%x0, %1}";
|
|
+ return "vmovupd\t{%1, %x0|%x0, %1}";
|
|
case MODE_XI:
|
|
- if (misaligned_operand (operands[1], <ssehalfvecmode>mode))
|
|
- {
|
|
- if (which_alternative == 2)
|
|
- return "vmovdqu\t{%1, %t0|%t0, %1}";
|
|
- else if (GET_MODE_SIZE (<ssescalarmode>mode) == 8)
|
|
- return "vmovdqu64\t{%1, %t0|%t0, %1}";
|
|
- else
|
|
- return "vmovdqu32\t{%1, %t0|%t0, %1}";
|
|
- }
|
|
+ if (which_alternative == 2)
|
|
+ return "vmovdqu\t{%1, %t0|%t0, %1}";
|
|
+ else if (GET_MODE_SIZE (<ssescalarmode>mode) == 8)
|
|
+ return "vmovdqu64\t{%1, %t0|%t0, %1}";
|
|
else
|
|
- {
|
|
- if (which_alternative == 2)
|
|
- return "vmovdqa\t{%1, %t0|%t0, %1}";
|
|
- else if (GET_MODE_SIZE (<ssescalarmode>mode) == 8)
|
|
- return "vmovdqa64\t{%1, %t0|%t0, %1}";
|
|
- else
|
|
- return "vmovdqa32\t{%1, %t0|%t0, %1}";
|
|
- }
|
|
+ return "vmovdqu32\t{%1, %t0|%t0, %1}";
|
|
case MODE_OI:
|
|
- if (misaligned_operand (operands[1], <ssehalfvecmode>mode))
|
|
- {
|
|
- if (which_alternative == 2)
|
|
- return "vmovdqu\t{%1, %x0|%x0, %1}";
|
|
- else if (GET_MODE_SIZE (<ssescalarmode>mode) == 8)
|
|
- return "vmovdqu64\t{%1, %x0|%x0, %1}";
|
|
- else
|
|
- return "vmovdqu32\t{%1, %x0|%x0, %1}";
|
|
- }
|
|
+ if (which_alternative == 2)
|
|
+ return "vmovdqu\t{%1, %x0|%x0, %1}";
|
|
+ else if (GET_MODE_SIZE (<ssescalarmode>mode) == 8)
|
|
+ return "vmovdqu64\t{%1, %x0|%x0, %1}";
|
|
else
|
|
- {
|
|
- if (which_alternative == 2)
|
|
- return "vmovdqa\t{%1, %x0|%x0, %1}";
|
|
- else if (GET_MODE_SIZE (<ssescalarmode>mode) == 8)
|
|
- return "vmovdqa64\t{%1, %x0|%x0, %1}";
|
|
- else
|
|
- return "vmovdqa32\t{%1, %x0|%x0, %1}";
|
|
- }
|
|
+ return "vmovdqu32\t{%1, %x0|%x0, %1}";
|
|
default:
|
|
gcc_unreachable ();
|
|
}
|
|
--- a/gcc/config/i386/i386.c
|
|
+++ b/gcc/config/i386/i386.c
|
|
@@ -4981,13 +4981,13 @@
|
|
switch (type)
|
|
{
|
|
case opcode_int:
|
|
- opcode = misaligned_p ? "vmovdqu32" : "vmovdqa32";
|
|
+ opcode = "vmovdqu32";
|
|
break;
|
|
case opcode_float:
|
|
- opcode = misaligned_p ? "vmovups" : "vmovaps";
|
|
+ opcode = "vmovups";
|
|
break;
|
|
case opcode_double:
|
|
- opcode = misaligned_p ? "vmovupd" : "vmovapd";
|
|
+ opcode = "vmovupd";
|
|
break;
|
|
}
|
|
}
|
|
@@ -4996,16 +4996,16 @@
|
|
switch (scalar_mode)
|
|
{
|
|
case E_SFmode:
|
|
- opcode = misaligned_p ? "%vmovups" : "%vmovaps";
|
|
+ opcode = "%vmovups";
|
|
break;
|
|
case E_DFmode:
|
|
- opcode = misaligned_p ? "%vmovupd" : "%vmovapd";
|
|
+ opcode = "%vmovupd";
|
|
break;
|
|
case E_TFmode:
|
|
if (evex_reg_p)
|
|
- opcode = misaligned_p ? "vmovdqu64" : "vmovdqa64";
|
|
+ opcode = "vmovdqu64";
|
|
else
|
|
- opcode = misaligned_p ? "%vmovdqu" : "%vmovdqa";
|
|
+ opcode = "%vmovdqu";
|
|
break;
|
|
default:
|
|
gcc_unreachable ();
|
|
@@ -5017,48 +5017,32 @@
|
|
{
|
|
case E_QImode:
|
|
if (evex_reg_p)
|
|
- opcode = (misaligned_p
|
|
- ? (TARGET_AVX512BW
|
|
- ? "vmovdqu8"
|
|
- : "vmovdqu64")
|
|
- : "vmovdqa64");
|
|
+ opcode = TARGET_AVX512BW ? "vmovdqu8" : "vmovdqu64";
|
|
else
|
|
- opcode = (misaligned_p
|
|
- ? (TARGET_AVX512BW
|
|
- ? "vmovdqu8"
|
|
- : "%vmovdqu")
|
|
- : "%vmovdqa");
|
|
+ opcode = TARGET_AVX512BW ? "vmovdqu8" : "%vmovdqu";
|
|
break;
|
|
case E_HImode:
|
|
if (evex_reg_p)
|
|
- opcode = (misaligned_p
|
|
- ? (TARGET_AVX512BW
|
|
- ? "vmovdqu16"
|
|
- : "vmovdqu64")
|
|
- : "vmovdqa64");
|
|
+ opcode = TARGET_AVX512BW ? "vmovdqu16" : "vmovdqu64";
|
|
else
|
|
- opcode = (misaligned_p
|
|
- ? (TARGET_AVX512BW
|
|
- ? "vmovdqu16"
|
|
- : "%vmovdqu")
|
|
- : "%vmovdqa");
|
|
+ opcode = TARGET_AVX512BW ? "vmovdqu16" : "%vmovdqu";
|
|
break;
|
|
case E_SImode:
|
|
if (evex_reg_p)
|
|
- opcode = misaligned_p ? "vmovdqu32" : "vmovdqa32";
|
|
+ opcode = "vmovdqu32";
|
|
else
|
|
- opcode = misaligned_p ? "%vmovdqu" : "%vmovdqa";
|
|
+ opcode = "%vmovdqu";
|
|
break;
|
|
case E_DImode:
|
|
case E_TImode:
|
|
case E_OImode:
|
|
if (evex_reg_p)
|
|
- opcode = misaligned_p ? "vmovdqu64" : "vmovdqa64";
|
|
+ opcode = "vmovdqu64";
|
|
else
|
|
- opcode = misaligned_p ? "%vmovdqu" : "%vmovdqa";
|
|
+ opcode = "%vmovdqu";
|
|
break;
|
|
case E_XImode:
|
|
- opcode = misaligned_p ? "vmovdqu64" : "vmovdqa64";
|
|
+ opcode = "vmovdqu64";
|
|
break;
|
|
default:
|
|
gcc_unreachable ();
|