arm: MVE: Fix constant load pattern

This patch fixes the constant load pattern for MVE, this was not accounting
correctly for label + offset cases.

Added test that ICE'd before and removed the scan assemblers for the mve_vector*
tests as they were too fragile.

gcc/ChangeLog:
2020-04-07  Andre Vieira  <andre.simoesdiasvieira@arm.com>

	* config/arm/arm.c (output_move_neon): Deal with label + offset cases.
	* config/arm/mve.md (*mve_mov<mode>): Handle const vectors.

gcc/testsuite/ChangeLog:
2020-04-07  Andre Vieira  <andre.simoesdiasvieira@arm.com>

	* gcc.target/arm/mve/intrinsics/mve_load_from_array.c: New test.
	* gcc.target/arm/mve/intrinsics/mve_vector_float.c: Remove
	scan-assembler.
	* gcc.target/arm/mve/intrinsics/mve_vector_float1.c: Likewise.
	* gcc.target/arm/mve/intrinsics/mve_vector_int1.c: Likewise.
	* gcc.target/arm/mve/intrinsics/mve_vector_int2.c: Likewise.
This commit is contained in:
Andre Simoes Dias Vieira 2020-04-07 13:36:43 +01:00 committed by Andre Vieira
parent 3ce755a80d
commit b094133c1c
9 changed files with 59 additions and 82 deletions

View File

@ -1,3 +1,8 @@
2020-04-07 Andre Vieira <andre.simoesdiasvieira@arm.com>
* config/arm/arm.c (output_move_neon): Deal with label + offset cases.
* config/arm/mve.md (*mve_mov<mode>): Handle const vectors.
2020-04-07 Andre Vieira <andre.simoesdiasvieira@arm.com>
* config/arm/arm_mve.h: Remove use of typeof for addr pointer parameters

View File

@ -20122,52 +20122,43 @@ output_move_neon (rtx *operands)
break;
}
/* Fall through. */
case LABEL_REF:
case PLUS:
addr = XEXP (addr, 0);
/* Fall through. */
case LABEL_REF:
{
int i;
int overlap = -1;
if (TARGET_HAVE_MVE && !BYTES_BIG_ENDIAN
&& GET_CODE (addr) != LABEL_REF)
for (i = 0; i < nregs; i++)
{
sprintf (buff, "v%srw.32\t%%q0, %%1", load ? "ld" : "st");
ops[0] = reg;
ops[1] = mem;
output_asm_insn (buff, ops);
}
else
{
for (i = 0; i < nregs; i++)
/* We're only using DImode here because it's a convenient
size. */
ops[0] = gen_rtx_REG (DImode, REGNO (reg) + 2 * i);
ops[1] = adjust_address (mem, DImode, 8 * i);
if (reg_overlap_mentioned_p (ops[0], mem))
{
/* We're only using DImode here because it's a convenient
size. */
ops[0] = gen_rtx_REG (DImode, REGNO (reg) + 2 * i);
ops[1] = adjust_address (mem, DImode, 8 * i);
if (reg_overlap_mentioned_p (ops[0], mem))
{
gcc_assert (overlap == -1);
overlap = i;
}
else
{
if (TARGET_HAVE_MVE && GET_CODE (addr) == LABEL_REF)
sprintf (buff, "v%sr.64\t%%P0, %%1", load ? "ld" : "st");
else
sprintf (buff, "v%sr%%?\t%%P0, %%1", load ? "ld" : "st");
output_asm_insn (buff, ops);
}
gcc_assert (overlap == -1);
overlap = i;
}
if (overlap != -1)
else
{
ops[0] = gen_rtx_REG (DImode, REGNO (reg) + 2 * overlap);
ops[1] = adjust_address (mem, SImode, 8 * overlap);
if (TARGET_HAVE_MVE && GET_CODE (addr) == LABEL_REF)
sprintf (buff, "v%sr.32\t%%P0, %%1", load ? "ld" : "st");
sprintf (buff, "v%sr.64\t%%P0, %%1", load ? "ld" : "st");
else
sprintf (buff, "v%sr%%?\t%%P0, %%1", load ? "ld" : "st");
output_asm_insn (buff, ops);
}
}
if (overlap != -1)
{
ops[0] = gen_rtx_REG (DImode, REGNO (reg) + 2 * overlap);
ops[1] = adjust_address (mem, SImode, 8 * overlap);
if (TARGET_HAVE_MVE && GET_CODE (addr) == LABEL_REF)
sprintf (buff, "v%sr.32\t%%P0, %%1", load ? "ld" : "st");
else
sprintf (buff, "v%sr%%?\t%%P0, %%1", load ? "ld" : "st");
output_asm_insn (buff, ops);
}
return "";
}

View File

@ -695,9 +695,9 @@
case 2:
return "vmov\t%Q0, %R0, %e1 @ <mode>\;vmov\t%J0, %K0, %f1";
case 4:
if ((TARGET_HAVE_MVE_FLOAT && VALID_MVE_SF_MODE (<MODE>mode))
|| (MEM_P (operands[1])
&& GET_CODE (XEXP (operands[1], 0)) == LABEL_REF))
if (MEM_P (operands[1])
&& (GET_CODE (XEXP (operands[1], 0)) == LABEL_REF
|| GET_CODE (XEXP (operands[1], 0)) == CONST))
return output_move_neon (operands);
else
return "vldrb.8 %q0, %E1";

View File

@ -1,3 +1,12 @@
2020-04-07 Andre Vieira <andre.simoesdiasvieira@arm.com>
* gcc.target/arm/mve/intrinsics/mve_load_from_array.c: New test.
* gcc.target/arm/mve/intrinsics/mve_vector_float.c: Remove
scan-assembler.
* gcc.target/arm/mve/intrinsics/mve_vector_float1.c: Likewise.
* gcc.target/arm/mve/intrinsics/mve_vector_int1.c: Likewise.
* gcc.target/arm/mve/intrinsics/mve_vector_int2.c: Likewise.
2020-04-07 Andre Vieira <andre.simoesdiasvieira@arm.com>
* gcc.target/arm/mve/intrinsics/vmulq_n_f16.c: Fix test.

View File

@ -0,0 +1,19 @@
/* { dg-require-effective-target arm_v8_1m_mve_ok } */
/* { dg-add-options arm_v8_1m_mve } */
/* { dg-additional-options "-O2" } */
#include "arm_mve.h"
uint16x8_t
foo (void)
{
static uint16_t const a[] = {0, 1, 2, 3, 4, 5, 6, 7};
return vld1q (a);
}
uint16_t b[] = {0, 1, 2, 3, 4, 5, 6, 7};
void
bar (uint16x8_t value)
{
vst1q (b, value);
}

View File

@ -11,17 +11,9 @@ foo32 (float32x4_t value)
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldmia.*" } } */
float16x8_t
foo16 (float16x8_t value)
{
float16x8_t b = value;
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldmia.*" } } */

View File

@ -13,10 +13,6 @@ foo32 ()
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldmia.*" } } */
float16x8_t value1;
float16x8_t
@ -25,7 +21,3 @@ foo16 ()
float16x8_t b = value1;
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldmia.*" } } */

View File

@ -16,10 +16,6 @@ foo8 (void)
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldrb.8*" } } */
int16x8_t
foo16 (void)
{
@ -27,10 +23,6 @@ foo16 (void)
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldrb.8*" } } */
int32x4_t
foo32 (void)
{
@ -38,10 +30,6 @@ foo32 (void)
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldrb.8" } } */
int64x2_t
foo64 (void)
{
@ -49,6 +37,3 @@ foo64 (void)
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldrb.8" } } */

View File

@ -11,10 +11,6 @@ foo8 ()
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldr.64.*" } } */
int16x8_t
foo16 (int16x8_t value)
{
@ -22,10 +18,6 @@ foo16 (int16x8_t value)
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldr.64.*" } } */
int32x4_t
foo32 (int32x4_t value)
{
@ -33,17 +25,9 @@ foo32 (int32x4_t value)
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldr.64.*" } } */
int64x2_t
foo64 (int64x2_t value)
{
int64x2_t b = {1};
return b;
}
/* { dg-final { scan-assembler "vmov\\tq\[0-7\], q\[0-7\]" } } */
/* { dg-final { scan-assembler "vstrb.*" } } */
/* { dg-final { scan-assembler "vldr.64.*" } } */