1  /* { dg-do compile { target lp64 } } */
       2  /* { dg-options "-O -mlittle-endian -fno-stack-clash-protection -g" } */
       3  /* { dg-final { check-function-bodies "**" "" } } */
       4  
       5  #pragma GCC aarch64 "arm_sve.h"
       6  
       7  /*
       8  ** callee1:
       9  **	...
      10  **	ldr	(z[0-9]+), \[x1, #3, mul vl\]
      11  **	...
      12  **	st4w	{z[0-9]+\.s - \1\.s}, p0, \[x0\]
      13  **	st2w	{z3\.s - z4\.s}, p1, \[x0\]
      14  **	st3w	{z5\.s - z7\.s}, p2, \[x0\]
      15  **	ret
      16  */
      17  void __attribute__((noipa))
      18  callee1 (void *x0, svuint32x3_t z0, svuint32x2_t z3, svuint32x3_t z5,
      19  	 svuint32x4_t stack1, svuint32_t stack2, svbool_t p0,
      20  	 svbool_t p1, svbool_t p2)
      21  {
      22    svst4_u32 (p0, x0, stack1);
      23    svst2_u32 (p1, x0, z3);
      24    svst3_u32 (p2, x0, z5);
      25  }
      26  
      27  /*
      28  ** callee2:
      29  **	ptrue	p3\.b, all
      30  **	ld1w	(z[0-9]+\.s), p3/z, \[x2\]
      31  **	st1w	\1, p0, \[x0\]
      32  **	st2w	{z3\.s - z4\.s}, p1, \[x0\]
      33  **	st3w	{z0\.s - z2\.s}, p2, \[x0\]
      34  **	ret
      35  */
      36  void __attribute__((noipa))
      37  callee2 (void *x0, svuint32x3_t z0, svuint32x2_t z3, svuint32x3_t z5,
      38  	 svuint32x4_t stack1, svuint32_t stack2, svbool_t p0,
      39  	 svbool_t p1, svbool_t p2)
      40  {
      41    svst1_u32 (p0, x0, stack2);
      42    svst2_u32 (p1, x0, z3);
      43    svst3_u32 (p2, x0, z0);
      44  }
      45  
      46  void __attribute__((noipa))
      47  caller (void *x0)
      48  {
      49    svbool_t pg;
      50    pg = svptrue_b8 ();
      51    callee1 (x0,
      52  	   svld3_vnum_u32 (pg, x0, -9),
      53  	   svld2_vnum_u32 (pg, x0, -2),
      54  	   svld3_vnum_u32 (pg, x0, 0),
      55  	   svld4_vnum_u32 (pg, x0, 8),
      56  	   svld1_vnum_u32 (pg, x0, 5),
      57  	   svptrue_pat_b8 (SV_VL1),
      58  	   svptrue_pat_b16 (SV_VL2),
      59  	   svptrue_pat_b32 (SV_VL3));
      60  }
      61  
      62  /* { dg-final { scan-assembler {\tld3w\t{z0\.s - z2\.s}, p[0-7]/z, \[x0, #-9, mul vl\]\n} } } */
      63  /* { dg-final { scan-assembler {\tld2w\t{z3\.s - z4\.s}, p[0-7]/z, \[x0, #-2, mul vl\]\n} } } */
      64  /* { dg-final { scan-assembler {\tld3w\t{z5\.s - z7\.s}, p[0-7]/z, \[x0\]\n} } } */
      65  /* { dg-final { scan-assembler {\tld4w\t{(z[0-9]+)\.s - z[0-9]+\.s}.*\tstr\t\1, \[x1\]\n} } } */
      66  /* { dg-final { scan-assembler {\tld4w\t{z[0-9]+\.s - (z[0-9]+)\.s}.*\tstr\t\1, \[x1, #3, mul vl\]\n} } } */
      67  /* { dg-final { scan-assembler {\tld1w\t(z[0-9]+\.s), p[0-7]/z, \[x0, #5, mul vl\]\n.*\tst1w\t\1, p[0-7], \[x2\]\n} } } */
      68  /* { dg-final { scan-assembler {\tptrue\tp0\.b, vl1\n} } } */
      69  /* { dg-final { scan-assembler {\tptrue\tp1\.h, vl2\n} } } */
      70  /* { dg-final { scan-assembler {\tptrue\tp2\.s, vl3\n} } } */