1  /* { dg-options "-O2 -ftree-vectorize -fno-tree-loop-distribute-patterns" } */
       2  
       3  #include <stdint.h>
       4  
       /* Define a function f_<TYPE1>_<TYPE2> that, for each i in [0, n),
          adds src1[i] into dst1[i] (both arrays of TYPE1) and stores the
          constant 1 to dst2[i] (an array of TYPE2).  All three pointers are
          restrict-qualified, so the two statements share one loop over
          arrays with different element types.  The dg-final directives in
          this file count the instructions generated for these loops, so the
          loop body should not be restructured.  */
       5  #define TEST_LOOP(TYPE1, TYPE2)						\
       6    void									\
       7    f_##TYPE1##_##TYPE2 (TYPE1 *restrict dst1, TYPE1 *restrict src1,	\
       8  		       TYPE2 *restrict dst2, int n)			\
       9    {									\
      10      for (int i = 0; i < n; ++i)						\
      11        {									\
      12  	dst1[i] += src1[i];						\
      13  	dst2[i] = 1;							\
      14        }									\
      15    }
      16  
      /* Apply T to each (TYPE1, TYPE2) pair under test.  In every pair
         TYPE2 is half as wide as TYPE1 (assuming a 32-bit float); the list
         covers both integer and floating-point choices of TYPE2.  The
         number of pairs feeds directly into the scan-assembler-times
         counts in the dg-final directives.  */
      17  #define TEST_ALL(T) \
      18    T (uint16_t, uint8_t) \
      19    T (uint32_t, uint16_t) \
      20    T (uint32_t, _Float16) \
      21    T (uint64_t, uint32_t) \
      22    T (uint64_t, float)
      23  
      /* Instantiate TEST_LOOP once for each of the five type pairs listed
         in TEST_ALL, emitting one f_<TYPE1>_<TYPE2> function per pair.  */
      24  TEST_ALL (TEST_LOOP)
      25  
      26  /* { dg-final { scan-assembler-times {\tmov\tz[0-9]+\.b, #1\n} 1 } } */
      27  /* { dg-final { scan-assembler-times {\tmov\tz[0-9]+\.h, #1\n} 1 } } */
      28  /* { dg-final { scan-assembler-times {\tmov\tz[0-9]+\.s, #1\n} 1 } } */
      29  /* { dg-final { scan-assembler-times {\tfmov\tz[0-9]+\.h, #1\.0} 1 } } */
      30  /* { dg-final { scan-assembler-times {\tfmov\tz[0-9]+\.s, #1\.0} 1 } } */
      31  
      32  /* { dg-final { scan-assembler-times {\tst1b\tz[0-9]+\.h,} 1 } } */
      33  /* { dg-final { scan-assembler-times {\tst1h\tz[0-9]+\.s,} 2 } } */
      34  /* { dg-final { scan-assembler-times {\tst1w\tz[0-9]+\.d,} 2 } } */
      35  
      36  /* { dg-final { scan-assembler-times {\tld1h\tz[0-9]+\.h,} 2 } } */
      37  /* { dg-final { scan-assembler-times {\tst1h\tz[0-9]+\.h,} 1 } } */
      38  /* { dg-final { scan-assembler-times {\tld1w\tz[0-9]+\.s,} 4 } } */
      39  /* { dg-final { scan-assembler-times {\tst1w\tz[0-9]+\.s,} 2 } } */
      40  /* { dg-final { scan-assembler-times {\tld1d\tz[0-9]+\.d,} 4 } } */
      41  /* { dg-final { scan-assembler-times {\tst1d\tz[0-9]+\.d,} 2 } } */