1  /* { dg-do compile } */
       2  /* { dg-options "-O2 -ftree-vectorize -ffast-math -fno-vect-cost-model" } */
       3  
       4  #include <stdint.h>
       5  
       6  #define TEST_LOOP(NAME, OUTTYPE, INTYPE, MASKTYPE)		\
       7    void __attribute__ ((noinline, noclone))			\
       8    NAME##_4 (OUTTYPE *__restrict dest, INTYPE *__restrict src,	\
       9  	    MASKTYPE *__restrict cond, INTYPE bias, intptr_t n)	\
      10    {								\
      11      for (intptr_t i = 0; i < n; ++i)				\
      12        {								\
      13  	INTYPE value = src[i] + bias;				\
      14  	if (cond[i])						\
      15  	  {							\
      16  	    dest[i * 4] = value;				\
      17  	    dest[i * 4 + 1] = value;				\
      18  	    dest[i * 4 + 2] = value;				\
      19  	    dest[i * 4 + 3] = value;				\
      20  	  }							\
      21        }								\
      22    }
      23  
      24  #define TEST2(NAME, OUTTYPE, INTYPE) \
      25    TEST_LOOP (NAME##_i8, OUTTYPE, INTYPE, int8_t) \
      26    TEST_LOOP (NAME##_i16, OUTTYPE, INTYPE, uint16_t) \
      27    TEST_LOOP (NAME##_f32, OUTTYPE, INTYPE, float) \
      28    TEST_LOOP (NAME##_f64, OUTTYPE, INTYPE, double)
      29  
      30  #define TEST1(NAME, OUTTYPE) \
      31    TEST2 (NAME##_i8, OUTTYPE, int8_t) \
      32    TEST2 (NAME##_i16, OUTTYPE, uint16_t) \
      33    TEST2 (NAME##_i32, OUTTYPE, int32_t) \
      34    TEST2 (NAME##_i64, OUTTYPE, uint64_t)
      35  
      36  #define TEST(NAME) \
      37    TEST1 (NAME##_i8, int8_t) \
      38    TEST1 (NAME##_i16, uint16_t) \
      39    TEST1 (NAME##_i32, int32_t) \
      40    TEST1 (NAME##_i64, uint64_t) \
      41    TEST2 (NAME##_f16_f16, _Float16, _Float16) \
      42    TEST2 (NAME##_f32_f32, float, float) \
      43    TEST2 (NAME##_f64_f64, double, double)
      44  
      45  TEST (test)
      46  
      47  /*    Mask |  8 16 32 64
      48      -------+------------
      49      In   8 |  1  1  1  1
      50          16 |  1  1  1  1
      51          32 |  1  1  1  1
      52          64 |  1  1  1  1.  */
      53  /* { dg-final { scan-assembler-times {\tst4b\t.z[0-9]} 16 } } */
      54  
      55  /*    Mask |  8 16 32 64
      56      -------+------------
      57      In   8 |  2  2  2  2
      58          16 |  2  1  1  1 x2 (for half float)
      59          32 |  2  1  1  1
      60          64 |  2  1  1  1.  */
      61  /* { dg-final { scan-assembler-times {\tst4h\t.z[0-9]} 28 } } */
      62  
      63  /*    Mask |  8 16 32 64
      64      -------+------------
      65      In   8 |  4  4  4  4
      66          16 |  4  2  2  2
      67          32 |  4  2  1  1 x2 (for float)
      68          64 |  4  2  1  1.  */
      69  /* { dg-final { scan-assembler-times {\tst4w\t.z[0-9]} 50 } } */
      70  
      71  /*    Mask |  8 16 32 64
      72      -------+------------
      73      In   8 |  8  8  8  8
      74          16 |  8  4  4  4
      75          32 |  8  4  2  2
      76          64 |  8  4  2  1 x2 (for double).  */
      77  /* { dg-final { scan-assembler-times {\tst4d\t.z[0-9]} 98 } } */