1  /* Disabling epilogues until we find a better way to deal with scans.  */
       2  /* { dg-additional-options "--param vect-epilogues-nomask=0" } */
       3  /* { dg-require-effective-target vect_int } */
       4  
       5  #include <stdarg.h>
       6  #include "tree-vect.h"
       7  
       8  #define N 64
       9  
      10  #define DOT 43680
      11  
      12  unsigned char X[N] __attribute__ ((__aligned__(__BIGGEST_ALIGNMENT__))) = {0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63};
      13  unsigned char Y[N] __attribute__ ((__aligned__(__BIGGEST_ALIGNMENT__))) = {64,63,62,61,60,59,58,57,56,55,54,53,52,51,50,49,48,47,46,45,44,43,42,41,40,39,38,37,36,35,34,33,32,31,30,29,28,27,26,25,24,23,22,21,20,19,18,17,16,15,14,13,12,11,10,9,8,7,6,5,4,3,2,1};
      14  
      15  /* char->short->short dot product. 
      16     Detected as a dot-product pattern.
      17     Should be vectorized on targets that support dot-product for unsigned chars,
      18     but currently this test cannot be vectorized as a dot-product on targets
      19     that support char->short->int dot-product. 
      20     Alternatively, this test can be vectorized using vect_widen_mult_qi (or
   vect_unpack and non-widening multiplication: vect_unpack && vect_short_mult).
      22     */
      23  __attribute__ ((noinline)) unsigned short
      24  foo (int len) {
      25    int i;
      26    unsigned short result = 0;
      27  
      28    for (i=0; i<len; i++) {
      29      result += (unsigned short)(X[i] * Y[i]);
      30    }
      31    return result;
      32  }
      33  
      34  int main (void)
      35  {
      36    unsigned short dot;
      37    int i;
      38  
      39    check_vect ();
      40  
      41    dot = foo (N);
      42    if (dot != DOT)
      43      abort ();
      44  
      45    return 0;
      46  }
      47  
      48  /* { dg-final { scan-tree-dump-times "vect_recog_dot_prod_pattern: detected" 1 "vect" } } */
      49  
      50  /* When the vectorizer is enhanced to vectorize accumulation into short for 
      51     targets that support accumulation into int (powerpc, ia64) we'd have:
      52  dg-final { scan-tree-dump-times "vectorized 1 loops" 1 "vect" { target vect_udot_qi || vect_widen_mult_qi_to_hi } }
      53  */
      54  /* { dg-final { scan-tree-dump-times "vectorized 1 loops" 1 "vect" {target { vect_widen_mult_qi_to_hi || vect_unpack } } } } */
      55  
      56