/* { dg-do compile { target { ! ia32 } } } */
/* { dg-options "-O2 -march=sandybridge" } */
       3  
       4  #include <stdint.h>
       5  #include <string.h>
       6  
       7  static const char b100_tab[200] = {
       8      '0', '0', '0', '1', '0', '2', '0', '3', '0', '4',
       9      '0', '5', '0', '6', '0', '7', '0', '8', '0', '9',
      10      '1', '0', '1', '1', '1', '2', '1', '3', '1', '4',
      11      '1', '5', '1', '6', '1', '7', '1', '8', '1', '9',
      12      '2', '0', '2', '1', '2', '2', '2', '3', '2', '4',
      13      '2', '5', '2', '6', '2', '7', '2', '8', '2', '9',
      14      '3', '0', '3', '1', '3', '2', '3', '3', '3', '4',
      15      '3', '5', '3', '6', '3', '7', '3', '8', '3', '9',
      16      '4', '0', '4', '1', '4', '2', '4', '3', '4', '4',
      17      '4', '5', '4', '6', '4', '7', '4', '8', '4', '9',
      18      '5', '0', '5', '1', '5', '2', '5', '3', '5', '4',
      19      '5', '5', '5', '6', '5', '7', '5', '8', '5', '9',
      20      '6', '0', '6', '1', '6', '2', '6', '3', '6', '4',
      21      '6', '5', '6', '6', '6', '7', '6', '8', '6', '9',
      22      '7', '0', '7', '1', '7', '2', '7', '3', '7', '4',
      23      '7', '5', '7', '6', '7', '7', '7', '8', '7', '9',
      24      '8', '0', '8', '1', '8', '2', '8', '3', '8', '4',
      25      '8', '5', '8', '6', '8', '7', '8', '8', '8', '9',
      26      '9', '0', '9', '1', '9', '2', '9', '3', '9', '4',
      27      '9', '5', '9', '6', '9', '7', '9', '8', '9', '9',
      28  };
      29  
      30  void uint64_to_ascii_ta7_32_base100(uint64_t val, char *dst) {
      31    const int64_t POW10_10 = ((int64_t)10) * 1000 * 1000 * 1000;
      32    const uint64_t POW2_57_DIV_POW100_4 =
      33        ((int64_t)(1) << 57) / 100 / 100 / 100 / 100 + 1;
      34    const uint64_t MASK32 = ((int64_t)(1) << 32) - 1;
      35    int64_t hix = val / POW10_10;
      36    int64_t lox = val % POW10_10;
      37    int64_t lor = lox & (uint64_t)(-2);
      38    uint64_t hi = hix * POW2_57_DIV_POW100_4;
      39    uint64_t lo = lor * POW2_57_DIV_POW100_4;
      40    memcpy(dst + 0 * 10 + 0, &b100_tab[(hi >> 57) * 2], 2);
      41    memcpy(dst + 1 * 10 + 0, &b100_tab[(lo >> 57) * 2], 2);
      42    hi = (hi >> 25) + 1;
      43    lo = (lo >> 25) + 1;
      44    hi = (hi & MASK32) * 100;
      45    lo = (lo & MASK32) * 100;
      46    memcpy(dst + 0 * 10 + 2, &b100_tab[(hi >> 32) * 2], 2);
      47    hi = (hi & MASK32) * 100;
      48    memcpy(dst + 1 * 10 + 2, &b100_tab[(lo >> 32) * 2], 2);
      49    lo = (lo & MASK32) * 100;
      50    memcpy(dst + 0 * 10 + 4, &b100_tab[(hi >> 32) * 2], 2);
      51    hi = (hi & MASK32) * 100;
      52    memcpy(dst + 1 * 10 + 4, &b100_tab[(lo >> 32) * 2], 2);
      53    lo = (lo & MASK32) * 100;
      54    memcpy(dst + 0 * 10 + 6, &b100_tab[(hi >> 32) * 2], 2);
      55    hi = (hi & MASK32) * 100;
      56    memcpy(dst + 1 * 10 + 6, &b100_tab[(lo >> 32) * 2], 2);
      57    lo = (lo & MASK32) * 100;
      58    hi >>= 32;
      59    lo >>= 32;
      60    lo = (lo & (-2)) | (lox & 1);
      61    memcpy(dst + 0 * 10 + 8, &b100_tab[hi * 2], 2);
      62    memcpy(dst + 1 * 10 + 8, &b100_tab[lo * 2], 2);
      63    dst[2 * 10] = 0;
      64  }
      65  
/* { dg-final { scan-assembler-times "imulq" 11 } } */