(root)/
gcc-13.2.0/
gcc/
testsuite/
gcc.target/
x86_64/
abi/
bf16/
m256bf16/
args.h
       1  #ifndef INCLUDED_ARGS_H
       2  #define INCLUDED_ARGS_H
       3  
       4  #include <immintrin.h>
       5  #include <string.h>
       6  
       7  /* Assertion macro.  */
       8  #define assert(test) if (!(test)) abort()
       9  
      10  #ifdef __GNUC__
      11  #define ATTRIBUTE_UNUSED __attribute__((__unused__))
      12  #else
      13  #define ATTRIBUTE_UNUSED
      14  #endif
      15  
      16  /* This defines the calling sequences for integers and floats.  */
      17  #define I0 rdi
      18  #define I1 rsi
      19  #define I2 rdx
      20  #define I3 rcx
      21  #define I4 r8
      22  #define I5 r9
      23  #define F0 ymm0
      24  #define F1 ymm1
      25  #define F2 ymm2
      26  #define F3 ymm3
      27  #define F4 ymm4
      28  #define F5 ymm5
      29  #define F6 ymm6
      30  #define F7 ymm7
      31  
      32  typedef union {
      33    __bf16 ___bf16[16];
      34    float _float[8];
      35    double _double[4];
      36    long long _longlong[4];
      37    int _int[8];
      38    unsigned long long _ulonglong[4];
      39    __m64 _m64[4];
      40    __m128 _m128[2];
      41    __m256 _m256[1];
      42    __m256bf16 _m256bf16[1];
      43  } YMM_T;
      44  
      45  typedef union {
      46    float _float;
      47    double _double;
      48    long double _ldouble;
      49    unsigned long long _ulonglong[2];
      50  } X87_T;
      51  extern void (*callthis)(void);
      52  extern unsigned long long rax,rbx,rcx,rdx,rsi,rdi,rsp,rbp,r8,r9,r10,r11,r12,r13,r14,r15;
      53  extern YMM_T ymm_regs[16];
      54  extern X87_T x87_regs[8];
      55  extern volatile unsigned long long volatile_var;
      56  extern void snapshot (void);
      57  extern void snapshot_ret (void);
      58  #define WRAP_CALL(N) \
      59    (callthis = (void (*)()) (N), (typeof (&N)) snapshot)
      60  #define WRAP_RET(N) \
      61    (callthis = (void (*)()) (N), (typeof (&N)) snapshot_ret)
      62  
      63  /* Clear all integer registers.  */
      64  #define clear_int_hardware_registers \
      65    asm __volatile__ ("xor %%rax, %%rax\n\t" \
      66  		    "xor %%rbx, %%rbx\n\t" \
      67  		    "xor %%rcx, %%rcx\n\t" \
      68  		    "xor %%rdx, %%rdx\n\t" \
      69  		    "xor %%rsi, %%rsi\n\t" \
      70  		    "xor %%rdi, %%rdi\n\t" \
      71  		    "xor %%r8, %%r8\n\t" \
      72  		    "xor %%r9, %%r9\n\t" \
      73  		    "xor %%r10, %%r10\n\t" \
      74  		    "xor %%r11, %%r11\n\t" \
      75  		    "xor %%r12, %%r12\n\t" \
      76  		    "xor %%r13, %%r13\n\t" \
      77  		    "xor %%r14, %%r14\n\t" \
      78  		    "xor %%r15, %%r15\n\t" \
      79  		    ::: "rax", "rbx", "rcx", "rdx", "rsi", "rdi", "r8", \
      80  		    "r9", "r10", "r11", "r12", "r13", "r14", "r15");
      81  
      82  /* This is the list of registers available for passing arguments. Not all of
      83     these are used or even really available.  */
      84  struct IntegerRegisters
      85  {
      86    unsigned long long rax, rbx, rcx, rdx, rsi, rdi, r8, r9, r10, r11, r12, r13, r14, r15;
      87  };
      88  struct FloatRegisters
      89  {
      90    double mm0, mm1, mm2, mm3, mm4, mm5, mm6, mm7;
      91    long double st0, st1, st2, st3, st4, st5, st6, st7;
      92    YMM_T ymm0, ymm1, ymm2, ymm3, ymm4, ymm5, ymm6, ymm7, ymm8, ymm9,
      93          ymm10, ymm11, ymm12, ymm13, ymm14, ymm15;
      94  };
      95  
      96  /* Implemented in scalarargs.c  */
      97  extern struct IntegerRegisters iregs;
      98  extern struct FloatRegisters fregs;
      99  extern unsigned int num_iregs, num_fregs;
     100  
     101  /* Clear register struct.  */
     102  #define clear_struct_registers \
     103    rax = rbx = rcx = rdx = rdi = rsi = rbp = rsp \
     104      = r8 = r9 = r10 = r11 = r12 = r13 = r14 = r15 = 0; \
     105    memset (&iregs, 0, sizeof (iregs)); \
     106    memset (&fregs, 0, sizeof (fregs)); \
     107    memset (ymm_regs, 0, sizeof (ymm_regs)); \
     108    memset (x87_regs, 0, sizeof (x87_regs));
     109  
     110  /* Clear both hardware and register structs for integers.  */
     111  #define clear_int_registers \
     112    clear_struct_registers \
     113    clear_int_hardware_registers
     114  
     115  #define check_vector_arguments(T,O) do { \
     116    assert (num_fregs <= 0 \
     117  	  || memcmp (((char *) &fregs.ymm0) + (O), \
     118  		     &ymm_regs[0], \
     119  		     sizeof (__ ## T) - (O)) == 0); \
     120    assert (num_fregs <= 1 \
     121  	  || memcmp (((char *) &fregs.ymm1) + (O), \
     122  		     &ymm_regs[1], \
     123  		     sizeof (__ ## T) - (O)) == 0); \
     124    assert (num_fregs <= 2 \
     125  	  || memcmp (((char *) &fregs.ymm2) + (O), \
     126  		     &ymm_regs[2], \
     127  		     sizeof (__ ## T) - (O)) == 0); \
     128    assert (num_fregs <= 3 \
     129  	  || memcmp (((char *) &fregs.ymm3) + (O), \
     130  		     &ymm_regs[3], \
     131  		     sizeof (__ ## T) - (O)) == 0); \
     132    assert (num_fregs <= 4 \
     133  	  || memcmp (((char *) &fregs.ymm4) + (O), \
     134  		     &ymm_regs[4], \
     135  		     sizeof (__ ## T) - (O)) == 0); \
     136    assert (num_fregs <= 5 \
     137  	  || memcmp (((char *) &fregs.ymm5) + (O), \
     138  		     &ymm_regs[5], \
     139  		     sizeof (__ ## T) - (O)) == 0); \
     140    assert (num_fregs <= 6 \
     141  	  || memcmp (((char *) &fregs.ymm6) + (O), \
     142  		     &ymm_regs[6], \
     143  		     sizeof (__ ## T) - (O)) == 0); \
     144    assert (num_fregs <= 7 \
     145  	  || memcmp (((char *) &fregs.ymm7) + (O), \
     146  		     &ymm_regs[7], \
     147  		     sizeof (__ ## T) - (O)) == 0); \
     148    } while (0)
     149  
     150  #define check_m256_arguments check_vector_arguments(m256, 0)
     151  
     152  #endif /* INCLUDED_ARGS_H  */