1  /* Copyright (C) 2013-2023 Free Software Foundation, Inc.
       2  
       3     This file is part of GCC.
       4  
       5     GCC is free software; you can redistribute it and/or modify
       6     it under the terms of the GNU General Public License as published by
       7     the Free Software Foundation; either version 3, or (at your option)
       8     any later version.
       9  
      10     GCC is distributed in the hope that it will be useful,
      11     but WITHOUT ANY WARRANTY; without even the implied warranty of
      12     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
      13     GNU General Public License for more details.
      14  
      15     Under Section 7 of GPL version 3, you are granted additional
      16     permissions described in the GCC Runtime Library Exception, version
      17     3.1, as published by the Free Software Foundation.
      18  
      19     You should have received a copy of the GNU General Public License and
      20     a copy of the GCC Runtime Library Exception along with this program;
      21     see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
      22     <http://www.gnu.org/licenses/>.  */
      23  
      24  #ifndef _IMMINTRIN_H_INCLUDED
      25  #error "Never use <avx512vbmivlintrin.h> directly; include <immintrin.h> instead."
      26  #endif
      27  
      28  #ifndef _AVX512VBMIVLINTRIN_H_INCLUDED
      29  #define _AVX512VBMIVLINTRIN_H_INCLUDED
      30  
      31  #if !defined(__AVX512VL__) || !defined(__AVX512VBMI__)
      32  #pragma GCC push_options
      33  #pragma GCC target("avx512vbmi,avx512vl")
      34  #define __DISABLE_AVX512VBMIVL__
#endif /* !__AVX512VL__ || !__AVX512VBMI__ */
      36  
      37  extern __inline __m256i
      38  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
      39  _mm256_mask_multishift_epi64_epi8 (__m256i __W, __mmask32 __M, __m256i __X, __m256i __Y)
      40  {
      41    return (__m256i) __builtin_ia32_vpmultishiftqb256_mask ((__v32qi) __X,
      42  							  (__v32qi) __Y,
      43  							  (__v32qi) __W,
      44  							  (__mmask32) __M);
      45  }
      46  
      47  extern __inline __m256i
      48  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
      49  _mm256_maskz_multishift_epi64_epi8 (__mmask32 __M, __m256i __X, __m256i __Y)
      50  {
      51    return (__m256i) __builtin_ia32_vpmultishiftqb256_mask ((__v32qi) __X,
      52  							  (__v32qi) __Y,
      53  							  (__v32qi)
      54  							  _mm256_setzero_si256 (),
      55  							  (__mmask32) __M);
      56  }
      57  
      58  extern __inline __m256i
      59  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
      60  _mm256_multishift_epi64_epi8 (__m256i __X, __m256i __Y)
      61  {
      62    return (__m256i) __builtin_ia32_vpmultishiftqb256_mask ((__v32qi) __X,
      63  							  (__v32qi) __Y,
      64  							  (__v32qi)
      65  							  _mm256_undefined_si256 (),
      66  							  (__mmask32) -1);
      67  }
      68  
      69  extern __inline __m128i
      70  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
      71  _mm_mask_multishift_epi64_epi8 (__m128i __W, __mmask16 __M, __m128i __X, __m128i __Y)
      72  {
      73    return (__m128i) __builtin_ia32_vpmultishiftqb128_mask ((__v16qi) __X,
      74  							  (__v16qi) __Y,
      75  							  (__v16qi) __W,
      76  							  (__mmask16) __M);
      77  }
      78  
      79  extern __inline __m128i
      80  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
      81  _mm_maskz_multishift_epi64_epi8 (__mmask16 __M, __m128i __X, __m128i __Y)
      82  {
      83    return (__m128i) __builtin_ia32_vpmultishiftqb128_mask ((__v16qi) __X,
      84  							  (__v16qi) __Y,
      85  							  (__v16qi)
      86  							  _mm_setzero_si128 (),
      87  							  (__mmask16) __M);
      88  }
      89  
      90  extern __inline __m128i
      91  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
      92  _mm_multishift_epi64_epi8 (__m128i __X, __m128i __Y)
      93  {
      94    return (__m128i) __builtin_ia32_vpmultishiftqb128_mask ((__v16qi) __X,
      95  							  (__v16qi) __Y,
      96  							  (__v16qi)
      97  							  _mm_undefined_si128 (),
      98  							  (__mmask16) -1);
      99  }
     100  
     101  extern __inline __m256i
     102  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     103  _mm256_permutexvar_epi8 (__m256i __A, __m256i __B)
     104  {
     105    return (__m256i) __builtin_ia32_permvarqi256_mask ((__v32qi) __B,
     106  						     (__v32qi) __A,
     107  						     (__v32qi)
     108  						     _mm256_undefined_si256 (),
     109  						     (__mmask32) -1);
     110  }
     111  
     112  extern __inline __m256i
     113  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     114  _mm256_maskz_permutexvar_epi8 (__mmask32 __M, __m256i __A,
     115  				__m256i __B)
     116  {
     117    return (__m256i) __builtin_ia32_permvarqi256_mask ((__v32qi) __B,
     118  						     (__v32qi) __A,
     119  						     (__v32qi)
     120  						     _mm256_setzero_si256 (),
     121  						     (__mmask32) __M);
     122  }
     123  
     124  extern __inline __m256i
     125  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     126  _mm256_mask_permutexvar_epi8 (__m256i __W, __mmask32 __M, __m256i __A,
     127  			       __m256i __B)
     128  {
     129    return (__m256i) __builtin_ia32_permvarqi256_mask ((__v32qi) __B,
     130  						     (__v32qi) __A,
     131  						     (__v32qi) __W,
     132  						     (__mmask32) __M);
     133  }
     134  
     135  extern __inline __m128i
     136  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     137  _mm_permutexvar_epi8 (__m128i __A, __m128i __B)
     138  {
     139    return (__m128i) __builtin_ia32_permvarqi128_mask ((__v16qi) __B,
     140  						     (__v16qi) __A,
     141  						     (__v16qi)
     142  						     _mm_undefined_si128 (),
     143  						     (__mmask16) -1);
     144  }
     145  
     146  extern __inline __m128i
     147  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     148  _mm_maskz_permutexvar_epi8 (__mmask16 __M, __m128i __A, __m128i __B)
     149  {
     150    return (__m128i) __builtin_ia32_permvarqi128_mask ((__v16qi) __B,
     151  						     (__v16qi) __A,
     152  						     (__v16qi)
     153  						     _mm_setzero_si128 (),
     154  						     (__mmask16) __M);
     155  }
     156  
     157  extern __inline __m128i
     158  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     159  _mm_mask_permutexvar_epi8 (__m128i __W, __mmask16 __M, __m128i __A,
     160  			    __m128i __B)
     161  {
     162    return (__m128i) __builtin_ia32_permvarqi128_mask ((__v16qi) __B,
     163  						     (__v16qi) __A,
     164  						     (__v16qi) __W,
     165  						     (__mmask16) __M);
     166  }
     167  
     168  extern __inline __m256i
     169  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     170  _mm256_permutex2var_epi8 (__m256i __A, __m256i __I, __m256i __B)
     171  {
     172    return (__m256i) __builtin_ia32_vpermt2varqi256_mask ((__v32qi) __I
     173  							/* idx */ ,
     174  							(__v32qi) __A,
     175  							(__v32qi) __B,
     176  							(__mmask32) -1);
     177  }
     178  
     179  extern __inline __m256i
     180  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     181  _mm256_mask_permutex2var_epi8 (__m256i __A, __mmask32 __U,
     182  				__m256i __I, __m256i __B)
     183  {
     184    return (__m256i) __builtin_ia32_vpermt2varqi256_mask ((__v32qi) __I
     185  							/* idx */ ,
     186  							(__v32qi) __A,
     187  							(__v32qi) __B,
     188  							(__mmask32)
     189  							__U);
     190  }
     191  
     192  extern __inline __m256i
     193  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     194  _mm256_mask2_permutex2var_epi8 (__m256i __A, __m256i __I,
     195  				 __mmask32 __U, __m256i __B)
     196  {
     197    return (__m256i) __builtin_ia32_vpermi2varqi256_mask ((__v32qi) __A,
     198  							(__v32qi) __I
     199  							/* idx */ ,
     200  							(__v32qi) __B,
     201  							(__mmask32)
     202  							__U);
     203  }
     204  
     205  extern __inline __m256i
     206  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     207  _mm256_maskz_permutex2var_epi8 (__mmask32 __U, __m256i __A,
     208  				 __m256i __I, __m256i __B)
     209  {
     210    return (__m256i) __builtin_ia32_vpermt2varqi256_maskz ((__v32qi) __I
     211  							 /* idx */ ,
     212  							 (__v32qi) __A,
     213  							 (__v32qi) __B,
     214  							 (__mmask32)
     215  							 __U);
     216  }
     217  
     218  extern __inline __m128i
     219  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     220  _mm_permutex2var_epi8 (__m128i __A, __m128i __I, __m128i __B)
     221  {
     222    return (__m128i) __builtin_ia32_vpermt2varqi128_mask ((__v16qi) __I
     223  							/* idx */ ,
     224  							(__v16qi) __A,
     225  							(__v16qi) __B,
     226  							(__mmask16) -1);
     227  }
     228  
     229  extern __inline __m128i
     230  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     231  _mm_mask_permutex2var_epi8 (__m128i __A, __mmask16 __U, __m128i __I,
     232  			     __m128i __B)
     233  {
     234    return (__m128i) __builtin_ia32_vpermt2varqi128_mask ((__v16qi) __I
     235  							/* idx */ ,
     236  							(__v16qi) __A,
     237  							(__v16qi) __B,
     238  							(__mmask16)
     239  							__U);
     240  }
     241  
     242  extern __inline __m128i
     243  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     244  _mm_mask2_permutex2var_epi8 (__m128i __A, __m128i __I, __mmask16 __U,
     245  			      __m128i __B)
     246  {
     247    return (__m128i) __builtin_ia32_vpermi2varqi128_mask ((__v16qi) __A,
     248  							(__v16qi) __I
     249  							/* idx */ ,
     250  							(__v16qi) __B,
     251  							(__mmask16)
     252  							__U);
     253  }
     254  
     255  extern __inline __m128i
     256  __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     257  _mm_maskz_permutex2var_epi8 (__mmask16 __U, __m128i __A, __m128i __I,
     258  			      __m128i __B)
     259  {
     260    return (__m128i) __builtin_ia32_vpermt2varqi128_maskz ((__v16qi) __I
     261  							 /* idx */ ,
     262  							 (__v16qi) __A,
     263  							 (__v16qi) __B,
     264  							 (__mmask16)
     265  							 __U);
     266  }
     267  
     268  #ifdef __DISABLE_AVX512VBMIVL__
     269  #undef __DISABLE_AVX512VBMIVL__
     270  #pragma GCC pop_options
     271  #endif /* __DISABLE_AVX512VBMIVL__ */
     272  
     273  #endif /* _AVX512VBMIVLINTRIN_H_INCLUDED */