@@ -178,16 +178,16 @@ _kadd_mask64(__mmask64 __A, __mmask64 __B)
178
178
}
179
179
180
180
#define _kshiftli_mask32 (A , I ) \
181
- (__mmask32)__builtin_ia32_kshiftlisi((__mmask32)(A), (unsigned int)(I))
181
+ (( __mmask32)__builtin_ia32_kshiftlisi((__mmask32)(A), (unsigned int)(I) ))
182
182
183
183
#define _kshiftri_mask32 (A , I ) \
184
- (__mmask32)__builtin_ia32_kshiftrisi((__mmask32)(A), (unsigned int)(I))
184
+ (( __mmask32)__builtin_ia32_kshiftrisi((__mmask32)(A), (unsigned int)(I) ))
185
185
186
186
#define _kshiftli_mask64 (A , I ) \
187
- (__mmask64)__builtin_ia32_kshiftlidi((__mmask64)(A), (unsigned int)(I))
187
+ (( __mmask64)__builtin_ia32_kshiftlidi((__mmask64)(A), (unsigned int)(I) ))
188
188
189
189
#define _kshiftri_mask64 (A , I ) \
190
- (__mmask64)__builtin_ia32_kshiftridi((__mmask64)(A), (unsigned int)(I))
190
+ (( __mmask64)__builtin_ia32_kshiftridi((__mmask64)(A), (unsigned int)(I) ))
191
191
192
192
static __inline__ unsigned int __DEFAULT_FN_ATTRS
193
193
_cvtmask32_u32 (__mmask32 __A ) {
@@ -232,44 +232,44 @@ _store_mask64(__mmask64 *__A, __mmask64 __B) {
232
232
/* Integer compare */
233
233
234
234
#define _mm512_cmp_epi8_mask (a , b , p ) \
235
- (__mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \
236
- (__v64qi)(__m512i)(b), (int)(p), \
237
- (__mmask64)-1)
235
+ (( __mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \
236
+ (__v64qi)(__m512i)(b), (int)(p), \
237
+ (__mmask64)-1) )
238
238
239
239
#define _mm512_mask_cmp_epi8_mask (m , a , b , p ) \
240
- (__mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \
241
- (__v64qi)(__m512i)(b), (int)(p), \
242
- (__mmask64)(m))
240
+ (( __mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \
241
+ (__v64qi)(__m512i)(b), (int)(p), \
242
+ (__mmask64)(m) ))
243
243
244
244
#define _mm512_cmp_epu8_mask (a , b , p ) \
245
- (__mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \
246
- (__v64qi)(__m512i)(b), (int)(p), \
247
- (__mmask64)-1)
245
+ (( __mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \
246
+ (__v64qi)(__m512i)(b), (int)(p), \
247
+ (__mmask64)-1) )
248
248
249
249
#define _mm512_mask_cmp_epu8_mask (m , a , b , p ) \
250
- (__mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \
251
- (__v64qi)(__m512i)(b), (int)(p), \
252
- (__mmask64)(m))
250
+ (( __mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \
251
+ (__v64qi)(__m512i)(b), (int)(p), \
252
+ (__mmask64)(m) ))
253
253
254
254
#define _mm512_cmp_epi16_mask (a , b , p ) \
255
- (__mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \
256
- (__v32hi)(__m512i)(b), (int)(p), \
257
- (__mmask32)-1)
255
+ (( __mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \
256
+ (__v32hi)(__m512i)(b), (int)(p), \
257
+ (__mmask32)-1) )
258
258
259
259
#define _mm512_mask_cmp_epi16_mask (m , a , b , p ) \
260
- (__mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \
261
- (__v32hi)(__m512i)(b), (int)(p), \
262
- (__mmask32)(m))
260
+ (( __mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \
261
+ (__v32hi)(__m512i)(b), (int)(p), \
262
+ (__mmask32)(m) ))
263
263
264
264
#define _mm512_cmp_epu16_mask (a , b , p ) \
265
- (__mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \
266
- (__v32hi)(__m512i)(b), (int)(p), \
267
- (__mmask32)-1)
265
+ (( __mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \
266
+ (__v32hi)(__m512i)(b), (int)(p), \
267
+ (__mmask32)-1) )
268
268
269
269
#define _mm512_mask_cmp_epu16_mask (m , a , b , p ) \
270
- (__mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \
271
- (__v32hi)(__m512i)(b), (int)(p), \
272
- (__mmask32)(m))
270
+ (( __mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \
271
+ (__v32hi)(__m512i)(b), (int)(p), \
272
+ (__mmask32)(m) ))
273
273
274
274
#define _mm512_cmpeq_epi8_mask (A , B ) \
275
275
_mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_EQ)
@@ -1428,36 +1428,36 @@ _mm512_maskz_cvtepu8_epi16(__mmask32 __U, __m256i __A)
1428
1428
1429
1429
1430
1430
#define _mm512_shufflehi_epi16 (A , imm ) \
1431
- (__m512i)__builtin_ia32_pshufhw512((__v32hi)(__m512i)(A), (int)(imm))
1431
+ (( __m512i)__builtin_ia32_pshufhw512((__v32hi)(__m512i)(A), (int)(imm) ))
1432
1432
1433
1433
#define _mm512_mask_shufflehi_epi16 (W , U , A , imm ) \
1434
- (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1435
- (__v32hi)_mm512_shufflehi_epi16((A), \
1436
- (imm)), \
1437
- (__v32hi)(__m512i)(W))
1434
+ (( __m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1435
+ (__v32hi)_mm512_shufflehi_epi16((A), \
1436
+ (imm)), \
1437
+ (__v32hi)(__m512i)(W) ))
1438
1438
1439
1439
#define _mm512_maskz_shufflehi_epi16 (U , A , imm ) \
1440
- (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1441
- (__v32hi)_mm512_shufflehi_epi16((A), \
1442
- (imm)), \
1443
- (__v32hi)_mm512_setzero_si512())
1440
+ (( __m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1441
+ (__v32hi)_mm512_shufflehi_epi16((A), \
1442
+ (imm)), \
1443
+ (__v32hi)_mm512_setzero_si512() ))
1444
1444
1445
1445
#define _mm512_shufflelo_epi16 (A , imm ) \
1446
- (__m512i)__builtin_ia32_pshuflw512((__v32hi)(__m512i)(A), (int)(imm))
1446
+ (( __m512i)__builtin_ia32_pshuflw512((__v32hi)(__m512i)(A), (int)(imm) ))
1447
1447
1448
1448
1449
1449
#define _mm512_mask_shufflelo_epi16 (W , U , A , imm ) \
1450
- (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1451
- (__v32hi)_mm512_shufflelo_epi16((A), \
1452
- (imm)), \
1453
- (__v32hi)(__m512i)(W))
1450
+ (( __m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1451
+ (__v32hi)_mm512_shufflelo_epi16((A), \
1452
+ (imm)), \
1453
+ (__v32hi)(__m512i)(W) ))
1454
1454
1455
1455
1456
1456
#define _mm512_maskz_shufflelo_epi16 (U , A , imm ) \
1457
- (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1458
- (__v32hi)_mm512_shufflelo_epi16((A), \
1459
- (imm)), \
1460
- (__v32hi)_mm512_setzero_si512())
1457
+ (( __m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1458
+ (__v32hi)_mm512_shufflelo_epi16((A), \
1459
+ (imm)), \
1460
+ (__v32hi)_mm512_setzero_si512() ))
1461
1461
1462
1462
static __inline__ __m512i __DEFAULT_FN_ATTRS512
1463
1463
_mm512_sllv_epi16 (__m512i __A , __m512i __B )
@@ -1527,7 +1527,7 @@ _mm512_maskz_slli_epi16(__mmask32 __U, __m512i __A, unsigned int __B)
1527
1527
}
1528
1528
1529
1529
#define _mm512_bslli_epi128 (a , imm ) \
1530
- (__m512i)__builtin_ia32_pslldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm))
1530
+ (( __m512i)__builtin_ia32_pslldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm) ))
1531
1531
1532
1532
static __inline__ __m512i __DEFAULT_FN_ATTRS512
1533
1533
_mm512_srlv_epi16 (__m512i __A , __m512i __B )
@@ -1664,7 +1664,7 @@ _mm512_maskz_srli_epi16(__mmask32 __U, __m512i __A, int __B)
1664
1664
}
1665
1665
1666
1666
#define _mm512_bsrli_epi128 (a , imm ) \
1667
- (__m512i)__builtin_ia32_psrldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm))
1667
+ (( __m512i)__builtin_ia32_psrldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm) ))
1668
1668
1669
1669
static __inline__ __m512i __DEFAULT_FN_ATTRS512
1670
1670
_mm512_mask_mov_epi16 (__m512i __W , __mmask32 __U , __m512i __A )
@@ -1984,32 +1984,32 @@ _mm512_mask_permutexvar_epi16 (__m512i __W, __mmask32 __M, __m512i __A,
1984
1984
}
1985
1985
1986
1986
#define _mm512_alignr_epi8 (A , B , N ) \
1987
- (__m512i)__builtin_ia32_palignr512((__v64qi)(__m512i)(A), \
1988
- (__v64qi)(__m512i)(B), (int)(N))
1987
+ (( __m512i)__builtin_ia32_palignr512((__v64qi)(__m512i)(A), \
1988
+ (__v64qi)(__m512i)(B), (int)(N) ))
1989
1989
1990
1990
#define _mm512_mask_alignr_epi8 (W , U , A , B , N ) \
1991
- (__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
1992
- (__v64qi)_mm512_alignr_epi8((A), (B), (int)(N)), \
1993
- (__v64qi)(__m512i)(W))
1991
+ (( __m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
1992
+ (__v64qi)_mm512_alignr_epi8((A), (B), (int)(N)), \
1993
+ (__v64qi)(__m512i)(W) ))
1994
1994
1995
1995
#define _mm512_maskz_alignr_epi8 (U , A , B , N ) \
1996
- (__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
1996
+ (( __m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
1997
1997
(__v64qi)_mm512_alignr_epi8((A), (B), (int)(N)), \
1998
- (__v64qi)(__m512i)_mm512_setzero_si512())
1998
+ (__v64qi)(__m512i)_mm512_setzero_si512()))
1999
1999
2000
2000
#define _mm512_dbsad_epu8 (A , B , imm ) \
2001
- (__m512i)__builtin_ia32_dbpsadbw512((__v64qi)(__m512i)(A), \
2002
- (__v64qi)(__m512i)(B), (int)(imm))
2001
+ (( __m512i)__builtin_ia32_dbpsadbw512((__v64qi)(__m512i)(A), \
2002
+ (__v64qi)(__m512i)(B), (int)(imm) ))
2003
2003
2004
2004
#define _mm512_mask_dbsad_epu8 (W , U , A , B , imm ) \
2005
- (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
2005
+ (( __m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
2006
2006
(__v32hi)_mm512_dbsad_epu8((A), (B), (imm)), \
2007
- (__v32hi)(__m512i)(W))
2007
+ (__v32hi)(__m512i)(W)))
2008
2008
2009
2009
#define _mm512_maskz_dbsad_epu8 (U , A , B , imm ) \
2010
- (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
2010
+ (( __m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
2011
2011
(__v32hi)_mm512_dbsad_epu8((A), (B), (imm)), \
2012
- (__v32hi)_mm512_setzero_si512())
2012
+ (__v32hi)_mm512_setzero_si512()))
2013
2013
2014
2014
static __inline__ __m512i __DEFAULT_FN_ATTRS512
2015
2015
_mm512_sad_epu8 (__m512i __A , __m512i __B )
0 commit comments