/*
 * NOTE(review): this text is a patch fragment rather than plain C. Lines
 * starting with '-' are removed text, lines starting with '+' are their
 * replacement, and unprefixed lines are shared by both versions.
 *
 * 128-bit byte compares. Each macro is a statement expression that forwards
 * a and b (cast through __m128i to __v16qi), the predicate p and a mask to
 * __builtin_ia32_cmpb128_mask (epi8 names) or __builtin_ia32_ucmpb128_mask
 * (epu8 names) and casts the result to __mmask16.
 * The only change on the '+' lines is an explicit (int) cast on p plus a
 * different line split.
 */
/* Unmasked form: passes (__mmask16)-1 as the mask operand. */
#define _mm_cmp_epi8_mask(a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)(__m128i)(a), \
- (__v16qi)(__m128i)(b), \
- (p), (__mmask16)-1); })
+ (__v16qi)(__m128i)(b), (int)(p), \
+ (__mmask16)-1); })
/* Same builtin as _mm_cmp_epi8_mask, with the caller-supplied mask m. */
#define _mm_mask_cmp_epi8_mask(m, a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)(__m128i)(a), \
- (__v16qi)(__m128i)(b), \
- (p), (__mmask16)(m)); })
+ (__v16qi)(__m128i)(b), (int)(p), \
+ (__mmask16)(m)); })
/* epu8 form: calls the ucmpb128 builtin; passes (__mmask16)-1 as the mask. */
#define _mm_cmp_epu8_mask(a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)(__m128i)(a), \
- (__v16qi)(__m128i)(b), \
- (p), (__mmask16)-1); })
+ (__v16qi)(__m128i)(b), (int)(p), \
+ (__mmask16)-1); })
/* epu8 form with the caller-supplied mask m. */
#define _mm_mask_cmp_epu8_mask(m, a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)(__m128i)(a), \
- (__v16qi)(__m128i)(b), \
- (p), (__mmask16)(m)); })
+ (__v16qi)(__m128i)(b), (int)(p), \
+ (__mmask16)(m)); })
/*
 * 256-bit byte compares. Each macro forwards a and b (cast through __m256i
 * to __v32qi), the predicate p and a mask to __builtin_ia32_cmpb256_mask
 * (epi8 names) or __builtin_ia32_ucmpb256_mask (epu8 names) and casts the
 * result to __mmask32.
 * NOTE(review): '-' lines are the removed macro tails and '+' lines their
 * replacements; the replacements add an (int) cast on p.
 */
/* Unmasked form: passes (__mmask32)-1 as the mask operand. */
#define _mm256_cmp_epi8_mask(a, b, p) __extension__ ({ \
(__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)(__m256i)(a), \
- (__v32qi)(__m256i)(b), \
- (p), (__mmask32)-1); })
+ (__v32qi)(__m256i)(b), (int)(p), \
+ (__mmask32)-1); })
/* Same builtin, with the caller-supplied mask m. */
#define _mm256_mask_cmp_epi8_mask(m, a, b, p) __extension__ ({ \
(__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)(__m256i)(a), \
- (__v32qi)(__m256i)(b), \
- (p), (__mmask32)(m)); })
+ (__v32qi)(__m256i)(b), (int)(p), \
+ (__mmask32)(m)); })
/* epu8 form: calls the ucmpb256 builtin; passes (__mmask32)-1 as the mask. */
#define _mm256_cmp_epu8_mask(a, b, p) __extension__ ({ \
(__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)(__m256i)(a), \
- (__v32qi)(__m256i)(b), \
- (p), (__mmask32)-1); })
+ (__v32qi)(__m256i)(b), (int)(p), \
+ (__mmask32)-1); })
/* epu8 form with the caller-supplied mask m. */
#define _mm256_mask_cmp_epu8_mask(m, a, b, p) __extension__ ({ \
(__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)(__m256i)(a), \
- (__v32qi)(__m256i)(b), \
- (p), (__mmask32)(m)); })
+ (__v32qi)(__m256i)(b), (int)(p), \
+ (__mmask32)(m)); })
/*
 * 128-bit word compares. Each macro forwards a and b (cast through __m128i
 * to __v8hi), the predicate p and a mask to __builtin_ia32_cmpw128_mask
 * (epi16 names) or __builtin_ia32_ucmpw128_mask (epu16 names) and casts the
 * result to __mmask8.
 * NOTE(review): '-' lines are the removed macro tails and '+' lines their
 * replacements; the replacements add an (int) cast on p.
 */
/* Unmasked form: passes (__mmask8)-1 as the mask operand. */
#define _mm_cmp_epi16_mask(a, b, p) __extension__ ({ \
(__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)(__m128i)(a), \
- (__v8hi)(__m128i)(b), \
- (p), (__mmask8)-1); })
+ (__v8hi)(__m128i)(b), (int)(p), \
+ (__mmask8)-1); })
/* Same builtin, with the caller-supplied mask m. */
#define _mm_mask_cmp_epi16_mask(m, a, b, p) __extension__ ({ \
(__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)(__m128i)(a), \
- (__v8hi)(__m128i)(b), \
- (p), (__mmask8)(m)); })
+ (__v8hi)(__m128i)(b), (int)(p), \
+ (__mmask8)(m)); })
/* epu16 form: calls the ucmpw128 builtin; passes (__mmask8)-1 as the mask. */
#define _mm_cmp_epu16_mask(a, b, p) __extension__ ({ \
(__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)(__m128i)(a), \
- (__v8hi)(__m128i)(b), \
- (p), (__mmask8)-1); })
+ (__v8hi)(__m128i)(b), (int)(p), \
+ (__mmask8)-1); })
/* epu16 form with the caller-supplied mask m. */
#define _mm_mask_cmp_epu16_mask(m, a, b, p) __extension__ ({ \
(__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)(__m128i)(a), \
- (__v8hi)(__m128i)(b), \
- (p), (__mmask8)(m)); })
+ (__v8hi)(__m128i)(b), (int)(p), \
+ (__mmask8)(m)); })
/*
 * 256-bit word compares. Each macro forwards a and b (cast through __m256i
 * to __v16hi), the predicate p and a mask to __builtin_ia32_cmpw256_mask
 * (epi16 names) or __builtin_ia32_ucmpw256_mask (epu16 names) and casts the
 * result to __mmask16.
 * NOTE(review): '-' lines are the removed macro tails and '+' lines their
 * replacements; the replacements add an (int) cast on p.
 */
/* Unmasked form: passes (__mmask16)-1 as the mask operand. */
#define _mm256_cmp_epi16_mask(a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)(__m256i)(a), \
- (__v16hi)(__m256i)(b), \
- (p), (__mmask16)-1); })
+ (__v16hi)(__m256i)(b), (int)(p), \
+ (__mmask16)-1); })
/* Same builtin, with the caller-supplied mask m. */
#define _mm256_mask_cmp_epi16_mask(m, a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)(__m256i)(a), \
- (__v16hi)(__m256i)(b), \
- (p), (__mmask16)(m)); })
+ (__v16hi)(__m256i)(b), (int)(p), \
+ (__mmask16)(m)); })
/* epu16 form: calls the ucmpw256 builtin; passes (__mmask16)-1 as the mask. */
#define _mm256_cmp_epu16_mask(a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)(__m256i)(a), \
- (__v16hi)(__m256i)(b), \
- (p), (__mmask16)-1); })
+ (__v16hi)(__m256i)(b), (int)(p), \
+ (__mmask16)-1); })
/*
 * 256-bit word compare, epu16 name, caller-supplied mask m: forwards a and b
 * (cast to __v16hi), p and m to __builtin_ia32_ucmpw256_mask and casts the
 * result to __mmask16.
 * NOTE(review): in this patch fragment the macro's removed tail ('-' lines)
 * comes right after its two shared lines, while its replacement tail ('+'
 * lines, adding an (int) cast on p) only appears at the very end of this
 * span. Everything in between is the removed text of the old
 * shufflehi/shufflelo macros.
 */
#define _mm256_mask_cmp_epu16_mask(m, a, b, p) __extension__ ({ \
(__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)(__m256i)(a), \
- (__v16hi)(__m256i)(b), \
- (p), (__mmask16)(m)); })
-
/*
 * Removed definitions: masked and zero-masked shufflehi/shufflelo macros
 * using __-prefixed parameter names. They do not cast the builtin's result,
 * and the two 128-bit _mask_ forms cast __A without parenthesizing it.
 */
-#define _mm_mask_shufflehi_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshufhw128_mask ((__v8hi) __A, (__imm),\
- (__v8hi)( __W),\
- (__mmask8)( __U));\
-})
-
-#define _mm_maskz_shufflehi_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshufhw128_mask ((__v8hi)( __A),( __imm),\
- (__v8hi)\
- _mm_setzero_hi (),\
- (__mmask8)( __U));\
-})
-
-
-#define _mm256_mask_shufflehi_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshufhw256_mask ((__v16hi) (__A),\
- (__imm),\
- (__v16hi)( __W),\
- (__mmask16)( __U));\
-})
-
-
-#define _mm256_maskz_shufflehi_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshufhw256_mask ((__v16hi) (__A),\
- (__imm),\
- (__v16hi)\
- _mm256_setzero_si256 (),\
- (__mmask16)( __U));\
-})
-
-
-#define _mm_mask_shufflelo_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshuflw128_mask ((__v8hi) __A, (__imm),\
- (__v8hi)( __W),\
- (__mmask8)( __U));\
-})
-
-#define _mm_maskz_shufflelo_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshuflw128_mask ((__v8hi)( __A),( __imm),\
- (__v8hi)\
- _mm_setzero_hi (),\
- (__mmask8)( __U));\
-})
-
-
-#define _mm256_mask_shufflelo_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshuflw256_mask ((__v16hi) (__A),\
- (__imm),\
- (__v16hi)( __W),\
- (__mmask16)( __U));\
-})
-
-
-#define _mm256_maskz_shufflelo_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_pshuflw256_mask ((__v16hi) (__A),\
- (__imm),\
- (__v16hi)\
- _mm256_setzero_si256 (),\
- (__mmask16)( __U));\
-})
+ (__v16hi)(__m256i)(b), (int)(p), \
+ (__mmask16)(m)); })
+
/*
 * Added ('+') definitions of the masked and zero-masked shufflehi/shufflelo
 * macros. Each one:
 *   - casts A (and W, where present) through __m128i/__m256i to the
 *     __v8hi/__v16hi vector type,
 *   - casts imm to int and U to __mmask8/__mmask16,
 *   - calls __builtin_ia32_pshufhw{128,256}_mask or
 *     __builtin_ia32_pshuflw{128,256}_mask,
 *   - casts the builtin's result to __m128i/__m256i.
 * The _mask_ forms pass W as the third operand; the _maskz_ forms pass the
 * result of _mm_setzero_hi() (128-bit) or _mm256_setzero_si256() (256-bit)
 * in that position.
 */
+#define _mm_mask_shufflehi_epi16(W, U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_pshufhw128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)(__m128i)(W), \
+ (__mmask8)(U)); })
+
+#define _mm_maskz_shufflehi_epi16(U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_pshufhw128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)_mm_setzero_hi(), \
+ (__mmask8)(U)); })
+
+
+#define _mm256_mask_shufflehi_epi16(W, U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_pshufhw256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)(__m256i)(W), \
+ (__mmask16)(U)); })
+
+
+#define _mm256_maskz_shufflehi_epi16(U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_pshufhw256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)_mm256_setzero_si256(), \
+ (__mmask16)(U)); })
+
+
+#define _mm_mask_shufflelo_epi16(W, U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_pshuflw128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)(__m128i)(W), \
+ (__mmask8)(U)); })
+
+#define _mm_maskz_shufflelo_epi16(U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_pshuflw128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)_mm_setzero_hi(), \
+ (__mmask8)(U)); })
+
+
+#define _mm256_mask_shufflelo_epi16(W, U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_pshuflw256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)(__m256i)(W), \
+ (__mmask16)(U)); })
+
+
+#define _mm256_maskz_shufflelo_epi16(U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_pshuflw256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)_mm256_setzero_si256(), \
+ (__mmask16)(U)); })
static __inline__ __m256i __DEFAULT_FN_ATTRS
_mm256_sllv_epi16 (__m256i __A, __m256i __B)
(__mmask16) __U);
}
/*
 * slli_epi16 macros: wrappers around __builtin_ia32_psllwi128_mask and
 * __builtin_ia32_psllwi256_mask, taking A, the count B, and a mask U.
 * NOTE(review): each macro appears twice in this patch fragment, first as
 * removed '-' text (__-prefixed parameters, no cast on B or on the builtin's
 * result) and then as '+' replacement text, which casts A/W through
 * __m128i/__m256i, casts B to int, and casts the result to __m128i/__m256i.
 * The _mask_ forms pass W as the third operand; the _maskz_ forms pass
 * _mm_setzero_si128() or _mm256_setzero_si256() there.
 */
-#define _mm_mask_slli_epi16( __W, __U, __A, __B) __extension__ ({ \
-__builtin_ia32_psllwi128_mask ((__v8hi)( __A),( __B),\
- (__v8hi)( __W),\
- (__mmask8)( __U));\
-})
+#define _mm_mask_slli_epi16(W, U, A, B) __extension__ ({ \
+ (__m128i)__builtin_ia32_psllwi128_mask((__v8hi)(__m128i)(A), (int)(B), \
+ (__v8hi)(__m128i)(W), \
+ (__mmask8)(U)); })
-#define _mm_maskz_slli_epi16( __U, __A, __B) __extension__ ({ \
-__builtin_ia32_psllwi128_mask ((__v8hi)( __A),( __B),\
- (__v8hi)\
- _mm_setzero_si128 (),\
- (__mmask8)( __U));\
-})
+#define _mm_maskz_slli_epi16(U, A, B) __extension__ ({ \
+ (__m128i)__builtin_ia32_psllwi128_mask((__v8hi)(__m128i)(A), (int)(B), \
+ (__v8hi)_mm_setzero_si128(), \
+ (__mmask8)(U)); })
-#define _mm256_mask_slli_epi16( __W, __U, __A, __B) __extension__ ({ \
-__builtin_ia32_psllwi256_mask ((__v16hi)( __A),( __B),\
- (__v16hi)( __W),\
- (__mmask16)( __U));\
-})
+#define _mm256_mask_slli_epi16(W, U, A, B) __extension__ ({ \
+ (__m256i)__builtin_ia32_psllwi256_mask((__v16hi)(__m256i)(A), (int)(B), \
+ (__v16hi)(__m256i)(W), \
+ (__mmask16)(U)); })
-#define _mm256_maskz_slli_epi16( __U, __A, __B) __extension__ ({ \
-__builtin_ia32_psllwi256_mask ((__v16hi)( __A),( __B),\
- (__v16hi)\
- _mm256_setzero_si256 (),\
- (__mmask16)( __U));\
-})
+#define _mm256_maskz_slli_epi16(U, A, B) __extension__ ({ \
+ (__m256i)__builtin_ia32_psllwi256_mask((__v16hi)(__m256i)(A), (int)(B), \
+ (__v16hi)_mm256_setzero_si256(), \
+ (__mmask16)(U)); })
(__mmask16) __U);
}
/*
 * srai_epi16 macros: wrappers around __builtin_ia32_psrawi128_mask and
 * __builtin_ia32_psrawi256_mask, taking A, the immediate imm, and a mask U.
 * NOTE(review): each macro appears twice in this patch fragment, first as
 * removed '-' text (__-prefixed parameters, no cast on the immediate or on
 * the builtin's result) and then as '+' replacement text, which casts A/W
 * through __m128i/__m256i, casts imm to int, and casts the result to
 * __m128i/__m256i.
 * The _mask_ forms pass W as the third operand; the _maskz_ forms pass
 * _mm_setzero_si128() or _mm256_setzero_si256() there.
 */
-#define _mm_mask_srai_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrawi128_mask ((__v8hi)( __A),( __imm),\
- (__v8hi)( __W),\
- (__mmask8)( __U));\
-})
+#define _mm_mask_srai_epi16(W, U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_psrawi128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)(__m128i)(W), \
+ (__mmask8)(U)); })
-#define _mm_maskz_srai_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrawi128_mask ((__v8hi)( __A),( __imm),\
- (__v8hi)\
- _mm_setzero_si128 (),\
- (__mmask8)( __U));\
-})
+#define _mm_maskz_srai_epi16(U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_psrawi128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)_mm_setzero_si128(), \
+ (__mmask8)(U)); })
-#define _mm256_mask_srai_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrawi256_mask ((__v16hi)( __A),( __imm),\
- (__v16hi)( __W),\
- (__mmask16)( __U));\
-})
+#define _mm256_mask_srai_epi16(W, U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_psrawi256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)(__m256i)(W), \
+ (__mmask16)(U)); })
-#define _mm256_maskz_srai_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrawi256_mask ((__v16hi)( __A),( __imm),\
- (__v16hi)\
- _mm256_setzero_si256 (),\
- (__mmask16)( __U));\
-})
+#define _mm256_maskz_srai_epi16(U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_psrawi256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)_mm256_setzero_si256(), \
+ (__mmask16)(U)); })
static __inline__ __m128i __DEFAULT_FN_ATTRS
_mm_mask_srl_epi16 (__m128i __W, __mmask8 __U, __m128i __A,
(__mmask16) __U);
}
/*
 * srli_epi16 macros: wrappers around __builtin_ia32_psrlwi128_mask and
 * __builtin_ia32_psrlwi256_mask, taking A, the immediate imm, and a mask U.
 * NOTE(review): each macro appears twice in this patch fragment, first as
 * removed '-' text (__-prefixed parameters, no cast on the immediate or on
 * the builtin's result) and then as '+' replacement text, which casts A/W
 * through __m128i/__m256i, casts imm to int, and casts the result to
 * __m128i/__m256i.
 * The _mask_ forms pass W as the third operand; the _maskz_ forms pass
 * _mm_setzero_si128() or _mm256_setzero_si256() there.
 */
-#define _mm_mask_srli_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrlwi128_mask ((__v8hi)( __A),( __imm),\
- (__v8hi)( __W),\
- (__mmask8)( __U));\
-})
+#define _mm_mask_srli_epi16(W, U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_psrlwi128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)(__m128i)(W), \
+ (__mmask8)(U)); })
-#define _mm_maskz_srli_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrlwi128_mask ((__v8hi)( __A),( __imm),\
- (__v8hi)\
- _mm_setzero_si128 (),\
- (__mmask8)( __U));\
-})
+#define _mm_maskz_srli_epi16(U, A, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_psrlwi128_mask((__v8hi)(__m128i)(A), (int)(imm), \
+ (__v8hi)_mm_setzero_si128(), \
+ (__mmask8)(U)); })
-#define _mm256_mask_srli_epi16( __W, __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrlwi256_mask ((__v16hi)( __A),( __imm),\
- (__v16hi)( __W),\
- (__mmask16)( __U));\
-})
+#define _mm256_mask_srli_epi16(W, U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_psrlwi256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)(__m256i)(W), \
+ (__mmask16)(U)); })
-#define _mm256_maskz_srli_epi16( __U, __A, __imm) __extension__ ({ \
-__builtin_ia32_psrlwi256_mask ((__v16hi)( __A),( __imm),\
- (__v16hi)\
- _mm256_setzero_si256 (),\
- (__mmask16)( __U));\
-})
+#define _mm256_maskz_srli_epi16(U, A, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_psrlwi256_mask((__v16hi)(__m256i)(A), (int)(imm), \
+ (__v16hi)_mm256_setzero_si256(), \
+ (__mmask16)(U)); })
static __inline__ __m128i __DEFAULT_FN_ATTRS
_mm_mask_mov_epi16 (__m128i __W, __mmask8 __U, __m128i __A)
(__mmask16) __M);
}
/*
 * NOTE(review): every line in this span is removed ('-') text of a patch
 * fragment: the old alignr_epi8 and dbsad_epu8 macro definitions.
 *
 * Old alignr_epi8 macros: call __builtin_ia32_palignr128_mask /
 * __builtin_ia32_palignr256_mask with __A, __B and __W cast to
 * __v2di / __v4di, and pass (__N) * 8 as the count operand (presumably a
 * byte count scaled to bits; confirm against the builtin's contract).
 * The builtin's result is not cast.
 */
-#define _mm_mask_alignr_epi8( __W, __U, __A, __B, __N) __extension__ ({ \
-__builtin_ia32_palignr128_mask ((__v2di)( __A),\
- (__v2di)( __B),\
- ( __N) * 8,\
- (__v2di)( __W),\
- (__mmask16)( __U));\
-})
-
-#define _mm_maskz_alignr_epi8( __U, __A, __B, __N) __extension__ ({ \
-__builtin_ia32_palignr128_mask ((__v2di)( __A),\
- (__v2di)( __B),\
- ( __N) * 8,\
- (__v2di)\
- _mm_setzero_si128 (),\
- (__mmask16)( __U));\
-})
-
-#define _mm256_mask_alignr_epi8( __W, __U, __A, __B, __N) __extension__ ({ \
-__builtin_ia32_palignr256_mask ((__v4di)( __A),\
- (__v4di)( __B),\
- ( __N) * 8,\
- (__v4di)( __W),\
- (__mmask32)( __U));\
-})
-
-#define _mm256_maskz_alignr_epi8( __U, __A, __B, __N) __extension__ ({ \
-__builtin_ia32_palignr256_mask ((__v4di)( __A),\
- (__v4di)( __B),\
- ( __N) * 8,\
- (__v4di)\
- _mm256_setzero_si256 (),\
- (__mmask32)( __U));\
-})
-
/*
 * Old dbsad_epu8 macros: call __builtin_ia32_dbpsadbw128_mask /
 * __builtin_ia32_dbpsadbw256_mask with __A and __B cast to
 * __v16qi / __v32qi and the third operand cast to __v8hi / __v16hi.
 * The unmasked forms pass a setzero result and a mask of -1; note that the
 * 128-bit unmasked form uses _mm_setzero_hi() while the 128-bit maskz form
 * uses _mm_setzero_si128().
 */
-#define _mm_dbsad_epu8( __A, __B, __imm) __extension__ ({ \
-__builtin_ia32_dbpsadbw128_mask ((__v16qi)( __A),\
- (__v16qi)( __B),\
- ( __imm),\
- (__v8hi) _mm_setzero_hi (),\
- (__mmask8) -1);\
-})
-
-#define _mm_mask_dbsad_epu8( __W, __U, __A, __B, __imm) __extension__ ({ \
-__builtin_ia32_dbpsadbw128_mask ((__v16qi)( __A),\
- (__v16qi)( __B),\
- ( __imm),\
- (__v8hi)( __W),\
- (__mmask8)( __U));\
-})
-
-#define _mm_maskz_dbsad_epu8( __U, __A, __B, __imm) __extension__ ({ \
-__builtin_ia32_dbpsadbw128_mask ((__v16qi)( __A),\
- (__v16qi)( __B),\
- ( __imm),\
- (__v8hi) _mm_setzero_si128 (),\
- (__mmask8)( __U));\
-})
-
-#define _mm256_dbsad_epu8( __A, __B, __imm) __extension__ ({ \
-__builtin_ia32_dbpsadbw256_mask ((__v32qi)( __A),\
- (__v32qi)( __B),\
- ( __imm),\
- (__v16hi) _mm256_setzero_si256 (),\
- (__mmask16) -1);\
-})
-
-#define _mm256_mask_dbsad_epu8( __W, __U, __A, __B, __imm) __extension__ ({ \
-__builtin_ia32_dbpsadbw256_mask ((__v32qi)( __A),\
- (__v32qi)( __B),\
- ( __imm),\
- (__v16hi)( __W),\
- (__mmask16)( __U));\
-})
-
-#define _mm256_maskz_dbsad_epu8( __U, __A, __B, __imm) __extension__ ({ \
-__builtin_ia32_dbpsadbw256_mask ((__v32qi)( __A),\
- (__v32qi)( __B),\
- ( __imm),\
- (__v16hi) _mm256_setzero_si256 (),\
- (__mmask16)( __U));\
-})
/*
 * NOTE(review): every line in this span is added ('+') text of a patch
 * fragment: the new alignr_epi8 and dbsad_epu8 macro definitions.
 *
 * alignr_epi8 macros: call __builtin_ia32_palignr128_mask /
 * __builtin_ia32_palignr256_mask with A, B and W cast through
 * __m128i/__m256i to __v16qi / __v32qi, and pass (int)(N) * 8 as the count
 * operand (the cast binds to N before the multiplication; presumably a byte
 * count scaled to bits; confirm against the builtin's contract).
 * The result is cast to __m128i / __m256i. The _maskz_ forms pass
 * _mm_setzero_si128() / _mm256_setzero_si256() where the _mask_ forms
 * pass W.
 */
+#define _mm_mask_alignr_epi8(W, U, A, B, N) __extension__ ({ \
+ (__m128i)__builtin_ia32_palignr128_mask((__v16qi)(__m128i)(A), \
+ (__v16qi)(__m128i)(B), (int)(N) * 8, \
+ (__v16qi)(__m128i)(W), \
+ (__mmask16)(U)); })
+
+#define _mm_maskz_alignr_epi8(U, A, B, N) __extension__ ({ \
+ (__m128i)__builtin_ia32_palignr128_mask((__v16qi)(__m128i)(A), \
+ (__v16qi)(__m128i)(B), (int)(N) * 8, \
+ (__v16qi)_mm_setzero_si128(), \
+ (__mmask16)(U)); })
+
+#define _mm256_mask_alignr_epi8(W, U, A, B, N) __extension__ ({ \
+ (__m256i)__builtin_ia32_palignr256_mask((__v32qi)(__m256i)(A), \
+ (__v32qi)(__m256i)(B), (int)(N) * 8, \
+ (__v32qi)(__m256i)(W), \
+ (__mmask32)(U)); })
+
+#define _mm256_maskz_alignr_epi8(U, A, B, N) __extension__ ({ \
+ (__m256i)__builtin_ia32_palignr256_mask((__v32qi)(__m256i)(A), \
+ (__v32qi)(__m256i)(B), (int)(N) * 8, \
+ (__v32qi)_mm256_setzero_si256(), \
+ (__mmask32)(U)); })
+
/*
 * dbsad_epu8 macros: call __builtin_ia32_dbpsadbw128_mask /
 * __builtin_ia32_dbpsadbw256_mask with A and B cast to __v16qi / __v32qi,
 * imm cast to int, and a third vector operand cast to __v8hi / __v16hi;
 * the result is cast to __m128i / __m256i.
 * The unmasked forms pass a setzero result and a mask of -1. Note that the
 * 128-bit unmasked form uses _mm_setzero_hi() while the 128-bit maskz form
 * uses _mm_setzero_si128().
 */
+#define _mm_dbsad_epu8(A, B, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_dbpsadbw128_mask((__v16qi)(__m128i)(A), \
+ (__v16qi)(__m128i)(B), (int)(imm), \
+ (__v8hi)_mm_setzero_hi(), \
+ (__mmask8)-1); })
+
+#define _mm_mask_dbsad_epu8(W, U, A, B, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_dbpsadbw128_mask((__v16qi)(__m128i)(A), \
+ (__v16qi)(__m128i)(B), (int)(imm), \
+ (__v8hi)(__m128i)(W), \
+ (__mmask8)(U)); })
+
+#define _mm_maskz_dbsad_epu8(U, A, B, imm) __extension__ ({ \
+ (__m128i)__builtin_ia32_dbpsadbw128_mask((__v16qi)(__m128i)(A), \
+ (__v16qi)(__m128i)(B), (int)(imm), \
+ (__v8hi)_mm_setzero_si128(), \
+ (__mmask8)(U)); })
+
+#define _mm256_dbsad_epu8(A, B, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_dbpsadbw256_mask((__v32qi)(__m256i)(A), \
+ (__v32qi)(__m256i)(B), (int)(imm), \
+ (__v16hi)_mm256_setzero_si256(), \
+ (__mmask16)-1); })
+
+#define _mm256_mask_dbsad_epu8(W, U, A, B, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_dbpsadbw256_mask((__v32qi)(__m256i)(A), \
+ (__v32qi)(__m256i)(B), (int)(imm), \
+ (__v16hi)(__m256i)(W), \
+ (__mmask16)(U)); })
+
+#define _mm256_maskz_dbsad_epu8(U, A, B, imm) __extension__ ({ \
+ (__m256i)__builtin_ia32_dbpsadbw256_mask((__v32qi)(__m256i)(A), \
+ (__v32qi)(__m256i)(B), (int)(imm), \
+ (__v16hi)_mm256_setzero_si256(), \
+ (__mmask16)(U)); })
#undef __DEFAULT_FN_ATTRS