/* Path: blob/master/tools/android-sdk/renderscript/clang-include/avx512vlbwintrin.h
 * 496 views
 */
/*===---- avx512vlbwintrin.h - AVX512VL and AVX512BW intrinsics ------------===1*2* Permission is hereby granted, free of charge, to any person obtaining a copy3* of this software and associated documentation files (the "Software"), to deal4* in the Software without restriction, including without limitation the rights5* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell6* copies of the Software, and to permit persons to whom the Software is7* furnished to do so, subject to the following conditions:8*9* The above copyright notice and this permission notice shall be included in10* all copies or substantial portions of the Software.11*12* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR13* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,14* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE15* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER16* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,17* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN18* THE SOFTWARE.19*20*===-----------------------------------------------------------------------===21*/2223#ifndef __IMMINTRIN_H24#error "Never use <avx512vlbwintrin.h> directly; include <immintrin.h> instead."25#endif2627#ifndef __AVX512VLBWINTRIN_H28#define __AVX512VLBWINTRIN_H2930/* Define the default attributes for the functions in this file. 
*/31#define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__, __target__("avx512vl,avx512bw")))3233static __inline __m128i __DEFAULT_FN_ATTRS34_mm_setzero_hi(void){35return (__m128i)(__v8hi){ 0, 0, 0, 0, 0, 0, 0, 0 };36}3738/* Integer compare */3940static __inline__ __mmask16 __DEFAULT_FN_ATTRS41_mm_cmpeq_epi8_mask(__m128i __a, __m128i __b) {42return (__mmask16)__builtin_ia32_pcmpeqb128_mask((__v16qi)__a, (__v16qi)__b,43(__mmask16)-1);44}4546static __inline__ __mmask16 __DEFAULT_FN_ATTRS47_mm_mask_cmpeq_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) {48return (__mmask16)__builtin_ia32_pcmpeqb128_mask((__v16qi)__a, (__v16qi)__b,49__u);50}5152static __inline__ __mmask16 __DEFAULT_FN_ATTRS53_mm_cmpeq_epu8_mask(__m128i __a, __m128i __b) {54return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 0,55(__mmask16)-1);56}5758static __inline__ __mmask16 __DEFAULT_FN_ATTRS59_mm_mask_cmpeq_epu8_mask(__mmask16 __u, __m128i __a, __m128i __b) {60return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 0,61__u);62}6364static __inline__ __mmask32 __DEFAULT_FN_ATTRS65_mm256_cmpeq_epi8_mask(__m256i __a, __m256i __b) {66return (__mmask32)__builtin_ia32_pcmpeqb256_mask((__v32qi)__a, (__v32qi)__b,67(__mmask32)-1);68}6970static __inline__ __mmask32 __DEFAULT_FN_ATTRS71_mm256_mask_cmpeq_epi8_mask(__mmask32 __u, __m256i __a, __m256i __b) {72return (__mmask32)__builtin_ia32_pcmpeqb256_mask((__v32qi)__a, (__v32qi)__b,73__u);74}7576static __inline__ __mmask32 __DEFAULT_FN_ATTRS77_mm256_cmpeq_epu8_mask(__m256i __a, __m256i __b) {78return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 0,79(__mmask32)-1);80}8182static __inline__ __mmask32 __DEFAULT_FN_ATTRS83_mm256_mask_cmpeq_epu8_mask(__mmask32 __u, __m256i __a, __m256i __b) {84return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 0,85__u);86}8788static __inline__ __mmask8 __DEFAULT_FN_ATTRS89_mm_cmpeq_epi16_mask(__m128i __a, __m128i __b) 
{90return (__mmask8)__builtin_ia32_pcmpeqw128_mask((__v8hi)__a, (__v8hi)__b,91(__mmask8)-1);92}9394static __inline__ __mmask8 __DEFAULT_FN_ATTRS95_mm_mask_cmpeq_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) {96return (__mmask8)__builtin_ia32_pcmpeqw128_mask((__v8hi)__a, (__v8hi)__b,97__u);98}99100static __inline__ __mmask8 __DEFAULT_FN_ATTRS101_mm_cmpeq_epu16_mask(__m128i __a, __m128i __b) {102return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 0,103(__mmask8)-1);104}105106static __inline__ __mmask8 __DEFAULT_FN_ATTRS107_mm_mask_cmpeq_epu16_mask(__mmask8 __u, __m128i __a, __m128i __b) {108return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 0,109__u);110}111112static __inline__ __mmask16 __DEFAULT_FN_ATTRS113_mm256_cmpeq_epi16_mask(__m256i __a, __m256i __b) {114return (__mmask16)__builtin_ia32_pcmpeqw256_mask((__v16hi)__a, (__v16hi)__b,115(__mmask16)-1);116}117118static __inline__ __mmask16 __DEFAULT_FN_ATTRS119_mm256_mask_cmpeq_epi16_mask(__mmask16 __u, __m256i __a, __m256i __b) {120return (__mmask16)__builtin_ia32_pcmpeqw256_mask((__v16hi)__a, (__v16hi)__b,121__u);122}123124static __inline__ __mmask16 __DEFAULT_FN_ATTRS125_mm256_cmpeq_epu16_mask(__m256i __a, __m256i __b) {126return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 0,127(__mmask16)-1);128}129130static __inline__ __mmask16 __DEFAULT_FN_ATTRS131_mm256_mask_cmpeq_epu16_mask(__mmask16 __u, __m256i __a, __m256i __b) {132return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 0,133__u);134}135136static __inline__ __mmask16 __DEFAULT_FN_ATTRS137_mm_cmpge_epi8_mask(__m128i __a, __m128i __b) {138return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 5,139(__mmask16)-1);140}141142static __inline__ __mmask16 __DEFAULT_FN_ATTRS143_mm_mask_cmpge_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) {144return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 5,145__u);146}147148static __inline__ 
__mmask16 __DEFAULT_FN_ATTRS149_mm_cmpge_epu8_mask(__m128i __a, __m128i __b) {150return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 5,151(__mmask16)-1);152}153154static __inline__ __mmask16 __DEFAULT_FN_ATTRS155_mm_mask_cmpge_epu8_mask(__mmask16 __u, __m128i __a, __m128i __b) {156return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 5,157__u);158}159160static __inline__ __mmask32 __DEFAULT_FN_ATTRS161_mm256_cmpge_epi8_mask(__m256i __a, __m256i __b) {162return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 5,163(__mmask32)-1);164}165166static __inline__ __mmask32 __DEFAULT_FN_ATTRS167_mm256_mask_cmpge_epi8_mask(__mmask32 __u, __m256i __a, __m256i __b) {168return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 5,169__u);170}171172static __inline__ __mmask32 __DEFAULT_FN_ATTRS173_mm256_cmpge_epu8_mask(__m256i __a, __m256i __b) {174return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 5,175(__mmask32)-1);176}177178static __inline__ __mmask32 __DEFAULT_FN_ATTRS179_mm256_mask_cmpge_epu8_mask(__mmask32 __u, __m256i __a, __m256i __b) {180return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 5,181__u);182}183184static __inline__ __mmask8 __DEFAULT_FN_ATTRS185_mm_cmpge_epi16_mask(__m128i __a, __m128i __b) {186return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 5,187(__mmask8)-1);188}189190static __inline__ __mmask8 __DEFAULT_FN_ATTRS191_mm_mask_cmpge_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) {192return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 5,193__u);194}195196static __inline__ __mmask8 __DEFAULT_FN_ATTRS197_mm_cmpge_epu16_mask(__m128i __a, __m128i __b) {198return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 5,199(__mmask8)-1);200}201202static __inline__ __mmask8 __DEFAULT_FN_ATTRS203_mm_mask_cmpge_epu16_mask(__mmask8 __u, __m128i __a, __m128i __b) {204return 
(__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 5,205__u);206}207208static __inline__ __mmask16 __DEFAULT_FN_ATTRS209_mm256_cmpge_epi16_mask(__m256i __a, __m256i __b) {210return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 5,211(__mmask16)-1);212}213214static __inline__ __mmask16 __DEFAULT_FN_ATTRS215_mm256_mask_cmpge_epi16_mask(__mmask16 __u, __m256i __a, __m256i __b) {216return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 5,217__u);218}219220static __inline__ __mmask16 __DEFAULT_FN_ATTRS221_mm256_cmpge_epu16_mask(__m256i __a, __m256i __b) {222return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 5,223(__mmask16)-1);224}225226static __inline__ __mmask16 __DEFAULT_FN_ATTRS227_mm256_mask_cmpge_epu16_mask(__mmask16 __u, __m256i __a, __m256i __b) {228return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 5,229__u);230}231232static __inline__ __mmask16 __DEFAULT_FN_ATTRS233_mm_cmpgt_epi8_mask(__m128i __a, __m128i __b) {234return (__mmask16)__builtin_ia32_pcmpgtb128_mask((__v16qi)__a, (__v16qi)__b,235(__mmask16)-1);236}237238static __inline__ __mmask16 __DEFAULT_FN_ATTRS239_mm_mask_cmpgt_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) {240return (__mmask16)__builtin_ia32_pcmpgtb128_mask((__v16qi)__a, (__v16qi)__b,241__u);242}243244static __inline__ __mmask16 __DEFAULT_FN_ATTRS245_mm_cmpgt_epu8_mask(__m128i __a, __m128i __b) {246return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 6,247(__mmask16)-1);248}249250static __inline__ __mmask16 __DEFAULT_FN_ATTRS251_mm_mask_cmpgt_epu8_mask(__mmask16 __u, __m128i __a, __m128i __b) {252return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 6,253__u);254}255256static __inline__ __mmask32 __DEFAULT_FN_ATTRS257_mm256_cmpgt_epi8_mask(__m256i __a, __m256i __b) {258return (__mmask32)__builtin_ia32_pcmpgtb256_mask((__v32qi)__a, (__v32qi)__b,259(__mmask32)-1);260}261262static __inline__ 
__mmask32 __DEFAULT_FN_ATTRS263_mm256_mask_cmpgt_epi8_mask(__mmask32 __u, __m256i __a, __m256i __b) {264return (__mmask32)__builtin_ia32_pcmpgtb256_mask((__v32qi)__a, (__v32qi)__b,265__u);266}267268static __inline__ __mmask32 __DEFAULT_FN_ATTRS269_mm256_cmpgt_epu8_mask(__m256i __a, __m256i __b) {270return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 6,271(__mmask32)-1);272}273274static __inline__ __mmask32 __DEFAULT_FN_ATTRS275_mm256_mask_cmpgt_epu8_mask(__mmask32 __u, __m256i __a, __m256i __b) {276return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 6,277__u);278}279280static __inline__ __mmask8 __DEFAULT_FN_ATTRS281_mm_cmpgt_epi16_mask(__m128i __a, __m128i __b) {282return (__mmask8)__builtin_ia32_pcmpgtw128_mask((__v8hi)__a, (__v8hi)__b,283(__mmask8)-1);284}285286static __inline__ __mmask8 __DEFAULT_FN_ATTRS287_mm_mask_cmpgt_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) {288return (__mmask8)__builtin_ia32_pcmpgtw128_mask((__v8hi)__a, (__v8hi)__b,289__u);290}291292static __inline__ __mmask8 __DEFAULT_FN_ATTRS293_mm_cmpgt_epu16_mask(__m128i __a, __m128i __b) {294return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 6,295(__mmask8)-1);296}297298static __inline__ __mmask8 __DEFAULT_FN_ATTRS299_mm_mask_cmpgt_epu16_mask(__mmask8 __u, __m128i __a, __m128i __b) {300return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 6,301__u);302}303304static __inline__ __mmask16 __DEFAULT_FN_ATTRS305_mm256_cmpgt_epi16_mask(__m256i __a, __m256i __b) {306return (__mmask16)__builtin_ia32_pcmpgtw256_mask((__v16hi)__a, (__v16hi)__b,307(__mmask16)-1);308}309310static __inline__ __mmask16 __DEFAULT_FN_ATTRS311_mm256_mask_cmpgt_epi16_mask(__mmask16 __u, __m256i __a, __m256i __b) {312return (__mmask16)__builtin_ia32_pcmpgtw256_mask((__v16hi)__a, (__v16hi)__b,313__u);314}315316static __inline__ __mmask16 __DEFAULT_FN_ATTRS317_mm256_cmpgt_epu16_mask(__m256i __a, __m256i __b) {318return 
(__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 6,319(__mmask16)-1);320}321322static __inline__ __mmask16 __DEFAULT_FN_ATTRS323_mm256_mask_cmpgt_epu16_mask(__mmask16 __u, __m256i __a, __m256i __b) {324return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 6,325__u);326}327328static __inline__ __mmask16 __DEFAULT_FN_ATTRS329_mm_cmple_epi8_mask(__m128i __a, __m128i __b) {330return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 2,331(__mmask16)-1);332}333334static __inline__ __mmask16 __DEFAULT_FN_ATTRS335_mm_mask_cmple_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) {336return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 2,337__u);338}339340static __inline__ __mmask16 __DEFAULT_FN_ATTRS341_mm_cmple_epu8_mask(__m128i __a, __m128i __b) {342return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 2,343(__mmask16)-1);344}345346static __inline__ __mmask16 __DEFAULT_FN_ATTRS347_mm_mask_cmple_epu8_mask(__mmask16 __u, __m128i __a, __m128i __b) {348return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 2,349__u);350}351352static __inline__ __mmask32 __DEFAULT_FN_ATTRS353_mm256_cmple_epi8_mask(__m256i __a, __m256i __b) {354return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 2,355(__mmask32)-1);356}357358static __inline__ __mmask32 __DEFAULT_FN_ATTRS359_mm256_mask_cmple_epi8_mask(__mmask32 __u, __m256i __a, __m256i __b) {360return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 2,361__u);362}363364static __inline__ __mmask32 __DEFAULT_FN_ATTRS365_mm256_cmple_epu8_mask(__m256i __a, __m256i __b) {366return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 2,367(__mmask32)-1);368}369370static __inline__ __mmask32 __DEFAULT_FN_ATTRS371_mm256_mask_cmple_epu8_mask(__mmask32 __u, __m256i __a, __m256i __b) {372return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 
2,373__u);374}375376static __inline__ __mmask8 __DEFAULT_FN_ATTRS377_mm_cmple_epi16_mask(__m128i __a, __m128i __b) {378return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 2,379(__mmask8)-1);380}381382static __inline__ __mmask8 __DEFAULT_FN_ATTRS383_mm_mask_cmple_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) {384return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 2,385__u);386}387388static __inline__ __mmask8 __DEFAULT_FN_ATTRS389_mm_cmple_epu16_mask(__m128i __a, __m128i __b) {390return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 2,391(__mmask8)-1);392}393394static __inline__ __mmask8 __DEFAULT_FN_ATTRS395_mm_mask_cmple_epu16_mask(__mmask8 __u, __m128i __a, __m128i __b) {396return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 2,397__u);398}399400static __inline__ __mmask16 __DEFAULT_FN_ATTRS401_mm256_cmple_epi16_mask(__m256i __a, __m256i __b) {402return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 2,403(__mmask16)-1);404}405406static __inline__ __mmask16 __DEFAULT_FN_ATTRS407_mm256_mask_cmple_epi16_mask(__mmask16 __u, __m256i __a, __m256i __b) {408return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 2,409__u);410}411412static __inline__ __mmask16 __DEFAULT_FN_ATTRS413_mm256_cmple_epu16_mask(__m256i __a, __m256i __b) {414return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 2,415(__mmask16)-1);416}417418static __inline__ __mmask16 __DEFAULT_FN_ATTRS419_mm256_mask_cmple_epu16_mask(__mmask16 __u, __m256i __a, __m256i __b) {420return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 2,421__u);422}423424static __inline__ __mmask16 __DEFAULT_FN_ATTRS425_mm_cmplt_epi8_mask(__m128i __a, __m128i __b) {426return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 1,427(__mmask16)-1);428}429430static __inline__ __mmask16 __DEFAULT_FN_ATTRS431_mm_mask_cmplt_epi8_mask(__mmask16 __u, __m128i __a, 
__m128i __b) {432return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 1,433__u);434}435436static __inline__ __mmask16 __DEFAULT_FN_ATTRS437_mm_cmplt_epu8_mask(__m128i __a, __m128i __b) {438return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 1,439(__mmask16)-1);440}441442static __inline__ __mmask16 __DEFAULT_FN_ATTRS443_mm_mask_cmplt_epu8_mask(__mmask16 __u, __m128i __a, __m128i __b) {444return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 1,445__u);446}447448static __inline__ __mmask32 __DEFAULT_FN_ATTRS449_mm256_cmplt_epi8_mask(__m256i __a, __m256i __b) {450return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 1,451(__mmask32)-1);452}453454static __inline__ __mmask32 __DEFAULT_FN_ATTRS455_mm256_mask_cmplt_epi8_mask(__mmask32 __u, __m256i __a, __m256i __b) {456return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 1,457__u);458}459460static __inline__ __mmask32 __DEFAULT_FN_ATTRS461_mm256_cmplt_epu8_mask(__m256i __a, __m256i __b) {462return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 1,463(__mmask32)-1);464}465466static __inline__ __mmask32 __DEFAULT_FN_ATTRS467_mm256_mask_cmplt_epu8_mask(__mmask32 __u, __m256i __a, __m256i __b) {468return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 1,469__u);470}471472static __inline__ __mmask8 __DEFAULT_FN_ATTRS473_mm_cmplt_epi16_mask(__m128i __a, __m128i __b) {474return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 1,475(__mmask8)-1);476}477478static __inline__ __mmask8 __DEFAULT_FN_ATTRS479_mm_mask_cmplt_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) {480return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 1,481__u);482}483484static __inline__ __mmask8 __DEFAULT_FN_ATTRS485_mm_cmplt_epu16_mask(__m128i __a, __m128i __b) {486return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 1,487(__mmask8)-1);488}489490static 
__inline__ __mmask8 __DEFAULT_FN_ATTRS491_mm_mask_cmplt_epu16_mask(__mmask8 __u, __m128i __a, __m128i __b) {492return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 1,493__u);494}495496static __inline__ __mmask16 __DEFAULT_FN_ATTRS497_mm256_cmplt_epi16_mask(__m256i __a, __m256i __b) {498return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 1,499(__mmask16)-1);500}501502static __inline__ __mmask16 __DEFAULT_FN_ATTRS503_mm256_mask_cmplt_epi16_mask(__mmask16 __u, __m256i __a, __m256i __b) {504return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 1,505__u);506}507508static __inline__ __mmask16 __DEFAULT_FN_ATTRS509_mm256_cmplt_epu16_mask(__m256i __a, __m256i __b) {510return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 1,511(__mmask16)-1);512}513514static __inline__ __mmask16 __DEFAULT_FN_ATTRS515_mm256_mask_cmplt_epu16_mask(__mmask16 __u, __m256i __a, __m256i __b) {516return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 1,517__u);518}519520static __inline__ __mmask16 __DEFAULT_FN_ATTRS521_mm_cmpneq_epi8_mask(__m128i __a, __m128i __b) {522return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 4,523(__mmask16)-1);524}525526static __inline__ __mmask16 __DEFAULT_FN_ATTRS527_mm_mask_cmpneq_epi8_mask(__mmask16 __u, __m128i __a, __m128i __b) {528return (__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)__a, (__v16qi)__b, 4,529__u);530}531532static __inline__ __mmask16 __DEFAULT_FN_ATTRS533_mm_cmpneq_epu8_mask(__m128i __a, __m128i __b) {534return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 4,535(__mmask16)-1);536}537538static __inline__ __mmask16 __DEFAULT_FN_ATTRS539_mm_mask_cmpneq_epu8_mask(__mmask16 __u, __m128i __a, __m128i __b) {540return (__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)__a, (__v16qi)__b, 4,541__u);542}543544static __inline__ __mmask32 __DEFAULT_FN_ATTRS545_mm256_cmpneq_epi8_mask(__m256i __a, __m256i __b) 
{546return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 4,547(__mmask32)-1);548}549550static __inline__ __mmask32 __DEFAULT_FN_ATTRS551_mm256_mask_cmpneq_epi8_mask(__mmask32 __u, __m256i __a, __m256i __b) {552return (__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)__a, (__v32qi)__b, 4,553__u);554}555556static __inline__ __mmask32 __DEFAULT_FN_ATTRS557_mm256_cmpneq_epu8_mask(__m256i __a, __m256i __b) {558return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 4,559(__mmask32)-1);560}561562static __inline__ __mmask32 __DEFAULT_FN_ATTRS563_mm256_mask_cmpneq_epu8_mask(__mmask32 __u, __m256i __a, __m256i __b) {564return (__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)__a, (__v32qi)__b, 4,565__u);566}567568static __inline__ __mmask8 __DEFAULT_FN_ATTRS569_mm_cmpneq_epi16_mask(__m128i __a, __m128i __b) {570return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 4,571(__mmask8)-1);572}573574static __inline__ __mmask8 __DEFAULT_FN_ATTRS575_mm_mask_cmpneq_epi16_mask(__mmask8 __u, __m128i __a, __m128i __b) {576return (__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)__a, (__v8hi)__b, 4,577__u);578}579580static __inline__ __mmask8 __DEFAULT_FN_ATTRS581_mm_cmpneq_epu16_mask(__m128i __a, __m128i __b) {582return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 4,583(__mmask8)-1);584}585586static __inline__ __mmask8 __DEFAULT_FN_ATTRS587_mm_mask_cmpneq_epu16_mask(__mmask8 __u, __m128i __a, __m128i __b) {588return (__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)__a, (__v8hi)__b, 4,589__u);590}591592static __inline__ __mmask16 __DEFAULT_FN_ATTRS593_mm256_cmpneq_epi16_mask(__m256i __a, __m256i __b) {594return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 4,595(__mmask16)-1);596}597598static __inline__ __mmask16 __DEFAULT_FN_ATTRS599_mm256_mask_cmpneq_epi16_mask(__mmask16 __u, __m256i __a, __m256i __b) {600return (__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)__a, (__v16hi)__b, 
4,601__u);602}603604static __inline__ __mmask16 __DEFAULT_FN_ATTRS605_mm256_cmpneq_epu16_mask(__m256i __a, __m256i __b) {606return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 4,607(__mmask16)-1);608}609610static __inline__ __mmask16 __DEFAULT_FN_ATTRS611_mm256_mask_cmpneq_epu16_mask(__mmask16 __u, __m256i __a, __m256i __b) {612return (__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)__a, (__v16hi)__b, 4,613__u);614}615616static __inline__ __m256i __DEFAULT_FN_ATTRS617_mm256_mask_add_epi8 (__m256i __W, __mmask32 __U, __m256i __A, __m256i __B){618return (__m256i) __builtin_ia32_paddb256_mask ((__v32qi) __A,619(__v32qi) __B,620(__v32qi) __W,621(__mmask32) __U);622}623624static __inline__ __m256i __DEFAULT_FN_ATTRS625_mm256_maskz_add_epi8 (__mmask32 __U, __m256i __A, __m256i __B) {626return (__m256i) __builtin_ia32_paddb256_mask ((__v32qi) __A,627(__v32qi) __B,628(__v32qi)629_mm256_setzero_si256 (),630(__mmask32) __U);631}632633static __inline__ __m256i __DEFAULT_FN_ATTRS634_mm256_mask_add_epi16 (__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {635return (__m256i) __builtin_ia32_paddw256_mask ((__v16hi) __A,636(__v16hi) __B,637(__v16hi) __W,638(__mmask16) __U);639}640641static __inline__ __m256i __DEFAULT_FN_ATTRS642_mm256_maskz_add_epi16 (__mmask16 __U, __m256i __A, __m256i __B) {643return (__m256i) __builtin_ia32_paddw256_mask ((__v16hi) __A,644(__v16hi) __B,645(__v16hi)646_mm256_setzero_si256 (),647(__mmask16) __U);648}649650static __inline__ __m256i __DEFAULT_FN_ATTRS651_mm256_mask_sub_epi8 (__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {652return (__m256i) __builtin_ia32_psubb256_mask ((__v32qi) __A,653(__v32qi) __B,654(__v32qi) __W,655(__mmask32) __U);656}657658static __inline__ __m256i __DEFAULT_FN_ATTRS659_mm256_maskz_sub_epi8 (__mmask32 __U, __m256i __A, __m256i __B) {660return (__m256i) __builtin_ia32_psubb256_mask ((__v32qi) __A,661(__v32qi) __B,662(__v32qi)663_mm256_setzero_si256 (),664(__mmask32) __U);665}666667static 
__inline__ __m256i __DEFAULT_FN_ATTRS668_mm256_mask_sub_epi16 (__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {669return (__m256i) __builtin_ia32_psubw256_mask ((__v16hi) __A,670(__v16hi) __B,671(__v16hi) __W,672(__mmask16) __U);673}674675static __inline__ __m256i __DEFAULT_FN_ATTRS676_mm256_maskz_sub_epi16 (__mmask16 __U, __m256i __A, __m256i __B) {677return (__m256i) __builtin_ia32_psubw256_mask ((__v16hi) __A,678(__v16hi) __B,679(__v16hi)680_mm256_setzero_si256 (),681(__mmask16) __U);682}683static __inline__ __m128i __DEFAULT_FN_ATTRS684_mm_mask_add_epi8 (__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {685return (__m128i) __builtin_ia32_paddb128_mask ((__v16qi) __A,686(__v16qi) __B,687(__v16qi) __W,688(__mmask16) __U);689}690691static __inline__ __m128i __DEFAULT_FN_ATTRS692_mm_maskz_add_epi8 (__mmask16 __U, __m128i __A, __m128i __B) {693return (__m128i) __builtin_ia32_paddb128_mask ((__v16qi) __A,694(__v16qi) __B,695(__v16qi)696_mm_setzero_si128 (),697(__mmask16) __U);698}699700static __inline__ __m128i __DEFAULT_FN_ATTRS701_mm_mask_add_epi16 (__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {702return (__m128i) __builtin_ia32_paddw128_mask ((__v8hi) __A,703(__v8hi) __B,704(__v8hi) __W,705(__mmask8) __U);706}707708static __inline__ __m128i __DEFAULT_FN_ATTRS709_mm_maskz_add_epi16 (__mmask8 __U, __m128i __A, __m128i __B) {710return (__m128i) __builtin_ia32_paddw128_mask ((__v8hi) __A,711(__v8hi) __B,712(__v8hi)713_mm_setzero_si128 (),714(__mmask8) __U);715}716717static __inline__ __m128i __DEFAULT_FN_ATTRS718_mm_mask_sub_epi8 (__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {719return (__m128i) __builtin_ia32_psubb128_mask ((__v16qi) __A,720(__v16qi) __B,721(__v16qi) __W,722(__mmask16) __U);723}724725static __inline__ __m128i __DEFAULT_FN_ATTRS726_mm_maskz_sub_epi8 (__mmask16 __U, __m128i __A, __m128i __B) {727return (__m128i) __builtin_ia32_psubb128_mask ((__v16qi) __A,728(__v16qi) __B,729(__v16qi)730_mm_setzero_si128 (),731(__mmask16) 
__U);732}733734static __inline__ __m128i __DEFAULT_FN_ATTRS735_mm_mask_sub_epi16 (__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {736return (__m128i) __builtin_ia32_psubw128_mask ((__v8hi) __A,737(__v8hi) __B,738(__v8hi) __W,739(__mmask8) __U);740}741742static __inline__ __m128i __DEFAULT_FN_ATTRS743_mm_maskz_sub_epi16 (__mmask8 __U, __m128i __A, __m128i __B) {744return (__m128i) __builtin_ia32_psubw128_mask ((__v8hi) __A,745(__v8hi) __B,746(__v8hi)747_mm_setzero_si128 (),748(__mmask8) __U);749}750751static __inline__ __m256i __DEFAULT_FN_ATTRS752_mm256_mask_mullo_epi16 (__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {753return (__m256i) __builtin_ia32_pmullw256_mask ((__v16hi) __A,754(__v16hi) __B,755(__v16hi) __W,756(__mmask16) __U);757}758759static __inline__ __m256i __DEFAULT_FN_ATTRS760_mm256_maskz_mullo_epi16 (__mmask16 __U, __m256i __A, __m256i __B) {761return (__m256i) __builtin_ia32_pmullw256_mask ((__v16hi) __A,762(__v16hi) __B,763(__v16hi)764_mm256_setzero_si256 (),765(__mmask16) __U);766}767768static __inline__ __m128i __DEFAULT_FN_ATTRS769_mm_mask_mullo_epi16 (__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {770return (__m128i) __builtin_ia32_pmullw128_mask ((__v8hi) __A,771(__v8hi) __B,772(__v8hi) __W,773(__mmask8) __U);774}775776static __inline__ __m128i __DEFAULT_FN_ATTRS777_mm_maskz_mullo_epi16 (__mmask8 __U, __m128i __A, __m128i __B) {778return (__m128i) __builtin_ia32_pmullw128_mask ((__v8hi) __A,779(__v8hi) __B,780(__v8hi)781_mm_setzero_si128 (),782(__mmask8) __U);783}784785static __inline__ __m128i __DEFAULT_FN_ATTRS786_mm_mask_blend_epi8 (__mmask16 __U, __m128i __A, __m128i __W)787{788return (__m128i) __builtin_ia32_selectb_128 ((__mmask16) __U,789(__v16qi) __W,790(__v16qi) __A);791}792793static __inline__ __m256i __DEFAULT_FN_ATTRS794_mm256_mask_blend_epi8 (__mmask32 __U, __m256i __A, __m256i __W)795{796return (__m256i) __builtin_ia32_selectb_256 ((__mmask32) __U,797(__v32qi) __W,798(__v32qi) __A);799}800801static __inline__ 
__m128i __DEFAULT_FN_ATTRS802_mm_mask_blend_epi16 (__mmask8 __U, __m128i __A, __m128i __W)803{804return (__m128i) __builtin_ia32_selectw_128 ((__mmask8) __U,805(__v8hi) __W,806(__v8hi) __A);807}808809static __inline__ __m256i __DEFAULT_FN_ATTRS810_mm256_mask_blend_epi16 (__mmask16 __U, __m256i __A, __m256i __W)811{812return (__m256i) __builtin_ia32_selectw_256 ((__mmask16) __U,813(__v16hi) __W,814(__v16hi) __A);815}816817static __inline__ __m128i __DEFAULT_FN_ATTRS818_mm_mask_abs_epi8 (__m128i __W, __mmask16 __U, __m128i __A)819{820return (__m128i) __builtin_ia32_pabsb128_mask ((__v16qi) __A,821(__v16qi) __W,822(__mmask16) __U);823}824825static __inline__ __m128i __DEFAULT_FN_ATTRS826_mm_maskz_abs_epi8 (__mmask16 __U, __m128i __A)827{828return (__m128i) __builtin_ia32_pabsb128_mask ((__v16qi) __A,829(__v16qi) _mm_setzero_si128 (),830(__mmask16) __U);831}832833static __inline__ __m256i __DEFAULT_FN_ATTRS834_mm256_mask_abs_epi8 (__m256i __W, __mmask32 __U, __m256i __A)835{836return (__m256i) __builtin_ia32_pabsb256_mask ((__v32qi) __A,837(__v32qi) __W,838(__mmask32) __U);839}840841static __inline__ __m256i __DEFAULT_FN_ATTRS842_mm256_maskz_abs_epi8 (__mmask32 __U, __m256i __A)843{844return (__m256i) __builtin_ia32_pabsb256_mask ((__v32qi) __A,845(__v32qi) _mm256_setzero_si256 (),846(__mmask32) __U);847}848849static __inline__ __m128i __DEFAULT_FN_ATTRS850_mm_mask_abs_epi16 (__m128i __W, __mmask8 __U, __m128i __A)851{852return (__m128i) __builtin_ia32_pabsw128_mask ((__v8hi) __A,853(__v8hi) __W,854(__mmask8) __U);855}856857static __inline__ __m128i __DEFAULT_FN_ATTRS858_mm_maskz_abs_epi16 (__mmask8 __U, __m128i __A)859{860return (__m128i) __builtin_ia32_pabsw128_mask ((__v8hi) __A,861(__v8hi) _mm_setzero_si128 (),862(__mmask8) __U);863}864865static __inline__ __m256i __DEFAULT_FN_ATTRS866_mm256_mask_abs_epi16 (__m256i __W, __mmask16 __U, __m256i __A)867{868return (__m256i) __builtin_ia32_pabsw256_mask ((__v16hi) __A,869(__v16hi) __W,870(__mmask16) 
__U);871}872873static __inline__ __m256i __DEFAULT_FN_ATTRS874_mm256_maskz_abs_epi16 (__mmask16 __U, __m256i __A)875{876return (__m256i) __builtin_ia32_pabsw256_mask ((__v16hi) __A,877(__v16hi) _mm256_setzero_si256 (),878(__mmask16) __U);879}880881static __inline__ __m128i __DEFAULT_FN_ATTRS882_mm_maskz_packs_epi32 (__mmask8 __M, __m128i __A, __m128i __B)883{884return (__m128i) __builtin_ia32_packssdw128_mask ((__v4si) __A,885(__v4si) __B,886(__v8hi) _mm_setzero_si128 (), __M);887}888889static __inline__ __m128i __DEFAULT_FN_ATTRS890_mm_mask_packs_epi32 (__m128i __W, __mmask16 __M, __m128i __A,891__m128i __B)892{893return (__m128i) __builtin_ia32_packssdw128_mask ((__v4si) __A,894(__v4si) __B,895(__v8hi) __W, __M);896}897898static __inline__ __m256i __DEFAULT_FN_ATTRS899_mm256_maskz_packs_epi32 (__mmask16 __M, __m256i __A, __m256i __B)900{901return (__m256i) __builtin_ia32_packssdw256_mask ((__v8si) __A,902(__v8si) __B,903(__v16hi) _mm256_setzero_si256 (),904__M);905}906907static __inline__ __m256i __DEFAULT_FN_ATTRS908_mm256_mask_packs_epi32 (__m256i __W, __mmask16 __M, __m256i __A,909__m256i __B)910{911return (__m256i) __builtin_ia32_packssdw256_mask ((__v8si) __A,912(__v8si) __B,913(__v16hi) __W, __M);914}915916static __inline__ __m128i __DEFAULT_FN_ATTRS917_mm_maskz_packs_epi16 (__mmask16 __M, __m128i __A, __m128i __B)918{919return (__m128i) __builtin_ia32_packsswb128_mask ((__v8hi) __A,920(__v8hi) __B,921(__v16qi) _mm_setzero_si128 (),922__M);923}924925static __inline__ __m128i __DEFAULT_FN_ATTRS926_mm_mask_packs_epi16 (__m128i __W, __mmask16 __M, __m128i __A,927__m128i __B)928{929return (__m128i) __builtin_ia32_packsswb128_mask ((__v8hi) __A,930(__v8hi) __B,931(__v16qi) __W,932__M);933}934935static __inline__ __m256i __DEFAULT_FN_ATTRS936_mm256_maskz_packs_epi16 (__mmask32 __M, __m256i __A, __m256i __B)937{938return (__m256i) __builtin_ia32_packsswb256_mask ((__v16hi) __A,939(__v16hi) __B,940(__v32qi) _mm256_setzero_si256 (),941__M);942}943944static 
__inline__ __m256i __DEFAULT_FN_ATTRS945_mm256_mask_packs_epi16 (__m256i __W, __mmask32 __M, __m256i __A,946__m256i __B)947{948return (__m256i) __builtin_ia32_packsswb256_mask ((__v16hi) __A,949(__v16hi) __B,950(__v32qi) __W,951__M);952}953954static __inline__ __m128i __DEFAULT_FN_ATTRS955_mm_maskz_packus_epi32 (__mmask8 __M, __m128i __A, __m128i __B)956{957return (__m128i) __builtin_ia32_packusdw128_mask ((__v4si) __A,958(__v4si) __B,959(__v8hi) _mm_setzero_si128 (),960__M);961}962963static __inline__ __m128i __DEFAULT_FN_ATTRS964_mm_mask_packus_epi32 (__m128i __W, __mmask16 __M, __m128i __A,965__m128i __B)966{967return (__m128i) __builtin_ia32_packusdw128_mask ((__v4si) __A,968(__v4si) __B,969(__v8hi) __W, __M);970}971972static __inline__ __m256i __DEFAULT_FN_ATTRS973_mm256_maskz_packus_epi32 (__mmask16 __M, __m256i __A, __m256i __B)974{975return (__m256i) __builtin_ia32_packusdw256_mask ((__v8si) __A,976(__v8si) __B,977(__v16hi) _mm256_setzero_si256 (),978__M);979}980981static __inline__ __m256i __DEFAULT_FN_ATTRS982_mm256_mask_packus_epi32 (__m256i __W, __mmask16 __M, __m256i __A,983__m256i __B)984{985return (__m256i) __builtin_ia32_packusdw256_mask ((__v8si) __A,986(__v8si) __B,987(__v16hi) __W,988__M);989}990991static __inline__ __m128i __DEFAULT_FN_ATTRS992_mm_maskz_packus_epi16 (__mmask16 __M, __m128i __A, __m128i __B)993{994return (__m128i) __builtin_ia32_packuswb128_mask ((__v8hi) __A,995(__v8hi) __B,996(__v16qi) _mm_setzero_si128 (),997__M);998}9991000static __inline__ __m128i __DEFAULT_FN_ATTRS1001_mm_mask_packus_epi16 (__m128i __W, __mmask16 __M, __m128i __A,1002__m128i __B)1003{1004return (__m128i) __builtin_ia32_packuswb128_mask ((__v8hi) __A,1005(__v8hi) __B,1006(__v16qi) __W,1007__M);1008}10091010static __inline__ __m256i __DEFAULT_FN_ATTRS1011_mm256_maskz_packus_epi16 (__mmask32 __M, __m256i __A, __m256i __B)1012{1013return (__m256i) __builtin_ia32_packuswb256_mask ((__v16hi) __A,1014(__v16hi) __B,1015(__v32qi) _mm256_setzero_si256 
(),1016__M);1017}10181019static __inline__ __m256i __DEFAULT_FN_ATTRS1020_mm256_mask_packus_epi16 (__m256i __W, __mmask32 __M, __m256i __A,1021__m256i __B)1022{1023return (__m256i) __builtin_ia32_packuswb256_mask ((__v16hi) __A,1024(__v16hi) __B,1025(__v32qi) __W,1026__M);1027}10281029static __inline__ __m128i __DEFAULT_FN_ATTRS1030_mm_mask_adds_epi8 (__m128i __W, __mmask16 __U, __m128i __A,1031__m128i __B)1032{1033return (__m128i) __builtin_ia32_paddsb128_mask ((__v16qi) __A,1034(__v16qi) __B,1035(__v16qi) __W,1036(__mmask16) __U);1037}10381039static __inline__ __m128i __DEFAULT_FN_ATTRS1040_mm_maskz_adds_epi8 (__mmask16 __U, __m128i __A, __m128i __B)1041{1042return (__m128i) __builtin_ia32_paddsb128_mask ((__v16qi) __A,1043(__v16qi) __B,1044(__v16qi) _mm_setzero_si128 (),1045(__mmask16) __U);1046}10471048static __inline__ __m256i __DEFAULT_FN_ATTRS1049_mm256_mask_adds_epi8 (__m256i __W, __mmask32 __U, __m256i __A,1050__m256i __B)1051{1052return (__m256i) __builtin_ia32_paddsb256_mask ((__v32qi) __A,1053(__v32qi) __B,1054(__v32qi) __W,1055(__mmask32) __U);1056}10571058static __inline__ __m256i __DEFAULT_FN_ATTRS1059_mm256_maskz_adds_epi8 (__mmask32 __U, __m256i __A, __m256i __B)1060{1061return (__m256i) __builtin_ia32_paddsb256_mask ((__v32qi) __A,1062(__v32qi) __B,1063(__v32qi) _mm256_setzero_si256 (),1064(__mmask32) __U);1065}10661067static __inline__ __m128i __DEFAULT_FN_ATTRS1068_mm_mask_adds_epi16 (__m128i __W, __mmask8 __U, __m128i __A,1069__m128i __B)1070{1071return (__m128i) __builtin_ia32_paddsw128_mask ((__v8hi) __A,1072(__v8hi) __B,1073(__v8hi) __W,1074(__mmask8) __U);1075}10761077static __inline__ __m128i __DEFAULT_FN_ATTRS1078_mm_maskz_adds_epi16 (__mmask8 __U, __m128i __A, __m128i __B)1079{1080return (__m128i) __builtin_ia32_paddsw128_mask ((__v8hi) __A,1081(__v8hi) __B,1082(__v8hi) _mm_setzero_si128 (),1083(__mmask8) __U);1084}10851086static __inline__ __m256i __DEFAULT_FN_ATTRS1087_mm256_mask_adds_epi16 (__m256i __W, __mmask16 __U, __m256i 
__A,1088__m256i __B)1089{1090return (__m256i) __builtin_ia32_paddsw256_mask ((__v16hi) __A,1091(__v16hi) __B,1092(__v16hi) __W,1093(__mmask16) __U);1094}10951096static __inline__ __m256i __DEFAULT_FN_ATTRS1097_mm256_maskz_adds_epi16 (__mmask16 __U, __m256i __A, __m256i __B)1098{1099return (__m256i) __builtin_ia32_paddsw256_mask ((__v16hi) __A,1100(__v16hi) __B,1101(__v16hi) _mm256_setzero_si256 (),1102(__mmask16) __U);1103}11041105static __inline__ __m128i __DEFAULT_FN_ATTRS1106_mm_mask_adds_epu8 (__m128i __W, __mmask16 __U, __m128i __A,1107__m128i __B)1108{1109return (__m128i) __builtin_ia32_paddusb128_mask ((__v16qi) __A,1110(__v16qi) __B,1111(__v16qi) __W,1112(__mmask16) __U);1113}11141115static __inline__ __m128i __DEFAULT_FN_ATTRS1116_mm_maskz_adds_epu8 (__mmask16 __U, __m128i __A, __m128i __B)1117{1118return (__m128i) __builtin_ia32_paddusb128_mask ((__v16qi) __A,1119(__v16qi) __B,1120(__v16qi) _mm_setzero_si128 (),1121(__mmask16) __U);1122}11231124static __inline__ __m256i __DEFAULT_FN_ATTRS1125_mm256_mask_adds_epu8 (__m256i __W, __mmask32 __U, __m256i __A,1126__m256i __B)1127{1128return (__m256i) __builtin_ia32_paddusb256_mask ((__v32qi) __A,1129(__v32qi) __B,1130(__v32qi) __W,1131(__mmask32) __U);1132}11331134static __inline__ __m256i __DEFAULT_FN_ATTRS1135_mm256_maskz_adds_epu8 (__mmask32 __U, __m256i __A, __m256i __B)1136{1137return (__m256i) __builtin_ia32_paddusb256_mask ((__v32qi) __A,1138(__v32qi) __B,1139(__v32qi) _mm256_setzero_si256 (),1140(__mmask32) __U);1141}11421143static __inline__ __m128i __DEFAULT_FN_ATTRS1144_mm_mask_adds_epu16 (__m128i __W, __mmask8 __U, __m128i __A,1145__m128i __B)1146{1147return (__m128i) __builtin_ia32_paddusw128_mask ((__v8hi) __A,1148(__v8hi) __B,1149(__v8hi) __W,1150(__mmask8) __U);1151}11521153static __inline__ __m128i __DEFAULT_FN_ATTRS1154_mm_maskz_adds_epu16 (__mmask8 __U, __m128i __A, __m128i __B)1155{1156return (__m128i) __builtin_ia32_paddusw128_mask ((__v8hi) __A,1157(__v8hi) __B,1158(__v8hi) 
_mm_setzero_si128 (),1159(__mmask8) __U);1160}11611162static __inline__ __m256i __DEFAULT_FN_ATTRS1163_mm256_mask_adds_epu16 (__m256i __W, __mmask16 __U, __m256i __A,1164__m256i __B)1165{1166return (__m256i) __builtin_ia32_paddusw256_mask ((__v16hi) __A,1167(__v16hi) __B,1168(__v16hi) __W,1169(__mmask16) __U);1170}11711172static __inline__ __m256i __DEFAULT_FN_ATTRS1173_mm256_maskz_adds_epu16 (__mmask16 __U, __m256i __A, __m256i __B)1174{1175return (__m256i) __builtin_ia32_paddusw256_mask ((__v16hi) __A,1176(__v16hi) __B,1177(__v16hi) _mm256_setzero_si256 (),1178(__mmask16) __U);1179}11801181static __inline__ __m128i __DEFAULT_FN_ATTRS1182_mm_mask_avg_epu8 (__m128i __W, __mmask16 __U, __m128i __A,1183__m128i __B)1184{1185return (__m128i) __builtin_ia32_pavgb128_mask ((__v16qi) __A,1186(__v16qi) __B,1187(__v16qi) __W,1188(__mmask16) __U);1189}11901191static __inline__ __m128i __DEFAULT_FN_ATTRS1192_mm_maskz_avg_epu8 (__mmask16 __U, __m128i __A, __m128i __B)1193{1194return (__m128i) __builtin_ia32_pavgb128_mask ((__v16qi) __A,1195(__v16qi) __B,1196(__v16qi) _mm_setzero_si128 (),1197(__mmask16) __U);1198}11991200static __inline__ __m256i __DEFAULT_FN_ATTRS1201_mm256_mask_avg_epu8 (__m256i __W, __mmask32 __U, __m256i __A,1202__m256i __B)1203{1204return (__m256i) __builtin_ia32_pavgb256_mask ((__v32qi) __A,1205(__v32qi) __B,1206(__v32qi) __W,1207(__mmask32) __U);1208}12091210static __inline__ __m256i __DEFAULT_FN_ATTRS1211_mm256_maskz_avg_epu8 (__mmask32 __U, __m256i __A, __m256i __B)1212{1213return (__m256i) __builtin_ia32_pavgb256_mask ((__v32qi) __A,1214(__v32qi) __B,1215(__v32qi) _mm256_setzero_si256 (),1216(__mmask32) __U);1217}12181219static __inline__ __m128i __DEFAULT_FN_ATTRS1220_mm_mask_avg_epu16 (__m128i __W, __mmask8 __U, __m128i __A,1221__m128i __B)1222{1223return (__m128i) __builtin_ia32_pavgw128_mask ((__v8hi) __A,1224(__v8hi) __B,1225(__v8hi) __W,1226(__mmask8) __U);1227}12281229static __inline__ __m128i __DEFAULT_FN_ATTRS1230_mm_maskz_avg_epu16 
(__mmask8 __U, __m128i __A, __m128i __B)1231{1232return (__m128i) __builtin_ia32_pavgw128_mask ((__v8hi) __A,1233(__v8hi) __B,1234(__v8hi) _mm_setzero_si128 (),1235(__mmask8) __U);1236}12371238static __inline__ __m256i __DEFAULT_FN_ATTRS1239_mm256_mask_avg_epu16 (__m256i __W, __mmask16 __U, __m256i __A,1240__m256i __B)1241{1242return (__m256i) __builtin_ia32_pavgw256_mask ((__v16hi) __A,1243(__v16hi) __B,1244(__v16hi) __W,1245(__mmask16) __U);1246}12471248static __inline__ __m256i __DEFAULT_FN_ATTRS1249_mm256_maskz_avg_epu16 (__mmask16 __U, __m256i __A, __m256i __B)1250{1251return (__m256i) __builtin_ia32_pavgw256_mask ((__v16hi) __A,1252(__v16hi) __B,1253(__v16hi) _mm256_setzero_si256 (),1254(__mmask16) __U);1255}12561257static __inline__ __m128i __DEFAULT_FN_ATTRS1258_mm_maskz_max_epi8 (__mmask16 __M, __m128i __A, __m128i __B)1259{1260return (__m128i) __builtin_ia32_pmaxsb128_mask ((__v16qi) __A,1261(__v16qi) __B,1262(__v16qi) _mm_setzero_si128 (),1263(__mmask16) __M);1264}12651266static __inline__ __m128i __DEFAULT_FN_ATTRS1267_mm_mask_max_epi8 (__m128i __W, __mmask16 __M, __m128i __A,1268__m128i __B)1269{1270return (__m128i) __builtin_ia32_pmaxsb128_mask ((__v16qi) __A,1271(__v16qi) __B,1272(__v16qi) __W,1273(__mmask16) __M);1274}12751276static __inline__ __m256i __DEFAULT_FN_ATTRS1277_mm256_maskz_max_epi8 (__mmask32 __M, __m256i __A, __m256i __B)1278{1279return (__m256i) __builtin_ia32_pmaxsb256_mask ((__v32qi) __A,1280(__v32qi) __B,1281(__v32qi) _mm256_setzero_si256 (),1282(__mmask32) __M);1283}12841285static __inline__ __m256i __DEFAULT_FN_ATTRS1286_mm256_mask_max_epi8 (__m256i __W, __mmask32 __M, __m256i __A,1287__m256i __B)1288{1289return (__m256i) __builtin_ia32_pmaxsb256_mask ((__v32qi) __A,1290(__v32qi) __B,1291(__v32qi) __W,1292(__mmask32) __M);1293}12941295static __inline__ __m128i __DEFAULT_FN_ATTRS1296_mm_maskz_max_epi16 (__mmask8 __M, __m128i __A, __m128i __B)1297{1298return (__m128i) __builtin_ia32_pmaxsw128_mask ((__v8hi) __A,1299(__v8hi) 
__B,1300(__v8hi) _mm_setzero_si128 (),1301(__mmask8) __M);1302}13031304static __inline__ __m128i __DEFAULT_FN_ATTRS1305_mm_mask_max_epi16 (__m128i __W, __mmask8 __M, __m128i __A,1306__m128i __B)1307{1308return (__m128i) __builtin_ia32_pmaxsw128_mask ((__v8hi) __A,1309(__v8hi) __B,1310(__v8hi) __W,1311(__mmask8) __M);1312}13131314static __inline__ __m256i __DEFAULT_FN_ATTRS1315_mm256_maskz_max_epi16 (__mmask16 __M, __m256i __A, __m256i __B)1316{1317return (__m256i) __builtin_ia32_pmaxsw256_mask ((__v16hi) __A,1318(__v16hi) __B,1319(__v16hi) _mm256_setzero_si256 (),1320(__mmask16) __M);1321}13221323static __inline__ __m256i __DEFAULT_FN_ATTRS1324_mm256_mask_max_epi16 (__m256i __W, __mmask16 __M, __m256i __A,1325__m256i __B)1326{1327return (__m256i) __builtin_ia32_pmaxsw256_mask ((__v16hi) __A,1328(__v16hi) __B,1329(__v16hi) __W,1330(__mmask16) __M);1331}13321333static __inline__ __m128i __DEFAULT_FN_ATTRS1334_mm_maskz_max_epu8 (__mmask16 __M, __m128i __A, __m128i __B)1335{1336return (__m128i) __builtin_ia32_pmaxub128_mask ((__v16qi) __A,1337(__v16qi) __B,1338(__v16qi) _mm_setzero_si128 (),1339(__mmask16) __M);1340}13411342static __inline__ __m128i __DEFAULT_FN_ATTRS1343_mm_mask_max_epu8 (__m128i __W, __mmask16 __M, __m128i __A,1344__m128i __B)1345{1346return (__m128i) __builtin_ia32_pmaxub128_mask ((__v16qi) __A,1347(__v16qi) __B,1348(__v16qi) __W,1349(__mmask16) __M);1350}13511352static __inline__ __m256i __DEFAULT_FN_ATTRS1353_mm256_maskz_max_epu8 (__mmask32 __M, __m256i __A, __m256i __B)1354{1355return (__m256i) __builtin_ia32_pmaxub256_mask ((__v32qi) __A,1356(__v32qi) __B,1357(__v32qi) _mm256_setzero_si256 (),1358(__mmask32) __M);1359}13601361static __inline__ __m256i __DEFAULT_FN_ATTRS1362_mm256_mask_max_epu8 (__m256i __W, __mmask32 __M, __m256i __A,1363__m256i __B)1364{1365return (__m256i) __builtin_ia32_pmaxub256_mask ((__v32qi) __A,1366(__v32qi) __B,1367(__v32qi) __W,1368(__mmask32) __M);1369}13701371static __inline__ __m128i 
__DEFAULT_FN_ATTRS1372_mm_maskz_max_epu16 (__mmask8 __M, __m128i __A, __m128i __B)1373{1374return (__m128i) __builtin_ia32_pmaxuw128_mask ((__v8hi) __A,1375(__v8hi) __B,1376(__v8hi) _mm_setzero_si128 (),1377(__mmask8) __M);1378}13791380static __inline__ __m128i __DEFAULT_FN_ATTRS1381_mm_mask_max_epu16 (__m128i __W, __mmask8 __M, __m128i __A,1382__m128i __B)1383{1384return (__m128i) __builtin_ia32_pmaxuw128_mask ((__v8hi) __A,1385(__v8hi) __B,1386(__v8hi) __W,1387(__mmask8) __M);1388}13891390static __inline__ __m256i __DEFAULT_FN_ATTRS1391_mm256_maskz_max_epu16 (__mmask16 __M, __m256i __A, __m256i __B)1392{1393return (__m256i) __builtin_ia32_pmaxuw256_mask ((__v16hi) __A,1394(__v16hi) __B,1395(__v16hi) _mm256_setzero_si256 (),1396(__mmask16) __M);1397}13981399static __inline__ __m256i __DEFAULT_FN_ATTRS1400_mm256_mask_max_epu16 (__m256i __W, __mmask16 __M, __m256i __A,1401__m256i __B)1402{1403return (__m256i) __builtin_ia32_pmaxuw256_mask ((__v16hi) __A,1404(__v16hi) __B,1405(__v16hi) __W,1406(__mmask16) __M);1407}14081409static __inline__ __m128i __DEFAULT_FN_ATTRS1410_mm_maskz_min_epi8 (__mmask16 __M, __m128i __A, __m128i __B)1411{1412return (__m128i) __builtin_ia32_pminsb128_mask ((__v16qi) __A,1413(__v16qi) __B,1414(__v16qi) _mm_setzero_si128 (),1415(__mmask16) __M);1416}14171418static __inline__ __m128i __DEFAULT_FN_ATTRS1419_mm_mask_min_epi8 (__m128i __W, __mmask16 __M, __m128i __A,1420__m128i __B)1421{1422return (__m128i) __builtin_ia32_pminsb128_mask ((__v16qi) __A,1423(__v16qi) __B,1424(__v16qi) __W,1425(__mmask16) __M);1426}14271428static __inline__ __m256i __DEFAULT_FN_ATTRS1429_mm256_maskz_min_epi8 (__mmask32 __M, __m256i __A, __m256i __B)1430{1431return (__m256i) __builtin_ia32_pminsb256_mask ((__v32qi) __A,1432(__v32qi) __B,1433(__v32qi) _mm256_setzero_si256 (),1434(__mmask32) __M);1435}14361437static __inline__ __m256i __DEFAULT_FN_ATTRS1438_mm256_mask_min_epi8 (__m256i __W, __mmask32 __M, __m256i __A,1439__m256i __B)1440{1441return (__m256i) 
__builtin_ia32_pminsb256_mask ((__v32qi) __A,1442(__v32qi) __B,1443(__v32qi) __W,1444(__mmask32) __M);1445}14461447static __inline__ __m128i __DEFAULT_FN_ATTRS1448_mm_maskz_min_epi16 (__mmask8 __M, __m128i __A, __m128i __B)1449{1450return (__m128i) __builtin_ia32_pminsw128_mask ((__v8hi) __A,1451(__v8hi) __B,1452(__v8hi) _mm_setzero_si128 (),1453(__mmask8) __M);1454}14551456static __inline__ __m128i __DEFAULT_FN_ATTRS1457_mm_mask_min_epi16 (__m128i __W, __mmask8 __M, __m128i __A,1458__m128i __B)1459{1460return (__m128i) __builtin_ia32_pminsw128_mask ((__v8hi) __A,1461(__v8hi) __B,1462(__v8hi) __W,1463(__mmask8) __M);1464}14651466static __inline__ __m256i __DEFAULT_FN_ATTRS1467_mm256_maskz_min_epi16 (__mmask16 __M, __m256i __A, __m256i __B)1468{1469return (__m256i) __builtin_ia32_pminsw256_mask ((__v16hi) __A,1470(__v16hi) __B,1471(__v16hi) _mm256_setzero_si256 (),1472(__mmask16) __M);1473}14741475static __inline__ __m256i __DEFAULT_FN_ATTRS1476_mm256_mask_min_epi16 (__m256i __W, __mmask16 __M, __m256i __A,1477__m256i __B)1478{1479return (__m256i) __builtin_ia32_pminsw256_mask ((__v16hi) __A,1480(__v16hi) __B,1481(__v16hi) __W,1482(__mmask16) __M);1483}14841485static __inline__ __m128i __DEFAULT_FN_ATTRS1486_mm_maskz_min_epu8 (__mmask16 __M, __m128i __A, __m128i __B)1487{1488return (__m128i) __builtin_ia32_pminub128_mask ((__v16qi) __A,1489(__v16qi) __B,1490(__v16qi) _mm_setzero_si128 (),1491(__mmask16) __M);1492}14931494static __inline__ __m128i __DEFAULT_FN_ATTRS1495_mm_mask_min_epu8 (__m128i __W, __mmask16 __M, __m128i __A,1496__m128i __B)1497{1498return (__m128i) __builtin_ia32_pminub128_mask ((__v16qi) __A,1499(__v16qi) __B,1500(__v16qi) __W,1501(__mmask16) __M);1502}15031504static __inline__ __m256i __DEFAULT_FN_ATTRS1505_mm256_maskz_min_epu8 (__mmask32 __M, __m256i __A, __m256i __B)1506{1507return (__m256i) __builtin_ia32_pminub256_mask ((__v32qi) __A,1508(__v32qi) __B,1509(__v32qi) _mm256_setzero_si256 (),1510(__mmask32) __M);1511}15121513static __inline__ 
__m256i __DEFAULT_FN_ATTRS1514_mm256_mask_min_epu8 (__m256i __W, __mmask32 __M, __m256i __A,1515__m256i __B)1516{1517return (__m256i) __builtin_ia32_pminub256_mask ((__v32qi) __A,1518(__v32qi) __B,1519(__v32qi) __W,1520(__mmask32) __M);1521}15221523static __inline__ __m128i __DEFAULT_FN_ATTRS1524_mm_maskz_min_epu16 (__mmask8 __M, __m128i __A, __m128i __B)1525{1526return (__m128i) __builtin_ia32_pminuw128_mask ((__v8hi) __A,1527(__v8hi) __B,1528(__v8hi) _mm_setzero_si128 (),1529(__mmask8) __M);1530}15311532static __inline__ __m128i __DEFAULT_FN_ATTRS1533_mm_mask_min_epu16 (__m128i __W, __mmask8 __M, __m128i __A,1534__m128i __B)1535{1536return (__m128i) __builtin_ia32_pminuw128_mask ((__v8hi) __A,1537(__v8hi) __B,1538(__v8hi) __W,1539(__mmask8) __M);1540}15411542static __inline__ __m256i __DEFAULT_FN_ATTRS1543_mm256_maskz_min_epu16 (__mmask16 __M, __m256i __A, __m256i __B)1544{1545return (__m256i) __builtin_ia32_pminuw256_mask ((__v16hi) __A,1546(__v16hi) __B,1547(__v16hi) _mm256_setzero_si256 (),1548(__mmask16) __M);1549}15501551static __inline__ __m256i __DEFAULT_FN_ATTRS1552_mm256_mask_min_epu16 (__m256i __W, __mmask16 __M, __m256i __A,1553__m256i __B)1554{1555return (__m256i) __builtin_ia32_pminuw256_mask ((__v16hi) __A,1556(__v16hi) __B,1557(__v16hi) __W,1558(__mmask16) __M);1559}15601561static __inline__ __m128i __DEFAULT_FN_ATTRS1562_mm_mask_shuffle_epi8 (__m128i __W, __mmask16 __U, __m128i __A,1563__m128i __B)1564{1565return (__m128i) __builtin_ia32_pshufb128_mask ((__v16qi) __A,1566(__v16qi) __B,1567(__v16qi) __W,1568(__mmask16) __U);1569}15701571static __inline__ __m128i __DEFAULT_FN_ATTRS1572_mm_maskz_shuffle_epi8 (__mmask16 __U, __m128i __A, __m128i __B)1573{1574return (__m128i) __builtin_ia32_pshufb128_mask ((__v16qi) __A,1575(__v16qi) __B,1576(__v16qi) _mm_setzero_si128 (),1577(__mmask16) __U);1578}15791580static __inline__ __m256i __DEFAULT_FN_ATTRS1581_mm256_mask_shuffle_epi8 (__m256i __W, __mmask32 __U, __m256i __A,1582__m256i __B)1583{1584return 
(__m256i) __builtin_ia32_pshufb256_mask ((__v32qi) __A,1585(__v32qi) __B,1586(__v32qi) __W,1587(__mmask32) __U);1588}15891590static __inline__ __m256i __DEFAULT_FN_ATTRS1591_mm256_maskz_shuffle_epi8 (__mmask32 __U, __m256i __A, __m256i __B)1592{1593return (__m256i) __builtin_ia32_pshufb256_mask ((__v32qi) __A,1594(__v32qi) __B,1595(__v32qi) _mm256_setzero_si256 (),1596(__mmask32) __U);1597}15981599static __inline__ __m128i __DEFAULT_FN_ATTRS1600_mm_mask_subs_epi8 (__m128i __W, __mmask16 __U, __m128i __A,1601__m128i __B)1602{1603return (__m128i) __builtin_ia32_psubsb128_mask ((__v16qi) __A,1604(__v16qi) __B,1605(__v16qi) __W,1606(__mmask16) __U);1607}16081609static __inline__ __m128i __DEFAULT_FN_ATTRS1610_mm_maskz_subs_epi8 (__mmask16 __U, __m128i __A, __m128i __B)1611{1612return (__m128i) __builtin_ia32_psubsb128_mask ((__v16qi) __A,1613(__v16qi) __B,1614(__v16qi) _mm_setzero_si128 (),1615(__mmask16) __U);1616}16171618static __inline__ __m256i __DEFAULT_FN_ATTRS1619_mm256_mask_subs_epi8 (__m256i __W, __mmask32 __U, __m256i __A,1620__m256i __B)1621{1622return (__m256i) __builtin_ia32_psubsb256_mask ((__v32qi) __A,1623(__v32qi) __B,1624(__v32qi) __W,1625(__mmask32) __U);1626}16271628static __inline__ __m256i __DEFAULT_FN_ATTRS1629_mm256_maskz_subs_epi8 (__mmask32 __U, __m256i __A, __m256i __B)1630{1631return (__m256i) __builtin_ia32_psubsb256_mask ((__v32qi) __A,1632(__v32qi) __B,1633(__v32qi) _mm256_setzero_si256 (),1634(__mmask32) __U);1635}16361637static __inline__ __m128i __DEFAULT_FN_ATTRS1638_mm_mask_subs_epi16 (__m128i __W, __mmask8 __U, __m128i __A,1639__m128i __B)1640{1641return (__m128i) __builtin_ia32_psubsw128_mask ((__v8hi) __A,1642(__v8hi) __B,1643(__v8hi) __W,1644(__mmask8) __U);1645}16461647static __inline__ __m128i __DEFAULT_FN_ATTRS1648_mm_maskz_subs_epi16 (__mmask8 __U, __m128i __A, __m128i __B)1649{1650return (__m128i) __builtin_ia32_psubsw128_mask ((__v8hi) __A,1651(__v8hi) __B,1652(__v8hi) _mm_setzero_si128 (),1653(__mmask8) 
__U);1654}16551656static __inline__ __m256i __DEFAULT_FN_ATTRS1657_mm256_mask_subs_epi16 (__m256i __W, __mmask16 __U, __m256i __A,1658__m256i __B)1659{1660return (__m256i) __builtin_ia32_psubsw256_mask ((__v16hi) __A,1661(__v16hi) __B,1662(__v16hi) __W,1663(__mmask16) __U);1664}16651666static __inline__ __m256i __DEFAULT_FN_ATTRS1667_mm256_maskz_subs_epi16 (__mmask16 __U, __m256i __A, __m256i __B)1668{1669return (__m256i) __builtin_ia32_psubsw256_mask ((__v16hi) __A,1670(__v16hi) __B,1671(__v16hi) _mm256_setzero_si256 (),1672(__mmask16) __U);1673}16741675static __inline__ __m128i __DEFAULT_FN_ATTRS1676_mm_mask_subs_epu8 (__m128i __W, __mmask16 __U, __m128i __A,1677__m128i __B)1678{1679return (__m128i) __builtin_ia32_psubusb128_mask ((__v16qi) __A,1680(__v16qi) __B,1681(__v16qi) __W,1682(__mmask16) __U);1683}16841685static __inline__ __m128i __DEFAULT_FN_ATTRS1686_mm_maskz_subs_epu8 (__mmask16 __U, __m128i __A, __m128i __B)1687{1688return (__m128i) __builtin_ia32_psubusb128_mask ((__v16qi) __A,1689(__v16qi) __B,1690(__v16qi) _mm_setzero_si128 (),1691(__mmask16) __U);1692}16931694static __inline__ __m256i __DEFAULT_FN_ATTRS1695_mm256_mask_subs_epu8 (__m256i __W, __mmask32 __U, __m256i __A,1696__m256i __B)1697{1698return (__m256i) __builtin_ia32_psubusb256_mask ((__v32qi) __A,1699(__v32qi) __B,1700(__v32qi) __W,1701(__mmask32) __U);1702}17031704static __inline__ __m256i __DEFAULT_FN_ATTRS1705_mm256_maskz_subs_epu8 (__mmask32 __U, __m256i __A, __m256i __B)1706{1707return (__m256i) __builtin_ia32_psubusb256_mask ((__v32qi) __A,1708(__v32qi) __B,1709(__v32qi) _mm256_setzero_si256 (),1710(__mmask32) __U);1711}17121713static __inline__ __m128i __DEFAULT_FN_ATTRS1714_mm_mask_subs_epu16 (__m128i __W, __mmask8 __U, __m128i __A,1715__m128i __B)1716{1717return (__m128i) __builtin_ia32_psubusw128_mask ((__v8hi) __A,1718(__v8hi) __B,1719(__v8hi) __W,1720(__mmask8) __U);1721}17221723static __inline__ __m128i __DEFAULT_FN_ATTRS1724_mm_maskz_subs_epu16 (__mmask8 __U, __m128i __A, 
__m128i __B)1725{1726return (__m128i) __builtin_ia32_psubusw128_mask ((__v8hi) __A,1727(__v8hi) __B,1728(__v8hi) _mm_setzero_si128 (),1729(__mmask8) __U);1730}17311732static __inline__ __m256i __DEFAULT_FN_ATTRS1733_mm256_mask_subs_epu16 (__m256i __W, __mmask16 __U, __m256i __A,1734__m256i __B)1735{1736return (__m256i) __builtin_ia32_psubusw256_mask ((__v16hi) __A,1737(__v16hi) __B,1738(__v16hi) __W,1739(__mmask16) __U);1740}17411742static __inline__ __m256i __DEFAULT_FN_ATTRS1743_mm256_maskz_subs_epu16 (__mmask16 __U, __m256i __A, __m256i __B)1744{1745return (__m256i) __builtin_ia32_psubusw256_mask ((__v16hi) __A,1746(__v16hi) __B,1747(__v16hi) _mm256_setzero_si256 (),1748(__mmask16) __U);1749}17501751static __inline__ __m128i __DEFAULT_FN_ATTRS1752_mm_mask2_permutex2var_epi16 (__m128i __A, __m128i __I, __mmask8 __U,1753__m128i __B)1754{1755return (__m128i) __builtin_ia32_vpermi2varhi128_mask ((__v8hi) __A,1756(__v8hi) __I /* idx */ ,1757(__v8hi) __B,1758(__mmask8) __U);1759}17601761static __inline__ __m256i __DEFAULT_FN_ATTRS1762_mm256_mask2_permutex2var_epi16 (__m256i __A, __m256i __I,1763__mmask16 __U, __m256i __B)1764{1765return (__m256i) __builtin_ia32_vpermi2varhi256_mask ((__v16hi) __A,1766(__v16hi) __I /* idx */ ,1767(__v16hi) __B,1768(__mmask16) __U);1769}17701771static __inline__ __m128i __DEFAULT_FN_ATTRS1772_mm_permutex2var_epi16 (__m128i __A, __m128i __I, __m128i __B)1773{1774return (__m128i) __builtin_ia32_vpermt2varhi128_mask ((__v8hi) __I/* idx */,1775(__v8hi) __A,1776(__v8hi) __B,1777(__mmask8) -1);1778}17791780static __inline__ __m128i __DEFAULT_FN_ATTRS1781_mm_mask_permutex2var_epi16 (__m128i __A, __mmask8 __U, __m128i __I,1782__m128i __B)1783{1784return (__m128i) __builtin_ia32_vpermt2varhi128_mask ((__v8hi) __I/* idx */,1785(__v8hi) __A,1786(__v8hi) __B,1787(__mmask8) __U);1788}17891790static __inline__ __m128i __DEFAULT_FN_ATTRS1791_mm_maskz_permutex2var_epi16 (__mmask8 __U, __m128i __A, __m128i __I,1792__m128i __B)1793{1794return (__m128i) 
__builtin_ia32_vpermt2varhi128_maskz ((__v8hi) __I/* idx */,1795(__v8hi) __A,1796(__v8hi) __B,1797(__mmask8) __U);1798}17991800static __inline__ __m256i __DEFAULT_FN_ATTRS1801_mm256_permutex2var_epi16 (__m256i __A, __m256i __I, __m256i __B)1802{1803return (__m256i) __builtin_ia32_vpermt2varhi256_mask ((__v16hi) __I/* idx */,1804(__v16hi) __A,1805(__v16hi) __B,1806(__mmask16) -1);1807}18081809static __inline__ __m256i __DEFAULT_FN_ATTRS1810_mm256_mask_permutex2var_epi16 (__m256i __A, __mmask16 __U,1811__m256i __I, __m256i __B)1812{1813return (__m256i) __builtin_ia32_vpermt2varhi256_mask ((__v16hi) __I/* idx */,1814(__v16hi) __A,1815(__v16hi) __B,1816(__mmask16) __U);1817}18181819static __inline__ __m256i __DEFAULT_FN_ATTRS1820_mm256_maskz_permutex2var_epi16 (__mmask16 __U, __m256i __A,1821__m256i __I, __m256i __B)1822{1823return (__m256i) __builtin_ia32_vpermt2varhi256_maskz ((__v16hi) __I/* idx */,1824(__v16hi) __A,1825(__v16hi) __B,1826(__mmask16) __U);1827}18281829static __inline__ __m128i __DEFAULT_FN_ATTRS1830_mm_mask_maddubs_epi16 (__m128i __W, __mmask8 __U, __m128i __X, __m128i __Y) {1831return (__m128i) __builtin_ia32_pmaddubsw128_mask ((__v16qi) __X,1832(__v16qi) __Y,1833(__v8hi) __W,1834(__mmask8) __U);1835}18361837static __inline__ __m128i __DEFAULT_FN_ATTRS1838_mm_maskz_maddubs_epi16 (__mmask8 __U, __m128i __X, __m128i __Y) {1839return (__m128i) __builtin_ia32_pmaddubsw128_mask ((__v16qi) __X,1840(__v16qi) __Y,1841(__v8hi) _mm_setzero_si128(),1842(__mmask8) __U);1843}18441845static __inline__ __m256i __DEFAULT_FN_ATTRS1846_mm256_mask_maddubs_epi16 (__m256i __W, __mmask16 __U, __m256i __X,1847__m256i __Y) {1848return (__m256i) __builtin_ia32_pmaddubsw256_mask ((__v32qi) __X,1849(__v32qi) __Y,1850(__v16hi) __W,1851(__mmask16) __U);1852}18531854static __inline__ __m256i __DEFAULT_FN_ATTRS1855_mm256_maskz_maddubs_epi16 (__mmask16 __U, __m256i __X, __m256i __Y) {1856return (__m256i) __builtin_ia32_pmaddubsw256_mask ((__v32qi) __X,1857(__v32qi) 
__Y,1858(__v16hi) _mm256_setzero_si256(),1859(__mmask16) __U);1860}18611862static __inline__ __m128i __DEFAULT_FN_ATTRS1863_mm_mask_madd_epi16 (__m128i __W, __mmask8 __U, __m128i __A,1864__m128i __B) {1865return (__m128i) __builtin_ia32_pmaddwd128_mask ((__v8hi) __A,1866(__v8hi) __B,1867(__v4si) __W,1868(__mmask8) __U);1869}18701871static __inline__ __m128i __DEFAULT_FN_ATTRS1872_mm_maskz_madd_epi16 (__mmask8 __U, __m128i __A, __m128i __B) {1873return (__m128i) __builtin_ia32_pmaddwd128_mask ((__v8hi) __A,1874(__v8hi) __B,1875(__v4si) _mm_setzero_si128(),1876(__mmask8) __U);1877}18781879static __inline__ __m256i __DEFAULT_FN_ATTRS1880_mm256_mask_madd_epi16 (__m256i __W, __mmask8 __U, __m256i __A, __m256i __B) {1881return (__m256i) __builtin_ia32_pmaddwd256_mask ((__v16hi) __A,1882(__v16hi) __B,1883(__v8si) __W,1884(__mmask8) __U);1885}18861887static __inline__ __m256i __DEFAULT_FN_ATTRS1888_mm256_maskz_madd_epi16 (__mmask8 __U, __m256i __A, __m256i __B) {1889return (__m256i) __builtin_ia32_pmaddwd256_mask ((__v16hi) __A,1890(__v16hi) __B,1891(__v8si) _mm256_setzero_si256(),1892(__mmask8) __U);1893}18941895static __inline__ __m128i __DEFAULT_FN_ATTRS1896_mm_cvtsepi16_epi8 (__m128i __A) {1897return (__m128i) __builtin_ia32_pmovswb128_mask ((__v8hi) __A,1898(__v16qi) _mm_setzero_si128(),1899(__mmask8) -1);1900}19011902static __inline__ __m128i __DEFAULT_FN_ATTRS1903_mm_mask_cvtsepi16_epi8 (__m128i __O, __mmask8 __M, __m128i __A) {1904return (__m128i) __builtin_ia32_pmovswb128_mask ((__v8hi) __A,1905(__v16qi) __O,1906__M);1907}19081909static __inline__ __m128i __DEFAULT_FN_ATTRS1910_mm_maskz_cvtsepi16_epi8 (__mmask8 __M, __m128i __A) {1911return (__m128i) __builtin_ia32_pmovswb128_mask ((__v8hi) __A,1912(__v16qi) _mm_setzero_si128(),1913__M);1914}19151916static __inline__ __m128i __DEFAULT_FN_ATTRS1917_mm256_cvtsepi16_epi8 (__m256i __A) {1918return (__m128i) __builtin_ia32_pmovswb256_mask ((__v16hi) __A,1919(__v16qi) _mm_setzero_si128(),1920(__mmask16) 
-1);1921}19221923static __inline__ __m128i __DEFAULT_FN_ATTRS1924_mm256_mask_cvtsepi16_epi8 (__m128i __O, __mmask16 __M, __m256i __A) {1925return (__m128i) __builtin_ia32_pmovswb256_mask ((__v16hi) __A,1926(__v16qi) __O,1927__M);1928}19291930static __inline__ __m128i __DEFAULT_FN_ATTRS1931_mm256_maskz_cvtsepi16_epi8 (__mmask16 __M, __m256i __A) {1932return (__m128i) __builtin_ia32_pmovswb256_mask ((__v16hi) __A,1933(__v16qi) _mm_setzero_si128(),1934__M);1935}19361937static __inline__ __m128i __DEFAULT_FN_ATTRS1938_mm_cvtusepi16_epi8 (__m128i __A) {1939return (__m128i) __builtin_ia32_pmovuswb128_mask ((__v8hi) __A,1940(__v16qi) _mm_setzero_si128(),1941(__mmask8) -1);1942}19431944static __inline__ __m128i __DEFAULT_FN_ATTRS1945_mm_mask_cvtusepi16_epi8 (__m128i __O, __mmask8 __M, __m128i __A) {1946return (__m128i) __builtin_ia32_pmovuswb128_mask ((__v8hi) __A,1947(__v16qi) __O,1948__M);1949}19501951static __inline__ __m128i __DEFAULT_FN_ATTRS1952_mm_maskz_cvtusepi16_epi8 (__mmask8 __M, __m128i __A) {1953return (__m128i) __builtin_ia32_pmovuswb128_mask ((__v8hi) __A,1954(__v16qi) _mm_setzero_si128(),1955__M);1956}19571958static __inline__ __m128i __DEFAULT_FN_ATTRS1959_mm256_cvtusepi16_epi8 (__m256i __A) {1960return (__m128i) __builtin_ia32_pmovuswb256_mask ((__v16hi) __A,1961(__v16qi) _mm_setzero_si128(),1962(__mmask16) -1);1963}19641965static __inline__ __m128i __DEFAULT_FN_ATTRS1966_mm256_mask_cvtusepi16_epi8 (__m128i __O, __mmask16 __M, __m256i __A) {1967return (__m128i) __builtin_ia32_pmovuswb256_mask ((__v16hi) __A,1968(__v16qi) __O,1969__M);1970}19711972static __inline__ __m128i __DEFAULT_FN_ATTRS1973_mm256_maskz_cvtusepi16_epi8 (__mmask16 __M, __m256i __A) {1974return (__m128i) __builtin_ia32_pmovuswb256_mask ((__v16hi) __A,1975(__v16qi) _mm_setzero_si128(),1976__M);1977}19781979static __inline__ __m128i __DEFAULT_FN_ATTRS1980_mm_cvtepi16_epi8 (__m128i __A) {19811982return (__m128i) __builtin_ia32_pmovwb128_mask ((__v8hi) __A,1983(__v16qi) 
_mm_setzero_si128(),1984(__mmask8) -1);1985}19861987static __inline__ __m128i __DEFAULT_FN_ATTRS1988_mm_mask_cvtepi16_epi8 (__m128i __O, __mmask8 __M, __m128i __A) {1989return (__m128i) __builtin_ia32_pmovwb128_mask ((__v8hi) __A,1990(__v16qi) __O,1991__M);1992}19931994static __inline__ __m128i __DEFAULT_FN_ATTRS1995_mm_maskz_cvtepi16_epi8 (__mmask8 __M, __m128i __A) {1996return (__m128i) __builtin_ia32_pmovwb128_mask ((__v8hi) __A,1997(__v16qi) _mm_setzero_si128(),1998__M);1999}20002001static __inline__ void __DEFAULT_FN_ATTRS2002_mm_mask_cvtepi16_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)2003{2004__builtin_ia32_pmovwb128mem_mask ((__v16qi *) __P, (__v8hi) __A, __M);2005}200620072008static __inline__ void __DEFAULT_FN_ATTRS2009_mm_mask_cvtsepi16_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)2010{2011__builtin_ia32_pmovswb128mem_mask ((__v16qi *) __P, (__v8hi) __A, __M);2012}20132014static __inline__ void __DEFAULT_FN_ATTRS2015_mm_mask_cvtusepi16_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)2016{2017__builtin_ia32_pmovuswb128mem_mask ((__v16qi *) __P, (__v8hi) __A, __M);2018}20192020static __inline__ __m128i __DEFAULT_FN_ATTRS2021_mm256_cvtepi16_epi8 (__m256i __A) {2022return (__m128i) __builtin_ia32_pmovwb256_mask ((__v16hi) __A,2023(__v16qi) _mm_setzero_si128(),2024(__mmask16) -1);2025}20262027static __inline__ __m128i __DEFAULT_FN_ATTRS2028_mm256_mask_cvtepi16_epi8 (__m128i __O, __mmask16 __M, __m256i __A) {2029return (__m128i) __builtin_ia32_pmovwb256_mask ((__v16hi) __A,2030(__v16qi) __O,2031__M);2032}20332034static __inline__ __m128i __DEFAULT_FN_ATTRS2035_mm256_maskz_cvtepi16_epi8 (__mmask16 __M, __m256i __A) {2036return (__m128i) __builtin_ia32_pmovwb256_mask ((__v16hi) __A,2037(__v16qi) _mm_setzero_si128(),2038__M);2039}20402041static __inline__ void __DEFAULT_FN_ATTRS2042_mm256_mask_cvtepi16_storeu_epi8 (void * __P, __mmask16 __M, __m256i __A)2043{2044__builtin_ia32_pmovwb256mem_mask ((__v16qi *) __P, (__v16hi) __A, 
__M);2045}20462047static __inline__ void __DEFAULT_FN_ATTRS2048_mm256_mask_cvtsepi16_storeu_epi8 (void * __P, __mmask16 __M, __m256i __A)2049{2050__builtin_ia32_pmovswb256mem_mask ((__v16qi *) __P, (__v16hi) __A, __M);2051}20522053static __inline__ void __DEFAULT_FN_ATTRS2054_mm256_mask_cvtusepi16_storeu_epi8 (void * __P, __mmask8 __M, __m256i __A)2055{2056__builtin_ia32_pmovuswb256mem_mask ((__v16qi*) __P, (__v16hi) __A, __M);2057}2058static __inline__ __m128i __DEFAULT_FN_ATTRS2059_mm_mask_mulhrs_epi16 (__m128i __W, __mmask8 __U, __m128i __X, __m128i __Y) {2060return (__m128i) __builtin_ia32_pmulhrsw128_mask ((__v8hi) __X,2061(__v8hi) __Y,2062(__v8hi) __W,2063(__mmask8) __U);2064}20652066static __inline__ __m128i __DEFAULT_FN_ATTRS2067_mm_maskz_mulhrs_epi16 (__mmask8 __U, __m128i __X, __m128i __Y) {2068return (__m128i) __builtin_ia32_pmulhrsw128_mask ((__v8hi) __X,2069(__v8hi) __Y,2070(__v8hi) _mm_setzero_si128(),2071(__mmask8) __U);2072}20732074static __inline__ __m256i __DEFAULT_FN_ATTRS2075_mm256_mask_mulhrs_epi16 (__m256i __W, __mmask16 __U, __m256i __X, __m256i __Y) {2076return (__m256i) __builtin_ia32_pmulhrsw256_mask ((__v16hi) __X,2077(__v16hi) __Y,2078(__v16hi) __W,2079(__mmask16) __U);2080}20812082static __inline__ __m256i __DEFAULT_FN_ATTRS2083_mm256_maskz_mulhrs_epi16 (__mmask16 __U, __m256i __X, __m256i __Y) {2084return (__m256i) __builtin_ia32_pmulhrsw256_mask ((__v16hi) __X,2085(__v16hi) __Y,2086(__v16hi) _mm256_setzero_si256(),2087(__mmask16) __U);2088}20892090static __inline__ __m128i __DEFAULT_FN_ATTRS2091_mm_mask_mulhi_epu16 (__m128i __W, __mmask8 __U, __m128i __A,2092__m128i __B) {2093return (__m128i) __builtin_ia32_pmulhuw128_mask ((__v8hi) __A,2094(__v8hi) __B,2095(__v8hi) __W,2096(__mmask8) __U);2097}20982099static __inline__ __m128i __DEFAULT_FN_ATTRS2100_mm_maskz_mulhi_epu16 (__mmask8 __U, __m128i __A, __m128i __B) {2101return (__m128i) __builtin_ia32_pmulhuw128_mask ((__v8hi) __A,2102(__v8hi) __B,2103(__v8hi) 
_mm_setzero_si128(),2104(__mmask8) __U);2105}21062107static __inline__ __m256i __DEFAULT_FN_ATTRS2108_mm256_mask_mulhi_epu16 (__m256i __W, __mmask16 __U, __m256i __A,2109__m256i __B) {2110return (__m256i) __builtin_ia32_pmulhuw256_mask ((__v16hi) __A,2111(__v16hi) __B,2112(__v16hi) __W,2113(__mmask16) __U);2114}21152116static __inline__ __m256i __DEFAULT_FN_ATTRS2117_mm256_maskz_mulhi_epu16 (__mmask16 __U, __m256i __A, __m256i __B) {2118return (__m256i) __builtin_ia32_pmulhuw256_mask ((__v16hi) __A,2119(__v16hi) __B,2120(__v16hi) _mm256_setzero_si256(),2121(__mmask16) __U);2122}21232124static __inline__ __m128i __DEFAULT_FN_ATTRS2125_mm_mask_mulhi_epi16 (__m128i __W, __mmask8 __U, __m128i __A,2126__m128i __B) {2127return (__m128i) __builtin_ia32_pmulhw128_mask ((__v8hi) __A,2128(__v8hi) __B,2129(__v8hi) __W,2130(__mmask8) __U);2131}21322133static __inline__ __m128i __DEFAULT_FN_ATTRS2134_mm_maskz_mulhi_epi16 (__mmask8 __U, __m128i __A, __m128i __B) {2135return (__m128i) __builtin_ia32_pmulhw128_mask ((__v8hi) __A,2136(__v8hi) __B,2137(__v8hi) _mm_setzero_si128(),2138(__mmask8) __U);2139}21402141static __inline__ __m256i __DEFAULT_FN_ATTRS2142_mm256_mask_mulhi_epi16 (__m256i __W, __mmask16 __U, __m256i __A,2143__m256i __B) {2144return (__m256i) __builtin_ia32_pmulhw256_mask ((__v16hi) __A,2145(__v16hi) __B,2146(__v16hi) __W,2147(__mmask16) __U);2148}21492150static __inline__ __m256i __DEFAULT_FN_ATTRS2151_mm256_maskz_mulhi_epi16 (__mmask16 __U, __m256i __A, __m256i __B) {2152return (__m256i) __builtin_ia32_pmulhw256_mask ((__v16hi) __A,2153(__v16hi) __B,2154(__v16hi) _mm256_setzero_si256(),2155(__mmask16) __U);2156}21572158static __inline__ __m128i __DEFAULT_FN_ATTRS2159_mm_mask_unpackhi_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {2160return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,2161(__v16qi)_mm_unpackhi_epi8(__A, __B),2162(__v16qi)__W);2163}21642165static __inline__ __m128i __DEFAULT_FN_ATTRS2166_mm_maskz_unpackhi_epi8(__mmask16 __U, 
__m128i __A, __m128i __B) {2167return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,2168(__v16qi)_mm_unpackhi_epi8(__A, __B),2169(__v16qi)_mm_setzero_si128());2170}21712172static __inline__ __m256i __DEFAULT_FN_ATTRS2173_mm256_mask_unpackhi_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {2174return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,2175(__v32qi)_mm256_unpackhi_epi8(__A, __B),2176(__v32qi)__W);2177}21782179static __inline__ __m256i __DEFAULT_FN_ATTRS2180_mm256_maskz_unpackhi_epi8(__mmask32 __U, __m256i __A, __m256i __B) {2181return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,2182(__v32qi)_mm256_unpackhi_epi8(__A, __B),2183(__v32qi)_mm256_setzero_si256());2184}21852186static __inline__ __m128i __DEFAULT_FN_ATTRS2187_mm_mask_unpackhi_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {2188return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,2189(__v8hi)_mm_unpackhi_epi16(__A, __B),2190(__v8hi)__W);2191}21922193static __inline__ __m128i __DEFAULT_FN_ATTRS2194_mm_maskz_unpackhi_epi16(__mmask8 __U, __m128i __A, __m128i __B) {2195return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,2196(__v8hi)_mm_unpackhi_epi16(__A, __B),2197(__v8hi) _mm_setzero_si128());2198}21992200static __inline__ __m256i __DEFAULT_FN_ATTRS2201_mm256_mask_unpackhi_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {2202return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,2203(__v16hi)_mm256_unpackhi_epi16(__A, __B),2204(__v16hi)__W);2205}22062207static __inline__ __m256i __DEFAULT_FN_ATTRS2208_mm256_maskz_unpackhi_epi16(__mmask16 __U, __m256i __A, __m256i __B) {2209return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,2210(__v16hi)_mm256_unpackhi_epi16(__A, __B),2211(__v16hi)_mm256_setzero_si256());2212}22132214static __inline__ __m128i __DEFAULT_FN_ATTRS2215_mm_mask_unpacklo_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {2216return 
(__m128i)__builtin_ia32_selectb_128((__mmask16)__U,2217(__v16qi)_mm_unpacklo_epi8(__A, __B),2218(__v16qi)__W);2219}22202221static __inline__ __m128i __DEFAULT_FN_ATTRS2222_mm_maskz_unpacklo_epi8(__mmask16 __U, __m128i __A, __m128i __B) {2223return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,2224(__v16qi)_mm_unpacklo_epi8(__A, __B),2225(__v16qi)_mm_setzero_si128());2226}22272228static __inline__ __m256i __DEFAULT_FN_ATTRS2229_mm256_mask_unpacklo_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {2230return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,2231(__v32qi)_mm256_unpacklo_epi8(__A, __B),2232(__v32qi)__W);2233}22342235static __inline__ __m256i __DEFAULT_FN_ATTRS2236_mm256_maskz_unpacklo_epi8(__mmask32 __U, __m256i __A, __m256i __B) {2237return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,2238(__v32qi)_mm256_unpacklo_epi8(__A, __B),2239(__v32qi)_mm256_setzero_si256());2240}22412242static __inline__ __m128i __DEFAULT_FN_ATTRS2243_mm_mask_unpacklo_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {2244return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,2245(__v8hi)_mm_unpacklo_epi16(__A, __B),2246(__v8hi)__W);2247}22482249static __inline__ __m128i __DEFAULT_FN_ATTRS2250_mm_maskz_unpacklo_epi16(__mmask8 __U, __m128i __A, __m128i __B) {2251return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,2252(__v8hi)_mm_unpacklo_epi16(__A, __B),2253(__v8hi) _mm_setzero_si128());2254}22552256static __inline__ __m256i __DEFAULT_FN_ATTRS2257_mm256_mask_unpacklo_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {2258return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,2259(__v16hi)_mm256_unpacklo_epi16(__A, __B),2260(__v16hi)__W);2261}22622263static __inline__ __m256i __DEFAULT_FN_ATTRS2264_mm256_maskz_unpacklo_epi16(__mmask16 __U, __m256i __A, __m256i __B) {2265return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,2266(__v16hi)_mm256_unpacklo_epi16(__A, __B),2267(__v16hi)_mm256_setzero_si256());2268}22692270static 
__inline__ __m128i __DEFAULT_FN_ATTRS2271_mm_mask_cvtepi8_epi16 (__m128i __W, __mmask32 __U, __m128i __A)2272{2273return (__m128i) __builtin_ia32_pmovsxbw128_mask ((__v16qi) __A,2274(__v8hi) __W,2275(__mmask8) __U);2276}22772278static __inline__ __m128i __DEFAULT_FN_ATTRS2279_mm_maskz_cvtepi8_epi16 (__mmask8 __U, __m128i __A)2280{2281return (__m128i) __builtin_ia32_pmovsxbw128_mask ((__v16qi) __A,2282(__v8hi)2283_mm_setzero_si128 (),2284(__mmask8) __U);2285}22862287static __inline__ __m256i __DEFAULT_FN_ATTRS2288_mm256_mask_cvtepi8_epi16 (__m256i __W, __mmask32 __U, __m128i __A)2289{2290return (__m256i) __builtin_ia32_pmovsxbw256_mask ((__v16qi) __A,2291(__v16hi) __W,2292(__mmask16) __U);2293}22942295static __inline__ __m256i __DEFAULT_FN_ATTRS2296_mm256_maskz_cvtepi8_epi16 (__mmask16 __U, __m128i __A)2297{2298return (__m256i) __builtin_ia32_pmovsxbw256_mask ((__v16qi) __A,2299(__v16hi)2300_mm256_setzero_si256 (),2301(__mmask16) __U);2302}230323042305static __inline__ __m128i __DEFAULT_FN_ATTRS2306_mm_mask_cvtepu8_epi16 (__m128i __W, __mmask32 __U, __m128i __A)2307{2308return (__m128i) __builtin_ia32_pmovzxbw128_mask ((__v16qi) __A,2309(__v8hi) __W,2310(__mmask8) __U);2311}23122313static __inline__ __m128i __DEFAULT_FN_ATTRS2314_mm_maskz_cvtepu8_epi16 (__mmask8 __U, __m128i __A)2315{2316return (__m128i) __builtin_ia32_pmovzxbw128_mask ((__v16qi) __A,2317(__v8hi)2318_mm_setzero_si128 (),2319(__mmask8) __U);2320}23212322static __inline__ __m256i __DEFAULT_FN_ATTRS2323_mm256_mask_cvtepu8_epi16 (__m256i __W, __mmask32 __U, __m128i __A)2324{2325return (__m256i) __builtin_ia32_pmovzxbw256_mask ((__v16qi) __A,2326(__v16hi) __W,2327(__mmask16) __U);2328}23292330static __inline__ __m256i __DEFAULT_FN_ATTRS2331_mm256_maskz_cvtepu8_epi16 (__mmask16 __U, __m128i __A)2332{2333return (__m256i) __builtin_ia32_pmovzxbw256_mask ((__v16qi) __A,2334(__v16hi)2335_mm256_setzero_si256 (),2336(__mmask16) __U);2337}233823392340#define _mm_cmp_epi8_mask(a, b, p) __extension__ ({ 
\2341(__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)(__m128i)(a), \2342(__v16qi)(__m128i)(b), (int)(p), \2343(__mmask16)-1); })23442345#define _mm_mask_cmp_epi8_mask(m, a, b, p) __extension__ ({ \2346(__mmask16)__builtin_ia32_cmpb128_mask((__v16qi)(__m128i)(a), \2347(__v16qi)(__m128i)(b), (int)(p), \2348(__mmask16)(m)); })23492350#define _mm_cmp_epu8_mask(a, b, p) __extension__ ({ \2351(__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)(__m128i)(a), \2352(__v16qi)(__m128i)(b), (int)(p), \2353(__mmask16)-1); })23542355#define _mm_mask_cmp_epu8_mask(m, a, b, p) __extension__ ({ \2356(__mmask16)__builtin_ia32_ucmpb128_mask((__v16qi)(__m128i)(a), \2357(__v16qi)(__m128i)(b), (int)(p), \2358(__mmask16)(m)); })23592360#define _mm256_cmp_epi8_mask(a, b, p) __extension__ ({ \2361(__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)(__m256i)(a), \2362(__v32qi)(__m256i)(b), (int)(p), \2363(__mmask32)-1); })23642365#define _mm256_mask_cmp_epi8_mask(m, a, b, p) __extension__ ({ \2366(__mmask32)__builtin_ia32_cmpb256_mask((__v32qi)(__m256i)(a), \2367(__v32qi)(__m256i)(b), (int)(p), \2368(__mmask32)(m)); })23692370#define _mm256_cmp_epu8_mask(a, b, p) __extension__ ({ \2371(__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)(__m256i)(a), \2372(__v32qi)(__m256i)(b), (int)(p), \2373(__mmask32)-1); })23742375#define _mm256_mask_cmp_epu8_mask(m, a, b, p) __extension__ ({ \2376(__mmask32)__builtin_ia32_ucmpb256_mask((__v32qi)(__m256i)(a), \2377(__v32qi)(__m256i)(b), (int)(p), \2378(__mmask32)(m)); })23792380#define _mm_cmp_epi16_mask(a, b, p) __extension__ ({ \2381(__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)(__m128i)(a), \2382(__v8hi)(__m128i)(b), (int)(p), \2383(__mmask8)-1); })23842385#define _mm_mask_cmp_epi16_mask(m, a, b, p) __extension__ ({ \2386(__mmask8)__builtin_ia32_cmpw128_mask((__v8hi)(__m128i)(a), \2387(__v8hi)(__m128i)(b), (int)(p), \2388(__mmask8)(m)); })23892390#define _mm_cmp_epu16_mask(a, b, p) __extension__ ({ 
\2391(__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)(__m128i)(a), \2392(__v8hi)(__m128i)(b), (int)(p), \2393(__mmask8)-1); })23942395#define _mm_mask_cmp_epu16_mask(m, a, b, p) __extension__ ({ \2396(__mmask8)__builtin_ia32_ucmpw128_mask((__v8hi)(__m128i)(a), \2397(__v8hi)(__m128i)(b), (int)(p), \2398(__mmask8)(m)); })23992400#define _mm256_cmp_epi16_mask(a, b, p) __extension__ ({ \2401(__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)(__m256i)(a), \2402(__v16hi)(__m256i)(b), (int)(p), \2403(__mmask16)-1); })24042405#define _mm256_mask_cmp_epi16_mask(m, a, b, p) __extension__ ({ \2406(__mmask16)__builtin_ia32_cmpw256_mask((__v16hi)(__m256i)(a), \2407(__v16hi)(__m256i)(b), (int)(p), \2408(__mmask16)(m)); })24092410#define _mm256_cmp_epu16_mask(a, b, p) __extension__ ({ \2411(__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)(__m256i)(a), \2412(__v16hi)(__m256i)(b), (int)(p), \2413(__mmask16)-1); })24142415#define _mm256_mask_cmp_epu16_mask(m, a, b, p) __extension__ ({ \2416(__mmask16)__builtin_ia32_ucmpw256_mask((__v16hi)(__m256i)(a), \2417(__v16hi)(__m256i)(b), (int)(p), \2418(__mmask16)(m)); })24192420#define _mm_mask_shufflehi_epi16(W, U, A, imm) __extension__ ({ \2421(__m128i)__builtin_ia32_selectw_128((__mmask8)(U), \2422(__v8hi)_mm_shufflehi_epi16((A), (imm)), \2423(__v8hi)(__m128i)(W)); })24242425#define _mm_maskz_shufflehi_epi16(U, A, imm) __extension__ ({ \2426(__m128i)__builtin_ia32_selectw_128((__mmask8)(U), \2427(__v8hi)_mm_shufflehi_epi16((A), (imm)), \2428(__v8hi)_mm_setzero_hi()); })24292430#define _mm256_mask_shufflehi_epi16(W, U, A, imm) __extension__ ({ \2431(__m256i)__builtin_ia32_selectw_256((__mmask16)(U), \2432(__v16hi)_mm256_shufflehi_epi16((A), (imm)), \2433(__v16hi)(__m256i)(W)); })24342435#define _mm256_maskz_shufflehi_epi16(U, A, imm) __extension__ ({ \2436(__m256i)__builtin_ia32_selectw_256((__mmask16)(U), \2437(__v16hi)_mm256_shufflehi_epi16((A), (imm)), \2438(__v16hi)_mm256_setzero_si256()); })24392440#define _mm_mask_shufflelo_epi16(W, U, 
A, imm) __extension__ ({ \2441(__m128i)__builtin_ia32_selectw_128((__mmask8)(U), \2442(__v8hi)_mm_shufflelo_epi16((A), (imm)), \2443(__v8hi)(__m128i)(W)); })24442445#define _mm_maskz_shufflelo_epi16(U, A, imm) __extension__ ({ \2446(__m128i)__builtin_ia32_selectw_128((__mmask8)(U), \2447(__v8hi)_mm_shufflelo_epi16((A), (imm)), \2448(__v8hi)_mm_setzero_hi()); })24492450#define _mm256_mask_shufflelo_epi16(W, U, A, imm) __extension__ ({ \2451(__m256i)__builtin_ia32_selectw_256((__mmask16)(U), \2452(__v16hi)_mm256_shufflelo_epi16((A), \2453(imm)), \2454(__v16hi)(__m256i)(W)); })24552456#define _mm256_maskz_shufflelo_epi16(U, A, imm) __extension__ ({ \2457(__m256i)__builtin_ia32_selectw_256((__mmask16)(U), \2458(__v16hi)_mm256_shufflelo_epi16((A), \2459(imm)), \2460(__v16hi)_mm256_setzero_si256()); })24612462static __inline__ __m256i __DEFAULT_FN_ATTRS2463_mm256_sllv_epi16 (__m256i __A, __m256i __B)2464{2465return (__m256i) __builtin_ia32_psllv16hi_mask ((__v16hi) __A,2466(__v16hi) __B,2467(__v16hi)2468_mm256_setzero_si256 (),2469(__mmask16) -1);2470}24712472static __inline__ __m256i __DEFAULT_FN_ATTRS2473_mm256_mask_sllv_epi16 (__m256i __W, __mmask16 __U, __m256i __A,2474__m256i __B)2475{2476return (__m256i) __builtin_ia32_psllv16hi_mask ((__v16hi) __A,2477(__v16hi) __B,2478(__v16hi) __W,2479(__mmask16) __U);2480}24812482static __inline__ __m256i __DEFAULT_FN_ATTRS2483_mm256_maskz_sllv_epi16 (__mmask16 __U, __m256i __A, __m256i __B)2484{2485return (__m256i) __builtin_ia32_psllv16hi_mask ((__v16hi) __A,2486(__v16hi) __B,2487(__v16hi)2488_mm256_setzero_si256 (),2489(__mmask16) __U);2490}24912492static __inline__ __m128i __DEFAULT_FN_ATTRS2493_mm_sllv_epi16 (__m128i __A, __m128i __B)2494{2495return (__m128i) __builtin_ia32_psllv8hi_mask ((__v8hi) __A,2496(__v8hi) __B,2497(__v8hi)2498_mm_setzero_hi (),2499(__mmask8) -1);2500}25012502static __inline__ __m128i __DEFAULT_FN_ATTRS2503_mm_mask_sllv_epi16 (__m128i __W, __mmask8 __U, __m128i __A,2504__m128i __B)2505{2506return 
(__m128i) __builtin_ia32_psllv8hi_mask ((__v8hi) __A,2507(__v8hi) __B,2508(__v8hi) __W,2509(__mmask8) __U);2510}25112512static __inline__ __m128i __DEFAULT_FN_ATTRS2513_mm_maskz_sllv_epi16 (__mmask8 __U, __m128i __A, __m128i __B)2514{2515return (__m128i) __builtin_ia32_psllv8hi_mask ((__v8hi) __A,2516(__v8hi) __B,2517(__v8hi)2518_mm_setzero_si128 (),2519(__mmask8) __U);2520}25212522static __inline__ __m128i __DEFAULT_FN_ATTRS2523_mm_mask_sll_epi16 (__m128i __W, __mmask8 __U, __m128i __A,2524__m128i __B)2525{2526return (__m128i) __builtin_ia32_psllw128_mask ((__v8hi) __A,2527(__v8hi) __B,2528(__v8hi) __W,2529(__mmask8) __U);2530}25312532static __inline__ __m128i __DEFAULT_FN_ATTRS2533_mm_maskz_sll_epi16 (__mmask8 __U, __m128i __A, __m128i __B)2534{2535return (__m128i) __builtin_ia32_psllw128_mask ((__v8hi) __A,2536(__v8hi) __B,2537(__v8hi)2538_mm_setzero_si128 (),2539(__mmask8) __U);2540}25412542static __inline__ __m256i __DEFAULT_FN_ATTRS2543_mm256_mask_sll_epi16 (__m256i __W, __mmask16 __U, __m256i __A,2544__m128i __B)2545{2546return (__m256i) __builtin_ia32_psllw256_mask ((__v16hi) __A,2547(__v8hi) __B,2548(__v16hi) __W,2549(__mmask16) __U);2550}25512552static __inline__ __m256i __DEFAULT_FN_ATTRS2553_mm256_maskz_sll_epi16 (__mmask16 __U, __m256i __A, __m128i __B)2554{2555return (__m256i) __builtin_ia32_psllw256_mask ((__v16hi) __A,2556(__v8hi) __B,2557(__v16hi)2558_mm256_setzero_si256 (),2559(__mmask16) __U);2560}25612562#define _mm_mask_slli_epi16(W, U, A, B) __extension__ ({ \2563(__m128i)__builtin_ia32_psllwi128_mask((__v8hi)(__m128i)(A), (int)(B), \2564(__v8hi)(__m128i)(W), \2565(__mmask8)(U)); })25662567#define _mm_maskz_slli_epi16(U, A, B) __extension__ ({ \2568(__m128i)__builtin_ia32_psllwi128_mask((__v8hi)(__m128i)(A), (int)(B), \2569(__v8hi)_mm_setzero_si128(), \2570(__mmask8)(U)); })25712572#define _mm256_mask_slli_epi16(W, U, A, B) __extension__ ({ \2573(__m256i)__builtin_ia32_psllwi256_mask((__v16hi)(__m256i)(A), (int)(B), \2574(__v16hi)(__m256i)(W), 
\2575(__mmask16)(U)); })25762577#define _mm256_maskz_slli_epi16(U, A, B) __extension__ ({ \2578(__m256i)__builtin_ia32_psllwi256_mask((__v16hi)(__m256i)(A), (int)(B), \2579(__v16hi)_mm256_setzero_si256(), \2580(__mmask16)(U)); })2581258225832584static __inline__ __m256i __DEFAULT_FN_ATTRS2585_mm256_srlv_epi16 (__m256i __A, __m256i __B)2586{2587return (__m256i) __builtin_ia32_psrlv16hi_mask ((__v16hi) __A,2588(__v16hi) __B,2589(__v16hi)2590_mm256_setzero_si256 (),2591(__mmask16) -1);2592}25932594static __inline__ __m256i __DEFAULT_FN_ATTRS2595_mm256_mask_srlv_epi16 (__m256i __W, __mmask16 __U, __m256i __A,2596__m256i __B)2597{2598return (__m256i) __builtin_ia32_psrlv16hi_mask ((__v16hi) __A,2599(__v16hi) __B,2600(__v16hi) __W,2601(__mmask16) __U);2602}26032604static __inline__ __m256i __DEFAULT_FN_ATTRS2605_mm256_maskz_srlv_epi16 (__mmask16 __U, __m256i __A, __m256i __B)2606{2607return (__m256i) __builtin_ia32_psrlv16hi_mask ((__v16hi) __A,2608(__v16hi) __B,2609(__v16hi)2610_mm256_setzero_si256 (),2611(__mmask16) __U);2612}26132614static __inline__ __m128i __DEFAULT_FN_ATTRS2615_mm_srlv_epi16 (__m128i __A, __m128i __B)2616{2617return (__m128i) __builtin_ia32_psrlv8hi_mask ((__v8hi) __A,2618(__v8hi) __B,2619(__v8hi)2620_mm_setzero_hi (),2621(__mmask8) -1);2622}26232624static __inline__ __m128i __DEFAULT_FN_ATTRS2625_mm_mask_srlv_epi16 (__m128i __W, __mmask8 __U, __m128i __A,2626__m128i __B)2627{2628return (__m128i) __builtin_ia32_psrlv8hi_mask ((__v8hi) __A,2629(__v8hi) __B,2630(__v8hi) __W,2631(__mmask8) __U);2632}26332634static __inline__ __m128i __DEFAULT_FN_ATTRS2635_mm_maskz_srlv_epi16 (__mmask8 __U, __m128i __A, __m128i __B)2636{2637return (__m128i) __builtin_ia32_psrlv8hi_mask ((__v8hi) __A,2638(__v8hi) __B,2639(__v8hi)2640_mm_setzero_si128 (),2641(__mmask8) __U);2642}26432644static __inline__ __m256i __DEFAULT_FN_ATTRS2645_mm256_srav_epi16 (__m256i __A, __m256i __B)2646{2647return (__m256i) __builtin_ia32_psrav16hi_mask ((__v16hi) __A,2648(__v16hi) 
__B,2649(__v16hi)2650_mm256_setzero_si256 (),2651(__mmask16) -1);2652}26532654static __inline__ __m256i __DEFAULT_FN_ATTRS2655_mm256_mask_srav_epi16 (__m256i __W, __mmask16 __U, __m256i __A,2656__m256i __B)2657{2658return (__m256i) __builtin_ia32_psrav16hi_mask ((__v16hi) __A,2659(__v16hi) __B,2660(__v16hi) __W,2661(__mmask16) __U);2662}26632664static __inline__ __m256i __DEFAULT_FN_ATTRS2665_mm256_maskz_srav_epi16 (__mmask16 __U, __m256i __A, __m256i __B)2666{2667return (__m256i) __builtin_ia32_psrav16hi_mask ((__v16hi) __A,2668(__v16hi) __B,2669(__v16hi)2670_mm256_setzero_si256 (),2671(__mmask16) __U);2672}26732674static __inline__ __m128i __DEFAULT_FN_ATTRS2675_mm_srav_epi16 (__m128i __A, __m128i __B)2676{2677return (__m128i) __builtin_ia32_psrav8hi_mask ((__v8hi) __A,2678(__v8hi) __B,2679(__v8hi)2680_mm_setzero_hi (),2681(__mmask8) -1);2682}26832684static __inline__ __m128i __DEFAULT_FN_ATTRS2685_mm_mask_srav_epi16 (__m128i __W, __mmask8 __U, __m128i __A,2686__m128i __B)2687{2688return (__m128i) __builtin_ia32_psrav8hi_mask ((__v8hi) __A,2689(__v8hi) __B,2690(__v8hi) __W,2691(__mmask8) __U);2692}26932694static __inline__ __m128i __DEFAULT_FN_ATTRS2695_mm_maskz_srav_epi16 (__mmask8 __U, __m128i __A, __m128i __B)2696{2697return (__m128i) __builtin_ia32_psrav8hi_mask ((__v8hi) __A,2698(__v8hi) __B,2699(__v8hi)2700_mm_setzero_si128 (),2701(__mmask8) __U);2702}27032704static __inline__ __m128i __DEFAULT_FN_ATTRS2705_mm_mask_sra_epi16 (__m128i __W, __mmask8 __U, __m128i __A,2706__m128i __B)2707{2708return (__m128i) __builtin_ia32_psraw128_mask ((__v8hi) __A,2709(__v8hi) __B,2710(__v8hi) __W,2711(__mmask8) __U);2712}27132714static __inline__ __m128i __DEFAULT_FN_ATTRS2715_mm_maskz_sra_epi16 (__mmask8 __U, __m128i __A, __m128i __B)2716{2717return (__m128i) __builtin_ia32_psraw128_mask ((__v8hi) __A,2718(__v8hi) __B,2719(__v8hi)2720_mm_setzero_si128 (),2721(__mmask8) __U);2722}27232724static __inline__ __m256i __DEFAULT_FN_ATTRS2725_mm256_mask_sra_epi16 (__m256i __W, 
__mmask16 __U, __m256i __A,2726__m128i __B)2727{2728return (__m256i) __builtin_ia32_psraw256_mask ((__v16hi) __A,2729(__v8hi) __B,2730(__v16hi) __W,2731(__mmask16) __U);2732}27332734static __inline__ __m256i __DEFAULT_FN_ATTRS2735_mm256_maskz_sra_epi16 (__mmask16 __U, __m256i __A, __m128i __B)2736{2737return (__m256i) __builtin_ia32_psraw256_mask ((__v16hi) __A,2738(__v8hi) __B,2739(__v16hi)2740_mm256_setzero_si256 (),2741(__mmask16) __U);2742}27432744#define _mm_mask_srai_epi16(W, U, A, imm) __extension__ ({ \2745(__m128i)__builtin_ia32_psrawi128_mask((__v8hi)(__m128i)(A), (int)(imm), \2746(__v8hi)(__m128i)(W), \2747(__mmask8)(U)); })27482749#define _mm_maskz_srai_epi16(U, A, imm) __extension__ ({ \2750(__m128i)__builtin_ia32_psrawi128_mask((__v8hi)(__m128i)(A), (int)(imm), \2751(__v8hi)_mm_setzero_si128(), \2752(__mmask8)(U)); })27532754#define _mm256_mask_srai_epi16(W, U, A, imm) __extension__ ({ \2755(__m256i)__builtin_ia32_psrawi256_mask((__v16hi)(__m256i)(A), (int)(imm), \2756(__v16hi)(__m256i)(W), \2757(__mmask16)(U)); })27582759#define _mm256_maskz_srai_epi16(U, A, imm) __extension__ ({ \2760(__m256i)__builtin_ia32_psrawi256_mask((__v16hi)(__m256i)(A), (int)(imm), \2761(__v16hi)_mm256_setzero_si256(), \2762(__mmask16)(U)); })27632764static __inline__ __m128i __DEFAULT_FN_ATTRS2765_mm_mask_srl_epi16 (__m128i __W, __mmask8 __U, __m128i __A,2766__m128i __B)2767{2768return (__m128i) __builtin_ia32_psrlw128_mask ((__v8hi) __A,2769(__v8hi) __B,2770(__v8hi) __W,2771(__mmask8) __U);2772}27732774static __inline__ __m128i __DEFAULT_FN_ATTRS2775_mm_maskz_srl_epi16 (__mmask8 __U, __m128i __A, __m128i __B)2776{2777return (__m128i) __builtin_ia32_psrlw128_mask ((__v8hi) __A,2778(__v8hi) __B,2779(__v8hi)2780_mm_setzero_si128 (),2781(__mmask8) __U);2782}27832784static __inline__ __m256i __DEFAULT_FN_ATTRS2785_mm256_mask_srl_epi16 (__m256i __W, __mmask16 __U, __m256i __A,2786__m128i __B)2787{2788return (__m256i) __builtin_ia32_psrlw256_mask ((__v16hi) __A,2789(__v8hi) 
__B,2790(__v16hi) __W,2791(__mmask16) __U);2792}27932794static __inline__ __m256i __DEFAULT_FN_ATTRS2795_mm256_maskz_srl_epi16 (__mmask16 __U, __m256i __A, __m128i __B)2796{2797return (__m256i) __builtin_ia32_psrlw256_mask ((__v16hi) __A,2798(__v8hi) __B,2799(__v16hi)2800_mm256_setzero_si256 (),2801(__mmask16) __U);2802}28032804#define _mm_mask_srli_epi16(W, U, A, imm) __extension__ ({ \2805(__m128i)__builtin_ia32_psrlwi128_mask((__v8hi)(__m128i)(A), (int)(imm), \2806(__v8hi)(__m128i)(W), \2807(__mmask8)(U)); })28082809#define _mm_maskz_srli_epi16(U, A, imm) __extension__ ({ \2810(__m128i)__builtin_ia32_psrlwi128_mask((__v8hi)(__m128i)(A), (int)(imm), \2811(__v8hi)_mm_setzero_si128(), \2812(__mmask8)(U)); })28132814#define _mm256_mask_srli_epi16(W, U, A, imm) __extension__ ({ \2815(__m256i)__builtin_ia32_psrlwi256_mask((__v16hi)(__m256i)(A), (int)(imm), \2816(__v16hi)(__m256i)(W), \2817(__mmask16)(U)); })28182819#define _mm256_maskz_srli_epi16(U, A, imm) __extension__ ({ \2820(__m256i)__builtin_ia32_psrlwi256_mask((__v16hi)(__m256i)(A), (int)(imm), \2821(__v16hi)_mm256_setzero_si256(), \2822(__mmask16)(U)); })28232824static __inline__ __m128i __DEFAULT_FN_ATTRS2825_mm_mask_mov_epi16 (__m128i __W, __mmask8 __U, __m128i __A)2826{2827return (__m128i) __builtin_ia32_selectw_128 ((__mmask8) __U,2828(__v8hi) __A,2829(__v8hi) __W);2830}28312832static __inline__ __m128i __DEFAULT_FN_ATTRS2833_mm_maskz_mov_epi16 (__mmask8 __U, __m128i __A)2834{2835return (__m128i) __builtin_ia32_selectw_128 ((__mmask8) __U,2836(__v8hi) __A,2837(__v8hi) _mm_setzero_hi ());2838}28392840static __inline__ __m256i __DEFAULT_FN_ATTRS2841_mm256_mask_mov_epi16 (__m256i __W, __mmask16 __U, __m256i __A)2842{2843return (__m256i) __builtin_ia32_selectw_256 ((__mmask16) __U,2844(__v16hi) __A,2845(__v16hi) __W);2846}28472848static __inline__ __m256i __DEFAULT_FN_ATTRS2849_mm256_maskz_mov_epi16 (__mmask16 __U, __m256i __A)2850{2851return (__m256i) __builtin_ia32_selectw_256 ((__mmask16) __U,2852(__v16hi) 
__A,2853(__v16hi) _mm256_setzero_si256 ());2854}28552856static __inline__ __m128i __DEFAULT_FN_ATTRS2857_mm_mask_mov_epi8 (__m128i __W, __mmask16 __U, __m128i __A)2858{2859return (__m128i) __builtin_ia32_selectb_128 ((__mmask16) __U,2860(__v16qi) __A,2861(__v16qi) __W);2862}28632864static __inline__ __m128i __DEFAULT_FN_ATTRS2865_mm_maskz_mov_epi8 (__mmask16 __U, __m128i __A)2866{2867return (__m128i) __builtin_ia32_selectb_128 ((__mmask16) __U,2868(__v16qi) __A,2869(__v16qi) _mm_setzero_hi ());2870}28712872static __inline__ __m256i __DEFAULT_FN_ATTRS2873_mm256_mask_mov_epi8 (__m256i __W, __mmask32 __U, __m256i __A)2874{2875return (__m256i) __builtin_ia32_selectb_256 ((__mmask32) __U,2876(__v32qi) __A,2877(__v32qi) __W);2878}28792880static __inline__ __m256i __DEFAULT_FN_ATTRS2881_mm256_maskz_mov_epi8 (__mmask32 __U, __m256i __A)2882{2883return (__m256i) __builtin_ia32_selectb_256 ((__mmask32) __U,2884(__v32qi) __A,2885(__v32qi) _mm256_setzero_si256 ());2886}288728882889static __inline__ __m128i __DEFAULT_FN_ATTRS2890_mm_mask_set1_epi8 (__m128i __O, __mmask16 __M, char __A)2891{2892return (__m128i) __builtin_ia32_pbroadcastb128_gpr_mask (__A,2893(__v16qi) __O,2894__M);2895}28962897static __inline__ __m128i __DEFAULT_FN_ATTRS2898_mm_maskz_set1_epi8 (__mmask16 __M, char __A)2899{2900return (__m128i) __builtin_ia32_pbroadcastb128_gpr_mask (__A,2901(__v16qi)2902_mm_setzero_si128 (),2903__M);2904}29052906static __inline__ __m256i __DEFAULT_FN_ATTRS2907_mm256_mask_set1_epi8 (__m256i __O, __mmask32 __M, char __A)2908{2909return (__m256i) __builtin_ia32_pbroadcastb256_gpr_mask (__A,2910(__v32qi) __O,2911__M);2912}29132914static __inline__ __m256i __DEFAULT_FN_ATTRS2915_mm256_maskz_set1_epi8 (__mmask32 __M, char __A)2916{2917return (__m256i) __builtin_ia32_pbroadcastb256_gpr_mask (__A,2918(__v32qi)2919_mm256_setzero_si256 (),2920__M);2921}29222923static __inline__ __m128i __DEFAULT_FN_ATTRS2924_mm_mask_loadu_epi16 (__m128i __W, __mmask8 __U, void const *__P)2925{2926return 
(__m128i) __builtin_ia32_loaddquhi128_mask ((__v8hi *) __P,2927(__v8hi) __W,2928(__mmask8) __U);2929}29302931static __inline__ __m128i __DEFAULT_FN_ATTRS2932_mm_maskz_loadu_epi16 (__mmask8 __U, void const *__P)2933{2934return (__m128i) __builtin_ia32_loaddquhi128_mask ((__v8hi *) __P,2935(__v8hi)2936_mm_setzero_hi (),2937(__mmask8) __U);2938}29392940static __inline__ __m256i __DEFAULT_FN_ATTRS2941_mm256_mask_loadu_epi16 (__m256i __W, __mmask16 __U, void const *__P)2942{2943return (__m256i) __builtin_ia32_loaddquhi256_mask ((__v16hi *) __P,2944(__v16hi) __W,2945(__mmask16) __U);2946}29472948static __inline__ __m256i __DEFAULT_FN_ATTRS2949_mm256_maskz_loadu_epi16 (__mmask16 __U, void const *__P)2950{2951return (__m256i) __builtin_ia32_loaddquhi256_mask ((__v16hi *) __P,2952(__v16hi)2953_mm256_setzero_si256 (),2954(__mmask16) __U);2955}29562957static __inline__ __m128i __DEFAULT_FN_ATTRS2958_mm_mask_loadu_epi8 (__m128i __W, __mmask16 __U, void const *__P)2959{2960return (__m128i) __builtin_ia32_loaddquqi128_mask ((__v16qi *) __P,2961(__v16qi) __W,2962(__mmask16) __U);2963}29642965static __inline__ __m128i __DEFAULT_FN_ATTRS2966_mm_maskz_loadu_epi8 (__mmask16 __U, void const *__P)2967{2968return (__m128i) __builtin_ia32_loaddquqi128_mask ((__v16qi *) __P,2969(__v16qi)2970_mm_setzero_si128 (),2971(__mmask16) __U);2972}29732974static __inline__ __m256i __DEFAULT_FN_ATTRS2975_mm256_mask_loadu_epi8 (__m256i __W, __mmask32 __U, void const *__P)2976{2977return (__m256i) __builtin_ia32_loaddquqi256_mask ((__v32qi *) __P,2978(__v32qi) __W,2979(__mmask32) __U);2980}29812982static __inline__ __m256i __DEFAULT_FN_ATTRS2983_mm256_maskz_loadu_epi8 (__mmask32 __U, void const *__P)2984{2985return (__m256i) __builtin_ia32_loaddquqi256_mask ((__v32qi *) __P,2986(__v32qi)2987_mm256_setzero_si256 (),2988(__mmask32) __U);2989}2990static __inline__ void __DEFAULT_FN_ATTRS2991_mm_mask_storeu_epi16 (void *__P, __mmask8 __U, __m128i __A)2992{2993__builtin_ia32_storedquhi128_mask ((__v8hi *) 
__P,2994(__v8hi) __A,2995(__mmask8) __U);2996}29972998static __inline__ void __DEFAULT_FN_ATTRS2999_mm256_mask_storeu_epi16 (void *__P, __mmask16 __U, __m256i __A)3000{3001__builtin_ia32_storedquhi256_mask ((__v16hi *) __P,3002(__v16hi) __A,3003(__mmask16) __U);3004}30053006static __inline__ void __DEFAULT_FN_ATTRS3007_mm_mask_storeu_epi8 (void *__P, __mmask16 __U, __m128i __A)3008{3009__builtin_ia32_storedquqi128_mask ((__v16qi *) __P,3010(__v16qi) __A,3011(__mmask16) __U);3012}30133014static __inline__ void __DEFAULT_FN_ATTRS3015_mm256_mask_storeu_epi8 (void *__P, __mmask32 __U, __m256i __A)3016{3017__builtin_ia32_storedquqi256_mask ((__v32qi *) __P,3018(__v32qi) __A,3019(__mmask32) __U);3020}30213022static __inline__ __mmask16 __DEFAULT_FN_ATTRS3023_mm_test_epi8_mask (__m128i __A, __m128i __B)3024{3025return (__mmask16) __builtin_ia32_ptestmb128 ((__v16qi) __A,3026(__v16qi) __B,3027(__mmask16) -1);3028}30293030static __inline__ __mmask16 __DEFAULT_FN_ATTRS3031_mm_mask_test_epi8_mask (__mmask16 __U, __m128i __A, __m128i __B)3032{3033return (__mmask16) __builtin_ia32_ptestmb128 ((__v16qi) __A,3034(__v16qi) __B, __U);3035}30363037static __inline__ __mmask32 __DEFAULT_FN_ATTRS3038_mm256_test_epi8_mask (__m256i __A, __m256i __B)3039{3040return (__mmask32) __builtin_ia32_ptestmb256 ((__v32qi) __A,3041(__v32qi) __B,3042(__mmask32) -1);3043}30443045static __inline__ __mmask32 __DEFAULT_FN_ATTRS3046_mm256_mask_test_epi8_mask (__mmask32 __U, __m256i __A, __m256i __B)3047{3048return (__mmask32) __builtin_ia32_ptestmb256 ((__v32qi) __A,3049(__v32qi) __B, __U);3050}30513052static __inline__ __mmask8 __DEFAULT_FN_ATTRS3053_mm_test_epi16_mask (__m128i __A, __m128i __B)3054{3055return (__mmask8) __builtin_ia32_ptestmw128 ((__v8hi) __A,3056(__v8hi) __B,3057(__mmask8) -1);3058}30593060static __inline__ __mmask8 __DEFAULT_FN_ATTRS3061_mm_mask_test_epi16_mask (__mmask8 __U, __m128i __A, __m128i __B)3062{3063return (__mmask8) __builtin_ia32_ptestmw128 ((__v8hi) __A,3064(__v8hi) __B, 
__U);3065}30663067static __inline__ __mmask16 __DEFAULT_FN_ATTRS3068_mm256_test_epi16_mask (__m256i __A, __m256i __B)3069{3070return (__mmask16) __builtin_ia32_ptestmw256 ((__v16hi) __A,3071(__v16hi) __B,3072(__mmask16) -1);3073}30743075static __inline__ __mmask16 __DEFAULT_FN_ATTRS3076_mm256_mask_test_epi16_mask (__mmask16 __U, __m256i __A, __m256i __B)3077{3078return (__mmask16) __builtin_ia32_ptestmw256 ((__v16hi) __A,3079(__v16hi) __B, __U);3080}30813082static __inline__ __mmask16 __DEFAULT_FN_ATTRS3083_mm_testn_epi8_mask (__m128i __A, __m128i __B)3084{3085return (__mmask16) __builtin_ia32_ptestnmb128 ((__v16qi) __A,3086(__v16qi) __B,3087(__mmask16) -1);3088}30893090static __inline__ __mmask16 __DEFAULT_FN_ATTRS3091_mm_mask_testn_epi8_mask (__mmask16 __U, __m128i __A, __m128i __B)3092{3093return (__mmask16) __builtin_ia32_ptestnmb128 ((__v16qi) __A,3094(__v16qi) __B, __U);3095}30963097static __inline__ __mmask32 __DEFAULT_FN_ATTRS3098_mm256_testn_epi8_mask (__m256i __A, __m256i __B)3099{3100return (__mmask32) __builtin_ia32_ptestnmb256 ((__v32qi) __A,3101(__v32qi) __B,3102(__mmask32) -1);3103}31043105static __inline__ __mmask32 __DEFAULT_FN_ATTRS3106_mm256_mask_testn_epi8_mask (__mmask32 __U, __m256i __A, __m256i __B)3107{3108return (__mmask32) __builtin_ia32_ptestnmb256 ((__v32qi) __A,3109(__v32qi) __B, __U);3110}31113112static __inline__ __mmask8 __DEFAULT_FN_ATTRS3113_mm_testn_epi16_mask (__m128i __A, __m128i __B)3114{3115return (__mmask8) __builtin_ia32_ptestnmw128 ((__v8hi) __A,3116(__v8hi) __B,3117(__mmask8) -1);3118}31193120static __inline__ __mmask8 __DEFAULT_FN_ATTRS3121_mm_mask_testn_epi16_mask (__mmask8 __U, __m128i __A, __m128i __B)3122{3123return (__mmask8) __builtin_ia32_ptestnmw128 ((__v8hi) __A,3124(__v8hi) __B, __U);3125}31263127static __inline__ __mmask16 __DEFAULT_FN_ATTRS3128_mm256_testn_epi16_mask (__m256i __A, __m256i __B)3129{3130return (__mmask16) __builtin_ia32_ptestnmw256 ((__v16hi) __A,3131(__v16hi) __B,3132(__mmask16) 
-1);3133}31343135static __inline__ __mmask16 __DEFAULT_FN_ATTRS3136_mm256_mask_testn_epi16_mask (__mmask16 __U, __m256i __A, __m256i __B)3137{3138return (__mmask16) __builtin_ia32_ptestnmw256 ((__v16hi) __A,3139(__v16hi) __B, __U);3140}31413142static __inline__ __mmask16 __DEFAULT_FN_ATTRS3143_mm_movepi8_mask (__m128i __A)3144{3145return (__mmask16) __builtin_ia32_cvtb2mask128 ((__v16qi) __A);3146}31473148static __inline__ __mmask32 __DEFAULT_FN_ATTRS3149_mm256_movepi8_mask (__m256i __A)3150{3151return (__mmask32) __builtin_ia32_cvtb2mask256 ((__v32qi) __A);3152}31533154static __inline__ __mmask8 __DEFAULT_FN_ATTRS3155_mm_movepi16_mask (__m128i __A)3156{3157return (__mmask8) __builtin_ia32_cvtw2mask128 ((__v8hi) __A);3158}31593160static __inline__ __mmask16 __DEFAULT_FN_ATTRS3161_mm256_movepi16_mask (__m256i __A)3162{3163return (__mmask16) __builtin_ia32_cvtw2mask256 ((__v16hi) __A);3164}31653166static __inline__ __m128i __DEFAULT_FN_ATTRS3167_mm_movm_epi8 (__mmask16 __A)3168{3169return (__m128i) __builtin_ia32_cvtmask2b128 (__A);3170}31713172static __inline__ __m256i __DEFAULT_FN_ATTRS3173_mm256_movm_epi8 (__mmask32 __A)3174{3175return (__m256i) __builtin_ia32_cvtmask2b256 (__A);3176}31773178static __inline__ __m128i __DEFAULT_FN_ATTRS3179_mm_movm_epi16 (__mmask8 __A)3180{3181return (__m128i) __builtin_ia32_cvtmask2w128 (__A);3182}31833184static __inline__ __m256i __DEFAULT_FN_ATTRS3185_mm256_movm_epi16 (__mmask16 __A)3186{3187return (__m256i) __builtin_ia32_cvtmask2w256 (__A);3188}31893190static __inline__ __m128i __DEFAULT_FN_ATTRS3191_mm_mask_broadcastb_epi8 (__m128i __O, __mmask16 __M, __m128i __A)3192{3193return (__m128i)__builtin_ia32_selectb_128(__M,3194(__v16qi) _mm_broadcastb_epi8(__A),3195(__v16qi) __O);3196}31973198static __inline__ __m128i __DEFAULT_FN_ATTRS3199_mm_maskz_broadcastb_epi8 (__mmask16 __M, __m128i __A)3200{3201return (__m128i)__builtin_ia32_selectb_128(__M,3202(__v16qi) _mm_broadcastb_epi8(__A),3203(__v16qi) 
_mm_setzero_si128());3204}32053206static __inline__ __m256i __DEFAULT_FN_ATTRS3207_mm256_mask_broadcastb_epi8 (__m256i __O, __mmask32 __M, __m128i __A)3208{3209return (__m256i)__builtin_ia32_selectb_256(__M,3210(__v32qi) _mm256_broadcastb_epi8(__A),3211(__v32qi) __O);3212}32133214static __inline__ __m256i __DEFAULT_FN_ATTRS3215_mm256_maskz_broadcastb_epi8 (__mmask32 __M, __m128i __A)3216{3217return (__m256i)__builtin_ia32_selectb_256(__M,3218(__v32qi) _mm256_broadcastb_epi8(__A),3219(__v32qi) _mm256_setzero_si256());3220}32213222static __inline__ __m128i __DEFAULT_FN_ATTRS3223_mm_mask_broadcastw_epi16 (__m128i __O, __mmask8 __M, __m128i __A)3224{3225return (__m128i)__builtin_ia32_selectw_128(__M,3226(__v8hi) _mm_broadcastw_epi16(__A),3227(__v8hi) __O);3228}32293230static __inline__ __m128i __DEFAULT_FN_ATTRS3231_mm_maskz_broadcastw_epi16 (__mmask8 __M, __m128i __A)3232{3233return (__m128i)__builtin_ia32_selectw_128(__M,3234(__v8hi) _mm_broadcastw_epi16(__A),3235(__v8hi) _mm_setzero_si128());3236}32373238static __inline__ __m256i __DEFAULT_FN_ATTRS3239_mm256_mask_broadcastw_epi16 (__m256i __O, __mmask16 __M, __m128i __A)3240{3241return (__m256i)__builtin_ia32_selectw_256(__M,3242(__v16hi) _mm256_broadcastw_epi16(__A),3243(__v16hi) __O);3244}32453246static __inline__ __m256i __DEFAULT_FN_ATTRS3247_mm256_maskz_broadcastw_epi16 (__mmask16 __M, __m128i __A)3248{3249return (__m256i)__builtin_ia32_selectw_256(__M,3250(__v16hi) _mm256_broadcastw_epi16(__A),3251(__v16hi) _mm256_setzero_si256());3252}32533254static __inline__ __m256i __DEFAULT_FN_ATTRS3255_mm256_mask_set1_epi16 (__m256i __O, __mmask16 __M, short __A)3256{3257return (__m256i) __builtin_ia32_pbroadcastw256_gpr_mask (__A,3258(__v16hi) __O,3259__M);3260}32613262static __inline__ __m256i __DEFAULT_FN_ATTRS3263_mm256_maskz_set1_epi16 (__mmask16 __M, short __A)3264{3265return (__m256i) __builtin_ia32_pbroadcastw256_gpr_mask (__A,3266(__v16hi) _mm256_setzero_si256 (),3267__M);3268}32693270static __inline__ __m128i 
__DEFAULT_FN_ATTRS3271_mm_mask_set1_epi16 (__m128i __O, __mmask8 __M, short __A)3272{3273return (__m128i) __builtin_ia32_pbroadcastw128_gpr_mask (__A,3274(__v8hi) __O,3275__M);3276}32773278static __inline__ __m128i __DEFAULT_FN_ATTRS3279_mm_maskz_set1_epi16 (__mmask8 __M, short __A)3280{3281return (__m128i) __builtin_ia32_pbroadcastw128_gpr_mask (__A,3282(__v8hi) _mm_setzero_si128 (),3283__M);3284}32853286static __inline__ __m128i __DEFAULT_FN_ATTRS3287_mm_permutexvar_epi16 (__m128i __A, __m128i __B)3288{3289return (__m128i) __builtin_ia32_permvarhi128_mask ((__v8hi) __B,3290(__v8hi) __A,3291(__v8hi) _mm_undefined_si128 (),3292(__mmask8) -1);3293}32943295static __inline__ __m128i __DEFAULT_FN_ATTRS3296_mm_maskz_permutexvar_epi16 (__mmask8 __M, __m128i __A, __m128i __B)3297{3298return (__m128i) __builtin_ia32_permvarhi128_mask ((__v8hi) __B,3299(__v8hi) __A,3300(__v8hi) _mm_setzero_si128 (),3301(__mmask8) __M);3302}33033304static __inline__ __m128i __DEFAULT_FN_ATTRS3305_mm_mask_permutexvar_epi16 (__m128i __W, __mmask8 __M, __m128i __A,3306__m128i __B)3307{3308return (__m128i) __builtin_ia32_permvarhi128_mask ((__v8hi) __B,3309(__v8hi) __A,3310(__v8hi) __W,3311(__mmask8) __M);3312}33133314static __inline__ __m256i __DEFAULT_FN_ATTRS3315_mm256_permutexvar_epi16 (__m256i __A, __m256i __B)3316{3317return (__m256i) __builtin_ia32_permvarhi256_mask ((__v16hi) __B,3318(__v16hi) __A,3319(__v16hi) _mm256_undefined_si256 (),3320(__mmask16) -1);3321}33223323static __inline__ __m256i __DEFAULT_FN_ATTRS3324_mm256_maskz_permutexvar_epi16 (__mmask16 __M, __m256i __A,3325__m256i __B)3326{3327return (__m256i) __builtin_ia32_permvarhi256_mask ((__v16hi) __B,3328(__v16hi) __A,3329(__v16hi) _mm256_setzero_si256 (),3330(__mmask16) __M);3331}33323333static __inline__ __m256i __DEFAULT_FN_ATTRS3334_mm256_mask_permutexvar_epi16 (__m256i __W, __mmask16 __M, __m256i __A,3335__m256i __B)3336{3337return (__m256i) __builtin_ia32_permvarhi256_mask ((__v16hi) __B,3338(__v16hi) __A,3339(__v16hi) 
__W,3340(__mmask16) __M);3341}33423343#define _mm_mask_alignr_epi8(W, U, A, B, N) __extension__ ({ \3344(__m128i)__builtin_ia32_palignr128_mask((__v16qi)(__m128i)(A), \3345(__v16qi)(__m128i)(B), (int)(N), \3346(__v16qi)(__m128i)(W), \3347(__mmask16)(U)); })33483349#define _mm_maskz_alignr_epi8(U, A, B, N) __extension__ ({ \3350(__m128i)__builtin_ia32_palignr128_mask((__v16qi)(__m128i)(A), \3351(__v16qi)(__m128i)(B), (int)(N), \3352(__v16qi)_mm_setzero_si128(), \3353(__mmask16)(U)); })33543355#define _mm256_mask_alignr_epi8(W, U, A, B, N) __extension__ ({ \3356(__m256i)__builtin_ia32_palignr256_mask((__v32qi)(__m256i)(A), \3357(__v32qi)(__m256i)(B), (int)(N), \3358(__v32qi)(__m256i)(W), \3359(__mmask32)(U)); })33603361#define _mm256_maskz_alignr_epi8(U, A, B, N) __extension__ ({ \3362(__m256i)__builtin_ia32_palignr256_mask((__v32qi)(__m256i)(A), \3363(__v32qi)(__m256i)(B), (int)(N), \3364(__v32qi)_mm256_setzero_si256(), \3365(__mmask32)(U)); })33663367#define _mm_dbsad_epu8(A, B, imm) __extension__ ({ \3368(__m128i)__builtin_ia32_dbpsadbw128_mask((__v16qi)(__m128i)(A), \3369(__v16qi)(__m128i)(B), (int)(imm), \3370(__v8hi)_mm_setzero_hi(), \3371(__mmask8)-1); })33723373#define _mm_mask_dbsad_epu8(W, U, A, B, imm) __extension__ ({ \3374(__m128i)__builtin_ia32_dbpsadbw128_mask((__v16qi)(__m128i)(A), \3375(__v16qi)(__m128i)(B), (int)(imm), \3376(__v8hi)(__m128i)(W), \3377(__mmask8)(U)); })33783379#define _mm_maskz_dbsad_epu8(U, A, B, imm) __extension__ ({ \3380(__m128i)__builtin_ia32_dbpsadbw128_mask((__v16qi)(__m128i)(A), \3381(__v16qi)(__m128i)(B), (int)(imm), \3382(__v8hi)_mm_setzero_si128(), \3383(__mmask8)(U)); })33843385#define _mm256_dbsad_epu8(A, B, imm) __extension__ ({ \3386(__m256i)__builtin_ia32_dbpsadbw256_mask((__v32qi)(__m256i)(A), \3387(__v32qi)(__m256i)(B), (int)(imm), \3388(__v16hi)_mm256_setzero_si256(), \3389(__mmask16)-1); })33903391#define _mm256_mask_dbsad_epu8(W, U, A, B, imm) __extension__ ({ 
\3392(__m256i)__builtin_ia32_dbpsadbw256_mask((__v32qi)(__m256i)(A), \3393(__v32qi)(__m256i)(B), (int)(imm), \3394(__v16hi)(__m256i)(W), \3395(__mmask16)(U)); })33963397#define _mm256_maskz_dbsad_epu8(U, A, B, imm) __extension__ ({ \3398(__m256i)__builtin_ia32_dbpsadbw256_mask((__v32qi)(__m256i)(A), \3399(__v32qi)(__m256i)(B), (int)(imm), \3400(__v16hi)_mm256_setzero_si256(), \3401(__mmask16)(U)); })34023403#undef __DEFAULT_FN_ATTRS34043405#endif /* __AVX512VLBWINTRIN_H */340634073408