Path: blob/master/tools/android-sdk/renderscript/clang-include/avx512vlintrin.h
496 views
/*===---- avx512vlintrin.h - AVX512VL intrinsics ---------------------------===1*2* Permission is hereby granted, free of charge, to any person obtaining a copy3* of this software and associated documentation files (the "Software"), to deal4* in the Software without restriction, including without limitation the rights5* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell6* copies of the Software, and to permit persons to whom the Software is7* furnished to do so, subject to the following conditions:8*9* The above copyright notice and this permission notice shall be included in10* all copies or substantial portions of the Software.11*12* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR13* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,14* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE15* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER16* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,17* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN18* THE SOFTWARE.19*20*===-----------------------------------------------------------------------===21*/2223#ifndef __IMMINTRIN_H24#error "Never use <avx512vlintrin.h> directly; include <immintrin.h> instead."25#endif2627#ifndef __AVX512VLINTRIN_H28#define __AVX512VLINTRIN_H2930#define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__, __target__("avx512vl")))3132/* Doesn't require avx512vl, used in avx512dqintrin.h */33static __inline __m128i __attribute__((__always_inline__, __nodebug__, __target__("avx512f")))34_mm_setzero_di(void) {35return (__m128i)(__v2di){ 0LL, 0LL};36}3738/* Integer compare */3940static __inline__ __mmask8 __DEFAULT_FN_ATTRS41_mm_cmpeq_epi32_mask(__m128i __a, __m128i __b) {42return (__mmask8)__builtin_ia32_pcmpeqd128_mask((__v4si)__a, (__v4si)__b,43(__mmask8)-1);44}4546static __inline__ __mmask8 __DEFAULT_FN_ATTRS47_mm_mask_cmpeq_epi32_mask(__mmask8 __u, __m128i __a, __m128i __b) {48return (__mmask8)__builtin_ia32_pcmpeqd128_mask((__v4si)__a, (__v4si)__b,49__u);50}5152static __inline__ __mmask8 __DEFAULT_FN_ATTRS53_mm_cmpeq_epu32_mask(__m128i __a, __m128i __b) {54return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 0,55(__mmask8)-1);56}5758static __inline__ __mmask8 __DEFAULT_FN_ATTRS59_mm_mask_cmpeq_epu32_mask(__mmask8 __u, __m128i __a, __m128i __b) {60return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 0,61__u);62}6364static __inline__ __mmask8 __DEFAULT_FN_ATTRS65_mm256_cmpeq_epi32_mask(__m256i __a, __m256i __b) {66return (__mmask8)__builtin_ia32_pcmpeqd256_mask((__v8si)__a, (__v8si)__b,67(__mmask8)-1);68}6970static __inline__ __mmask8 __DEFAULT_FN_ATTRS71_mm256_mask_cmpeq_epi32_mask(__mmask8 __u, __m256i __a, __m256i __b) {72return (__mmask8)__builtin_ia32_pcmpeqd256_mask((__v8si)__a, (__v8si)__b,73__u);74}7576static __inline__ __mmask8 __DEFAULT_FN_ATTRS77_mm256_cmpeq_epu32_mask(__m256i __a, __m256i __b) {78return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 0,79(__mmask8)-1);80}8182static __inline__ __mmask8 __DEFAULT_FN_ATTRS83_mm256_mask_cmpeq_epu32_mask(__mmask8 __u, __m256i __a, __m256i __b) {84return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 0,85__u);86}8788static __inline__ __mmask8 __DEFAULT_FN_ATTRS89_mm_cmpeq_epi64_mask(__m128i __a, __m128i __b) {90return (__mmask8)__builtin_ia32_pcmpeqq128_mask((__v2di)__a, (__v2di)__b,91(__mmask8)-1);92}9394static __inline__ __mmask8 __DEFAULT_FN_ATTRS95_mm_mask_cmpeq_epi64_mask(__mmask8 __u, __m128i __a, __m128i __b) {96return (__mmask8)__builtin_ia32_pcmpeqq128_mask((__v2di)__a, (__v2di)__b,97__u);98}99100static __inline__ __mmask8 __DEFAULT_FN_ATTRS101_mm_cmpeq_epu64_mask(__m128i __a, __m128i __b) {102return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 0,103(__mmask8)-1);104}105106static __inline__ __mmask8 __DEFAULT_FN_ATTRS107_mm_mask_cmpeq_epu64_mask(__mmask8 __u, __m128i __a, __m128i __b) {108return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 0,109__u);110}111112static __inline__ __mmask8 __DEFAULT_FN_ATTRS113_mm256_cmpeq_epi64_mask(__m256i __a, __m256i __b) {114return (__mmask8)__builtin_ia32_pcmpeqq256_mask((__v4di)__a, (__v4di)__b,115(__mmask8)-1);116}117118static __inline__ __mmask8 __DEFAULT_FN_ATTRS119_mm256_mask_cmpeq_epi64_mask(__mmask8 __u, __m256i __a, __m256i __b) {120return (__mmask8)__builtin_ia32_pcmpeqq256_mask((__v4di)__a, (__v4di)__b,121__u);122}123124static __inline__ __mmask8 __DEFAULT_FN_ATTRS125_mm256_cmpeq_epu64_mask(__m256i __a, __m256i __b) {126return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 0,127(__mmask8)-1);128}129130static __inline__ __mmask8 __DEFAULT_FN_ATTRS131_mm256_mask_cmpeq_epu64_mask(__mmask8 __u, __m256i __a, __m256i __b) {132return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 0,133__u);134}135136137static __inline__ __mmask8 __DEFAULT_FN_ATTRS138_mm_cmpge_epi32_mask(__m128i __a, __m128i __b) {139return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 5,140(__mmask8)-1);141}142143static __inline__ __mmask8 __DEFAULT_FN_ATTRS144_mm_mask_cmpge_epi32_mask(__mmask8 __u, __m128i __a, __m128i __b) {145return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 5,146__u);147}148149static __inline__ __mmask8 __DEFAULT_FN_ATTRS150_mm_cmpge_epu32_mask(__m128i __a, __m128i __b) {151return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 5,152(__mmask8)-1);153}154155static __inline__ __mmask8 __DEFAULT_FN_ATTRS156_mm_mask_cmpge_epu32_mask(__mmask8 __u, __m128i __a, __m128i __b) {157return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 5,158__u);159}160161static __inline__ __mmask8 __DEFAULT_FN_ATTRS162_mm256_cmpge_epi32_mask(__m256i __a, __m256i __b) {163return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 5,164(__mmask8)-1);165}166167static __inline__ __mmask8 __DEFAULT_FN_ATTRS168_mm256_mask_cmpge_epi32_mask(__mmask8 __u, __m256i __a, __m256i __b) {169return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 5,170__u);171}172173static __inline__ __mmask8 __DEFAULT_FN_ATTRS174_mm256_cmpge_epu32_mask(__m256i __a, __m256i __b) {175return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 5,176(__mmask8)-1);177}178179static __inline__ __mmask8 __DEFAULT_FN_ATTRS180_mm256_mask_cmpge_epu32_mask(__mmask8 __u, __m256i __a, __m256i __b) {181return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 5,182__u);183}184185static __inline__ __mmask8 __DEFAULT_FN_ATTRS186_mm_cmpge_epi64_mask(__m128i __a, __m128i __b) {187return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 5,188(__mmask8)-1);189}190191static __inline__ __mmask8 __DEFAULT_FN_ATTRS192_mm_mask_cmpge_epi64_mask(__mmask8 __u, __m128i __a, __m128i __b) {193return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 5,194__u);195}196197static __inline__ __mmask8 __DEFAULT_FN_ATTRS198_mm_cmpge_epu64_mask(__m128i __a, __m128i __b) {199return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 5,200(__mmask8)-1);201}202203static __inline__ __mmask8 __DEFAULT_FN_ATTRS204_mm_mask_cmpge_epu64_mask(__mmask8 __u, __m128i __a, __m128i __b) {205return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 5,206__u);207}208209static __inline__ __mmask8 __DEFAULT_FN_ATTRS210_mm256_cmpge_epi64_mask(__m256i __a, __m256i __b) {211return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 5,212(__mmask8)-1);213}214215static __inline__ __mmask8 __DEFAULT_FN_ATTRS216_mm256_mask_cmpge_epi64_mask(__mmask8 __u, __m256i __a, __m256i __b) {217return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 5,218__u);219}220221static __inline__ __mmask8 __DEFAULT_FN_ATTRS222_mm256_cmpge_epu64_mask(__m256i __a, __m256i __b) {223return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 5,224(__mmask8)-1);225}226227static __inline__ __mmask8 __DEFAULT_FN_ATTRS228_mm256_mask_cmpge_epu64_mask(__mmask8 __u, __m256i __a, __m256i __b) {229return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 5,230__u);231}232233static __inline__ __mmask8 __DEFAULT_FN_ATTRS234_mm_cmpgt_epi32_mask(__m128i __a, __m128i __b) {235return (__mmask8)__builtin_ia32_pcmpgtd128_mask((__v4si)__a, (__v4si)__b,236(__mmask8)-1);237}238239static __inline__ __mmask8 __DEFAULT_FN_ATTRS240_mm_mask_cmpgt_epi32_mask(__mmask8 __u, __m128i __a, __m128i __b) {241return (__mmask8)__builtin_ia32_pcmpgtd128_mask((__v4si)__a, (__v4si)__b,242__u);243}244245static __inline__ __mmask8 __DEFAULT_FN_ATTRS246_mm_cmpgt_epu32_mask(__m128i __a, __m128i __b) {247return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 6,248(__mmask8)-1);249}250251static __inline__ __mmask8 __DEFAULT_FN_ATTRS252_mm_mask_cmpgt_epu32_mask(__mmask8 __u, __m128i __a, __m128i __b) {253return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 6,254__u);255}256257static __inline__ __mmask8 __DEFAULT_FN_ATTRS258_mm256_cmpgt_epi32_mask(__m256i __a, __m256i __b) {259return (__mmask8)__builtin_ia32_pcmpgtd256_mask((__v8si)__a, (__v8si)__b,260(__mmask8)-1);261}262263static __inline__ __mmask8 __DEFAULT_FN_ATTRS264_mm256_mask_cmpgt_epi32_mask(__mmask8 __u, __m256i __a, __m256i __b) {265return (__mmask8)__builtin_ia32_pcmpgtd256_mask((__v8si)__a, (__v8si)__b,266__u);267}268269static __inline__ __mmask8 __DEFAULT_FN_ATTRS270_mm256_cmpgt_epu32_mask(__m256i __a, __m256i __b) {271return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 6,272(__mmask8)-1);273}274275static __inline__ __mmask8 __DEFAULT_FN_ATTRS276_mm256_mask_cmpgt_epu32_mask(__mmask8 __u, __m256i __a, __m256i __b) {277return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 6,278__u);279}280281static __inline__ __mmask8 __DEFAULT_FN_ATTRS282_mm_cmpgt_epi64_mask(__m128i __a, __m128i __b) {283return (__mmask8)__builtin_ia32_pcmpgtq128_mask((__v2di)__a, (__v2di)__b,284(__mmask8)-1);285}286287static __inline__ __mmask8 __DEFAULT_FN_ATTRS288_mm_mask_cmpgt_epi64_mask(__mmask8 __u, __m128i __a, __m128i __b) {289return (__mmask8)__builtin_ia32_pcmpgtq128_mask((__v2di)__a, (__v2di)__b,290__u);291}292293static __inline__ __mmask8 __DEFAULT_FN_ATTRS294_mm_cmpgt_epu64_mask(__m128i __a, __m128i __b) {295return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 6,296(__mmask8)-1);297}298299static __inline__ __mmask8 __DEFAULT_FN_ATTRS300_mm_mask_cmpgt_epu64_mask(__mmask8 __u, __m128i __a, __m128i __b) {301return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 6,302__u);303}304305static __inline__ __mmask8 __DEFAULT_FN_ATTRS306_mm256_cmpgt_epi64_mask(__m256i __a, __m256i __b) {307return (__mmask8)__builtin_ia32_pcmpgtq256_mask((__v4di)__a, (__v4di)__b,308(__mmask8)-1);309}310311static __inline__ __mmask8 __DEFAULT_FN_ATTRS312_mm256_mask_cmpgt_epi64_mask(__mmask8 __u, __m256i __a, __m256i __b) {313return (__mmask8)__builtin_ia32_pcmpgtq256_mask((__v4di)__a, (__v4di)__b,314__u);315}316317static __inline__ __mmask8 __DEFAULT_FN_ATTRS318_mm256_cmpgt_epu64_mask(__m256i __a, __m256i __b) {319return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 6,320(__mmask8)-1);321}322323static __inline__ __mmask8 __DEFAULT_FN_ATTRS324_mm256_mask_cmpgt_epu64_mask(__mmask8 __u, __m256i __a, __m256i __b) {325return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 6,326__u);327}328329static __inline__ __mmask8 __DEFAULT_FN_ATTRS330_mm_cmple_epi32_mask(__m128i __a, __m128i __b) {331return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 2,332(__mmask8)-1);333}334335static __inline__ __mmask8 __DEFAULT_FN_ATTRS336_mm_mask_cmple_epi32_mask(__mmask8 __u, __m128i __a, __m128i __b) {337return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 2,338__u);339}340341static __inline__ __mmask8 __DEFAULT_FN_ATTRS342_mm_cmple_epu32_mask(__m128i __a, __m128i __b) {343return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 2,344(__mmask8)-1);345}346347static __inline__ __mmask8 __DEFAULT_FN_ATTRS348_mm_mask_cmple_epu32_mask(__mmask8 __u, __m128i __a, __m128i __b) {349return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 2,350__u);351}352353static __inline__ __mmask8 __DEFAULT_FN_ATTRS354_mm256_cmple_epi32_mask(__m256i __a, __m256i __b) {355return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 2,356(__mmask8)-1);357}358359static __inline__ __mmask8 __DEFAULT_FN_ATTRS360_mm256_mask_cmple_epi32_mask(__mmask8 __u, __m256i __a, __m256i __b) {361return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 2,362__u);363}364365static __inline__ __mmask8 __DEFAULT_FN_ATTRS366_mm256_cmple_epu32_mask(__m256i __a, __m256i __b) {367return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 2,368(__mmask8)-1);369}370371static __inline__ __mmask8 __DEFAULT_FN_ATTRS372_mm256_mask_cmple_epu32_mask(__mmask8 __u, __m256i __a, __m256i __b) {373return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 2,374__u);375}376377static __inline__ __mmask8 __DEFAULT_FN_ATTRS378_mm_cmple_epi64_mask(__m128i __a, __m128i __b) {379return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 2,380(__mmask8)-1);381}382383static __inline__ __mmask8 __DEFAULT_FN_ATTRS384_mm_mask_cmple_epi64_mask(__mmask8 __u, __m128i __a, __m128i __b) {385return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 2,386__u);387}388389static __inline__ __mmask8 __DEFAULT_FN_ATTRS390_mm_cmple_epu64_mask(__m128i __a, __m128i __b) {391return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 2,392(__mmask8)-1);393}394395static __inline__ __mmask8 __DEFAULT_FN_ATTRS396_mm_mask_cmple_epu64_mask(__mmask8 __u, __m128i __a, __m128i __b) {397return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 2,398__u);399}400401static __inline__ __mmask8 __DEFAULT_FN_ATTRS402_mm256_cmple_epi64_mask(__m256i __a, __m256i __b) {403return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 2,404(__mmask8)-1);405}406407static __inline__ __mmask8 __DEFAULT_FN_ATTRS408_mm256_mask_cmple_epi64_mask(__mmask8 __u, __m256i __a, __m256i __b) {409return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 2,410__u);411}412413static __inline__ __mmask8 __DEFAULT_FN_ATTRS414_mm256_cmple_epu64_mask(__m256i __a, __m256i __b) {415return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 2,416(__mmask8)-1);417}418419static __inline__ __mmask8 __DEFAULT_FN_ATTRS420_mm256_mask_cmple_epu64_mask(__mmask8 __u, __m256i __a, __m256i __b) {421return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 2,422__u);423}424425static __inline__ __mmask8 __DEFAULT_FN_ATTRS426_mm_cmplt_epi32_mask(__m128i __a, __m128i __b) {427return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 1,428(__mmask8)-1);429}430431static __inline__ __mmask8 __DEFAULT_FN_ATTRS432_mm_mask_cmplt_epi32_mask(__mmask8 __u, __m128i __a, __m128i __b) {433return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 1,434__u);435}436437static __inline__ __mmask8 __DEFAULT_FN_ATTRS438_mm_cmplt_epu32_mask(__m128i __a, __m128i __b) {439return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 1,440(__mmask8)-1);441}442443static __inline__ __mmask8 __DEFAULT_FN_ATTRS444_mm_mask_cmplt_epu32_mask(__mmask8 __u, __m128i __a, __m128i __b) {445return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 1,446__u);447}448449static __inline__ __mmask8 __DEFAULT_FN_ATTRS450_mm256_cmplt_epi32_mask(__m256i __a, __m256i __b) {451return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 1,452(__mmask8)-1);453}454455static __inline__ __mmask8 __DEFAULT_FN_ATTRS456_mm256_mask_cmplt_epi32_mask(__mmask8 __u, __m256i __a, __m256i __b) {457return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 1,458__u);459}460461static __inline__ __mmask8 __DEFAULT_FN_ATTRS462_mm256_cmplt_epu32_mask(__m256i __a, __m256i __b) {463return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 1,464(__mmask8)-1);465}466467static __inline__ __mmask8 __DEFAULT_FN_ATTRS468_mm256_mask_cmplt_epu32_mask(__mmask8 __u, __m256i __a, __m256i __b) {469return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 1,470__u);471}472473static __inline__ __mmask8 __DEFAULT_FN_ATTRS474_mm_cmplt_epi64_mask(__m128i __a, __m128i __b) {475return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 1,476(__mmask8)-1);477}478479static __inline__ __mmask8 __DEFAULT_FN_ATTRS480_mm_mask_cmplt_epi64_mask(__mmask8 __u, __m128i __a, __m128i __b) {481return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 1,482__u);483}484485static __inline__ __mmask8 __DEFAULT_FN_ATTRS486_mm_cmplt_epu64_mask(__m128i __a, __m128i __b) {487return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 1,488(__mmask8)-1);489}490491static __inline__ __mmask8 __DEFAULT_FN_ATTRS492_mm_mask_cmplt_epu64_mask(__mmask8 __u, __m128i __a, __m128i __b) {493return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 1,494__u);495}496497static __inline__ __mmask8 __DEFAULT_FN_ATTRS498_mm256_cmplt_epi64_mask(__m256i __a, __m256i __b) {499return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 1,500(__mmask8)-1);501}502503static __inline__ __mmask8 __DEFAULT_FN_ATTRS504_mm256_mask_cmplt_epi64_mask(__mmask8 __u, __m256i __a, __m256i __b) {505return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 1,506__u);507}508509static __inline__ __mmask8 __DEFAULT_FN_ATTRS510_mm256_cmplt_epu64_mask(__m256i __a, __m256i __b) {511return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 1,512(__mmask8)-1);513}514515static __inline__ __mmask8 __DEFAULT_FN_ATTRS516_mm256_mask_cmplt_epu64_mask(__mmask8 __u, __m256i __a, __m256i __b) {517return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 1,518__u);519}520521static __inline__ __mmask8 __DEFAULT_FN_ATTRS522_mm_cmpneq_epi32_mask(__m128i __a, __m128i __b) {523return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 4,524(__mmask8)-1);525}526527static __inline__ __mmask8 __DEFAULT_FN_ATTRS528_mm_mask_cmpneq_epi32_mask(__mmask8 __u, __m128i __a, __m128i __b) {529return (__mmask8)__builtin_ia32_cmpd128_mask((__v4si)__a, (__v4si)__b, 4,530__u);531}532533static __inline__ __mmask8 __DEFAULT_FN_ATTRS534_mm_cmpneq_epu32_mask(__m128i __a, __m128i __b) {535return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 4,536(__mmask8)-1);537}538539static __inline__ __mmask8 __DEFAULT_FN_ATTRS540_mm_mask_cmpneq_epu32_mask(__mmask8 __u, __m128i __a, __m128i __b) {541return (__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)__a, (__v4si)__b, 4,542__u);543}544545static __inline__ __mmask8 __DEFAULT_FN_ATTRS546_mm256_cmpneq_epi32_mask(__m256i __a, __m256i __b) {547return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 4,548(__mmask8)-1);549}550551static __inline__ __mmask8 __DEFAULT_FN_ATTRS552_mm256_mask_cmpneq_epi32_mask(__mmask8 __u, __m256i __a, __m256i __b) {553return (__mmask8)__builtin_ia32_cmpd256_mask((__v8si)__a, (__v8si)__b, 4,554__u);555}556557static __inline__ __mmask8 __DEFAULT_FN_ATTRS558_mm256_cmpneq_epu32_mask(__m256i __a, __m256i __b) {559return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 4,560(__mmask8)-1);561}562563static __inline__ __mmask8 __DEFAULT_FN_ATTRS564_mm256_mask_cmpneq_epu32_mask(__mmask8 __u, __m256i __a, __m256i __b) {565return (__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)__a, (__v8si)__b, 4,566__u);567}568569static __inline__ __mmask8 __DEFAULT_FN_ATTRS570_mm_cmpneq_epi64_mask(__m128i __a, __m128i __b) {571return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 4,572(__mmask8)-1);573}574575static __inline__ __mmask8 __DEFAULT_FN_ATTRS576_mm_mask_cmpneq_epi64_mask(__mmask8 __u, __m128i __a, __m128i __b) {577return (__mmask8)__builtin_ia32_cmpq128_mask((__v2di)__a, (__v2di)__b, 4,578__u);579}580581static __inline__ __mmask8 __DEFAULT_FN_ATTRS582_mm_cmpneq_epu64_mask(__m128i __a, __m128i __b) {583return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 4,584(__mmask8)-1);585}586587static __inline__ __mmask8 __DEFAULT_FN_ATTRS588_mm_mask_cmpneq_epu64_mask(__mmask8 __u, __m128i __a, __m128i __b) {589return (__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)__a, (__v2di)__b, 4,590__u);591}592593static __inline__ __mmask8 __DEFAULT_FN_ATTRS594_mm256_cmpneq_epi64_mask(__m256i __a, __m256i __b) {595return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 4,596(__mmask8)-1);597}598599static __inline__ __mmask8 __DEFAULT_FN_ATTRS600_mm256_mask_cmpneq_epi64_mask(__mmask8 __u, __m256i __a, __m256i __b) {601return (__mmask8)__builtin_ia32_cmpq256_mask((__v4di)__a, (__v4di)__b, 4,602__u);603}604605static __inline__ __mmask8 __DEFAULT_FN_ATTRS606_mm256_cmpneq_epu64_mask(__m256i __a, __m256i __b) {607return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 4,608(__mmask8)-1);609}610611static __inline__ __mmask8 __DEFAULT_FN_ATTRS612_mm256_mask_cmpneq_epu64_mask(__mmask8 __u, __m256i __a, __m256i __b) {613return (__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)__a, (__v4di)__b, 4,614__u);615}616617static __inline__ __m256i __DEFAULT_FN_ATTRS618_mm256_mask_add_epi32 (__m256i __W, __mmask8 __U, __m256i __A,619__m256i __B)620{621return (__m256i) __builtin_ia32_paddd256_mask ((__v8si) __A,622(__v8si) __B,623(__v8si) __W,624(__mmask8) __U);625}626627static __inline__ __m256i __DEFAULT_FN_ATTRS628_mm256_maskz_add_epi32 (__mmask8 __U, __m256i __A, __m256i __B)629{630return (__m256i) __builtin_ia32_paddd256_mask ((__v8si) __A,631(__v8si) __B,632(__v8si)633_mm256_setzero_si256 (),634(__mmask8) __U);635}636637static __inline__ __m256i __DEFAULT_FN_ATTRS638_mm256_mask_add_epi64 (__m256i __W, __mmask8 __U, __m256i __A,639__m256i __B)640{641return (__m256i) __builtin_ia32_paddq256_mask ((__v4di) __A,642(__v4di) __B,643(__v4di) __W,644(__mmask8) __U);645}646647static __inline__ __m256i __DEFAULT_FN_ATTRS648_mm256_maskz_add_epi64 (__mmask8 __U, __m256i __A, __m256i __B)649{650return (__m256i) __builtin_ia32_paddq256_mask ((__v4di) __A,651(__v4di) __B,652(__v4di)653_mm256_setzero_si256 (),654(__mmask8) __U);655}656657static __inline__ __m256i __DEFAULT_FN_ATTRS658_mm256_mask_sub_epi32 (__m256i __W, __mmask8 __U, __m256i __A,659__m256i __B)660{661return (__m256i) __builtin_ia32_psubd256_mask ((__v8si) __A,662(__v8si) __B,663(__v8si) __W,664(__mmask8) __U);665}666667static __inline__ __m256i __DEFAULT_FN_ATTRS668_mm256_maskz_sub_epi32 (__mmask8 __U, __m256i __A, __m256i __B)669{670return (__m256i) __builtin_ia32_psubd256_mask ((__v8si) __A,671(__v8si) __B,672(__v8si)673_mm256_setzero_si256 (),674(__mmask8) __U);675}676677static __inline__ __m256i __DEFAULT_FN_ATTRS678_mm256_mask_sub_epi64 (__m256i __W, __mmask8 __U, __m256i __A,679__m256i __B)680{681return (__m256i) __builtin_ia32_psubq256_mask ((__v4di) __A,682(__v4di) __B,683(__v4di) __W,684(__mmask8) __U);685}686687static __inline__ __m256i __DEFAULT_FN_ATTRS688_mm256_maskz_sub_epi64 (__mmask8 __U, __m256i __A, __m256i __B)689{690return (__m256i) __builtin_ia32_psubq256_mask ((__v4di) __A,691(__v4di) __B,692(__v4di)693_mm256_setzero_si256 (),694(__mmask8) __U);695}696697static __inline__ __m128i __DEFAULT_FN_ATTRS698_mm_mask_add_epi32 (__m128i __W, __mmask8 __U, __m128i __A,699__m128i __B)700{701return (__m128i) __builtin_ia32_paddd128_mask ((__v4si) __A,702(__v4si) __B,703(__v4si) __W,704(__mmask8) __U);705}706707static __inline__ __m128i __DEFAULT_FN_ATTRS708_mm_maskz_add_epi32 (__mmask8 __U, __m128i __A, __m128i __B)709{710return (__m128i) __builtin_ia32_paddd128_mask ((__v4si) __A,711(__v4si) __B,712(__v4si)713_mm_setzero_si128 (),714(__mmask8) __U);715}716717static __inline__ __m128i __DEFAULT_FN_ATTRS718_mm_mask_add_epi64 (__m128i __W, __mmask8 __U, __m128i __A,719__m128i __B)720{721return (__m128i) __builtin_ia32_paddq128_mask ((__v2di) __A,722(__v2di) __B,723(__v2di) __W,724(__mmask8) __U);725}726727static __inline__ __m128i __DEFAULT_FN_ATTRS728_mm_maskz_add_epi64 (__mmask8 __U, __m128i __A, __m128i __B)729{730return (__m128i) __builtin_ia32_paddq128_mask ((__v2di) __A,731(__v2di) __B,732(__v2di)733_mm_setzero_si128 (),734(__mmask8) __U);735}736737static __inline__ __m128i __DEFAULT_FN_ATTRS738_mm_mask_sub_epi32 (__m128i __W, __mmask8 __U, __m128i __A,739__m128i __B)740{741return (__m128i) __builtin_ia32_psubd128_mask ((__v4si) __A,742(__v4si) __B,743(__v4si) __W,744(__mmask8) __U);745}746747static __inline__ __m128i __DEFAULT_FN_ATTRS748_mm_maskz_sub_epi32 (__mmask8 __U, __m128i __A, __m128i __B)749{750return (__m128i) __builtin_ia32_psubd128_mask ((__v4si) __A,751(__v4si) __B,752(__v4si)753_mm_setzero_si128 (),754(__mmask8) __U);755}756757static __inline__ __m128i __DEFAULT_FN_ATTRS758_mm_mask_sub_epi64 (__m128i __W, __mmask8 __U, __m128i __A,759__m128i __B)760{761return (__m128i) __builtin_ia32_psubq128_mask ((__v2di) __A,762(__v2di) __B,763(__v2di) __W,764(__mmask8) __U);765}766767static __inline__ __m128i __DEFAULT_FN_ATTRS768_mm_maskz_sub_epi64 (__mmask8 __U, __m128i __A, __m128i __B)769{770return (__m128i) __builtin_ia32_psubq128_mask ((__v2di) __A,771(__v2di) __B,772(__v2di)773_mm_setzero_si128 (),774(__mmask8) __U);775}776777static __inline__ __m256i __DEFAULT_FN_ATTRS778_mm256_mask_mul_epi32 (__m256i __W, __mmask8 __M, __m256i __X,779__m256i __Y)780{781return (__m256i) __builtin_ia32_pmuldq256_mask ((__v8si) __X,782(__v8si) __Y,783(__v4di) __W, __M);784}785786static __inline__ __m256i __DEFAULT_FN_ATTRS787_mm256_maskz_mul_epi32 (__mmask8 __M, __m256i __X, __m256i __Y)788{789return (__m256i) __builtin_ia32_pmuldq256_mask ((__v8si) __X,790(__v8si) __Y,791(__v4di)792_mm256_setzero_si256 (),793__M);794}795796static __inline__ __m128i __DEFAULT_FN_ATTRS797_mm_mask_mul_epi32 (__m128i __W, __mmask8 __M, __m128i __X,798__m128i __Y)799{800return (__m128i) __builtin_ia32_pmuldq128_mask ((__v4si) __X,801(__v4si) __Y,802(__v2di) __W, __M);803}804805static __inline__ __m128i __DEFAULT_FN_ATTRS806_mm_maskz_mul_epi32 (__mmask8 __M, __m128i __X, __m128i __Y)807{808return (__m128i) __builtin_ia32_pmuldq128_mask ((__v4si) __X,809(__v4si) __Y,810(__v2di)811_mm_setzero_si128 (),812__M);813}814815static __inline__ __m256i __DEFAULT_FN_ATTRS816_mm256_mask_mul_epu32 (__m256i __W, __mmask8 __M, __m256i __X,817__m256i __Y)818{819return (__m256i) __builtin_ia32_pmuludq256_mask ((__v8si) __X,820(__v8si) __Y,821(__v4di) __W, __M);822}823824static __inline__ __m256i __DEFAULT_FN_ATTRS825_mm256_maskz_mul_epu32 (__mmask8 __M, __m256i __X, __m256i __Y)826{827return (__m256i) __builtin_ia32_pmuludq256_mask ((__v8si) __X,828(__v8si) __Y,829(__v4di)830_mm256_setzero_si256 (),831__M);832}833834static __inline__ __m128i __DEFAULT_FN_ATTRS835_mm_mask_mul_epu32 (__m128i __W, __mmask8 __M, __m128i __X,836__m128i __Y)837{838return (__m128i) __builtin_ia32_pmuludq128_mask ((__v4si) __X,839(__v4si) __Y,840(__v2di) __W, __M);841}842843static __inline__ __m128i __DEFAULT_FN_ATTRS844_mm_maskz_mul_epu32 (__mmask8 __M, __m128i __X, __m128i __Y)845{846return (__m128i) __builtin_ia32_pmuludq128_mask ((__v4si) __X,847(__v4si) __Y,848(__v2di)849_mm_setzero_si128 (),850__M);851}852853static __inline__ __m256i __DEFAULT_FN_ATTRS854_mm256_maskz_mullo_epi32 (__mmask8 __M, __m256i __A, __m256i __B)855{856return (__m256i) __builtin_ia32_pmulld256_mask ((__v8si) __A,857(__v8si) __B,858(__v8si)859_mm256_setzero_si256 (),860__M);861}862863static __inline__ __m256i __DEFAULT_FN_ATTRS864_mm256_mask_mullo_epi32 (__m256i __W, __mmask8 __M, __m256i __A,865__m256i __B)866{867return (__m256i) __builtin_ia32_pmulld256_mask ((__v8si) __A,868(__v8si) __B,869(__v8si) __W, __M);870}871872static __inline__ __m128i __DEFAULT_FN_ATTRS873_mm_maskz_mullo_epi32 (__mmask8 __M, __m128i __A, __m128i __B)874{875return (__m128i) __builtin_ia32_pmulld128_mask ((__v4si) __A,876(__v4si) __B,877(__v4si)878_mm_setzero_si128 (),879__M);880}881882static __inline__ __m128i __DEFAULT_FN_ATTRS883_mm_mask_mullo_epi32 (__m128i __W, __mmask16 __M, __m128i __A,884__m128i __B)885{886return (__m128i) __builtin_ia32_pmulld128_mask ((__v4si) __A,887(__v4si) __B,888(__v4si) __W, __M);889}890891static __inline__ __m256i __DEFAULT_FN_ATTRS892_mm256_mask_and_epi32(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)893{894return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,895(__v8si)_mm256_and_si256(__A, __B),896(__v8si)__W);897}898899static __inline__ __m256i __DEFAULT_FN_ATTRS900_mm256_maskz_and_epi32(__mmask8 __U, __m256i __A, __m256i __B)901{902return (__m256i)_mm256_mask_and_epi32(_mm256_setzero_si256(), __U, __A, __B);903}904905static __inline__ __m128i __DEFAULT_FN_ATTRS906_mm_mask_and_epi32(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)907{908return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,909(__v4si)_mm_and_si128(__A, __B),910(__v4si)__W);911}912913static __inline__ __m128i __DEFAULT_FN_ATTRS914_mm_maskz_and_epi32(__mmask8 __U, __m128i __A, __m128i __B)915{916return (__m128i)_mm_mask_and_epi32(_mm_setzero_si128(), __U, __A, __B);917}918919static __inline__ __m256i __DEFAULT_FN_ATTRS920_mm256_mask_andnot_epi32(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)921{922return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,923(__v8si)_mm256_andnot_si256(__A, __B),924(__v8si)__W);925}926927static __inline__ __m256i __DEFAULT_FN_ATTRS928_mm256_maskz_andnot_epi32(__mmask8 __U, __m256i __A, __m256i __B)929{930return (__m256i)_mm256_mask_andnot_epi32(_mm256_setzero_si256(),931__U, __A, __B);932}933934static __inline__ __m128i __DEFAULT_FN_ATTRS935_mm_mask_andnot_epi32(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)936{937return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,938(__v4si)_mm_andnot_si128(__A, __B),939(__v4si)__W);940}941942static __inline__ __m128i __DEFAULT_FN_ATTRS943_mm_maskz_andnot_epi32 (__mmask8 __U, __m128i __A, __m128i __B)944{945return (__m128i)_mm_mask_andnot_epi32(_mm_setzero_si128(), __U, __A, __B);946}947948static __inline__ __m256i __DEFAULT_FN_ATTRS949_mm256_mask_or_epi32 (__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)950{951return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,952(__v8si)_mm256_or_si256(__A, __B),953(__v8si)__W);954}955956static __inline__ __m256i __DEFAULT_FN_ATTRS957_mm256_maskz_or_epi32(__mmask8 __U, __m256i __A, __m256i __B)958{959return (__m256i)_mm256_mask_or_epi32(_mm256_setzero_si256(), __U, __A, __B);960}961962static __inline__ __m128i __DEFAULT_FN_ATTRS963_mm_mask_or_epi32(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)964{965return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,966(__v4si)_mm_or_si128(__A, __B),967(__v4si)__W);968}969970static __inline__ __m128i __DEFAULT_FN_ATTRS971_mm_maskz_or_epi32(__mmask8 __U, __m128i __A, __m128i __B)972{973return (__m128i)_mm_mask_or_epi32(_mm_setzero_si128(), __U, __A, __B);974}975976static __inline__ __m256i __DEFAULT_FN_ATTRS977_mm256_mask_xor_epi32(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)978{979return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,980(__v8si)_mm256_xor_si256(__A, __B),981(__v8si)__W);982}983984static __inline__ __m256i __DEFAULT_FN_ATTRS985_mm256_maskz_xor_epi32(__mmask8 __U, __m256i __A, __m256i __B)986{987return (__m256i)_mm256_mask_xor_epi32(_mm256_setzero_si256(), __U, __A, __B);988}989990static __inline__ __m128i __DEFAULT_FN_ATTRS991_mm_mask_xor_epi32(__m128i __W, __mmask8 __U, __m128i __A,992__m128i __B)993{994return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,995(__v4si)_mm_xor_si128(__A, __B),996(__v4si)__W);997}998999static __inline__ __m128i __DEFAULT_FN_ATTRS1000_mm_maskz_xor_epi32(__mmask8 __U, __m128i __A, __m128i __B)1001{1002return (__m128i)_mm_mask_xor_epi32(_mm_setzero_si128(), __U, __A, __B);1003}10041005static __inline__ __m256i __DEFAULT_FN_ATTRS1006_mm256_mask_and_epi64(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)1007{1008return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,1009(__v4di)_mm256_and_si256(__A, __B),1010(__v4di)__W);1011}10121013static __inline__ __m256i __DEFAULT_FN_ATTRS1014_mm256_maskz_and_epi64(__mmask8 __U, __m256i __A, __m256i __B)1015{1016return (__m256i)_mm256_mask_and_epi64(_mm256_setzero_si256(), __U, __A, __B);1017}10181019static __inline__ __m128i __DEFAULT_FN_ATTRS1020_mm_mask_and_epi64(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)1021{1022return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,1023(__v2di)_mm_and_si128(__A, __B),1024(__v2di)__W);1025}10261027static __inline__ __m128i __DEFAULT_FN_ATTRS1028_mm_maskz_and_epi64(__mmask8 __U, __m128i __A, __m128i __B)1029{1030return (__m128i)_mm_mask_and_epi64(_mm_setzero_si128(), __U, __A, __B);1031}10321033static __inline__ __m256i __DEFAULT_FN_ATTRS1034_mm256_mask_andnot_epi64(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)1035{1036return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,1037(__v4di)_mm256_andnot_si256(__A, __B),1038(__v4di)__W);1039}10401041static __inline__ __m256i __DEFAULT_FN_ATTRS1042_mm256_maskz_andnot_epi64(__mmask8 __U, __m256i __A, __m256i __B)1043{1044return (__m256i)_mm256_mask_andnot_epi64(_mm256_setzero_si256(),1045__U, __A, __B);1046}10471048static __inline__ __m128i __DEFAULT_FN_ATTRS1049_mm_mask_andnot_epi64(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)1050{1051return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,1052(__v2di)_mm_andnot_si128(__A, __B),1053(__v2di)__W);1054}10551056static __inline__ __m128i __DEFAULT_FN_ATTRS1057_mm_maskz_andnot_epi64(__mmask8 __U, __m128i __A, __m128i __B)1058{1059return (__m128i)_mm_mask_andnot_epi64(_mm_setzero_si128(), __U, __A, __B);1060}10611062static __inline__ __m256i __DEFAULT_FN_ATTRS1063_mm256_mask_or_epi64(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)1064{1065return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,1066(__v4di)_mm256_or_si256(__A, __B),1067(__v4di)__W);1068}10691070static __inline__ __m256i __DEFAULT_FN_ATTRS1071_mm256_maskz_or_epi64(__mmask8 __U, __m256i __A, __m256i __B)1072{1073return (__m256i)_mm256_mask_or_epi64(_mm256_setzero_si256(), __U, __A, __B);1074}10751076static __inline__ __m128i __DEFAULT_FN_ATTRS1077_mm_mask_or_epi64(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)1078{1079return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,1080(__v2di)_mm_or_si128(__A, __B),1081(__v2di)__W);1082}10831084static __inline__ __m128i __DEFAULT_FN_ATTRS1085_mm_maskz_or_epi64(__mmask8 __U, __m128i __A, __m128i __B)1086{1087return (__m128i)_mm_mask_or_epi64(_mm_setzero_si128(), __U, __A, __B);1088}10891090static __inline__ __m256i __DEFAULT_FN_ATTRS1091_mm256_mask_xor_epi64(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)1092{1093return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,1094(__v4di)_mm256_xor_si256(__A, __B),1095(__v4di)__W);1096}10971098static __inline__ __m256i __DEFAULT_FN_ATTRS1099_mm256_maskz_xor_epi64(__mmask8 __U, __m256i __A, __m256i __B)1100{1101return (__m256i)_mm256_mask_xor_epi64(_mm256_setzero_si256(), __U, __A, __B);1102}11031104static __inline__ __m128i __DEFAULT_FN_ATTRS1105_mm_mask_xor_epi64(__m128i __W, __mmask8 __U, __m128i __A,1106__m128i __B)1107{1108return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,1109(__v2di)_mm_xor_si128(__A, __B),1110(__v2di)__W);1111}11121113static __inline__ __m128i __DEFAULT_FN_ATTRS1114_mm_maskz_xor_epi64(__mmask8 __U, __m128i __A, __m128i __B)1115{1116return (__m128i)_mm_mask_xor_epi64(_mm_setzero_si128(), __U, __A, __B);1117}11181119#define _mm_cmp_epi32_mask(a, b, p) __extension__ ({ \1120(__mmask8)__builtin_ia32_cmpd128_mask((__v4si)(__m128i)(a), \1121(__v4si)(__m128i)(b), (int)(p), \1122(__mmask8)-1); })11231124#define _mm_mask_cmp_epi32_mask(m, a, b, p) __extension__ ({ \1125(__mmask8)__builtin_ia32_cmpd128_mask((__v4si)(__m128i)(a), \1126(__v4si)(__m128i)(b), (int)(p), \1127(__mmask8)(m)); })11281129#define _mm_cmp_epu32_mask(a, b, p) __extension__ ({ \1130(__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)(__m128i)(a), \1131(__v4si)(__m128i)(b), (int)(p), \1132(__mmask8)-1); })11331134#define _mm_mask_cmp_epu32_mask(m, a, b, p) __extension__ ({ \1135(__mmask8)__builtin_ia32_ucmpd128_mask((__v4si)(__m128i)(a), \1136(__v4si)(__m128i)(b), (int)(p), \1137(__mmask8)(m)); })11381139#define _mm256_cmp_epi32_mask(a, b, p) __extension__ ({ \1140(__mmask8)__builtin_ia32_cmpd256_mask((__v8si)(__m256i)(a), \1141(__v8si)(__m256i)(b), (int)(p), \1142(__mmask8)-1); })11431144#define _mm256_mask_cmp_epi32_mask(m, a, b, p) __extension__ ({ \1145(__mmask8)__builtin_ia32_cmpd256_mask((__v8si)(__m256i)(a), \1146(__v8si)(__m256i)(b), (int)(p), \1147(__mmask8)(m)); })11481149#define _mm256_cmp_epu32_mask(a, b, p) __extension__ ({ \1150(__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)(__m256i)(a), \1151(__v8si)(__m256i)(b), (int)(p), \1152(__mmask8)-1); })11531154#define _mm256_mask_cmp_epu32_mask(m, a, b, p) __extension__ ({ \1155(__mmask8)__builtin_ia32_ucmpd256_mask((__v8si)(__m256i)(a), \1156(__v8si)(__m256i)(b), (int)(p), \1157(__mmask8)(m)); })11581159#define _mm_cmp_epi64_mask(a, b, p) __extension__ ({ \1160(__mmask8)__builtin_ia32_cmpq128_mask((__v2di)(__m128i)(a), \1161(__v2di)(__m128i)(b), (int)(p), \1162(__mmask8)-1); })11631164#define _mm_mask_cmp_epi64_mask(m, a, b, p) __extension__ ({ \1165(__mmask8)__builtin_ia32_cmpq128_mask((__v2di)(__m128i)(a), \1166(__v2di)(__m128i)(b), (int)(p), \1167(__mmask8)(m)); })11681169#define _mm_cmp_epu64_mask(a, b, p) __extension__ ({ \1170(__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)(__m128i)(a), \1171(__v2di)(__m128i)(b), (int)(p), \1172(__mmask8)-1); })11731174#define _mm_mask_cmp_epu64_mask(m, a, b, p) __extension__ ({ \1175(__mmask8)__builtin_ia32_ucmpq128_mask((__v2di)(__m128i)(a), \1176(__v2di)(__m128i)(b), (int)(p), \1177(__mmask8)(m)); })11781179#define _mm256_cmp_epi64_mask(a, b, p) __extension__ ({ \1180(__mmask8)__builtin_ia32_cmpq256_mask((__v4di)(__m256i)(a), \1181(__v4di)(__m256i)(b), (int)(p), \1182(__mmask8)-1); })11831184#define _mm256_mask_cmp_epi64_mask(m, a, b, p) __extension__ ({ \1185(__mmask8)__builtin_ia32_cmpq256_mask((__v4di)(__m256i)(a), \1186(__v4di)(__m256i)(b), (int)(p), \1187(__mmask8)(m)); })11881189#define _mm256_cmp_epu64_mask(a, b, p) __extension__ ({ \1190(__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)(__m256i)(a), \1191(__v4di)(__m256i)(b), (int)(p), \1192(__mmask8)-1); })11931194#define _mm256_mask_cmp_epu64_mask(m, a, b, p) __extension__ ({ \1195(__mmask8)__builtin_ia32_ucmpq256_mask((__v4di)(__m256i)(a), \1196(__v4di)(__m256i)(b), (int)(p), \1197(__mmask8)(m)); })11981199#define _mm256_cmp_ps_mask(a, b, p) __extension__ ({ \1200(__mmask8)__builtin_ia32_cmpps256_mask((__v8sf)(__m256)(a), \1201(__v8sf)(__m256)(b), (int)(p), \1202(__mmask8)-1); })12031204#define _mm256_mask_cmp_ps_mask(m, a, b, p) __extension__ ({ \1205(__mmask8)__builtin_ia32_cmpps256_mask((__v8sf)(__m256)(a), \1206(__v8sf)(__m256)(b), (int)(p), \1207(__mmask8)(m)); })12081209#define _mm256_cmp_pd_mask(a, b, p) __extension__ ({ \1210(__mmask8)__builtin_ia32_cmppd256_mask((__v4df)(__m256d)(a), \1211(__v4df)(__m256d)(b), (int)(p), \1212(__mmask8)-1); })12131214#define _mm256_mask_cmp_pd_mask(m, a, b, p) __extension__ ({ \1215(__mmask8)__builtin_ia32_cmppd256_mask((__v4df)(__m256d)(a), \1216(__v4df)(__m256d)(b), (int)(p), \1217(__mmask8)(m)); })12181219#define _mm_cmp_ps_mask(a, b, p) __extension__ ({ \1220(__mmask8)__builtin_ia32_cmpps128_mask((__v4sf)(__m128)(a), \1221(__v4sf)(__m128)(b), (int)(p), \1222(__mmask8)-1); })12231224#define _mm_mask_cmp_ps_mask(m, a, b, p) __extension__ ({ \1225(__mmask8)__builtin_ia32_cmpps128_mask((__v4sf)(__m128)(a), \1226(__v4sf)(__m128)(b), (int)(p), \1227(__mmask8)(m)); })12281229#define _mm_cmp_pd_mask(a, b, p) __extension__ ({ \1230(__mmask8)__builtin_ia32_cmppd128_mask((__v2df)(__m128d)(a), \1231(__v2df)(__m128d)(b), (int)(p), \1232(__mmask8)-1); })12331234#define _mm_mask_cmp_pd_mask(m, a, b, p) __extension__ ({ \1235(__mmask8)__builtin_ia32_cmppd128_mask((__v2df)(__m128d)(a), \1236(__v2df)(__m128d)(b), (int)(p), \1237(__mmask8)(m)); })12381239static __inline__ __m128d __DEFAULT_FN_ATTRS1240_mm_mask_fmadd_pd(__m128d __A, __mmask8 __U, __m128d __B, __m128d __C)1241{1242return (__m128d) __builtin_ia32_vfmaddpd128_mask ((__v2df) __A,1243(__v2df) __B,1244(__v2df) __C,1245(__mmask8) __U);1246}12471248static __inline__ __m128d __DEFAULT_FN_ATTRS1249_mm_mask3_fmadd_pd(__m128d __A, __m128d __B, __m128d __C, __mmask8 __U)1250{1251return (__m128d) __builtin_ia32_vfmaddpd128_mask3 ((__v2df) __A,1252(__v2df) __B,1253(__v2df) __C,1254(__mmask8) __U);1255}12561257static __inline__ __m128d __DEFAULT_FN_ATTRS1258_mm_maskz_fmadd_pd(__mmask8 __U, __m128d __A, __m128d __B, __m128d __C)1259{1260return (__m128d) __builtin_ia32_vfmaddpd128_maskz ((__v2df) __A,1261(__v2df) __B,1262(__v2df) __C,1263(__mmask8) __U);1264}12651266static __inline__ __m128d __DEFAULT_FN_ATTRS1267_mm_mask_fmsub_pd(__m128d __A, __mmask8 __U, __m128d __B, __m128d __C)1268{1269return (__m128d) __builtin_ia32_vfmaddpd128_mask ((__v2df) __A,1270(__v2df) __B,1271-(__v2df) __C,1272(__mmask8) __U);1273}12741275static __inline__ __m128d __DEFAULT_FN_ATTRS1276_mm_maskz_fmsub_pd(__mmask8 __U, __m128d __A, __m128d __B, __m128d __C)1277{1278return (__m128d) __builtin_ia32_vfmaddpd128_maskz ((__v2df) __A,1279(__v2df) __B,1280-(__v2df) __C,1281(__mmask8) __U);1282}12831284static __inline__ __m128d __DEFAULT_FN_ATTRS1285_mm_mask3_fnmadd_pd(__m128d __A, __m128d __B, __m128d __C, __mmask8 __U)1286{1287return (__m128d) __builtin_ia32_vfmaddpd128_mask3 (-(__v2df) __A,1288(__v2df) __B,1289(__v2df) __C,1290(__mmask8) __U);1291}12921293static __inline__ __m128d __DEFAULT_FN_ATTRS1294_mm_maskz_fnmadd_pd(__mmask8 __U, __m128d __A, __m128d __B, __m128d __C)1295{1296return (__m128d) __builtin_ia32_vfmaddpd128_maskz (-(__v2df) __A,1297(__v2df) __B,1298(__v2df) __C,1299(__mmask8) __U);1300}13011302static __inline__ __m128d __DEFAULT_FN_ATTRS1303_mm_maskz_fnmsub_pd(__mmask8 __U, __m128d __A, __m128d __B, __m128d __C)1304{1305return (__m128d) __builtin_ia32_vfmaddpd128_maskz (-(__v2df) __A,1306(__v2df) __B,1307-(__v2df) __C,1308(__mmask8) __U);1309}13101311static __inline__ __m256d __DEFAULT_FN_ATTRS1312_mm256_mask_fmadd_pd(__m256d __A, __mmask8 __U, __m256d __B, __m256d __C)1313{1314return (__m256d) __builtin_ia32_vfmaddpd256_mask ((__v4df) __A,1315(__v4df) __B,1316(__v4df) __C,1317(__mmask8) __U);1318}13191320static __inline__ __m256d __DEFAULT_FN_ATTRS1321_mm256_mask3_fmadd_pd(__m256d __A, __m256d __B, __m256d __C, __mmask8 __U)1322{1323return (__m256d) __builtin_ia32_vfmaddpd256_mask3 ((__v4df) __A,1324(__v4df) __B,1325(__v4df) __C,1326(__mmask8) __U);1327}13281329static __inline__ __m256d __DEFAULT_FN_ATTRS1330_mm256_maskz_fmadd_pd(__mmask8 __U, __m256d __A, __m256d __B, __m256d __C)1331{1332return (__m256d) __builtin_ia32_vfmaddpd256_maskz ((__v4df) __A,1333(__v4df) __B,1334(__v4df) __C,1335(__mmask8) __U);1336}13371338static __inline__ __m256d __DEFAULT_FN_ATTRS1339_mm256_mask_fmsub_pd(__m256d __A, __mmask8 __U, __m256d __B, __m256d __C)1340{1341return (__m256d) __builtin_ia32_vfmaddpd256_mask ((__v4df) __A,1342(__v4df) __B,1343-(__v4df) __C,1344(__mmask8) __U);1345}13461347static __inline__ __m256d __DEFAULT_FN_ATTRS1348_mm256_maskz_fmsub_pd(__mmask8 __U, __m256d __A, __m256d __B, __m256d __C)1349{1350return (__m256d) __builtin_ia32_vfmaddpd256_maskz ((__v4df) __A,1351(__v4df) __B,1352-(__v4df) __C,1353(__mmask8) __U);1354}13551356static __inline__ __m256d __DEFAULT_FN_ATTRS1357_mm256_mask3_fnmadd_pd(__m256d __A, __m256d __B, __m256d __C, __mmask8 __U)1358{1359return (__m256d) __builtin_ia32_vfmaddpd256_mask3 (-(__v4df) __A,1360(__v4df) __B,1361(__v4df) __C,1362(__mmask8) __U);1363}13641365static __inline__ __m256d __DEFAULT_FN_ATTRS1366_mm256_maskz_fnmadd_pd(__mmask8 __U, __m256d __A, __m256d __B, __m256d __C)1367{1368return (__m256d) __builtin_ia32_vfmaddpd256_maskz (-(__v4df) __A,1369(__v4df) __B,1370(__v4df) __C,1371(__mmask8) __U);1372}13731374static __inline__ __m256d __DEFAULT_FN_ATTRS1375_mm256_maskz_fnmsub_pd(__mmask8 __U, __m256d __A, __m256d __B, __m256d __C)1376{1377return (__m256d) __builtin_ia32_vfmaddpd256_maskz (-(__v4df) __A,1378(__v4df) __B,1379-(__v4df) __C,1380(__mmask8) __U);1381}13821383static __inline__ __m128 __DEFAULT_FN_ATTRS1384_mm_mask_fmadd_ps(__m128 __A, __mmask8 __U, __m128 __B, __m128 __C)1385{1386return (__m128) __builtin_ia32_vfmaddps128_mask ((__v4sf) __A,1387(__v4sf) __B,1388(__v4sf) __C,1389(__mmask8) __U);1390}13911392static __inline__ __m128 __DEFAULT_FN_ATTRS1393_mm_mask3_fmadd_ps(__m128 __A, __m128 __B, __m128 __C, __mmask8 __U)1394{1395return (__m128) __builtin_ia32_vfmaddps128_mask3 ((__v4sf) __A,1396(__v4sf) __B,1397(__v4sf) __C,1398(__mmask8) __U);1399}14001401static __inline__ __m128 __DEFAULT_FN_ATTRS1402_mm_maskz_fmadd_ps(__mmask8 __U, __m128 __A, __m128 __B, __m128 __C)1403{1404return (__m128) __builtin_ia32_vfmaddps128_maskz ((__v4sf) __A,1405(__v4sf) __B,1406(__v4sf) __C,1407(__mmask8) __U);1408}14091410static __inline__ __m128 __DEFAULT_FN_ATTRS1411_mm_mask_fmsub_ps(__m128 __A, __mmask8 __U, __m128 __B, __m128 __C)1412{1413return (__m128) __builtin_ia32_vfmaddps128_mask ((__v4sf) __A,1414(__v4sf) __B,1415-(__v4sf) __C,1416(__mmask8) __U);1417}14181419static __inline__ __m128 __DEFAULT_FN_ATTRS1420_mm_maskz_fmsub_ps(__mmask8 __U, __m128 __A, __m128 __B, __m128 __C)1421{1422return (__m128) __builtin_ia32_vfmaddps128_maskz ((__v4sf) __A,1423(__v4sf) __B,1424-(__v4sf) __C,1425(__mmask8) __U);1426}14271428static __inline__ __m128 __DEFAULT_FN_ATTRS1429_mm_mask3_fnmadd_ps(__m128 __A, __m128 __B, __m128 __C, __mmask8 __U)1430{1431return (__m128) __builtin_ia32_vfmaddps128_mask3 (-(__v4sf) __A,1432(__v4sf) __B,1433(__v4sf) __C,1434(__mmask8) __U);1435}14361437static __inline__ __m128 __DEFAULT_FN_ATTRS1438_mm_maskz_fnmadd_ps(__mmask8 __U, __m128 __A, __m128 __B, __m128 __C)1439{1440return (__m128) __builtin_ia32_vfmaddps128_maskz (-(__v4sf) __A,1441(__v4sf) __B,1442(__v4sf) __C,1443(__mmask8) __U);1444}14451446static __inline__ __m128 __DEFAULT_FN_ATTRS1447_mm_maskz_fnmsub_ps(__mmask8 __U, __m128 __A, __m128 __B, __m128 __C)1448{1449return (__m128) __builtin_ia32_vfmaddps128_maskz (-(__v4sf) __A,1450(__v4sf) __B,1451-(__v4sf) __C,1452(__mmask8) __U);1453}14541455static __inline__ __m256 __DEFAULT_FN_ATTRS1456_mm256_mask_fmadd_ps(__m256 __A, __mmask8 __U, __m256 __B, __m256 __C)1457{1458return (__m256) __builtin_ia32_vfmaddps256_mask ((__v8sf) __A,1459(__v8sf) __B,1460(__v8sf) __C,1461(__mmask8) __U);1462}14631464static __inline__ __m256 __DEFAULT_FN_ATTRS1465_mm256_mask3_fmadd_ps(__m256 __A, __m256 __B, __m256 __C, __mmask8 __U)1466{1467return (__m256) __builtin_ia32_vfmaddps256_mask3 ((__v8sf) __A,1468(__v8sf) __B,1469(__v8sf) __C,1470(__mmask8) __U);1471}14721473static __inline__ __m256 __DEFAULT_FN_ATTRS1474_mm256_maskz_fmadd_ps(__mmask8 __U, __m256 __A, __m256 __B, __m256 __C)1475{1476return (__m256) __builtin_ia32_vfmaddps256_maskz ((__v8sf) __A,1477(__v8sf) __B,1478(__v8sf) __C,1479(__mmask8) __U);1480}14811482static __inline__ __m256 __DEFAULT_FN_ATTRS1483_mm256_mask_fmsub_ps(__m256 __A, __mmask8 __U, __m256 __B, __m256 __C)1484{1485return (__m256) __builtin_ia32_vfmaddps256_mask ((__v8sf) __A,1486(__v8sf) __B,1487-(__v8sf) __C,1488(__mmask8) __U);1489}14901491static __inline__ __m256 __DEFAULT_FN_ATTRS1492_mm256_maskz_fmsub_ps(__mmask8 __U, __m256 __A, __m256 __B, __m256 __C)1493{1494return (__m256) __builtin_ia32_vfmaddps256_maskz ((__v8sf) __A,1495(__v8sf) __B,1496-(__v8sf) __C,1497(__mmask8) __U);1498}14991500static __inline__ __m256 __DEFAULT_FN_ATTRS1501_mm256_mask3_fnmadd_ps(__m256 __A, __m256 __B, __m256 __C, __mmask8 __U)1502{1503return (__m256) __builtin_ia32_vfmaddps256_mask3 (-(__v8sf) __A,1504(__v8sf) __B,1505(__v8sf) __C,1506(__mmask8) __U);1507}15081509static __inline__ __m256 __DEFAULT_FN_ATTRS1510_mm256_maskz_fnmadd_ps(__mmask8 __U, __m256 __A, __m256 __B, __m256 __C)1511{1512return (__m256) __builtin_ia32_vfmaddps256_maskz (-(__v8sf) __A,1513(__v8sf) __B,1514(__v8sf) __C,1515(__mmask8) __U);1516}15171518static __inline__ __m256 __DEFAULT_FN_ATTRS1519_mm256_maskz_fnmsub_ps(__mmask8 __U, __m256 __A, __m256 __B, __m256 __C)1520{1521return (__m256) __builtin_ia32_vfmaddps256_maskz (-(__v8sf) __A,1522(__v8sf) __B,1523-(__v8sf) __C,1524(__mmask8) __U);1525}15261527static __inline__ __m128d __DEFAULT_FN_ATTRS1528_mm_mask_fmaddsub_pd(__m128d __A, __mmask8 __U, __m128d __B, __m128d __C)1529{1530return (__m128d) __builtin_ia32_vfmaddsubpd128_mask ((__v2df) __A,1531(__v2df) __B,1532(__v2df) __C,1533(__mmask8) __U);1534}15351536static __inline__ __m128d __DEFAULT_FN_ATTRS1537_mm_mask3_fmaddsub_pd(__m128d __A, __m128d __B, __m128d __C, __mmask8 __U)1538{1539return (__m128d) __builtin_ia32_vfmaddsubpd128_mask3 ((__v2df) __A,1540(__v2df) __B,1541(__v2df) __C,1542(__mmask8)1543__U);1544}15451546static __inline__ __m128d __DEFAULT_FN_ATTRS1547_mm_maskz_fmaddsub_pd(__mmask8 __U, __m128d __A, __m128d __B, __m128d __C)1548{1549return (__m128d) __builtin_ia32_vfmaddsubpd128_maskz ((__v2df) __A,1550(__v2df) __B,1551(__v2df) __C,1552(__mmask8)1553__U);1554}15551556static __inline__ __m128d __DEFAULT_FN_ATTRS1557_mm_mask_fmsubadd_pd(__m128d __A, __mmask8 __U, __m128d __B, __m128d __C)1558{1559return (__m128d) __builtin_ia32_vfmaddsubpd128_mask ((__v2df) __A,1560(__v2df) __B,1561-(__v2df) __C,1562(__mmask8) __U);1563}15641565static __inline__ __m128d __DEFAULT_FN_ATTRS1566_mm_maskz_fmsubadd_pd(__mmask8 __U, __m128d __A, __m128d __B, __m128d __C)1567{1568return (__m128d) __builtin_ia32_vfmaddsubpd128_maskz ((__v2df) __A,1569(__v2df) __B,1570-(__v2df) __C,1571(__mmask8)1572__U);1573}15741575static __inline__ __m256d __DEFAULT_FN_ATTRS1576_mm256_mask_fmaddsub_pd(__m256d __A, __mmask8 __U, __m256d __B, __m256d __C)1577{1578return (__m256d) __builtin_ia32_vfmaddsubpd256_mask ((__v4df) __A,1579(__v4df) __B,1580(__v4df) __C,1581(__mmask8) __U);1582}15831584static __inline__ __m256d __DEFAULT_FN_ATTRS1585_mm256_mask3_fmaddsub_pd(__m256d __A, __m256d __B, __m256d __C, __mmask8 __U)1586{1587return (__m256d) __builtin_ia32_vfmaddsubpd256_mask3 ((__v4df) __A,1588(__v4df) __B,1589(__v4df) __C,1590(__mmask8)1591__U);1592}15931594static __inline__ __m256d __DEFAULT_FN_ATTRS1595_mm256_maskz_fmaddsub_pd(__mmask8 __U, __m256d __A, __m256d __B, __m256d __C)1596{1597return (__m256d) __builtin_ia32_vfmaddsubpd256_maskz ((__v4df) __A,1598(__v4df) __B,1599(__v4df) __C,1600(__mmask8)1601__U);1602}16031604static __inline__ __m256d __DEFAULT_FN_ATTRS1605_mm256_mask_fmsubadd_pd(__m256d __A, __mmask8 __U, __m256d __B, __m256d __C)1606{1607return (__m256d) __builtin_ia32_vfmaddsubpd256_mask ((__v4df) __A,1608(__v4df) __B,1609-(__v4df) __C,1610(__mmask8) __U);1611}16121613static __inline__ __m256d __DEFAULT_FN_ATTRS1614_mm256_maskz_fmsubadd_pd(__mmask8 __U, __m256d __A, __m256d __B, __m256d __C)1615{1616return (__m256d) __builtin_ia32_vfmaddsubpd256_maskz ((__v4df) __A,1617(__v4df) __B,1618-(__v4df) __C,1619(__mmask8)1620__U);1621}16221623static __inline__ __m128 __DEFAULT_FN_ATTRS1624_mm_mask_fmaddsub_ps(__m128 __A, __mmask8 __U, __m128 __B, __m128 __C)1625{1626return (__m128) __builtin_ia32_vfmaddsubps128_mask ((__v4sf) __A,1627(__v4sf) __B,1628(__v4sf) __C,1629(__mmask8) __U);1630}16311632static __inline__ __m128 __DEFAULT_FN_ATTRS1633_mm_mask3_fmaddsub_ps(__m128 __A, __m128 __B, __m128 __C, __mmask8 __U)1634{1635return (__m128) __builtin_ia32_vfmaddsubps128_mask3 ((__v4sf) __A,1636(__v4sf) __B,1637(__v4sf) __C,1638(__mmask8) __U);1639}16401641static __inline__ __m128 __DEFAULT_FN_ATTRS1642_mm_maskz_fmaddsub_ps(__mmask8 __U, __m128 __A, __m128 __B, __m128 __C)1643{1644return (__m128) __builtin_ia32_vfmaddsubps128_maskz ((__v4sf) __A,1645(__v4sf) __B,1646(__v4sf) __C,1647(__mmask8) __U);1648}16491650static __inline__ __m128 __DEFAULT_FN_ATTRS1651_mm_mask_fmsubadd_ps(__m128 __A, __mmask8 __U, __m128 __B, __m128 __C)1652{1653return (__m128) __builtin_ia32_vfmaddsubps128_mask ((__v4sf) __A,1654(__v4sf) __B,1655-(__v4sf) __C,1656(__mmask8) __U);1657}16581659static __inline__ __m128 __DEFAULT_FN_ATTRS1660_mm_maskz_fmsubadd_ps(__mmask8 __U, __m128 __A, __m128 __B, __m128 __C)1661{1662return (__m128) __builtin_ia32_vfmaddsubps128_maskz ((__v4sf) __A,1663(__v4sf) __B,1664-(__v4sf) __C,1665(__mmask8) __U);1666}16671668static __inline__ __m256 __DEFAULT_FN_ATTRS1669_mm256_mask_fmaddsub_ps(__m256 __A, __mmask8 __U, __m256 __B,1670__m256 __C)1671{1672return (__m256) __builtin_ia32_vfmaddsubps256_mask ((__v8sf) __A,1673(__v8sf) __B,1674(__v8sf) __C,1675(__mmask8) __U);1676}16771678static __inline__ __m256 __DEFAULT_FN_ATTRS1679_mm256_mask3_fmaddsub_ps(__m256 __A, __m256 __B, __m256 __C, __mmask8 __U)1680{1681return (__m256) __builtin_ia32_vfmaddsubps256_mask3 ((__v8sf) __A,1682(__v8sf) __B,1683(__v8sf) __C,1684(__mmask8) __U);1685}16861687static __inline__ __m256 __DEFAULT_FN_ATTRS1688_mm256_maskz_fmaddsub_ps(__mmask8 __U, __m256 __A, __m256 __B, __m256 __C)1689{1690return (__m256) __builtin_ia32_vfmaddsubps256_maskz ((__v8sf) __A,1691(__v8sf) __B,1692(__v8sf) __C,1693(__mmask8) __U);1694}16951696static __inline__ __m256 __DEFAULT_FN_ATTRS1697_mm256_mask_fmsubadd_ps(__m256 __A, __mmask8 __U, __m256 __B, __m256 __C)1698{1699return (__m256) __builtin_ia32_vfmaddsubps256_mask ((__v8sf) __A,1700(__v8sf) __B,1701-(__v8sf) __C,1702(__mmask8) __U);1703}17041705static __inline__ __m256 __DEFAULT_FN_ATTRS1706_mm256_maskz_fmsubadd_ps(__mmask8 __U, __m256 __A, __m256 __B, __m256 __C)1707{1708return (__m256) __builtin_ia32_vfmaddsubps256_maskz ((__v8sf) __A,1709(__v8sf) __B,1710-(__v8sf) __C,1711(__mmask8) __U);1712}17131714static __inline__ __m128d __DEFAULT_FN_ATTRS1715_mm_mask3_fmsub_pd(__m128d __A, __m128d __B, __m128d __C, __mmask8 __U)1716{1717return (__m128d) __builtin_ia32_vfmsubpd128_mask3 ((__v2df) __A,1718(__v2df) __B,1719(__v2df) __C,1720(__mmask8) __U);1721}17221723static __inline__ __m256d __DEFAULT_FN_ATTRS1724_mm256_mask3_fmsub_pd(__m256d __A, __m256d __B, __m256d __C, __mmask8 __U)1725{1726return (__m256d) __builtin_ia32_vfmsubpd256_mask3 ((__v4df) __A,1727(__v4df) __B,1728(__v4df) __C,1729(__mmask8) __U);1730}17311732static __inline__ __m128 __DEFAULT_FN_ATTRS1733_mm_mask3_fmsub_ps(__m128 __A, __m128 __B, __m128 __C, __mmask8 __U)1734{1735return (__m128) __builtin_ia32_vfmsubps128_mask3 ((__v4sf) __A,1736(__v4sf) __B,1737(__v4sf) __C,1738(__mmask8) __U);1739}17401741static __inline__ __m256 __DEFAULT_FN_ATTRS1742_mm256_mask3_fmsub_ps(__m256 __A, __m256 __B, __m256 __C, __mmask8 __U)1743{1744return (__m256) __builtin_ia32_vfmsubps256_mask3 ((__v8sf) __A,1745(__v8sf) __B,1746(__v8sf) __C,1747(__mmask8) __U);1748}17491750static __inline__ __m128d __DEFAULT_FN_ATTRS1751_mm_mask3_fmsubadd_pd(__m128d __A, __m128d __B, __m128d __C, __mmask8 __U)1752{1753return (__m128d) __builtin_ia32_vfmsubaddpd128_mask3 ((__v2df) __A,1754(__v2df) __B,1755(__v2df) __C,1756(__mmask8)1757__U);1758}17591760static __inline__ __m256d __DEFAULT_FN_ATTRS1761_mm256_mask3_fmsubadd_pd(__m256d __A, __m256d __B, __m256d __C, __mmask8 __U)1762{1763return (__m256d) __builtin_ia32_vfmsubaddpd256_mask3 ((__v4df) __A,1764(__v4df) __B,1765(__v4df) __C,1766(__mmask8)1767__U);1768}17691770static __inline__ __m128 __DEFAULT_FN_ATTRS1771_mm_mask3_fmsubadd_ps(__m128 __A, __m128 __B, __m128 __C, __mmask8 __U)1772{1773return (__m128) __builtin_ia32_vfmsubaddps128_mask3 ((__v4sf) __A,1774(__v4sf) __B,1775(__v4sf) __C,1776(__mmask8) __U);1777}17781779static __inline__ __m256 __DEFAULT_FN_ATTRS1780_mm256_mask3_fmsubadd_ps(__m256 __A, __m256 __B, __m256 __C, __mmask8 __U)1781{1782return (__m256) __builtin_ia32_vfmsubaddps256_mask3 ((__v8sf) __A,1783(__v8sf) __B,1784(__v8sf) __C,1785(__mmask8) __U);1786}17871788static __inline__ __m128d __DEFAULT_FN_ATTRS1789_mm_mask_fnmadd_pd(__m128d __A, __mmask8 __U, __m128d __B, __m128d __C)1790{1791return (__m128d) __builtin_ia32_vfnmaddpd128_mask ((__v2df) __A,1792(__v2df) __B,1793(__v2df) __C,1794(__mmask8) __U);1795}17961797static __inline__ __m256d __DEFAULT_FN_ATTRS1798_mm256_mask_fnmadd_pd(__m256d __A, __mmask8 __U, __m256d __B, __m256d __C)1799{1800return (__m256d) __builtin_ia32_vfnmaddpd256_mask ((__v4df) __A,1801(__v4df) __B,1802(__v4df) __C,1803(__mmask8) __U);1804}18051806static __inline__ __m128 __DEFAULT_FN_ATTRS1807_mm_mask_fnmadd_ps(__m128 __A, __mmask8 __U, __m128 __B, __m128 __C)1808{1809return (__m128) __builtin_ia32_vfnmaddps128_mask ((__v4sf) __A,1810(__v4sf) __B,1811(__v4sf) __C,1812(__mmask8) __U);1813}18141815static __inline__ __m256 __DEFAULT_FN_ATTRS1816_mm256_mask_fnmadd_ps(__m256 __A, __mmask8 __U, __m256 __B, __m256 __C)1817{1818return (__m256) __builtin_ia32_vfnmaddps256_mask ((__v8sf) __A,1819(__v8sf) __B,1820(__v8sf) __C,1821(__mmask8) __U);1822}18231824static __inline__ __m128d __DEFAULT_FN_ATTRS1825_mm_mask_fnmsub_pd(__m128d __A, __mmask8 __U, __m128d __B, __m128d __C)1826{1827return (__m128d) __builtin_ia32_vfnmsubpd128_mask ((__v2df) __A,1828(__v2df) __B,1829(__v2df) __C,1830(__mmask8) __U);1831}18321833static __inline__ __m128d __DEFAULT_FN_ATTRS1834_mm_mask3_fnmsub_pd(__m128d __A, __m128d __B, __m128d __C, __mmask8 __U)1835{1836return (__m128d) __builtin_ia32_vfnmsubpd128_mask3 ((__v2df) __A,1837(__v2df) __B,1838(__v2df) __C,1839(__mmask8) __U);1840}18411842static __inline__ __m256d __DEFAULT_FN_ATTRS1843_mm256_mask_fnmsub_pd(__m256d __A, __mmask8 __U, __m256d __B, __m256d __C)1844{1845return (__m256d) __builtin_ia32_vfnmsubpd256_mask ((__v4df) __A,1846(__v4df) __B,1847(__v4df) __C,1848(__mmask8) __U);1849}18501851static __inline__ __m256d __DEFAULT_FN_ATTRS1852_mm256_mask3_fnmsub_pd(__m256d __A, __m256d __B, __m256d __C, __mmask8 __U)1853{1854return (__m256d) __builtin_ia32_vfnmsubpd256_mask3 ((__v4df) __A,1855(__v4df) __B,1856(__v4df) __C,1857(__mmask8) __U);1858}18591860static __inline__ __m128 __DEFAULT_FN_ATTRS1861_mm_mask_fnmsub_ps(__m128 __A, __mmask8 __U, __m128 __B, __m128 __C)1862{1863return (__m128) __builtin_ia32_vfnmsubps128_mask ((__v4sf) __A,1864(__v4sf) __B,1865(__v4sf) __C,1866(__mmask8) __U);1867}18681869static __inline__ __m128 __DEFAULT_FN_ATTRS1870_mm_mask3_fnmsub_ps(__m128 __A, __m128 __B, __m128 __C, __mmask8 __U)1871{1872return (__m128) __builtin_ia32_vfnmsubps128_mask3 ((__v4sf) __A,1873(__v4sf) __B,1874(__v4sf) __C,1875(__mmask8) __U);1876}18771878static __inline__ __m256 __DEFAULT_FN_ATTRS1879_mm256_mask_fnmsub_ps(__m256 __A, __mmask8 __U, __m256 __B, __m256 __C)1880{1881return (__m256) __builtin_ia32_vfnmsubps256_mask ((__v8sf) __A,1882(__v8sf) __B,1883(__v8sf) __C,1884(__mmask8) __U);1885}18861887static __inline__ __m256 __DEFAULT_FN_ATTRS1888_mm256_mask3_fnmsub_ps(__m256 __A, __m256 __B, __m256 __C, __mmask8 __U)1889{1890return (__m256) __builtin_ia32_vfnmsubps256_mask3 ((__v8sf) __A,1891(__v8sf) __B,1892(__v8sf) __C,1893(__mmask8) __U);1894}18951896static __inline__ __m128d __DEFAULT_FN_ATTRS1897_mm_mask_add_pd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B) {1898return (__m128d) __builtin_ia32_addpd128_mask ((__v2df) __A,1899(__v2df) __B,1900(__v2df) __W,1901(__mmask8) __U);1902}19031904static __inline__ __m128d __DEFAULT_FN_ATTRS1905_mm_maskz_add_pd (__mmask8 __U, __m128d __A, __m128d __B) {1906return (__m128d) __builtin_ia32_addpd128_mask ((__v2df) __A,1907(__v2df) __B,1908(__v2df)1909_mm_setzero_pd (),1910(__mmask8) __U);1911}19121913static __inline__ __m256d __DEFAULT_FN_ATTRS1914_mm256_mask_add_pd (__m256d __W, __mmask8 __U, __m256d __A, __m256d __B) {1915return (__m256d) __builtin_ia32_addpd256_mask ((__v4df) __A,1916(__v4df) __B,1917(__v4df) __W,1918(__mmask8) __U);1919}19201921static __inline__ __m256d __DEFAULT_FN_ATTRS1922_mm256_maskz_add_pd (__mmask8 __U, __m256d __A, __m256d __B) {1923return (__m256d) __builtin_ia32_addpd256_mask ((__v4df) __A,1924(__v4df) __B,1925(__v4df)1926_mm256_setzero_pd (),1927(__mmask8) __U);1928}19291930static __inline__ __m128 __DEFAULT_FN_ATTRS1931_mm_mask_add_ps (__m128 __W, __mmask16 __U, __m128 __A, __m128 __B) {1932return (__m128) __builtin_ia32_addps128_mask ((__v4sf) __A,1933(__v4sf) __B,1934(__v4sf) __W,1935(__mmask8) __U);1936}19371938static __inline__ __m128 __DEFAULT_FN_ATTRS1939_mm_maskz_add_ps (__mmask16 __U, __m128 __A, __m128 __B) {1940return (__m128) __builtin_ia32_addps128_mask ((__v4sf) __A,1941(__v4sf) __B,1942(__v4sf)1943_mm_setzero_ps (),1944(__mmask8) __U);1945}19461947static __inline__ __m256 __DEFAULT_FN_ATTRS1948_mm256_mask_add_ps (__m256 __W, __mmask16 __U, __m256 __A, __m256 __B) {1949return (__m256) __builtin_ia32_addps256_mask ((__v8sf) __A,1950(__v8sf) __B,1951(__v8sf) __W,1952(__mmask8) __U);1953}19541955static __inline__ __m256 __DEFAULT_FN_ATTRS1956_mm256_maskz_add_ps (__mmask16 __U, __m256 __A, __m256 __B) {1957return (__m256) __builtin_ia32_addps256_mask ((__v8sf) __A,1958(__v8sf) __B,1959(__v8sf)1960_mm256_setzero_ps (),1961(__mmask8) __U);1962}19631964static __inline__ __m128i __DEFAULT_FN_ATTRS1965_mm_mask_blend_epi32 (__mmask8 __U, __m128i __A, __m128i __W) {1966return (__m128i) __builtin_ia32_selectd_128 ((__mmask8) __U,1967(__v4si) __W,1968(__v4si) __A);1969}19701971static __inline__ __m256i __DEFAULT_FN_ATTRS1972_mm256_mask_blend_epi32 (__mmask8 __U, __m256i __A, __m256i __W) {1973return (__m256i) __builtin_ia32_selectd_256 ((__mmask8) __U,1974(__v8si) __W,1975(__v8si) __A);1976}19771978static __inline__ __m128d __DEFAULT_FN_ATTRS1979_mm_mask_blend_pd (__mmask8 __U, __m128d __A, __m128d __W) {1980return (__m128d) __builtin_ia32_selectpd_128 ((__mmask8) __U,1981(__v2df) __W,1982(__v2df) __A);1983}19841985static __inline__ __m256d __DEFAULT_FN_ATTRS1986_mm256_mask_blend_pd (__mmask8 __U, __m256d __A, __m256d __W) {1987return (__m256d) __builtin_ia32_selectpd_256 ((__mmask8) __U,1988(__v4df) __W,1989(__v4df) __A);1990}19911992static __inline__ __m128 __DEFAULT_FN_ATTRS1993_mm_mask_blend_ps (__mmask8 __U, __m128 __A, __m128 __W) {1994return (__m128) __builtin_ia32_selectps_128 ((__mmask8) __U,1995(__v4sf) __W,1996(__v4sf) __A);1997}19981999static __inline__ __m256 __DEFAULT_FN_ATTRS2000_mm256_mask_blend_ps (__mmask8 __U, __m256 __A, __m256 __W) {2001return (__m256) __builtin_ia32_selectps_256 ((__mmask8) __U,2002(__v8sf) __W,2003(__v8sf) __A);2004}20052006static __inline__ __m128i __DEFAULT_FN_ATTRS2007_mm_mask_blend_epi64 (__mmask8 __U, __m128i __A, __m128i __W) {2008return (__m128i) __builtin_ia32_selectq_128 ((__mmask8) __U,2009(__v2di) __W,2010(__v2di) __A);2011}20122013static __inline__ __m256i __DEFAULT_FN_ATTRS2014_mm256_mask_blend_epi64 (__mmask8 __U, __m256i __A, __m256i __W) {2015return (__m256i) __builtin_ia32_selectq_256 ((__mmask8) __U,2016(__v4di) __W,2017(__v4di) __A);2018}20192020static __inline__ __m128d __DEFAULT_FN_ATTRS2021_mm_mask_compress_pd (__m128d __W, __mmask8 __U, __m128d __A) {2022return (__m128d) __builtin_ia32_compressdf128_mask ((__v2df) __A,2023(__v2df) __W,2024(__mmask8) __U);2025}20262027static __inline__ __m128d __DEFAULT_FN_ATTRS2028_mm_maskz_compress_pd (__mmask8 __U, __m128d __A) {2029return (__m128d) __builtin_ia32_compressdf128_mask ((__v2df) __A,2030(__v2df)2031_mm_setzero_pd (),2032(__mmask8) __U);2033}20342035static __inline__ __m256d __DEFAULT_FN_ATTRS2036_mm256_mask_compress_pd (__m256d __W, __mmask8 __U, __m256d __A) {2037return (__m256d) __builtin_ia32_compressdf256_mask ((__v4df) __A,2038(__v4df) __W,2039(__mmask8) __U);2040}20412042static __inline__ __m256d __DEFAULT_FN_ATTRS2043_mm256_maskz_compress_pd (__mmask8 __U, __m256d __A) {2044return (__m256d) __builtin_ia32_compressdf256_mask ((__v4df) __A,2045(__v4df)2046_mm256_setzero_pd (),2047(__mmask8) __U);2048}20492050static __inline__ __m128i __DEFAULT_FN_ATTRS2051_mm_mask_compress_epi64 (__m128i __W, __mmask8 __U, __m128i __A) {2052return (__m128i) __builtin_ia32_compressdi128_mask ((__v2di) __A,2053(__v2di) __W,2054(__mmask8) __U);2055}20562057static __inline__ __m128i __DEFAULT_FN_ATTRS2058_mm_maskz_compress_epi64 (__mmask8 __U, __m128i __A) {2059return (__m128i) __builtin_ia32_compressdi128_mask ((__v2di) __A,2060(__v2di)2061_mm_setzero_si128 (),2062(__mmask8) __U);2063}20642065static __inline__ __m256i __DEFAULT_FN_ATTRS2066_mm256_mask_compress_epi64 (__m256i __W, __mmask8 __U, __m256i __A) {2067return (__m256i) __builtin_ia32_compressdi256_mask ((__v4di) __A,2068(__v4di) __W,2069(__mmask8) __U);2070}20712072static __inline__ __m256i __DEFAULT_FN_ATTRS2073_mm256_maskz_compress_epi64 (__mmask8 __U, __m256i __A) {2074return (__m256i) __builtin_ia32_compressdi256_mask ((__v4di) __A,2075(__v4di)2076_mm256_setzero_si256 (),2077(__mmask8) __U);2078}20792080static __inline__ __m128 __DEFAULT_FN_ATTRS2081_mm_mask_compress_ps (__m128 __W, __mmask8 __U, __m128 __A) {2082return (__m128) __builtin_ia32_compresssf128_mask ((__v4sf) __A,2083(__v4sf) __W,2084(__mmask8) __U);2085}20862087static __inline__ __m128 __DEFAULT_FN_ATTRS2088_mm_maskz_compress_ps (__mmask8 __U, __m128 __A) {2089return (__m128) __builtin_ia32_compresssf128_mask ((__v4sf) __A,2090(__v4sf)2091_mm_setzero_ps (),2092(__mmask8) __U);2093}20942095static __inline__ __m256 __DEFAULT_FN_ATTRS2096_mm256_mask_compress_ps (__m256 __W, __mmask8 __U, __m256 __A) {2097return (__m256) __builtin_ia32_compresssf256_mask ((__v8sf) __A,2098(__v8sf) __W,2099(__mmask8) __U);2100}21012102static __inline__ __m256 __DEFAULT_FN_ATTRS2103_mm256_maskz_compress_ps (__mmask8 __U, __m256 __A) {2104return (__m256) __builtin_ia32_compresssf256_mask ((__v8sf) __A,2105(__v8sf)2106_mm256_setzero_ps (),2107(__mmask8) __U);2108}21092110static __inline__ __m128i __DEFAULT_FN_ATTRS2111_mm_mask_compress_epi32 (__m128i __W, __mmask8 __U, __m128i __A) {2112return (__m128i) __builtin_ia32_compresssi128_mask ((__v4si) __A,2113(__v4si) __W,2114(__mmask8) __U);2115}21162117static __inline__ __m128i __DEFAULT_FN_ATTRS2118_mm_maskz_compress_epi32 (__mmask8 __U, __m128i __A) {2119return (__m128i) __builtin_ia32_compresssi128_mask ((__v4si) __A,2120(__v4si)2121_mm_setzero_si128 (),2122(__mmask8) __U);2123}21242125static __inline__ __m256i __DEFAULT_FN_ATTRS2126_mm256_mask_compress_epi32 (__m256i __W, __mmask8 __U, __m256i __A) {2127return (__m256i) __builtin_ia32_compresssi256_mask ((__v8si) __A,2128(__v8si) __W,2129(__mmask8) __U);2130}21312132static __inline__ __m256i __DEFAULT_FN_ATTRS2133_mm256_maskz_compress_epi32 (__mmask8 __U, __m256i __A) {2134return (__m256i) __builtin_ia32_compresssi256_mask ((__v8si) __A,2135(__v8si)2136_mm256_setzero_si256 (),2137(__mmask8) __U);2138}21392140static __inline__ void __DEFAULT_FN_ATTRS2141_mm_mask_compressstoreu_pd (void *__P, __mmask8 __U, __m128d __A) {2142__builtin_ia32_compressstoredf128_mask ((__v2df *) __P,2143(__v2df) __A,2144(__mmask8) __U);2145}21462147static __inline__ void __DEFAULT_FN_ATTRS2148_mm256_mask_compressstoreu_pd (void *__P, __mmask8 __U, __m256d __A) {2149__builtin_ia32_compressstoredf256_mask ((__v4df *) __P,2150(__v4df) __A,2151(__mmask8) __U);2152}21532154static __inline__ void __DEFAULT_FN_ATTRS2155_mm_mask_compressstoreu_epi64 (void *__P, __mmask8 __U, __m128i __A) {2156__builtin_ia32_compressstoredi128_mask ((__v2di *) __P,2157(__v2di) __A,2158(__mmask8) __U);2159}21602161static __inline__ void __DEFAULT_FN_ATTRS2162_mm256_mask_compressstoreu_epi64 (void *__P, __mmask8 __U, __m256i __A) {2163__builtin_ia32_compressstoredi256_mask ((__v4di *) __P,2164(__v4di) __A,2165(__mmask8) __U);2166}21672168static __inline__ void __DEFAULT_FN_ATTRS2169_mm_mask_compressstoreu_ps (void *__P, __mmask8 __U, __m128 __A) {2170__builtin_ia32_compressstoresf128_mask ((__v4sf *) __P,2171(__v4sf) __A,2172(__mmask8) __U);2173}21742175static __inline__ void __DEFAULT_FN_ATTRS2176_mm256_mask_compressstoreu_ps (void *__P, __mmask8 __U, __m256 __A) {2177__builtin_ia32_compressstoresf256_mask ((__v8sf *) __P,2178(__v8sf) __A,2179(__mmask8) __U);2180}21812182static __inline__ void __DEFAULT_FN_ATTRS2183_mm_mask_compressstoreu_epi32 (void *__P, __mmask8 __U, __m128i __A) {2184__builtin_ia32_compressstoresi128_mask ((__v4si *) __P,2185(__v4si) __A,2186(__mmask8) __U);2187}21882189static __inline__ void __DEFAULT_FN_ATTRS2190_mm256_mask_compressstoreu_epi32 (void *__P, __mmask8 __U, __m256i __A) {2191__builtin_ia32_compressstoresi256_mask ((__v8si *) __P,2192(__v8si) __A,2193(__mmask8) __U);2194}21952196static __inline__ __m128d __DEFAULT_FN_ATTRS2197_mm_mask_cvtepi32_pd (__m128d __W, __mmask8 __U, __m128i __A) {2198return (__m128d) __builtin_ia32_cvtdq2pd128_mask ((__v4si) __A,2199(__v2df) __W,2200(__mmask8) __U);2201}22022203static __inline__ __m128d __DEFAULT_FN_ATTRS2204_mm_maskz_cvtepi32_pd (__mmask8 __U, __m128i __A) {2205return (__m128d) __builtin_ia32_cvtdq2pd128_mask ((__v4si) __A,2206(__v2df)2207_mm_setzero_pd (),2208(__mmask8) __U);2209}22102211static __inline__ __m256d __DEFAULT_FN_ATTRS2212_mm256_mask_cvtepi32_pd (__m256d __W, __mmask8 __U, __m128i __A) {2213return (__m256d) __builtin_ia32_cvtdq2pd256_mask ((__v4si) __A,2214(__v4df) __W,2215(__mmask8) __U);2216}22172218static __inline__ __m256d __DEFAULT_FN_ATTRS2219_mm256_maskz_cvtepi32_pd (__mmask8 __U, __m128i __A) {2220return (__m256d) __builtin_ia32_cvtdq2pd256_mask ((__v4si) __A,2221(__v4df)2222_mm256_setzero_pd (),2223(__mmask8) __U);2224}22252226static __inline__ __m128 __DEFAULT_FN_ATTRS2227_mm_mask_cvtepi32_ps (__m128 __W, __mmask8 __U, __m128i __A) {2228return (__m128) __builtin_ia32_cvtdq2ps128_mask ((__v4si) __A,2229(__v4sf) __W,2230(__mmask8) __U);2231}22322233static __inline__ __m128 __DEFAULT_FN_ATTRS2234_mm_maskz_cvtepi32_ps (__mmask16 __U, __m128i __A) {2235return (__m128) __builtin_ia32_cvtdq2ps128_mask ((__v4si) __A,2236(__v4sf)2237_mm_setzero_ps (),2238(__mmask8) __U);2239}22402241static __inline__ __m256 __DEFAULT_FN_ATTRS2242_mm256_mask_cvtepi32_ps (__m256 __W, __mmask8 __U, __m256i __A) {2243return (__m256) __builtin_ia32_cvtdq2ps256_mask ((__v8si) __A,2244(__v8sf) __W,2245(__mmask8) __U);2246}22472248static __inline__ __m256 __DEFAULT_FN_ATTRS2249_mm256_maskz_cvtepi32_ps (__mmask16 __U, __m256i __A) {2250return (__m256) __builtin_ia32_cvtdq2ps256_mask ((__v8si) __A,2251(__v8sf)2252_mm256_setzero_ps (),2253(__mmask8) __U);2254}22552256static __inline__ __m128i __DEFAULT_FN_ATTRS2257_mm_mask_cvtpd_epi32 (__m128i __W, __mmask8 __U, __m128d __A) {2258return (__m128i) __builtin_ia32_cvtpd2dq128_mask ((__v2df) __A,2259(__v4si) __W,2260(__mmask8) __U);2261}22622263static __inline__ __m128i __DEFAULT_FN_ATTRS2264_mm_maskz_cvtpd_epi32 (__mmask8 __U, __m128d __A) {2265return (__m128i) __builtin_ia32_cvtpd2dq128_mask ((__v2df) __A,2266(__v4si)2267_mm_setzero_si128 (),2268(__mmask8) __U);2269}22702271static __inline__ __m128i __DEFAULT_FN_ATTRS2272_mm256_mask_cvtpd_epi32 (__m128i __W, __mmask8 __U, __m256d __A) {2273return (__m128i) __builtin_ia32_cvtpd2dq256_mask ((__v4df) __A,2274(__v4si) __W,2275(__mmask8) __U);2276}22772278static __inline__ __m128i __DEFAULT_FN_ATTRS2279_mm256_maskz_cvtpd_epi32 (__mmask8 __U, __m256d __A) {2280return (__m128i) __builtin_ia32_cvtpd2dq256_mask ((__v4df) __A,2281(__v4si)2282_mm_setzero_si128 (),2283(__mmask8) __U);2284}22852286static __inline__ __m128 __DEFAULT_FN_ATTRS2287_mm_mask_cvtpd_ps (__m128 __W, __mmask8 __U, __m128d __A) {2288return (__m128) __builtin_ia32_cvtpd2ps_mask ((__v2df) __A,2289(__v4sf) __W,2290(__mmask8) __U);2291}22922293static __inline__ __m128 __DEFAULT_FN_ATTRS2294_mm_maskz_cvtpd_ps (__mmask8 __U, __m128d __A) {2295return (__m128) __builtin_ia32_cvtpd2ps_mask ((__v2df) __A,2296(__v4sf)2297_mm_setzero_ps (),2298(__mmask8) __U);2299}23002301static __inline__ __m128 __DEFAULT_FN_ATTRS2302_mm256_mask_cvtpd_ps (__m128 __W, __mmask8 __U, __m256d __A) {2303return (__m128) __builtin_ia32_cvtpd2ps256_mask ((__v4df) __A,2304(__v4sf) __W,2305(__mmask8) __U);2306}23072308static __inline__ __m128 __DEFAULT_FN_ATTRS2309_mm256_maskz_cvtpd_ps (__mmask8 __U, __m256d __A) {2310return (__m128) __builtin_ia32_cvtpd2ps256_mask ((__v4df) __A,2311(__v4sf)2312_mm_setzero_ps (),2313(__mmask8) __U);2314}23152316static __inline__ __m128i __DEFAULT_FN_ATTRS2317_mm_cvtpd_epu32 (__m128d __A) {2318return (__m128i) __builtin_ia32_cvtpd2udq128_mask ((__v2df) __A,2319(__v4si)2320_mm_setzero_si128 (),2321(__mmask8) -1);2322}23232324static __inline__ __m128i __DEFAULT_FN_ATTRS2325_mm_mask_cvtpd_epu32 (__m128i __W, __mmask8 __U, __m128d __A) {2326return (__m128i) __builtin_ia32_cvtpd2udq128_mask ((__v2df) __A,2327(__v4si) __W,2328(__mmask8) __U);2329}23302331static __inline__ __m128i __DEFAULT_FN_ATTRS2332_mm_maskz_cvtpd_epu32 (__mmask8 __U, __m128d __A) {2333return (__m128i) __builtin_ia32_cvtpd2udq128_mask ((__v2df) __A,2334(__v4si)2335_mm_setzero_si128 (),2336(__mmask8) __U);2337}23382339static __inline__ __m128i __DEFAULT_FN_ATTRS2340_mm256_cvtpd_epu32 (__m256d __A) {2341return (__m128i) __builtin_ia32_cvtpd2udq256_mask ((__v4df) __A,2342(__v4si)2343_mm_setzero_si128 (),2344(__mmask8) -1);2345}23462347static __inline__ __m128i __DEFAULT_FN_ATTRS2348_mm256_mask_cvtpd_epu32 (__m128i __W, __mmask8 __U, __m256d __A) {2349return (__m128i) __builtin_ia32_cvtpd2udq256_mask ((__v4df) __A,2350(__v4si) __W,2351(__mmask8) __U);2352}23532354static __inline__ __m128i __DEFAULT_FN_ATTRS2355_mm256_maskz_cvtpd_epu32 (__mmask8 __U, __m256d __A) {2356return (__m128i) __builtin_ia32_cvtpd2udq256_mask ((__v4df) __A,2357(__v4si)2358_mm_setzero_si128 (),2359(__mmask8) __U);2360}23612362static __inline__ __m128i __DEFAULT_FN_ATTRS2363_mm_mask_cvtps_epi32 (__m128i __W, __mmask8 __U, __m128 __A) {2364return (__m128i) __builtin_ia32_cvtps2dq128_mask ((__v4sf) __A,2365(__v4si) __W,2366(__mmask8) __U);2367}23682369static __inline__ __m128i __DEFAULT_FN_ATTRS2370_mm_maskz_cvtps_epi32 (__mmask8 __U, __m128 __A) {2371return (__m128i) __builtin_ia32_cvtps2dq128_mask ((__v4sf) __A,2372(__v4si)2373_mm_setzero_si128 (),2374(__mmask8) __U);2375}23762377static __inline__ __m256i __DEFAULT_FN_ATTRS2378_mm256_mask_cvtps_epi32 (__m256i __W, __mmask8 __U, __m256 __A) {2379return (__m256i) __builtin_ia32_cvtps2dq256_mask ((__v8sf) __A,2380(__v8si) __W,2381(__mmask8) __U);2382}23832384static __inline__ __m256i __DEFAULT_FN_ATTRS2385_mm256_maskz_cvtps_epi32 (__mmask8 __U, __m256 __A) {2386return (__m256i) __builtin_ia32_cvtps2dq256_mask ((__v8sf) __A,2387(__v8si)2388_mm256_setzero_si256 (),2389(__mmask8) __U);2390}23912392static __inline__ __m128d __DEFAULT_FN_ATTRS2393_mm_mask_cvtps_pd (__m128d __W, __mmask8 __U, __m128 __A) {2394return (__m128d) __builtin_ia32_cvtps2pd128_mask ((__v4sf) __A,2395(__v2df) __W,2396(__mmask8) __U);2397}23982399static __inline__ __m128d __DEFAULT_FN_ATTRS2400_mm_maskz_cvtps_pd (__mmask8 __U, __m128 __A) {2401return (__m128d) __builtin_ia32_cvtps2pd128_mask ((__v4sf) __A,2402(__v2df)2403_mm_setzero_pd (),2404(__mmask8) __U);2405}24062407static __inline__ __m256d __DEFAULT_FN_ATTRS2408_mm256_mask_cvtps_pd (__m256d __W, __mmask8 __U, __m128 __A) {2409return (__m256d) __builtin_ia32_cvtps2pd256_mask ((__v4sf) __A,2410(__v4df) __W,2411(__mmask8) __U);2412}24132414static __inline__ __m256d __DEFAULT_FN_ATTRS2415_mm256_maskz_cvtps_pd (__mmask8 __U, __m128 __A) {2416return (__m256d) __builtin_ia32_cvtps2pd256_mask ((__v4sf) __A,2417(__v4df)2418_mm256_setzero_pd (),2419(__mmask8) __U);2420}24212422static __inline__ __m128i __DEFAULT_FN_ATTRS2423_mm_cvtps_epu32 (__m128 __A) {2424return (__m128i) __builtin_ia32_cvtps2udq128_mask ((__v4sf) __A,2425(__v4si)2426_mm_setzero_si128 (),2427(__mmask8) -1);2428}24292430static __inline__ __m128i __DEFAULT_FN_ATTRS2431_mm_mask_cvtps_epu32 (__m128i __W, __mmask8 __U, __m128 __A) {2432return (__m128i) __builtin_ia32_cvtps2udq128_mask ((__v4sf) __A,2433(__v4si) __W,2434(__mmask8) __U);2435}24362437static __inline__ __m128i __DEFAULT_FN_ATTRS2438_mm_maskz_cvtps_epu32 (__mmask8 __U, __m128 __A) {2439return (__m128i) __builtin_ia32_cvtps2udq128_mask ((__v4sf) __A,2440(__v4si)2441_mm_setzero_si128 (),2442(__mmask8) __U);2443}24442445static __inline__ __m256i __DEFAULT_FN_ATTRS2446_mm256_cvtps_epu32 (__m256 __A) {2447return (__m256i) __builtin_ia32_cvtps2udq256_mask ((__v8sf) __A,2448(__v8si)2449_mm256_setzero_si256 (),2450(__mmask8) -1);2451}24522453static __inline__ __m256i __DEFAULT_FN_ATTRS2454_mm256_mask_cvtps_epu32 (__m256i __W, __mmask8 __U, __m256 __A) {2455return (__m256i) __builtin_ia32_cvtps2udq256_mask ((__v8sf) __A,2456(__v8si) __W,2457(__mmask8) __U);2458}24592460static __inline__ __m256i __DEFAULT_FN_ATTRS2461_mm256_maskz_cvtps_epu32 (__mmask8 __U, __m256 __A) {2462return (__m256i) __builtin_ia32_cvtps2udq256_mask ((__v8sf) __A,2463(__v8si)2464_mm256_setzero_si256 (),2465(__mmask8) __U);2466}24672468static __inline__ __m128i __DEFAULT_FN_ATTRS2469_mm_mask_cvttpd_epi32 (__m128i __W, __mmask8 __U, __m128d __A) {2470return (__m128i) __builtin_ia32_cvttpd2dq128_mask ((__v2df) __A,2471(__v4si) __W,2472(__mmask8) __U);2473}24742475static __inline__ __m128i __DEFAULT_FN_ATTRS2476_mm_maskz_cvttpd_epi32 (__mmask8 __U, __m128d __A) {2477return (__m128i) __builtin_ia32_cvttpd2dq128_mask ((__v2df) __A,2478(__v4si)2479_mm_setzero_si128 (),2480(__mmask8) __U);2481}24822483static __inline__ __m128i __DEFAULT_FN_ATTRS2484_mm256_mask_cvttpd_epi32 (__m128i __W, __mmask8 __U, __m256d __A) {2485return (__m128i) __builtin_ia32_cvttpd2dq256_mask ((__v4df) __A,2486(__v4si) __W,2487(__mmask8) __U);2488}24892490static __inline__ __m128i __DEFAULT_FN_ATTRS2491_mm256_maskz_cvttpd_epi32 (__mmask8 __U, __m256d __A) {2492return (__m128i) __builtin_ia32_cvttpd2dq256_mask ((__v4df) __A,2493(__v4si)2494_mm_setzero_si128 (),2495(__mmask8) __U);2496}24972498static __inline__ __m128i __DEFAULT_FN_ATTRS2499_mm_cvttpd_epu32 (__m128d __A) {2500return (__m128i) __builtin_ia32_cvttpd2udq128_mask ((__v2df) __A,2501(__v4si)2502_mm_setzero_si128 (),2503(__mmask8) -1);2504}25052506static __inline__ __m128i __DEFAULT_FN_ATTRS2507_mm_mask_cvttpd_epu32 (__m128i __W, __mmask8 __U, __m128d __A) {2508return (__m128i) __builtin_ia32_cvttpd2udq128_mask ((__v2df) __A,2509(__v4si) __W,2510(__mmask8) __U);2511}25122513static __inline__ __m128i __DEFAULT_FN_ATTRS2514_mm_maskz_cvttpd_epu32 (__mmask8 __U, __m128d __A) {2515return (__m128i) __builtin_ia32_cvttpd2udq128_mask ((__v2df) __A,2516(__v4si)2517_mm_setzero_si128 (),2518(__mmask8) __U);2519}25202521static __inline__ __m128i __DEFAULT_FN_ATTRS2522_mm256_cvttpd_epu32 (__m256d __A) {2523return (__m128i) __builtin_ia32_cvttpd2udq256_mask ((__v4df) __A,2524(__v4si)2525_mm_setzero_si128 (),2526(__mmask8) -1);2527}25282529static __inline__ __m128i __DEFAULT_FN_ATTRS2530_mm256_mask_cvttpd_epu32 (__m128i __W, __mmask8 __U, __m256d __A) {2531return (__m128i) __builtin_ia32_cvttpd2udq256_mask ((__v4df) __A,2532(__v4si) __W,2533(__mmask8) __U);2534}25352536static __inline__ __m128i __DEFAULT_FN_ATTRS2537_mm256_maskz_cvttpd_epu32 (__mmask8 __U, __m256d __A) {2538return (__m128i) __builtin_ia32_cvttpd2udq256_mask ((__v4df) __A,2539(__v4si)2540_mm_setzero_si128 (),2541(__mmask8) __U);2542}25432544static __inline__ __m128i __DEFAULT_FN_ATTRS2545_mm_mask_cvttps_epi32 (__m128i __W, __mmask8 __U, __m128 __A) {2546return (__m128i) __builtin_ia32_cvttps2dq128_mask ((__v4sf) __A,2547(__v4si) __W,2548(__mmask8) __U);2549}25502551static __inline__ __m128i __DEFAULT_FN_ATTRS2552_mm_maskz_cvttps_epi32 (__mmask8 __U, __m128 __A) {2553return (__m128i) __builtin_ia32_cvttps2dq128_mask ((__v4sf) __A,2554(__v4si)2555_mm_setzero_si128 (),2556(__mmask8) __U);2557}25582559static __inline__ __m256i __DEFAULT_FN_ATTRS2560_mm256_mask_cvttps_epi32 (__m256i __W, __mmask8 __U, __m256 __A) {2561return (__m256i) __builtin_ia32_cvttps2dq256_mask ((__v8sf) __A,2562(__v8si) __W,2563(__mmask8) __U);2564}25652566static __inline__ __m256i __DEFAULT_FN_ATTRS2567_mm256_maskz_cvttps_epi32 (__mmask8 __U, __m256 __A) {2568return (__m256i) __builtin_ia32_cvttps2dq256_mask ((__v8sf) __A,2569(__v8si)2570_mm256_setzero_si256 (),2571(__mmask8) __U);2572}25732574static __inline__ __m128i __DEFAULT_FN_ATTRS2575_mm_cvttps_epu32 (__m128 __A) {2576return (__m128i) __builtin_ia32_cvttps2udq128_mask ((__v4sf) __A,2577(__v4si)2578_mm_setzero_si128 (),2579(__mmask8) -1);2580}25812582static __inline__ __m128i __DEFAULT_FN_ATTRS2583_mm_mask_cvttps_epu32 (__m128i __W, __mmask8 __U, __m128 __A) {2584return (__m128i) __builtin_ia32_cvttps2udq128_mask ((__v4sf) __A,2585(__v4si) __W,2586(__mmask8) __U);2587}25882589static __inline__ __m128i __DEFAULT_FN_ATTRS2590_mm_maskz_cvttps_epu32 (__mmask8 __U, __m128 __A) {2591return (__m128i) __builtin_ia32_cvttps2udq128_mask ((__v4sf) __A,2592(__v4si)2593_mm_setzero_si128 (),2594(__mmask8) __U);2595}25962597static __inline__ __m256i __DEFAULT_FN_ATTRS2598_mm256_cvttps_epu32 (__m256 __A) {2599return (__m256i) __builtin_ia32_cvttps2udq256_mask ((__v8sf) __A,2600(__v8si)2601_mm256_setzero_si256 (),2602(__mmask8) -1);2603}26042605static __inline__ __m256i __DEFAULT_FN_ATTRS2606_mm256_mask_cvttps_epu32 (__m256i __W, __mmask8 __U, __m256 __A) {2607return (__m256i) __builtin_ia32_cvttps2udq256_mask ((__v8sf) __A,2608(__v8si) __W,2609(__mmask8) __U);2610}26112612static __inline__ __m256i __DEFAULT_FN_ATTRS2613_mm256_maskz_cvttps_epu32 (__mmask8 __U, __m256 __A) {2614return (__m256i) __builtin_ia32_cvttps2udq256_mask ((__v8sf) __A,2615(__v8si)2616_mm256_setzero_si256 (),2617(__mmask8) __U);2618}26192620static __inline__ __m128d __DEFAULT_FN_ATTRS2621_mm_cvtepu32_pd (__m128i __A) {2622return (__m128d) __builtin_ia32_cvtudq2pd128_mask ((__v4si) __A,2623(__v2df)2624_mm_setzero_pd (),2625(__mmask8) -1);2626}26272628static __inline__ __m128d __DEFAULT_FN_ATTRS2629_mm_mask_cvtepu32_pd (__m128d __W, __mmask8 __U, __m128i __A) {2630return (__m128d) __builtin_ia32_cvtudq2pd128_mask ((__v4si) __A,2631(__v2df) __W,2632(__mmask8) __U);2633}26342635static __inline__ __m128d __DEFAULT_FN_ATTRS2636_mm_maskz_cvtepu32_pd (__mmask8 __U, __m128i __A) {2637return (__m128d) __builtin_ia32_cvtudq2pd128_mask ((__v4si) __A,2638(__v2df)2639_mm_setzero_pd (),2640(__mmask8) __U);2641}26422643static __inline__ __m256d __DEFAULT_FN_ATTRS2644_mm256_cvtepu32_pd (__m128i __A) {2645return (__m256d) __builtin_ia32_cvtudq2pd256_mask ((__v4si) __A,2646(__v4df)2647_mm256_setzero_pd (),2648(__mmask8) -1);2649}26502651static __inline__ __m256d __DEFAULT_FN_ATTRS2652_mm256_mask_cvtepu32_pd (__m256d __W, __mmask8 __U, __m128i __A) {2653return (__m256d) __builtin_ia32_cvtudq2pd256_mask ((__v4si) __A,2654(__v4df) __W,2655(__mmask8) __U);2656}26572658static __inline__ __m256d __DEFAULT_FN_ATTRS2659_mm256_maskz_cvtepu32_pd (__mmask8 __U, __m128i __A) {2660return (__m256d) __builtin_ia32_cvtudq2pd256_mask ((__v4si) __A,2661(__v4df)2662_mm256_setzero_pd (),2663(__mmask8) __U);2664}26652666static __inline__ __m128 __DEFAULT_FN_ATTRS2667_mm_cvtepu32_ps (__m128i __A) {2668return (__m128) __builtin_ia32_cvtudq2ps128_mask ((__v4si) __A,2669(__v4sf)2670_mm_setzero_ps (),2671(__mmask8) -1);2672}26732674static __inline__ __m128 __DEFAULT_FN_ATTRS2675_mm_mask_cvtepu32_ps (__m128 __W, __mmask8 __U, __m128i __A) {2676return (__m128) __builtin_ia32_cvtudq2ps128_mask ((__v4si) __A,2677(__v4sf) __W,2678(__mmask8) __U);2679}26802681static __inline__ __m128 __DEFAULT_FN_ATTRS2682_mm_maskz_cvtepu32_ps (__mmask8 __U, __m128i __A) {2683return (__m128) __builtin_ia32_cvtudq2ps128_mask ((__v4si) __A,2684(__v4sf)2685_mm_setzero_ps (),2686(__mmask8) __U);2687}26882689static __inline__ __m256 __DEFAULT_FN_ATTRS2690_mm256_cvtepu32_ps (__m256i __A) {2691return (__m256) __builtin_ia32_cvtudq2ps256_mask ((__v8si) __A,2692(__v8sf)2693_mm256_setzero_ps (),2694(__mmask8) -1);2695}26962697static __inline__ __m256 __DEFAULT_FN_ATTRS2698_mm256_mask_cvtepu32_ps (__m256 __W, __mmask8 __U, __m256i __A) {2699return (__m256) __builtin_ia32_cvtudq2ps256_mask ((__v8si) __A,2700(__v8sf) __W,2701(__mmask8) __U);2702}27032704static __inline__ __m256 __DEFAULT_FN_ATTRS2705_mm256_maskz_cvtepu32_ps (__mmask8 __U, __m256i __A) {2706return (__m256) __builtin_ia32_cvtudq2ps256_mask ((__v8si) __A,2707(__v8sf)2708_mm256_setzero_ps (),2709(__mmask8) __U);2710}27112712static __inline__ __m128d __DEFAULT_FN_ATTRS2713_mm_mask_div_pd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B) {2714return (__m128d) __builtin_ia32_divpd_mask ((__v2df) __A,2715(__v2df) __B,2716(__v2df) __W,2717(__mmask8) __U);2718}27192720static __inline__ __m128d __DEFAULT_FN_ATTRS2721_mm_maskz_div_pd (__mmask8 __U, __m128d __A, __m128d __B) {2722return (__m128d) __builtin_ia32_divpd_mask ((__v2df) __A,2723(__v2df) __B,2724(__v2df)2725_mm_setzero_pd (),2726(__mmask8) __U);2727}27282729static __inline__ __m256d __DEFAULT_FN_ATTRS2730_mm256_mask_div_pd (__m256d __W, __mmask8 __U, __m256d __A,2731__m256d __B) {2732return (__m256d) __builtin_ia32_divpd256_mask ((__v4df) __A,2733(__v4df) __B,2734(__v4df) __W,2735(__mmask8) __U);2736}27372738static __inline__ __m256d __DEFAULT_FN_ATTRS2739_mm256_maskz_div_pd (__mmask8 __U, __m256d __A, __m256d __B) {2740return (__m256d) __builtin_ia32_divpd256_mask ((__v4df) __A,2741(__v4df) __B,2742(__v4df)2743_mm256_setzero_pd (),2744(__mmask8) __U);2745}27462747static __inline__ __m128 __DEFAULT_FN_ATTRS2748_mm_mask_div_ps (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B) {2749return (__m128) __builtin_ia32_divps_mask ((__v4sf) __A,2750(__v4sf) __B,2751(__v4sf) __W,2752(__mmask8) __U);2753}27542755static __inline__ __m128 __DEFAULT_FN_ATTRS2756_mm_maskz_div_ps (__mmask8 __U, __m128 __A, __m128 __B) {2757return (__m128) __builtin_ia32_divps_mask ((__v4sf) __A,2758(__v4sf) __B,2759(__v4sf)2760_mm_setzero_ps (),2761(__mmask8) __U);2762}27632764static __inline__ __m256 __DEFAULT_FN_ATTRS2765_mm256_mask_div_ps (__m256 __W, __mmask8 __U, __m256 __A, __m256 __B) {2766return (__m256) __builtin_ia32_divps256_mask ((__v8sf) __A,2767(__v8sf) __B,2768(__v8sf) __W,2769(__mmask8) __U);2770}27712772static __inline__ __m256 __DEFAULT_FN_ATTRS2773_mm256_maskz_div_ps (__mmask8 __U, __m256 __A, __m256 __B) {2774return (__m256) __builtin_ia32_divps256_mask ((__v8sf) __A,2775(__v8sf) __B,2776(__v8sf)2777_mm256_setzero_ps (),2778(__mmask8) __U);2779}27802781static __inline__ __m128d __DEFAULT_FN_ATTRS2782_mm_mask_expand_pd (__m128d __W, __mmask8 __U, __m128d __A) {2783return (__m128d) __builtin_ia32_expanddf128_mask ((__v2df) __A,2784(__v2df) __W,2785(__mmask8) __U);2786}27872788static __inline__ __m128d __DEFAULT_FN_ATTRS2789_mm_maskz_expand_pd (__mmask8 __U, __m128d __A) {2790return (__m128d) __builtin_ia32_expanddf128_mask ((__v2df) __A,2791(__v2df)2792_mm_setzero_pd (),2793(__mmask8) __U);2794}27952796static __inline__ __m256d __DEFAULT_FN_ATTRS2797_mm256_mask_expand_pd (__m256d __W, __mmask8 __U, __m256d __A) {2798return (__m256d) __builtin_ia32_expanddf256_mask ((__v4df) __A,2799(__v4df) __W,2800(__mmask8) __U);2801}28022803static __inline__ __m256d __DEFAULT_FN_ATTRS2804_mm256_maskz_expand_pd (__mmask8 __U, __m256d __A) {2805return (__m256d) __builtin_ia32_expanddf256_mask ((__v4df) __A,2806(__v4df)2807_mm256_setzero_pd (),2808(__mmask8) __U);2809}28102811static __inline__ __m128i __DEFAULT_FN_ATTRS2812_mm_mask_expand_epi64 (__m128i __W, __mmask8 __U, __m128i __A) {2813return (__m128i) __builtin_ia32_expanddi128_mask ((__v2di) __A,2814(__v2di) __W,2815(__mmask8) __U);2816}28172818static __inline__ __m128i __DEFAULT_FN_ATTRS2819_mm_maskz_expand_epi64 (__mmask8 __U, __m128i __A) {2820return (__m128i) __builtin_ia32_expanddi128_mask ((__v2di) __A,2821(__v2di)2822_mm_setzero_si128 (),2823(__mmask8) __U);2824}28252826static __inline__ __m256i __DEFAULT_FN_ATTRS2827_mm256_mask_expand_epi64 (__m256i __W, __mmask8 __U, __m256i __A) {2828return (__m256i) __builtin_ia32_expanddi256_mask ((__v4di) __A,2829(__v4di) __W,2830(__mmask8) __U);2831}28322833static __inline__ __m256i __DEFAULT_FN_ATTRS2834_mm256_maskz_expand_epi64 (__mmask8 __U, __m256i __A) {2835return (__m256i) __builtin_ia32_expanddi256_mask ((__v4di) __A,2836(__v4di)2837_mm256_setzero_si256 (),2838(__mmask8) __U);2839}28402841static __inline__ __m128d __DEFAULT_FN_ATTRS2842_mm_mask_expandloadu_pd (__m128d __W, __mmask8 __U, void const *__P) {2843return (__m128d) __builtin_ia32_expandloaddf128_mask ((__v2df *) __P,2844(__v2df) __W,2845(__mmask8)2846__U);2847}28482849static __inline__ __m128d __DEFAULT_FN_ATTRS2850_mm_maskz_expandloadu_pd (__mmask8 __U, void const *__P) {2851return (__m128d) __builtin_ia32_expandloaddf128_mask ((__v2df *) __P,2852(__v2df)2853_mm_setzero_pd (),2854(__mmask8)2855__U);2856}28572858static __inline__ __m256d __DEFAULT_FN_ATTRS2859_mm256_mask_expandloadu_pd (__m256d __W, __mmask8 __U, void const *__P) {2860return (__m256d) __builtin_ia32_expandloaddf256_mask ((__v4df *) __P,2861(__v4df) __W,2862(__mmask8)2863__U);2864}28652866static __inline__ __m256d __DEFAULT_FN_ATTRS2867_mm256_maskz_expandloadu_pd (__mmask8 __U, void const *__P) {2868return (__m256d) __builtin_ia32_expandloaddf256_mask ((__v4df *) __P,2869(__v4df)2870_mm256_setzero_pd (),2871(__mmask8)2872__U);2873}28742875static __inline__ __m128i __DEFAULT_FN_ATTRS2876_mm_mask_expandloadu_epi64 (__m128i __W, __mmask8 __U, void const *__P) {2877return (__m128i) __builtin_ia32_expandloaddi128_mask ((__v2di *) __P,2878(__v2di) __W,2879(__mmask8)2880__U);2881}28822883static __inline__ __m128i __DEFAULT_FN_ATTRS2884_mm_maskz_expandloadu_epi64 (__mmask8 __U, void const *__P) {2885return (__m128i) __builtin_ia32_expandloaddi128_mask ((__v2di *) __P,2886(__v2di)2887_mm_setzero_si128 (),2888(__mmask8)2889__U);2890}28912892static __inline__ __m256i __DEFAULT_FN_ATTRS2893_mm256_mask_expandloadu_epi64 (__m256i __W, __mmask8 __U,2894void const *__P) {2895return (__m256i) __builtin_ia32_expandloaddi256_mask ((__v4di *) __P,2896(__v4di) __W,2897(__mmask8)2898__U);2899}29002901static __inline__ __m256i __DEFAULT_FN_ATTRS2902_mm256_maskz_expandloadu_epi64 (__mmask8 __U, void const *__P) {2903return (__m256i) __builtin_ia32_expandloaddi256_mask ((__v4di *) __P,2904(__v4di)2905_mm256_setzero_si256 (),2906(__mmask8)2907__U);2908}29092910static __inline__ __m128 __DEFAULT_FN_ATTRS2911_mm_mask_expandloadu_ps (__m128 __W, __mmask8 __U, void const *__P) {2912return (__m128) __builtin_ia32_expandloadsf128_mask ((__v4sf *) __P,2913(__v4sf) __W,2914(__mmask8) __U);2915}29162917static __inline__ __m128 __DEFAULT_FN_ATTRS2918_mm_maskz_expandloadu_ps (__mmask8 __U, void const *__P) {2919return (__m128) __builtin_ia32_expandloadsf128_mask ((__v4sf *) __P,2920(__v4sf)2921_mm_setzero_ps (),2922(__mmask8)2923__U);2924}29252926static __inline__ __m256 __DEFAULT_FN_ATTRS2927_mm256_mask_expandloadu_ps (__m256 __W, __mmask8 __U, void const *__P) {2928return (__m256) __builtin_ia32_expandloadsf256_mask ((__v8sf *) __P,2929(__v8sf) __W,2930(__mmask8) __U);2931}29322933static __inline__ __m256 __DEFAULT_FN_ATTRS2934_mm256_maskz_expandloadu_ps (__mmask8 __U, void const *__P) {2935return (__m256) __builtin_ia32_expandloadsf256_mask ((__v8sf *) __P,2936(__v8sf)2937_mm256_setzero_ps (),2938(__mmask8)2939__U);2940}29412942static __inline__ __m128i __DEFAULT_FN_ATTRS2943_mm_mask_expandloadu_epi32 (__m128i __W, __mmask8 __U, void const *__P) {2944return (__m128i) __builtin_ia32_expandloadsi128_mask ((__v4si *) __P,2945(__v4si) __W,2946(__mmask8)2947__U);2948}29492950static __inline__ __m128i __DEFAULT_FN_ATTRS2951_mm_maskz_expandloadu_epi32 (__mmask8 __U, void const *__P) {2952return (__m128i) __builtin_ia32_expandloadsi128_mask ((__v4si *) __P,2953(__v4si)2954_mm_setzero_si128 (),2955(__mmask8) __U);2956}29572958static __inline__ __m256i __DEFAULT_FN_ATTRS2959_mm256_mask_expandloadu_epi32 (__m256i __W, __mmask8 __U,2960void const *__P) {2961return (__m256i) __builtin_ia32_expandloadsi256_mask ((__v8si *) __P,2962(__v8si) __W,2963(__mmask8)2964__U);2965}29662967static __inline__ __m256i __DEFAULT_FN_ATTRS2968_mm256_maskz_expandloadu_epi32 (__mmask8 __U, void const *__P) {2969return (__m256i) __builtin_ia32_expandloadsi256_mask ((__v8si *) __P,2970(__v8si)2971_mm256_setzero_si256 (),2972(__mmask8)2973__U);2974}29752976static __inline__ __m128 __DEFAULT_FN_ATTRS2977_mm_mask_expand_ps (__m128 __W, __mmask8 __U, __m128 __A) {2978return (__m128) __builtin_ia32_expandsf128_mask ((__v4sf) __A,2979(__v4sf) __W,2980(__mmask8) __U);2981}29822983static __inline__ __m128 __DEFAULT_FN_ATTRS2984_mm_maskz_expand_ps (__mmask8 __U, __m128 __A) {2985return (__m128) __builtin_ia32_expandsf128_mask ((__v4sf) __A,2986(__v4sf)2987_mm_setzero_ps (),2988(__mmask8) __U);2989}29902991static __inline__ __m256 __DEFAULT_FN_ATTRS2992_mm256_mask_expand_ps (__m256 __W, __mmask8 __U, __m256 __A) {2993return (__m256) __builtin_ia32_expandsf256_mask ((__v8sf) __A,2994(__v8sf) __W,2995(__mmask8) __U);2996}29972998static __inline__ __m256 __DEFAULT_FN_ATTRS2999_mm256_maskz_expand_ps (__mmask8 __U, __m256 __A) {3000return (__m256) __builtin_ia32_expandsf256_mask ((__v8sf) __A,3001(__v8sf)3002_mm256_setzero_ps (),3003(__mmask8) __U);3004}30053006static __inline__ __m128i __DEFAULT_FN_ATTRS3007_mm_mask_expand_epi32 (__m128i __W, __mmask8 __U, __m128i __A) {3008return (__m128i) __builtin_ia32_expandsi128_mask ((__v4si) __A,3009(__v4si) __W,3010(__mmask8) __U);3011}30123013static __inline__ __m128i __DEFAULT_FN_ATTRS3014_mm_maskz_expand_epi32 (__mmask8 __U, __m128i __A) {3015return (__m128i) __builtin_ia32_expandsi128_mask ((__v4si) __A,3016(__v4si)3017_mm_setzero_si128 (),3018(__mmask8) __U);3019}30203021static __inline__ __m256i __DEFAULT_FN_ATTRS3022_mm256_mask_expand_epi32 (__m256i __W, __mmask8 __U, __m256i __A) {3023return (__m256i) __builtin_ia32_expandsi256_mask ((__v8si) __A,3024(__v8si) __W,3025(__mmask8) __U);3026}30273028static __inline__ __m256i __DEFAULT_FN_ATTRS3029_mm256_maskz_expand_epi32 (__mmask8 __U, __m256i __A) {3030return (__m256i) __builtin_ia32_expandsi256_mask ((__v8si) __A,3031(__v8si)3032_mm256_setzero_si256 (),3033(__mmask8) __U);3034}30353036static __inline__ __m128d __DEFAULT_FN_ATTRS3037_mm_getexp_pd (__m128d __A) {3038return (__m128d) __builtin_ia32_getexppd128_mask ((__v2df) __A,3039(__v2df)3040_mm_setzero_pd (),3041(__mmask8) -1);3042}30433044static __inline__ __m128d __DEFAULT_FN_ATTRS3045_mm_mask_getexp_pd (__m128d __W, __mmask8 __U, __m128d __A) {3046return (__m128d) __builtin_ia32_getexppd128_mask ((__v2df) __A,3047(__v2df) __W,3048(__mmask8) __U);3049}30503051static __inline__ __m128d __DEFAULT_FN_ATTRS3052_mm_maskz_getexp_pd (__mmask8 __U, __m128d __A) {3053return (__m128d) __builtin_ia32_getexppd128_mask ((__v2df) __A,3054(__v2df)3055_mm_setzero_pd (),3056(__mmask8) __U);3057}30583059static __inline__ __m256d __DEFAULT_FN_ATTRS3060_mm256_getexp_pd (__m256d __A) {3061return (__m256d) __builtin_ia32_getexppd256_mask ((__v4df) __A,3062(__v4df)3063_mm256_setzero_pd (),3064(__mmask8) -1);3065}30663067static __inline__ __m256d __DEFAULT_FN_ATTRS3068_mm256_mask_getexp_pd (__m256d __W, __mmask8 __U, __m256d __A) {3069return (__m256d) __builtin_ia32_getexppd256_mask ((__v4df) __A,3070(__v4df) __W,3071(__mmask8) __U);3072}30733074static __inline__ __m256d __DEFAULT_FN_ATTRS3075_mm256_maskz_getexp_pd (__mmask8 __U, __m256d __A) {3076return (__m256d) __builtin_ia32_getexppd256_mask ((__v4df) __A,3077(__v4df)3078_mm256_setzero_pd (),3079(__mmask8) __U);3080}30813082static __inline__ __m128 __DEFAULT_FN_ATTRS3083_mm_getexp_ps (__m128 __A) {3084return (__m128) __builtin_ia32_getexpps128_mask ((__v4sf) __A,3085(__v4sf)3086_mm_setzero_ps (),3087(__mmask8) -1);3088}30893090static __inline__ __m128 __DEFAULT_FN_ATTRS3091_mm_mask_getexp_ps (__m128 __W, __mmask8 __U, __m128 __A) {3092return (__m128) __builtin_ia32_getexpps128_mask ((__v4sf) __A,3093(__v4sf) __W,3094(__mmask8) __U);3095}30963097static __inline__ __m128 __DEFAULT_FN_ATTRS3098_mm_maskz_getexp_ps (__mmask8 __U, __m128 __A) {3099return (__m128) __builtin_ia32_getexpps128_mask ((__v4sf) __A,3100(__v4sf)3101_mm_setzero_ps (),3102(__mmask8) __U);3103}31043105static __inline__ __m256 __DEFAULT_FN_ATTRS3106_mm256_getexp_ps (__m256 __A) {3107return (__m256) __builtin_ia32_getexpps256_mask ((__v8sf) __A,3108(__v8sf)3109_mm256_setzero_ps (),3110(__mmask8) -1);3111}31123113static __inline__ __m256 __DEFAULT_FN_ATTRS3114_mm256_mask_getexp_ps (__m256 __W, __mmask8 __U, __m256 __A) {3115return (__m256) __builtin_ia32_getexpps256_mask ((__v8sf) __A,3116(__v8sf) __W,3117(__mmask8) __U);3118}31193120static __inline__ __m256 __DEFAULT_FN_ATTRS3121_mm256_maskz_getexp_ps (__mmask8 __U, __m256 __A) {3122return (__m256) __builtin_ia32_getexpps256_mask ((__v8sf) __A,3123(__v8sf)3124_mm256_setzero_ps (),3125(__mmask8) __U);3126}31273128static __inline__ __m128d __DEFAULT_FN_ATTRS3129_mm_mask_max_pd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B) {3130return (__m128d) __builtin_ia32_maxpd_mask ((__v2df) __A,3131(__v2df) __B,3132(__v2df) __W,3133(__mmask8) __U);3134}31353136static __inline__ __m128d __DEFAULT_FN_ATTRS3137_mm_maskz_max_pd (__mmask8 __U, __m128d __A, __m128d __B) {3138return (__m128d) __builtin_ia32_maxpd_mask ((__v2df) __A,3139(__v2df) __B,3140(__v2df)3141_mm_setzero_pd (),3142(__mmask8) __U);3143}31443145static __inline__ __m256d __DEFAULT_FN_ATTRS3146_mm256_mask_max_pd (__m256d __W, __mmask8 __U, __m256d __A,3147__m256d __B) {3148return (__m256d) __builtin_ia32_maxpd256_mask ((__v4df) __A,3149(__v4df) __B,3150(__v4df) __W,3151(__mmask8) __U);3152}31533154static __inline__ __m256d __DEFAULT_FN_ATTRS3155_mm256_maskz_max_pd (__mmask8 __U, __m256d __A, __m256d __B) {3156return (__m256d) __builtin_ia32_maxpd256_mask ((__v4df) __A,3157(__v4df) __B,3158(__v4df)3159_mm256_setzero_pd (),3160(__mmask8) __U);3161}31623163static __inline__ __m128 __DEFAULT_FN_ATTRS3164_mm_mask_max_ps (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B) {3165return (__m128) __builtin_ia32_maxps_mask ((__v4sf) __A,3166(__v4sf) __B,3167(__v4sf) __W,3168(__mmask8) __U);3169}31703171static __inline__ __m128 __DEFAULT_FN_ATTRS3172_mm_maskz_max_ps (__mmask8 __U, __m128 __A, __m128 __B) {3173return (__m128) __builtin_ia32_maxps_mask ((__v4sf) __A,3174(__v4sf) __B,3175(__v4sf)3176_mm_setzero_ps (),3177(__mmask8) __U);3178}31793180static __inline__ __m256 __DEFAULT_FN_ATTRS3181_mm256_mask_max_ps (__m256 __W, __mmask8 __U, __m256 __A, __m256 __B) {3182return (__m256) __builtin_ia32_maxps256_mask ((__v8sf) __A,3183(__v8sf) __B,3184(__v8sf) __W,3185(__mmask8) __U);3186}31873188static __inline__ __m256 __DEFAULT_FN_ATTRS3189_mm256_maskz_max_ps (__mmask8 __U, __m256 __A, __m256 __B) {3190return (__m256) __builtin_ia32_maxps256_mask ((__v8sf) __A,3191(__v8sf) __B,3192(__v8sf)3193_mm256_setzero_ps (),3194(__mmask8) __U);3195}31963197static __inline__ __m128d __DEFAULT_FN_ATTRS3198_mm_mask_min_pd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B) {3199return (__m128d) __builtin_ia32_minpd_mask ((__v2df) __A,3200(__v2df) __B,3201(__v2df) __W,3202(__mmask8) __U);3203}32043205static __inline__ __m128d __DEFAULT_FN_ATTRS3206_mm_maskz_min_pd (__mmask8 __U, __m128d __A, __m128d __B) {3207return (__m128d) __builtin_ia32_minpd_mask ((__v2df) __A,3208(__v2df) __B,3209(__v2df)3210_mm_setzero_pd (),3211(__mmask8) __U);3212}32133214static __inline__ __m256d __DEFAULT_FN_ATTRS3215_mm256_mask_min_pd (__m256d __W, __mmask8 __U, __m256d __A,3216__m256d __B) {3217return (__m256d) __builtin_ia32_minpd256_mask ((__v4df) __A,3218(__v4df) __B,3219(__v4df) __W,3220(__mmask8) __U);3221}32223223static __inline__ __m256d __DEFAULT_FN_ATTRS3224_mm256_maskz_min_pd (__mmask8 __U, __m256d __A, __m256d __B) {3225return (__m256d) __builtin_ia32_minpd256_mask ((__v4df) __A,3226(__v4df) __B,3227(__v4df)3228_mm256_setzero_pd (),3229(__mmask8) __U);3230}32313232static __inline__ __m128 __DEFAULT_FN_ATTRS3233_mm_mask_min_ps (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B) {3234return (__m128) __builtin_ia32_minps_mask ((__v4sf) __A,3235(__v4sf) __B,3236(__v4sf) __W,3237(__mmask8) __U);3238}32393240static __inline__ __m128 __DEFAULT_FN_ATTRS3241_mm_maskz_min_ps (__mmask8 __U, __m128 __A, __m128 __B) {3242return (__m128) __builtin_ia32_minps_mask ((__v4sf) __A,3243(__v4sf) __B,3244(__v4sf)3245_mm_setzero_ps (),3246(__mmask8) __U);3247}32483249static __inline__ __m256 __DEFAULT_FN_ATTRS3250_mm256_mask_min_ps (__m256 __W, __mmask8 __U, __m256 __A, __m256 __B) {3251return (__m256) __builtin_ia32_minps256_mask ((__v8sf) __A,3252(__v8sf) __B,3253(__v8sf) __W,3254(__mmask8) __U);3255}32563257static __inline__ __m256 __DEFAULT_FN_ATTRS3258_mm256_maskz_min_ps (__mmask8 __U, __m256 __A, __m256 __B) {3259return (__m256) __builtin_ia32_minps256_mask ((__v8sf) __A,3260(__v8sf) __B,3261(__v8sf)3262_mm256_setzero_ps (),3263(__mmask8) __U);3264}32653266static __inline__ __m128d __DEFAULT_FN_ATTRS3267_mm_mask_mul_pd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B) {3268return (__m128d) __builtin_ia32_mulpd_mask ((__v2df) __A,3269(__v2df) __B,3270(__v2df) __W,3271(__mmask8) __U);3272}32733274static __inline__ __m128d __DEFAULT_FN_ATTRS3275_mm_maskz_mul_pd (__mmask8 __U, __m128d __A, __m128d __B) {3276return (__m128d) __builtin_ia32_mulpd_mask ((__v2df) __A,3277(__v2df) __B,3278(__v2df)3279_mm_setzero_pd (),3280(__mmask8) __U);3281}32823283static __inline__ __m256d __DEFAULT_FN_ATTRS3284_mm256_mask_mul_pd (__m256d __W, __mmask8 __U, __m256d __A,3285__m256d __B) {3286return (__m256d) __builtin_ia32_mulpd256_mask ((__v4df) __A,3287(__v4df) __B,3288(__v4df) __W,3289(__mmask8) __U);3290}32913292static __inline__ __m256d __DEFAULT_FN_ATTRS3293_mm256_maskz_mul_pd (__mmask8 __U, __m256d __A, __m256d __B) {3294return (__m256d) __builtin_ia32_mulpd256_mask ((__v4df) __A,3295(__v4df) __B,3296(__v4df)3297_mm256_setzero_pd (),3298(__mmask8) __U);3299}33003301static __inline__ __m128 __DEFAULT_FN_ATTRS3302_mm_mask_mul_ps (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B) {3303return (__m128) __builtin_ia32_mulps_mask ((__v4sf) __A,3304(__v4sf) __B,3305(__v4sf) __W,3306(__mmask8) __U);3307}33083309static __inline__ __m128 __DEFAULT_FN_ATTRS3310_mm_maskz_mul_ps (__mmask8 __U, __m128 __A, __m128 __B) {3311return (__m128) __builtin_ia32_mulps_mask ((__v4sf) __A,3312(__v4sf) __B,3313(__v4sf)3314_mm_setzero_ps (),3315(__mmask8) __U);3316}33173318static __inline__ __m256 __DEFAULT_FN_ATTRS3319_mm256_mask_mul_ps (__m256 __W, __mmask8 __U, __m256 __A, __m256 __B) {3320return (__m256) __builtin_ia32_mulps256_mask ((__v8sf) __A,3321(__v8sf) __B,3322(__v8sf) __W,3323(__mmask8) __U);3324}33253326static __inline__ __m256 __DEFAULT_FN_ATTRS3327_mm256_maskz_mul_ps (__mmask8 __U, __m256 __A, __m256 __B) {3328return (__m256) __builtin_ia32_mulps256_mask ((__v8sf) __A,3329(__v8sf) __B,3330(__v8sf)3331_mm256_setzero_ps (),3332(__mmask8) __U);3333}33343335static __inline__ __m128i __DEFAULT_FN_ATTRS3336_mm_mask_abs_epi32 (__m128i __W, __mmask8 __U, __m128i __A) {3337return (__m128i) __builtin_ia32_pabsd128_mask ((__v4si) __A,3338(__v4si) __W,3339(__mmask8) __U);3340}33413342static __inline__ __m128i __DEFAULT_FN_ATTRS3343_mm_maskz_abs_epi32 (__mmask8 __U, __m128i __A) {3344return (__m128i) __builtin_ia32_pabsd128_mask ((__v4si) __A,3345(__v4si)3346_mm_setzero_si128 (),3347(__mmask8) __U);3348}33493350static __inline__ __m256i __DEFAULT_FN_ATTRS3351_mm256_mask_abs_epi32 (__m256i __W, __mmask8 __U, __m256i __A) {3352return (__m256i) __builtin_ia32_pabsd256_mask ((__v8si) __A,3353(__v8si) __W,3354(__mmask8) __U);3355}33563357static __inline__ __m256i __DEFAULT_FN_ATTRS3358_mm256_maskz_abs_epi32 (__mmask8 __U, __m256i __A) {3359return (__m256i) __builtin_ia32_pabsd256_mask ((__v8si) __A,3360(__v8si)3361_mm256_setzero_si256 (),3362(__mmask8) __U);3363}33643365static __inline__ __m128i __DEFAULT_FN_ATTRS3366_mm_abs_epi64 (__m128i __A) {3367return (__m128i) __builtin_ia32_pabsq128_mask ((__v2di) __A,3368(__v2di)3369_mm_setzero_si128 (),3370(__mmask8) -1);3371}33723373static __inline__ __m128i __DEFAULT_FN_ATTRS3374_mm_mask_abs_epi64 (__m128i __W, __mmask8 __U, __m128i __A) {3375return (__m128i) __builtin_ia32_pabsq128_mask ((__v2di) __A,3376(__v2di) __W,3377(__mmask8) __U);3378}33793380static __inline__ __m128i __DEFAULT_FN_ATTRS3381_mm_maskz_abs_epi64 (__mmask8 __U, __m128i __A) {3382return (__m128i) __builtin_ia32_pabsq128_mask ((__v2di) __A,3383(__v2di)3384_mm_setzero_si128 (),3385(__mmask8) __U);3386}33873388static __inline__ __m256i __DEFAULT_FN_ATTRS3389_mm256_abs_epi64 (__m256i __A) {3390return (__m256i) __builtin_ia32_pabsq256_mask ((__v4di) __A,3391(__v4di)3392_mm256_setzero_si256 (),3393(__mmask8) -1);3394}33953396static __inline__ __m256i __DEFAULT_FN_ATTRS3397_mm256_mask_abs_epi64 (__m256i __W, __mmask8 __U, __m256i __A) {3398return (__m256i) __builtin_ia32_pabsq256_mask ((__v4di) __A,3399(__v4di) __W,3400(__mmask8) __U);3401}34023403static __inline__ __m256i __DEFAULT_FN_ATTRS3404_mm256_maskz_abs_epi64 (__mmask8 __U, __m256i __A) {3405return (__m256i) __builtin_ia32_pabsq256_mask ((__v4di) __A,3406(__v4di)3407_mm256_setzero_si256 (),3408(__mmask8) __U);3409}34103411static __inline__ __m128i __DEFAULT_FN_ATTRS3412_mm_maskz_max_epi32 (__mmask8 __M, __m128i __A, __m128i __B) {3413return (__m128i) __builtin_ia32_pmaxsd128_mask ((__v4si) __A,3414(__v4si) __B,3415(__v4si)3416_mm_setzero_si128 (),3417__M);3418}34193420static __inline__ __m128i __DEFAULT_FN_ATTRS3421_mm_mask_max_epi32 (__m128i __W, __mmask8 __M, __m128i __A,3422__m128i __B) {3423return (__m128i) __builtin_ia32_pmaxsd128_mask ((__v4si) __A,3424(__v4si) __B,3425(__v4si) __W, __M);3426}34273428static __inline__ __m256i __DEFAULT_FN_ATTRS3429_mm256_maskz_max_epi32 (__mmask8 __M, __m256i __A, __m256i __B) {3430return (__m256i) __builtin_ia32_pmaxsd256_mask ((__v8si) __A,3431(__v8si) __B,3432(__v8si)3433_mm256_setzero_si256 (),3434__M);3435}34363437static __inline__ __m256i __DEFAULT_FN_ATTRS3438_mm256_mask_max_epi32 (__m256i __W, __mmask8 __M, __m256i __A,3439__m256i __B) {3440return (__m256i) __builtin_ia32_pmaxsd256_mask ((__v8si) __A,3441(__v8si) __B,3442(__v8si) __W, __M);3443}34443445static __inline__ __m128i __DEFAULT_FN_ATTRS3446_mm_maskz_max_epi64 (__mmask8 __M, __m128i __A, __m128i __B) {3447return (__m128i) __builtin_ia32_pmaxsq128_mask ((__v2di) __A,3448(__v2di) __B,3449(__v2di)3450_mm_setzero_si128 (),3451__M);3452}34533454static __inline__ __m128i __DEFAULT_FN_ATTRS3455_mm_mask_max_epi64 (__m128i __W, __mmask8 __M, __m128i __A,3456__m128i __B) {3457return (__m128i) __builtin_ia32_pmaxsq128_mask ((__v2di) __A,3458(__v2di) __B,3459(__v2di) __W, __M);3460}34613462static __inline__ __m128i __DEFAULT_FN_ATTRS3463_mm_max_epi64 (__m128i __A, __m128i __B) {3464return (__m128i) __builtin_ia32_pmaxsq128_mask ((__v2di) __A,3465(__v2di) __B,3466(__v2di)3467_mm_setzero_si128 (),3468(__mmask8) -1);3469}34703471static __inline__ __m256i __DEFAULT_FN_ATTRS3472_mm256_maskz_max_epi64 (__mmask8 __M, __m256i __A, __m256i __B) {3473return (__m256i) __builtin_ia32_pmaxsq256_mask ((__v4di) __A,3474(__v4di) __B,3475(__v4di)3476_mm256_setzero_si256 (),3477__M);3478}34793480static __inline__ __m256i __DEFAULT_FN_ATTRS3481_mm256_mask_max_epi64 (__m256i __W, __mmask8 __M, __m256i __A,3482__m256i __B) {3483return (__m256i) __builtin_ia32_pmaxsq256_mask ((__v4di) __A,3484(__v4di) __B,3485(__v4di) __W, __M);3486}34873488static __inline__ __m256i __DEFAULT_FN_ATTRS3489_mm256_max_epi64 (__m256i __A, __m256i __B) {3490return (__m256i) __builtin_ia32_pmaxsq256_mask ((__v4di) __A,3491(__v4di) __B,3492(__v4di)3493_mm256_setzero_si256 (),3494(__mmask8) -1);3495}34963497static __inline__ __m128i __DEFAULT_FN_ATTRS3498_mm_maskz_max_epu32 (__mmask8 __M, __m128i __A, __m128i __B) {3499return (__m128i) __builtin_ia32_pmaxud128_mask ((__v4si) __A,3500(__v4si) __B,3501(__v4si)3502_mm_setzero_si128 (),3503__M);3504}35053506static __inline__ __m128i __DEFAULT_FN_ATTRS3507_mm_mask_max_epu32 (__m128i __W, __mmask8 __M, __m128i __A,3508__m128i __B) {3509return (__m128i) __builtin_ia32_pmaxud128_mask ((__v4si) __A,3510(__v4si) __B,3511(__v4si) __W, __M);3512}35133514static __inline__ __m256i __DEFAULT_FN_ATTRS3515_mm256_maskz_max_epu32 (__mmask8 __M, __m256i __A, __m256i __B) {3516return (__m256i) __builtin_ia32_pmaxud256_mask ((__v8si) __A,3517(__v8si) __B,3518(__v8si)3519_mm256_setzero_si256 (),3520__M);3521}35223523static __inline__ __m256i __DEFAULT_FN_ATTRS3524_mm256_mask_max_epu32 (__m256i __W, __mmask8 __M, __m256i __A,3525__m256i __B) {3526return (__m256i) __builtin_ia32_pmaxud256_mask ((__v8si) __A,3527(__v8si) __B,3528(__v8si) __W, __M);3529}35303531static __inline__ __m128i __DEFAULT_FN_ATTRS3532_mm_maskz_max_epu64 (__mmask8 __M, __m128i __A, __m128i __B) {3533return (__m128i) __builtin_ia32_pmaxuq128_mask ((__v2di) __A,3534(__v2di) __B,3535(__v2di)3536_mm_setzero_si128 (),3537__M);3538}35393540static __inline__ __m128i __DEFAULT_FN_ATTRS3541_mm_max_epu64 (__m128i __A, __m128i __B) {3542return (__m128i) __builtin_ia32_pmaxuq128_mask ((__v2di) __A,3543(__v2di) __B,3544(__v2di)3545_mm_setzero_si128 (),3546(__mmask8) -1);3547}35483549static __inline__ __m128i __DEFAULT_FN_ATTRS3550_mm_mask_max_epu64 (__m128i __W, __mmask8 __M, __m128i __A,3551__m128i __B) {3552return (__m128i) __builtin_ia32_pmaxuq128_mask ((__v2di) __A,3553(__v2di) __B,3554(__v2di) __W, __M);3555}35563557static __inline__ __m256i __DEFAULT_FN_ATTRS3558_mm256_maskz_max_epu64 (__mmask8 __M, __m256i __A, __m256i __B) {3559return (__m256i) __builtin_ia32_pmaxuq256_mask ((__v4di) __A,3560(__v4di) __B,3561(__v4di)3562_mm256_setzero_si256 (),3563__M);3564}35653566static __inline__ __m256i __DEFAULT_FN_ATTRS3567_mm256_max_epu64 (__m256i __A, __m256i __B) {3568return (__m256i) __builtin_ia32_pmaxuq256_mask ((__v4di) __A,3569(__v4di) __B,3570(__v4di)3571_mm256_setzero_si256 (),3572(__mmask8) -1);3573}35743575static __inline__ __m256i __DEFAULT_FN_ATTRS3576_mm256_mask_max_epu64 (__m256i __W, __mmask8 __M, __m256i __A,3577__m256i __B) {3578return (__m256i) __builtin_ia32_pmaxuq256_mask ((__v4di) __A,3579(__v4di) __B,3580(__v4di) __W, __M);3581}35823583static __inline__ __m128i __DEFAULT_FN_ATTRS3584_mm_maskz_min_epi32 (__mmask8 __M, __m128i __A, __m128i __B) {3585return (__m128i) __builtin_ia32_pminsd128_mask ((__v4si) __A,3586(__v4si) __B,3587(__v4si)3588_mm_setzero_si128 (),3589__M);3590}35913592static __inline__ __m128i __DEFAULT_FN_ATTRS3593_mm_mask_min_epi32 (__m128i __W, __mmask8 __M, __m128i __A,3594__m128i __B) {3595return (__m128i) __builtin_ia32_pminsd128_mask ((__v4si) __A,3596(__v4si) __B,3597(__v4si) __W, __M);3598}35993600static __inline__ __m256i __DEFAULT_FN_ATTRS3601_mm256_maskz_min_epi32 (__mmask8 __M, __m256i __A, __m256i __B) {3602return (__m256i) __builtin_ia32_pminsd256_mask ((__v8si) __A,3603(__v8si) __B,3604(__v8si)3605_mm256_setzero_si256 (),3606__M);3607}36083609static __inline__ __m256i __DEFAULT_FN_ATTRS3610_mm256_mask_min_epi32 (__m256i __W, __mmask8 __M, __m256i __A,3611__m256i __B) {3612return (__m256i) __builtin_ia32_pminsd256_mask ((__v8si) __A,3613(__v8si) __B,3614(__v8si) __W, __M);3615}36163617static __inline__ __m128i __DEFAULT_FN_ATTRS3618_mm_min_epi64 (__m128i __A, __m128i __B) {3619return (__m128i) __builtin_ia32_pminsq128_mask ((__v2di) __A,3620(__v2di) __B,3621(__v2di)3622_mm_setzero_si128 (),3623(__mmask8) -1);3624}36253626static __inline__ __m128i __DEFAULT_FN_ATTRS3627_mm_mask_min_epi64 (__m128i __W, __mmask8 __M, __m128i __A,3628__m128i __B) {3629return (__m128i) __builtin_ia32_pminsq128_mask ((__v2di) __A,3630(__v2di) __B,3631(__v2di) __W, __M);3632}36333634static __inline__ __m128i __DEFAULT_FN_ATTRS3635_mm_maskz_min_epi64 (__mmask8 __M, __m128i __A, __m128i __B) {3636return (__m128i) __builtin_ia32_pminsq128_mask ((__v2di) __A,3637(__v2di) __B,3638(__v2di)3639_mm_setzero_si128 (),3640__M);3641}36423643static __inline__ __m256i __DEFAULT_FN_ATTRS3644_mm256_min_epi64 (__m256i __A, __m256i __B) {3645return (__m256i) __builtin_ia32_pminsq256_mask ((__v4di) __A,3646(__v4di) __B,3647(__v4di)3648_mm256_setzero_si256 (),3649(__mmask8) -1);3650}36513652static __inline__ __m256i __DEFAULT_FN_ATTRS3653_mm256_mask_min_epi64 (__m256i __W, __mmask8 __M, __m256i __A,3654__m256i __B) {3655return (__m256i) __builtin_ia32_pminsq256_mask ((__v4di) __A,3656(__v4di) __B,3657(__v4di) __W, __M);3658}36593660static __inline__ __m256i __DEFAULT_FN_ATTRS3661_mm256_maskz_min_epi64 (__mmask8 __M, __m256i __A, __m256i __B) {3662return (__m256i) __builtin_ia32_pminsq256_mask ((__v4di) __A,3663(__v4di) __B,3664(__v4di)3665_mm256_setzero_si256 (),3666__M);3667}36683669static __inline__ __m128i __DEFAULT_FN_ATTRS3670_mm_maskz_min_epu32 (__mmask8 __M, __m128i __A, __m128i __B) {3671return (__m128i) __builtin_ia32_pminud128_mask ((__v4si) __A,3672(__v4si) __B,3673(__v4si)3674_mm_setzero_si128 (),3675__M);3676}36773678static __inline__ __m128i __DEFAULT_FN_ATTRS3679_mm_mask_min_epu32 (__m128i __W, __mmask8 __M, __m128i __A,3680__m128i __B) {3681return (__m128i) __builtin_ia32_pminud128_mask ((__v4si) __A,3682(__v4si) __B,3683(__v4si) __W, __M);3684}36853686static __inline__ __m256i __DEFAULT_FN_ATTRS3687_mm256_maskz_min_epu32 (__mmask8 __M, __m256i __A, __m256i __B) {3688return (__m256i) __builtin_ia32_pminud256_mask ((__v8si) __A,3689(__v8si) __B,3690(__v8si)3691_mm256_setzero_si256 (),3692__M);3693}36943695static __inline__ __m256i __DEFAULT_FN_ATTRS3696_mm256_mask_min_epu32 (__m256i __W, __mmask8 __M, __m256i __A,3697__m256i __B) {3698return (__m256i) __builtin_ia32_pminud256_mask ((__v8si) __A,3699(__v8si) __B,3700(__v8si) __W, __M);3701}37023703static __inline__ __m128i __DEFAULT_FN_ATTRS3704_mm_min_epu64 (__m128i __A, __m128i __B) {3705return (__m128i) __builtin_ia32_pminuq128_mask ((__v2di) __A,3706(__v2di) __B,3707(__v2di)3708_mm_setzero_si128 (),3709(__mmask8) -1);3710}37113712static __inline__ __m128i __DEFAULT_FN_ATTRS3713_mm_mask_min_epu64 (__m128i __W, __mmask8 __M, __m128i __A,3714__m128i __B) {3715return (__m128i) __builtin_ia32_pminuq128_mask ((__v2di) __A,3716(__v2di) __B,3717(__v2di) __W, __M);3718}37193720static __inline__ __m128i __DEFAULT_FN_ATTRS3721_mm_maskz_min_epu64 (__mmask8 __M, __m128i __A, __m128i __B) {3722return (__m128i) __builtin_ia32_pminuq128_mask ((__v2di) __A,3723(__v2di) __B,3724(__v2di)3725_mm_setzero_si128 (),3726__M);3727}37283729static __inline__ __m256i __DEFAULT_FN_ATTRS3730_mm256_min_epu64 (__m256i __A, __m256i __B) {3731return (__m256i) __builtin_ia32_pminuq256_mask ((__v4di) __A,3732(__v4di) __B,3733(__v4di)3734_mm256_setzero_si256 (),3735(__mmask8) -1);3736}37373738static __inline__ __m256i __DEFAULT_FN_ATTRS3739_mm256_mask_min_epu64 (__m256i __W, __mmask8 __M, __m256i __A,3740__m256i __B) {3741return (__m256i) __builtin_ia32_pminuq256_mask ((__v4di) __A,3742(__v4di) __B,3743(__v4di) __W, __M);3744}37453746static __inline__ __m256i __DEFAULT_FN_ATTRS3747_mm256_maskz_min_epu64 (__mmask8 __M, __m256i __A, __m256i __B) {3748return (__m256i) __builtin_ia32_pminuq256_mask ((__v4di) __A,3749(__v4di) __B,3750(__v4di)3751_mm256_setzero_si256 (),3752__M);3753}37543755#define _mm_roundscale_pd(A, imm) __extension__ ({ \3756(__m128d)__builtin_ia32_rndscalepd_128_mask((__v2df)(__m128d)(A), \3757(int)(imm), \3758(__v2df)_mm_setzero_pd(), \3759(__mmask8)-1); })376037613762#define _mm_mask_roundscale_pd(W, U, A, imm) __extension__ ({ \3763(__m128d)__builtin_ia32_rndscalepd_128_mask((__v2df)(__m128d)(A), \3764(int)(imm), \3765(__v2df)(__m128d)(W), \3766(__mmask8)(U)); })376737683769#define _mm_maskz_roundscale_pd(U, A, imm) __extension__ ({ \3770(__m128d)__builtin_ia32_rndscalepd_128_mask((__v2df)(__m128d)(A), \3771(int)(imm), \3772(__v2df)_mm_setzero_pd(), \3773(__mmask8)(U)); })377437753776#define _mm256_roundscale_pd(A, imm) __extension__ ({ \3777(__m256d)__builtin_ia32_rndscalepd_256_mask((__v4df)(__m256d)(A), \3778(int)(imm), \3779(__v4df)_mm256_setzero_pd(), \3780(__mmask8)-1); })378137823783#define _mm256_mask_roundscale_pd(W, U, A, imm) __extension__ ({ \3784(__m256d)__builtin_ia32_rndscalepd_256_mask((__v4df)(__m256d)(A), \3785(int)(imm), \3786(__v4df)(__m256d)(W), \3787(__mmask8)(U)); })378837893790#define _mm256_maskz_roundscale_pd(U, A, imm) __extension__ ({ \3791(__m256d)__builtin_ia32_rndscalepd_256_mask((__v4df)(__m256d)(A), \3792(int)(imm), \3793(__v4df)_mm256_setzero_pd(), \3794(__mmask8)(U)); })37953796#define _mm_roundscale_ps(A, imm) __extension__ ({ \3797(__m128)__builtin_ia32_rndscaleps_128_mask((__v4sf)(__m128)(A), (int)(imm), \3798(__v4sf)_mm_setzero_ps(), \3799(__mmask8)-1); })380038013802#define _mm_mask_roundscale_ps(W, U, A, imm) __extension__ ({ \3803(__m128)__builtin_ia32_rndscaleps_128_mask((__v4sf)(__m128)(A), (int)(imm), \3804(__v4sf)(__m128)(W), \3805(__mmask8)(U)); })380638073808#define _mm_maskz_roundscale_ps(U, A, imm) __extension__ ({ \3809(__m128)__builtin_ia32_rndscaleps_128_mask((__v4sf)(__m128)(A), (int)(imm), \3810(__v4sf)_mm_setzero_ps(), \3811(__mmask8)(U)); })38123813#define _mm256_roundscale_ps(A, imm) __extension__ ({ \3814(__m256)__builtin_ia32_rndscaleps_256_mask((__v8sf)(__m256)(A), (int)(imm), \3815(__v8sf)_mm256_setzero_ps(), \3816(__mmask8)-1); })38173818#define _mm256_mask_roundscale_ps(W, U, A, imm) __extension__ ({ \3819(__m256)__builtin_ia32_rndscaleps_256_mask((__v8sf)(__m256)(A), (int)(imm), \3820(__v8sf)(__m256)(W), \3821(__mmask8)(U)); })382238233824#define _mm256_maskz_roundscale_ps(U, A, imm) __extension__ ({ \3825(__m256)__builtin_ia32_rndscaleps_256_mask((__v8sf)(__m256)(A), (int)(imm), \3826(__v8sf)_mm256_setzero_ps(), \3827(__mmask8)(U)); })38283829static __inline__ __m128d __DEFAULT_FN_ATTRS3830_mm_scalef_pd (__m128d __A, __m128d __B) {3831return (__m128d) __builtin_ia32_scalefpd128_mask ((__v2df) __A,3832(__v2df) __B,3833(__v2df)3834_mm_setzero_pd (),3835(__mmask8) -1);3836}38373838static __inline__ __m128d __DEFAULT_FN_ATTRS3839_mm_mask_scalef_pd (__m128d __W, __mmask8 __U, __m128d __A,3840__m128d __B) {3841return (__m128d) __builtin_ia32_scalefpd128_mask ((__v2df) __A,3842(__v2df) __B,3843(__v2df) __W,3844(__mmask8) __U);3845}38463847static __inline__ __m128d __DEFAULT_FN_ATTRS3848_mm_maskz_scalef_pd (__mmask8 __U, __m128d __A, __m128d __B) {3849return (__m128d) __builtin_ia32_scalefpd128_mask ((__v2df) __A,3850(__v2df) __B,3851(__v2df)3852_mm_setzero_pd (),3853(__mmask8) __U);3854}38553856static __inline__ __m256d __DEFAULT_FN_ATTRS3857_mm256_scalef_pd (__m256d __A, __m256d __B) {3858return (__m256d) __builtin_ia32_scalefpd256_mask ((__v4df) __A,3859(__v4df) __B,3860(__v4df)3861_mm256_setzero_pd (),3862(__mmask8) -1);3863}38643865static __inline__ __m256d __DEFAULT_FN_ATTRS3866_mm256_mask_scalef_pd (__m256d __W, __mmask8 __U, __m256d __A,3867__m256d __B) {3868return (__m256d) __builtin_ia32_scalefpd256_mask ((__v4df) __A,3869(__v4df) __B,3870(__v4df) __W,3871(__mmask8) __U);3872}38733874static __inline__ __m256d __DEFAULT_FN_ATTRS3875_mm256_maskz_scalef_pd (__mmask8 __U, __m256d __A, __m256d __B) {3876return (__m256d) __builtin_ia32_scalefpd256_mask ((__v4df) __A,3877(__v4df) __B,3878(__v4df)3879_mm256_setzero_pd (),3880(__mmask8) __U);3881}38823883static __inline__ __m128 __DEFAULT_FN_ATTRS3884_mm_scalef_ps (__m128 __A, __m128 __B) {3885return (__m128) __builtin_ia32_scalefps128_mask ((__v4sf) __A,3886(__v4sf) __B,3887(__v4sf)3888_mm_setzero_ps (),3889(__mmask8) -1);3890}38913892static __inline__ __m128 __DEFAULT_FN_ATTRS3893_mm_mask_scalef_ps (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B) {3894return (__m128) __builtin_ia32_scalefps128_mask ((__v4sf) __A,3895(__v4sf) __B,3896(__v4sf) __W,3897(__mmask8) __U);3898}38993900static __inline__ __m128 __DEFAULT_FN_ATTRS3901_mm_maskz_scalef_ps (__mmask8 __U, __m128 __A, __m128 __B) {3902return (__m128) __builtin_ia32_scalefps128_mask ((__v4sf) __A,3903(__v4sf) __B,3904(__v4sf)3905_mm_setzero_ps (),3906(__mmask8) __U);3907}39083909static __inline__ __m256 __DEFAULT_FN_ATTRS3910_mm256_scalef_ps (__m256 __A, __m256 __B) {3911return (__m256) __builtin_ia32_scalefps256_mask ((__v8sf) __A,3912(__v8sf) __B,3913(__v8sf)3914_mm256_setzero_ps (),3915(__mmask8) -1);3916}39173918static __inline__ __m256 __DEFAULT_FN_ATTRS3919_mm256_mask_scalef_ps (__m256 __W, __mmask8 __U, __m256 __A,3920__m256 __B) {3921return (__m256) __builtin_ia32_scalefps256_mask ((__v8sf) __A,3922(__v8sf) __B,3923(__v8sf) __W,3924(__mmask8) __U);3925}39263927static __inline__ __m256 __DEFAULT_FN_ATTRS3928_mm256_maskz_scalef_ps (__mmask8 __U, __m256 __A, __m256 __B) {3929return (__m256) __builtin_ia32_scalefps256_mask ((__v8sf) __A,3930(__v8sf) __B,3931(__v8sf)3932_mm256_setzero_ps (),3933(__mmask8) __U);3934}39353936#define _mm_i64scatter_pd(addr, index, v1, scale) __extension__ ({ \3937__builtin_ia32_scatterdiv2df((double *)(addr), (__mmask8)-1, \3938(__v2di)(__m128i)(index), \3939(__v2df)(__m128d)(v1), (int)(scale)); })39403941#define _mm_mask_i64scatter_pd(addr, mask, index, v1, scale) __extension__ ({ \3942__builtin_ia32_scatterdiv2df((double *)(addr), (__mmask8)(mask), \3943(__v2di)(__m128i)(index), \3944(__v2df)(__m128d)(v1), (int)(scale)); })39453946#define _mm_i64scatter_epi64(addr, index, v1, scale) __extension__ ({ \3947__builtin_ia32_scatterdiv2di((long long *)(addr), (__mmask8)-1, \3948(__v2di)(__m128i)(index), \3949(__v2di)(__m128i)(v1), (int)(scale)); })39503951#define _mm_mask_i64scatter_epi64(addr, mask, index, v1, scale) __extension__ ({ \3952__builtin_ia32_scatterdiv2di((long long *)(addr), (__mmask8)(mask), \3953(__v2di)(__m128i)(index), \3954(__v2di)(__m128i)(v1), (int)(scale)); })39553956#define _mm256_i64scatter_pd(addr, index, v1, scale) __extension__ ({ \3957__builtin_ia32_scatterdiv4df((double *)(addr), (__mmask8)-1, \3958(__v4di)(__m256i)(index), \3959(__v4df)(__m256d)(v1), (int)(scale)); })39603961#define _mm256_mask_i64scatter_pd(addr, mask, index, v1, scale) __extension__ ({ \3962__builtin_ia32_scatterdiv4df((double *)(addr), (__mmask8)(mask), \3963(__v4di)(__m256i)(index), \3964(__v4df)(__m256d)(v1), (int)(scale)); })39653966#define _mm256_i64scatter_epi64(addr, index, v1, scale) __extension__ ({ \3967__builtin_ia32_scatterdiv4di((long long *)(addr), (__mmask8)-1, \3968(__v4di)(__m256i)(index), \3969(__v4di)(__m256i)(v1), (int)(scale)); })39703971#define _mm256_mask_i64scatter_epi64(addr, mask, index, v1, scale) __extension__ ({ \3972__builtin_ia32_scatterdiv4di((long long *)(addr), (__mmask8)(mask), \3973(__v4di)(__m256i)(index), \3974(__v4di)(__m256i)(v1), (int)(scale)); })39753976#define _mm_i64scatter_ps(addr, index, v1, scale) __extension__ ({ \3977__builtin_ia32_scatterdiv4sf((float *)(addr), (__mmask8)-1, \3978(__v2di)(__m128i)(index), (__v4sf)(__m128)(v1), \3979(int)(scale)); })39803981#define _mm_mask_i64scatter_ps(addr, mask, index, v1, scale) __extension__ ({ \3982__builtin_ia32_scatterdiv4sf((float *)(addr), (__mmask8)(mask), \3983(__v2di)(__m128i)(index), (__v4sf)(__m128)(v1), \3984(int)(scale)); })39853986#define _mm_i64scatter_epi32(addr, index, v1, scale) __extension__ ({ \3987__builtin_ia32_scatterdiv4si((int *)(addr), (__mmask8)-1, \3988(__v2di)(__m128i)(index), \3989(__v4si)(__m128i)(v1), (int)(scale)); })39903991#define _mm_mask_i64scatter_epi32(addr, mask, index, v1, scale) __extension__ ({ \3992__builtin_ia32_scatterdiv4si((int *)(addr), (__mmask8)(mask), \3993(__v2di)(__m128i)(index), \3994(__v4si)(__m128i)(v1), (int)(scale)); })39953996#define _mm256_i64scatter_ps(addr, index, v1, scale) __extension__ ({ \3997__builtin_ia32_scatterdiv8sf((float *)(addr), (__mmask8)-1, \3998(__v4di)(__m256i)(index), (__v4sf)(__m128)(v1), \3999(int)(scale)); })40004001#define _mm256_mask_i64scatter_ps(addr, mask, index, v1, scale) __extension__ ({ \4002__builtin_ia32_scatterdiv8sf((float *)(addr), (__mmask8)(mask), \4003(__v4di)(__m256i)(index), (__v4sf)(__m128)(v1), \4004(int)(scale)); })40054006#define _mm256_i64scatter_epi32(addr, index, v1, scale) __extension__ ({ \4007__builtin_ia32_scatterdiv8si((int *)(addr), (__mmask8)-1, \4008(__v4di)(__m256i)(index), \4009(__v4si)(__m128i)(v1), (int)(scale)); })40104011#define _mm256_mask_i64scatter_epi32(addr, mask, index, v1, scale) __extension__ ({ \4012__builtin_ia32_scatterdiv8si((int *)(addr), (__mmask8)(mask), \4013(__v4di)(__m256i)(index), \4014(__v4si)(__m128i)(v1), (int)(scale)); })40154016#define _mm_i32scatter_pd(addr, index, v1, scale) __extension__ ({ \4017__builtin_ia32_scattersiv2df((double *)(addr), (__mmask8)-1, \4018(__v4si)(__m128i)(index), \4019(__v2df)(__m128d)(v1), (int)(scale)); })40204021#define _mm_mask_i32scatter_pd(addr, mask, index, v1, scale) __extension__ ({ \4022__builtin_ia32_scattersiv2df((double *)(addr), (__mmask8)(mask), \4023(__v4si)(__m128i)(index), \4024(__v2df)(__m128d)(v1), (int)(scale)); })40254026#define _mm_i32scatter_epi64(addr, index, v1, scale) __extension__ ({ \4027__builtin_ia32_scattersiv2di((long long *)(addr), (__mmask8)-1, \4028(__v4si)(__m128i)(index), \4029(__v2di)(__m128i)(v1), (int)(scale)); })40304031#define _mm_mask_i32scatter_epi64(addr, mask, index, v1, scale) __extension__ ({ \4032__builtin_ia32_scattersiv2di((long long *)(addr), (__mmask8)(mask), \4033(__v4si)(__m128i)(index), \4034(__v2di)(__m128i)(v1), (int)(scale)); })40354036#define _mm256_i32scatter_pd(addr, index, v1, scale) __extension__ ({ \4037__builtin_ia32_scattersiv4df((double *)(addr), (__mmask8)-1, \4038(__v4si)(__m128i)(index), \4039(__v4df)(__m256d)(v1), (int)(scale)); })40404041#define _mm256_mask_i32scatter_pd(addr, mask, index, v1, scale) __extension__ ({ \4042__builtin_ia32_scattersiv4df((double *)(addr), (__mmask8)(mask), \4043(__v4si)(__m128i)(index), \4044(__v4df)(__m256d)(v1), (int)(scale)); })40454046#define _mm256_i32scatter_epi64(addr, index, v1, scale) __extension__ ({ \4047__builtin_ia32_scattersiv4di((long long *)(addr), (__mmask8)-1, \4048(__v4si)(__m128i)(index), \4049(__v4di)(__m256i)(v1), (int)(scale)); })40504051#define _mm256_mask_i32scatter_epi64(addr, mask, index, v1, scale) __extension__ ({ \4052__builtin_ia32_scattersiv4di((long long *)(addr), (__mmask8)(mask), \4053(__v4si)(__m128i)(index), \4054(__v4di)(__m256i)(v1), (int)(scale)); })40554056#define _mm_i32scatter_ps(addr, index, v1, scale) __extension__ ({ \4057__builtin_ia32_scattersiv4sf((float *)(addr), (__mmask8)-1, \4058(__v4si)(__m128i)(index), (__v4sf)(__m128)(v1), \4059(int)(scale)); })40604061#define _mm_mask_i32scatter_ps(addr, mask, index, v1, scale) __extension__ ({ \4062__builtin_ia32_scattersiv4sf((float *)(addr), (__mmask8)(mask), \4063(__v4si)(__m128i)(index), (__v4sf)(__m128)(v1), \4064(int)(scale)); })40654066#define _mm_i32scatter_epi32(addr, index, v1, scale) __extension__ ({ \4067__builtin_ia32_scattersiv4si((int *)(addr), (__mmask8)-1, \4068(__v4si)(__m128i)(index), \4069(__v4si)(__m128i)(v1), (int)(scale)); })40704071#define _mm_mask_i32scatter_epi32(addr, mask, index, v1, scale) __extension__ ({ \4072__builtin_ia32_scattersiv4si((int *)(addr), (__mmask8)(mask), \4073(__v4si)(__m128i)(index), \4074(__v4si)(__m128i)(v1), (int)(scale)); })40754076#define _mm256_i32scatter_ps(addr, index, v1, scale) __extension__ ({ \4077__builtin_ia32_scattersiv8sf((float *)(addr), (__mmask8)-1, \4078(__v8si)(__m256i)(index), (__v8sf)(__m256)(v1), \4079(int)(scale)); })40804081#define _mm256_mask_i32scatter_ps(addr, mask, index, v1, scale) __extension__ ({ \4082__builtin_ia32_scattersiv8sf((float *)(addr), (__mmask8)(mask), \4083(__v8si)(__m256i)(index), (__v8sf)(__m256)(v1), \4084(int)(scale)); })40854086#define _mm256_i32scatter_epi32(addr, index, v1, scale) __extension__ ({ \4087__builtin_ia32_scattersiv8si((int *)(addr), (__mmask8)-1, \4088(__v8si)(__m256i)(index), \4089(__v8si)(__m256i)(v1), (int)(scale)); })40904091#define _mm256_mask_i32scatter_epi32(addr, mask, index, v1, scale) __extension__ ({ \4092__builtin_ia32_scattersiv8si((int *)(addr), (__mmask8)(mask), \4093(__v8si)(__m256i)(index), \4094(__v8si)(__m256i)(v1), (int)(scale)); })40954096static __inline__ __m128d __DEFAULT_FN_ATTRS4097_mm_mask_sqrt_pd (__m128d __W, __mmask8 __U, __m128d __A) {4098return (__m128d) __builtin_ia32_sqrtpd128_mask ((__v2df) __A,4099(__v2df) __W,4100(__mmask8) __U);4101}41024103static __inline__ __m128d __DEFAULT_FN_ATTRS4104_mm_maskz_sqrt_pd (__mmask8 __U, __m128d __A) {4105return (__m128d) __builtin_ia32_sqrtpd128_mask ((__v2df) __A,4106(__v2df)4107_mm_setzero_pd (),4108(__mmask8) __U);4109}41104111static __inline__ __m256d __DEFAULT_FN_ATTRS4112_mm256_mask_sqrt_pd (__m256d __W, __mmask8 __U, __m256d __A) {4113return (__m256d) __builtin_ia32_sqrtpd256_mask ((__v4df) __A,4114(__v4df) __W,4115(__mmask8) __U);4116}41174118static __inline__ __m256d __DEFAULT_FN_ATTRS4119_mm256_maskz_sqrt_pd (__mmask8 __U, __m256d __A) {4120return (__m256d) __builtin_ia32_sqrtpd256_mask ((__v4df) __A,4121(__v4df)4122_mm256_setzero_pd (),4123(__mmask8) __U);4124}41254126static __inline__ __m128 __DEFAULT_FN_ATTRS4127_mm_mask_sqrt_ps (__m128 __W, __mmask8 __U, __m128 __A) {4128return (__m128) __builtin_ia32_sqrtps128_mask ((__v4sf) __A,4129(__v4sf) __W,4130(__mmask8) __U);4131}41324133static __inline__ __m128 __DEFAULT_FN_ATTRS4134_mm_maskz_sqrt_ps (__mmask8 __U, __m128 __A) {4135return (__m128) __builtin_ia32_sqrtps128_mask ((__v4sf) __A,4136(__v4sf)4137_mm_setzero_ps (),4138(__mmask8) __U);4139}41404141static __inline__ __m256 __DEFAULT_FN_ATTRS4142_mm256_mask_sqrt_ps (__m256 __W, __mmask8 __U, __m256 __A) {4143return (__m256) __builtin_ia32_sqrtps256_mask ((__v8sf) __A,4144(__v8sf) __W,4145(__mmask8) __U);4146}41474148static __inline__ __m256 __DEFAULT_FN_ATTRS4149_mm256_maskz_sqrt_ps (__mmask8 __U, __m256 __A) {4150return (__m256) __builtin_ia32_sqrtps256_mask ((__v8sf) __A,4151(__v8sf)4152_mm256_setzero_ps (),4153(__mmask8) __U);4154}41554156static __inline__ __m128d __DEFAULT_FN_ATTRS4157_mm_mask_sub_pd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B) {4158return (__m128d) __builtin_ia32_subpd128_mask ((__v2df) __A,4159(__v2df) __B,4160(__v2df) __W,4161(__mmask8) __U);4162}41634164static __inline__ __m128d __DEFAULT_FN_ATTRS4165_mm_maskz_sub_pd (__mmask8 __U, __m128d __A, __m128d __B) {4166return (__m128d) __builtin_ia32_subpd128_mask ((__v2df) __A,4167(__v2df) __B,4168(__v2df)4169_mm_setzero_pd (),4170(__mmask8) __U);4171}41724173static __inline__ __m256d __DEFAULT_FN_ATTRS4174_mm256_mask_sub_pd (__m256d __W, __mmask8 __U, __m256d __A,4175__m256d __B) {4176return (__m256d) __builtin_ia32_subpd256_mask ((__v4df) __A,4177(__v4df) __B,4178(__v4df) __W,4179(__mmask8) __U);4180}41814182static __inline__ __m256d __DEFAULT_FN_ATTRS4183_mm256_maskz_sub_pd (__mmask8 __U, __m256d __A, __m256d __B) {4184return (__m256d) __builtin_ia32_subpd256_mask ((__v4df) __A,4185(__v4df) __B,4186(__v4df)4187_mm256_setzero_pd (),4188(__mmask8) __U);4189}41904191static __inline__ __m128 __DEFAULT_FN_ATTRS4192_mm_mask_sub_ps (__m128 __W, __mmask16 __U, __m128 __A, __m128 __B) {4193return (__m128) __builtin_ia32_subps128_mask ((__v4sf) __A,4194(__v4sf) __B,4195(__v4sf) __W,4196(__mmask8) __U);4197}41984199static __inline__ __m128 __DEFAULT_FN_ATTRS4200_mm_maskz_sub_ps (__mmask16 __U, __m128 __A, __m128 __B) {4201return (__m128) __builtin_ia32_subps128_mask ((__v4sf) __A,4202(__v4sf) __B,4203(__v4sf)4204_mm_setzero_ps (),4205(__mmask8) __U);4206}42074208static __inline__ __m256 __DEFAULT_FN_ATTRS4209_mm256_mask_sub_ps (__m256 __W, __mmask16 __U, __m256 __A, __m256 __B) {4210return (__m256) __builtin_ia32_subps256_mask ((__v8sf) __A,4211(__v8sf) __B,4212(__v8sf) __W,4213(__mmask8) __U);4214}42154216static __inline__ __m256 __DEFAULT_FN_ATTRS4217_mm256_maskz_sub_ps (__mmask16 __U, __m256 __A, __m256 __B) {4218return (__m256) __builtin_ia32_subps256_mask ((__v8sf) __A,4219(__v8sf) __B,4220(__v8sf)4221_mm256_setzero_ps (),4222(__mmask8) __U);4223}42244225static __inline__ __m128i __DEFAULT_FN_ATTRS4226_mm_mask2_permutex2var_epi32 (__m128i __A, __m128i __I, __mmask8 __U,4227__m128i __B) {4228return (__m128i) __builtin_ia32_vpermi2vard128_mask ((__v4si) __A,4229(__v4si) __I4230/* idx */ ,4231(__v4si) __B,4232(__mmask8) __U);4233}42344235static __inline__ __m256i __DEFAULT_FN_ATTRS4236_mm256_mask2_permutex2var_epi32 (__m256i __A, __m256i __I,4237__mmask8 __U, __m256i __B) {4238return (__m256i) __builtin_ia32_vpermi2vard256_mask ((__v8si) __A,4239(__v8si) __I4240/* idx */ ,4241(__v8si) __B,4242(__mmask8) __U);4243}42444245static __inline__ __m128d __DEFAULT_FN_ATTRS4246_mm_mask2_permutex2var_pd (__m128d __A, __m128i __I, __mmask8 __U,4247__m128d __B) {4248return (__m128d) __builtin_ia32_vpermi2varpd128_mask ((__v2df) __A,4249(__v2di) __I4250/* idx */ ,4251(__v2df) __B,4252(__mmask8)4253__U);4254}42554256static __inline__ __m256d __DEFAULT_FN_ATTRS4257_mm256_mask2_permutex2var_pd (__m256d __A, __m256i __I, __mmask8 __U,4258__m256d __B) {4259return (__m256d) __builtin_ia32_vpermi2varpd256_mask ((__v4df) __A,4260(__v4di) __I4261/* idx */ ,4262(__v4df) __B,4263(__mmask8)4264__U);4265}42664267static __inline__ __m128 __DEFAULT_FN_ATTRS4268_mm_mask2_permutex2var_ps (__m128 __A, __m128i __I, __mmask8 __U,4269__m128 __B) {4270return (__m128) __builtin_ia32_vpermi2varps128_mask ((__v4sf) __A,4271(__v4si) __I4272/* idx */ ,4273(__v4sf) __B,4274(__mmask8) __U);4275}42764277static __inline__ __m256 __DEFAULT_FN_ATTRS4278_mm256_mask2_permutex2var_ps (__m256 __A, __m256i __I, __mmask8 __U,4279__m256 __B) {4280return (__m256) __builtin_ia32_vpermi2varps256_mask ((__v8sf) __A,4281(__v8si) __I4282/* idx */ ,4283(__v8sf) __B,4284(__mmask8) __U);4285}42864287static __inline__ __m128i __DEFAULT_FN_ATTRS4288_mm_mask2_permutex2var_epi64 (__m128i __A, __m128i __I, __mmask8 __U,4289__m128i __B) {4290return (__m128i) __builtin_ia32_vpermi2varq128_mask ((__v2di) __A,4291(__v2di) __I4292/* idx */ ,4293(__v2di) __B,4294(__mmask8) __U);4295}42964297static __inline__ __m256i __DEFAULT_FN_ATTRS4298_mm256_mask2_permutex2var_epi64 (__m256i __A, __m256i __I,4299__mmask8 __U, __m256i __B) {4300return (__m256i) __builtin_ia32_vpermi2varq256_mask ((__v4di) __A,4301(__v4di) __I4302/* idx */ ,4303(__v4di) __B,4304(__mmask8) __U);4305}43064307static __inline__ __m128i __DEFAULT_FN_ATTRS4308_mm_permutex2var_epi32 (__m128i __A, __m128i __I, __m128i __B) {4309return (__m128i) __builtin_ia32_vpermt2vard128_mask ((__v4si) __I4310/* idx */ ,4311(__v4si) __A,4312(__v4si) __B,4313(__mmask8) -1);4314}43154316static __inline__ __m128i __DEFAULT_FN_ATTRS4317_mm_mask_permutex2var_epi32 (__m128i __A, __mmask8 __U, __m128i __I,4318__m128i __B) {4319return (__m128i) __builtin_ia32_vpermt2vard128_mask ((__v4si) __I4320/* idx */ ,4321(__v4si) __A,4322(__v4si) __B,4323(__mmask8) __U);4324}43254326static __inline__ __m128i __DEFAULT_FN_ATTRS4327_mm_maskz_permutex2var_epi32 (__mmask8 __U, __m128i __A, __m128i __I,4328__m128i __B) {4329return (__m128i) __builtin_ia32_vpermt2vard128_maskz ((__v4si) __I4330/* idx */ ,4331(__v4si) __A,4332(__v4si) __B,4333(__mmask8)4334__U);4335}43364337static __inline__ __m256i __DEFAULT_FN_ATTRS4338_mm256_permutex2var_epi32 (__m256i __A, __m256i __I, __m256i __B) {4339return (__m256i) __builtin_ia32_vpermt2vard256_mask ((__v8si) __I4340/* idx */ ,4341(__v8si) __A,4342(__v8si) __B,4343(__mmask8) -1);4344}43454346static __inline__ __m256i __DEFAULT_FN_ATTRS4347_mm256_mask_permutex2var_epi32 (__m256i __A, __mmask8 __U, __m256i __I,4348__m256i __B) {4349return (__m256i) __builtin_ia32_vpermt2vard256_mask ((__v8si) __I4350/* idx */ ,4351(__v8si) __A,4352(__v8si) __B,4353(__mmask8) __U);4354}43554356static __inline__ __m256i __DEFAULT_FN_ATTRS4357_mm256_maskz_permutex2var_epi32 (__mmask8 __U, __m256i __A,4358__m256i __I, __m256i __B) {4359return (__m256i) __builtin_ia32_vpermt2vard256_maskz ((__v8si) __I4360/* idx */ ,4361(__v8si) __A,4362(__v8si) __B,4363(__mmask8)4364__U);4365}43664367static __inline__ __m128d __DEFAULT_FN_ATTRS4368_mm_permutex2var_pd (__m128d __A, __m128i __I, __m128d __B) {4369return (__m128d) __builtin_ia32_vpermt2varpd128_mask ((__v2di) __I4370/* idx */ ,4371(__v2df) __A,4372(__v2df) __B,4373(__mmask8) -43741);4375}43764377static __inline__ __m128d __DEFAULT_FN_ATTRS4378_mm_mask_permutex2var_pd (__m128d __A, __mmask8 __U, __m128i __I,4379__m128d __B) {4380return (__m128d) __builtin_ia32_vpermt2varpd128_mask ((__v2di) __I4381/* idx */ ,4382(__v2df) __A,4383(__v2df) __B,4384(__mmask8)4385__U);4386}43874388static __inline__ __m128d __DEFAULT_FN_ATTRS4389_mm_maskz_permutex2var_pd (__mmask8 __U, __m128d __A, __m128i __I,4390__m128d __B) {4391return (__m128d) __builtin_ia32_vpermt2varpd128_maskz ((__v2di) __I4392/* idx */ ,4393(__v2df) __A,4394(__v2df) __B,4395(__mmask8)4396__U);4397}43984399static __inline__ __m256d __DEFAULT_FN_ATTRS4400_mm256_permutex2var_pd (__m256d __A, __m256i __I, __m256d __B) {4401return (__m256d) __builtin_ia32_vpermt2varpd256_mask ((__v4di) __I4402/* idx */ ,4403(__v4df) __A,4404(__v4df) __B,4405(__mmask8) -44061);4407}44084409static __inline__ __m256d __DEFAULT_FN_ATTRS4410_mm256_mask_permutex2var_pd (__m256d __A, __mmask8 __U, __m256i __I,4411__m256d __B) {4412return (__m256d) __builtin_ia32_vpermt2varpd256_mask ((__v4di) __I4413/* idx */ ,4414(__v4df) __A,4415(__v4df) __B,4416(__mmask8)4417__U);4418}44194420static __inline__ __m256d __DEFAULT_FN_ATTRS4421_mm256_maskz_permutex2var_pd (__mmask8 __U, __m256d __A, __m256i __I,4422__m256d __B) {4423return (__m256d) __builtin_ia32_vpermt2varpd256_maskz ((__v4di) __I4424/* idx */ ,4425(__v4df) __A,4426(__v4df) __B,4427(__mmask8)4428__U);4429}44304431static __inline__ __m128 __DEFAULT_FN_ATTRS4432_mm_permutex2var_ps (__m128 __A, __m128i __I, __m128 __B) {4433return (__m128) __builtin_ia32_vpermt2varps128_mask ((__v4si) __I4434/* idx */ ,4435(__v4sf) __A,4436(__v4sf) __B,4437(__mmask8) -1);4438}44394440static __inline__ __m128 __DEFAULT_FN_ATTRS4441_mm_mask_permutex2var_ps (__m128 __A, __mmask8 __U, __m128i __I,4442__m128 __B) {4443return (__m128) __builtin_ia32_vpermt2varps128_mask ((__v4si) __I4444/* idx */ ,4445(__v4sf) __A,4446(__v4sf) __B,4447(__mmask8) __U);4448}44494450static __inline__ __m128 __DEFAULT_FN_ATTRS4451_mm_maskz_permutex2var_ps (__mmask8 __U, __m128 __A, __m128i __I,4452__m128 __B) {4453return (__m128) __builtin_ia32_vpermt2varps128_maskz ((__v4si) __I4454/* idx */ ,4455(__v4sf) __A,4456(__v4sf) __B,4457(__mmask8)4458__U);4459}44604461static __inline__ __m256 __DEFAULT_FN_ATTRS4462_mm256_permutex2var_ps (__m256 __A, __m256i __I, __m256 __B) {4463return (__m256) __builtin_ia32_vpermt2varps256_mask ((__v8si) __I4464/* idx */ ,4465(__v8sf) __A,4466(__v8sf) __B,4467(__mmask8) -1);4468}44694470static __inline__ __m256 __DEFAULT_FN_ATTRS4471_mm256_mask_permutex2var_ps (__m256 __A, __mmask8 __U, __m256i __I,4472__m256 __B) {4473return (__m256) __builtin_ia32_vpermt2varps256_mask ((__v8si) __I4474/* idx */ ,4475(__v8sf) __A,4476(__v8sf) __B,4477(__mmask8) __U);4478}44794480static __inline__ __m256 __DEFAULT_FN_ATTRS4481_mm256_maskz_permutex2var_ps (__mmask8 __U, __m256 __A, __m256i __I,4482__m256 __B) {4483return (__m256) __builtin_ia32_vpermt2varps256_maskz ((__v8si) __I4484/* idx */ ,4485(__v8sf) __A,4486(__v8sf) __B,4487(__mmask8)4488__U);4489}44904491static __inline__ __m128i __DEFAULT_FN_ATTRS4492_mm_permutex2var_epi64 (__m128i __A, __m128i __I, __m128i __B) {4493return (__m128i) __builtin_ia32_vpermt2varq128_mask ((__v2di) __I4494/* idx */ ,4495(__v2di) __A,4496(__v2di) __B,4497(__mmask8) -1);4498}44994500static __inline__ __m128i __DEFAULT_FN_ATTRS4501_mm_mask_permutex2var_epi64 (__m128i __A, __mmask8 __U, __m128i __I,4502__m128i __B) {4503return (__m128i) __builtin_ia32_vpermt2varq128_mask ((__v2di) __I4504/* idx */ ,4505(__v2di) __A,4506(__v2di) __B,4507(__mmask8) __U);4508}45094510static __inline__ __m128i __DEFAULT_FN_ATTRS4511_mm_maskz_permutex2var_epi64 (__mmask8 __U, __m128i __A, __m128i __I,4512__m128i __B) {4513return (__m128i) __builtin_ia32_vpermt2varq128_maskz ((__v2di) __I4514/* idx */ ,4515(__v2di) __A,4516(__v2di) __B,4517(__mmask8)4518__U);4519}452045214522static __inline__ __m256i __DEFAULT_FN_ATTRS4523_mm256_permutex2var_epi64 (__m256i __A, __m256i __I, __m256i __B) {4524return (__m256i) __builtin_ia32_vpermt2varq256_mask ((__v4di) __I4525/* idx */ ,4526(__v4di) __A,4527(__v4di) __B,4528(__mmask8) -1);4529}45304531static __inline__ __m256i __DEFAULT_FN_ATTRS4532_mm256_mask_permutex2var_epi64 (__m256i __A, __mmask8 __U, __m256i __I,4533__m256i __B) {4534return (__m256i) __builtin_ia32_vpermt2varq256_mask ((__v4di) __I4535/* idx */ ,4536(__v4di) __A,4537(__v4di) __B,4538(__mmask8) __U);4539}45404541static __inline__ __m256i __DEFAULT_FN_ATTRS4542_mm256_maskz_permutex2var_epi64 (__mmask8 __U, __m256i __A,4543__m256i __I, __m256i __B) {4544return (__m256i) __builtin_ia32_vpermt2varq256_maskz ((__v4di) __I4545/* idx */ ,4546(__v4di) __A,4547(__v4di) __B,4548(__mmask8)4549__U);4550}45514552static __inline__ __m128i __DEFAULT_FN_ATTRS4553_mm_mask_cvtepi8_epi32 (__m128i __W, __mmask8 __U, __m128i __A)4554{4555return (__m128i) __builtin_ia32_pmovsxbd128_mask ((__v16qi) __A,4556(__v4si) __W,4557(__mmask8) __U);4558}45594560static __inline__ __m128i __DEFAULT_FN_ATTRS4561_mm_maskz_cvtepi8_epi32 (__mmask8 __U, __m128i __A)4562{4563return (__m128i) __builtin_ia32_pmovsxbd128_mask ((__v16qi) __A,4564(__v4si)4565_mm_setzero_si128 (),4566(__mmask8) __U);4567}45684569static __inline__ __m256i __DEFAULT_FN_ATTRS4570_mm256_mask_cvtepi8_epi32 (__m256i __W, __mmask8 __U, __m128i __A)4571{4572return (__m256i) __builtin_ia32_pmovsxbd256_mask ((__v16qi) __A,4573(__v8si) __W,4574(__mmask8) __U);4575}45764577static __inline__ __m256i __DEFAULT_FN_ATTRS4578_mm256_maskz_cvtepi8_epi32 (__mmask8 __U, __m128i __A)4579{4580return (__m256i) __builtin_ia32_pmovsxbd256_mask ((__v16qi) __A,4581(__v8si)4582_mm256_setzero_si256 (),4583(__mmask8) __U);4584}45854586static __inline__ __m128i __DEFAULT_FN_ATTRS4587_mm_mask_cvtepi8_epi64 (__m128i __W, __mmask8 __U, __m128i __A)4588{4589return (__m128i) __builtin_ia32_pmovsxbq128_mask ((__v16qi) __A,4590(__v2di) __W,4591(__mmask8) __U);4592}45934594static __inline__ __m128i __DEFAULT_FN_ATTRS4595_mm_maskz_cvtepi8_epi64 (__mmask8 __U, __m128i __A)4596{4597return (__m128i) __builtin_ia32_pmovsxbq128_mask ((__v16qi) __A,4598(__v2di)4599_mm_setzero_si128 (),4600(__mmask8) __U);4601}46024603static __inline__ __m256i __DEFAULT_FN_ATTRS4604_mm256_mask_cvtepi8_epi64 (__m256i __W, __mmask8 __U, __m128i __A)4605{4606return (__m256i) __builtin_ia32_pmovsxbq256_mask ((__v16qi) __A,4607(__v4di) __W,4608(__mmask8) __U);4609}46104611static __inline__ __m256i __DEFAULT_FN_ATTRS4612_mm256_maskz_cvtepi8_epi64 (__mmask8 __U, __m128i __A)4613{4614return (__m256i) __builtin_ia32_pmovsxbq256_mask ((__v16qi) __A,4615(__v4di)4616_mm256_setzero_si256 (),4617(__mmask8) __U);4618}46194620static __inline__ __m128i __DEFAULT_FN_ATTRS4621_mm_mask_cvtepi32_epi64 (__m128i __W, __mmask8 __U, __m128i __X)4622{4623return (__m128i) __builtin_ia32_pmovsxdq128_mask ((__v4si) __X,4624(__v2di) __W,4625(__mmask8) __U);4626}46274628static __inline__ __m128i __DEFAULT_FN_ATTRS4629_mm_maskz_cvtepi32_epi64 (__mmask8 __U, __m128i __X)4630{4631return (__m128i) __builtin_ia32_pmovsxdq128_mask ((__v4si) __X,4632(__v2di)4633_mm_setzero_si128 (),4634(__mmask8) __U);4635}46364637static __inline__ __m256i __DEFAULT_FN_ATTRS4638_mm256_mask_cvtepi32_epi64 (__m256i __W, __mmask8 __U, __m128i __X)4639{4640return (__m256i) __builtin_ia32_pmovsxdq256_mask ((__v4si) __X,4641(__v4di) __W,4642(__mmask8) __U);4643}46444645static __inline__ __m256i __DEFAULT_FN_ATTRS4646_mm256_maskz_cvtepi32_epi64 (__mmask8 __U, __m128i __X)4647{4648return (__m256i) __builtin_ia32_pmovsxdq256_mask ((__v4si) __X,4649(__v4di)4650_mm256_setzero_si256 (),4651(__mmask8) __U);4652}46534654static __inline__ __m128i __DEFAULT_FN_ATTRS4655_mm_mask_cvtepi16_epi32 (__m128i __W, __mmask8 __U, __m128i __A)4656{4657return (__m128i) __builtin_ia32_pmovsxwd128_mask ((__v8hi) __A,4658(__v4si) __W,4659(__mmask8) __U);4660}46614662static __inline__ __m128i __DEFAULT_FN_ATTRS4663_mm_maskz_cvtepi16_epi32 (__mmask8 __U, __m128i __A)4664{4665return (__m128i) __builtin_ia32_pmovsxwd128_mask ((__v8hi) __A,4666(__v4si)4667_mm_setzero_si128 (),4668(__mmask8) __U);4669}46704671static __inline__ __m256i __DEFAULT_FN_ATTRS4672_mm256_mask_cvtepi16_epi32 (__m256i __W, __mmask8 __U, __m128i __A)4673{4674return (__m256i) __builtin_ia32_pmovsxwd256_mask ((__v8hi) __A,4675(__v8si) __W,4676(__mmask8) __U);4677}46784679static __inline__ __m256i __DEFAULT_FN_ATTRS4680_mm256_maskz_cvtepi16_epi32 (__mmask8 __U, __m128i __A)4681{4682return (__m256i) __builtin_ia32_pmovsxwd256_mask ((__v8hi) __A,4683(__v8si)4684_mm256_setzero_si256 (),4685(__mmask8) __U);4686}46874688static __inline__ __m128i __DEFAULT_FN_ATTRS4689_mm_mask_cvtepi16_epi64 (__m128i __W, __mmask8 __U, __m128i __A)4690{4691return (__m128i) __builtin_ia32_pmovsxwq128_mask ((__v8hi) __A,4692(__v2di) __W,4693(__mmask8) __U);4694}46954696static __inline__ __m128i __DEFAULT_FN_ATTRS4697_mm_maskz_cvtepi16_epi64 (__mmask8 __U, __m128i __A)4698{4699return (__m128i) __builtin_ia32_pmovsxwq128_mask ((__v8hi) __A,4700(__v2di)4701_mm_setzero_si128 (),4702(__mmask8) __U);4703}47044705static __inline__ __m256i __DEFAULT_FN_ATTRS4706_mm256_mask_cvtepi16_epi64 (__m256i __W, __mmask8 __U, __m128i __A)4707{4708return (__m256i) __builtin_ia32_pmovsxwq256_mask ((__v8hi) __A,4709(__v4di) __W,4710(__mmask8) __U);4711}47124713static __inline__ __m256i __DEFAULT_FN_ATTRS4714_mm256_maskz_cvtepi16_epi64 (__mmask8 __U, __m128i __A)4715{4716return (__m256i) __builtin_ia32_pmovsxwq256_mask ((__v8hi) __A,4717(__v4di)4718_mm256_setzero_si256 (),4719(__mmask8) __U);4720}472147224723static __inline__ __m128i __DEFAULT_FN_ATTRS4724_mm_mask_cvtepu8_epi32 (__m128i __W, __mmask8 __U, __m128i __A)4725{4726return (__m128i) __builtin_ia32_pmovzxbd128_mask ((__v16qi) __A,4727(__v4si) __W,4728(__mmask8) __U);4729}47304731static __inline__ __m128i __DEFAULT_FN_ATTRS4732_mm_maskz_cvtepu8_epi32 (__mmask8 __U, __m128i __A)4733{4734return (__m128i) __builtin_ia32_pmovzxbd128_mask ((__v16qi) __A,4735(__v4si)4736_mm_setzero_si128 (),4737(__mmask8) __U);4738}47394740static __inline__ __m256i __DEFAULT_FN_ATTRS4741_mm256_mask_cvtepu8_epi32 (__m256i __W, __mmask8 __U, __m128i __A)4742{4743return (__m256i) __builtin_ia32_pmovzxbd256_mask ((__v16qi) __A,4744(__v8si) __W,4745(__mmask8) __U);4746}47474748static __inline__ __m256i __DEFAULT_FN_ATTRS4749_mm256_maskz_cvtepu8_epi32 (__mmask8 __U, __m128i __A)4750{4751return (__m256i) __builtin_ia32_pmovzxbd256_mask ((__v16qi) __A,4752(__v8si)4753_mm256_setzero_si256 (),4754(__mmask8) __U);4755}47564757static __inline__ __m128i __DEFAULT_FN_ATTRS4758_mm_mask_cvtepu8_epi64 (__m128i __W, __mmask8 __U, __m128i __A)4759{4760return (__m128i) __builtin_ia32_pmovzxbq128_mask ((__v16qi) __A,4761(__v2di) __W,4762(__mmask8) __U);4763}47644765static __inline__ __m128i __DEFAULT_FN_ATTRS4766_mm_maskz_cvtepu8_epi64 (__mmask8 __U, __m128i __A)4767{4768return (__m128i) __builtin_ia32_pmovzxbq128_mask ((__v16qi) __A,4769(__v2di)4770_mm_setzero_si128 (),4771(__mmask8) __U);4772}47734774static __inline__ __m256i __DEFAULT_FN_ATTRS4775_mm256_mask_cvtepu8_epi64 (__m256i __W, __mmask8 __U, __m128i __A)4776{4777return (__m256i) __builtin_ia32_pmovzxbq256_mask ((__v16qi) __A,4778(__v4di) __W,4779(__mmask8) __U);4780}47814782static __inline__ __m256i __DEFAULT_FN_ATTRS4783_mm256_maskz_cvtepu8_epi64 (__mmask8 __U, __m128i __A)4784{4785return (__m256i) __builtin_ia32_pmovzxbq256_mask ((__v16qi) __A,4786(__v4di)4787_mm256_setzero_si256 (),4788(__mmask8) __U);4789}47904791static __inline__ __m128i __DEFAULT_FN_ATTRS4792_mm_mask_cvtepu32_epi64 (__m128i __W, __mmask8 __U, __m128i __X)4793{4794return (__m128i) __builtin_ia32_pmovzxdq128_mask ((__v4si) __X,4795(__v2di) __W,4796(__mmask8) __U);4797}47984799static __inline__ __m128i __DEFAULT_FN_ATTRS4800_mm_maskz_cvtepu32_epi64 (__mmask8 __U, __m128i __X)4801{4802return (__m128i) __builtin_ia32_pmovzxdq128_mask ((__v4si) __X,4803(__v2di)4804_mm_setzero_si128 (),4805(__mmask8) __U);4806}48074808static __inline__ __m256i __DEFAULT_FN_ATTRS4809_mm256_mask_cvtepu32_epi64 (__m256i __W, __mmask8 __U, __m128i __X)4810{4811return (__m256i) __builtin_ia32_pmovzxdq256_mask ((__v4si) __X,4812(__v4di) __W,4813(__mmask8) __U);4814}48154816static __inline__ __m256i __DEFAULT_FN_ATTRS4817_mm256_maskz_cvtepu32_epi64 (__mmask8 __U, __m128i __X)4818{4819return (__m256i) __builtin_ia32_pmovzxdq256_mask ((__v4si) __X,4820(__v4di)4821_mm256_setzero_si256 (),4822(__mmask8) __U);4823}48244825static __inline__ __m128i __DEFAULT_FN_ATTRS4826_mm_mask_cvtepu16_epi32 (__m128i __W, __mmask8 __U, __m128i __A)4827{4828return (__m128i) __builtin_ia32_pmovzxwd128_mask ((__v8hi) __A,4829(__v4si) __W,4830(__mmask8) __U);4831}48324833static __inline__ __m128i __DEFAULT_FN_ATTRS4834_mm_maskz_cvtepu16_epi32 (__mmask8 __U, __m128i __A)4835{4836return (__m128i) __builtin_ia32_pmovzxwd128_mask ((__v8hi) __A,4837(__v4si)4838_mm_setzero_si128 (),4839(__mmask8) __U);4840}48414842static __inline__ __m256i __DEFAULT_FN_ATTRS4843_mm256_mask_cvtepu16_epi32 (__m256i __W, __mmask8 __U, __m128i __A)4844{4845return (__m256i) __builtin_ia32_pmovzxwd256_mask ((__v8hi) __A,4846(__v8si) __W,4847(__mmask8) __U);4848}48494850static __inline__ __m256i __DEFAULT_FN_ATTRS4851_mm256_maskz_cvtepu16_epi32 (__mmask8 __U, __m128i __A)4852{4853return (__m256i) __builtin_ia32_pmovzxwd256_mask ((__v8hi) __A,4854(__v8si)4855_mm256_setzero_si256 (),4856(__mmask8) __U);4857}48584859static __inline__ __m128i __DEFAULT_FN_ATTRS4860_mm_mask_cvtepu16_epi64 (__m128i __W, __mmask8 __U, __m128i __A)4861{4862return (__m128i) __builtin_ia32_pmovzxwq128_mask ((__v8hi) __A,4863(__v2di) __W,4864(__mmask8) __U);4865}48664867static __inline__ __m128i __DEFAULT_FN_ATTRS4868_mm_maskz_cvtepu16_epi64 (__mmask8 __U, __m128i __A)4869{4870return (__m128i) __builtin_ia32_pmovzxwq128_mask ((__v8hi) __A,4871(__v2di)4872_mm_setzero_si128 (),4873(__mmask8) __U);4874}48754876static __inline__ __m256i __DEFAULT_FN_ATTRS4877_mm256_mask_cvtepu16_epi64 (__m256i __W, __mmask8 __U, __m128i __A)4878{4879return (__m256i) __builtin_ia32_pmovzxwq256_mask ((__v8hi) __A,4880(__v4di) __W,4881(__mmask8) __U);4882}48834884static __inline__ __m256i __DEFAULT_FN_ATTRS4885_mm256_maskz_cvtepu16_epi64 (__mmask8 __U, __m128i __A)4886{4887return (__m256i) __builtin_ia32_pmovzxwq256_mask ((__v8hi) __A,4888(__v4di)4889_mm256_setzero_si256 (),4890(__mmask8) __U);4891}489248934894#define _mm_rol_epi32(a, b) __extension__ ({\4895(__m128i)__builtin_ia32_prold128_mask((__v4si)(__m128i)(a), (int)(b), \4896(__v4si)_mm_setzero_si128(), \4897(__mmask8)-1); })48984899#define _mm_mask_rol_epi32(w, u, a, b) __extension__ ({\4900(__m128i)__builtin_ia32_prold128_mask((__v4si)(__m128i)(a), (int)(b), \4901(__v4si)(__m128i)(w), (__mmask8)(u)); })49024903#define _mm_maskz_rol_epi32(u, a, b) __extension__ ({\4904(__m128i)__builtin_ia32_prold128_mask((__v4si)(__m128i)(a), (int)(b), \4905(__v4si)_mm_setzero_si128(), \4906(__mmask8)(u)); })49074908#define _mm256_rol_epi32(a, b) __extension__ ({\4909(__m256i)__builtin_ia32_prold256_mask((__v8si)(__m256i)(a), (int)(b), \4910(__v8si)_mm256_setzero_si256(), \4911(__mmask8)-1); })49124913#define _mm256_mask_rol_epi32(w, u, a, b) __extension__ ({\4914(__m256i)__builtin_ia32_prold256_mask((__v8si)(__m256i)(a), (int)(b), \4915(__v8si)(__m256i)(w), (__mmask8)(u)); })49164917#define _mm256_maskz_rol_epi32(u, a, b) __extension__ ({\4918(__m256i)__builtin_ia32_prold256_mask((__v8si)(__m256i)(a), (int)(b), \4919(__v8si)_mm256_setzero_si256(), \4920(__mmask8)(u)); })49214922#define _mm_rol_epi64(a, b) __extension__ ({\4923(__m128i)__builtin_ia32_prolq128_mask((__v2di)(__m128i)(a), (int)(b), \4924(__v2di)_mm_setzero_di(), \4925(__mmask8)-1); })49264927#define _mm_mask_rol_epi64(w, u, a, b) __extension__ ({\4928(__m128i)__builtin_ia32_prolq128_mask((__v2di)(__m128i)(a), (int)(b), \4929(__v2di)(__m128i)(w), (__mmask8)(u)); })49304931#define _mm_maskz_rol_epi64(u, a, b) __extension__ ({\4932(__m128i)__builtin_ia32_prolq128_mask((__v2di)(__m128i)(a), (int)(b), \4933(__v2di)_mm_setzero_di(), \4934(__mmask8)(u)); })49354936#define _mm256_rol_epi64(a, b) __extension__ ({\4937(__m256i)__builtin_ia32_prolq256_mask((__v4di)(__m256i)(a), (int)(b), \4938(__v4di)_mm256_setzero_si256(), \4939(__mmask8)-1); })49404941#define _mm256_mask_rol_epi64(w, u, a, b) __extension__ ({\4942(__m256i)__builtin_ia32_prolq256_mask((__v4di)(__m256i)(a), (int)(b), \4943(__v4di)(__m256i)(w), (__mmask8)(u)); })49444945#define _mm256_maskz_rol_epi64(u, a, b) __extension__ ({\4946(__m256i)__builtin_ia32_prolq256_mask((__v4di)(__m256i)(a), (int)(b), \4947(__v4di)_mm256_setzero_si256(), \4948(__mmask8)(u)); })49494950static __inline__ __m128i __DEFAULT_FN_ATTRS4951_mm_rolv_epi32 (__m128i __A, __m128i __B)4952{4953return (__m128i) __builtin_ia32_prolvd128_mask ((__v4si) __A,4954(__v4si) __B,4955(__v4si)4956_mm_setzero_si128 (),4957(__mmask8) -1);4958}49594960static __inline__ __m128i __DEFAULT_FN_ATTRS4961_mm_mask_rolv_epi32 (__m128i __W, __mmask8 __U, __m128i __A,4962__m128i __B)4963{4964return (__m128i) __builtin_ia32_prolvd128_mask ((__v4si) __A,4965(__v4si) __B,4966(__v4si) __W,4967(__mmask8) __U);4968}49694970static __inline__ __m128i __DEFAULT_FN_ATTRS4971_mm_maskz_rolv_epi32 (__mmask8 __U, __m128i __A, __m128i __B)4972{4973return (__m128i) __builtin_ia32_prolvd128_mask ((__v4si) __A,4974(__v4si) __B,4975(__v4si)4976_mm_setzero_si128 (),4977(__mmask8) __U);4978}49794980static __inline__ __m256i __DEFAULT_FN_ATTRS4981_mm256_rolv_epi32 (__m256i __A, __m256i __B)4982{4983return (__m256i) __builtin_ia32_prolvd256_mask ((__v8si) __A,4984(__v8si) __B,4985(__v8si)4986_mm256_setzero_si256 (),4987(__mmask8) -1);4988}49894990static __inline__ __m256i __DEFAULT_FN_ATTRS4991_mm256_mask_rolv_epi32 (__m256i __W, __mmask8 __U, __m256i __A,4992__m256i __B)4993{4994return (__m256i) __builtin_ia32_prolvd256_mask ((__v8si) __A,4995(__v8si) __B,4996(__v8si) __W,4997(__mmask8) __U);4998}49995000static __inline__ __m256i __DEFAULT_FN_ATTRS5001_mm256_maskz_rolv_epi32 (__mmask8 __U, __m256i __A, __m256i __B)5002{5003return (__m256i) __builtin_ia32_prolvd256_mask ((__v8si) __A,5004(__v8si) __B,5005(__v8si)5006_mm256_setzero_si256 (),5007(__mmask8) __U);5008}50095010static __inline__ __m128i __DEFAULT_FN_ATTRS5011_mm_rolv_epi64 (__m128i __A, __m128i __B)5012{5013return (__m128i) __builtin_ia32_prolvq128_mask ((__v2di) __A,5014(__v2di) __B,5015(__v2di)5016_mm_setzero_di (),5017(__mmask8) -1);5018}50195020static __inline__ __m128i __DEFAULT_FN_ATTRS5021_mm_mask_rolv_epi64 (__m128i __W, __mmask8 __U, __m128i __A,5022__m128i __B)5023{5024return (__m128i) __builtin_ia32_prolvq128_mask ((__v2di) __A,5025(__v2di) __B,5026(__v2di) __W,5027(__mmask8) __U);5028}50295030static __inline__ __m128i __DEFAULT_FN_ATTRS5031_mm_maskz_rolv_epi64 (__mmask8 __U, __m128i __A, __m128i __B)5032{5033return (__m128i) __builtin_ia32_prolvq128_mask ((__v2di) __A,5034(__v2di) __B,5035(__v2di)5036_mm_setzero_di (),5037(__mmask8) __U);5038}50395040static __inline__ __m256i __DEFAULT_FN_ATTRS5041_mm256_rolv_epi64 (__m256i __A, __m256i __B)5042{5043return (__m256i) __builtin_ia32_prolvq256_mask ((__v4di) __A,5044(__v4di) __B,5045(__v4di)5046_mm256_setzero_si256 (),5047(__mmask8) -1);5048}50495050static __inline__ __m256i __DEFAULT_FN_ATTRS5051_mm256_mask_rolv_epi64 (__m256i __W, __mmask8 __U, __m256i __A,5052__m256i __B)5053{5054return (__m256i) __builtin_ia32_prolvq256_mask ((__v4di) __A,5055(__v4di) __B,5056(__v4di) __W,5057(__mmask8) __U);5058}50595060static __inline__ __m256i __DEFAULT_FN_ATTRS5061_mm256_maskz_rolv_epi64 (__mmask8 __U, __m256i __A, __m256i __B)5062{5063return (__m256i) __builtin_ia32_prolvq256_mask ((__v4di) __A,5064(__v4di) __B,5065(__v4di)5066_mm256_setzero_si256 (),5067(__mmask8) __U);5068}50695070#define _mm_ror_epi32(A, B) __extension__ ({ \5071(__m128i)__builtin_ia32_prord128_mask((__v4si)(__m128i)(A), (int)(B), \5072(__v4si)_mm_setzero_si128(), \5073(__mmask8)-1); })50745075#define _mm_mask_ror_epi32(W, U, A, B) __extension__ ({ \5076(__m128i)__builtin_ia32_prord128_mask((__v4si)(__m128i)(A), (int)(B), \5077(__v4si)(__m128i)(W), (__mmask8)(U)); })50785079#define _mm_maskz_ror_epi32(U, A, B) __extension__ ({ \5080(__m128i)__builtin_ia32_prord128_mask((__v4si)(__m128i)(A), (int)(B), \5081(__v4si)_mm_setzero_si128(), \5082(__mmask8)(U)); })50835084#define _mm256_ror_epi32(A, B) __extension__ ({ \5085(__m256i)__builtin_ia32_prord256_mask((__v8si)(__m256i)(A), (int)(B), \5086(__v8si)_mm256_setzero_si256(), \5087(__mmask8)-1); })50885089#define _mm256_mask_ror_epi32(W, U, A, B) __extension__ ({ \5090(__m256i)__builtin_ia32_prord256_mask((__v8si)(__m256i)(A), (int)(B), \5091(__v8si)(__m256i)(W), (__mmask8)(U)); })50925093#define _mm256_maskz_ror_epi32(U, A, B) __extension__ ({ \5094(__m256i)__builtin_ia32_prord256_mask((__v8si)(__m256i)(A), (int)(B), \5095(__v8si)_mm256_setzero_si256(), \5096(__mmask8)(U)); })50975098#define _mm_ror_epi64(A, B) __extension__ ({ \5099(__m128i)__builtin_ia32_prorq128_mask((__v2di)(__m128i)(A), (int)(B), \5100(__v2di)_mm_setzero_di(), \5101(__mmask8)-1); })51025103#define _mm_mask_ror_epi64(W, U, A, B) __extension__ ({ \5104(__m128i)__builtin_ia32_prorq128_mask((__v2di)(__m128i)(A), (int)(B), \5105(__v2di)(__m128i)(W), (__mmask8)(U)); })51065107#define _mm_maskz_ror_epi64(U, A, B) __extension__ ({ \5108(__m128i)__builtin_ia32_prorq128_mask((__v2di)(__m128i)(A), (int)(B), \5109(__v2di)_mm_setzero_di(), \5110(__mmask8)(U)); })51115112#define _mm256_ror_epi64(A, B) __extension__ ({ \5113(__m256i)__builtin_ia32_prorq256_mask((__v4di)(__m256i)(A), (int)(B), \5114(__v4di)_mm256_setzero_si256(), \5115(__mmask8)-1); })51165117#define _mm256_mask_ror_epi64(W, U, A, B) __extension__ ({ \5118(__m256i)__builtin_ia32_prorq256_mask((__v4di)(__m256i)(A), (int)(B), \5119(__v4di)(__m256i)(W), (__mmask8)(U)); })51205121#define _mm256_maskz_ror_epi64(U, A, B) __extension__ ({ \5122(__m256i)__builtin_ia32_prorq256_mask((__v4di)(__m256i)(A), (int)(B), \5123(__v4di)_mm256_setzero_si256(), \5124(__mmask8)(U)); })51255126static __inline__ __m128i __DEFAULT_FN_ATTRS5127_mm_mask_sll_epi32 (__m128i __W, __mmask8 __U, __m128i __A,5128__m128i __B)5129{5130return (__m128i) __builtin_ia32_pslld128_mask ((__v4si) __A,5131(__v4si) __B,5132(__v4si) __W,5133(__mmask8) __U);5134}51355136static __inline__ __m128i __DEFAULT_FN_ATTRS5137_mm_maskz_sll_epi32 (__mmask8 __U, __m128i __A, __m128i __B)5138{5139return (__m128i) __builtin_ia32_pslld128_mask ((__v4si) __A,5140(__v4si) __B,5141(__v4si)5142_mm_setzero_si128 (),5143(__mmask8) __U);5144}51455146static __inline__ __m256i __DEFAULT_FN_ATTRS5147_mm256_mask_sll_epi32 (__m256i __W, __mmask8 __U, __m256i __A,5148__m128i __B)5149{5150return (__m256i) __builtin_ia32_pslld256_mask ((__v8si) __A,5151(__v4si) __B,5152(__v8si) __W,5153(__mmask8) __U);5154}51555156static __inline__ __m256i __DEFAULT_FN_ATTRS5157_mm256_maskz_sll_epi32 (__mmask8 __U, __m256i __A, __m128i __B)5158{5159return (__m256i) __builtin_ia32_pslld256_mask ((__v8si) __A,5160(__v4si) __B,5161(__v8si)5162_mm256_setzero_si256 (),5163(__mmask8) __U);5164}51655166#define _mm_mask_slli_epi32(W, U, A, B) __extension__ ({ \5167(__m128i)__builtin_ia32_pslldi128_mask((__v4si)(__m128i)(A), (int)(B), \5168(__v4si)(__m128i)(W), \5169(__mmask8)(U)); })51705171#define _mm_maskz_slli_epi32(U, A, B) __extension__ ({ \5172(__m128i)__builtin_ia32_pslldi128_mask((__v4si)(__m128i)(A), (int)(B), \5173(__v4si)_mm_setzero_si128(), \5174(__mmask8)(U)); })51755176#define _mm256_mask_slli_epi32(W, U, A, B) __extension__ ({ \5177(__m256i)__builtin_ia32_pslldi256_mask((__v8si)(__m256i)(A), (int)(B), \5178(__v8si)(__m256i)(W), \5179(__mmask8)(U)); })51805181#define _mm256_maskz_slli_epi32(U, A, B) __extension__ ({ \5182(__m256i)__builtin_ia32_pslldi256_mask((__v8si)(__m256i)(A), (int)(B), \5183(__v8si)_mm256_setzero_si256(), \5184(__mmask8)(U)); })51855186static __inline__ __m128i __DEFAULT_FN_ATTRS5187_mm_mask_sll_epi64 (__m128i __W, __mmask8 __U, __m128i __A,5188__m128i __B)5189{5190return (__m128i) __builtin_ia32_psllq128_mask ((__v2di) __A,5191(__v2di) __B,5192(__v2di) __W,5193(__mmask8) __U);5194}51955196static __inline__ __m128i __DEFAULT_FN_ATTRS5197_mm_maskz_sll_epi64 (__mmask8 __U, __m128i __A, __m128i __B)5198{5199return (__m128i) __builtin_ia32_psllq128_mask ((__v2di) __A,5200(__v2di) __B,5201(__v2di)5202_mm_setzero_di (),5203(__mmask8) __U);5204}52055206static __inline__ __m256i __DEFAULT_FN_ATTRS5207_mm256_mask_sll_epi64 (__m256i __W, __mmask8 __U, __m256i __A,5208__m128i __B)5209{5210return (__m256i) __builtin_ia32_psllq256_mask ((__v4di) __A,5211(__v2di) __B,5212(__v4di) __W,5213(__mmask8) __U);5214}52155216static __inline__ __m256i __DEFAULT_FN_ATTRS5217_mm256_maskz_sll_epi64 (__mmask8 __U, __m256i __A, __m128i __B)5218{5219return (__m256i) __builtin_ia32_psllq256_mask ((__v4di) __A,5220(__v2di) __B,5221(__v4di)5222_mm256_setzero_si256 (),5223(__mmask8) __U);5224}52255226#define _mm_mask_slli_epi64(W, U, A, B) __extension__ ({ \5227(__m128i)__builtin_ia32_psllqi128_mask((__v2di)(__m128i)(A), (int)(B), \5228(__v2di)(__m128i)(W), \5229(__mmask8)(U)); })52305231#define _mm_maskz_slli_epi64(U, A, B) __extension__ ({ \5232(__m128i)__builtin_ia32_psllqi128_mask((__v2di)(__m128i)(A), (int)(B), \5233(__v2di)_mm_setzero_di(), \5234(__mmask8)(U)); })52355236#define _mm256_mask_slli_epi64(W, U, A, B) __extension__ ({ \5237(__m256i)__builtin_ia32_psllqi256_mask((__v4di)(__m256i)(A), (int)(B), \5238(__v4di)(__m256i)(W), \5239(__mmask8)(U)); })52405241#define _mm256_maskz_slli_epi64(U, A, B) __extension__ ({ \5242(__m256i)__builtin_ia32_psllqi256_mask((__v4di)(__m256i)(A), (int)(B), \5243(__v4di)_mm256_setzero_si256(), \5244(__mmask8)(U)); })524552465247static __inline__ __m128i __DEFAULT_FN_ATTRS5248_mm_rorv_epi32 (__m128i __A, __m128i __B)5249{5250return (__m128i) __builtin_ia32_prorvd128_mask ((__v4si) __A,5251(__v4si) __B,5252(__v4si)5253_mm_setzero_si128 (),5254(__mmask8) -1);5255}52565257static __inline__ __m128i __DEFAULT_FN_ATTRS5258_mm_mask_rorv_epi32 (__m128i __W, __mmask8 __U, __m128i __A,5259__m128i __B)5260{5261return (__m128i) __builtin_ia32_prorvd128_mask ((__v4si) __A,5262(__v4si) __B,5263(__v4si) __W,5264(__mmask8) __U);5265}52665267static __inline__ __m128i __DEFAULT_FN_ATTRS5268_mm_maskz_rorv_epi32 (__mmask8 __U, __m128i __A, __m128i __B)5269{5270return (__m128i) __builtin_ia32_prorvd128_mask ((__v4si) __A,5271(__v4si) __B,5272(__v4si)5273_mm_setzero_si128 (),5274(__mmask8) __U);5275}52765277static __inline__ __m256i __DEFAULT_FN_ATTRS5278_mm256_rorv_epi32 (__m256i __A, __m256i __B)5279{5280return (__m256i) __builtin_ia32_prorvd256_mask ((__v8si) __A,5281(__v8si) __B,5282(__v8si)5283_mm256_setzero_si256 (),5284(__mmask8) -1);5285}52865287static __inline__ __m256i __DEFAULT_FN_ATTRS5288_mm256_mask_rorv_epi32 (__m256i __W, __mmask8 __U, __m256i __A,5289__m256i __B)5290{5291return (__m256i) __builtin_ia32_prorvd256_mask ((__v8si) __A,5292(__v8si) __B,5293(__v8si) __W,5294(__mmask8) __U);5295}52965297static __inline__ __m256i __DEFAULT_FN_ATTRS5298_mm256_maskz_rorv_epi32 (__mmask8 __U, __m256i __A, __m256i __B)5299{5300return (__m256i) __builtin_ia32_prorvd256_mask ((__v8si) __A,5301(__v8si) __B,5302(__v8si)5303_mm256_setzero_si256 (),5304(__mmask8) __U);5305}53065307static __inline__ __m128i __DEFAULT_FN_ATTRS5308_mm_rorv_epi64 (__m128i __A, __m128i __B)5309{5310return (__m128i) __builtin_ia32_prorvq128_mask ((__v2di) __A,5311(__v2di) __B,5312(__v2di)5313_mm_setzero_di (),5314(__mmask8) -1);5315}53165317static __inline__ __m128i __DEFAULT_FN_ATTRS5318_mm_mask_rorv_epi64 (__m128i __W, __mmask8 __U, __m128i __A,5319__m128i __B)5320{5321return (__m128i) __builtin_ia32_prorvq128_mask ((__v2di) __A,5322(__v2di) __B,5323(__v2di) __W,5324(__mmask8) __U);5325}53265327static __inline__ __m128i __DEFAULT_FN_ATTRS5328_mm_maskz_rorv_epi64 (__mmask8 __U, __m128i __A, __m128i __B)5329{5330return (__m128i) __builtin_ia32_prorvq128_mask ((__v2di) __A,5331(__v2di) __B,5332(__v2di)5333_mm_setzero_di (),5334(__mmask8) __U);5335}53365337static __inline__ __m256i __DEFAULT_FN_ATTRS5338_mm256_rorv_epi64 (__m256i __A, __m256i __B)5339{5340return (__m256i) __builtin_ia32_prorvq256_mask ((__v4di) __A,5341(__v4di) __B,5342(__v4di)5343_mm256_setzero_si256 (),5344(__mmask8) -1);5345}53465347static __inline__ __m256i __DEFAULT_FN_ATTRS5348_mm256_mask_rorv_epi64 (__m256i __W, __mmask8 __U, __m256i __A,5349__m256i __B)5350{5351return (__m256i) __builtin_ia32_prorvq256_mask ((__v4di) __A,5352(__v4di) __B,5353(__v4di) __W,5354(__mmask8) __U);5355}53565357static __inline__ __m256i __DEFAULT_FN_ATTRS5358_mm256_maskz_rorv_epi64 (__mmask8 __U, __m256i __A, __m256i __B)5359{5360return (__m256i) __builtin_ia32_prorvq256_mask ((__v4di) __A,5361(__v4di) __B,5362(__v4di)5363_mm256_setzero_si256 (),5364(__mmask8) __U);5365}53665367static __inline__ __m128i __DEFAULT_FN_ATTRS5368_mm_mask_sllv_epi64 (__m128i __W, __mmask8 __U, __m128i __X,5369__m128i __Y)5370{5371return (__m128i) __builtin_ia32_psllv2di_mask ((__v2di) __X,5372(__v2di) __Y,5373(__v2di) __W,5374(__mmask8) __U);5375}53765377static __inline__ __m128i __DEFAULT_FN_ATTRS5378_mm_maskz_sllv_epi64 (__mmask8 __U, __m128i __X, __m128i __Y)5379{5380return (__m128i) __builtin_ia32_psllv2di_mask ((__v2di) __X,5381(__v2di) __Y,5382(__v2di)5383_mm_setzero_di (),5384(__mmask8) __U);5385}53865387static __inline__ __m256i __DEFAULT_FN_ATTRS5388_mm256_mask_sllv_epi64 (__m256i __W, __mmask8 __U, __m256i __X,5389__m256i __Y)5390{5391return (__m256i) __builtin_ia32_psllv4di_mask ((__v4di) __X,5392(__v4di) __Y,5393(__v4di) __W,5394(__mmask8) __U);5395}53965397static __inline__ __m256i __DEFAULT_FN_ATTRS5398_mm256_maskz_sllv_epi64 (__mmask8 __U, __m256i __X, __m256i __Y)5399{5400return (__m256i) __builtin_ia32_psllv4di_mask ((__v4di) __X,5401(__v4di) __Y,5402(__v4di)5403_mm256_setzero_si256 (),5404(__mmask8) __U);5405}54065407static __inline__ __m128i __DEFAULT_FN_ATTRS5408_mm_mask_sllv_epi32 (__m128i __W, __mmask8 __U, __m128i __X,5409__m128i __Y)5410{5411return (__m128i) __builtin_ia32_psllv4si_mask ((__v4si) __X,5412(__v4si) __Y,5413(__v4si) __W,5414(__mmask8) __U);5415}54165417static __inline__ __m128i __DEFAULT_FN_ATTRS5418_mm_maskz_sllv_epi32 (__mmask8 __U, __m128i __X, __m128i __Y)5419{5420return (__m128i) __builtin_ia32_psllv4si_mask ((__v4si) __X,5421(__v4si) __Y,5422(__v4si)5423_mm_setzero_si128 (),5424(__mmask8) __U);5425}54265427static __inline__ __m256i __DEFAULT_FN_ATTRS5428_mm256_mask_sllv_epi32 (__m256i __W, __mmask8 __U, __m256i __X,5429__m256i __Y)5430{5431return (__m256i) __builtin_ia32_psllv8si_mask ((__v8si) __X,5432(__v8si) __Y,5433(__v8si) __W,5434(__mmask8) __U);5435}54365437static __inline__ __m256i __DEFAULT_FN_ATTRS5438_mm256_maskz_sllv_epi32 (__mmask8 __U, __m256i __X, __m256i __Y)5439{5440return (__m256i) __builtin_ia32_psllv8si_mask ((__v8si) __X,5441(__v8si) __Y,5442(__v8si)5443_mm256_setzero_si256 (),5444(__mmask8) __U);5445}5446544754485449static __inline__ __m128i __DEFAULT_FN_ATTRS5450_mm_mask_srlv_epi64 (__m128i __W, __mmask8 __U, __m128i __X,5451__m128i __Y)5452{5453return (__m128i) __builtin_ia32_psrlv2di_mask ((__v2di) __X,5454(__v2di) __Y,5455(__v2di) __W,5456(__mmask8) __U);5457}54585459static __inline__ __m128i __DEFAULT_FN_ATTRS5460_mm_maskz_srlv_epi64 (__mmask8 __U, __m128i __X, __m128i __Y)5461{5462return (__m128i) __builtin_ia32_psrlv2di_mask ((__v2di) __X,5463(__v2di) __Y,5464(__v2di)5465_mm_setzero_di (),5466(__mmask8) __U);5467}54685469static __inline__ __m256i __DEFAULT_FN_ATTRS5470_mm256_mask_srlv_epi64 (__m256i __W, __mmask8 __U, __m256i __X,5471__m256i __Y)5472{5473return (__m256i) __builtin_ia32_psrlv4di_mask ((__v4di) __X,5474(__v4di) __Y,5475(__v4di) __W,5476(__mmask8) __U);5477}54785479static __inline__ __m256i __DEFAULT_FN_ATTRS5480_mm256_maskz_srlv_epi64 (__mmask8 __U, __m256i __X, __m256i __Y)5481{5482return (__m256i) __builtin_ia32_psrlv4di_mask ((__v4di) __X,5483(__v4di) __Y,5484(__v4di)5485_mm256_setzero_si256 (),5486(__mmask8) __U);5487}54885489static __inline__ __m128i __DEFAULT_FN_ATTRS5490_mm_mask_srlv_epi32 (__m128i __W, __mmask8 __U, __m128i __X,5491__m128i __Y)5492{5493return (__m128i) __builtin_ia32_psrlv4si_mask ((__v4si) __X,5494(__v4si) __Y,5495(__v4si) __W,5496(__mmask8) __U);5497}54985499static __inline__ __m128i __DEFAULT_FN_ATTRS5500_mm_maskz_srlv_epi32 (__mmask8 __U, __m128i __X, __m128i __Y)5501{5502return (__m128i) __builtin_ia32_psrlv4si_mask ((__v4si) __X,5503(__v4si) __Y,5504(__v4si)5505_mm_setzero_si128 (),5506(__mmask8) __U);5507}55085509static __inline__ __m256i __DEFAULT_FN_ATTRS5510_mm256_mask_srlv_epi32 (__m256i __W, __mmask8 __U, __m256i __X,5511__m256i __Y)5512{5513return (__m256i) __builtin_ia32_psrlv8si_mask ((__v8si) __X,5514(__v8si) __Y,5515(__v8si) __W,5516(__mmask8) __U);5517}55185519static __inline__ __m256i __DEFAULT_FN_ATTRS5520_mm256_maskz_srlv_epi32 (__mmask8 __U, __m256i __X, __m256i __Y)5521{5522return (__m256i) __builtin_ia32_psrlv8si_mask ((__v8si) __X,5523(__v8si) __Y,5524(__v8si)5525_mm256_setzero_si256 (),5526(__mmask8) __U);5527}5528552955305531static __inline__ __m128i __DEFAULT_FN_ATTRS5532_mm_mask_srl_epi32 (__m128i __W, __mmask8 __U, __m128i __A,5533__m128i __B)5534{5535return (__m128i) __builtin_ia32_psrld128_mask ((__v4si) __A,5536(__v4si) __B,5537(__v4si) __W,5538(__mmask8) __U);5539}55405541static __inline__ __m128i __DEFAULT_FN_ATTRS5542_mm_maskz_srl_epi32 (__mmask8 __U, __m128i __A, __m128i __B)5543{5544return (__m128i) __builtin_ia32_psrld128_mask ((__v4si) __A,5545(__v4si) __B,5546(__v4si)5547_mm_setzero_si128 (),5548(__mmask8) __U);5549}55505551static __inline__ __m256i __DEFAULT_FN_ATTRS5552_mm256_mask_srl_epi32 (__m256i __W, __mmask8 __U, __m256i __A,5553__m128i __B)5554{5555return (__m256i) __builtin_ia32_psrld256_mask ((__v8si) __A,5556(__v4si) __B,5557(__v8si) __W,5558(__mmask8) __U);5559}55605561static __inline__ __m256i __DEFAULT_FN_ATTRS5562_mm256_maskz_srl_epi32 (__mmask8 __U, __m256i __A, __m128i __B)5563{5564return (__m256i) __builtin_ia32_psrld256_mask ((__v8si) __A,5565(__v4si) __B,5566(__v8si)5567_mm256_setzero_si256 (),5568(__mmask8) __U);5569}55705571#define _mm_mask_srli_epi32(W, U, A, imm) __extension__ ({ \5572(__m128i)__builtin_ia32_psrldi128_mask((__v4si)(__m128i)(A), (int)(imm), \5573(__v4si)(__m128i)(W), \5574(__mmask8)(U)); })55755576#define _mm_maskz_srli_epi32(U, A, imm) __extension__ ({ \5577(__m128i)__builtin_ia32_psrldi128_mask((__v4si)(__m128i)(A), (int)(imm), \5578(__v4si)_mm_setzero_si128(), \5579(__mmask8)(U)); })55805581#define _mm256_mask_srli_epi32(W, U, A, imm) __extension__ ({ \5582(__m256i)__builtin_ia32_psrldi256_mask((__v8si)(__m256i)(A), (int)(imm), \5583(__v8si)(__m256i)(W), \5584(__mmask8)(U)); })55855586#define _mm256_maskz_srli_epi32(U, A, imm) __extension__ ({ \5587(__m256i)__builtin_ia32_psrldi256_mask((__v8si)(__m256i)(A), (int)(imm), \5588(__v8si)_mm256_setzero_si256(), \5589(__mmask8)(U)); })55905591static __inline__ __m128i __DEFAULT_FN_ATTRS5592_mm_mask_srl_epi64 (__m128i __W, __mmask8 __U, __m128i __A,5593__m128i __B)5594{5595return (__m128i) __builtin_ia32_psrlq128_mask ((__v2di) __A,5596(__v2di) __B,5597(__v2di) __W,5598(__mmask8) __U);5599}56005601static __inline__ __m128i __DEFAULT_FN_ATTRS5602_mm_maskz_srl_epi64 (__mmask8 __U, __m128i __A, __m128i __B)5603{5604return (__m128i) __builtin_ia32_psrlq128_mask ((__v2di) __A,5605(__v2di) __B,5606(__v2di)5607_mm_setzero_di (),5608(__mmask8) __U);5609}56105611static __inline__ __m256i __DEFAULT_FN_ATTRS5612_mm256_mask_srl_epi64 (__m256i __W, __mmask8 __U, __m256i __A,5613__m128i __B)5614{5615return (__m256i) __builtin_ia32_psrlq256_mask ((__v4di) __A,5616(__v2di) __B,5617(__v4di) __W,5618(__mmask8) __U);5619}56205621static __inline__ __m256i __DEFAULT_FN_ATTRS5622_mm256_maskz_srl_epi64 (__mmask8 __U, __m256i __A, __m128i __B)5623{5624return (__m256i) __builtin_ia32_psrlq256_mask ((__v4di) __A,5625(__v2di) __B,5626(__v4di)5627_mm256_setzero_si256 (),5628(__mmask8) __U);5629}56305631#define _mm_mask_srli_epi64(W, U, A, imm) __extension__ ({ \5632(__m128i)__builtin_ia32_psrlqi128_mask((__v2di)(__m128i)(A), (int)(imm), \5633(__v2di)(__m128i)(W), \5634(__mmask8)(U)); })56355636#define _mm_maskz_srli_epi64(U, A, imm) __extension__ ({ \5637(__m128i)__builtin_ia32_psrlqi128_mask((__v2di)(__m128i)(A), (int)(imm), \5638(__v2di)_mm_setzero_si128(), \5639(__mmask8)(U)); })56405641#define _mm256_mask_srli_epi64(W, U, A, imm) __extension__ ({ \5642(__m256i)__builtin_ia32_psrlqi256_mask((__v4di)(__m256i)(A), (int)(imm), \5643(__v4di)(__m256i)(W), \5644(__mmask8)(U)); })56455646#define _mm256_maskz_srli_epi64(U, A, imm) __extension__ ({ \5647(__m256i)__builtin_ia32_psrlqi256_mask((__v4di)(__m256i)(A), (int)(imm), \5648(__v4di)_mm256_setzero_si256(), \5649(__mmask8)(U)); })56505651static __inline__ __m128i __DEFAULT_FN_ATTRS5652_mm_mask_srav_epi32 (__m128i __W, __mmask8 __U, __m128i __X,5653__m128i __Y)5654{5655return (__m128i) __builtin_ia32_psrav4si_mask ((__v4si) __X,5656(__v4si) __Y,5657(__v4si) __W,5658(__mmask8) __U);5659}56605661static __inline__ __m128i __DEFAULT_FN_ATTRS5662_mm_maskz_srav_epi32 (__mmask8 __U, __m128i __X, __m128i __Y)5663{5664return (__m128i) __builtin_ia32_psrav4si_mask ((__v4si) __X,5665(__v4si) __Y,5666(__v4si)5667_mm_setzero_si128 (),5668(__mmask8) __U);5669}56705671static __inline__ __m256i __DEFAULT_FN_ATTRS5672_mm256_mask_srav_epi32 (__m256i __W, __mmask8 __U, __m256i __X,5673__m256i __Y)5674{5675return (__m256i) __builtin_ia32_psrav8si_mask ((__v8si) __X,5676(__v8si) __Y,5677(__v8si) __W,5678(__mmask8) __U);5679}56805681static __inline__ __m256i __DEFAULT_FN_ATTRS5682_mm256_maskz_srav_epi32 (__mmask8 __U, __m256i __X, __m256i __Y)5683{5684return (__m256i) __builtin_ia32_psrav8si_mask ((__v8si) __X,5685(__v8si) __Y,5686(__v8si)5687_mm256_setzero_si256 (),5688(__mmask8) __U);5689}56905691static __inline__ __m128i __DEFAULT_FN_ATTRS5692_mm_srav_epi64 (__m128i __X, __m128i __Y)5693{5694return (__m128i) __builtin_ia32_psravq128_mask ((__v2di) __X,5695(__v2di) __Y,5696(__v2di)5697_mm_setzero_di (),5698(__mmask8) -1);5699}57005701static __inline__ __m128i __DEFAULT_FN_ATTRS5702_mm_mask_srav_epi64 (__m128i __W, __mmask8 __U, __m128i __X,5703__m128i __Y)5704{5705return (__m128i) __builtin_ia32_psravq128_mask ((__v2di) __X,5706(__v2di) __Y,5707(__v2di) __W,5708(__mmask8) __U);5709}57105711static __inline__ __m128i __DEFAULT_FN_ATTRS5712_mm_maskz_srav_epi64 (__mmask8 __U, __m128i __X, __m128i __Y)5713{5714return (__m128i) __builtin_ia32_psravq128_mask ((__v2di) __X,5715(__v2di) __Y,5716(__v2di)5717_mm_setzero_di (),5718(__mmask8) __U);5719}57205721static __inline__ __m256i __DEFAULT_FN_ATTRS5722_mm256_srav_epi64 (__m256i __X, __m256i __Y)5723{5724return (__m256i) __builtin_ia32_psravq256_mask ((__v4di) __X,5725(__v4di) __Y,5726(__v4di)5727_mm256_setzero_si256 (),5728(__mmask8) -1);5729}57305731static __inline__ __m256i __DEFAULT_FN_ATTRS5732_mm256_mask_srav_epi64 (__m256i __W, __mmask8 __U, __m256i __X,5733__m256i __Y)5734{5735return (__m256i) __builtin_ia32_psravq256_mask ((__v4di) __X,5736(__v4di) __Y,5737(__v4di) __W,5738(__mmask8) __U);5739}57405741static __inline__ __m256i __DEFAULT_FN_ATTRS5742_mm256_maskz_srav_epi64 (__mmask8 __U, __m256i __X, __m256i __Y)5743{5744return (__m256i) __builtin_ia32_psravq256_mask ((__v4di) __X,5745(__v4di) __Y,5746(__v4di)5747_mm256_setzero_si256 (),5748(__mmask8) __U);5749}57505751static __inline__ __m128i __DEFAULT_FN_ATTRS5752_mm_mask_mov_epi32 (__m128i __W, __mmask8 __U, __m128i __A)5753{5754return (__m128i) __builtin_ia32_selectd_128 ((__mmask8) __U,5755(__v4si) __A,5756(__v4si) __W);5757}57585759static __inline__ __m128i __DEFAULT_FN_ATTRS5760_mm_maskz_mov_epi32 (__mmask8 __U, __m128i __A)5761{5762return (__m128i) __builtin_ia32_selectd_128 ((__mmask8) __U,5763(__v4si) __A,5764(__v4si) _mm_setzero_si128 ());5765}576657675768static __inline__ __m256i __DEFAULT_FN_ATTRS5769_mm256_mask_mov_epi32 (__m256i __W, __mmask8 __U, __m256i __A)5770{5771return (__m256i) __builtin_ia32_selectd_256 ((__mmask8) __U,5772(__v8si) __A,5773(__v8si) __W);5774}57755776static __inline__ __m256i __DEFAULT_FN_ATTRS5777_mm256_maskz_mov_epi32 (__mmask8 __U, __m256i __A)5778{5779return (__m256i) __builtin_ia32_selectd_256 ((__mmask8) __U,5780(__v8si) __A,5781(__v8si) _mm256_setzero_si256 ());5782}57835784static __inline__ __m128i __DEFAULT_FN_ATTRS5785_mm_mask_load_epi32 (__m128i __W, __mmask8 __U, void const *__P)5786{5787return (__m128i) __builtin_ia32_movdqa32load128_mask ((__v4si *) __P,5788(__v4si) __W,5789(__mmask8)5790__U);5791}57925793static __inline__ __m128i __DEFAULT_FN_ATTRS5794_mm_maskz_load_epi32 (__mmask8 __U, void const *__P)5795{5796return (__m128i) __builtin_ia32_movdqa32load128_mask ((__v4si *) __P,5797(__v4si)5798_mm_setzero_si128 (),5799(__mmask8)5800__U);5801}58025803static __inline__ __m256i __DEFAULT_FN_ATTRS5804_mm256_mask_load_epi32 (__m256i __W, __mmask8 __U, void const *__P)5805{5806return (__m256i) __builtin_ia32_movdqa32load256_mask ((__v8si *) __P,5807(__v8si) __W,5808(__mmask8)5809__U);5810}58115812static __inline__ __m256i __DEFAULT_FN_ATTRS5813_mm256_maskz_load_epi32 (__mmask8 __U, void const *__P)5814{5815return (__m256i) __builtin_ia32_movdqa32load256_mask ((__v8si *) __P,5816(__v8si)5817_mm256_setzero_si256 (),5818(__mmask8)5819__U);5820}58215822static __inline__ void __DEFAULT_FN_ATTRS5823_mm_mask_store_epi32 (void *__P, __mmask8 __U, __m128i __A)5824{5825__builtin_ia32_movdqa32store128_mask ((__v4si *) __P,5826(__v4si) __A,5827(__mmask8) __U);5828}58295830static __inline__ void __DEFAULT_FN_ATTRS5831_mm256_mask_store_epi32 (void *__P, __mmask8 __U, __m256i __A)5832{5833__builtin_ia32_movdqa32store256_mask ((__v8si *) __P,5834(__v8si) __A,5835(__mmask8) __U);5836}58375838static __inline__ __m128i __DEFAULT_FN_ATTRS5839_mm_mask_mov_epi64 (__m128i __W, __mmask8 __U, __m128i __A)5840{5841return (__m128i) __builtin_ia32_selectq_128 ((__mmask8) __U,5842(__v2di) __A,5843(__v2di) __W);5844}58455846static __inline__ __m128i __DEFAULT_FN_ATTRS5847_mm_maskz_mov_epi64 (__mmask8 __U, __m128i __A)5848{5849return (__m128i) __builtin_ia32_selectq_128 ((__mmask8) __U,5850(__v2di) __A,5851(__v2di) _mm_setzero_di ());5852}58535854static __inline__ __m256i __DEFAULT_FN_ATTRS5855_mm256_mask_mov_epi64 (__m256i __W, __mmask8 __U, __m256i __A)5856{5857return (__m256i) __builtin_ia32_selectq_256 ((__mmask8) __U,5858(__v4di) __A,5859(__v4di) __W);5860}58615862static __inline__ __m256i __DEFAULT_FN_ATTRS5863_mm256_maskz_mov_epi64 (__mmask8 __U, __m256i __A)5864{5865return (__m256i) __builtin_ia32_selectq_256 ((__mmask8) __U,5866(__v4di) __A,5867(__v4di) _mm256_setzero_si256 ());5868}58695870static __inline__ __m128i __DEFAULT_FN_ATTRS5871_mm_mask_load_epi64 (__m128i __W, __mmask8 __U, void const *__P)5872{5873return (__m128i) __builtin_ia32_movdqa64load128_mask ((__v2di *) __P,5874(__v2di) __W,5875(__mmask8)5876__U);5877}58785879static __inline__ __m128i __DEFAULT_FN_ATTRS5880_mm_maskz_load_epi64 (__mmask8 __U, void const *__P)5881{5882return (__m128i) __builtin_ia32_movdqa64load128_mask ((__v2di *) __P,5883(__v2di)5884_mm_setzero_di (),5885(__mmask8)5886__U);5887}58885889static __inline__ __m256i __DEFAULT_FN_ATTRS5890_mm256_mask_load_epi64 (__m256i __W, __mmask8 __U, void const *__P)5891{5892return (__m256i) __builtin_ia32_movdqa64load256_mask ((__v4di *) __P,5893(__v4di) __W,5894(__mmask8)5895__U);5896}58975898static __inline__ __m256i __DEFAULT_FN_ATTRS5899_mm256_maskz_load_epi64 (__mmask8 __U, void const *__P)5900{5901return (__m256i) __builtin_ia32_movdqa64load256_mask ((__v4di *) __P,5902(__v4di)5903_mm256_setzero_si256 (),5904(__mmask8)5905__U);5906}59075908static __inline__ void __DEFAULT_FN_ATTRS5909_mm_mask_store_epi64 (void *__P, __mmask8 __U, __m128i __A)5910{5911__builtin_ia32_movdqa64store128_mask ((__v2di *) __P,5912(__v2di) __A,5913(__mmask8) __U);5914}59155916static __inline__ void __DEFAULT_FN_ATTRS5917_mm256_mask_store_epi64 (void *__P, __mmask8 __U, __m256i __A)5918{5919__builtin_ia32_movdqa64store256_mask ((__v4di *) __P,5920(__v4di) __A,5921(__mmask8) __U);5922}59235924static __inline__ __m128d __DEFAULT_FN_ATTRS5925_mm_mask_movedup_pd (__m128d __W, __mmask8 __U, __m128d __A)5926{5927return (__m128d)__builtin_ia32_selectpd_128((__mmask8)__U,5928(__v2df)_mm_movedup_pd(__A),5929(__v2df)__W);5930}59315932static __inline__ __m128d __DEFAULT_FN_ATTRS5933_mm_maskz_movedup_pd (__mmask8 __U, __m128d __A)5934{5935return (__m128d)__builtin_ia32_selectpd_128((__mmask8)__U,5936(__v2df)_mm_movedup_pd(__A),5937(__v2df)_mm_setzero_pd());5938}59395940static __inline__ __m256d __DEFAULT_FN_ATTRS5941_mm256_mask_movedup_pd (__m256d __W, __mmask8 __U, __m256d __A)5942{5943return (__m256d)__builtin_ia32_selectpd_256((__mmask8)__U,5944(__v4df)_mm256_movedup_pd(__A),5945(__v4df)__W);5946}59475948static __inline__ __m256d __DEFAULT_FN_ATTRS5949_mm256_maskz_movedup_pd (__mmask8 __U, __m256d __A)5950{5951return (__m256d)__builtin_ia32_selectpd_256((__mmask8)__U,5952(__v4df)_mm256_movedup_pd(__A),5953(__v4df)_mm256_setzero_pd());5954}595559565957#define _mm_mask_set1_epi32(O, M, A) __extension__ ({ \5958(__m128i)__builtin_ia32_pbroadcastd128_gpr_mask((int)(A), \5959(__v4si)(__m128i)(O), \5960(__mmask8)(M)); })59615962#define _mm_maskz_set1_epi32(M, A) __extension__ ({ \5963(__m128i)__builtin_ia32_pbroadcastd128_gpr_mask((int)(A), \5964(__v4si)_mm_setzero_si128(), \5965(__mmask8)(M)); })59665967#define _mm256_mask_set1_epi32(O, M, A) __extension__ ({ \5968(__m256i)__builtin_ia32_pbroadcastd256_gpr_mask((int)(A), \5969(__v8si)(__m256i)(O), \5970(__mmask8)(M)); })59715972#define _mm256_maskz_set1_epi32(M, A) __extension__ ({ \5973(__m256i)__builtin_ia32_pbroadcastd256_gpr_mask((int)(A), \5974(__v8si)_mm256_setzero_si256(), \5975(__mmask8)(M)); })59765977static __inline__ __m128i __DEFAULT_FN_ATTRS5978_mm_mask_set1_epi64 (__m128i __O, __mmask8 __M, long long __A)5979{5980return (__m128i) __builtin_ia32_pbroadcastq128_gpr_mask (__A, (__v2di) __O,5981__M);5982}59835984static __inline__ __m128i __DEFAULT_FN_ATTRS5985_mm_maskz_set1_epi64 (__mmask8 __M, long long __A)5986{5987return (__m128i) __builtin_ia32_pbroadcastq128_gpr_mask (__A,5988(__v2di)5989_mm_setzero_si128 (),5990__M);5991}59925993static __inline__ __m256i __DEFAULT_FN_ATTRS5994_mm256_mask_set1_epi64 (__m256i __O, __mmask8 __M, long long __A)5995{5996return (__m256i) __builtin_ia32_pbroadcastq256_gpr_mask (__A, (__v4di) __O,5997__M);5998}59996000static __inline__ __m256i __DEFAULT_FN_ATTRS6001_mm256_maskz_set1_epi64 (__mmask8 __M, long long __A)6002{6003return (__m256i) __builtin_ia32_pbroadcastq256_gpr_mask (__A,6004(__v4di)6005_mm256_setzero_si256 (),6006__M);6007}60086009#define _mm_fixupimm_pd(A, B, C, imm) __extension__ ({ \6010(__m128d)__builtin_ia32_fixupimmpd128_mask((__v2df)(__m128d)(A), \6011(__v2df)(__m128d)(B), \6012(__v2di)(__m128i)(C), (int)(imm), \6013(__mmask8)-1); })60146015#define _mm_mask_fixupimm_pd(A, U, B, C, imm) __extension__ ({ \6016(__m128d)__builtin_ia32_fixupimmpd128_mask((__v2df)(__m128d)(A), \6017(__v2df)(__m128d)(B), \6018(__v2di)(__m128i)(C), (int)(imm), \6019(__mmask8)(U)); })60206021#define _mm_maskz_fixupimm_pd(U, A, B, C, imm) __extension__ ({ \6022(__m128d)__builtin_ia32_fixupimmpd128_maskz((__v2df)(__m128d)(A), \6023(__v2df)(__m128d)(B), \6024(__v2di)(__m128i)(C), \6025(int)(imm), (__mmask8)(U)); })60266027#define _mm256_fixupimm_pd(A, B, C, imm) __extension__ ({ \6028(__m256d)__builtin_ia32_fixupimmpd256_mask((__v4df)(__m256d)(A), \6029(__v4df)(__m256d)(B), \6030(__v4di)(__m256i)(C), (int)(imm), \6031(__mmask8)-1); })60326033#define _mm256_mask_fixupimm_pd(A, U, B, C, imm) __extension__ ({ \6034(__m256d)__builtin_ia32_fixupimmpd256_mask((__v4df)(__m256d)(A), \6035(__v4df)(__m256d)(B), \6036(__v4di)(__m256i)(C), (int)(imm), \6037(__mmask8)(U)); })60386039#define _mm256_maskz_fixupimm_pd(U, A, B, C, imm) __extension__ ({ \6040(__m256d)__builtin_ia32_fixupimmpd256_maskz((__v4df)(__m256d)(A), \6041(__v4df)(__m256d)(B), \6042(__v4di)(__m256i)(C), \6043(int)(imm), (__mmask8)(U)); })60446045#define _mm_fixupimm_ps(A, B, C, imm) __extension__ ({ \6046(__m128)__builtin_ia32_fixupimmps128_mask((__v4sf)(__m128)(A), \6047(__v4sf)(__m128)(B), \6048(__v4si)(__m128i)(C), (int)(imm), \6049(__mmask8)-1); })60506051#define _mm_mask_fixupimm_ps(A, U, B, C, imm) __extension__ ({ \6052(__m128)__builtin_ia32_fixupimmps128_mask((__v4sf)(__m128)(A), \6053(__v4sf)(__m128)(B), \6054(__v4si)(__m128i)(C), (int)(imm), \6055(__mmask8)(U)); })60566057#define _mm_maskz_fixupimm_ps(U, A, B, C, imm) __extension__ ({ \6058(__m128)__builtin_ia32_fixupimmps128_maskz((__v4sf)(__m128)(A), \6059(__v4sf)(__m128)(B), \6060(__v4si)(__m128i)(C), (int)(imm), \6061(__mmask8)(U)); })60626063#define _mm256_fixupimm_ps(A, B, C, imm) __extension__ ({ \6064(__m256)__builtin_ia32_fixupimmps256_mask((__v8sf)(__m256)(A), \6065(__v8sf)(__m256)(B), \6066(__v8si)(__m256i)(C), (int)(imm), \6067(__mmask8)-1); })60686069#define _mm256_mask_fixupimm_ps(A, U, B, C, imm) __extension__ ({ \6070(__m256)__builtin_ia32_fixupimmps256_mask((__v8sf)(__m256)(A), \6071(__v8sf)(__m256)(B), \6072(__v8si)(__m256i)(C), (int)(imm), \6073(__mmask8)(U)); })60746075#define _mm256_maskz_fixupimm_ps(U, A, B, C, imm) __extension__ ({ \6076(__m256)__builtin_ia32_fixupimmps256_maskz((__v8sf)(__m256)(A), \6077(__v8sf)(__m256)(B), \6078(__v8si)(__m256i)(C), (int)(imm), \6079(__mmask8)(U)); })60806081static __inline__ __m128d __DEFAULT_FN_ATTRS6082_mm_mask_load_pd (__m128d __W, __mmask8 __U, void const *__P)6083{6084return (__m128d) __builtin_ia32_loadapd128_mask ((__v2df *) __P,6085(__v2df) __W,6086(__mmask8) __U);6087}60886089static __inline__ __m128d __DEFAULT_FN_ATTRS6090_mm_maskz_load_pd (__mmask8 __U, void const *__P)6091{6092return (__m128d) __builtin_ia32_loadapd128_mask ((__v2df *) __P,6093(__v2df)6094_mm_setzero_pd (),6095(__mmask8) __U);6096}60976098static __inline__ __m256d __DEFAULT_FN_ATTRS6099_mm256_mask_load_pd (__m256d __W, __mmask8 __U, void const *__P)6100{6101return (__m256d) __builtin_ia32_loadapd256_mask ((__v4df *) __P,6102(__v4df) __W,6103(__mmask8) __U);6104}61056106static __inline__ __m256d __DEFAULT_FN_ATTRS6107_mm256_maskz_load_pd (__mmask8 __U, void const *__P)6108{6109return (__m256d) __builtin_ia32_loadapd256_mask ((__v4df *) __P,6110(__v4df)6111_mm256_setzero_pd (),6112(__mmask8) __U);6113}61146115static __inline__ __m128 __DEFAULT_FN_ATTRS6116_mm_mask_load_ps (__m128 __W, __mmask8 __U, void const *__P)6117{6118return (__m128) __builtin_ia32_loadaps128_mask ((__v4sf *) __P,6119(__v4sf) __W,6120(__mmask8) __U);6121}61226123static __inline__ __m128 __DEFAULT_FN_ATTRS6124_mm_maskz_load_ps (__mmask8 __U, void const *__P)6125{6126return (__m128) __builtin_ia32_loadaps128_mask ((__v4sf *) __P,6127(__v4sf)6128_mm_setzero_ps (),6129(__mmask8) __U);6130}61316132static __inline__ __m256 __DEFAULT_FN_ATTRS6133_mm256_mask_load_ps (__m256 __W, __mmask8 __U, void const *__P)6134{6135return (__m256) __builtin_ia32_loadaps256_mask ((__v8sf *) __P,6136(__v8sf) __W,6137(__mmask8) __U);6138}61396140static __inline__ __m256 __DEFAULT_FN_ATTRS6141_mm256_maskz_load_ps (__mmask8 __U, void const *__P)6142{6143return (__m256) __builtin_ia32_loadaps256_mask ((__v8sf *) __P,6144(__v8sf)6145_mm256_setzero_ps (),6146(__mmask8) __U);6147}61486149static __inline__ __m128i __DEFAULT_FN_ATTRS6150_mm_mask_loadu_epi64 (__m128i __W, __mmask8 __U, void const *__P)6151{6152return (__m128i) __builtin_ia32_loaddqudi128_mask ((__v2di *) __P,6153(__v2di) __W,6154(__mmask8) __U);6155}61566157static __inline__ __m128i __DEFAULT_FN_ATTRS6158_mm_maskz_loadu_epi64 (__mmask8 __U, void const *__P)6159{6160return (__m128i) __builtin_ia32_loaddqudi128_mask ((__v2di *) __P,6161(__v2di)6162_mm_setzero_si128 (),6163(__mmask8) __U);6164}61656166static __inline__ __m256i __DEFAULT_FN_ATTRS6167_mm256_mask_loadu_epi64 (__m256i __W, __mmask8 __U, void const *__P)6168{6169return (__m256i) __builtin_ia32_loaddqudi256_mask ((__v4di *) __P,6170(__v4di) __W,6171(__mmask8) __U);6172}61736174static __inline__ __m256i __DEFAULT_FN_ATTRS6175_mm256_maskz_loadu_epi64 (__mmask8 __U, void const *__P)6176{6177return (__m256i) __builtin_ia32_loaddqudi256_mask ((__v4di *) __P,6178(__v4di)6179_mm256_setzero_si256 (),6180(__mmask8) __U);6181}61826183static __inline__ __m128i __DEFAULT_FN_ATTRS6184_mm_mask_loadu_epi32 (__m128i __W, __mmask8 __U, void const *__P)6185{6186return (__m128i) __builtin_ia32_loaddqusi128_mask ((__v4si *) __P,6187(__v4si) __W,6188(__mmask8) __U);6189}61906191static __inline__ __m128i __DEFAULT_FN_ATTRS6192_mm_maskz_loadu_epi32 (__mmask8 __U, void const *__P)6193{6194return (__m128i) __builtin_ia32_loaddqusi128_mask ((__v4si *) __P,6195(__v4si)6196_mm_setzero_si128 (),6197(__mmask8) __U);6198}61996200static __inline__ __m256i __DEFAULT_FN_ATTRS6201_mm256_mask_loadu_epi32 (__m256i __W, __mmask8 __U, void const *__P)6202{6203return (__m256i) __builtin_ia32_loaddqusi256_mask ((__v8si *) __P,6204(__v8si) __W,6205(__mmask8) __U);6206}62076208static __inline__ __m256i __DEFAULT_FN_ATTRS6209_mm256_maskz_loadu_epi32 (__mmask8 __U, void const *__P)6210{6211return (__m256i) __builtin_ia32_loaddqusi256_mask ((__v8si *) __P,6212(__v8si)6213_mm256_setzero_si256 (),6214(__mmask8) __U);6215}62166217static __inline__ __m128d __DEFAULT_FN_ATTRS6218_mm_mask_loadu_pd (__m128d __W, __mmask8 __U, void const *__P)6219{6220return (__m128d) __builtin_ia32_loadupd128_mask ((__v2df *) __P,6221(__v2df) __W,6222(__mmask8) __U);6223}62246225static __inline__ __m128d __DEFAULT_FN_ATTRS6226_mm_maskz_loadu_pd (__mmask8 __U, void const *__P)6227{6228return (__m128d) __builtin_ia32_loadupd128_mask ((__v2df *) __P,6229(__v2df)6230_mm_setzero_pd (),6231(__mmask8) __U);6232}62336234static __inline__ __m256d __DEFAULT_FN_ATTRS6235_mm256_mask_loadu_pd (__m256d __W, __mmask8 __U, void const *__P)6236{6237return (__m256d) __builtin_ia32_loadupd256_mask ((__v4df *) __P,6238(__v4df) __W,6239(__mmask8) __U);6240}62416242static __inline__ __m256d __DEFAULT_FN_ATTRS6243_mm256_maskz_loadu_pd (__mmask8 __U, void const *__P)6244{6245return (__m256d) __builtin_ia32_loadupd256_mask ((__v4df *) __P,6246(__v4df)6247_mm256_setzero_pd (),6248(__mmask8) __U);6249}62506251static __inline__ __m128 __DEFAULT_FN_ATTRS6252_mm_mask_loadu_ps (__m128 __W, __mmask8 __U, void const *__P)6253{6254return (__m128) __builtin_ia32_loadups128_mask ((__v4sf *) __P,6255(__v4sf) __W,6256(__mmask8) __U);6257}62586259static __inline__ __m128 __DEFAULT_FN_ATTRS6260_mm_maskz_loadu_ps (__mmask8 __U, void const *__P)6261{6262return (__m128) __builtin_ia32_loadups128_mask ((__v4sf *) __P,6263(__v4sf)6264_mm_setzero_ps (),6265(__mmask8) __U);6266}62676268static __inline__ __m256 __DEFAULT_FN_ATTRS6269_mm256_mask_loadu_ps (__m256 __W, __mmask8 __U, void const *__P)6270{6271return (__m256) __builtin_ia32_loadups256_mask ((__v8sf *) __P,6272(__v8sf) __W,6273(__mmask8) __U);6274}62756276static __inline__ __m256 __DEFAULT_FN_ATTRS6277_mm256_maskz_loadu_ps (__mmask8 __U, void const *__P)6278{6279return (__m256) __builtin_ia32_loadups256_mask ((__v8sf *) __P,6280(__v8sf)6281_mm256_setzero_ps (),6282(__mmask8) __U);6283}62846285static __inline__ void __DEFAULT_FN_ATTRS6286_mm_mask_store_pd (void *__P, __mmask8 __U, __m128d __A)6287{6288__builtin_ia32_storeapd128_mask ((__v2df *) __P,6289(__v2df) __A,6290(__mmask8) __U);6291}62926293static __inline__ void __DEFAULT_FN_ATTRS6294_mm256_mask_store_pd (void *__P, __mmask8 __U, __m256d __A)6295{6296__builtin_ia32_storeapd256_mask ((__v4df *) __P,6297(__v4df) __A,6298(__mmask8) __U);6299}63006301static __inline__ void __DEFAULT_FN_ATTRS6302_mm_mask_store_ps (void *__P, __mmask8 __U, __m128 __A)6303{6304__builtin_ia32_storeaps128_mask ((__v4sf *) __P,6305(__v4sf) __A,6306(__mmask8) __U);6307}63086309static __inline__ void __DEFAULT_FN_ATTRS6310_mm256_mask_store_ps (void *__P, __mmask8 __U, __m256 __A)6311{6312__builtin_ia32_storeaps256_mask ((__v8sf *) __P,6313(__v8sf) __A,6314(__mmask8) __U);6315}63166317static __inline__ void __DEFAULT_FN_ATTRS6318_mm_mask_storeu_epi64 (void *__P, __mmask8 __U, __m128i __A)6319{6320__builtin_ia32_storedqudi128_mask ((__v2di *) __P,6321(__v2di) __A,6322(__mmask8) __U);6323}63246325static __inline__ void __DEFAULT_FN_ATTRS6326_mm256_mask_storeu_epi64 (void *__P, __mmask8 __U, __m256i __A)6327{6328__builtin_ia32_storedqudi256_mask ((__v4di *) __P,6329(__v4di) __A,6330(__mmask8) __U);6331}63326333static __inline__ void __DEFAULT_FN_ATTRS6334_mm_mask_storeu_epi32 (void *__P, __mmask8 __U, __m128i __A)6335{6336__builtin_ia32_storedqusi128_mask ((__v4si *) __P,6337(__v4si) __A,6338(__mmask8) __U);6339}63406341static __inline__ void __DEFAULT_FN_ATTRS6342_mm256_mask_storeu_epi32 (void *__P, __mmask8 __U, __m256i __A)6343{6344__builtin_ia32_storedqusi256_mask ((__v8si *) __P,6345(__v8si) __A,6346(__mmask8) __U);6347}63486349static __inline__ void __DEFAULT_FN_ATTRS6350_mm_mask_storeu_pd (void *__P, __mmask8 __U, __m128d __A)6351{6352__builtin_ia32_storeupd128_mask ((__v2df *) __P,6353(__v2df) __A,6354(__mmask8) __U);6355}63566357static __inline__ void __DEFAULT_FN_ATTRS6358_mm256_mask_storeu_pd (void *__P, __mmask8 __U, __m256d __A)6359{6360__builtin_ia32_storeupd256_mask ((__v4df *) __P,6361(__v4df) __A,6362(__mmask8) __U);6363}63646365static __inline__ void __DEFAULT_FN_ATTRS6366_mm_mask_storeu_ps (void *__P, __mmask8 __U, __m128 __A)6367{6368__builtin_ia32_storeups128_mask ((__v4sf *) __P,6369(__v4sf) __A,6370(__mmask8) __U);6371}63726373static __inline__ void __DEFAULT_FN_ATTRS6374_mm256_mask_storeu_ps (void *__P, __mmask8 __U, __m256 __A)6375{6376__builtin_ia32_storeups256_mask ((__v8sf *) __P,6377(__v8sf) __A,6378(__mmask8) __U);6379}638063816382static __inline__ __m128d __DEFAULT_FN_ATTRS6383_mm_mask_unpackhi_pd(__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)6384{6385return (__m128d)__builtin_ia32_selectpd_128((__mmask8)__U,6386(__v2df)_mm_unpackhi_pd(__A, __B),6387(__v2df)__W);6388}63896390static __inline__ __m128d __DEFAULT_FN_ATTRS6391_mm_maskz_unpackhi_pd(__mmask8 __U, __m128d __A, __m128d __B)6392{6393return (__m128d)__builtin_ia32_selectpd_128((__mmask8)__U,6394(__v2df)_mm_unpackhi_pd(__A, __B),6395(__v2df)_mm_setzero_pd());6396}63976398static __inline__ __m256d __DEFAULT_FN_ATTRS6399_mm256_mask_unpackhi_pd(__m256d __W, __mmask8 __U, __m256d __A, __m256d __B)6400{6401return (__m256d)__builtin_ia32_selectpd_256((__mmask8)__U,6402(__v4df)_mm256_unpackhi_pd(__A, __B),6403(__v4df)__W);6404}64056406static __inline__ __m256d __DEFAULT_FN_ATTRS6407_mm256_maskz_unpackhi_pd(__mmask8 __U, __m256d __A, __m256d __B)6408{6409return (__m256d)__builtin_ia32_selectpd_256((__mmask8)__U,6410(__v4df)_mm256_unpackhi_pd(__A, __B),6411(__v4df)_mm256_setzero_pd());6412}64136414static __inline__ __m128 __DEFAULT_FN_ATTRS6415_mm_mask_unpackhi_ps(__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)6416{6417return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,6418(__v4sf)_mm_unpackhi_ps(__A, __B),6419(__v4sf)__W);6420}64216422static __inline__ __m128 __DEFAULT_FN_ATTRS6423_mm_maskz_unpackhi_ps(__mmask8 __U, __m128 __A, __m128 __B)6424{6425return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,6426(__v4sf)_mm_unpackhi_ps(__A, __B),6427(__v4sf)_mm_setzero_ps());6428}64296430static __inline__ __m256 __DEFAULT_FN_ATTRS6431_mm256_mask_unpackhi_ps(__m256 __W, __mmask8 __U, __m256 __A, __m256 __B)6432{6433return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,6434(__v8sf)_mm256_unpackhi_ps(__A, __B),6435(__v8sf)__W);6436}64376438static __inline__ __m256 __DEFAULT_FN_ATTRS6439_mm256_maskz_unpackhi_ps(__mmask8 __U, __m256 __A, __m256 __B)6440{6441return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,6442(__v8sf)_mm256_unpackhi_ps(__A, __B),6443(__v8sf)_mm256_setzero_ps());6444}64456446static __inline__ __m128d __DEFAULT_FN_ATTRS6447_mm_mask_unpacklo_pd(__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)6448{6449return (__m128d)__builtin_ia32_selectpd_128((__mmask8)__U,6450(__v2df)_mm_unpacklo_pd(__A, __B),6451(__v2df)__W);6452}64536454static __inline__ __m128d __DEFAULT_FN_ATTRS6455_mm_maskz_unpacklo_pd(__mmask8 __U, __m128d __A, __m128d __B)6456{6457return (__m128d)__builtin_ia32_selectpd_128((__mmask8)__U,6458(__v2df)_mm_unpacklo_pd(__A, __B),6459(__v2df)_mm_setzero_pd());6460}64616462static __inline__ __m256d __DEFAULT_FN_ATTRS6463_mm256_mask_unpacklo_pd(__m256d __W, __mmask8 __U, __m256d __A, __m256d __B)6464{6465return (__m256d)__builtin_ia32_selectpd_256((__mmask8)__U,6466(__v4df)_mm256_unpacklo_pd(__A, __B),6467(__v4df)__W);6468}64696470static __inline__ __m256d __DEFAULT_FN_ATTRS6471_mm256_maskz_unpacklo_pd(__mmask8 __U, __m256d __A, __m256d __B)6472{6473return (__m256d)__builtin_ia32_selectpd_256((__mmask8)__U,6474(__v4df)_mm256_unpacklo_pd(__A, __B),6475(__v4df)_mm256_setzero_pd());6476}64776478static __inline__ __m128 __DEFAULT_FN_ATTRS6479_mm_mask_unpacklo_ps(__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)6480{6481return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,6482(__v4sf)_mm_unpacklo_ps(__A, __B),6483(__v4sf)__W);6484}64856486static __inline__ __m128 __DEFAULT_FN_ATTRS6487_mm_maskz_unpacklo_ps(__mmask8 __U, __m128 __A, __m128 __B)6488{6489return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,6490(__v4sf)_mm_unpacklo_ps(__A, __B),6491(__v4sf)_mm_setzero_ps());6492}64936494static __inline__ __m256 __DEFAULT_FN_ATTRS6495_mm256_mask_unpacklo_ps(__m256 __W, __mmask8 __U, __m256 __A, __m256 __B)6496{6497return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,6498(__v8sf)_mm256_unpacklo_ps(__A, __B),6499(__v8sf)__W);6500}65016502static __inline__ __m256 __DEFAULT_FN_ATTRS6503_mm256_maskz_unpacklo_ps(__mmask8 __U, __m256 __A, __m256 __B)6504{6505return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,6506(__v8sf)_mm256_unpacklo_ps(__A, __B),6507(__v8sf)_mm256_setzero_ps());6508}65096510static __inline__ __m128d __DEFAULT_FN_ATTRS6511_mm_rcp14_pd (__m128d __A)6512{6513return (__m128d) __builtin_ia32_rcp14pd128_mask ((__v2df) __A,6514(__v2df)6515_mm_setzero_pd (),6516(__mmask8) -1);6517}65186519static __inline__ __m128d __DEFAULT_FN_ATTRS6520_mm_mask_rcp14_pd (__m128d __W, __mmask8 __U, __m128d __A)6521{6522return (__m128d) __builtin_ia32_rcp14pd128_mask ((__v2df) __A,6523(__v2df) __W,6524(__mmask8) __U);6525}65266527static __inline__ __m128d __DEFAULT_FN_ATTRS6528_mm_maskz_rcp14_pd (__mmask8 __U, __m128d __A)6529{6530return (__m128d) __builtin_ia32_rcp14pd128_mask ((__v2df) __A,6531(__v2df)6532_mm_setzero_pd (),6533(__mmask8) __U);6534}65356536static __inline__ __m256d __DEFAULT_FN_ATTRS6537_mm256_rcp14_pd (__m256d __A)6538{6539return (__m256d) __builtin_ia32_rcp14pd256_mask ((__v4df) __A,6540(__v4df)6541_mm256_setzero_pd (),6542(__mmask8) -1);6543}65446545static __inline__ __m256d __DEFAULT_FN_ATTRS6546_mm256_mask_rcp14_pd (__m256d __W, __mmask8 __U, __m256d __A)6547{6548return (__m256d) __builtin_ia32_rcp14pd256_mask ((__v4df) __A,6549(__v4df) __W,6550(__mmask8) __U);6551}65526553static __inline__ __m256d __DEFAULT_FN_ATTRS6554_mm256_maskz_rcp14_pd (__mmask8 __U, __m256d __A)6555{6556return (__m256d) __builtin_ia32_rcp14pd256_mask ((__v4df) __A,6557(__v4df)6558_mm256_setzero_pd (),6559(__mmask8) __U);6560}65616562static __inline__ __m128 __DEFAULT_FN_ATTRS6563_mm_rcp14_ps (__m128 __A)6564{6565return (__m128) __builtin_ia32_rcp14ps128_mask ((__v4sf) __A,6566(__v4sf)6567_mm_setzero_ps (),6568(__mmask8) -1);6569}65706571static __inline__ __m128 __DEFAULT_FN_ATTRS6572_mm_mask_rcp14_ps (__m128 __W, __mmask8 __U, __m128 __A)6573{6574return (__m128) __builtin_ia32_rcp14ps128_mask ((__v4sf) __A,6575(__v4sf) __W,6576(__mmask8) __U);6577}65786579static __inline__ __m128 __DEFAULT_FN_ATTRS6580_mm_maskz_rcp14_ps (__mmask8 __U, __m128 __A)6581{6582return (__m128) __builtin_ia32_rcp14ps128_mask ((__v4sf) __A,6583(__v4sf)6584_mm_setzero_ps (),6585(__mmask8) __U);6586}65876588static __inline__ __m256 __DEFAULT_FN_ATTRS6589_mm256_rcp14_ps (__m256 __A)6590{6591return (__m256) __builtin_ia32_rcp14ps256_mask ((__v8sf) __A,6592(__v8sf)6593_mm256_setzero_ps (),6594(__mmask8) -1);6595}65966597static __inline__ __m256 __DEFAULT_FN_ATTRS6598_mm256_mask_rcp14_ps (__m256 __W, __mmask8 __U, __m256 __A)6599{6600return (__m256) __builtin_ia32_rcp14ps256_mask ((__v8sf) __A,6601(__v8sf) __W,6602(__mmask8) __U);6603}66046605static __inline__ __m256 __DEFAULT_FN_ATTRS6606_mm256_maskz_rcp14_ps (__mmask8 __U, __m256 __A)6607{6608return (__m256) __builtin_ia32_rcp14ps256_mask ((__v8sf) __A,6609(__v8sf)6610_mm256_setzero_ps (),6611(__mmask8) __U);6612}66136614#define _mm_mask_permute_pd(W, U, X, C) __extension__ ({ \6615(__m128d)__builtin_ia32_selectpd_128((__mmask8)(U), \6616(__v2df)_mm_permute_pd((X), (C)), \6617(__v2df)(__m128d)(W)); })66186619#define _mm_maskz_permute_pd(U, X, C) __extension__ ({ \6620(__m128d)__builtin_ia32_selectpd_128((__mmask8)(U), \6621(__v2df)_mm_permute_pd((X), (C)), \6622(__v2df)_mm_setzero_pd()); })66236624#define _mm256_mask_permute_pd(W, U, X, C) __extension__ ({ \6625(__m256d)__builtin_ia32_selectpd_256((__mmask8)(U), \6626(__v4df)_mm256_permute_pd((X), (C)), \6627(__v4df)(__m256d)(W)); })66286629#define _mm256_maskz_permute_pd(U, X, C) __extension__ ({ \6630(__m256d)__builtin_ia32_selectpd_256((__mmask8)(U), \6631(__v4df)_mm256_permute_pd((X), (C)), \6632(__v4df)_mm256_setzero_pd()); })66336634#define _mm_mask_permute_ps(W, U, X, C) __extension__ ({ \6635(__m128)__builtin_ia32_selectps_128((__mmask8)(U), \6636(__v4sf)_mm_permute_ps((X), (C)), \6637(__v4sf)(__m128)(W)); })66386639#define _mm_maskz_permute_ps(U, X, C) __extension__ ({ \6640(__m128)__builtin_ia32_selectps_128((__mmask8)(U), \6641(__v4sf)_mm_permute_ps((X), (C)), \6642(__v4sf)_mm_setzero_ps()); })66436644#define _mm256_mask_permute_ps(W, U, X, C) __extension__ ({ \6645(__m256)__builtin_ia32_selectps_256((__mmask8)(U), \6646(__v8sf)_mm256_permute_ps((X), (C)), \6647(__v8sf)(__m256)(W)); })66486649#define _mm256_maskz_permute_ps(U, X, C) __extension__ ({ \6650(__m256)__builtin_ia32_selectps_256((__mmask8)(U), \6651(__v8sf)_mm256_permute_ps((X), (C)), \6652(__v8sf)_mm256_setzero_ps()); })66536654static __inline__ __m128d __DEFAULT_FN_ATTRS6655_mm_mask_permutevar_pd (__m128d __W, __mmask8 __U, __m128d __A,6656__m128i __C)6657{6658return (__m128d) __builtin_ia32_vpermilvarpd_mask ((__v2df) __A,6659(__v2di) __C,6660(__v2df) __W,6661(__mmask8) __U);6662}66636664static __inline__ __m128d __DEFAULT_FN_ATTRS6665_mm_maskz_permutevar_pd (__mmask8 __U, __m128d __A, __m128i __C)6666{6667return (__m128d) __builtin_ia32_vpermilvarpd_mask ((__v2df) __A,6668(__v2di) __C,6669(__v2df)6670_mm_setzero_pd (),6671(__mmask8) __U);6672}66736674static __inline__ __m256d __DEFAULT_FN_ATTRS6675_mm256_mask_permutevar_pd (__m256d __W, __mmask8 __U, __m256d __A,6676__m256i __C)6677{6678return (__m256d) __builtin_ia32_vpermilvarpd256_mask ((__v4df) __A,6679(__v4di) __C,6680(__v4df) __W,6681(__mmask8)6682__U);6683}66846685static __inline__ __m256d __DEFAULT_FN_ATTRS6686_mm256_maskz_permutevar_pd (__mmask8 __U, __m256d __A, __m256i __C)6687{6688return (__m256d) __builtin_ia32_vpermilvarpd256_mask ((__v4df) __A,6689(__v4di) __C,6690(__v4df)6691_mm256_setzero_pd (),6692(__mmask8)6693__U);6694}66956696static __inline__ __m128 __DEFAULT_FN_ATTRS6697_mm_mask_permutevar_ps (__m128 __W, __mmask8 __U, __m128 __A,6698__m128i __C)6699{6700return (__m128) __builtin_ia32_vpermilvarps_mask ((__v4sf) __A,6701(__v4si) __C,6702(__v4sf) __W,6703(__mmask8) __U);6704}67056706static __inline__ __m128 __DEFAULT_FN_ATTRS6707_mm_maskz_permutevar_ps (__mmask8 __U, __m128 __A, __m128i __C)6708{6709return (__m128) __builtin_ia32_vpermilvarps_mask ((__v4sf) __A,6710(__v4si) __C,6711(__v4sf)6712_mm_setzero_ps (),6713(__mmask8) __U);6714}67156716static __inline__ __m256 __DEFAULT_FN_ATTRS6717_mm256_mask_permutevar_ps (__m256 __W, __mmask8 __U, __m256 __A,6718__m256i __C)6719{6720return (__m256) __builtin_ia32_vpermilvarps256_mask ((__v8sf) __A,6721(__v8si) __C,6722(__v8sf) __W,6723(__mmask8) __U);6724}67256726static __inline__ __m256 __DEFAULT_FN_ATTRS6727_mm256_maskz_permutevar_ps (__mmask8 __U, __m256 __A, __m256i __C)6728{6729return (__m256) __builtin_ia32_vpermilvarps256_mask ((__v8sf) __A,6730(__v8si) __C,6731(__v8sf)6732_mm256_setzero_ps (),6733(__mmask8) __U);6734}67356736static __inline__ __mmask8 __DEFAULT_FN_ATTRS6737_mm_test_epi32_mask (__m128i __A, __m128i __B)6738{6739return (__mmask8) __builtin_ia32_ptestmd128 ((__v4si) __A,6740(__v4si) __B,6741(__mmask8) -1);6742}67436744static __inline__ __mmask8 __DEFAULT_FN_ATTRS6745_mm_mask_test_epi32_mask (__mmask8 __U, __m128i __A, __m128i __B)6746{6747return (__mmask8) __builtin_ia32_ptestmd128 ((__v4si) __A,6748(__v4si) __B, __U);6749}67506751static __inline__ __mmask8 __DEFAULT_FN_ATTRS6752_mm256_test_epi32_mask (__m256i __A, __m256i __B)6753{6754return (__mmask8) __builtin_ia32_ptestmd256 ((__v8si) __A,6755(__v8si) __B,6756(__mmask8) -1);6757}67586759static __inline__ __mmask8 __DEFAULT_FN_ATTRS6760_mm256_mask_test_epi32_mask (__mmask8 __U, __m256i __A, __m256i __B)6761{6762return (__mmask8) __builtin_ia32_ptestmd256 ((__v8si) __A,6763(__v8si) __B, __U);6764}67656766static __inline__ __mmask8 __DEFAULT_FN_ATTRS6767_mm_test_epi64_mask (__m128i __A, __m128i __B)6768{6769return (__mmask8) __builtin_ia32_ptestmq128 ((__v2di) __A,6770(__v2di) __B,6771(__mmask8) -1);6772}67736774static __inline__ __mmask8 __DEFAULT_FN_ATTRS6775_mm_mask_test_epi64_mask (__mmask8 __U, __m128i __A, __m128i __B)6776{6777return (__mmask8) __builtin_ia32_ptestmq128 ((__v2di) __A,6778(__v2di) __B, __U);6779}67806781static __inline__ __mmask8 __DEFAULT_FN_ATTRS6782_mm256_test_epi64_mask (__m256i __A, __m256i __B)6783{6784return (__mmask8) __builtin_ia32_ptestmq256 ((__v4di) __A,6785(__v4di) __B,6786(__mmask8) -1);6787}67886789static __inline__ __mmask8 __DEFAULT_FN_ATTRS6790_mm256_mask_test_epi64_mask (__mmask8 __U, __m256i __A, __m256i __B)6791{6792return (__mmask8) __builtin_ia32_ptestmq256 ((__v4di) __A,6793(__v4di) __B, __U);6794}67956796static __inline__ __mmask8 __DEFAULT_FN_ATTRS6797_mm_testn_epi32_mask (__m128i __A, __m128i __B)6798{6799return (__mmask8) __builtin_ia32_ptestnmd128 ((__v4si) __A,6800(__v4si) __B,6801(__mmask8) -1);6802}68036804static __inline__ __mmask8 __DEFAULT_FN_ATTRS6805_mm_mask_testn_epi32_mask (__mmask8 __U, __m128i __A, __m128i __B)6806{6807return (__mmask8) __builtin_ia32_ptestnmd128 ((__v4si) __A,6808(__v4si) __B, __U);6809}68106811static __inline__ __mmask8 __DEFAULT_FN_ATTRS6812_mm256_testn_epi32_mask (__m256i __A, __m256i __B)6813{6814return (__mmask8) __builtin_ia32_ptestnmd256 ((__v8si) __A,6815(__v8si) __B,6816(__mmask8) -1);6817}68186819static __inline__ __mmask8 __DEFAULT_FN_ATTRS6820_mm256_mask_testn_epi32_mask (__mmask8 __U, __m256i __A, __m256i __B)6821{6822return (__mmask8) __builtin_ia32_ptestnmd256 ((__v8si) __A,6823(__v8si) __B, __U);6824}68256826static __inline__ __mmask8 __DEFAULT_FN_ATTRS6827_mm_testn_epi64_mask (__m128i __A, __m128i __B)6828{6829return (__mmask8) __builtin_ia32_ptestnmq128 ((__v2di) __A,6830(__v2di) __B,6831(__mmask8) -1);6832}68336834static __inline__ __mmask8 __DEFAULT_FN_ATTRS6835_mm_mask_testn_epi64_mask (__mmask8 __U, __m128i __A, __m128i __B)6836{6837return (__mmask8) __builtin_ia32_ptestnmq128 ((__v2di) __A,6838(__v2di) __B, __U);6839}68406841static __inline__ __mmask8 __DEFAULT_FN_ATTRS6842_mm256_testn_epi64_mask (__m256i __A, __m256i __B)6843{6844return (__mmask8) __builtin_ia32_ptestnmq256 ((__v4di) __A,6845(__v4di) __B,6846(__mmask8) -1);6847}68486849static __inline__ __mmask8 __DEFAULT_FN_ATTRS6850_mm256_mask_testn_epi64_mask (__mmask8 __U, __m256i __A, __m256i __B)6851{6852return (__mmask8) __builtin_ia32_ptestnmq256 ((__v4di) __A,6853(__v4di) __B, __U);6854}6855685668576858static __inline__ __m128i __DEFAULT_FN_ATTRS6859_mm_mask_unpackhi_epi32(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)6860{6861return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,6862(__v4si)_mm_unpackhi_epi32(__A, __B),6863(__v4si)__W);6864}68656866static __inline__ __m128i __DEFAULT_FN_ATTRS6867_mm_maskz_unpackhi_epi32(__mmask8 __U, __m128i __A, __m128i __B)6868{6869return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,6870(__v4si)_mm_unpackhi_epi32(__A, __B),6871(__v4si)_mm_setzero_si128());6872}68736874static __inline__ __m256i __DEFAULT_FN_ATTRS6875_mm256_mask_unpackhi_epi32(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)6876{6877return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,6878(__v8si)_mm256_unpackhi_epi32(__A, __B),6879(__v8si)__W);6880}68816882static __inline__ __m256i __DEFAULT_FN_ATTRS6883_mm256_maskz_unpackhi_epi32(__mmask8 __U, __m256i __A, __m256i __B)6884{6885return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,6886(__v8si)_mm256_unpackhi_epi32(__A, __B),6887(__v8si)_mm256_setzero_si256());6888}68896890static __inline__ __m128i __DEFAULT_FN_ATTRS6891_mm_mask_unpackhi_epi64(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)6892{6893return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,6894(__v2di)_mm_unpackhi_epi64(__A, __B),6895(__v2di)__W);6896}68976898static __inline__ __m128i __DEFAULT_FN_ATTRS6899_mm_maskz_unpackhi_epi64(__mmask8 __U, __m128i __A, __m128i __B)6900{6901return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,6902(__v2di)_mm_unpackhi_epi64(__A, __B),6903(__v2di)_mm_setzero_di());6904}69056906static __inline__ __m256i __DEFAULT_FN_ATTRS6907_mm256_mask_unpackhi_epi64(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)6908{6909return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,6910(__v4di)_mm256_unpackhi_epi64(__A, __B),6911(__v4di)__W);6912}69136914static __inline__ __m256i __DEFAULT_FN_ATTRS6915_mm256_maskz_unpackhi_epi64(__mmask8 __U, __m256i __A, __m256i __B)6916{6917return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,6918(__v4di)_mm256_unpackhi_epi64(__A, __B),6919(__v4di)_mm256_setzero_si256());6920}69216922static __inline__ __m128i __DEFAULT_FN_ATTRS6923_mm_mask_unpacklo_epi32(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)6924{6925return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,6926(__v4si)_mm_unpacklo_epi32(__A, __B),6927(__v4si)__W);6928}69296930static __inline__ __m128i __DEFAULT_FN_ATTRS6931_mm_maskz_unpacklo_epi32(__mmask8 __U, __m128i __A, __m128i __B)6932{6933return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,6934(__v4si)_mm_unpacklo_epi32(__A, __B),6935(__v4si)_mm_setzero_si128());6936}69376938static __inline__ __m256i __DEFAULT_FN_ATTRS6939_mm256_mask_unpacklo_epi32(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)6940{6941return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,6942(__v8si)_mm256_unpacklo_epi32(__A, __B),6943(__v8si)__W);6944}69456946static __inline__ __m256i __DEFAULT_FN_ATTRS6947_mm256_maskz_unpacklo_epi32(__mmask8 __U, __m256i __A, __m256i __B)6948{6949return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,6950(__v8si)_mm256_unpacklo_epi32(__A, __B),6951(__v8si)_mm256_setzero_si256());6952}69536954static __inline__ __m128i __DEFAULT_FN_ATTRS6955_mm_mask_unpacklo_epi64(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)6956{6957return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,6958(__v2di)_mm_unpacklo_epi64(__A, __B),6959(__v2di)__W);6960}69616962static __inline__ __m128i __DEFAULT_FN_ATTRS6963_mm_maskz_unpacklo_epi64(__mmask8 __U, __m128i __A, __m128i __B)6964{6965return (__m128i)__builtin_ia32_selectq_128((__mmask8)__U,6966(__v2di)_mm_unpacklo_epi64(__A, __B),6967(__v2di)_mm_setzero_di());6968}69696970static __inline__ __m256i __DEFAULT_FN_ATTRS6971_mm256_mask_unpacklo_epi64(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B)6972{6973return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,6974(__v4di)_mm256_unpacklo_epi64(__A, __B),6975(__v4di)__W);6976}69776978static __inline__ __m256i __DEFAULT_FN_ATTRS6979_mm256_maskz_unpacklo_epi64(__mmask8 __U, __m256i __A, __m256i __B)6980{6981return (__m256i)__builtin_ia32_selectq_256((__mmask8)__U,6982(__v4di)_mm256_unpacklo_epi64(__A, __B),6983(__v4di)_mm256_setzero_si256());6984}69856986static __inline__ __m128i __DEFAULT_FN_ATTRS6987_mm_mask_sra_epi32 (__m128i __W, __mmask8 __U, __m128i __A,6988__m128i __B)6989{6990return (__m128i) __builtin_ia32_psrad128_mask ((__v4si) __A,6991(__v4si) __B,6992(__v4si) __W,6993(__mmask8) __U);6994}69956996static __inline__ __m128i __DEFAULT_FN_ATTRS6997_mm_maskz_sra_epi32 (__mmask8 __U, __m128i __A, __m128i __B)6998{6999return (__m128i) __builtin_ia32_psrad128_mask ((__v4si) __A,7000(__v4si) __B,7001(__v4si)7002_mm_setzero_si128 (),7003(__mmask8) __U);7004}70057006static __inline__ __m256i __DEFAULT_FN_ATTRS7007_mm256_mask_sra_epi32 (__m256i __W, __mmask8 __U, __m256i __A,7008__m128i __B)7009{7010return (__m256i) __builtin_ia32_psrad256_mask ((__v8si) __A,7011(__v4si) __B,7012(__v8si) __W,7013(__mmask8) __U);7014}70157016static __inline__ __m256i __DEFAULT_FN_ATTRS7017_mm256_maskz_sra_epi32 (__mmask8 __U, __m256i __A, __m128i __B)7018{7019return (__m256i) __builtin_ia32_psrad256_mask ((__v8si) __A,7020(__v4si) __B,7021(__v8si)7022_mm256_setzero_si256 (),7023(__mmask8) __U);7024}70257026#define _mm_mask_srai_epi32(W, U, A, imm) __extension__ ({ \7027(__m128i)__builtin_ia32_psradi128_mask((__v4si)(__m128i)(A), (int)(imm), \7028(__v4si)(__m128i)(W), \7029(__mmask8)(U)); })70307031#define _mm_maskz_srai_epi32(U, A, imm) __extension__ ({ \7032(__m128i)__builtin_ia32_psradi128_mask((__v4si)(__m128i)(A), (int)(imm), \7033(__v4si)_mm_setzero_si128(), \7034(__mmask8)(U)); })70357036#define _mm256_mask_srai_epi32(W, U, A, imm) __extension__ ({ \7037(__m256i)__builtin_ia32_psradi256_mask((__v8si)(__m256i)(A), (int)(imm), \7038(__v8si)(__m256i)(W), \7039(__mmask8)(U)); })70407041#define _mm256_maskz_srai_epi32(U, A, imm) __extension__ ({ \7042(__m256i)__builtin_ia32_psradi256_mask((__v8si)(__m256i)(A), (int)(imm), \7043(__v8si)_mm256_setzero_si256(), \7044(__mmask8)(U)); })70457046static __inline__ __m128i __DEFAULT_FN_ATTRS7047_mm_sra_epi64 (__m128i __A, __m128i __B)7048{7049return (__m128i) __builtin_ia32_psraq128_mask ((__v2di) __A,7050(__v2di) __B,7051(__v2di)7052_mm_setzero_di (),7053(__mmask8) -1);7054}70557056static __inline__ __m128i __DEFAULT_FN_ATTRS7057_mm_mask_sra_epi64 (__m128i __W, __mmask8 __U, __m128i __A,7058__m128i __B)7059{7060return (__m128i) __builtin_ia32_psraq128_mask ((__v2di) __A,7061(__v2di) __B,7062(__v2di) __W,7063(__mmask8) __U);7064}70657066static __inline__ __m128i __DEFAULT_FN_ATTRS7067_mm_maskz_sra_epi64 (__mmask8 __U, __m128i __A, __m128i __B)7068{7069return (__m128i) __builtin_ia32_psraq128_mask ((__v2di) __A,7070(__v2di) __B,7071(__v2di)7072_mm_setzero_di (),7073(__mmask8) __U);7074}70757076static __inline__ __m256i __DEFAULT_FN_ATTRS7077_mm256_sra_epi64 (__m256i __A, __m128i __B)7078{7079return (__m256i) __builtin_ia32_psraq256_mask ((__v4di) __A,7080(__v2di) __B,7081(__v4di)7082_mm256_setzero_si256 (),7083(__mmask8) -1);7084}70857086static __inline__ __m256i __DEFAULT_FN_ATTRS7087_mm256_mask_sra_epi64 (__m256i __W, __mmask8 __U, __m256i __A,7088__m128i __B)7089{7090return (__m256i) __builtin_ia32_psraq256_mask ((__v4di) __A,7091(__v2di) __B,7092(__v4di) __W,7093(__mmask8) __U);7094}70957096static __inline__ __m256i __DEFAULT_FN_ATTRS7097_mm256_maskz_sra_epi64 (__mmask8 __U, __m256i __A, __m128i __B)7098{7099return (__m256i) __builtin_ia32_psraq256_mask ((__v4di) __A,7100(__v2di) __B,7101(__v4di)7102_mm256_setzero_si256 (),7103(__mmask8) __U);7104}71057106#define _mm_srai_epi64(A, imm) __extension__ ({ \7107(__m128i)__builtin_ia32_psraqi128_mask((__v2di)(__m128i)(A), (int)(imm), \7108(__v2di)_mm_setzero_di(), \7109(__mmask8)-1); })71107111#define _mm_mask_srai_epi64(W, U, A, imm) __extension__ ({ \7112(__m128i)__builtin_ia32_psraqi128_mask((__v2di)(__m128i)(A), (int)(imm), \7113(__v2di)(__m128i)(W), \7114(__mmask8)(U)); })71157116#define _mm_maskz_srai_epi64(U, A, imm) __extension__ ({ \7117(__m128i)__builtin_ia32_psraqi128_mask((__v2di)(__m128i)(A), (int)(imm), \7118(__v2di)_mm_setzero_si128(), \7119(__mmask8)(U)); })71207121#define _mm256_srai_epi64(A, imm) __extension__ ({ \7122(__m256i)__builtin_ia32_psraqi256_mask((__v4di)(__m256i)(A), (int)(imm), \7123(__v4di)_mm256_setzero_si256(), \7124(__mmask8)-1); })71257126#define _mm256_mask_srai_epi64(W, U, A, imm) __extension__ ({ \7127(__m256i)__builtin_ia32_psraqi256_mask((__v4di)(__m256i)(A), (int)(imm), \7128(__v4di)(__m256i)(W), \7129(__mmask8)(U)); })71307131#define _mm256_maskz_srai_epi64(U, A, imm) __extension__ ({ \7132(__m256i)__builtin_ia32_psraqi256_mask((__v4di)(__m256i)(A), (int)(imm), \7133(__v4di)_mm256_setzero_si256(), \7134(__mmask8)(U)); })71357136#define _mm_ternarylogic_epi32(A, B, C, imm) __extension__ ({ \7137(__m128i)__builtin_ia32_pternlogd128_mask((__v4si)(__m128i)(A), \7138(__v4si)(__m128i)(B), \7139(__v4si)(__m128i)(C), (int)(imm), \7140(__mmask8)-1); })71417142#define _mm_mask_ternarylogic_epi32(A, U, B, C, imm) __extension__ ({ \7143(__m128i)__builtin_ia32_pternlogd128_mask((__v4si)(__m128i)(A), \7144(__v4si)(__m128i)(B), \7145(__v4si)(__m128i)(C), (int)(imm), \7146(__mmask8)(U)); })71477148#define _mm_maskz_ternarylogic_epi32(U, A, B, C, imm) __extension__ ({ \7149(__m128i)__builtin_ia32_pternlogd128_maskz((__v4si)(__m128i)(A), \7150(__v4si)(__m128i)(B), \7151(__v4si)(__m128i)(C), (int)(imm), \7152(__mmask8)(U)); })71537154#define _mm256_ternarylogic_epi32(A, B, C, imm) __extension__ ({ \7155(__m256i)__builtin_ia32_pternlogd256_mask((__v8si)(__m256i)(A), \7156(__v8si)(__m256i)(B), \7157(__v8si)(__m256i)(C), (int)(imm), \7158(__mmask8)-1); })71597160#define _mm256_mask_ternarylogic_epi32(A, U, B, C, imm) __extension__ ({ \7161(__m256i)__builtin_ia32_pternlogd256_mask((__v8si)(__m256i)(A), \7162(__v8si)(__m256i)(B), \7163(__v8si)(__m256i)(C), (int)(imm), \7164(__mmask8)(U)); })71657166#define _mm256_maskz_ternarylogic_epi32(U, A, B, C, imm) __extension__ ({ \7167(__m256i)__builtin_ia32_pternlogd256_maskz((__v8si)(__m256i)(A), \7168(__v8si)(__m256i)(B), \7169(__v8si)(__m256i)(C), (int)(imm), \7170(__mmask8)(U)); })71717172#define _mm_ternarylogic_epi64(A, B, C, imm) __extension__ ({ \7173(__m128i)__builtin_ia32_pternlogq128_mask((__v2di)(__m128i)(A), \7174(__v2di)(__m128i)(B), \7175(__v2di)(__m128i)(C), (int)(imm), \7176(__mmask8)-1); })71777178#define _mm_mask_ternarylogic_epi64(A, U, B, C, imm) __extension__ ({ \7179(__m128i)__builtin_ia32_pternlogq128_mask((__v2di)(__m128i)(A), \7180(__v2di)(__m128i)(B), \7181(__v2di)(__m128i)(C), (int)(imm), \7182(__mmask8)(U)); })71837184#define _mm_maskz_ternarylogic_epi64(U, A, B, C, imm) __extension__ ({ \7185(__m128i)__builtin_ia32_pternlogq128_maskz((__v2di)(__m128i)(A), \7186(__v2di)(__m128i)(B), \7187(__v2di)(__m128i)(C), (int)(imm), \7188(__mmask8)(U)); })71897190#define _mm256_ternarylogic_epi64(A, B, C, imm) __extension__ ({ \7191(__m256i)__builtin_ia32_pternlogq256_mask((__v4di)(__m256i)(A), \7192(__v4di)(__m256i)(B), \7193(__v4di)(__m256i)(C), (int)(imm), \7194(__mmask8)-1); })71957196#define _mm256_mask_ternarylogic_epi64(A, U, B, C, imm) __extension__ ({ \7197(__m256i)__builtin_ia32_pternlogq256_mask((__v4di)(__m256i)(A), \7198(__v4di)(__m256i)(B), \7199(__v4di)(__m256i)(C), (int)(imm), \7200(__mmask8)(U)); })72017202#define _mm256_maskz_ternarylogic_epi64(U, A, B, C, imm) __extension__ ({ \7203(__m256i)__builtin_ia32_pternlogq256_maskz((__v4di)(__m256i)(A), \7204(__v4di)(__m256i)(B), \7205(__v4di)(__m256i)(C), (int)(imm), \7206(__mmask8)(U)); })7207720872097210#define _mm256_shuffle_f32x4(A, B, imm) __extension__ ({ \7211(__m256)__builtin_ia32_shuf_f32x4_256_mask((__v8sf)(__m256)(A), \7212(__v8sf)(__m256)(B), (int)(imm), \7213(__v8sf)_mm256_setzero_ps(), \7214(__mmask8)-1); })72157216#define _mm256_mask_shuffle_f32x4(W, U, A, B, imm) __extension__ ({ \7217(__m256)__builtin_ia32_shuf_f32x4_256_mask((__v8sf)(__m256)(A), \7218(__v8sf)(__m256)(B), (int)(imm), \7219(__v8sf)(__m256)(W), \7220(__mmask8)(U)); })72217222#define _mm256_maskz_shuffle_f32x4(U, A, B, imm) __extension__ ({ \7223(__m256)__builtin_ia32_shuf_f32x4_256_mask((__v8sf)(__m256)(A), \7224(__v8sf)(__m256)(B), (int)(imm), \7225(__v8sf)_mm256_setzero_ps(), \7226(__mmask8)(U)); })72277228#define _mm256_shuffle_f64x2(A, B, imm) __extension__ ({ \7229(__m256d)__builtin_ia32_shuf_f64x2_256_mask((__v4df)(__m256d)(A), \7230(__v4df)(__m256d)(B), \7231(int)(imm), \7232(__v4df)_mm256_setzero_pd(), \7233(__mmask8)-1); })72347235#define _mm256_mask_shuffle_f64x2(W, U, A, B, imm) __extension__ ({ \7236(__m256d)__builtin_ia32_shuf_f64x2_256_mask((__v4df)(__m256d)(A), \7237(__v4df)(__m256d)(B), \7238(int)(imm), \7239(__v4df)(__m256d)(W), \7240(__mmask8)(U)); })72417242#define _mm256_maskz_shuffle_f64x2(U, A, B, imm) __extension__ ({ \7243(__m256d)__builtin_ia32_shuf_f64x2_256_mask((__v4df)(__m256d)(A), \7244(__v4df)(__m256d)(B), \7245(int)(imm), \7246(__v4df)_mm256_setzero_pd(), \7247(__mmask8)(U)); })72487249#define _mm256_shuffle_i32x4(A, B, imm) __extension__ ({ \7250(__m256i)__builtin_ia32_shuf_i32x4_256_mask((__v8si)(__m256i)(A), \7251(__v8si)(__m256i)(B), \7252(int)(imm), \7253(__v8si)_mm256_setzero_si256(), \7254(__mmask8)-1); })72557256#define _mm256_mask_shuffle_i32x4(W, U, A, B, imm) __extension__ ({ \7257(__m256i)__builtin_ia32_shuf_i32x4_256_mask((__v8si)(__m256i)(A), \7258(__v8si)(__m256i)(B), \7259(int)(imm), \7260(__v8si)(__m256i)(W), \7261(__mmask8)(U)); })72627263#define _mm256_maskz_shuffle_i32x4(U, A, B, imm) __extension__ ({ \7264(__m256i)__builtin_ia32_shuf_i32x4_256_mask((__v8si)(__m256i)(A), \7265(__v8si)(__m256i)(B), \7266(int)(imm), \7267(__v8si)_mm256_setzero_si256(), \7268(__mmask8)(U)); })72697270#define _mm256_shuffle_i64x2(A, B, imm) __extension__ ({ \7271(__m256i)__builtin_ia32_shuf_i64x2_256_mask((__v4di)(__m256i)(A), \7272(__v4di)(__m256i)(B), \7273(int)(imm), \7274(__v4di)_mm256_setzero_si256(), \7275(__mmask8)-1); })72767277#define _mm256_mask_shuffle_i64x2(W, U, A, B, imm) __extension__ ({ \7278(__m256i)__builtin_ia32_shuf_i64x2_256_mask((__v4di)(__m256i)(A), \7279(__v4di)(__m256i)(B), \7280(int)(imm), \7281(__v4di)(__m256i)(W), \7282(__mmask8)(U)); })72837284#define _mm256_maskz_shuffle_i64x2(U, A, B, imm) __extension__ ({ \7285(__m256i)__builtin_ia32_shuf_i64x2_256_mask((__v4di)(__m256i)(A), \7286(__v4di)(__m256i)(B), \7287(int)(imm), \7288(__v4di)_mm256_setzero_si256(), \7289(__mmask8)(U)); })72907291#define _mm_mask_shuffle_pd(W, U, A, B, M) __extension__ ({ \7292(__m128d)__builtin_ia32_selectpd_128((__mmask8)(U), \7293(__v2df)_mm_shuffle_pd((A), (B), (M)), \7294(__v2df)(__m128d)(W)); })72957296#define _mm_maskz_shuffle_pd(U, A, B, M) __extension__ ({ \7297(__m128d)__builtin_ia32_selectpd_128((__mmask8)(U), \7298(__v2df)_mm_shuffle_pd((A), (B), (M)), \7299(__v2df)_mm_setzero_pd()); })73007301#define _mm256_mask_shuffle_pd(W, U, A, B, M) __extension__ ({ \7302(__m256d)__builtin_ia32_selectpd_256((__mmask8)(U), \7303(__v4df)_mm256_shuffle_pd((A), (B), (M)), \7304(__v4df)(__m256d)(W)); })73057306#define _mm256_maskz_shuffle_pd(U, A, B, M) __extension__ ({ \7307(__m256d)__builtin_ia32_selectpd_256((__mmask8)(U), \7308(__v4df)_mm256_shuffle_pd((A), (B), (M)), \7309(__v4df)_mm256_setzero_pd()); })73107311#define _mm_mask_shuffle_ps(W, U, A, B, M) __extension__ ({ \7312(__m128)__builtin_ia32_selectps_128((__mmask8)(U), \7313(__v4sf)_mm_shuffle_ps((A), (B), (M)), \7314(__v4sf)(__m128)(W)); })73157316#define _mm_maskz_shuffle_ps(U, A, B, M) __extension__ ({ \7317(__m128)__builtin_ia32_selectps_128((__mmask8)(U), \7318(__v4sf)_mm_shuffle_ps((A), (B), (M)), \7319(__v4sf)_mm_setzero_ps()); })73207321#define _mm256_mask_shuffle_ps(W, U, A, B, M) __extension__ ({ \7322(__m256)__builtin_ia32_selectps_256((__mmask8)(U), \7323(__v8sf)_mm256_shuffle_ps((A), (B), (M)), \7324(__v8sf)(__m256)(W)); })73257326#define _mm256_maskz_shuffle_ps(U, A, B, M) __extension__ ({ \7327(__m256)__builtin_ia32_selectps_256((__mmask8)(U), \7328(__v8sf)_mm256_shuffle_ps((A), (B), (M)), \7329(__v8sf)_mm256_setzero_ps()); })73307331static __inline__ __m128d __DEFAULT_FN_ATTRS7332_mm_rsqrt14_pd (__m128d __A)7333{7334return (__m128d) __builtin_ia32_rsqrt14pd128_mask ((__v2df) __A,7335(__v2df)7336_mm_setzero_pd (),7337(__mmask8) -1);7338}73397340static __inline__ __m128d __DEFAULT_FN_ATTRS7341_mm_mask_rsqrt14_pd (__m128d __W, __mmask8 __U, __m128d __A)7342{7343return (__m128d) __builtin_ia32_rsqrt14pd128_mask ((__v2df) __A,7344(__v2df) __W,7345(__mmask8) __U);7346}73477348static __inline__ __m128d __DEFAULT_FN_ATTRS7349_mm_maskz_rsqrt14_pd (__mmask8 __U, __m128d __A)7350{7351return (__m128d) __builtin_ia32_rsqrt14pd128_mask ((__v2df) __A,7352(__v2df)7353_mm_setzero_pd (),7354(__mmask8) __U);7355}73567357static __inline__ __m256d __DEFAULT_FN_ATTRS7358_mm256_rsqrt14_pd (__m256d __A)7359{7360return (__m256d) __builtin_ia32_rsqrt14pd256_mask ((__v4df) __A,7361(__v4df)7362_mm256_setzero_pd (),7363(__mmask8) -1);7364}73657366static __inline__ __m256d __DEFAULT_FN_ATTRS7367_mm256_mask_rsqrt14_pd (__m256d __W, __mmask8 __U, __m256d __A)7368{7369return (__m256d) __builtin_ia32_rsqrt14pd256_mask ((__v4df) __A,7370(__v4df) __W,7371(__mmask8) __U);7372}73737374static __inline__ __m256d __DEFAULT_FN_ATTRS7375_mm256_maskz_rsqrt14_pd (__mmask8 __U, __m256d __A)7376{7377return (__m256d) __builtin_ia32_rsqrt14pd256_mask ((__v4df) __A,7378(__v4df)7379_mm256_setzero_pd (),7380(__mmask8) __U);7381}73827383static __inline__ __m128 __DEFAULT_FN_ATTRS7384_mm_rsqrt14_ps (__m128 __A)7385{7386return (__m128) __builtin_ia32_rsqrt14ps128_mask ((__v4sf) __A,7387(__v4sf)7388_mm_setzero_ps (),7389(__mmask8) -1);7390}73917392static __inline__ __m128 __DEFAULT_FN_ATTRS7393_mm_mask_rsqrt14_ps (__m128 __W, __mmask8 __U, __m128 __A)7394{7395return (__m128) __builtin_ia32_rsqrt14ps128_mask ((__v4sf) __A,7396(__v4sf) __W,7397(__mmask8) __U);7398}73997400static __inline__ __m128 __DEFAULT_FN_ATTRS7401_mm_maskz_rsqrt14_ps (__mmask8 __U, __m128 __A)7402{7403return (__m128) __builtin_ia32_rsqrt14ps128_mask ((__v4sf) __A,7404(__v4sf)7405_mm_setzero_ps (),7406(__mmask8) __U);7407}74087409static __inline__ __m256 __DEFAULT_FN_ATTRS7410_mm256_rsqrt14_ps (__m256 __A)7411{7412return (__m256) __builtin_ia32_rsqrt14ps256_mask ((__v8sf) __A,7413(__v8sf)7414_mm256_setzero_ps (),7415(__mmask8) -1);7416}74177418static __inline__ __m256 __DEFAULT_FN_ATTRS7419_mm256_mask_rsqrt14_ps (__m256 __W, __mmask8 __U, __m256 __A)7420{7421return (__m256) __builtin_ia32_rsqrt14ps256_mask ((__v8sf) __A,7422(__v8sf) __W,7423(__mmask8) __U);7424}74257426static __inline__ __m256 __DEFAULT_FN_ATTRS7427_mm256_maskz_rsqrt14_ps (__mmask8 __U, __m256 __A)7428{7429return (__m256) __builtin_ia32_rsqrt14ps256_mask ((__v8sf) __A,7430(__v8sf)7431_mm256_setzero_ps (),7432(__mmask8) __U);7433}74347435static __inline__ __m256 __DEFAULT_FN_ATTRS7436_mm256_broadcast_f32x4 (__m128 __A)7437{7438return (__m256) __builtin_ia32_broadcastf32x4_256_mask ((__v4sf) __A,7439(__v8sf)_mm256_undefined_pd (),7440(__mmask8) -1);7441}74427443static __inline__ __m256 __DEFAULT_FN_ATTRS7444_mm256_mask_broadcast_f32x4 (__m256 __O, __mmask8 __M, __m128 __A)7445{7446return (__m256) __builtin_ia32_broadcastf32x4_256_mask ((__v4sf) __A,7447(__v8sf) __O,7448__M);7449}74507451static __inline__ __m256 __DEFAULT_FN_ATTRS7452_mm256_maskz_broadcast_f32x4 (__mmask8 __M, __m128 __A)7453{7454return (__m256) __builtin_ia32_broadcastf32x4_256_mask ((__v4sf) __A,7455(__v8sf) _mm256_setzero_ps (),7456__M);7457}74587459static __inline__ __m256i __DEFAULT_FN_ATTRS7460_mm256_broadcast_i32x4 (__m128i __A)7461{7462return (__m256i) __builtin_ia32_broadcasti32x4_256_mask ((__v4si) __A,7463(__v8si)_mm256_undefined_si256 (),7464(__mmask8) -1);7465}74667467static __inline__ __m256i __DEFAULT_FN_ATTRS7468_mm256_mask_broadcast_i32x4 (__m256i __O, __mmask8 __M, __m128i __A)7469{7470return (__m256i) __builtin_ia32_broadcasti32x4_256_mask ((__v4si) __A,7471(__v8si)7472__O, __M);7473}74747475static __inline__ __m256i __DEFAULT_FN_ATTRS7476_mm256_maskz_broadcast_i32x4 (__mmask8 __M, __m128i __A)7477{7478return (__m256i) __builtin_ia32_broadcasti32x4_256_mask ((__v4si)7479__A,7480(__v8si) _mm256_setzero_si256 (),7481__M);7482}74837484static __inline__ __m256d __DEFAULT_FN_ATTRS7485_mm256_mask_broadcastsd_pd (__m256d __O, __mmask8 __M, __m128d __A)7486{7487return (__m256d)__builtin_ia32_selectpd_256(__M,7488(__v4df) _mm256_broadcastsd_pd(__A),7489(__v4df) __O);7490}74917492static __inline__ __m256d __DEFAULT_FN_ATTRS7493_mm256_maskz_broadcastsd_pd (__mmask8 __M, __m128d __A)7494{7495return (__m256d)__builtin_ia32_selectpd_256(__M,7496(__v4df) _mm256_broadcastsd_pd(__A),7497(__v4df) _mm256_setzero_pd());7498}74997500static __inline__ __m128 __DEFAULT_FN_ATTRS7501_mm_mask_broadcastss_ps (__m128 __O, __mmask8 __M, __m128 __A)7502{7503return (__m128)__builtin_ia32_selectps_128(__M,7504(__v4sf) _mm_broadcastss_ps(__A),7505(__v4sf) __O);7506}75077508static __inline__ __m128 __DEFAULT_FN_ATTRS7509_mm_maskz_broadcastss_ps (__mmask8 __M, __m128 __A)7510{7511return (__m128)__builtin_ia32_selectps_128(__M,7512(__v4sf) _mm_broadcastss_ps(__A),7513(__v4sf) _mm_setzero_ps());7514}75157516static __inline__ __m256 __DEFAULT_FN_ATTRS7517_mm256_mask_broadcastss_ps (__m256 __O, __mmask8 __M, __m128 __A)7518{7519return (__m256)__builtin_ia32_selectps_256(__M,7520(__v8sf) _mm256_broadcastss_ps(__A),7521(__v8sf) __O);7522}75237524static __inline__ __m256 __DEFAULT_FN_ATTRS7525_mm256_maskz_broadcastss_ps (__mmask8 __M, __m128 __A)7526{7527return (__m256)__builtin_ia32_selectps_256(__M,7528(__v8sf) _mm256_broadcastss_ps(__A),7529(__v8sf) _mm256_setzero_ps());7530}75317532static __inline__ __m128i __DEFAULT_FN_ATTRS7533_mm_mask_broadcastd_epi32 (__m128i __O, __mmask8 __M, __m128i __A)7534{7535return (__m128i)__builtin_ia32_selectd_128(__M,7536(__v4si) _mm_broadcastd_epi32(__A),7537(__v4si) __O);7538}75397540static __inline__ __m128i __DEFAULT_FN_ATTRS7541_mm_maskz_broadcastd_epi32 (__mmask8 __M, __m128i __A)7542{7543return (__m128i)__builtin_ia32_selectd_128(__M,7544(__v4si) _mm_broadcastd_epi32(__A),7545(__v4si) _mm_setzero_si128());7546}75477548static __inline__ __m256i __DEFAULT_FN_ATTRS7549_mm256_mask_broadcastd_epi32 (__m256i __O, __mmask8 __M, __m128i __A)7550{7551return (__m256i)__builtin_ia32_selectd_256(__M,7552(__v8si) _mm256_broadcastd_epi32(__A),7553(__v8si) __O);7554}75557556static __inline__ __m256i __DEFAULT_FN_ATTRS7557_mm256_maskz_broadcastd_epi32 (__mmask8 __M, __m128i __A)7558{7559return (__m256i)__builtin_ia32_selectd_256(__M,7560(__v8si) _mm256_broadcastd_epi32(__A),7561(__v8si) _mm256_setzero_si256());7562}75637564static __inline__ __m128i __DEFAULT_FN_ATTRS7565_mm_mask_broadcastq_epi64 (__m128i __O, __mmask8 __M, __m128i __A)7566{7567return (__m128i)__builtin_ia32_selectq_128(__M,7568(__v2di) _mm_broadcastq_epi64(__A),7569(__v2di) __O);7570}75717572static __inline__ __m128i __DEFAULT_FN_ATTRS7573_mm_maskz_broadcastq_epi64 (__mmask8 __M, __m128i __A)7574{7575return (__m128i)__builtin_ia32_selectq_128(__M,7576(__v2di) _mm_broadcastq_epi64(__A),7577(__v2di) _mm_setzero_si128());7578}75797580static __inline__ __m256i __DEFAULT_FN_ATTRS7581_mm256_mask_broadcastq_epi64 (__m256i __O, __mmask8 __M, __m128i __A)7582{7583return (__m256i)__builtin_ia32_selectq_256(__M,7584(__v4di) _mm256_broadcastq_epi64(__A),7585(__v4di) __O);7586}75877588static __inline__ __m256i __DEFAULT_FN_ATTRS7589_mm256_maskz_broadcastq_epi64 (__mmask8 __M, __m128i __A)7590{7591return (__m256i)__builtin_ia32_selectq_256(__M,7592(__v4di) _mm256_broadcastq_epi64(__A),7593(__v4di) _mm256_setzero_si256());7594}75957596static __inline__ __m128i __DEFAULT_FN_ATTRS7597_mm_cvtsepi32_epi8 (__m128i __A)7598{7599return (__m128i) __builtin_ia32_pmovsdb128_mask ((__v4si) __A,7600(__v16qi)_mm_undefined_si128(),7601(__mmask8) -1);7602}76037604static __inline__ __m128i __DEFAULT_FN_ATTRS7605_mm_mask_cvtsepi32_epi8 (__m128i __O, __mmask8 __M, __m128i __A)7606{7607return (__m128i) __builtin_ia32_pmovsdb128_mask ((__v4si) __A,7608(__v16qi) __O, __M);7609}76107611static __inline__ __m128i __DEFAULT_FN_ATTRS7612_mm_maskz_cvtsepi32_epi8 (__mmask8 __M, __m128i __A)7613{7614return (__m128i) __builtin_ia32_pmovsdb128_mask ((__v4si) __A,7615(__v16qi) _mm_setzero_si128 (),7616__M);7617}76187619static __inline__ void __DEFAULT_FN_ATTRS7620_mm_mask_cvtsepi32_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)7621{7622__builtin_ia32_pmovsdb128mem_mask ((__v16qi *) __P, (__v4si) __A, __M);7623}76247625static __inline__ __m128i __DEFAULT_FN_ATTRS7626_mm256_cvtsepi32_epi8 (__m256i __A)7627{7628return (__m128i) __builtin_ia32_pmovsdb256_mask ((__v8si) __A,7629(__v16qi)_mm_undefined_si128(),7630(__mmask8) -1);7631}76327633static __inline__ __m128i __DEFAULT_FN_ATTRS7634_mm256_mask_cvtsepi32_epi8 (__m128i __O, __mmask8 __M, __m256i __A)7635{7636return (__m128i) __builtin_ia32_pmovsdb256_mask ((__v8si) __A,7637(__v16qi) __O, __M);7638}76397640static __inline__ __m128i __DEFAULT_FN_ATTRS7641_mm256_maskz_cvtsepi32_epi8 (__mmask8 __M, __m256i __A)7642{7643return (__m128i) __builtin_ia32_pmovsdb256_mask ((__v8si) __A,7644(__v16qi) _mm_setzero_si128 (),7645__M);7646}76477648static __inline__ void __DEFAULT_FN_ATTRS7649_mm256_mask_cvtsepi32_storeu_epi8 (void * __P, __mmask8 __M, __m256i __A)7650{7651__builtin_ia32_pmovsdb256mem_mask ((__v16qi *) __P, (__v8si) __A, __M);7652}76537654static __inline__ __m128i __DEFAULT_FN_ATTRS7655_mm_cvtsepi32_epi16 (__m128i __A)7656{7657return (__m128i) __builtin_ia32_pmovsdw128_mask ((__v4si) __A,7658(__v8hi)_mm_setzero_si128 (),7659(__mmask8) -1);7660}76617662static __inline__ __m128i __DEFAULT_FN_ATTRS7663_mm_mask_cvtsepi32_epi16 (__m128i __O, __mmask8 __M, __m128i __A)7664{7665return (__m128i) __builtin_ia32_pmovsdw128_mask ((__v4si) __A,7666(__v8hi)__O,7667__M);7668}76697670static __inline__ __m128i __DEFAULT_FN_ATTRS7671_mm_maskz_cvtsepi32_epi16 (__mmask8 __M, __m128i __A)7672{7673return (__m128i) __builtin_ia32_pmovsdw128_mask ((__v4si) __A,7674(__v8hi) _mm_setzero_si128 (),7675__M);7676}76777678static __inline__ void __DEFAULT_FN_ATTRS7679_mm_mask_cvtsepi32_storeu_epi16 (void * __P, __mmask8 __M, __m128i __A)7680{7681__builtin_ia32_pmovsdw128mem_mask ((__v8hi *) __P, (__v4si) __A, __M);7682}76837684static __inline__ __m128i __DEFAULT_FN_ATTRS7685_mm256_cvtsepi32_epi16 (__m256i __A)7686{7687return (__m128i) __builtin_ia32_pmovsdw256_mask ((__v8si) __A,7688(__v8hi)_mm_undefined_si128(),7689(__mmask8) -1);7690}76917692static __inline__ __m128i __DEFAULT_FN_ATTRS7693_mm256_mask_cvtsepi32_epi16 (__m128i __O, __mmask8 __M, __m256i __A)7694{7695return (__m128i) __builtin_ia32_pmovsdw256_mask ((__v8si) __A,7696(__v8hi) __O, __M);7697}76987699static __inline__ __m128i __DEFAULT_FN_ATTRS7700_mm256_maskz_cvtsepi32_epi16 (__mmask8 __M, __m256i __A)7701{7702return (__m128i) __builtin_ia32_pmovsdw256_mask ((__v8si) __A,7703(__v8hi) _mm_setzero_si128 (),7704__M);7705}77067707static __inline__ void __DEFAULT_FN_ATTRS7708_mm256_mask_cvtsepi32_storeu_epi16 (void * __P, __mmask8 __M, __m256i __A)7709{7710__builtin_ia32_pmovsdw256mem_mask ((__v8hi *) __P, (__v8si) __A, __M);7711}77127713static __inline__ __m128i __DEFAULT_FN_ATTRS7714_mm_cvtsepi64_epi8 (__m128i __A)7715{7716return (__m128i) __builtin_ia32_pmovsqb128_mask ((__v2di) __A,7717(__v16qi)_mm_undefined_si128(),7718(__mmask8) -1);7719}77207721static __inline__ __m128i __DEFAULT_FN_ATTRS7722_mm_mask_cvtsepi64_epi8 (__m128i __O, __mmask8 __M, __m128i __A)7723{7724return (__m128i) __builtin_ia32_pmovsqb128_mask ((__v2di) __A,7725(__v16qi) __O, __M);7726}77277728static __inline__ __m128i __DEFAULT_FN_ATTRS7729_mm_maskz_cvtsepi64_epi8 (__mmask8 __M, __m128i __A)7730{7731return (__m128i) __builtin_ia32_pmovsqb128_mask ((__v2di) __A,7732(__v16qi) _mm_setzero_si128 (),7733__M);7734}77357736static __inline__ void __DEFAULT_FN_ATTRS7737_mm_mask_cvtsepi64_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)7738{7739__builtin_ia32_pmovsqb128mem_mask ((__v16qi *) __P, (__v2di) __A, __M);7740}77417742static __inline__ __m128i __DEFAULT_FN_ATTRS7743_mm256_cvtsepi64_epi8 (__m256i __A)7744{7745return (__m128i) __builtin_ia32_pmovsqb256_mask ((__v4di) __A,7746(__v16qi)_mm_undefined_si128(),7747(__mmask8) -1);7748}77497750static __inline__ __m128i __DEFAULT_FN_ATTRS7751_mm256_mask_cvtsepi64_epi8 (__m128i __O, __mmask8 __M, __m256i __A)7752{7753return (__m128i) __builtin_ia32_pmovsqb256_mask ((__v4di) __A,7754(__v16qi) __O, __M);7755}77567757static __inline__ __m128i __DEFAULT_FN_ATTRS7758_mm256_maskz_cvtsepi64_epi8 (__mmask8 __M, __m256i __A)7759{7760return (__m128i) __builtin_ia32_pmovsqb256_mask ((__v4di) __A,7761(__v16qi) _mm_setzero_si128 (),7762__M);7763}77647765static __inline__ void __DEFAULT_FN_ATTRS7766_mm256_mask_cvtsepi64_storeu_epi8 (void * __P, __mmask8 __M, __m256i __A)7767{7768__builtin_ia32_pmovsqb256mem_mask ((__v16qi *) __P, (__v4di) __A, __M);7769}77707771static __inline__ __m128i __DEFAULT_FN_ATTRS7772_mm_cvtsepi64_epi32 (__m128i __A)7773{7774return (__m128i) __builtin_ia32_pmovsqd128_mask ((__v2di) __A,7775(__v4si)_mm_undefined_si128(),7776(__mmask8) -1);7777}77787779static __inline__ __m128i __DEFAULT_FN_ATTRS7780_mm_mask_cvtsepi64_epi32 (__m128i __O, __mmask8 __M, __m128i __A)7781{7782return (__m128i) __builtin_ia32_pmovsqd128_mask ((__v2di) __A,7783(__v4si) __O, __M);7784}77857786static __inline__ __m128i __DEFAULT_FN_ATTRS7787_mm_maskz_cvtsepi64_epi32 (__mmask8 __M, __m128i __A)7788{7789return (__m128i) __builtin_ia32_pmovsqd128_mask ((__v2di) __A,7790(__v4si) _mm_setzero_si128 (),7791__M);7792}77937794static __inline__ void __DEFAULT_FN_ATTRS7795_mm_mask_cvtsepi64_storeu_epi32 (void * __P, __mmask8 __M, __m128i __A)7796{7797__builtin_ia32_pmovsqd128mem_mask ((__v4si *) __P, (__v2di) __A, __M);7798}77997800static __inline__ __m128i __DEFAULT_FN_ATTRS7801_mm256_cvtsepi64_epi32 (__m256i __A)7802{7803return (__m128i) __builtin_ia32_pmovsqd256_mask ((__v4di) __A,7804(__v4si)_mm_undefined_si128(),7805(__mmask8) -1);7806}78077808static __inline__ __m128i __DEFAULT_FN_ATTRS7809_mm256_mask_cvtsepi64_epi32 (__m128i __O, __mmask8 __M, __m256i __A)7810{7811return (__m128i) __builtin_ia32_pmovsqd256_mask ((__v4di) __A,7812(__v4si)__O,7813__M);7814}78157816static __inline__ __m128i __DEFAULT_FN_ATTRS7817_mm256_maskz_cvtsepi64_epi32 (__mmask8 __M, __m256i __A)7818{7819return (__m128i) __builtin_ia32_pmovsqd256_mask ((__v4di) __A,7820(__v4si) _mm_setzero_si128 (),7821__M);7822}78237824static __inline__ void __DEFAULT_FN_ATTRS7825_mm256_mask_cvtsepi64_storeu_epi32 (void * __P, __mmask8 __M, __m256i __A)7826{7827__builtin_ia32_pmovsqd256mem_mask ((__v4si *) __P, (__v4di) __A, __M);7828}78297830static __inline__ __m128i __DEFAULT_FN_ATTRS7831_mm_cvtsepi64_epi16 (__m128i __A)7832{7833return (__m128i) __builtin_ia32_pmovsqw128_mask ((__v2di) __A,7834(__v8hi)_mm_undefined_si128(),7835(__mmask8) -1);7836}78377838static __inline__ __m128i __DEFAULT_FN_ATTRS7839_mm_mask_cvtsepi64_epi16 (__m128i __O, __mmask8 __M, __m128i __A)7840{7841return (__m128i) __builtin_ia32_pmovsqw128_mask ((__v2di) __A,7842(__v8hi) __O, __M);7843}78447845static __inline__ __m128i __DEFAULT_FN_ATTRS7846_mm_maskz_cvtsepi64_epi16 (__mmask8 __M, __m128i __A)7847{7848return (__m128i) __builtin_ia32_pmovsqw128_mask ((__v2di) __A,7849(__v8hi) _mm_setzero_si128 (),7850__M);7851}78527853static __inline__ void __DEFAULT_FN_ATTRS7854_mm_mask_cvtsepi64_storeu_epi16 (void * __P, __mmask8 __M, __m128i __A)7855{7856__builtin_ia32_pmovsqw128mem_mask ((__v8hi *) __P, (__v2di) __A, __M);7857}78587859static __inline__ __m128i __DEFAULT_FN_ATTRS7860_mm256_cvtsepi64_epi16 (__m256i __A)7861{7862return (__m128i) __builtin_ia32_pmovsqw256_mask ((__v4di) __A,7863(__v8hi)_mm_undefined_si128(),7864(__mmask8) -1);7865}78667867static __inline__ __m128i __DEFAULT_FN_ATTRS7868_mm256_mask_cvtsepi64_epi16 (__m128i __O, __mmask8 __M, __m256i __A)7869{7870return (__m128i) __builtin_ia32_pmovsqw256_mask ((__v4di) __A,7871(__v8hi) __O, __M);7872}78737874static __inline__ __m128i __DEFAULT_FN_ATTRS7875_mm256_maskz_cvtsepi64_epi16 (__mmask8 __M, __m256i __A)7876{7877return (__m128i) __builtin_ia32_pmovsqw256_mask ((__v4di) __A,7878(__v8hi) _mm_setzero_si128 (),7879__M);7880}78817882static __inline__ void __DEFAULT_FN_ATTRS7883_mm256_mask_cvtsepi64_storeu_epi16 (void * __P, __mmask8 __M, __m256i __A)7884{7885__builtin_ia32_pmovsqw256mem_mask ((__v8hi *) __P, (__v4di) __A, __M);7886}78877888static __inline__ __m128i __DEFAULT_FN_ATTRS7889_mm_cvtusepi32_epi8 (__m128i __A)7890{7891return (__m128i) __builtin_ia32_pmovusdb128_mask ((__v4si) __A,7892(__v16qi)_mm_undefined_si128(),7893(__mmask8) -1);7894}78957896static __inline__ __m128i __DEFAULT_FN_ATTRS7897_mm_mask_cvtusepi32_epi8 (__m128i __O, __mmask8 __M, __m128i __A)7898{7899return (__m128i) __builtin_ia32_pmovusdb128_mask ((__v4si) __A,7900(__v16qi) __O,7901__M);7902}79037904static __inline__ __m128i __DEFAULT_FN_ATTRS7905_mm_maskz_cvtusepi32_epi8 (__mmask8 __M, __m128i __A)7906{7907return (__m128i) __builtin_ia32_pmovusdb128_mask ((__v4si) __A,7908(__v16qi) _mm_setzero_si128 (),7909__M);7910}79117912static __inline__ void __DEFAULT_FN_ATTRS7913_mm_mask_cvtusepi32_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)7914{7915__builtin_ia32_pmovusdb128mem_mask ((__v16qi *) __P, (__v4si) __A, __M);7916}79177918static __inline__ __m128i __DEFAULT_FN_ATTRS7919_mm256_cvtusepi32_epi8 (__m256i __A)7920{7921return (__m128i) __builtin_ia32_pmovusdb256_mask ((__v8si) __A,7922(__v16qi)_mm_undefined_si128(),7923(__mmask8) -1);7924}79257926static __inline__ __m128i __DEFAULT_FN_ATTRS7927_mm256_mask_cvtusepi32_epi8 (__m128i __O, __mmask8 __M, __m256i __A)7928{7929return (__m128i) __builtin_ia32_pmovusdb256_mask ((__v8si) __A,7930(__v16qi) __O,7931__M);7932}79337934static __inline__ __m128i __DEFAULT_FN_ATTRS7935_mm256_maskz_cvtusepi32_epi8 (__mmask8 __M, __m256i __A)7936{7937return (__m128i) __builtin_ia32_pmovusdb256_mask ((__v8si) __A,7938(__v16qi) _mm_setzero_si128 (),7939__M);7940}79417942static __inline__ void __DEFAULT_FN_ATTRS7943_mm256_mask_cvtusepi32_storeu_epi8 (void * __P, __mmask8 __M, __m256i __A)7944{7945__builtin_ia32_pmovusdb256mem_mask ((__v16qi*) __P, (__v8si) __A, __M);7946}79477948static __inline__ __m128i __DEFAULT_FN_ATTRS7949_mm_cvtusepi32_epi16 (__m128i __A)7950{7951return (__m128i) __builtin_ia32_pmovusdw128_mask ((__v4si) __A,7952(__v8hi)_mm_undefined_si128(),7953(__mmask8) -1);7954}79557956static __inline__ __m128i __DEFAULT_FN_ATTRS7957_mm_mask_cvtusepi32_epi16 (__m128i __O, __mmask8 __M, __m128i __A)7958{7959return (__m128i) __builtin_ia32_pmovusdw128_mask ((__v4si) __A,7960(__v8hi) __O, __M);7961}79627963static __inline__ __m128i __DEFAULT_FN_ATTRS7964_mm_maskz_cvtusepi32_epi16 (__mmask8 __M, __m128i __A)7965{7966return (__m128i) __builtin_ia32_pmovusdw128_mask ((__v4si) __A,7967(__v8hi) _mm_setzero_si128 (),7968__M);7969}79707971static __inline__ void __DEFAULT_FN_ATTRS7972_mm_mask_cvtusepi32_storeu_epi16 (void * __P, __mmask8 __M, __m128i __A)7973{7974__builtin_ia32_pmovusdw128mem_mask ((__v8hi *) __P, (__v4si) __A, __M);7975}79767977static __inline__ __m128i __DEFAULT_FN_ATTRS7978_mm256_cvtusepi32_epi16 (__m256i __A)7979{7980return (__m128i) __builtin_ia32_pmovusdw256_mask ((__v8si) __A,7981(__v8hi) _mm_undefined_si128(),7982(__mmask8) -1);7983}79847985static __inline__ __m128i __DEFAULT_FN_ATTRS7986_mm256_mask_cvtusepi32_epi16 (__m128i __O, __mmask8 __M, __m256i __A)7987{7988return (__m128i) __builtin_ia32_pmovusdw256_mask ((__v8si) __A,7989(__v8hi) __O, __M);7990}79917992static __inline__ __m128i __DEFAULT_FN_ATTRS7993_mm256_maskz_cvtusepi32_epi16 (__mmask8 __M, __m256i __A)7994{7995return (__m128i) __builtin_ia32_pmovusdw256_mask ((__v8si) __A,7996(__v8hi) _mm_setzero_si128 (),7997__M);7998}79998000static __inline__ void __DEFAULT_FN_ATTRS8001_mm256_mask_cvtusepi32_storeu_epi16 (void * __P, __mmask8 __M, __m256i __A)8002{8003__builtin_ia32_pmovusdw256mem_mask ((__v8hi *) __P, (__v8si) __A, __M);8004}80058006static __inline__ __m128i __DEFAULT_FN_ATTRS8007_mm_cvtusepi64_epi8 (__m128i __A)8008{8009return (__m128i) __builtin_ia32_pmovusqb128_mask ((__v2di) __A,8010(__v16qi)_mm_undefined_si128(),8011(__mmask8) -1);8012}80138014static __inline__ __m128i __DEFAULT_FN_ATTRS8015_mm_mask_cvtusepi64_epi8 (__m128i __O, __mmask8 __M, __m128i __A)8016{8017return (__m128i) __builtin_ia32_pmovusqb128_mask ((__v2di) __A,8018(__v16qi) __O,8019__M);8020}80218022static __inline__ __m128i __DEFAULT_FN_ATTRS8023_mm_maskz_cvtusepi64_epi8 (__mmask8 __M, __m128i __A)8024{8025return (__m128i) __builtin_ia32_pmovusqb128_mask ((__v2di) __A,8026(__v16qi) _mm_setzero_si128 (),8027__M);8028}80298030static __inline__ void __DEFAULT_FN_ATTRS8031_mm_mask_cvtusepi64_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)8032{8033__builtin_ia32_pmovusqb128mem_mask ((__v16qi *) __P, (__v2di) __A, __M);8034}80358036static __inline__ __m128i __DEFAULT_FN_ATTRS8037_mm256_cvtusepi64_epi8 (__m256i __A)8038{8039return (__m128i) __builtin_ia32_pmovusqb256_mask ((__v4di) __A,8040(__v16qi)_mm_undefined_si128(),8041(__mmask8) -1);8042}80438044static __inline__ __m128i __DEFAULT_FN_ATTRS8045_mm256_mask_cvtusepi64_epi8 (__m128i __O, __mmask8 __M, __m256i __A)8046{8047return (__m128i) __builtin_ia32_pmovusqb256_mask ((__v4di) __A,8048(__v16qi) __O,8049__M);8050}80518052static __inline__ __m128i __DEFAULT_FN_ATTRS8053_mm256_maskz_cvtusepi64_epi8 (__mmask8 __M, __m256i __A)8054{8055return (__m128i) __builtin_ia32_pmovusqb256_mask ((__v4di) __A,8056(__v16qi) _mm_setzero_si128 (),8057__M);8058}80598060static __inline__ void __DEFAULT_FN_ATTRS8061_mm256_mask_cvtusepi64_storeu_epi8 (void * __P, __mmask8 __M, __m256i __A)8062{8063__builtin_ia32_pmovusqb256mem_mask ((__v16qi *) __P, (__v4di) __A, __M);8064}80658066static __inline__ __m128i __DEFAULT_FN_ATTRS8067_mm_cvtusepi64_epi32 (__m128i __A)8068{8069return (__m128i) __builtin_ia32_pmovusqd128_mask ((__v2di) __A,8070(__v4si)_mm_undefined_si128(),8071(__mmask8) -1);8072}80738074static __inline__ __m128i __DEFAULT_FN_ATTRS8075_mm_mask_cvtusepi64_epi32 (__m128i __O, __mmask8 __M, __m128i __A)8076{8077return (__m128i) __builtin_ia32_pmovusqd128_mask ((__v2di) __A,8078(__v4si) __O, __M);8079}80808081static __inline__ __m128i __DEFAULT_FN_ATTRS8082_mm_maskz_cvtusepi64_epi32 (__mmask8 __M, __m128i __A)8083{8084return (__m128i) __builtin_ia32_pmovusqd128_mask ((__v2di) __A,8085(__v4si) _mm_setzero_si128 (),8086__M);8087}80888089static __inline__ void __DEFAULT_FN_ATTRS8090_mm_mask_cvtusepi64_storeu_epi32 (void * __P, __mmask8 __M, __m128i __A)8091{8092__builtin_ia32_pmovusqd128mem_mask ((__v4si *) __P, (__v2di) __A, __M);8093}80948095static __inline__ __m128i __DEFAULT_FN_ATTRS8096_mm256_cvtusepi64_epi32 (__m256i __A)8097{8098return (__m128i) __builtin_ia32_pmovusqd256_mask ((__v4di) __A,8099(__v4si)_mm_undefined_si128(),8100(__mmask8) -1);8101}81028103static __inline__ __m128i __DEFAULT_FN_ATTRS8104_mm256_mask_cvtusepi64_epi32 (__m128i __O, __mmask8 __M, __m256i __A)8105{8106return (__m128i) __builtin_ia32_pmovusqd256_mask ((__v4di) __A,8107(__v4si) __O, __M);8108}81098110static __inline__ __m128i __DEFAULT_FN_ATTRS8111_mm256_maskz_cvtusepi64_epi32 (__mmask8 __M, __m256i __A)8112{8113return (__m128i) __builtin_ia32_pmovusqd256_mask ((__v4di) __A,8114(__v4si) _mm_setzero_si128 (),8115__M);8116}81178118static __inline__ void __DEFAULT_FN_ATTRS8119_mm256_mask_cvtusepi64_storeu_epi32 (void * __P, __mmask8 __M, __m256i __A)8120{8121__builtin_ia32_pmovusqd256mem_mask ((__v4si *) __P, (__v4di) __A, __M);8122}81238124static __inline__ __m128i __DEFAULT_FN_ATTRS8125_mm_cvtusepi64_epi16 (__m128i __A)8126{8127return (__m128i) __builtin_ia32_pmovusqw128_mask ((__v2di) __A,8128(__v8hi)_mm_undefined_si128(),8129(__mmask8) -1);8130}81318132static __inline__ __m128i __DEFAULT_FN_ATTRS8133_mm_mask_cvtusepi64_epi16 (__m128i __O, __mmask8 __M, __m128i __A)8134{8135return (__m128i) __builtin_ia32_pmovusqw128_mask ((__v2di) __A,8136(__v8hi) __O, __M);8137}81388139static __inline__ __m128i __DEFAULT_FN_ATTRS8140_mm_maskz_cvtusepi64_epi16 (__mmask8 __M, __m128i __A)8141{8142return (__m128i) __builtin_ia32_pmovusqw128_mask ((__v2di) __A,8143(__v8hi) _mm_setzero_si128 (),8144__M);8145}81468147static __inline__ void __DEFAULT_FN_ATTRS8148_mm_mask_cvtusepi64_storeu_epi16 (void * __P, __mmask8 __M, __m128i __A)8149{8150__builtin_ia32_pmovusqw128mem_mask ((__v8hi *) __P, (__v2di) __A, __M);8151}81528153static __inline__ __m128i __DEFAULT_FN_ATTRS8154_mm256_cvtusepi64_epi16 (__m256i __A)8155{8156return (__m128i) __builtin_ia32_pmovusqw256_mask ((__v4di) __A,8157(__v8hi)_mm_undefined_si128(),8158(__mmask8) -1);8159}81608161static __inline__ __m128i __DEFAULT_FN_ATTRS8162_mm256_mask_cvtusepi64_epi16 (__m128i __O, __mmask8 __M, __m256i __A)8163{8164return (__m128i) __builtin_ia32_pmovusqw256_mask ((__v4di) __A,8165(__v8hi) __O, __M);8166}81678168static __inline__ __m128i __DEFAULT_FN_ATTRS8169_mm256_maskz_cvtusepi64_epi16 (__mmask8 __M, __m256i __A)8170{8171return (__m128i) __builtin_ia32_pmovusqw256_mask ((__v4di) __A,8172(__v8hi) _mm_setzero_si128 (),8173__M);8174}81758176static __inline__ void __DEFAULT_FN_ATTRS8177_mm256_mask_cvtusepi64_storeu_epi16 (void * __P, __mmask8 __M, __m256i __A)8178{8179return __builtin_ia32_pmovusqw256mem_mask ((__v8hi *) __P, (__v4di) __A, __M);8180}81818182static __inline__ __m128i __DEFAULT_FN_ATTRS8183_mm_cvtepi32_epi8 (__m128i __A)8184{8185return (__m128i) __builtin_ia32_pmovdb128_mask ((__v4si) __A,8186(__v16qi)_mm_undefined_si128(),8187(__mmask8) -1);8188}81898190static __inline__ __m128i __DEFAULT_FN_ATTRS8191_mm_mask_cvtepi32_epi8 (__m128i __O, __mmask8 __M, __m128i __A)8192{8193return (__m128i) __builtin_ia32_pmovdb128_mask ((__v4si) __A,8194(__v16qi) __O, __M);8195}81968197static __inline__ __m128i __DEFAULT_FN_ATTRS8198_mm_maskz_cvtepi32_epi8 (__mmask8 __M, __m128i __A)8199{8200return (__m128i) __builtin_ia32_pmovdb128_mask ((__v4si) __A,8201(__v16qi)8202_mm_setzero_si128 (),8203__M);8204}82058206static __inline__ void __DEFAULT_FN_ATTRS8207_mm_mask_cvtepi32_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)8208{8209__builtin_ia32_pmovdb128mem_mask ((__v16qi *) __P, (__v4si) __A, __M);8210}82118212static __inline__ __m128i __DEFAULT_FN_ATTRS8213_mm256_cvtepi32_epi8 (__m256i __A)8214{8215return (__m128i) __builtin_ia32_pmovdb256_mask ((__v8si) __A,8216(__v16qi)_mm_undefined_si128(),8217(__mmask8) -1);8218}82198220static __inline__ __m128i __DEFAULT_FN_ATTRS8221_mm256_mask_cvtepi32_epi8 (__m128i __O, __mmask8 __M, __m256i __A)8222{8223return (__m128i) __builtin_ia32_pmovdb256_mask ((__v8si) __A,8224(__v16qi) __O, __M);8225}82268227static __inline__ __m128i __DEFAULT_FN_ATTRS8228_mm256_maskz_cvtepi32_epi8 (__mmask8 __M, __m256i __A)8229{8230return (__m128i) __builtin_ia32_pmovdb256_mask ((__v8si) __A,8231(__v16qi) _mm_setzero_si128 (),8232__M);8233}82348235static __inline__ void __DEFAULT_FN_ATTRS8236_mm256_mask_cvtepi32_storeu_epi8 (void * __P, __mmask8 __M, __m256i __A)8237{8238__builtin_ia32_pmovdb256mem_mask ((__v16qi *) __P, (__v8si) __A, __M);8239}82408241static __inline__ __m128i __DEFAULT_FN_ATTRS8242_mm_cvtepi32_epi16 (__m128i __A)8243{8244return (__m128i) __builtin_ia32_pmovdw128_mask ((__v4si) __A,8245(__v8hi) _mm_setzero_si128 (),8246(__mmask8) -1);8247}82488249static __inline__ __m128i __DEFAULT_FN_ATTRS8250_mm_mask_cvtepi32_epi16 (__m128i __O, __mmask8 __M, __m128i __A)8251{8252return (__m128i) __builtin_ia32_pmovdw128_mask ((__v4si) __A,8253(__v8hi) __O, __M);8254}82558256static __inline__ __m128i __DEFAULT_FN_ATTRS8257_mm_maskz_cvtepi32_epi16 (__mmask8 __M, __m128i __A)8258{8259return (__m128i) __builtin_ia32_pmovdw128_mask ((__v4si) __A,8260(__v8hi) _mm_setzero_si128 (),8261__M);8262}82638264static __inline__ void __DEFAULT_FN_ATTRS8265_mm_mask_cvtepi32_storeu_epi16 (void * __P, __mmask8 __M, __m128i __A)8266{8267__builtin_ia32_pmovdw128mem_mask ((__v8hi *) __P, (__v4si) __A, __M);8268}82698270static __inline__ __m128i __DEFAULT_FN_ATTRS8271_mm256_cvtepi32_epi16 (__m256i __A)8272{8273return (__m128i) __builtin_ia32_pmovdw256_mask ((__v8si) __A,8274(__v8hi)_mm_setzero_si128 (),8275(__mmask8) -1);8276}82778278static __inline__ __m128i __DEFAULT_FN_ATTRS8279_mm256_mask_cvtepi32_epi16 (__m128i __O, __mmask8 __M, __m256i __A)8280{8281return (__m128i) __builtin_ia32_pmovdw256_mask ((__v8si) __A,8282(__v8hi) __O, __M);8283}82848285static __inline__ __m128i __DEFAULT_FN_ATTRS8286_mm256_maskz_cvtepi32_epi16 (__mmask8 __M, __m256i __A)8287{8288return (__m128i) __builtin_ia32_pmovdw256_mask ((__v8si) __A,8289(__v8hi) _mm_setzero_si128 (),8290__M);8291}82928293static __inline__ void __DEFAULT_FN_ATTRS8294_mm256_mask_cvtepi32_storeu_epi16 (void * __P, __mmask8 __M, __m256i __A)8295{8296__builtin_ia32_pmovdw256mem_mask ((__v8hi *) __P, (__v8si) __A, __M);8297}82988299static __inline__ __m128i __DEFAULT_FN_ATTRS8300_mm_cvtepi64_epi8 (__m128i __A)8301{8302return (__m128i) __builtin_ia32_pmovqb128_mask ((__v2di) __A,8303(__v16qi) _mm_undefined_si128(),8304(__mmask8) -1);8305}83068307static __inline__ __m128i __DEFAULT_FN_ATTRS8308_mm_mask_cvtepi64_epi8 (__m128i __O, __mmask8 __M, __m128i __A)8309{8310return (__m128i) __builtin_ia32_pmovqb128_mask ((__v2di) __A,8311(__v16qi) __O, __M);8312}83138314static __inline__ __m128i __DEFAULT_FN_ATTRS8315_mm_maskz_cvtepi64_epi8 (__mmask8 __M, __m128i __A)8316{8317return (__m128i) __builtin_ia32_pmovqb128_mask ((__v2di) __A,8318(__v16qi) _mm_setzero_si128 (),8319__M);8320}83218322static __inline__ void __DEFAULT_FN_ATTRS8323_mm_mask_cvtepi64_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)8324{8325__builtin_ia32_pmovqb128mem_mask ((__v16qi *) __P, (__v2di) __A, __M);8326}83278328static __inline__ __m128i __DEFAULT_FN_ATTRS8329_mm256_cvtepi64_epi8 (__m256i __A)8330{8331return (__m128i) __builtin_ia32_pmovqb256_mask ((__v4di) __A,8332(__v16qi) _mm_undefined_si128(),8333(__mmask8) -1);8334}83358336static __inline__ __m128i __DEFAULT_FN_ATTRS8337_mm256_mask_cvtepi64_epi8 (__m128i __O, __mmask8 __M, __m256i __A)8338{8339return (__m128i) __builtin_ia32_pmovqb256_mask ((__v4di) __A,8340(__v16qi) __O, __M);8341}83428343static __inline__ __m128i __DEFAULT_FN_ATTRS8344_mm256_maskz_cvtepi64_epi8 (__mmask8 __M, __m256i __A)8345{8346return (__m128i) __builtin_ia32_pmovqb256_mask ((__v4di) __A,8347(__v16qi) _mm_setzero_si128 (),8348__M);8349}83508351static __inline__ void __DEFAULT_FN_ATTRS8352_mm256_mask_cvtepi64_storeu_epi8 (void * __P, __mmask8 __M, __m256i __A)8353{8354__builtin_ia32_pmovqb256mem_mask ((__v16qi *) __P, (__v4di) __A, __M);8355}83568357static __inline__ __m128i __DEFAULT_FN_ATTRS8358_mm_cvtepi64_epi32 (__m128i __A)8359{8360return (__m128i) __builtin_ia32_pmovqd128_mask ((__v2di) __A,8361(__v4si)_mm_undefined_si128(),8362(__mmask8) -1);8363}83648365static __inline__ __m128i __DEFAULT_FN_ATTRS8366_mm_mask_cvtepi64_epi32 (__m128i __O, __mmask8 __M, __m128i __A)8367{8368return (__m128i) __builtin_ia32_pmovqd128_mask ((__v2di) __A,8369(__v4si) __O, __M);8370}83718372static __inline__ __m128i __DEFAULT_FN_ATTRS8373_mm_maskz_cvtepi64_epi32 (__mmask8 __M, __m128i __A)8374{8375return (__m128i) __builtin_ia32_pmovqd128_mask ((__v2di) __A,8376(__v4si) _mm_setzero_si128 (),8377__M);8378}83798380static __inline__ void __DEFAULT_FN_ATTRS8381_mm_mask_cvtepi64_storeu_epi32 (void * __P, __mmask8 __M, __m128i __A)8382{8383__builtin_ia32_pmovqd128mem_mask ((__v4si *) __P, (__v2di) __A, __M);8384}83858386static __inline__ __m128i __DEFAULT_FN_ATTRS8387_mm256_cvtepi64_epi32 (__m256i __A)8388{8389return (__m128i) __builtin_ia32_pmovqd256_mask ((__v4di) __A,8390(__v4si) _mm_undefined_si128(),8391(__mmask8) -1);8392}83938394static __inline__ __m128i __DEFAULT_FN_ATTRS8395_mm256_mask_cvtepi64_epi32 (__m128i __O, __mmask8 __M, __m256i __A)8396{8397return (__m128i) __builtin_ia32_pmovqd256_mask ((__v4di) __A,8398(__v4si) __O, __M);8399}84008401static __inline__ __m128i __DEFAULT_FN_ATTRS8402_mm256_maskz_cvtepi64_epi32 (__mmask8 __M, __m256i __A)8403{8404return (__m128i) __builtin_ia32_pmovqd256_mask ((__v4di) __A,8405(__v4si) _mm_setzero_si128 (),8406__M);8407}84088409static __inline__ void __DEFAULT_FN_ATTRS8410_mm256_mask_cvtepi64_storeu_epi32 (void * __P, __mmask8 __M, __m256i __A)8411{8412__builtin_ia32_pmovqd256mem_mask ((__v4si *) __P, (__v4di) __A, __M);8413}84148415static __inline__ __m128i __DEFAULT_FN_ATTRS8416_mm_cvtepi64_epi16 (__m128i __A)8417{8418return (__m128i) __builtin_ia32_pmovqw128_mask ((__v2di) __A,8419(__v8hi) _mm_undefined_si128(),8420(__mmask8) -1);8421}84228423static __inline__ __m128i __DEFAULT_FN_ATTRS8424_mm_mask_cvtepi64_epi16 (__m128i __O, __mmask8 __M, __m128i __A)8425{8426return (__m128i) __builtin_ia32_pmovqw128_mask ((__v2di) __A,8427(__v8hi)__O,8428__M);8429}84308431static __inline__ __m128i __DEFAULT_FN_ATTRS8432_mm_maskz_cvtepi64_epi16 (__mmask8 __M, __m128i __A)8433{8434return (__m128i) __builtin_ia32_pmovqw128_mask ((__v2di) __A,8435(__v8hi) _mm_setzero_si128 (),8436__M);8437}84388439static __inline__ void __DEFAULT_FN_ATTRS8440_mm_mask_cvtepi64_storeu_epi16 (void * __P, __mmask8 __M, __m128i __A)8441{8442__builtin_ia32_pmovqw128mem_mask ((__v8hi *) __P, (__v2di) __A, __M);8443}84448445static __inline__ __m128i __DEFAULT_FN_ATTRS8446_mm256_cvtepi64_epi16 (__m256i __A)8447{8448return (__m128i) __builtin_ia32_pmovqw256_mask ((__v4di) __A,8449(__v8hi)_mm_undefined_si128(),8450(__mmask8) -1);8451}84528453static __inline__ __m128i __DEFAULT_FN_ATTRS8454_mm256_mask_cvtepi64_epi16 (__m128i __O, __mmask8 __M, __m256i __A)8455{8456return (__m128i) __builtin_ia32_pmovqw256_mask ((__v4di) __A,8457(__v8hi) __O, __M);8458}84598460static __inline__ __m128i __DEFAULT_FN_ATTRS8461_mm256_maskz_cvtepi64_epi16 (__mmask8 __M, __m256i __A)8462{8463return (__m128i) __builtin_ia32_pmovqw256_mask ((__v4di) __A,8464(__v8hi) _mm_setzero_si128 (),8465__M);8466}84678468static __inline__ void __DEFAULT_FN_ATTRS8469_mm256_mask_cvtepi64_storeu_epi16 (void * __P, __mmask8 __M, __m256i __A)8470{8471__builtin_ia32_pmovqw256mem_mask ((__v8hi *) __P, (__v4di) __A, __M);8472}84738474#define _mm256_extractf32x4_ps(A, imm) __extension__ ({ \8475(__m128)__builtin_ia32_extractf32x4_256_mask((__v8sf)(__m256)(A), \8476(int)(imm), \8477(__v4sf)_mm_setzero_ps(), \8478(__mmask8)-1); })84798480#define _mm256_mask_extractf32x4_ps(W, U, A, imm) __extension__ ({ \8481(__m128)__builtin_ia32_extractf32x4_256_mask((__v8sf)(__m256)(A), \8482(int)(imm), \8483(__v4sf)(__m128)(W), \8484(__mmask8)(U)); })84858486#define _mm256_maskz_extractf32x4_ps(U, A, imm) __extension__ ({ \8487(__m128)__builtin_ia32_extractf32x4_256_mask((__v8sf)(__m256)(A), \8488(int)(imm), \8489(__v4sf)_mm_setzero_ps(), \8490(__mmask8)(U)); })84918492#define _mm256_extracti32x4_epi32(A, imm) __extension__ ({ \8493(__m128i)__builtin_ia32_extracti32x4_256_mask((__v8si)(__m256i)(A), \8494(int)(imm), \8495(__v4si)_mm_setzero_si128(), \8496(__mmask8)-1); })84978498#define _mm256_mask_extracti32x4_epi32(W, U, A, imm) __extension__ ({ \8499(__m128i)__builtin_ia32_extracti32x4_256_mask((__v8si)(__m256i)(A), \8500(int)(imm), \8501(__v4si)(__m128i)(W), \8502(__mmask8)(U)); })85038504#define _mm256_maskz_extracti32x4_epi32(U, A, imm) __extension__ ({ \8505(__m128i)__builtin_ia32_extracti32x4_256_mask((__v8si)(__m256i)(A), \8506(int)(imm), \8507(__v4si)_mm_setzero_si128(), \8508(__mmask8)(U)); })85098510#define _mm256_insertf32x4(A, B, imm) __extension__ ({ \8511(__m256)__builtin_ia32_insertf32x4_256_mask((__v8sf)(__m256)(A), \8512(__v4sf)(__m128)(B), (int)(imm), \8513(__v8sf)_mm256_setzero_ps(), \8514(__mmask8)-1); })85158516#define _mm256_mask_insertf32x4(W, U, A, B, imm) __extension__ ({ \8517(__m256)__builtin_ia32_insertf32x4_256_mask((__v8sf)(__m256)(A), \8518(__v4sf)(__m128)(B), (int)(imm), \8519(__v8sf)(__m256)(W), \8520(__mmask8)(U)); })85218522#define _mm256_maskz_insertf32x4(U, A, B, imm) __extension__ ({ \8523(__m256)__builtin_ia32_insertf32x4_256_mask((__v8sf)(__m256)(A), \8524(__v4sf)(__m128)(B), (int)(imm), \8525(__v8sf)_mm256_setzero_ps(), \8526(__mmask8)(U)); })85278528#define _mm256_inserti32x4(A, B, imm) __extension__ ({ \8529(__m256i)__builtin_ia32_inserti32x4_256_mask((__v8si)(__m256i)(A), \8530(__v4si)(__m128i)(B), \8531(int)(imm), \8532(__v8si)_mm256_setzero_si256(), \8533(__mmask8)-1); })85348535#define _mm256_mask_inserti32x4(W, U, A, B, imm) __extension__ ({ \8536(__m256i)__builtin_ia32_inserti32x4_256_mask((__v8si)(__m256i)(A), \8537(__v4si)(__m128i)(B), \8538(int)(imm), \8539(__v8si)(__m256i)(W), \8540(__mmask8)(U)); })85418542#define _mm256_maskz_inserti32x4(U, A, B, imm) __extension__ ({ \8543(__m256i)__builtin_ia32_inserti32x4_256_mask((__v8si)(__m256i)(A), \8544(__v4si)(__m128i)(B), \8545(int)(imm), \8546(__v8si)_mm256_setzero_si256(), \8547(__mmask8)(U)); })85488549#define _mm_getmant_pd(A, B, C) __extension__({\8550(__m128d)__builtin_ia32_getmantpd128_mask((__v2df)(__m128d)(A), \8551(int)(((C)<<2) | (B)), \8552(__v2df)_mm_setzero_pd(), \8553(__mmask8)-1); })85548555#define _mm_mask_getmant_pd(W, U, A, B, C) __extension__({\8556(__m128d)__builtin_ia32_getmantpd128_mask((__v2df)(__m128d)(A), \8557(int)(((C)<<2) | (B)), \8558(__v2df)(__m128d)(W), \8559(__mmask8)(U)); })85608561#define _mm_maskz_getmant_pd(U, A, B, C) __extension__({\8562(__m128d)__builtin_ia32_getmantpd128_mask((__v2df)(__m128d)(A), \8563(int)(((C)<<2) | (B)), \8564(__v2df)_mm_setzero_pd(), \8565(__mmask8)(U)); })85668567#define _mm256_getmant_pd(A, B, C) __extension__ ({ \8568(__m256d)__builtin_ia32_getmantpd256_mask((__v4df)(__m256d)(A), \8569(int)(((C)<<2) | (B)), \8570(__v4df)_mm256_setzero_pd(), \8571(__mmask8)-1); })85728573#define _mm256_mask_getmant_pd(W, U, A, B, C) __extension__ ({ \8574(__m256d)__builtin_ia32_getmantpd256_mask((__v4df)(__m256d)(A), \8575(int)(((C)<<2) | (B)), \8576(__v4df)(__m256d)(W), \8577(__mmask8)(U)); })85788579#define _mm256_maskz_getmant_pd(U, A, B, C) __extension__ ({ \8580(__m256d)__builtin_ia32_getmantpd256_mask((__v4df)(__m256d)(A), \8581(int)(((C)<<2) | (B)), \8582(__v4df)_mm256_setzero_pd(), \8583(__mmask8)(U)); })85848585#define _mm_getmant_ps(A, B, C) __extension__ ({ \8586(__m128)__builtin_ia32_getmantps128_mask((__v4sf)(__m128)(A), \8587(int)(((C)<<2) | (B)), \8588(__v4sf)_mm_setzero_ps(), \8589(__mmask8)-1); })85908591#define _mm_mask_getmant_ps(W, U, A, B, C) __extension__ ({ \8592(__m128)__builtin_ia32_getmantps128_mask((__v4sf)(__m128)(A), \8593(int)(((C)<<2) | (B)), \8594(__v4sf)(__m128)(W), \8595(__mmask8)(U)); })85968597#define _mm_maskz_getmant_ps(U, A, B, C) __extension__ ({ \8598(__m128)__builtin_ia32_getmantps128_mask((__v4sf)(__m128)(A), \8599(int)(((C)<<2) | (B)), \8600(__v4sf)_mm_setzero_ps(), \8601(__mmask8)(U)); })86028603#define _mm256_getmant_ps(A, B, C) __extension__ ({ \8604(__m256)__builtin_ia32_getmantps256_mask((__v8sf)(__m256)(A), \8605(int)(((C)<<2) | (B)), \8606(__v8sf)_mm256_setzero_ps(), \8607(__mmask8)-1); })86088609#define _mm256_mask_getmant_ps(W, U, A, B, C) __extension__ ({ \8610(__m256)__builtin_ia32_getmantps256_mask((__v8sf)(__m256)(A), \8611(int)(((C)<<2) | (B)), \8612(__v8sf)(__m256)(W), \8613(__mmask8)(U)); })86148615#define _mm256_maskz_getmant_ps(U, A, B, C) __extension__ ({ \8616(__m256)__builtin_ia32_getmantps256_mask((__v8sf)(__m256)(A), \8617(int)(((C)<<2) | (B)), \8618(__v8sf)_mm256_setzero_ps(), \8619(__mmask8)(U)); })86208621#define _mm_mmask_i64gather_pd(v1_old, mask, index, addr, scale) __extension__ ({\8622(__m128d)__builtin_ia32_gather3div2df((__v2df)(__m128d)(v1_old), \8623(double const *)(addr), \8624(__v2di)(__m128i)(index), \8625(__mmask8)(mask), (int)(scale)); })86268627#define _mm_mmask_i64gather_epi64(v1_old, mask, index, addr, scale) __extension__ ({\8628(__m128i)__builtin_ia32_gather3div2di((__v2di)(__m128i)(v1_old), \8629(long long const *)(addr), \8630(__v2di)(__m128i)(index), \8631(__mmask8)(mask), (int)(scale)); })86328633#define _mm256_mmask_i64gather_pd(v1_old, mask, index, addr, scale) __extension__ ({\8634(__m256d)__builtin_ia32_gather3div4df((__v4df)(__m256d)(v1_old), \8635(double const *)(addr), \8636(__v4di)(__m256i)(index), \8637(__mmask8)(mask), (int)(scale)); })86388639#define _mm256_mmask_i64gather_epi64(v1_old, mask, index, addr, scale) __extension__ ({\8640(__m256i)__builtin_ia32_gather3div4di((__v4di)(__m256i)(v1_old), \8641(long long const *)(addr), \8642(__v4di)(__m256i)(index), \8643(__mmask8)(mask), (int)(scale)); })86448645#define _mm_mmask_i64gather_ps(v1_old, mask, index, addr, scale) __extension__ ({\8646(__m128)__builtin_ia32_gather3div4sf((__v4sf)(__m128)(v1_old), \8647(float const *)(addr), \8648(__v2di)(__m128i)(index), \8649(__mmask8)(mask), (int)(scale)); })86508651#define _mm_mmask_i64gather_epi32(v1_old, mask, index, addr, scale) __extension__ ({\8652(__m128i)__builtin_ia32_gather3div4si((__v4si)(__m128i)(v1_old), \8653(int const *)(addr), \8654(__v2di)(__m128i)(index), \8655(__mmask8)(mask), (int)(scale)); })86568657#define _mm256_mmask_i64gather_ps(v1_old, mask, index, addr, scale) __extension__ ({\8658(__m128)__builtin_ia32_gather3div8sf((__v4sf)(__m128)(v1_old), \8659(float const *)(addr), \8660(__v4di)(__m256i)(index), \8661(__mmask8)(mask), (int)(scale)); })86628663#define _mm256_mmask_i64gather_epi32(v1_old, mask, index, addr, scale) __extension__ ({\8664(__m128i)__builtin_ia32_gather3div8si((__v4si)(__m128i)(v1_old), \8665(int const *)(addr), \8666(__v4di)(__m256i)(index), \8667(__mmask8)(mask), (int)(scale)); })86688669#define _mm_mmask_i32gather_pd(v1_old, mask, index, addr, scale) __extension__ ({\8670(__m128d)__builtin_ia32_gather3siv2df((__v2df)(__m128d)(v1_old), \8671(double const *)(addr), \8672(__v4si)(__m128i)(index), \8673(__mmask8)(mask), (int)(scale)); })86748675#define _mm_mmask_i32gather_epi64(v1_old, mask, index, addr, scale) __extension__ ({\8676(__m128i)__builtin_ia32_gather3siv2di((__v2di)(__m128i)(v1_old), \8677(long long const *)(addr), \8678(__v4si)(__m128i)(index), \8679(__mmask8)(mask), (int)(scale)); })86808681#define _mm256_mmask_i32gather_pd(v1_old, mask, index, addr, scale) __extension__ ({\8682(__m256d)__builtin_ia32_gather3siv4df((__v4df)(__m256d)(v1_old), \8683(double const *)(addr), \8684(__v4si)(__m128i)(index), \8685(__mmask8)(mask), (int)(scale)); })86868687#define _mm256_mmask_i32gather_epi64(v1_old, mask, index, addr, scale) __extension__ ({\8688(__m256i)__builtin_ia32_gather3siv4di((__v4di)(__m256i)(v1_old), \8689(long long const *)(addr), \8690(__v4si)(__m128i)(index), \8691(__mmask8)(mask), (int)(scale)); })86928693#define _mm_mmask_i32gather_ps(v1_old, mask, index, addr, scale) __extension__ ({\8694(__m128)__builtin_ia32_gather3siv4sf((__v4sf)(__m128)(v1_old), \8695(float const *)(addr), \8696(__v4si)(__m128i)(index), \8697(__mmask8)(mask), (int)(scale)); })86988699#define _mm_mmask_i32gather_epi32(v1_old, mask, index, addr, scale) __extension__ ({\8700(__m128i)__builtin_ia32_gather3siv4si((__v4si)(__m128i)(v1_old), \8701(int const *)(addr), \8702(__v4si)(__m128i)(index), \8703(__mmask8)(mask), (int)(scale)); })87048705#define _mm256_mmask_i32gather_ps(v1_old, mask, index, addr, scale) __extension__ ({\8706(__m256)__builtin_ia32_gather3siv8sf((__v8sf)(__m256)(v1_old), \8707(float const *)(addr), \8708(__v8si)(__m256i)(index), \8709(__mmask8)(mask), (int)(scale)); })87108711#define _mm256_mmask_i32gather_epi32(v1_old, mask, index, addr, scale) __extension__ ({\8712(__m256i)__builtin_ia32_gather3siv8si((__v8si)(__m256i)(v1_old), \8713(int const *)(addr), \8714(__v8si)(__m256i)(index), \8715(__mmask8)(mask), (int)(scale)); })87168717#define _mm256_permutex_pd(X, C) __extension__ ({ \8718(__m256d)__builtin_shufflevector((__v4df)(__m256d)(X), \8719(__v4df)_mm256_undefined_pd(), \8720((C) >> 0) & 0x3, ((C) >> 2) & 0x3, \8721((C) >> 4) & 0x3, ((C) >> 6) & 0x3); })87228723#define _mm256_mask_permutex_pd(W, U, X, C) __extension__ ({ \8724(__m256d)__builtin_ia32_selectpd_256((__mmask8)(U), \8725(__v4df)_mm256_permutex_pd((X), (C)), \8726(__v4df)(__m256d)(W)); })87278728#define _mm256_maskz_permutex_pd(U, X, C) __extension__ ({ \8729(__m256d)__builtin_ia32_selectpd_256((__mmask8)(U), \8730(__v4df)_mm256_permutex_pd((X), (C)), \8731(__v4df)_mm256_setzero_pd()); })87328733#define _mm256_permutex_epi64(X, C) __extension__ ({ \8734(__m256i)__builtin_shufflevector((__v4di)(__m256i)(X), \8735(__v4di)_mm256_undefined_si256(), \8736((C) >> 0) & 0x3, ((C) >> 2) & 0x3, \8737((C) >> 4) & 0x3, ((C) >> 6) & 0x3); })87388739#define _mm256_mask_permutex_epi64(W, U, X, C) __extension__ ({ \8740(__m256i)__builtin_ia32_selectq_256((__mmask8)(U), \8741(__v4di)_mm256_permutex_epi64((X), (C)), \8742(__v4di)(__m256i)(W)); })87438744#define _mm256_maskz_permutex_epi64(U, X, C) __extension__ ({ \8745(__m256i)__builtin_ia32_selectq_256((__mmask8)(U), \8746(__v4di)_mm256_permutex_epi64((X), (C)), \8747(__v4di)_mm256_setzero_si256()); })87488749static __inline__ __m256d __DEFAULT_FN_ATTRS8750_mm256_permutexvar_pd (__m256i __X, __m256d __Y)8751{8752return (__m256d) __builtin_ia32_permvardf256_mask ((__v4df) __Y,8753(__v4di) __X,8754(__v4df) _mm256_undefined_si256 (),8755(__mmask8) -1);8756}87578758static __inline__ __m256d __DEFAULT_FN_ATTRS8759_mm256_mask_permutexvar_pd (__m256d __W, __mmask8 __U, __m256i __X,8760__m256d __Y)8761{8762return (__m256d) __builtin_ia32_permvardf256_mask ((__v4df) __Y,8763(__v4di) __X,8764(__v4df) __W,8765(__mmask8) __U);8766}87678768static __inline__ __m256d __DEFAULT_FN_ATTRS8769_mm256_maskz_permutexvar_pd (__mmask8 __U, __m256i __X, __m256d __Y)8770{8771return (__m256d) __builtin_ia32_permvardf256_mask ((__v4df) __Y,8772(__v4di) __X,8773(__v4df) _mm256_setzero_pd (),8774(__mmask8) __U);8775}87768777static __inline__ __m256i __DEFAULT_FN_ATTRS8778_mm256_maskz_permutexvar_epi64 (__mmask8 __M, __m256i __X, __m256i __Y)8779{8780return (__m256i) __builtin_ia32_permvardi256_mask ((__v4di) __Y,8781(__v4di) __X,8782(__v4di) _mm256_setzero_si256 (),8783(__mmask8) __M);8784}87858786static __inline__ __m256i __DEFAULT_FN_ATTRS8787_mm256_permutexvar_epi64 ( __m256i __X, __m256i __Y)8788{8789return (__m256i) __builtin_ia32_permvardi256_mask ((__v4di) __Y,8790(__v4di) __X,8791(__v4di) _mm256_undefined_si256 (),8792(__mmask8) -1);8793}87948795static __inline__ __m256i __DEFAULT_FN_ATTRS8796_mm256_mask_permutexvar_epi64 (__m256i __W, __mmask8 __M, __m256i __X,8797__m256i __Y)8798{8799return (__m256i) __builtin_ia32_permvardi256_mask ((__v4di) __Y,8800(__v4di) __X,8801(__v4di) __W,8802__M);8803}88048805static __inline__ __m256 __DEFAULT_FN_ATTRS8806_mm256_mask_permutexvar_ps (__m256 __W, __mmask8 __U, __m256i __X,8807__m256 __Y)8808{8809return (__m256) __builtin_ia32_permvarsf256_mask ((__v8sf) __Y,8810(__v8si) __X,8811(__v8sf) __W,8812(__mmask8) __U);8813}88148815static __inline__ __m256 __DEFAULT_FN_ATTRS8816_mm256_maskz_permutexvar_ps (__mmask8 __U, __m256i __X, __m256 __Y)8817{8818return (__m256) __builtin_ia32_permvarsf256_mask ((__v8sf) __Y,8819(__v8si) __X,8820(__v8sf) _mm256_setzero_ps (),8821(__mmask8) __U);8822}88238824static __inline__ __m256 __DEFAULT_FN_ATTRS8825_mm256_permutexvar_ps (__m256i __X, __m256 __Y)8826{8827return (__m256) __builtin_ia32_permvarsf256_mask ((__v8sf) __Y,8828(__v8si) __X,8829(__v8sf) _mm256_undefined_si256 (),8830(__mmask8) -1);8831}88328833static __inline__ __m256i __DEFAULT_FN_ATTRS8834_mm256_maskz_permutexvar_epi32 (__mmask8 __M, __m256i __X, __m256i __Y)8835{8836return (__m256i) __builtin_ia32_permvarsi256_mask ((__v8si) __Y,8837(__v8si) __X,8838(__v8si) _mm256_setzero_si256 (),8839__M);8840}88418842static __inline__ __m256i __DEFAULT_FN_ATTRS8843_mm256_mask_permutexvar_epi32 (__m256i __W, __mmask8 __M, __m256i __X,8844__m256i __Y)8845{8846return (__m256i) __builtin_ia32_permvarsi256_mask ((__v8si) __Y,8847(__v8si) __X,8848(__v8si) __W,8849(__mmask8) __M);8850}88518852static __inline__ __m256i __DEFAULT_FN_ATTRS8853_mm256_permutexvar_epi32 (__m256i __X, __m256i __Y)8854{8855return (__m256i) __builtin_ia32_permvarsi256_mask ((__v8si) __Y,8856(__v8si) __X,8857(__v8si) _mm256_undefined_si256(),8858(__mmask8) -1);8859}88608861#define _mm_alignr_epi32(A, B, imm) __extension__ ({ \8862(__m128i)__builtin_ia32_alignd128_mask((__v4si)(__m128i)(A), \8863(__v4si)(__m128i)(B), (int)(imm), \8864(__v4si)_mm_undefined_si128(), \8865(__mmask8)-1); })88668867#define _mm_mask_alignr_epi32(W, U, A, B, imm) __extension__ ({ \8868(__m128i)__builtin_ia32_alignd128_mask((__v4si)(__m128i)(A), \8869(__v4si)(__m128i)(B), (int)(imm), \8870(__v4si)(__m128i)(W), \8871(__mmask8)(U)); })88728873#define _mm_maskz_alignr_epi32(U, A, B, imm) __extension__ ({ \8874(__m128i)__builtin_ia32_alignd128_mask((__v4si)(__m128i)(A), \8875(__v4si)(__m128i)(B), (int)(imm), \8876(__v4si)_mm_setzero_si128(), \8877(__mmask8)(U)); })88788879#define _mm256_alignr_epi32(A, B, imm) __extension__ ({ \8880(__m256i)__builtin_ia32_alignd256_mask((__v8si)(__m256i)(A), \8881(__v8si)(__m256i)(B), (int)(imm), \8882(__v8si)_mm256_undefined_si256(), \8883(__mmask8)-1); })88848885#define _mm256_mask_alignr_epi32(W, U, A, B, imm) __extension__ ({ \8886(__m256i)__builtin_ia32_alignd256_mask((__v8si)(__m256i)(A), \8887(__v8si)(__m256i)(B), (int)(imm), \8888(__v8si)(__m256i)(W), \8889(__mmask8)(U)); })88908891#define _mm256_maskz_alignr_epi32(U, A, B, imm) __extension__ ({ \8892(__m256i)__builtin_ia32_alignd256_mask((__v8si)(__m256i)(A), \8893(__v8si)(__m256i)(B), (int)(imm), \8894(__v8si)_mm256_setzero_si256(), \8895(__mmask8)(U)); })88968897#define _mm_alignr_epi64(A, B, imm) __extension__ ({ \8898(__m128i)__builtin_ia32_alignq128_mask((__v2di)(__m128i)(A), \8899(__v2di)(__m128i)(B), (int)(imm), \8900(__v2di)_mm_setzero_di(), \8901(__mmask8)-1); })89028903#define _mm_mask_alignr_epi64(W, U, A, B, imm) __extension__ ({ \8904(__m128i)__builtin_ia32_alignq128_mask((__v2di)(__m128i)(A), \8905(__v2di)(__m128i)(B), (int)(imm), \8906(__v2di)(__m128i)(W), \8907(__mmask8)(U)); })89088909#define _mm_maskz_alignr_epi64(U, A, B, imm) __extension__ ({ \8910(__m128i)__builtin_ia32_alignq128_mask((__v2di)(__m128i)(A), \8911(__v2di)(__m128i)(B), (int)(imm), \8912(__v2di)_mm_setzero_di(), \8913(__mmask8)(U)); })89148915#define _mm256_alignr_epi64(A, B, imm) __extension__ ({ \8916(__m256i)__builtin_ia32_alignq256_mask((__v4di)(__m256i)(A), \8917(__v4di)(__m256i)(B), (int)(imm), \8918(__v4di)_mm256_undefined_pd(), \8919(__mmask8)-1); })89208921#define _mm256_mask_alignr_epi64(W, U, A, B, imm) __extension__ ({ \8922(__m256i)__builtin_ia32_alignq256_mask((__v4di)(__m256i)(A), \8923(__v4di)(__m256i)(B), (int)(imm), \8924(__v4di)(__m256i)(W), \8925(__mmask8)(U)); })89268927#define _mm256_maskz_alignr_epi64(U, A, B, imm) __extension__ ({ \8928(__m256i)__builtin_ia32_alignq256_mask((__v4di)(__m256i)(A), \8929(__v4di)(__m256i)(B), (int)(imm), \8930(__v4di)_mm256_setzero_si256(), \8931(__mmask8)(U)); })89328933static __inline__ __m128 __DEFAULT_FN_ATTRS8934_mm_mask_movehdup_ps (__m128 __W, __mmask8 __U, __m128 __A)8935{8936return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,8937(__v4sf)_mm_movehdup_ps(__A),8938(__v4sf)__W);8939}89408941static __inline__ __m128 __DEFAULT_FN_ATTRS8942_mm_maskz_movehdup_ps (__mmask8 __U, __m128 __A)8943{8944return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,8945(__v4sf)_mm_movehdup_ps(__A),8946(__v4sf)_mm_setzero_ps());8947}89488949static __inline__ __m256 __DEFAULT_FN_ATTRS8950_mm256_mask_movehdup_ps (__m256 __W, __mmask8 __U, __m256 __A)8951{8952return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,8953(__v8sf)_mm256_movehdup_ps(__A),8954(__v8sf)__W);8955}89568957static __inline__ __m256 __DEFAULT_FN_ATTRS8958_mm256_maskz_movehdup_ps (__mmask8 __U, __m256 __A)8959{8960return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,8961(__v8sf)_mm256_movehdup_ps(__A),8962(__v8sf)_mm256_setzero_ps());8963}89648965static __inline__ __m128 __DEFAULT_FN_ATTRS8966_mm_mask_moveldup_ps (__m128 __W, __mmask8 __U, __m128 __A)8967{8968return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,8969(__v4sf)_mm_moveldup_ps(__A),8970(__v4sf)__W);8971}89728973static __inline__ __m128 __DEFAULT_FN_ATTRS8974_mm_maskz_moveldup_ps (__mmask8 __U, __m128 __A)8975{8976return (__m128)__builtin_ia32_selectps_128((__mmask8)__U,8977(__v4sf)_mm_moveldup_ps(__A),8978(__v4sf)_mm_setzero_ps());8979}89808981static __inline__ __m256 __DEFAULT_FN_ATTRS8982_mm256_mask_moveldup_ps (__m256 __W, __mmask8 __U, __m256 __A)8983{8984return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,8985(__v8sf)_mm256_moveldup_ps(__A),8986(__v8sf)__W);8987}89888989static __inline__ __m256 __DEFAULT_FN_ATTRS8990_mm256_maskz_moveldup_ps (__mmask8 __U, __m256 __A)8991{8992return (__m256)__builtin_ia32_selectps_256((__mmask8)__U,8993(__v8sf)_mm256_moveldup_ps(__A),8994(__v8sf)_mm256_setzero_ps());8995}89968997#define _mm256_mask_shuffle_epi32(W, U, A, I) __extension__({\8998(__m256i)__builtin_ia32_selectd_256((__mmask8)(U), \8999(__v8si)_mm256_shuffle_epi32((A), (I)), \9000(__v8si)(__m256i)(W)); })90019002#define _mm256_maskz_shuffle_epi32(U, A, I) __extension__({\9003(__m256i)__builtin_ia32_selectd_256((__mmask8)(U), \9004(__v8si)_mm256_shuffle_epi32((A), (I)), \9005(__v8si)_mm256_setzero_si256()); })90069007#define _mm_mask_shuffle_epi32(W, U, A, I) __extension__({\9008(__m128i)__builtin_ia32_selectd_128((__mmask8)(U), \9009(__v4si)_mm_shuffle_epi32((A), (I)), \9010(__v4si)(__m128i)(W)); })90119012#define _mm_maskz_shuffle_epi32(U, A, I) __extension__({\9013(__m128i)__builtin_ia32_selectd_128((__mmask8)(U), \9014(__v4si)_mm_shuffle_epi32((A), (I)), \9015(__v4si)_mm_setzero_si128()); })90169017static __inline__ __m128d __DEFAULT_FN_ATTRS9018_mm_mask_mov_pd (__m128d __W, __mmask8 __U, __m128d __A)9019{9020return (__m128d) __builtin_ia32_selectpd_128 ((__mmask8) __U,9021(__v2df) __A,9022(__v2df) __W);9023}90249025static __inline__ __m128d __DEFAULT_FN_ATTRS9026_mm_maskz_mov_pd (__mmask8 __U, __m128d __A)9027{9028return (__m128d) __builtin_ia32_selectpd_128 ((__mmask8) __U,9029(__v2df) __A,9030(__v2df) _mm_setzero_pd ());9031}90329033static __inline__ __m256d __DEFAULT_FN_ATTRS9034_mm256_mask_mov_pd (__m256d __W, __mmask8 __U, __m256d __A)9035{9036return (__m256d) __builtin_ia32_selectpd_256 ((__mmask8) __U,9037(__v4df) __A,9038(__v4df) __W);9039}90409041static __inline__ __m256d __DEFAULT_FN_ATTRS9042_mm256_maskz_mov_pd (__mmask8 __U, __m256d __A)9043{9044return (__m256d) __builtin_ia32_selectpd_256 ((__mmask8) __U,9045(__v4df) __A,9046(__v4df) _mm256_setzero_pd ());9047}90489049static __inline__ __m128 __DEFAULT_FN_ATTRS9050_mm_mask_mov_ps (__m128 __W, __mmask8 __U, __m128 __A)9051{9052return (__m128) __builtin_ia32_selectps_128 ((__mmask8) __U,9053(__v4sf) __A,9054(__v4sf) __W);9055}90569057static __inline__ __m128 __DEFAULT_FN_ATTRS9058_mm_maskz_mov_ps (__mmask8 __U, __m128 __A)9059{9060return (__m128) __builtin_ia32_selectps_128 ((__mmask8) __U,9061(__v4sf) __A,9062(__v4sf) _mm_setzero_ps ());9063}90649065static __inline__ __m256 __DEFAULT_FN_ATTRS9066_mm256_mask_mov_ps (__m256 __W, __mmask8 __U, __m256 __A)9067{9068return (__m256) __builtin_ia32_selectps_256 ((__mmask8) __U,9069(__v8sf) __A,9070(__v8sf) __W);9071}90729073static __inline__ __m256 __DEFAULT_FN_ATTRS9074_mm256_maskz_mov_ps (__mmask8 __U, __m256 __A)9075{9076return (__m256) __builtin_ia32_selectps_256 ((__mmask8) __U,9077(__v8sf) __A,9078(__v8sf) _mm256_setzero_ps ());9079}90809081static __inline__ __m128 __DEFAULT_FN_ATTRS9082_mm_mask_cvtph_ps (__m128 __W, __mmask8 __U, __m128i __A)9083{9084return (__m128) __builtin_ia32_vcvtph2ps_mask ((__v8hi) __A,9085(__v4sf) __W,9086(__mmask8) __U);9087}90889089static __inline__ __m128 __DEFAULT_FN_ATTRS9090_mm_maskz_cvtph_ps (__mmask8 __U, __m128i __A)9091{9092return (__m128) __builtin_ia32_vcvtph2ps_mask ((__v8hi) __A,9093(__v4sf)9094_mm_setzero_ps (),9095(__mmask8) __U);9096}90979098static __inline__ __m256 __DEFAULT_FN_ATTRS9099_mm256_mask_cvtph_ps (__m256 __W, __mmask8 __U, __m128i __A)9100{9101return (__m256) __builtin_ia32_vcvtph2ps256_mask ((__v8hi) __A,9102(__v8sf) __W,9103(__mmask8) __U);9104}91059106static __inline__ __m256 __DEFAULT_FN_ATTRS9107_mm256_maskz_cvtph_ps (__mmask8 __U, __m128i __A)9108{9109return (__m256) __builtin_ia32_vcvtph2ps256_mask ((__v8hi) __A,9110(__v8sf)9111_mm256_setzero_ps (),9112(__mmask8) __U);9113}91149115static __inline __m128i __DEFAULT_FN_ATTRS9116_mm_mask_cvtps_ph (__m128i __W, __mmask8 __U, __m128 __A)9117{9118return (__m128i) __builtin_ia32_vcvtps2ph_mask ((__v4sf) __A, _MM_FROUND_CUR_DIRECTION,9119(__v8hi) __W,9120(__mmask8) __U);9121}91229123static __inline __m128i __DEFAULT_FN_ATTRS9124_mm_maskz_cvtps_ph (__mmask8 __U, __m128 __A)9125{9126return (__m128i) __builtin_ia32_vcvtps2ph_mask ((__v4sf) __A, _MM_FROUND_CUR_DIRECTION,9127(__v8hi) _mm_setzero_si128 (),9128(__mmask8) __U);9129}91309131#define _mm_mask_cvt_roundps_ph(W, U, A, I) __extension__ ({ \9132(__m128i)__builtin_ia32_vcvtps2ph_mask((__v4sf)(__m128)(A), (int)(I), \9133(__v8hi)(__m128i)(W), \9134(__mmask8)(U)); })91359136#define _mm_maskz_cvt_roundps_ph(U, A, I) __extension__ ({ \9137(__m128i)__builtin_ia32_vcvtps2ph_mask((__v4sf)(__m128)(A), (int)(I), \9138(__v8hi)_mm_setzero_si128(), \9139(__mmask8)(U)); })91409141static __inline __m128i __DEFAULT_FN_ATTRS9142_mm256_mask_cvtps_ph (__m128i __W, __mmask8 __U, __m256 __A)9143{9144return (__m128i) __builtin_ia32_vcvtps2ph256_mask ((__v8sf) __A, _MM_FROUND_CUR_DIRECTION,9145(__v8hi) __W,9146(__mmask8) __U);9147}91489149static __inline __m128i __DEFAULT_FN_ATTRS9150_mm256_maskz_cvtps_ph ( __mmask8 __U, __m256 __A)9151{9152return (__m128i) __builtin_ia32_vcvtps2ph256_mask ((__v8sf) __A, _MM_FROUND_CUR_DIRECTION,9153(__v8hi) _mm_setzero_si128(),9154(__mmask8) __U);9155}9156#define _mm256_mask_cvt_roundps_ph(W, U, A, I) __extension__ ({ \9157(__m128i)__builtin_ia32_vcvtps2ph256_mask((__v8sf)(__m256)(A), (int)(I), \9158(__v8hi)(__m128i)(W), \9159(__mmask8)(U)); })91609161#define _mm256_maskz_cvt_roundps_ph(U, A, I) __extension__ ({ \9162(__m128i)__builtin_ia32_vcvtps2ph256_mask((__v8sf)(__m256)(A), (int)(I), \9163(__v8hi)_mm_setzero_si128(), \9164(__mmask8)(U)); })916591669167#undef __DEFAULT_FN_ATTRS91689169#endif /* __AVX512VLINTRIN_H */917091719172