Lines Matching defs:__M

546 _mm_maskz_packs_epi32(__mmask8 __M, __m128i __A, __m128i __B) {
547 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
553 _mm_mask_packs_epi32(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
555 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
561 _mm256_maskz_packs_epi32(__mmask16 __M, __m256i __A, __m256i __B)
563 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
569 _mm256_mask_packs_epi32(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
571 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
577 _mm_maskz_packs_epi16(__mmask16 __M, __m128i __A, __m128i __B)
579 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
585 _mm_mask_packs_epi16(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
587 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
593 _mm256_maskz_packs_epi16(__mmask32 __M, __m256i __A, __m256i __B)
595 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
601 _mm256_mask_packs_epi16(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
603 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
609 _mm_maskz_packus_epi32(__mmask8 __M, __m128i __A, __m128i __B)
611 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
617 _mm_mask_packus_epi32(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
619 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
625 _mm256_maskz_packus_epi32(__mmask16 __M, __m256i __A, __m256i __B)
627 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
633 _mm256_mask_packus_epi32(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
635 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
641 _mm_maskz_packus_epi16(__mmask16 __M, __m128i __A, __m128i __B)
643 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
649 _mm_mask_packus_epi16(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
651 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
657 _mm256_maskz_packus_epi16(__mmask32 __M, __m256i __A, __m256i __B)
659 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
665 _mm256_mask_packus_epi16(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
667 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
865 _mm_maskz_max_epi8(__mmask16 __M, __m128i __A, __m128i __B)
867 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
873 _mm_mask_max_epi8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
875 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
881 _mm256_maskz_max_epi8(__mmask32 __M, __m256i __A, __m256i __B)
883 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
889 _mm256_mask_max_epi8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
891 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
897 _mm_maskz_max_epi16(__mmask8 __M, __m128i __A, __m128i __B)
899 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
905 _mm_mask_max_epi16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
907 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
913 _mm256_maskz_max_epi16(__mmask16 __M, __m256i __A, __m256i __B)
915 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
921 _mm256_mask_max_epi16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
923 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
929 _mm_maskz_max_epu8(__mmask16 __M, __m128i __A, __m128i __B)
931 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
937 _mm_mask_max_epu8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
939 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
945 _mm256_maskz_max_epu8 (__mmask32 __M, __m256i __A, __m256i __B)
947 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
953 _mm256_mask_max_epu8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
955 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
961 _mm_maskz_max_epu16(__mmask8 __M, __m128i __A, __m128i __B)
963 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
969 _mm_mask_max_epu16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
971 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
977 _mm256_maskz_max_epu16(__mmask16 __M, __m256i __A, __m256i __B)
979 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
985 _mm256_mask_max_epu16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
987 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
993 _mm_maskz_min_epi8(__mmask16 __M, __m128i __A, __m128i __B)
995 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
1001 _mm_mask_min_epi8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
1003 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
1009 _mm256_maskz_min_epi8(__mmask32 __M, __m256i __A, __m256i __B)
1011 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
1017 _mm256_mask_min_epi8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
1019 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
1025 _mm_maskz_min_epi16(__mmask8 __M, __m128i __A, __m128i __B)
1027 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
1033 _mm_mask_min_epi16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
1035 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
1041 _mm256_maskz_min_epi16(__mmask16 __M, __m256i __A, __m256i __B)
1043 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
1049 _mm256_mask_min_epi16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
1051 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
1057 _mm_maskz_min_epu8(__mmask16 __M, __m128i __A, __m128i __B)
1059 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
1065 _mm_mask_min_epu8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
1067 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
1073 _mm256_maskz_min_epu8 (__mmask32 __M, __m256i __A, __m256i __B)
1075 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
1081 _mm256_mask_min_epu8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
1083 return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
1089 _mm_maskz_min_epu16(__mmask8 __M, __m128i __A, __m128i __B)
1091 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
1097 _mm_mask_min_epu16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
1099 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
1105 _mm256_maskz_min_epu16(__mmask16 __M, __m256i __A, __m256i __B)
1107 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
1113 _mm256_mask_min_epu16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
1115 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
1413 _mm_mask_cvtsepi16_epi8 (__m128i __O, __mmask8 __M, __m128i __A) {
1416 __M);
1420 _mm_maskz_cvtsepi16_epi8 (__mmask8 __M, __m128i __A) {
1423 __M);
1434 _mm256_mask_cvtsepi16_epi8 (__m128i __O, __mmask16 __M, __m256i __A) {
1437 __M);
1441 _mm256_maskz_cvtsepi16_epi8 (__mmask16 __M, __m256i __A) {
1444 __M);
1455 _mm_mask_cvtusepi16_epi8 (__m128i __O, __mmask8 __M, __m128i __A) {
1458 __M);
1462 _mm_maskz_cvtusepi16_epi8 (__mmask8 __M, __m128i __A) {
1465 __M);
1476 _mm256_mask_cvtusepi16_epi8 (__m128i __O, __mmask16 __M, __m256i __A) {
1479 __M);
1483 _mm256_maskz_cvtusepi16_epi8 (__mmask16 __M, __m256i __A) {
1486 __M);
1498 _mm_mask_cvtepi16_epi8 (__m128i __O, __mmask8 __M, __m128i __A) {
1501 __M);
1505 _mm_maskz_cvtepi16_epi8 (__mmask8 __M, __m128i __A) {
1508 __M);
1512 _mm_mask_cvtepi16_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)
1514 __builtin_ia32_pmovwb128mem_mask ((__v16qi *) __P, (__v8hi) __A, __M);
1519 _mm_mask_cvtsepi16_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)
1521 __builtin_ia32_pmovswb128mem_mask ((__v16qi *) __P, (__v8hi) __A, __M);
1525 _mm_mask_cvtusepi16_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)
1527 __builtin_ia32_pmovuswb128mem_mask ((__v16qi *) __P, (__v8hi) __A, __M);
1536 _mm256_mask_cvtepi16_epi8 (__m128i __O, __mmask16 __M, __m256i __A) {
1537 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
1543 _mm256_maskz_cvtepi16_epi8 (__mmask16 __M, __m256i __A) {
1544 return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
1550 _mm256_mask_cvtepi16_storeu_epi8 (void * __P, __mmask16 __M, __m256i __A)
1552 __builtin_ia32_pmovwb256mem_mask ((__v16qi *) __P, (__v16hi) __A, __M);
1556 _mm256_mask_cvtsepi16_storeu_epi8 (void * __P, __mmask16 __M, __m256i __A)
1558 __builtin_ia32_pmovswb256mem_mask ((__v16qi *) __P, (__v16hi) __A, __M);
1562 _mm256_mask_cvtusepi16_storeu_epi8 (void * __P, __mmask16 __M, __m256i __A)
1564 __builtin_ia32_pmovuswb256mem_mask ((__v16qi*) __P, (__v16hi) __A, __M);
2263 _mm_mask_set1_epi8 (__m128i __O, __mmask16 __M, char __A)
2265 return (__m128i) __builtin_ia32_selectb_128(__M,
2271 _mm_maskz_set1_epi8 (__mmask16 __M, char __A)
2273 return (__m128i) __builtin_ia32_selectb_128(__M,
2279 _mm256_mask_set1_epi8 (__m256i __O, __mmask32 __M, char __A)
2281 return (__m256i) __builtin_ia32_selectb_256(__M,
2287 _mm256_maskz_set1_epi8 (__mmask32 __M, char __A)
2289 return (__m256i) __builtin_ia32_selectb_256(__M,
2622 _mm_mask_broadcastb_epi8 (__m128i __O, __mmask16 __M, __m128i __A)
2624 return (__m128i)__builtin_ia32_selectb_128(__M,
2630 _mm_maskz_broadcastb_epi8 (__mmask16 __M, __m128i __A)
2632 return (__m128i)__builtin_ia32_selectb_128(__M,
2638 _mm256_mask_broadcastb_epi8 (__m256i __O, __mmask32 __M, __m128i __A)
2640 return (__m256i)__builtin_ia32_selectb_256(__M,
2646 _mm256_maskz_broadcastb_epi8 (__mmask32 __M, __m128i __A)
2648 return (__m256i)__builtin_ia32_selectb_256(__M,
2654 _mm_mask_broadcastw_epi16 (__m128i __O, __mmask8 __M, __m128i __A)
2656 return (__m128i)__builtin_ia32_selectw_128(__M,
2662 _mm_maskz_broadcastw_epi16 (__mmask8 __M, __m128i __A)
2664 return (__m128i)__builtin_ia32_selectw_128(__M,
2670 _mm256_mask_broadcastw_epi16 (__m256i __O, __mmask16 __M, __m128i __A)
2672 return (__m256i)__builtin_ia32_selectw_256(__M,
2678 _mm256_maskz_broadcastw_epi16 (__mmask16 __M, __m128i __A)
2680 return (__m256i)__builtin_ia32_selectw_256(__M,
2686 _mm256_mask_set1_epi16 (__m256i __O, __mmask16 __M, short __A)
2688 return (__m256i) __builtin_ia32_selectw_256 (__M,
2694 _mm256_maskz_set1_epi16 (__mmask16 __M, short __A)
2696 return (__m256i) __builtin_ia32_selectw_256(__M,
2702 _mm_mask_set1_epi16 (__m128i __O, __mmask8 __M, short __A)
2704 return (__m128i) __builtin_ia32_selectw_128(__M,
2710 _mm_maskz_set1_epi16 (__mmask8 __M, short __A)
2712 return (__m128i) __builtin_ia32_selectw_128(__M,
2724 _mm_maskz_permutexvar_epi16 (__mmask8 __M, __m128i __A, __m128i __B)
2726 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
2732 _mm_mask_permutexvar_epi16 (__m128i __W, __mmask8 __M, __m128i __A,
2735 return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
2747 _mm256_maskz_permutexvar_epi16 (__mmask16 __M, __m256i __A,
2750 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
2756 _mm256_mask_permutexvar_epi16 (__m256i __W, __mmask16 __M, __m256i __A,
2759 return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
2833 _mm_mask_reduce_add_epi16( __mmask8 __M, __m128i __W) {
2834 __W = _mm_maskz_mov_epi16(__M, __W);
2839 _mm_mask_reduce_mul_epi16( __mmask8 __M, __m128i __W) {
2840 __W = _mm_mask_mov_epi16(_mm_set1_epi16(1), __M, __W);
2845 _mm_mask_reduce_and_epi16( __mmask8 __M, __m128i __W) {
2846 __W = _mm_mask_mov_epi16(_mm_set1_epi16(-1), __M, __W);
2851 _mm_mask_reduce_or_epi16(__mmask8 __M, __m128i __W) {
2852 __W = _mm_maskz_mov_epi16(__M, __W);
2877 _mm_mask_reduce_max_epi16(__mmask16 __M, __m128i __V) {
2878 __V = _mm_mask_mov_epi16(_mm_set1_epi16(-32767-1), __M, __V);
2883 _mm_mask_reduce_max_epu16(__mmask16 __M, __m128i __V) {
2884 __V = _mm_maskz_mov_epi16(__M, __V);
2889 _mm_mask_reduce_min_epi16(__mmask16 __M, __m128i __V) {
2890 __V = _mm_mask_mov_epi16(_mm_set1_epi16(32767), __M, __V);
2895 _mm_mask_reduce_min_epu16(__mmask16 __M, __m128i __V) {
2896 __V = _mm_mask_mov_epi16(_mm_set1_epi16(-1), __M, __V);
2921 _mm256_mask_reduce_add_epi16( __mmask16 __M, __m256i __W) {
2922 __W = _mm256_maskz_mov_epi16(__M, __W);
2927 _mm256_mask_reduce_mul_epi16( __mmask16 __M, __m256i __W) {
2928 __W = _mm256_mask_mov_epi16(_mm256_set1_epi16(1), __M, __W);
2933 _mm256_mask_reduce_and_epi16( __mmask16 __M, __m256i __W) {
2934 __W = _mm256_mask_mov_epi16(_mm256_set1_epi16(-1), __M, __W);
2939 _mm256_mask_reduce_or_epi16(__mmask16 __M, __m256i __W) {
2940 __W = _mm256_maskz_mov_epi16(__M, __W);
2965 _mm256_mask_reduce_max_epi16(__mmask16 __M, __m256i __V) {
2966 __V = _mm256_mask_mov_epi16(_mm256_set1_epi16(-32767-1), __M, __V);
2971 _mm256_mask_reduce_max_epu16(__mmask16 __M, __m256i __V) {
2972 __V = _mm256_maskz_mov_epi16(__M, __V);
2977 _mm256_mask_reduce_min_epi16(__mmask16 __M, __m256i __V) {
2978 __V = _mm256_mask_mov_epi16(_mm256_set1_epi16(32767), __M, __V);
2983 _mm256_mask_reduce_min_epu16(__mmask16 __M, __m256i __V) {
2984 __V = _mm256_mask_mov_epi16(_mm256_set1_epi16(-1), __M, __V);
3009 _mm_mask_reduce_add_epi8(__mmask16 __M, __m128i __W) {
3010 __W = _mm_maskz_mov_epi8(__M, __W);
3015 _mm_mask_reduce_mul_epi8(__mmask16 __M, __m128i __W) {
3016 __W = _mm_mask_mov_epi8(_mm_set1_epi8(1), __M, __W);
3021 _mm_mask_reduce_and_epi8(__mmask16 __M, __m128i __W) {
3022 __W = _mm_mask_mov_epi8(_mm_set1_epi8(-1), __M, __W);
3027 _mm_mask_reduce_or_epi8(__mmask16 __M, __m128i __W) {
3028 __W = _mm_maskz_mov_epi8(__M, __W);
3053 _mm_mask_reduce_max_epi8(__mmask16 __M, __m128i __V) {
3054 __V = _mm_mask_mov_epi8(_mm_set1_epi8(-127-1), __M, __V);
3059 _mm_mask_reduce_max_epu8(__mmask16 __M, __m128i __V) {
3060 __V = _mm_maskz_mov_epi8(__M, __V);
3065 _mm_mask_reduce_min_epi8(__mmask16 __M, __m128i __V) {
3066 __V = _mm_mask_mov_epi8(_mm_set1_epi8(127), __M, __V);
3071 _mm_mask_reduce_min_epu8(__mmask16 __M, __m128i __V) {
3072 __V = _mm_mask_mov_epi8(_mm_set1_epi8(-1), __M, __V);
3097 _mm256_mask_reduce_add_epi8(__mmask32 __M, __m256i __W) {
3098 __W = _mm256_maskz_mov_epi8(__M, __W);
3103 _mm256_mask_reduce_mul_epi8(__mmask32 __M, __m256i __W) {
3104 __W = _mm256_mask_mov_epi8(_mm256_set1_epi8(1), __M, __W);
3109 _mm256_mask_reduce_and_epi8(__mmask32 __M, __m256i __W) {
3110 __W = _mm256_mask_mov_epi8(_mm256_set1_epi8(-1), __M, __W);
3115 _mm256_mask_reduce_or_epi8(__mmask32 __M, __m256i __W) {
3116 __W = _mm256_maskz_mov_epi8(__M, __W);
3141 _mm256_mask_reduce_max_epi8(__mmask32 __M, __m256i __V) {
3142 __V = _mm256_mask_mov_epi8(_mm256_set1_epi8(-127-1), __M, __V);
3147 _mm256_mask_reduce_max_epu8(__mmask32 __M, __m256i __V) {
3148 __V = _mm256_maskz_mov_epi8(__M, __V);
3153 _mm256_mask_reduce_min_epi8(__mmask32 __M, __m256i __V) {
3154 __V = _mm256_mask_mov_epi8(_mm256_set1_epi8(127), __M, __V);
3159 _mm256_mask_reduce_min_epu8(__mmask32 __M, __m256i __V) {
3160 __V = _mm256_mask_mov_epi8(_mm256_set1_epi8(-1), __M, __V);