@zigc/lib 0.17.0-dev.27 → 0.17.0-dev.296
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/c/fcntl.zig +6 -1
- package/c/inttypes.zig +0 -10
- package/c/math.zig +52 -112
- package/c/pthread.zig +57 -0
- package/c/search.zig +1 -27
- package/c/stdlib/drand48.zig +0 -57
- package/c/stdlib.zig +31 -121
- package/c/string.zig +20 -7
- package/c/strings.zig +0 -38
- package/c/unistd.zig +27 -26
- package/c/wchar.zig +10 -0
- package/c.zig +2 -2
- package/compiler/aro/aro/CodeGen.zig +7 -8
- package/compiler/aro/aro/Compilation.zig +17 -17
- package/compiler/aro/aro/Driver.zig +14 -13
- package/compiler/aro/aro/Parser.zig +20 -15
- package/compiler/aro/aro/Pragma.zig +3 -2
- package/compiler/aro/aro/Preprocessor.zig +9 -6
- package/compiler/aro/aro/pragmas/message.zig +3 -2
- package/compiler/aro/aro/text_literal.zig +3 -2
- package/compiler/aro/assembly_backend/x86_64.zig +4 -4
- package/compiler/build_runner.zig +2 -4
- package/compiler/reduce/Walk.zig +8 -13
- package/compiler/resinator/compile.zig +1 -1
- package/compiler/resinator/cvtres.zig +4 -4
- package/compiler/resinator/errors.zig +7 -7
- package/compiler/resinator/ico.zig +4 -4
- package/compiler/resinator/parse.zig +2 -2
- package/compiler/resinator/res.zig +1 -1
- package/compiler/std-docs.zig +1 -1
- package/compiler/test_runner.zig +1 -1
- package/compiler/translate-c/MacroTranslator.zig +1 -1
- package/compiler/translate-c/Translator.zig +6 -2
- package/compiler/translate-c/ast.zig +16 -23
- package/compiler/translate-c/main.zig +1 -1
- package/compiler_rt/addf3.zig +1 -1
- package/compiler_rt/arm.zig +3 -3
- package/compiler_rt/atomics.zig +1 -1
- package/compiler_rt/comparef.zig +3 -3
- package/compiler_rt/cos.zig +1 -3
- package/compiler_rt/count0bits.zig +1 -1
- package/compiler_rt/divdf3.zig +2 -2
- package/compiler_rt/divsf3.zig +1 -1
- package/compiler_rt/divtf3.zig +1 -1
- package/compiler_rt/divxf3.zig +1 -1
- package/compiler_rt/exp.zig +0 -2
- package/compiler_rt/exp2.zig +0 -2
- package/compiler_rt/extendf.zig +5 -5
- package/compiler_rt/fabs.zig +1 -3
- package/compiler_rt/float_from_int.zig +3 -4
- package/compiler_rt/fma.zig +0 -2
- package/compiler_rt/fmax.zig +1 -3
- package/compiler_rt/fmin.zig +1 -3
- package/compiler_rt/fmod.zig +2 -4
- package/compiler_rt/limb64.zig +3 -2
- package/compiler_rt/log.zig +0 -2
- package/compiler_rt/log10.zig +0 -2
- package/compiler_rt/log2.zig +0 -2
- package/compiler_rt/mulf3.zig +2 -2
- package/compiler_rt/rem_pio2l.zig +1 -1
- package/compiler_rt/round.zig +0 -2
- package/compiler_rt/sin.zig +1 -3
- package/compiler_rt/sincos.zig +1 -3
- package/compiler_rt/sqrt.zig +0 -2
- package/compiler_rt/ssp.zig +2 -2
- package/compiler_rt/tan.zig +1 -3
- package/compiler_rt/trunc.zig +0 -2
- package/compiler_rt/truncf.zig +3 -3
- package/compiler_rt/trunctfhf2.zig +3 -0
- package/compiler_rt.zig +5 -26
- package/docs/wasm/Walk.zig +1 -3
- package/docs/wasm/html_render.zig +1 -2
- package/docs/wasm/markdown/Parser.zig +16 -20
- package/fuzzer.zig +2 -0
- package/include/__clang_spirv_builtins.h +12 -12
- package/include/__float_float.h +176 -0
- package/include/__float_header_macro.h +12 -0
- package/include/__float_infinity_nan.h +20 -0
- package/include/amo.h +131 -0
- package/include/amxavx512intrin.h +215 -1
- package/include/amxintrin.h +0 -2
- package/include/arm_acle.h +37 -27
- package/include/arm_neon.h +218 -82
- package/include/arm_sme.h +8 -8
- package/include/arm_sve.h +4162 -3782
- package/include/avx10_2_512bf16intrin.h +19 -12
- package/include/avx10_2_512convertintrin.h +1 -1
- package/include/avx10_2_512niintrin.h +31 -31
- package/include/avx10_2_512satcvtdsintrin.h +1 -1
- package/include/avx10_2bf16intrin.h +54 -45
- package/include/avx10_2convertintrin.h +2 -2
- package/include/avx10_2copyintrin.h +1 -1
- package/include/avx10_2niintrin.h +14 -14
- package/include/avx10_2satcvtdsintrin.h +2 -2
- package/include/avx2intrin.h +275 -377
- package/include/avx512bf16intrin.h +25 -16
- package/include/avx512bitalgintrin.h +19 -30
- package/include/avx512bwintrin.h +386 -505
- package/include/avx512cdintrin.h +42 -55
- package/include/avx512dqintrin.h +132 -161
- package/include/avx512fintrin.h +1015 -1424
- package/include/avx512fp16intrin.h +112 -110
- package/include/avx512ifmaintrin.h +32 -34
- package/include/avx512ifmavlintrin.h +73 -46
- package/include/avx512vbmi2intrin.h +43 -32
- package/include/avx512vbmiintrin.h +19 -27
- package/include/avx512vbmivlintrin.h +35 -49
- package/include/avx512vlbf16intrin.h +32 -22
- package/include/avx512vlbitalgintrin.h +37 -53
- package/include/avx512vlbwintrin.h +470 -573
- package/include/avx512vlcdintrin.h +74 -102
- package/include/avx512vldqintrin.h +110 -127
- package/include/avx512vlfp16intrin.h +130 -111
- package/include/avx512vlintrin.h +945 -1299
- package/include/avx512vlvbmi2intrin.h +78 -63
- package/include/avx512vlvnniintrin.h +21 -18
- package/include/avx512vlvp2intersectintrin.h +2 -2
- package/include/avx512vnniintrin.h +10 -10
- package/include/avx512vp2intersectintrin.h +1 -2
- package/include/avx512vpopcntdqintrin.h +8 -10
- package/include/avx512vpopcntdqvlintrin.h +17 -15
- package/include/avxifmaintrin.h +16 -0
- package/include/avxintrin.h +165 -241
- package/include/avxvnniint16intrin.h +118 -99
- package/include/avxvnniint8intrin.h +56 -32
- package/include/avxvnniintrin.h +16 -8
- package/include/cpuid.h +101 -4
- package/include/emmintrin.h +168 -168
- package/include/f16cintrin.h +23 -9
- package/include/float.h +16 -155
- package/include/fma4intrin.h +98 -96
- package/include/fmaintrin.h +96 -66
- package/include/gfniintrin.h +21 -16
- package/include/hexagon_types.h +23 -20
- package/include/hvx_hexagon_protos.h +649 -860
- package/include/immintrin.h +0 -12
- package/include/intrin.h +4 -0
- package/include/lasxintrin.h +113 -0
- package/include/llvm_libc_wrappers/assert.h +3 -5
- package/include/llvm_libc_wrappers/ctype.h +3 -115
- package/include/llvm_libc_wrappers/inttypes.h +3 -5
- package/include/llvm_libc_wrappers/stdio.h +10 -38
- package/include/llvm_libc_wrappers/stdlib.h +3 -24
- package/include/llvm_libc_wrappers/string.h +2 -70
- package/include/llvm_libc_wrappers/time.h +4 -10
- package/include/mmintrin.h +188 -257
- package/include/module.modulemap +23 -4
- package/include/movrs_avx10_2_512intrin.h +2 -2
- package/include/movrs_avx10_2intrin.h +4 -4
- package/include/pmmintrin.h +12 -24
- package/include/ptrauth.h +16 -2
- package/include/riscv_mips.h +34 -0
- package/include/riscv_nds.h +89 -0
- package/include/sifive_vector.h +58 -2
- package/include/sm4evexintrin.h +2 -2
- package/include/smmintrin.h +77 -59
- package/include/spirvintrin.h +194 -0
- package/include/stddefer.h +19 -0
- package/include/tmmintrin.h +116 -147
- package/include/vaesintrin.h +1 -2
- package/include/xmmintrin.h +44 -70
- package/include/xopintrin.h +20 -10
- package/libc/include/aarch64-linux-any/asm/hwcap.h +1 -0
- package/libc/include/aarch64-linux-any/asm/unistd_64.h +1 -0
- package/libc/include/any-linux-any/asm-generic/errno.h +2 -0
- package/libc/include/any-linux-any/asm-generic/unistd.h +4 -1
- package/libc/include/any-linux-any/drm/amdgpu_drm.h +20 -6
- package/libc/include/any-linux-any/drm/amdxdna_accel.h +8 -0
- package/libc/include/any-linux-any/drm/drm_fourcc.h +6 -6
- package/libc/include/any-linux-any/drm/panfrost_drm.h +75 -1
- package/libc/include/any-linux-any/drm/panthor_drm.h +154 -3
- package/libc/include/any-linux-any/drm/rocket_accel.h +74 -24
- package/libc/include/any-linux-any/drm/xe_drm.h +89 -6
- package/libc/include/any-linux-any/linux/android/binder.h +1 -1
- package/libc/include/any-linux-any/linux/bpf.h +28 -0
- package/libc/include/any-linux-any/linux/btrfs.h +1 -0
- package/libc/include/any-linux-any/linux/btrfs_tree.h +32 -2
- package/libc/include/any-linux-any/linux/dma-buf.h +1 -0
- package/libc/include/any-linux-any/linux/dpll.h +1 -0
- package/libc/include/any-linux-any/linux/elf.h +2 -0
- package/libc/include/any-linux-any/linux/ethtool.h +21 -5
- package/libc/include/any-linux-any/linux/fs.h +1 -0
- package/libc/include/any-linux-any/linux/hyperv.h +1 -1
- package/libc/include/any-linux-any/linux/idxd.h +134 -134
- package/libc/include/any-linux-any/linux/if_alg.h +1 -1
- package/libc/include/any-linux-any/linux/if_link.h +1 -0
- package/libc/include/any-linux-any/linux/input-event-codes.h +4 -0
- package/libc/include/any-linux-any/linux/io_uring/bpf_filter.h +68 -0
- package/libc/include/any-linux-any/linux/io_uring/query.h +5 -1
- package/libc/include/any-linux-any/linux/io_uring.h +33 -2
- package/libc/include/any-linux-any/linux/iommufd.h +39 -0
- package/libc/include/any-linux-any/linux/kfd_ioctl.h +13 -3
- package/libc/include/any-linux-any/linux/kfd_sysfs.h +2 -1
- package/libc/include/any-linux-any/linux/kvm.h +30 -6
- package/libc/include/any-linux-any/linux/landlock.h +22 -8
- package/libc/include/any-linux-any/linux/magic.h +1 -0
- package/libc/include/any-linux-any/linux/mempolicy.h +3 -0
- package/libc/include/any-linux-any/linux/mount.h +11 -2
- package/libc/include/any-linux-any/linux/mptcp_pm.h +1 -1
- package/libc/include/any-linux-any/linux/mshv.h +2 -0
- package/libc/include/any-linux-any/linux/netfilter_bridge.h +5 -4
- package/libc/include/any-linux-any/linux/netfilter_ipv4.h +4 -5
- package/libc/include/any-linux-any/linux/netfilter_ipv6.h +3 -4
- package/libc/include/any-linux-any/linux/nfs.h +1 -1
- package/libc/include/any-linux-any/linux/nfsd_netlink.h +1 -0
- package/libc/include/any-linux-any/linux/nilfs2_api.h +2 -2
- package/libc/include/any-linux-any/linux/nilfs2_ondisk.h +97 -66
- package/libc/include/any-linux-any/linux/nl80211.h +104 -3
- package/libc/include/any-linux-any/linux/pci.h +7 -0
- package/libc/include/any-linux-any/linux/pci_regs.h +65 -6
- package/libc/include/any-linux-any/linux/pcitest.h +1 -0
- package/libc/include/any-linux-any/linux/perf_event.h +24 -3
- package/libc/include/any-linux-any/linux/pkt_sched.h +1 -0
- package/libc/include/any-linux-any/linux/prctl.h +30 -0
- package/libc/include/any-linux-any/linux/rseq.h +62 -5
- package/libc/include/any-linux-any/linux/shm.h +0 -1
- package/libc/include/any-linux-any/linux/stddef.h +4 -0
- package/libc/include/any-linux-any/linux/sysctl.h +1 -2
- package/libc/include/any-linux-any/linux/taskstats.h +12 -1
- package/libc/include/any-linux-any/linux/tcp.h +23 -3
- package/libc/include/any-linux-any/linux/typelimits.h +8 -0
- package/libc/include/any-linux-any/linux/ublk_cmd.h +120 -1
- package/libc/include/any-linux-any/linux/v4l2-controls.h +63 -0
- package/libc/include/any-linux-any/linux/vbox_vmmdev_types.h +2 -2
- package/libc/include/any-linux-any/linux/vduse.h +80 -5
- package/libc/include/any-linux-any/linux/version.h +3 -3
- package/libc/include/any-linux-any/linux/vfio.h +4 -0
- package/libc/include/any-linux-any/linux/videodev2.h +3 -0
- package/libc/include/any-linux-any/linux/virtio_ring.h +1 -2
- package/libc/include/any-linux-any/linux/vmclock-abi.h +20 -0
- package/libc/include/any-linux-any/rdma/bnxt_re-abi.h +16 -0
- package/libc/include/any-linux-any/rdma/ib_user_ioctl_cmds.h +16 -0
- package/libc/include/any-linux-any/rdma/mana-abi.h +3 -0
- package/libc/include/any-linux-any/scsi/scsi_bsg_ufs.h +8 -9
- package/libc/include/any-linux-any/sound/sof/tokens.h +6 -0
- package/libc/include/arc-linux-any/asm/swab.h +0 -63
- package/libc/include/arc-linux-any/asm/unistd_32.h +1 -0
- package/libc/include/arm-linux-any/asm/ptrace.h +0 -9
- package/libc/include/arm-linux-any/asm/unistd-eabi.h +1 -0
- package/libc/include/arm-linux-any/asm/unistd-oabi.h +1 -0
- package/libc/include/csky-linux-any/asm/unistd_32.h +1 -0
- package/libc/include/hexagon-linux-any/asm/unistd_32.h +1 -0
- package/libc/include/loongarch-linux-any/asm/hwcap.h +1 -0
- package/libc/include/loongarch-linux-any/asm/kvm.h +1 -0
- package/libc/include/loongarch-linux-any/asm/kvm_para.h +1 -0
- package/libc/include/loongarch-linux-any/asm/unistd_32.h +2 -0
- package/libc/include/loongarch-linux-any/asm/unistd_64.h +2 -0
- package/libc/include/m68k-linux-any/asm/unistd_32.h +1 -0
- package/libc/include/mips-linux-any/asm/errno.h +2 -0
- package/libc/include/mips-linux-any/asm/unistd_n32.h +1 -0
- package/libc/include/mips-linux-any/asm/unistd_n64.h +1 -0
- package/libc/include/mips-linux-any/asm/unistd_o32.h +1 -0
- package/libc/include/powerpc-linux-any/asm/unistd_32.h +1 -0
- package/libc/include/powerpc-linux-any/asm/unistd_64.h +1 -0
- package/libc/include/riscv-linux-any/asm/hwprobe.h +4 -0
- package/libc/include/riscv-linux-any/asm/kvm.h +3 -0
- package/libc/include/riscv-linux-any/asm/ptrace.h +37 -0
- package/libc/include/riscv-linux-any/asm/sigcontext.h +1 -0
- package/libc/include/riscv-linux-any/asm/unistd_32.h +1 -0
- package/libc/include/riscv-linux-any/asm/unistd_64.h +1 -0
- package/libc/include/s390x-linux-any/asm/unistd_64.h +1 -0
- package/libc/include/sparc-linux-any/asm/errno.h +2 -0
- package/libc/include/sparc-linux-any/asm/ioctls.h +4 -4
- package/libc/include/sparc-linux-any/asm/unistd_32.h +2 -0
- package/libc/include/sparc-linux-any/asm/unistd_64.h +2 -0
- package/libc/include/x86-linux-any/asm/auxvec.h +0 -4
- package/libc/include/x86-linux-any/asm/kvm.h +13 -8
- package/libc/include/x86-linux-any/asm/svm.h +16 -16
- package/libc/include/x86-linux-any/asm/unistd_32.h +1 -0
- package/libc/include/x86-linux-any/asm/unistd_64.h +1 -0
- package/libc/include/x86-linux-any/asm/unistd_x32.h +1 -0
- package/libc/include/xtensa-linux-any/asm/unistd_32.h +1 -0
- package/libc/musl/arch/mipsn32/syscall_arch.h +35 -32
- package/libcxx/include/__algorithm/all_of.h +11 -5
- package/libcxx/include/__algorithm/comp.h +4 -0
- package/libcxx/include/__algorithm/copy.h +28 -147
- package/libcxx/include/__algorithm/copy_backward.h +9 -24
- package/libcxx/include/__algorithm/copy_n.h +50 -16
- package/libcxx/include/__algorithm/count.h +2 -2
- package/libcxx/include/__algorithm/equal.h +43 -55
- package/libcxx/include/__algorithm/fill.h +26 -8
- package/libcxx/include/__algorithm/fill_n.h +32 -46
- package/libcxx/include/__algorithm/find.h +96 -39
- package/libcxx/include/__algorithm/find_end.h +105 -0
- package/libcxx/include/__algorithm/for_each.h +18 -24
- package/libcxx/include/__algorithm/for_each_n.h +20 -47
- package/libcxx/include/__algorithm/for_each_n_segment.h +1 -1
- package/libcxx/include/__algorithm/for_each_segment.h +26 -0
- package/libcxx/include/__algorithm/generate.h +4 -2
- package/libcxx/include/__algorithm/generate_n.h +19 -6
- package/libcxx/include/__algorithm/is_permutation.h +4 -4
- package/libcxx/include/__algorithm/iterator_operations.h +3 -0
- package/libcxx/include/__algorithm/lexicographical_compare.h +2 -2
- package/libcxx/include/__algorithm/lexicographical_compare_three_way.h +6 -6
- package/libcxx/include/__algorithm/make_heap.h +16 -4
- package/libcxx/include/__algorithm/mismatch.h +2 -2
- package/libcxx/include/__algorithm/move.h +8 -19
- package/libcxx/include/__algorithm/move_backward.h +9 -24
- package/libcxx/include/__algorithm/none_of.h +4 -4
- package/libcxx/include/__algorithm/partial_sort.h +1 -1
- package/libcxx/include/__algorithm/partial_sort_copy.h +1 -1
- package/libcxx/include/__algorithm/pstl.h +9 -9
- package/libcxx/include/__algorithm/radix_sort.h +27 -25
- package/libcxx/include/__algorithm/ranges_copy_n.h +3 -26
- package/libcxx/include/__algorithm/ranges_equal.h +17 -26
- package/libcxx/include/__algorithm/ranges_fill.h +7 -6
- package/libcxx/include/__algorithm/ranges_for_each.h +9 -1
- package/libcxx/include/__algorithm/ranges_generate_n.h +2 -6
- package/libcxx/include/__algorithm/ranges_search_n.h +2 -2
- package/libcxx/include/__algorithm/rotate.h +27 -44
- package/libcxx/include/__algorithm/search_n.h +49 -37
- package/libcxx/include/__algorithm/sift_down.h +19 -18
- package/libcxx/include/__algorithm/simd_utils.h +33 -4
- package/libcxx/include/__algorithm/specialized_algorithms.h +54 -0
- package/libcxx/include/__algorithm/stable_sort.h +1 -1
- package/libcxx/include/__assertion_handler +31 -4
- package/libcxx/include/__atomic/atomic.h +36 -60
- package/libcxx/include/__atomic/atomic_flag.h +19 -37
- package/libcxx/include/__atomic/atomic_ref.h +29 -12
- package/libcxx/include/__atomic/atomic_sync.h +127 -55
- package/libcxx/include/__atomic/atomic_sync_timed.h +144 -0
- package/libcxx/include/__atomic/atomic_waitable_traits.h +103 -0
- package/libcxx/include/__atomic/contention_t.h +27 -3
- package/libcxx/include/__atomic/floating_point_helper.h +55 -0
- package/libcxx/include/__bit/countl.h +1 -2
- package/libcxx/include/__bit/countr.h +1 -2
- package/libcxx/include/__bit/has_single_bit.h +1 -1
- package/libcxx/include/__bit/popcount.h +0 -1
- package/libcxx/include/__bit/rotate.h +15 -26
- package/libcxx/include/__bit_reference +207 -18
- package/libcxx/include/__charconv/from_chars_integral.h +1 -1
- package/libcxx/include/__charconv/from_chars_result.h +1 -1
- package/libcxx/include/__charconv/to_chars_integral.h +1 -0
- package/libcxx/include/__charconv/to_chars_result.h +1 -1
- package/libcxx/include/__charconv/traits.h +3 -24
- package/libcxx/include/__chrono/day.h +11 -0
- package/libcxx/include/__chrono/duration.h +58 -33
- package/libcxx/include/__chrono/file_clock.h +4 -2
- package/libcxx/include/__chrono/is_clock.h +72 -0
- package/libcxx/include/__chrono/leap_second.h +13 -0
- package/libcxx/include/__chrono/month.h +13 -0
- package/libcxx/include/__chrono/month_weekday.h +22 -0
- package/libcxx/include/__chrono/monthday.h +20 -0
- package/libcxx/include/__chrono/steady_clock.h +1 -1
- package/libcxx/include/__chrono/system_clock.h +3 -3
- package/libcxx/include/__chrono/time_point.h +37 -13
- package/libcxx/include/__chrono/weekday.h +25 -0
- package/libcxx/include/__chrono/year.h +11 -0
- package/libcxx/include/__chrono/year_month.h +13 -0
- package/libcxx/include/__chrono/year_month_day.h +23 -0
- package/libcxx/include/__chrono/year_month_weekday.h +26 -0
- package/libcxx/include/__chrono/zoned_time.h +16 -0
- package/libcxx/include/__compare/is_eq.h +6 -6
- package/libcxx/include/__compare/strong_order.h +12 -30
- package/libcxx/include/__compare/three_way_comparable.h +2 -2
- package/libcxx/include/__concepts/comparison_common_type.h +40 -0
- package/libcxx/include/__concepts/equality_comparable.h +2 -1
- package/libcxx/include/__condition_variable/condition_variable.h +1 -1
- package/libcxx/include/__config +63 -280
- package/libcxx/include/__configuration/abi.h +14 -24
- package/libcxx/include/__configuration/availability.h +65 -118
- package/libcxx/include/__configuration/compiler.h +6 -6
- package/libcxx/include/__configuration/experimental.h +38 -0
- package/libcxx/include/__configuration/hardening.h +215 -0
- package/libcxx/include/__configuration/language.h +3 -0
- package/libcxx/include/__configuration/platform.h +9 -16
- package/libcxx/include/__coroutine/coroutine_handle.h +9 -9
- package/libcxx/include/__coroutine/noop_coroutine_handle.h +11 -13
- package/libcxx/include/__debug_utils/strict_weak_ordering_check.h +1 -1
- package/libcxx/include/__exception/exception.h +6 -4
- package/libcxx/include/__exception/exception_ptr.h +27 -5
- package/libcxx/include/__exception/nested_exception.h +2 -2
- package/libcxx/include/__exception/operations.h +5 -5
- package/libcxx/include/__expected/bad_expected_access.h +8 -6
- package/libcxx/include/__expected/expected.h +62 -64
- package/libcxx/include/__expected/unexpected.h +4 -4
- package/libcxx/include/__filesystem/copy_options.h +4 -4
- package/libcxx/include/__filesystem/directory_entry.h +37 -33
- package/libcxx/include/__filesystem/directory_iterator.h +9 -11
- package/libcxx/include/__filesystem/directory_options.h +7 -4
- package/libcxx/include/__filesystem/file_status.h +3 -3
- package/libcxx/include/__filesystem/filesystem_error.h +9 -10
- package/libcxx/include/__filesystem/operations.h +97 -66
- package/libcxx/include/__filesystem/path.h +68 -64
- package/libcxx/include/__filesystem/path_iterator.h +1 -3
- package/libcxx/include/__filesystem/perm_options.h +4 -4
- package/libcxx/include/__filesystem/perms.h +4 -4
- package/libcxx/include/__filesystem/recursive_directory_iterator.h +9 -14
- package/libcxx/include/__filesystem/space_info.h +1 -1
- package/libcxx/include/__filesystem/u8path.h +12 -14
- package/libcxx/include/__flat_map/flat_map.h +88 -71
- package/libcxx/include/__flat_map/flat_multimap.h +251 -172
- package/libcxx/include/__flat_map/key_value_iterator.h +0 -1
- package/libcxx/include/__flat_map/utils.h +1 -0
- package/libcxx/include/__flat_set/flat_multiset.h +211 -143
- package/libcxx/include/__flat_set/flat_set.h +86 -68
- package/libcxx/include/__format/concepts.h +0 -14
- package/libcxx/include/__format/extended_grapheme_cluster_table.h +3 -2
- package/libcxx/include/__format/fmt_pair_like.h +42 -0
- package/libcxx/include/__format/format_arg.h +7 -10
- package/libcxx/include/__format/format_args.h +1 -1
- package/libcxx/include/__format/format_context.h +5 -5
- package/libcxx/include/__format/format_parse_context.h +2 -2
- package/libcxx/include/__format/formatter_output.h +30 -34
- package/libcxx/include/__format/indic_conjunct_break_table.h +3 -2
- package/libcxx/include/__format/range_default_formatter.h +2 -41
- package/libcxx/include/__format/range_format.h +71 -0
- package/libcxx/include/__format/range_formatter.h +1 -0
- package/libcxx/include/__format/width_estimation_table.h +4 -2
- package/libcxx/include/__functional/bind.h +10 -15
- package/libcxx/include/__functional/bind_back.h +1 -1
- package/libcxx/include/__functional/bind_front.h +1 -1
- package/libcxx/include/__functional/function.h +57 -75
- package/libcxx/include/__functional/hash.h +1 -10
- package/libcxx/include/__functional/identity.h +1 -1
- package/libcxx/include/__functional/is_transparent.h +8 -0
- package/libcxx/include/__functional/mem_fn.h +2 -1
- package/libcxx/include/__functional/operations.h +18 -0
- package/libcxx/include/__functional/ranges_operations.h +7 -0
- package/libcxx/include/__functional/reference_wrapper.h +7 -5
- package/libcxx/include/__functional/weak_result_type.h +14 -28
- package/libcxx/include/__fwd/ios.h +1 -1
- package/libcxx/include/__fwd/tuple.h +14 -0
- package/libcxx/include/__hash_table +371 -357
- package/libcxx/include/__ios/fpos.h +4 -4
- package/libcxx/include/__iterator/back_insert_iterator.h +1 -7
- package/libcxx/include/__iterator/bounded_iter.h +7 -8
- package/libcxx/include/__iterator/concepts.h +6 -9
- package/libcxx/include/__iterator/cpp17_iterator_concepts.h +13 -12
- package/libcxx/include/__iterator/distance.h +40 -18
- package/libcxx/include/__iterator/front_insert_iterator.h +1 -7
- package/libcxx/include/__iterator/insert_iterator.h +1 -7
- package/libcxx/include/__iterator/istream_iterator.h +6 -7
- package/libcxx/include/__iterator/istreambuf_iterator.h +6 -7
- package/libcxx/include/__iterator/iter_move.h +1 -1
- package/libcxx/include/__iterator/iterator.h +13 -0
- package/libcxx/include/__iterator/iterator_traits.h +13 -14
- package/libcxx/include/__iterator/ostream_iterator.h +1 -7
- package/libcxx/include/__iterator/ostreambuf_iterator.h +1 -7
- package/libcxx/include/__iterator/reverse_iterator.h +8 -13
- package/libcxx/include/__iterator/segmented_iterator.h +3 -8
- package/libcxx/include/__iterator/static_bounded_iter.h +3 -3
- package/libcxx/include/__iterator/wrap_iter.h +8 -6
- package/libcxx/include/__locale +3 -10
- package/libcxx/include/__locale_dir/locale_base_api/bsd_locale_fallbacks.h +0 -10
- package/libcxx/include/__locale_dir/locale_base_api.h +5 -28
- package/libcxx/include/__locale_dir/messages.h +1 -1
- package/libcxx/include/__locale_dir/money.h +2 -2
- package/libcxx/include/__locale_dir/num.h +190 -243
- package/libcxx/include/__locale_dir/pad_and_output.h +5 -6
- package/libcxx/include/__locale_dir/support/bsd_like.h +0 -20
- package/libcxx/include/__locale_dir/support/fuchsia.h +0 -7
- package/libcxx/include/__locale_dir/support/linux.h +0 -37
- package/libcxx/include/__locale_dir/support/netbsd.h +0 -2
- package/libcxx/include/__locale_dir/support/newlib.h +243 -0
- package/libcxx/include/__locale_dir/support/no_locale/characters.h +0 -4
- package/libcxx/include/__locale_dir/support/no_locale/strtonum.h +0 -9
- package/libcxx/include/__locale_dir/support/windows.h +0 -29
- package/libcxx/include/__locale_dir/time.h +3 -7
- package/libcxx/include/__math/hypot.h +1 -1
- package/libcxx/include/__math/logarithms.h +1 -1
- package/libcxx/include/__math/traits.h +80 -11
- package/libcxx/include/__mdspan/extents.h +7 -4
- package/libcxx/include/__mdspan/layout_stride.h +4 -5
- package/libcxx/include/__mdspan/mdspan.h +29 -23
- package/libcxx/include/__memory/addressof.h +7 -5
- package/libcxx/include/__memory/align.h +18 -1
- package/libcxx/include/__memory/allocate_at_least.h +15 -10
- package/libcxx/include/__memory/allocator.h +14 -26
- package/libcxx/include/__memory/allocator_traits.h +6 -4
- package/libcxx/include/__memory/compressed_pair.h +15 -9
- package/libcxx/include/__memory/construct_at.h +12 -23
- package/libcxx/include/__memory/inout_ptr.h +1 -1
- package/libcxx/include/__memory/is_sufficiently_aligned.h +1 -1
- package/libcxx/include/__memory/out_ptr.h +1 -1
- package/libcxx/include/__memory/pointer_traits.h +1 -1
- package/libcxx/include/__memory/raw_storage_iterator.h +3 -9
- package/libcxx/include/__memory/shared_count.h +9 -30
- package/libcxx/include/__memory/shared_ptr.h +100 -145
- package/libcxx/include/__memory/temp_value.h +1 -2
- package/libcxx/include/__memory/uninitialized_algorithms.h +44 -115
- package/libcxx/include/__memory/unique_ptr.h +14 -16
- package/libcxx/include/__memory/uses_allocator_construction.h +1 -0
- package/libcxx/include/__memory_resource/memory_resource.h +4 -2
- package/libcxx/include/__memory_resource/monotonic_buffer_resource.h +1 -1
- package/libcxx/include/__memory_resource/polymorphic_allocator.h +13 -8
- package/libcxx/include/__memory_resource/pool_options.h +1 -1
- package/libcxx/include/__memory_resource/synchronized_pool_resource.h +4 -2
- package/libcxx/include/__memory_resource/unsynchronized_pool_resource.h +1 -1
- package/libcxx/include/__mutex/mutex.h +2 -2
- package/libcxx/include/__mutex/once_flag.h +14 -11
- package/libcxx/include/__mutex/tag_types.h +3 -3
- package/libcxx/include/__mutex/unique_lock.h +8 -7
- package/libcxx/include/__new/align_val_t.h +6 -0
- package/libcxx/include/__new/allocate.h +1 -2
- package/libcxx/include/__new/exceptions.h +8 -2
- package/libcxx/include/__new/global_new_delete.h +4 -11
- package/libcxx/include/__new/interference_size.h +0 -4
- package/libcxx/include/__new/launder.h +3 -5
- package/libcxx/include/__new/nothrow_t.h +1 -1
- package/libcxx/include/__numeric/gcd_lcm.h +24 -34
- package/libcxx/include/__numeric/midpoint.h +9 -14
- package/libcxx/include/__numeric/pstl.h +2 -2
- package/libcxx/include/__numeric/saturation_arithmetic.h +13 -5
- package/libcxx/include/__ostream/basic_ostream.h +8 -8
- package/libcxx/include/__pstl/backends/default.h +14 -14
- package/libcxx/include/__pstl/backends/libdispatch.h +2 -2
- package/libcxx/include/__pstl/cpu_algos/find_if.h +1 -1
- package/libcxx/include/__pstl/cpu_algos/transform.h +5 -6
- package/libcxx/include/__pstl/cpu_algos/transform_reduce.h +5 -4
- package/libcxx/include/__random/binomial_distribution.h +10 -4
- package/libcxx/include/__random/mersenne_twister_engine.h +50 -154
- package/libcxx/include/__random/piecewise_constant_distribution.h +3 -2
- package/libcxx/include/__random/piecewise_linear_distribution.h +3 -2
- package/libcxx/include/__ranges/adjacent_transform_view.h +406 -0
- package/libcxx/include/__ranges/adjacent_view.h +419 -0
- package/libcxx/include/__ranges/as_rvalue_view.h +9 -9
- package/libcxx/include/__ranges/chunk_by_view.h +6 -6
- package/libcxx/include/__ranges/common_view.h +7 -7
- package/libcxx/include/__ranges/drop_view.h +8 -8
- package/libcxx/include/__ranges/drop_while_view.h +5 -5
- package/libcxx/include/__ranges/elements_of.h +49 -0
- package/libcxx/include/__ranges/empty_view.h +5 -5
- package/libcxx/include/__ranges/filter_view.h +10 -10
- package/libcxx/include/__ranges/iota_view.h +41 -22
- package/libcxx/include/__ranges/owning_view.h +15 -15
- package/libcxx/include/__ranges/ref_view.h +6 -6
- package/libcxx/include/__ranges/repeat_view.h +17 -10
- package/libcxx/include/__ranges/single_view.h +8 -8
- package/libcxx/include/__ranges/take_view.h +9 -9
- package/libcxx/include/__ranges/transform_view.h +1 -2
- package/libcxx/include/__ranges/view_interface.h +10 -10
- package/libcxx/include/__ranges/zip_transform_view.h +357 -0
- package/libcxx/include/__ranges/zip_view.h +20 -20
- package/libcxx/include/__split_buffer +612 -240
- package/libcxx/include/__stop_token/atomic_unique_lock.h +1 -1
- package/libcxx/include/__stop_token/stop_callback.h +2 -2
- package/libcxx/include/__stop_token/stop_source.h +1 -1
- package/libcxx/include/__stop_token/stop_state.h +4 -4
- package/libcxx/include/__stop_token/stop_token.h +1 -1
- package/libcxx/include/__string/char_traits.h +51 -31
- package/libcxx/include/__string/constexpr_c_functions.h +5 -5
- package/libcxx/include/__support/xlocale/__strtonum_fallback.h +0 -8
- package/libcxx/include/__system_error/error_category.h +8 -8
- package/libcxx/include/__system_error/error_code.h +5 -5
- package/libcxx/include/__system_error/error_condition.h +4 -4
- package/libcxx/include/__system_error/system_error.h +1 -1
- package/libcxx/include/__thread/id.h +1 -1
- package/libcxx/include/__thread/jthread.h +1 -1
- package/libcxx/include/__thread/poll_with_backoff.h +27 -8
- package/libcxx/include/__thread/support/c11.h +8 -8
- package/libcxx/include/__thread/support/pthread.h +8 -8
- package/libcxx/include/__thread/support/windows.h +8 -8
- package/libcxx/include/__thread/thread.h +13 -8
- package/libcxx/include/__thread/timed_backoff_policy.h +3 -2
- package/libcxx/include/__tree +849 -701
- package/libcxx/include/__tuple/sfinae_helpers.h +1 -44
- package/libcxx/include/__tuple/tuple_element.h +0 -12
- package/libcxx/include/__tuple/tuple_size.h +0 -4
- package/libcxx/include/__tuple/tuple_transform.h +45 -0
- package/libcxx/include/__type_traits/aligned_storage.h +13 -40
- package/libcxx/include/__type_traits/desugars_to.h +4 -0
- package/libcxx/include/__type_traits/invoke.h +8 -0
- package/libcxx/include/__type_traits/is_allocator.h +6 -7
- package/libcxx/include/__type_traits/is_array.h +26 -0
- package/libcxx/include/__type_traits/is_equality_comparable.h +16 -21
- package/libcxx/include/__type_traits/is_final.h +1 -1
- package/libcxx/include/__type_traits/is_floating_point.h +7 -6
- package/libcxx/include/__type_traits/is_generic_transparent_comparator.h +30 -0
- package/libcxx/include/__type_traits/is_specialization.h +2 -6
- package/libcxx/include/__type_traits/is_within_lifetime.h +29 -0
- package/libcxx/include/__type_traits/make_transparent.h +52 -0
- package/libcxx/include/__type_traits/reference_constructs_from_temporary.h +1 -7
- package/libcxx/include/__type_traits/reference_converts_from_temporary.h +1 -1
- package/libcxx/include/__utility/cmp.h +19 -7
- package/libcxx/include/__utility/default_three_way_comparator.h +70 -0
- package/libcxx/include/__utility/in_place.h +1 -1
- package/libcxx/include/__utility/integer_sequence.h +56 -41
- package/libcxx/include/__utility/lazy_synth_three_way_comparator.h +120 -0
- package/libcxx/include/__utility/pair.h +22 -25
- package/libcxx/include/__utility/scope_guard.h +2 -0
- package/libcxx/include/__utility/try_key_extraction.h +114 -0
- package/libcxx/include/__vector/vector.h +187 -160
- package/libcxx/include/__vector/vector_bool.h +76 -83
- package/libcxx/include/any +118 -155
- package/libcxx/include/array +88 -56
- package/libcxx/include/atomic +2 -0
- package/libcxx/include/barrier +20 -24
- package/libcxx/include/bitset +49 -30
- package/libcxx/include/ccomplex +3 -11
- package/libcxx/include/chrono +47 -0
- package/libcxx/include/ciso646 +3 -6
- package/libcxx/include/complex +77 -65
- package/libcxx/include/complex.h +10 -10
- package/libcxx/include/condition_variable +3 -3
- package/libcxx/include/cstdalign +3 -10
- package/libcxx/include/cstdbool +3 -10
- package/libcxx/include/ctgmath +2 -11
- package/libcxx/include/ctype.h +24 -24
- package/libcxx/include/cwchar +2 -2
- package/libcxx/include/deque +109 -225
- package/libcxx/include/errno.h +269 -269
- package/libcxx/include/exception +4 -1
- package/libcxx/include/ext/hash_map +7 -48
- package/libcxx/include/ext/hash_set +2 -8
- package/libcxx/include/fenv.h +43 -43
- package/libcxx/include/flat_map +663 -11
- package/libcxx/include/flat_set +543 -8
- package/libcxx/include/float.h +16 -16
- package/libcxx/include/forward_list +33 -53
- package/libcxx/include/fstream +57 -42
- package/libcxx/include/future +41 -51
- package/libcxx/include/initializer_list +9 -3
- package/libcxx/include/inttypes.h +16 -16
- package/libcxx/include/ios +28 -28
- package/libcxx/include/istream +19 -13
- package/libcxx/include/iterator +10 -0
- package/libcxx/include/latch +7 -5
- package/libcxx/include/limits +4 -4
- package/libcxx/include/list +61 -79
- package/libcxx/include/map +386 -274
- package/libcxx/include/math.h +19 -0
- package/libcxx/include/mdspan +1 -5
- package/libcxx/include/mutex +29 -19
- package/libcxx/include/optional +644 -149
- package/libcxx/include/print +9 -5
- package/libcxx/include/queue +39 -37
- package/libcxx/include/ranges +48 -0
- package/libcxx/include/regex +33 -31
- package/libcxx/include/scoped_allocator +16 -11
- package/libcxx/include/semaphore +15 -18
- package/libcxx/include/set +220 -192
- package/libcxx/include/shared_mutex +3 -8
- package/libcxx/include/span +53 -37
- package/libcxx/include/sstream +34 -28
- package/libcxx/include/stack +13 -15
- package/libcxx/include/stddef.h +10 -10
- package/libcxx/include/stdexcept +2 -2
- package/libcxx/include/stdio.h +20 -21
- package/libcxx/include/streambuf +59 -19
- package/libcxx/include/string +574 -573
- package/libcxx/include/string_view +113 -89
- package/libcxx/include/strstream +10 -10
- package/libcxx/include/syncstream +4 -4
- package/libcxx/include/tgmath.h +12 -12
- package/libcxx/include/tuple +242 -212
- package/libcxx/include/type_traits +8 -2
- package/libcxx/include/typeindex +5 -3
- package/libcxx/include/typeinfo +92 -89
- package/libcxx/include/unordered_map +179 -304
- package/libcxx/include/unordered_set +168 -195
- package/libcxx/include/utility +12 -0
- package/libcxx/include/valarray +106 -161
- package/libcxx/include/variant +25 -33
- package/libcxx/include/version +41 -24
- package/libcxx/include/wctype.h +29 -29
- package/libcxx/libc/hdr/errno_macros.h +3 -1
- package/libcxx/libc/hdr/stdint_proxy.h +18 -0
- package/libcxx/libc/hdr/types/wchar_t.h +23 -0
- package/libcxx/libc/hdr/wchar_overlay.h +69 -0
- package/libcxx/libc/include/llvm-libc-macros/cfloat128-macros.h +41 -0
- package/libcxx/libc/include/llvm-libc-macros/cfloat16-macros.h +20 -0
- package/libcxx/libc/include/llvm-libc-macros/wchar-macros.h +18 -0
- package/libcxx/libc/include/llvm-libc-types/cfloat128.h +11 -28
- package/libcxx/libc/include/llvm-libc-types/cfloat16.h +4 -7
- package/libcxx/libc/include/llvm-libc-types/wint_t.h +14 -0
- package/libcxx/libc/shared/libc_common.h +5 -0
- package/libcxx/libc/src/__support/CPP/bit.h +50 -12
- package/libcxx/libc/src/__support/CPP/type_traits/is_complex.h +7 -0
- package/libcxx/libc/src/__support/CPP/type_traits/is_destructible.h +2 -1
- package/libcxx/libc/src/__support/CPP/type_traits/is_unsigned.h +6 -0
- package/libcxx/libc/src/__support/CPP/utility/integer_sequence.h +10 -0
- package/libcxx/libc/src/__support/FPUtil/FPBits.h +6 -7
- package/libcxx/libc/src/__support/FPUtil/rounding_mode.h +50 -4
- package/libcxx/libc/src/__support/big_int.h +14 -14
- package/libcxx/libc/src/__support/common.h +3 -2
- package/libcxx/libc/src/__support/ctype_utils.h +19 -12
- package/libcxx/libc/src/__support/detailed_powers_of_ten.h +1 -2
- package/libcxx/libc/src/__support/high_precision_decimal.h +33 -14
- package/libcxx/libc/src/__support/libc_assert.h +2 -0
- package/libcxx/libc/src/__support/macros/attributes.h +44 -1
- package/libcxx/libc/src/__support/macros/config.h +23 -0
- package/libcxx/libc/src/__support/macros/null_check.h +1 -2
- package/libcxx/libc/src/__support/macros/optimization.h +3 -0
- package/libcxx/libc/src/__support/macros/properties/architectures.h +5 -1
- package/libcxx/libc/src/__support/macros/properties/compiler.h +8 -3
- package/libcxx/libc/src/__support/macros/properties/cpu_features.h +17 -1
- package/libcxx/libc/src/__support/macros/properties/types.h +2 -3
- package/libcxx/libc/src/__support/macros/sanitizer.h +0 -10
- package/libcxx/libc/src/__support/math_extras.h +20 -4
- package/libcxx/libc/src/__support/str_to_float.h +98 -125
- package/libcxx/libc/src/__support/str_to_integer.h +39 -27
- package/libcxx/libc/src/__support/wctype_utils.h +588 -0
- package/libcxx/src/any.cpp +4 -0
- package/libcxx/src/atomic.cpp +365 -80
- package/libcxx/src/barrier.cpp +4 -3
- package/libcxx/src/charconv.cpp +6 -3
- package/libcxx/src/condition_variable_destructor.cpp +1 -1
- package/libcxx/src/error_category.cpp +3 -1
- package/libcxx/src/exception.cpp +2 -10
- package/libcxx/src/experimental/time_zone.cpp +1 -1
- package/libcxx/src/experimental/tzdb.cpp +4 -1
- package/libcxx/src/filesystem/error.h +4 -22
- package/libcxx/src/filesystem/format_string.h +9 -18
- package/libcxx/src/filesystem/int128_builtins.cpp +2 -0
- package/libcxx/src/filesystem/operations.cpp +2 -9
- package/libcxx/src/filesystem/path.cpp +3 -1
- package/libcxx/src/include/aligned_alloc.h +65 -0
- package/libcxx/src/include/config_elast.h +1 -1
- package/libcxx/src/include/from_chars_floating_point.h +11 -7
- package/libcxx/src/include/overridable_function.h +8 -10
- package/libcxx/src/iostream.cpp +56 -37
- package/libcxx/src/locale.cpp +213 -196
- package/libcxx/src/memory.cpp +12 -14
- package/libcxx/src/mutex_destructor.cpp +1 -1
- package/libcxx/src/new.cpp +5 -5
- package/libcxx/src/optional.cpp +4 -0
- package/libcxx/src/print.cpp +9 -1
- package/libcxx/src/random.cpp +0 -26
- package/libcxx/src/string.cpp +10 -25
- package/libcxx/src/support/runtime/exception_fallback.ipp +2 -0
- package/libcxx/src/support/runtime/exception_glibcxx.ipp +3 -0
- package/libcxx/src/support/runtime/exception_libcxxabi.ipp +6 -2
- package/libcxx/src/support/runtime/exception_libcxxrt.ipp +2 -0
- package/libcxx/src/support/runtime/exception_msvc.ipp +2 -0
- package/libcxx/src/support/runtime/exception_pointer_cxxabi.ipp +9 -10
- package/libcxx/src/support/runtime/exception_pointer_glibcxx.ipp +2 -0
- package/libcxx/src/support/runtime/exception_pointer_msvc.ipp +1 -0
- package/libcxx/src/support/runtime/exception_pointer_unimplemented.ipp +1 -0
- package/libcxx/src/support/win32/locale_win32.cpp +1 -1
- package/libcxx/src/system_error.cpp +2 -0
- package/libcxx/src/thread.cpp +1 -3
- package/libcxx/src/valarray.cpp +1 -2
- package/libcxx/src/vector.cpp +2 -2
- package/libcxxabi/include/__cxxabi_config.h +42 -23
- package/libcxxabi/src/cxa_exception.cpp +4 -2
- package/libcxxabi/src/cxa_exception.h +16 -14
- package/libcxxabi/src/cxa_personality.cpp +126 -9
- package/libcxxabi/src/cxa_thread_atexit.cpp +2 -1
- package/libcxxabi/src/demangle/DemangleConfig.h +4 -0
- package/libcxxabi/src/demangle/ItaniumDemangle.h +9 -6
- package/libcxxabi/src/demangle/Utility.h +21 -7
- package/libcxxabi/src/fallback_malloc.cpp +1 -1
- package/libcxxabi/src/private_typeinfo.cpp +6 -0
- package/libcxxabi/src/stdlib_new_delete.cpp +5 -5
- package/libtsan/LICENSE.TXT +311 -0
- package/libtsan/builtins/assembly.h +41 -8
- package/libtsan/interception/interception_win.cpp +4 -0
- package/libtsan/sanitizer_common/sanitizer_allocator_primary32.h +1 -0
- package/libtsan/sanitizer_common/sanitizer_allocator_primary64.h +18 -0
- package/libtsan/sanitizer_common/sanitizer_common.h +15 -2
- package/libtsan/sanitizer_common/sanitizer_common_interceptors.inc +30 -4
- package/libtsan/sanitizer_common/sanitizer_common_interceptors_ioctl.inc +4 -0
- package/libtsan/sanitizer_common/sanitizer_common_interceptors_vfork_aarch64.inc.S +2 -1
- package/libtsan/sanitizer_common/sanitizer_common_interceptors_vfork_i386.inc.S +2 -0
- package/libtsan/sanitizer_common/sanitizer_common_interceptors_vfork_x86_64.inc.S +2 -0
- package/libtsan/sanitizer_common/sanitizer_common_syscalls.inc +18 -0
- package/libtsan/sanitizer_common/sanitizer_file.cpp +40 -12
- package/libtsan/sanitizer_common/sanitizer_file.h +3 -0
- package/libtsan/sanitizer_common/sanitizer_flags.inc +7 -0
- package/libtsan/sanitizer_common/sanitizer_fuchsia.cpp +30 -3
- package/libtsan/sanitizer_common/sanitizer_haiku.cpp +2 -2
- package/libtsan/sanitizer_common/sanitizer_internal_defs.h +1 -1
- package/libtsan/sanitizer_common/sanitizer_libc.cpp +8 -0
- package/libtsan/sanitizer_common/sanitizer_libc.h +1 -0
- package/libtsan/sanitizer_common/sanitizer_linux.cpp +15 -7
- package/libtsan/sanitizer_common/sanitizer_linux.h +3 -3
- package/libtsan/sanitizer_common/sanitizer_linux_libcdep.cpp +1 -0
- package/libtsan/sanitizer_common/sanitizer_mac.cpp +255 -104
- package/libtsan/sanitizer_common/sanitizer_mac.h +5 -0
- package/libtsan/sanitizer_common/sanitizer_netbsd.cpp +2 -2
- package/libtsan/sanitizer_common/sanitizer_platform.h +27 -1
- package/libtsan/sanitizer_common/sanitizer_platform_interceptors.h +5 -4
- package/libtsan/sanitizer_common/sanitizer_platform_limits_posix.cpp +15 -17
- package/libtsan/sanitizer_common/sanitizer_platform_limits_posix.h +32 -6
- package/libtsan/sanitizer_common/sanitizer_posix.cpp +3 -12
- package/libtsan/sanitizer_common/sanitizer_posix.h +2 -1
- package/libtsan/sanitizer_common/sanitizer_posix_libcdep.cpp +19 -0
- package/libtsan/sanitizer_common/sanitizer_procmaps_mac.cpp +102 -37
- package/libtsan/sanitizer_common/sanitizer_redefine_builtins.h +1 -1
- package/libtsan/sanitizer_common/sanitizer_signal_interceptors.inc +40 -2
- package/libtsan/sanitizer_common/sanitizer_stoptheworld.h +1 -1
- package/libtsan/sanitizer_common/sanitizer_stoptheworld_linux_libcdep.cpp +83 -12
- package/libtsan/sanitizer_common/sanitizer_stoptheworld_mac.cpp +3 -3
- package/libtsan/sanitizer_common/sanitizer_stoptheworld_netbsd_libcdep.cpp +7 -7
- package/libtsan/sanitizer_common/sanitizer_stoptheworld_win.cpp +2 -2
- package/libtsan/sanitizer_common/sanitizer_symbolizer_internal.h +5 -1
- package/libtsan/sanitizer_common/sanitizer_symbolizer_libcdep.cpp +11 -1
- package/libtsan/sanitizer_common/sanitizer_symbolizer_mac.cpp +86 -29
- package/libtsan/sanitizer_common/sanitizer_symbolizer_posix_libcdep.cpp +27 -16
- package/libtsan/sanitizer_common/sanitizer_thread_registry.cpp +5 -4
- package/libtsan/sanitizer_common/sanitizer_thread_registry.h +4 -4
- package/libtsan/sanitizer_common/sanitizer_win.cpp +1 -3
- package/libtsan/tsan_debugging.cpp +2 -2
- package/libtsan/tsan_flags.cpp +37 -0
- package/libtsan/tsan_flags.h +8 -0
- package/libtsan/tsan_flags.inc +12 -0
- package/libtsan/tsan_interceptors.h +9 -1
- package/libtsan/tsan_interceptors_mac.cpp +19 -0
- package/libtsan/tsan_interceptors_posix.cpp +78 -32
- package/libtsan/tsan_interface.h +3 -3
- package/libtsan/tsan_interface_ann.cpp +23 -9
- package/libtsan/tsan_mman.cpp +18 -4
- package/libtsan/tsan_platform.h +44 -7
- package/libtsan/tsan_platform_linux.cpp +42 -14
- package/libtsan/tsan_platform_mac.cpp +16 -3
- package/libtsan/tsan_report.h +14 -1
- package/libtsan/tsan_rtl.cpp +14 -0
- package/libtsan/tsan_rtl.h +7 -2
- package/libtsan/tsan_rtl_aarch64.S +3 -5
- package/libtsan/tsan_rtl_access.cpp +8 -3
- package/libtsan/tsan_rtl_amd64.S +2 -0
- package/libtsan/tsan_rtl_mutex.cpp +94 -49
- package/libtsan/tsan_rtl_report.cpp +132 -65
- package/libtsan/tsan_rtl_thread.cpp +31 -9
- package/libtsan/tsan_symbolize.cpp +1 -1
- package/libtsan/tsan_symbolize.h +1 -1
- package/libtsan/tsan_trace.h +1 -1
- package/libunwind/include/__libunwind_config.h +11 -2
- package/libunwind/include/libunwind.h +117 -11
- package/libunwind/include/unwind_arm_ehabi.h +4 -1
- package/libunwind/src/AddressSpace.hpp +42 -20
- package/libunwind/src/CompactUnwinder.hpp +16 -5
- package/libunwind/src/DwarfInstructions.hpp +24 -13
- package/libunwind/src/DwarfParser.hpp +62 -23
- package/libunwind/src/EHHeaderParser.hpp +7 -4
- package/libunwind/src/Registers.hpp +226 -22
- package/libunwind/src/Unwind-seh.cpp +6 -7
- package/libunwind/src/Unwind-wasm.c +7 -7
- package/libunwind/src/UnwindCursor.hpp +167 -49
- package/libunwind/src/UnwindLevel1.c +46 -17
- package/libunwind/src/UnwindRegistersRestore.S +46 -5
- package/libunwind/src/UnwindRegistersSave.S +86 -2
- package/libunwind/src/assembly.h +5 -1
- package/libunwind/src/config.h +9 -0
- package/libunwind/src/gcc_personality_v0.c +79 -6
- package/libunwind/src/libunwind.cpp +104 -4
- package/libunwind/src/libunwind_ext.h +7 -1
- package/libunwind/src/shadow_stack_unwind.h +2 -2
- package/lldb/pretty_printers.py +948 -0
- package/package.json +1 -1
- package/std/Build/Cache/Path.zig +1 -1
- package/std/Build/Cache.zig +6 -6
- package/std/Build/Step/Compile.zig +18 -20
- package/std/Build/Step/ConfigHeader.zig +1 -1
- package/std/Build/Step/Run.zig +15 -8
- package/std/Build/Step.zig +3 -7
- package/std/Build/Watch/FsEvents.zig +1 -1
- package/std/Build/WebServer.zig +2 -2
- package/std/Build/abi.zig +1 -1
- package/std/Build.zig +0 -3
- package/std/Io/Dir.zig +9 -4
- package/std/Io/Dispatch.zig +8 -18
- package/std/Io/File/Writer.zig +8 -6
- package/std/Io/File.zig +0 -9
- package/std/Io/Kqueue.zig +3 -3
- package/std/Io/Reader.zig +8 -14
- package/std/Io/Semaphore.zig +112 -17
- package/std/Io/Terminal.zig +1 -1
- package/std/Io/Threaded.zig +183 -46
- package/std/Io/Uring.zig +18 -20
- package/std/Io/Writer.zig +10 -7
- package/std/Io/net/HostName.zig +11 -6
- package/std/Io/net.zig +11 -11
- package/std/Io.zig +104 -38
- package/std/Random/ChaCha.zig +2 -2
- package/std/Random/benchmark.zig +2 -2
- package/std/Random.zig +6 -6
- package/std/SemanticVersion.zig +1 -1
- package/std/Target/Query.zig +2 -2
- package/std/Target/aarch64.zig +620 -77
- package/std/Target/amdgcn.zig +421 -21
- package/std/Target/arm.zig +40 -6
- package/std/Target/bpf.zig +6 -0
- package/std/Target/hexagon.zig +41 -6
- package/std/Target/loongarch.zig +18 -0
- package/std/Target/mips.zig +6 -0
- package/std/Target/nvptx.zig +58 -35
- package/std/Target/powerpc.zig +27 -19
- package/std/Target/riscv.zig +415 -177
- package/std/Target/sparc.zig +17 -0
- package/std/Target/wasm.zig +7 -0
- package/std/Target/x86.zig +200 -31
- package/std/Target/xtensa.zig +65 -0
- package/std/Target.zig +67 -14
- package/std/Thread.zig +5 -2
- package/std/array_hash_map.zig +103 -57
- package/std/array_list.zig +10 -31
- package/std/base64.zig +5 -5
- package/std/bit_set.zig +86 -69
- package/std/c/haiku.zig +3 -0
- package/std/c/serenity.zig +1 -6
- package/std/c.zig +123 -32
- package/std/compress/flate/Decompress.zig +3 -4
- package/std/compress/zstd/Decompress.zig +7 -9
- package/std/crypto/25519/curve25519.zig +2 -2
- package/std/crypto/25519/edwards25519.zig +3 -3
- package/std/crypto/25519/ristretto255.zig +2 -2
- package/std/crypto/25519/scalar.zig +6 -6
- package/std/crypto/25519/x25519.zig +1 -1
- package/std/crypto/Certificate.zig +14 -2
- package/std/crypto/Sha1.zig +1 -1
- package/std/crypto/aegis.zig +45 -39
- package/std/crypto/aes_ccm.zig +22 -22
- package/std/crypto/aes_gcm.zig +10 -12
- package/std/crypto/aes_ocb.zig +9 -9
- package/std/crypto/argon2.zig +15 -15
- package/std/crypto/ascon.zig +75 -33
- package/std/crypto/bcrypt.zig +20 -10
- package/std/crypto/benchmark.zig +7 -7
- package/std/crypto/blake2.zig +100 -64
- package/std/crypto/cbc_mac.zig +1 -1
- package/std/crypto/chacha20.zig +10 -10
- package/std/crypto/cmac.zig +3 -3
- package/std/crypto/codecs/asn1/Oid.zig +12 -1
- package/std/crypto/codecs/asn1/der/Encoder.zig +1 -1
- package/std/crypto/codecs/asn1.zig +1 -1
- package/std/crypto/codecs/base64_hex_ct.zig +3 -5
- package/std/crypto/ecdsa.zig +9 -9
- package/std/crypto/ff.zig +4 -5
- package/std/crypto/ghash_polyval.zig +4 -4
- package/std/crypto/hkdf.zig +1 -1
- package/std/crypto/isap.zig +3 -3
- package/std/crypto/kangarootwelve.zig +1 -1
- package/std/crypto/keccak_p.zig +8 -8
- package/std/crypto/md5.zig +1 -1
- package/std/crypto/ml_dsa.zig +39 -39
- package/std/crypto/ml_kem.zig +12 -34
- package/std/crypto/modes.zig +2 -2
- package/std/crypto/pbkdf2.zig +1 -1
- package/std/crypto/pcurves/common.zig +4 -5
- package/std/crypto/pcurves/p256/scalar.zig +3 -3
- package/std/crypto/pcurves/p384/scalar.zig +2 -2
- package/std/crypto/pcurves/secp256k1/scalar.zig +3 -3
- package/std/crypto/pcurves/tests/p256.zig +5 -5
- package/std/crypto/pcurves/tests/p384.zig +5 -5
- package/std/crypto/pcurves/tests/secp256k1.zig +3 -3
- package/std/crypto/salsa20.zig +8 -8
- package/std/crypto/sha2.zig +2 -2
- package/std/crypto/sha3.zig +2 -2
- package/std/crypto/siphash.zig +1 -1
- package/std/crypto/timing_safe.zig +10 -9
- package/std/crypto/tls/Client.zig +89 -13
- package/std/crypto/tls.zig +1 -1
- package/std/crypto.zig +4 -3
- package/std/debug/Dwarf.zig +15 -12
- package/std/debug/Pdb.zig +25 -17
- package/std/debug.zig +14 -8
- package/std/deque.zig +1 -1
- package/std/elf.zig +1 -1
- package/std/enums.zig +8 -8
- package/std/fmt/parse_float/decimal.zig +1 -1
- package/std/fmt/parse_float.zig +1 -1
- package/std/fmt.zig +14 -10
- package/std/fs/path.zig +7 -5
- package/std/hash/Adler32.zig +3 -3
- package/std/hash/benchmark.zig +2 -2
- package/std/hash/wyhash.zig +2 -2
- package/std/hash/xxhash.zig +0 -6
- package/std/hash_map.zig +20 -1
- package/std/heap/BufferFirstAllocator.zig +165 -0
- package/std/heap/debug_allocator.zig +2 -2
- package/std/heap/memory_pool.zig +34 -197
- package/std/heap.zig +2 -133
- package/std/http/Client.zig +21 -24
- package/std/http.zig +4 -5
- package/std/json/Scanner.zig +2 -2
- package/std/json/static.zig +2 -2
- package/std/{builtin.zig → lang.zig} +5 -1
- package/std/leb128.zig +2 -2
- package/std/math/big/int.zig +5 -5
- package/std/math/big.zig +4 -4
- package/std/math/copysign.zig +1 -1
- package/std/math/float.zig +62 -0
- package/std/math/frexp.zig +4 -4
- package/std/math/ilogb.zig +1 -1
- package/std/math/isfinite.zig +1 -1
- package/std/math/isinf.zig +1 -1
- package/std/math/isnan.zig +1 -2
- package/std/math/isnormal.zig +2 -2
- package/std/math/iszero.zig +2 -2
- package/std/math/ldexp.zig +2 -2
- package/std/math/log10.zig +0 -2
- package/std/math/modf.zig +1 -2
- package/std/math/nextafter.zig +3 -4
- package/std/math/pow.zig +1 -1
- package/std/math/powi.zig +2 -3
- package/std/math/signbit.zig +0 -1
- package/std/math.zig +21 -26
- package/std/mem/Allocator.zig +0 -6
- package/std/mem.zig +31 -31
- package/std/meta/trailer_flags.zig +1 -1
- package/std/meta.zig +4 -36
- package/std/multi_array_list.zig +24 -0
- package/std/os/emscripten.zig +7 -6
- package/std/os/linux/IoUring.zig +2 -0
- package/std/os/linux/aarch64.zig +41 -12
- package/std/os/linux/arc.zig +41 -12
- package/std/os/linux/arm.zig +41 -12
- package/std/os/linux/bpf.zig +6 -0
- package/std/os/linux/hexagon.zig +33 -11
- package/std/os/linux/ioctl.zig +2 -2
- package/std/os/linux/loongarch32.zig +41 -13
- package/std/os/linux/loongarch64.zig +41 -12
- package/std/os/linux/m68k.zig +41 -13
- package/std/os/linux/mips.zig +67 -36
- package/std/os/linux/mips64.zig +60 -29
- package/std/os/linux/mipsn32.zig +60 -29
- package/std/os/linux/or1k.zig +41 -12
- package/std/os/linux/powerpc.zig +41 -12
- package/std/os/linux/powerpc64.zig +41 -12
- package/std/os/linux/riscv32.zig +41 -12
- package/std/os/linux/riscv64.zig +41 -12
- package/std/os/linux/s390x.zig +44 -7
- package/std/os/linux/sparc64.zig +83 -52
- package/std/os/linux/syscalls.zig +26 -1
- package/std/os/linux/thumb.zig +52 -36
- package/std/os/linux/x32.zig +41 -12
- package/std/os/linux/x86.zig +44 -15
- package/std/os/linux/x86_64.zig +41 -12
- package/std/os/linux.zig +416 -450
- package/std/os/plan9.zig +1 -1
- package/std/os/uefi/hii.zig +1 -1
- package/std/os/uefi/tables/boot_services.zig +9 -8
- package/std/os/uefi/tables/runtime_services.zig +1 -1
- package/std/os/windows.zig +130 -1
- package/std/os.zig +41 -0
- package/std/posix.zig +1 -1
- package/std/process/Environ.zig +1 -1
- package/std/process.zig +5 -4
- package/std/simd.zig +4 -21
- package/std/sort.zig +3 -3
- package/std/start.zig +17 -4
- package/std/std.zig +8 -1
- package/std/tar/Writer.zig +39 -33
- package/std/tar.zig +8 -4
- package/std/testing.zig +2 -2
- package/std/unicode.zig +13 -8
- package/std/zig/Ast/Render.zig +6 -30
- package/std/zig/Ast.zig +12 -37
- package/std/zig/AstGen.zig +175 -332
- package/std/zig/AstRlAnnotate.zig +1 -22
- package/std/zig/AstSmith.zig +5 -11
- package/std/zig/BuiltinFn.zig +0 -32
- package/std/zig/ErrorBundle.zig +6 -2
- package/std/zig/LibCDirs.zig +15 -6
- package/std/zig/LibCInstallation.zig +34 -12
- package/std/zig/Parse.zig +11 -76
- package/std/zig/TokenSmith.zig +0 -6
- package/std/zig/WindowsSdk.zig +18 -18
- package/std/zig/Zir.zig +65 -132
- package/std/zig/ZonGen.zig +19 -27
- package/std/zig/llvm/Builder.zig +39 -33
- package/std/zig/llvm/bitcode_writer.zig +3 -3
- package/std/zig/llvm/ir.zig +8 -8
- package/std/zig/system/arm.zig +56 -2
- package/std/zig/system/windows.zig +34 -1
- package/std/zig/system/x86.zig +60 -16
- package/std/zig/system.zig +0 -10
- package/std/zig/target.zig +1 -4
- package/std/zig/tokenizer.zig +4 -43
- package/std/zig.zig +3 -14
- package/std/zip.zig +5 -5
- package/std/zon/parse.zig +1 -1
- package/zig.h +340 -1
- package/compiler_rt/long_double.zig +0 -37
- package/include/amxbf16transposeintrin.h +0 -94
- package/include/amxcomplextransposeintrin.h +0 -303
- package/include/amxfp16transposeintrin.h +0 -94
- package/include/amxmovrstransposeintrin.h +0 -200
- package/include/amxtf32transposeintrin.h +0 -105
- package/include/amxtransposeintrin.h +0 -248
- package/libc/include/hexagon-linux-any/asm/signal.h +0 -29
- package/libc/include/s390x-linux-any/asm/tape390.h +0 -103
- package/libc/mingw/math/lrintl.c +0 -18
- package/libc/mingw/math/rintl.c +0 -16
- package/libc/mingw/winpthreads/spinlock.c +0 -82
- package/libc/musl/src/linux/tee.c +0 -8
- package/libc/musl/src/math/i386/lrintl.c +0 -8
- package/libc/musl/src/math/i386/rintl.c +0 -7
- package/libc/musl/src/math/lrintl.c +0 -36
- package/libc/musl/src/math/rintl.c +0 -29
- package/libc/musl/src/math/s390x/rintl.c +0 -15
- package/libc/musl/src/math/x32/lrintl.s +0 -7
- package/libc/musl/src/math/x32/rintl.s +0 -6
- package/libc/musl/src/math/x86_64/lrintl.c +0 -8
- package/libc/musl/src/math/x86_64/rintl.c +0 -7
- package/libc/musl/src/string/strdup.c +0 -10
- package/libc/musl/src/string/strndup.c +0 -12
- package/libc/musl/src/string/wcsdup.c +0 -10
- package/libc/musl/src/thread/pthread_spin_destroy.c +0 -6
- package/libc/musl/src/thread/pthread_spin_init.c +0 -6
- package/libc/musl/src/thread/pthread_spin_lock.c +0 -8
- package/libc/musl/src/thread/pthread_spin_trylock.c +0 -7
- package/libc/musl/src/thread/pthread_spin_unlock.c +0 -7
- package/libc/musl/src/unistd/dup2.c +0 -20
- package/libc/musl/src/unistd/dup3.c +0 -26
- package/libc/wasi/thread-stub/pthread_spin_lock.c +0 -8
- package/libc/wasi/thread-stub/pthread_spin_trylock.c +0 -8
- package/libc/wasi/thread-stub/pthread_spin_unlock.c +0 -7
- package/libtsan/sanitizer_common/sanitizer_coverage_interface.inc +0 -43
- package/std/Build/Step/CheckObject.zig +0 -2764
- /package/std/{builtin → lang}/assembly.zig +0 -0
|
@@ -17,12 +17,18 @@
|
|
|
17
17
|
/* Define the default attributes for the functions in this file. */
|
|
18
18
|
#define __DEFAULT_FN_ATTRS128 \
|
|
19
19
|
__attribute__((__always_inline__, __nodebug__, \
|
|
20
|
-
__target__("avx512vl,avx512bw
|
|
21
|
-
__min_vector_width__(128)))
|
|
20
|
+
__target__("avx512vl,avx512bw"), __min_vector_width__(128)))
|
|
22
21
|
#define __DEFAULT_FN_ATTRS256 \
|
|
23
22
|
__attribute__((__always_inline__, __nodebug__, \
|
|
24
|
-
__target__("avx512vl,avx512bw
|
|
25
|
-
|
|
23
|
+
__target__("avx512vl,avx512bw"), __min_vector_width__(256)))
|
|
24
|
+
|
|
25
|
+
#if defined(__cplusplus) && (__cplusplus >= 201103L)
|
|
26
|
+
#define __DEFAULT_FN_ATTRS128_CONSTEXPR __DEFAULT_FN_ATTRS128 constexpr
|
|
27
|
+
#define __DEFAULT_FN_ATTRS256_CONSTEXPR __DEFAULT_FN_ATTRS256 constexpr
|
|
28
|
+
#else
|
|
29
|
+
#define __DEFAULT_FN_ATTRS128_CONSTEXPR __DEFAULT_FN_ATTRS128
|
|
30
|
+
#define __DEFAULT_FN_ATTRS256_CONSTEXPR __DEFAULT_FN_ATTRS256
|
|
31
|
+
#endif
|
|
26
32
|
|
|
27
33
|
/* Integer compare */
|
|
28
34
|
|
|
@@ -306,250 +312,238 @@
|
|
|
306
312
|
#define _mm256_mask_cmpneq_epu16_mask(k, A, B) \
|
|
307
313
|
_mm256_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_NE)
|
|
308
314
|
|
|
309
|
-
static __inline__ __m256i
|
|
310
|
-
_mm256_mask_add_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B){
|
|
315
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
316
|
+
_mm256_mask_add_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {
|
|
311
317
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
312
318
|
(__v32qi)_mm256_add_epi8(__A, __B),
|
|
313
319
|
(__v32qi)__W);
|
|
314
320
|
}
|
|
315
321
|
|
|
316
|
-
static __inline__ __m256i
|
|
322
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
317
323
|
_mm256_maskz_add_epi8(__mmask32 __U, __m256i __A, __m256i __B) {
|
|
318
324
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
319
325
|
(__v32qi)_mm256_add_epi8(__A, __B),
|
|
320
326
|
(__v32qi)_mm256_setzero_si256());
|
|
321
327
|
}
|
|
322
328
|
|
|
323
|
-
static __inline__ __m256i
|
|
329
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
324
330
|
_mm256_mask_add_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
325
331
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
326
332
|
(__v16hi)_mm256_add_epi16(__A, __B),
|
|
327
333
|
(__v16hi)__W);
|
|
328
334
|
}
|
|
329
335
|
|
|
330
|
-
static __inline__ __m256i
|
|
336
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
331
337
|
_mm256_maskz_add_epi16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
332
338
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
333
339
|
(__v16hi)_mm256_add_epi16(__A, __B),
|
|
334
340
|
(__v16hi)_mm256_setzero_si256());
|
|
335
341
|
}
|
|
336
342
|
|
|
337
|
-
static __inline__ __m256i
|
|
343
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
338
344
|
_mm256_mask_sub_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {
|
|
339
345
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
340
346
|
(__v32qi)_mm256_sub_epi8(__A, __B),
|
|
341
347
|
(__v32qi)__W);
|
|
342
348
|
}
|
|
343
349
|
|
|
344
|
-
static __inline__ __m256i
|
|
350
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
345
351
|
_mm256_maskz_sub_epi8(__mmask32 __U, __m256i __A, __m256i __B) {
|
|
346
352
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
347
353
|
(__v32qi)_mm256_sub_epi8(__A, __B),
|
|
348
354
|
(__v32qi)_mm256_setzero_si256());
|
|
349
355
|
}
|
|
350
356
|
|
|
351
|
-
static __inline__ __m256i
|
|
357
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
352
358
|
_mm256_mask_sub_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
353
359
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
354
360
|
(__v16hi)_mm256_sub_epi16(__A, __B),
|
|
355
361
|
(__v16hi)__W);
|
|
356
362
|
}
|
|
357
363
|
|
|
358
|
-
static __inline__ __m256i
|
|
364
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
359
365
|
_mm256_maskz_sub_epi16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
360
366
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
361
367
|
(__v16hi)_mm256_sub_epi16(__A, __B),
|
|
362
368
|
(__v16hi)_mm256_setzero_si256());
|
|
363
369
|
}
|
|
364
370
|
|
|
365
|
-
static __inline__ __m128i
|
|
371
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
366
372
|
_mm_mask_add_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {
|
|
367
373
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
368
374
|
(__v16qi)_mm_add_epi8(__A, __B),
|
|
369
375
|
(__v16qi)__W);
|
|
370
376
|
}
|
|
371
377
|
|
|
372
|
-
static __inline__ __m128i
|
|
378
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
373
379
|
_mm_maskz_add_epi8(__mmask16 __U, __m128i __A, __m128i __B) {
|
|
374
380
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
375
381
|
(__v16qi)_mm_add_epi8(__A, __B),
|
|
376
382
|
(__v16qi)_mm_setzero_si128());
|
|
377
383
|
}
|
|
378
384
|
|
|
379
|
-
static __inline__ __m128i
|
|
385
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
380
386
|
_mm_mask_add_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
381
387
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
382
388
|
(__v8hi)_mm_add_epi16(__A, __B),
|
|
383
389
|
(__v8hi)__W);
|
|
384
390
|
}
|
|
385
391
|
|
|
386
|
-
static __inline__ __m128i
|
|
392
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
387
393
|
_mm_maskz_add_epi16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
388
394
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
389
395
|
(__v8hi)_mm_add_epi16(__A, __B),
|
|
390
396
|
(__v8hi)_mm_setzero_si128());
|
|
391
397
|
}
|
|
392
398
|
|
|
393
|
-
static __inline__ __m128i
|
|
399
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
394
400
|
_mm_mask_sub_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {
|
|
395
401
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
396
402
|
(__v16qi)_mm_sub_epi8(__A, __B),
|
|
397
403
|
(__v16qi)__W);
|
|
398
404
|
}
|
|
399
405
|
|
|
400
|
-
static __inline__ __m128i
|
|
406
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
401
407
|
_mm_maskz_sub_epi8(__mmask16 __U, __m128i __A, __m128i __B) {
|
|
402
408
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
403
409
|
(__v16qi)_mm_sub_epi8(__A, __B),
|
|
404
410
|
(__v16qi)_mm_setzero_si128());
|
|
405
411
|
}
|
|
406
412
|
|
|
407
|
-
static __inline__ __m128i
|
|
413
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
408
414
|
_mm_mask_sub_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
409
415
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
410
416
|
(__v8hi)_mm_sub_epi16(__A, __B),
|
|
411
417
|
(__v8hi)__W);
|
|
412
418
|
}
|
|
413
419
|
|
|
414
|
-
static __inline__ __m128i
|
|
420
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
415
421
|
_mm_maskz_sub_epi16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
416
422
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
417
423
|
(__v8hi)_mm_sub_epi16(__A, __B),
|
|
418
424
|
(__v8hi)_mm_setzero_si128());
|
|
419
425
|
}
|
|
420
426
|
|
|
421
|
-
static __inline__ __m256i
|
|
427
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
422
428
|
_mm256_mask_mullo_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
423
429
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
424
430
|
(__v16hi)_mm256_mullo_epi16(__A, __B),
|
|
425
431
|
(__v16hi)__W);
|
|
426
432
|
}
|
|
427
433
|
|
|
428
|
-
static __inline__ __m256i
|
|
434
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
429
435
|
_mm256_maskz_mullo_epi16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
430
436
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
431
437
|
(__v16hi)_mm256_mullo_epi16(__A, __B),
|
|
432
438
|
(__v16hi)_mm256_setzero_si256());
|
|
433
439
|
}
|
|
434
440
|
|
|
435
|
-
static __inline__ __m128i
|
|
441
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
436
442
|
_mm_mask_mullo_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
437
443
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
438
444
|
(__v8hi)_mm_mullo_epi16(__A, __B),
|
|
439
445
|
(__v8hi)__W);
|
|
440
446
|
}
|
|
441
447
|
|
|
442
|
-
static __inline__ __m128i
|
|
448
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
443
449
|
_mm_maskz_mullo_epi16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
444
450
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
445
451
|
(__v8hi)_mm_mullo_epi16(__A, __B),
|
|
446
452
|
(__v8hi)_mm_setzero_si128());
|
|
447
453
|
}
|
|
448
454
|
|
|
449
|
-
static __inline__ __m128i
|
|
450
|
-
_mm_mask_blend_epi8
|
|
451
|
-
{
|
|
455
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
456
|
+
_mm_mask_blend_epi8(__mmask16 __U, __m128i __A, __m128i __W) {
|
|
452
457
|
return (__m128i) __builtin_ia32_selectb_128 ((__mmask16) __U,
|
|
453
458
|
(__v16qi) __W,
|
|
454
459
|
(__v16qi) __A);
|
|
455
460
|
}
|
|
456
461
|
|
|
457
|
-
static __inline__ __m256i
|
|
458
|
-
_mm256_mask_blend_epi8
|
|
459
|
-
{
|
|
462
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
463
|
+
_mm256_mask_blend_epi8(__mmask32 __U, __m256i __A, __m256i __W) {
|
|
460
464
|
return (__m256i) __builtin_ia32_selectb_256 ((__mmask32) __U,
|
|
461
465
|
(__v32qi) __W,
|
|
462
466
|
(__v32qi) __A);
|
|
463
467
|
}
|
|
464
468
|
|
|
465
|
-
static __inline__ __m128i
|
|
466
|
-
_mm_mask_blend_epi16
|
|
467
|
-
{
|
|
469
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
470
|
+
_mm_mask_blend_epi16(__mmask8 __U, __m128i __A, __m128i __W) {
|
|
468
471
|
return (__m128i) __builtin_ia32_selectw_128 ((__mmask8) __U,
|
|
469
472
|
(__v8hi) __W,
|
|
470
473
|
(__v8hi) __A);
|
|
471
474
|
}
|
|
472
475
|
|
|
473
|
-
static __inline__ __m256i
|
|
474
|
-
_mm256_mask_blend_epi16
|
|
475
|
-
{
|
|
476
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
477
|
+
_mm256_mask_blend_epi16(__mmask16 __U, __m256i __A, __m256i __W) {
|
|
476
478
|
return (__m256i) __builtin_ia32_selectw_256 ((__mmask16) __U,
|
|
477
479
|
(__v16hi) __W,
|
|
478
480
|
(__v16hi) __A);
|
|
479
481
|
}
|
|
480
482
|
|
|
481
|
-
static __inline__ __m128i
|
|
482
|
-
_mm_mask_abs_epi8(__m128i __W, __mmask16 __U, __m128i __A)
|
|
483
|
-
{
|
|
483
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
484
|
+
_mm_mask_abs_epi8(__m128i __W, __mmask16 __U, __m128i __A) {
|
|
484
485
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
485
486
|
(__v16qi)_mm_abs_epi8(__A),
|
|
486
487
|
(__v16qi)__W);
|
|
487
488
|
}
|
|
488
489
|
|
|
489
|
-
static __inline__ __m128i
|
|
490
|
-
_mm_maskz_abs_epi8(__mmask16 __U, __m128i __A)
|
|
491
|
-
{
|
|
490
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
491
|
+
_mm_maskz_abs_epi8(__mmask16 __U, __m128i __A) {
|
|
492
492
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
493
493
|
(__v16qi)_mm_abs_epi8(__A),
|
|
494
494
|
(__v16qi)_mm_setzero_si128());
|
|
495
495
|
}
|
|
496
496
|
|
|
497
|
-
static __inline__ __m256i
|
|
498
|
-
_mm256_mask_abs_epi8(__m256i __W, __mmask32 __U, __m256i __A)
|
|
499
|
-
{
|
|
497
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
498
|
+
_mm256_mask_abs_epi8(__m256i __W, __mmask32 __U, __m256i __A) {
|
|
500
499
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
501
500
|
(__v32qi)_mm256_abs_epi8(__A),
|
|
502
501
|
(__v32qi)__W);
|
|
503
502
|
}
|
|
504
503
|
|
|
505
|
-
static __inline__ __m256i
|
|
506
|
-
_mm256_maskz_abs_epi8
|
|
507
|
-
{
|
|
504
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
505
|
+
_mm256_maskz_abs_epi8(__mmask32 __U, __m256i __A) {
|
|
508
506
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
509
507
|
(__v32qi)_mm256_abs_epi8(__A),
|
|
510
508
|
(__v32qi)_mm256_setzero_si256());
|
|
511
509
|
}
|
|
512
510
|
|
|
513
|
-
static __inline__ __m128i
|
|
514
|
-
_mm_mask_abs_epi16(__m128i __W, __mmask8 __U, __m128i __A)
|
|
515
|
-
{
|
|
511
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
512
|
+
_mm_mask_abs_epi16(__m128i __W, __mmask8 __U, __m128i __A) {
|
|
516
513
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
517
514
|
(__v8hi)_mm_abs_epi16(__A),
|
|
518
515
|
(__v8hi)__W);
|
|
519
516
|
}
|
|
520
517
|
|
|
521
|
-
static __inline__ __m128i
|
|
522
|
-
_mm_maskz_abs_epi16(__mmask8 __U, __m128i __A)
|
|
523
|
-
{
|
|
518
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
519
|
+
_mm_maskz_abs_epi16(__mmask8 __U, __m128i __A) {
|
|
524
520
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
525
521
|
(__v8hi)_mm_abs_epi16(__A),
|
|
526
522
|
(__v8hi)_mm_setzero_si128());
|
|
527
523
|
}
|
|
528
524
|
|
|
529
|
-
static __inline__ __m256i
|
|
530
|
-
_mm256_mask_abs_epi16(__m256i __W, __mmask16 __U, __m256i __A)
|
|
531
|
-
{
|
|
525
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
526
|
+
_mm256_mask_abs_epi16(__m256i __W, __mmask16 __U, __m256i __A) {
|
|
532
527
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
533
528
|
(__v16hi)_mm256_abs_epi16(__A),
|
|
534
529
|
(__v16hi)__W);
|
|
535
530
|
}
|
|
536
531
|
|
|
537
|
-
static __inline__ __m256i
|
|
538
|
-
_mm256_maskz_abs_epi16(__mmask16 __U, __m256i __A)
|
|
539
|
-
{
|
|
532
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
533
|
+
_mm256_maskz_abs_epi16(__mmask16 __U, __m256i __A) {
|
|
540
534
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
541
535
|
(__v16hi)_mm256_abs_epi16(__A),
|
|
542
536
|
(__v16hi)_mm256_setzero_si256());
|
|
543
537
|
}
|
|
544
538
|
|
|
545
|
-
static __inline__ __m128i
|
|
539
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
546
540
|
_mm_maskz_packs_epi32(__mmask8 __M, __m128i __A, __m128i __B) {
|
|
547
541
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
548
542
|
(__v8hi)_mm_packs_epi32(__A, __B),
|
|
549
543
|
(__v8hi)_mm_setzero_si128());
|
|
550
544
|
}
|
|
551
545
|
|
|
552
|
-
static __inline__ __m128i
|
|
546
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
553
547
|
_mm_mask_packs_epi32(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
554
548
|
{
|
|
555
549
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
@@ -557,7 +551,7 @@ _mm_mask_packs_epi32(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
|
557
551
|
(__v8hi)__W);
|
|
558
552
|
}
|
|
559
553
|
|
|
560
|
-
static __inline__ __m256i
|
|
554
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
561
555
|
_mm256_maskz_packs_epi32(__mmask16 __M, __m256i __A, __m256i __B)
|
|
562
556
|
{
|
|
563
557
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
@@ -565,7 +559,7 @@ _mm256_maskz_packs_epi32(__mmask16 __M, __m256i __A, __m256i __B)
|
|
|
565
559
|
(__v16hi)_mm256_setzero_si256());
|
|
566
560
|
}
|
|
567
561
|
|
|
568
|
-
static __inline__ __m256i
|
|
562
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
569
563
|
_mm256_mask_packs_epi32(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
570
564
|
{
|
|
571
565
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
@@ -573,7 +567,7 @@ _mm256_mask_packs_epi32(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
|
573
567
|
(__v16hi)__W);
|
|
574
568
|
}
|
|
575
569
|
|
|
576
|
-
static __inline__ __m128i
|
|
570
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
577
571
|
_mm_maskz_packs_epi16(__mmask16 __M, __m128i __A, __m128i __B)
|
|
578
572
|
{
|
|
579
573
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
@@ -581,7 +575,7 @@ _mm_maskz_packs_epi16(__mmask16 __M, __m128i __A, __m128i __B)
|
|
|
581
575
|
(__v16qi)_mm_setzero_si128());
|
|
582
576
|
}
|
|
583
577
|
|
|
584
|
-
static __inline__ __m128i
|
|
578
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
585
579
|
_mm_mask_packs_epi16(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
586
580
|
{
|
|
587
581
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
@@ -589,7 +583,7 @@ _mm_mask_packs_epi16(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
|
589
583
|
(__v16qi)__W);
|
|
590
584
|
}
|
|
591
585
|
|
|
592
|
-
static __inline__ __m256i
|
|
586
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
593
587
|
_mm256_maskz_packs_epi16(__mmask32 __M, __m256i __A, __m256i __B)
|
|
594
588
|
{
|
|
595
589
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
@@ -597,7 +591,7 @@ _mm256_maskz_packs_epi16(__mmask32 __M, __m256i __A, __m256i __B)
|
|
|
597
591
|
(__v32qi)_mm256_setzero_si256());
|
|
598
592
|
}
|
|
599
593
|
|
|
600
|
-
static __inline__ __m256i
|
|
594
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
601
595
|
_mm256_mask_packs_epi16(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
602
596
|
{
|
|
603
597
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
@@ -605,7 +599,7 @@ _mm256_mask_packs_epi16(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
|
605
599
|
(__v32qi)__W);
|
|
606
600
|
}
|
|
607
601
|
|
|
608
|
-
static __inline__ __m128i
|
|
602
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
609
603
|
_mm_maskz_packus_epi32(__mmask8 __M, __m128i __A, __m128i __B)
|
|
610
604
|
{
|
|
611
605
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
@@ -613,7 +607,7 @@ _mm_maskz_packus_epi32(__mmask8 __M, __m128i __A, __m128i __B)
|
|
|
613
607
|
(__v8hi)_mm_setzero_si128());
|
|
614
608
|
}
|
|
615
609
|
|
|
616
|
-
static __inline__ __m128i
|
|
610
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
617
611
|
_mm_mask_packus_epi32(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
618
612
|
{
|
|
619
613
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
@@ -621,7 +615,7 @@ _mm_mask_packus_epi32(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
|
621
615
|
(__v8hi)__W);
|
|
622
616
|
}
|
|
623
617
|
|
|
624
|
-
static __inline__ __m256i
|
|
618
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
625
619
|
_mm256_maskz_packus_epi32(__mmask16 __M, __m256i __A, __m256i __B)
|
|
626
620
|
{
|
|
627
621
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
@@ -629,7 +623,7 @@ _mm256_maskz_packus_epi32(__mmask16 __M, __m256i __A, __m256i __B)
|
|
|
629
623
|
(__v16hi)_mm256_setzero_si256());
|
|
630
624
|
}
|
|
631
625
|
|
|
632
|
-
static __inline__ __m256i
|
|
626
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
633
627
|
_mm256_mask_packus_epi32(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
634
628
|
{
|
|
635
629
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
@@ -637,7 +631,7 @@ _mm256_mask_packus_epi32(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
|
637
631
|
(__v16hi)__W);
|
|
638
632
|
}
|
|
639
633
|
|
|
640
|
-
static __inline__ __m128i
|
|
634
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
641
635
|
_mm_maskz_packus_epi16(__mmask16 __M, __m128i __A, __m128i __B)
|
|
642
636
|
{
|
|
643
637
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
@@ -645,7 +639,7 @@ _mm_maskz_packus_epi16(__mmask16 __M, __m128i __A, __m128i __B)
|
|
|
645
639
|
(__v16qi)_mm_setzero_si128());
|
|
646
640
|
}
|
|
647
641
|
|
|
648
|
-
static __inline__ __m128i
|
|
642
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
649
643
|
_mm_mask_packus_epi16(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
650
644
|
{
|
|
651
645
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
@@ -653,7 +647,7 @@ _mm_mask_packus_epi16(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
|
653
647
|
(__v16qi)__W);
|
|
654
648
|
}
|
|
655
649
|
|
|
656
|
-
static __inline__ __m256i
|
|
650
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
657
651
|
_mm256_maskz_packus_epi16(__mmask32 __M, __m256i __A, __m256i __B)
|
|
658
652
|
{
|
|
659
653
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
@@ -661,7 +655,7 @@ _mm256_maskz_packus_epi16(__mmask32 __M, __m256i __A, __m256i __B)
|
|
|
661
655
|
(__v32qi)_mm256_setzero_si256());
|
|
662
656
|
}
|
|
663
657
|
|
|
664
|
-
static __inline__ __m256i
|
|
658
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
665
659
|
_mm256_mask_packus_epi16(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
666
660
|
{
|
|
667
661
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
@@ -669,7 +663,7 @@ _mm256_mask_packus_epi16(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
|
669
663
|
(__v32qi)__W);
|
|
670
664
|
}
|
|
671
665
|
|
|
672
|
-
static __inline__ __m128i
|
|
666
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
673
667
|
_mm_mask_adds_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
674
668
|
{
|
|
675
669
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -677,7 +671,7 @@ _mm_mask_adds_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
|
677
671
|
(__v16qi)__W);
|
|
678
672
|
}
|
|
679
673
|
|
|
680
|
-
static __inline__ __m128i
|
|
674
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
681
675
|
_mm_maskz_adds_epi8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
682
676
|
{
|
|
683
677
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -685,7 +679,7 @@ _mm_maskz_adds_epi8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
|
685
679
|
(__v16qi)_mm_setzero_si128());
|
|
686
680
|
}
|
|
687
681
|
|
|
688
|
-
static __inline__ __m256i
|
|
682
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
689
683
|
_mm256_mask_adds_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
690
684
|
{
|
|
691
685
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -693,7 +687,7 @@ _mm256_mask_adds_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
|
693
687
|
(__v32qi)__W);
|
|
694
688
|
}
|
|
695
689
|
|
|
696
|
-
static __inline__ __m256i
|
|
690
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
697
691
|
_mm256_maskz_adds_epi8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
698
692
|
{
|
|
699
693
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -701,7 +695,7 @@ _mm256_maskz_adds_epi8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
|
701
695
|
(__v32qi)_mm256_setzero_si256());
|
|
702
696
|
}
|
|
703
697
|
|
|
704
|
-
static __inline__ __m128i
|
|
698
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
705
699
|
_mm_mask_adds_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
706
700
|
{
|
|
707
701
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -709,7 +703,7 @@ _mm_mask_adds_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
|
709
703
|
(__v8hi)__W);
|
|
710
704
|
}
|
|
711
705
|
|
|
712
|
-
static __inline__ __m128i
|
|
706
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
713
707
|
_mm_maskz_adds_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
714
708
|
{
|
|
715
709
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -717,7 +711,7 @@ _mm_maskz_adds_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
|
717
711
|
(__v8hi)_mm_setzero_si128());
|
|
718
712
|
}
|
|
719
713
|
|
|
720
|
-
static __inline__ __m256i
|
|
714
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
721
715
|
_mm256_mask_adds_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
722
716
|
{
|
|
723
717
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -725,7 +719,7 @@ _mm256_mask_adds_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
|
725
719
|
(__v16hi)__W);
|
|
726
720
|
}
|
|
727
721
|
|
|
728
|
-
static __inline__ __m256i
|
|
722
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
729
723
|
_mm256_maskz_adds_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
730
724
|
{
|
|
731
725
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -733,7 +727,7 @@ _mm256_maskz_adds_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
733
727
|
(__v16hi)_mm256_setzero_si256());
|
|
734
728
|
}
|
|
735
729
|
|
|
736
|
-
static __inline__ __m128i
|
|
730
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
737
731
|
_mm_mask_adds_epu8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
738
732
|
{
|
|
739
733
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -741,7 +735,7 @@ _mm_mask_adds_epu8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
|
741
735
|
(__v16qi)__W);
|
|
742
736
|
}
|
|
743
737
|
|
|
744
|
-
static __inline__ __m128i
|
|
738
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
745
739
|
_mm_maskz_adds_epu8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
746
740
|
{
|
|
747
741
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -749,7 +743,7 @@ _mm_maskz_adds_epu8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
|
749
743
|
(__v16qi)_mm_setzero_si128());
|
|
750
744
|
}
|
|
751
745
|
|
|
752
|
-
static __inline__ __m256i
|
|
746
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
753
747
|
_mm256_mask_adds_epu8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
754
748
|
{
|
|
755
749
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -757,7 +751,7 @@ _mm256_mask_adds_epu8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
|
757
751
|
(__v32qi)__W);
|
|
758
752
|
}
|
|
759
753
|
|
|
760
|
-
static __inline__ __m256i
|
|
754
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
761
755
|
_mm256_maskz_adds_epu8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
762
756
|
{
|
|
763
757
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -765,7 +759,7 @@ _mm256_maskz_adds_epu8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
|
765
759
|
(__v32qi)_mm256_setzero_si256());
|
|
766
760
|
}
|
|
767
761
|
|
|
768
|
-
static __inline__ __m128i
|
|
762
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
769
763
|
_mm_mask_adds_epu16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
770
764
|
{
|
|
771
765
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -773,7 +767,7 @@ _mm_mask_adds_epu16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
|
773
767
|
(__v8hi)__W);
|
|
774
768
|
}
|
|
775
769
|
|
|
776
|
-
static __inline__ __m128i
|
|
770
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
777
771
|
_mm_maskz_adds_epu16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
778
772
|
{
|
|
779
773
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -781,7 +775,7 @@ _mm_maskz_adds_epu16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
|
781
775
|
(__v8hi)_mm_setzero_si128());
|
|
782
776
|
}
|
|
783
777
|
|
|
784
|
-
static __inline__ __m256i
|
|
778
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
785
779
|
_mm256_mask_adds_epu16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
786
780
|
{
|
|
787
781
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -789,7 +783,7 @@ _mm256_mask_adds_epu16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
|
789
783
|
(__v16hi)__W);
|
|
790
784
|
}
|
|
791
785
|
|
|
792
|
-
static __inline__ __m256i
|
|
786
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
793
787
|
_mm256_maskz_adds_epu16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
794
788
|
{
|
|
795
789
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -797,359 +791,311 @@ _mm256_maskz_adds_epu16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
797
791
|
(__v16hi)_mm256_setzero_si256());
|
|
798
792
|
}
|
|
799
793
|
|
|
800
|
-
static __inline__ __m128i
|
|
801
|
-
_mm_mask_avg_epu8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
802
|
-
|
|
803
|
-
|
|
804
|
-
(__v16qi)_mm_avg_epu8(__A, __B),
|
|
805
|
-
(__v16qi)__W);
|
|
794
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
795
|
+
_mm_mask_avg_epu8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {
|
|
796
|
+
return (__m128i)__builtin_ia32_selectb_128(
|
|
797
|
+
(__mmask16)__U, (__v16qi)_mm_avg_epu8(__A, __B), (__v16qi)__W);
|
|
806
798
|
}
|
|
807
799
|
|
|
808
|
-
static __inline__ __m128i
|
|
809
|
-
_mm_maskz_avg_epu8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
810
|
-
{
|
|
800
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
801
|
+
_mm_maskz_avg_epu8(__mmask16 __U, __m128i __A, __m128i __B) {
|
|
811
802
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
812
803
|
(__v16qi)_mm_avg_epu8(__A, __B),
|
|
813
804
|
(__v16qi)_mm_setzero_si128());
|
|
814
805
|
}
|
|
815
806
|
|
|
816
|
-
static __inline__ __m256i
|
|
817
|
-
_mm256_mask_avg_epu8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
818
|
-
|
|
819
|
-
|
|
820
|
-
(__v32qi)_mm256_avg_epu8(__A, __B),
|
|
821
|
-
(__v32qi)__W);
|
|
807
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
808
|
+
_mm256_mask_avg_epu8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {
|
|
809
|
+
return (__m256i)__builtin_ia32_selectb_256(
|
|
810
|
+
(__mmask32)__U, (__v32qi)_mm256_avg_epu8(__A, __B), (__v32qi)__W);
|
|
822
811
|
}
|
|
823
812
|
|
|
824
|
-
static __inline__ __m256i
|
|
825
|
-
_mm256_maskz_avg_epu8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
826
|
-
{
|
|
813
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
814
|
+
_mm256_maskz_avg_epu8(__mmask32 __U, __m256i __A, __m256i __B) {
|
|
827
815
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
828
816
|
(__v32qi)_mm256_avg_epu8(__A, __B),
|
|
829
817
|
(__v32qi)_mm256_setzero_si256());
|
|
830
818
|
}
|
|
831
819
|
|
|
832
|
-
static __inline__ __m128i
|
|
833
|
-
_mm_mask_avg_epu16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
834
|
-
|
|
835
|
-
|
|
836
|
-
(__v8hi)_mm_avg_epu16(__A, __B),
|
|
837
|
-
(__v8hi)__W);
|
|
820
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
821
|
+
_mm_mask_avg_epu16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
822
|
+
return (__m128i)__builtin_ia32_selectw_128(
|
|
823
|
+
(__mmask8)__U, (__v8hi)_mm_avg_epu16(__A, __B), (__v8hi)__W);
|
|
838
824
|
}
|
|
839
825
|
|
|
840
|
-
static __inline__ __m128i
|
|
841
|
-
_mm_maskz_avg_epu16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
842
|
-
{
|
|
826
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
827
|
+
_mm_maskz_avg_epu16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
843
828
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
844
829
|
(__v8hi)_mm_avg_epu16(__A, __B),
|
|
845
830
|
(__v8hi)_mm_setzero_si128());
|
|
846
831
|
}
|
|
847
832
|
|
|
848
|
-
static __inline__ __m256i
|
|
849
|
-
_mm256_mask_avg_epu16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
850
|
-
|
|
851
|
-
|
|
852
|
-
(__v16hi)_mm256_avg_epu16(__A, __B),
|
|
853
|
-
(__v16hi)__W);
|
|
833
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
834
|
+
_mm256_mask_avg_epu16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
835
|
+
return (__m256i)__builtin_ia32_selectw_256(
|
|
836
|
+
(__mmask16)__U, (__v16hi)_mm256_avg_epu16(__A, __B), (__v16hi)__W);
|
|
854
837
|
}
|
|
855
838
|
|
|
856
|
-
static __inline__ __m256i
|
|
857
|
-
_mm256_maskz_avg_epu16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
858
|
-
|
|
859
|
-
|
|
860
|
-
|
|
861
|
-
(__v16hi)_mm256_setzero_si256());
|
|
839
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
840
|
+
_mm256_maskz_avg_epu16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
841
|
+
return (__m256i)__builtin_ia32_selectw_256(
|
|
842
|
+
(__mmask16)__U, (__v16hi)_mm256_avg_epu16(__A, __B),
|
|
843
|
+
(__v16hi)_mm256_setzero_si256());
|
|
862
844
|
}
|
|
863
845
|
|
|
864
|
-
static __inline__ __m128i
|
|
865
|
-
_mm_maskz_max_epi8(__mmask16 __M, __m128i __A, __m128i __B)
|
|
866
|
-
{
|
|
846
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
847
|
+
_mm_maskz_max_epi8(__mmask16 __M, __m128i __A, __m128i __B) {
|
|
867
848
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
868
849
|
(__v16qi)_mm_max_epi8(__A, __B),
|
|
869
850
|
(__v16qi)_mm_setzero_si128());
|
|
870
851
|
}
|
|
871
852
|
|
|
872
|
-
static __inline__ __m128i
|
|
873
|
-
_mm_mask_max_epi8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
874
|
-
{
|
|
853
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
854
|
+
_mm_mask_max_epi8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B) {
|
|
875
855
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
876
856
|
(__v16qi)_mm_max_epi8(__A, __B),
|
|
877
857
|
(__v16qi)__W);
|
|
878
858
|
}
|
|
879
859
|
|
|
880
|
-
static __inline__ __m256i
|
|
881
|
-
_mm256_maskz_max_epi8(__mmask32 __M, __m256i __A, __m256i __B)
|
|
882
|
-
{
|
|
860
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
861
|
+
_mm256_maskz_max_epi8(__mmask32 __M, __m256i __A, __m256i __B) {
|
|
883
862
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
884
863
|
(__v32qi)_mm256_max_epi8(__A, __B),
|
|
885
864
|
(__v32qi)_mm256_setzero_si256());
|
|
886
865
|
}
|
|
887
866
|
|
|
888
|
-
static __inline__ __m256i
|
|
889
|
-
_mm256_mask_max_epi8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
890
|
-
{
|
|
867
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
868
|
+
_mm256_mask_max_epi8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B) {
|
|
891
869
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
892
870
|
(__v32qi)_mm256_max_epi8(__A, __B),
|
|
893
871
|
(__v32qi)__W);
|
|
894
872
|
}
|
|
895
873
|
|
|
896
|
-
static __inline__ __m128i
|
|
897
|
-
_mm_maskz_max_epi16(__mmask8 __M, __m128i __A, __m128i __B)
|
|
898
|
-
{
|
|
874
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
875
|
+
_mm_maskz_max_epi16(__mmask8 __M, __m128i __A, __m128i __B) {
|
|
899
876
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
900
877
|
(__v8hi)_mm_max_epi16(__A, __B),
|
|
901
878
|
(__v8hi)_mm_setzero_si128());
|
|
902
879
|
}
|
|
903
880
|
|
|
904
|
-
static __inline__ __m128i
|
|
905
|
-
_mm_mask_max_epi16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
906
|
-
{
|
|
881
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
882
|
+
_mm_mask_max_epi16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B) {
|
|
907
883
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
908
884
|
(__v8hi)_mm_max_epi16(__A, __B),
|
|
909
885
|
(__v8hi)__W);
|
|
910
886
|
}
|
|
911
887
|
|
|
912
|
-
static __inline__ __m256i
|
|
913
|
-
_mm256_maskz_max_epi16(__mmask16 __M, __m256i __A, __m256i __B)
|
|
914
|
-
{
|
|
888
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
889
|
+
_mm256_maskz_max_epi16(__mmask16 __M, __m256i __A, __m256i __B) {
|
|
915
890
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
916
891
|
(__v16hi)_mm256_max_epi16(__A, __B),
|
|
917
892
|
(__v16hi)_mm256_setzero_si256());
|
|
918
893
|
}
|
|
919
894
|
|
|
920
|
-
static __inline__ __m256i
|
|
921
|
-
_mm256_mask_max_epi16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
922
|
-
{
|
|
895
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
896
|
+
_mm256_mask_max_epi16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B) {
|
|
923
897
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
924
898
|
(__v16hi)_mm256_max_epi16(__A, __B),
|
|
925
899
|
(__v16hi)__W);
|
|
926
900
|
}
|
|
927
901
|
|
|
928
|
-
static __inline__ __m128i
|
|
929
|
-
_mm_maskz_max_epu8(__mmask16 __M, __m128i __A, __m128i __B)
|
|
930
|
-
{
|
|
902
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
903
|
+
_mm_maskz_max_epu8(__mmask16 __M, __m128i __A, __m128i __B) {
|
|
931
904
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
932
905
|
(__v16qi)_mm_max_epu8(__A, __B),
|
|
933
906
|
(__v16qi)_mm_setzero_si128());
|
|
934
907
|
}
|
|
935
908
|
|
|
936
|
-
static __inline__ __m128i
|
|
937
|
-
_mm_mask_max_epu8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
938
|
-
{
|
|
909
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
910
|
+
_mm_mask_max_epu8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B) {
|
|
939
911
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
940
912
|
(__v16qi)_mm_max_epu8(__A, __B),
|
|
941
913
|
(__v16qi)__W);
|
|
942
914
|
}
|
|
943
915
|
|
|
944
|
-
static __inline__ __m256i
|
|
945
|
-
_mm256_maskz_max_epu8
|
|
946
|
-
{
|
|
916
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
917
|
+
_mm256_maskz_max_epu8(__mmask32 __M, __m256i __A, __m256i __B) {
|
|
947
918
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
948
919
|
(__v32qi)_mm256_max_epu8(__A, __B),
|
|
949
920
|
(__v32qi)_mm256_setzero_si256());
|
|
950
921
|
}
|
|
951
922
|
|
|
952
|
-
static __inline__ __m256i
|
|
953
|
-
_mm256_mask_max_epu8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
954
|
-
{
|
|
923
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
924
|
+
_mm256_mask_max_epu8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B) {
|
|
955
925
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
956
926
|
(__v32qi)_mm256_max_epu8(__A, __B),
|
|
957
927
|
(__v32qi)__W);
|
|
958
928
|
}
|
|
959
929
|
|
|
960
|
-
static __inline__ __m128i
|
|
961
|
-
_mm_maskz_max_epu16(__mmask8 __M, __m128i __A, __m128i __B)
|
|
962
|
-
{
|
|
930
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
931
|
+
_mm_maskz_max_epu16(__mmask8 __M, __m128i __A, __m128i __B) {
|
|
963
932
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
964
933
|
(__v8hi)_mm_max_epu16(__A, __B),
|
|
965
934
|
(__v8hi)_mm_setzero_si128());
|
|
966
935
|
}
|
|
967
936
|
|
|
968
|
-
static __inline__ __m128i
|
|
969
|
-
_mm_mask_max_epu16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
970
|
-
{
|
|
937
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
938
|
+
_mm_mask_max_epu16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B) {
|
|
971
939
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
972
940
|
(__v8hi)_mm_max_epu16(__A, __B),
|
|
973
941
|
(__v8hi)__W);
|
|
974
942
|
}
|
|
975
943
|
|
|
976
|
-
static __inline__ __m256i
|
|
977
|
-
_mm256_maskz_max_epu16(__mmask16 __M, __m256i __A, __m256i __B)
|
|
978
|
-
{
|
|
944
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
945
|
+
_mm256_maskz_max_epu16(__mmask16 __M, __m256i __A, __m256i __B) {
|
|
979
946
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
980
947
|
(__v16hi)_mm256_max_epu16(__A, __B),
|
|
981
948
|
(__v16hi)_mm256_setzero_si256());
|
|
982
949
|
}
|
|
983
950
|
|
|
984
|
-
static __inline__ __m256i
|
|
985
|
-
_mm256_mask_max_epu16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
986
|
-
{
|
|
951
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
952
|
+
_mm256_mask_max_epu16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B) {
|
|
987
953
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
988
954
|
(__v16hi)_mm256_max_epu16(__A, __B),
|
|
989
955
|
(__v16hi)__W);
|
|
990
956
|
}
|
|
991
957
|
|
|
992
|
-
static __inline__ __m128i
|
|
993
|
-
_mm_maskz_min_epi8(__mmask16 __M, __m128i __A, __m128i __B)
|
|
994
|
-
{
|
|
958
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
959
|
+
_mm_maskz_min_epi8(__mmask16 __M, __m128i __A, __m128i __B) {
|
|
995
960
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
996
961
|
(__v16qi)_mm_min_epi8(__A, __B),
|
|
997
962
|
(__v16qi)_mm_setzero_si128());
|
|
998
963
|
}
|
|
999
964
|
|
|
1000
|
-
static __inline__ __m128i
|
|
1001
|
-
_mm_mask_min_epi8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
1002
|
-
{
|
|
965
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
966
|
+
_mm_mask_min_epi8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B) {
|
|
1003
967
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
1004
968
|
(__v16qi)_mm_min_epi8(__A, __B),
|
|
1005
969
|
(__v16qi)__W);
|
|
1006
970
|
}
|
|
1007
971
|
|
|
1008
|
-
static __inline__ __m256i
|
|
1009
|
-
_mm256_maskz_min_epi8(__mmask32 __M, __m256i __A, __m256i __B)
|
|
1010
|
-
{
|
|
972
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
973
|
+
_mm256_maskz_min_epi8(__mmask32 __M, __m256i __A, __m256i __B) {
|
|
1011
974
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
1012
975
|
(__v32qi)_mm256_min_epi8(__A, __B),
|
|
1013
976
|
(__v32qi)_mm256_setzero_si256());
|
|
1014
977
|
}
|
|
1015
978
|
|
|
1016
|
-
static __inline__ __m256i
|
|
1017
|
-
_mm256_mask_min_epi8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
1018
|
-
{
|
|
979
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
980
|
+
_mm256_mask_min_epi8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B) {
|
|
1019
981
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
1020
982
|
(__v32qi)_mm256_min_epi8(__A, __B),
|
|
1021
983
|
(__v32qi)__W);
|
|
1022
984
|
}
|
|
1023
985
|
|
|
1024
|
-
static __inline__ __m128i
|
|
1025
|
-
_mm_maskz_min_epi16(__mmask8 __M, __m128i __A, __m128i __B)
|
|
1026
|
-
{
|
|
986
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
987
|
+
_mm_maskz_min_epi16(__mmask8 __M, __m128i __A, __m128i __B) {
|
|
1027
988
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
1028
989
|
(__v8hi)_mm_min_epi16(__A, __B),
|
|
1029
990
|
(__v8hi)_mm_setzero_si128());
|
|
1030
991
|
}
|
|
1031
992
|
|
|
1032
|
-
static __inline__ __m128i
|
|
1033
|
-
_mm_mask_min_epi16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
1034
|
-
{
|
|
993
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
994
|
+
_mm_mask_min_epi16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B) {
|
|
1035
995
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
1036
996
|
(__v8hi)_mm_min_epi16(__A, __B),
|
|
1037
997
|
(__v8hi)__W);
|
|
1038
998
|
}
|
|
1039
999
|
|
|
1040
|
-
static __inline__ __m256i
|
|
1041
|
-
_mm256_maskz_min_epi16(__mmask16 __M, __m256i __A, __m256i __B)
|
|
1042
|
-
{
|
|
1000
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1001
|
+
_mm256_maskz_min_epi16(__mmask16 __M, __m256i __A, __m256i __B) {
|
|
1043
1002
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
1044
1003
|
(__v16hi)_mm256_min_epi16(__A, __B),
|
|
1045
1004
|
(__v16hi)_mm256_setzero_si256());
|
|
1046
1005
|
}
|
|
1047
1006
|
|
|
1048
|
-
static __inline__ __m256i
|
|
1049
|
-
_mm256_mask_min_epi16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
1050
|
-
{
|
|
1007
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1008
|
+
_mm256_mask_min_epi16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B) {
|
|
1051
1009
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
1052
1010
|
(__v16hi)_mm256_min_epi16(__A, __B),
|
|
1053
1011
|
(__v16hi)__W);
|
|
1054
1012
|
}
|
|
1055
1013
|
|
|
1056
|
-
static __inline__ __m128i
|
|
1057
|
-
_mm_maskz_min_epu8(__mmask16 __M, __m128i __A, __m128i __B)
|
|
1058
|
-
{
|
|
1014
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1015
|
+
_mm_maskz_min_epu8(__mmask16 __M, __m128i __A, __m128i __B) {
|
|
1059
1016
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
1060
1017
|
(__v16qi)_mm_min_epu8(__A, __B),
|
|
1061
1018
|
(__v16qi)_mm_setzero_si128());
|
|
1062
1019
|
}
|
|
1063
1020
|
|
|
1064
|
-
static __inline__ __m128i
|
|
1065
|
-
_mm_mask_min_epu8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B)
|
|
1066
|
-
{
|
|
1021
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1022
|
+
_mm_mask_min_epu8(__m128i __W, __mmask16 __M, __m128i __A, __m128i __B) {
|
|
1067
1023
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
1068
1024
|
(__v16qi)_mm_min_epu8(__A, __B),
|
|
1069
1025
|
(__v16qi)__W);
|
|
1070
1026
|
}
|
|
1071
1027
|
|
|
1072
|
-
static __inline__ __m256i
|
|
1073
|
-
_mm256_maskz_min_epu8
|
|
1074
|
-
{
|
|
1028
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1029
|
+
_mm256_maskz_min_epu8(__mmask32 __M, __m256i __A, __m256i __B) {
|
|
1075
1030
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
1076
1031
|
(__v32qi)_mm256_min_epu8(__A, __B),
|
|
1077
1032
|
(__v32qi)_mm256_setzero_si256());
|
|
1078
1033
|
}
|
|
1079
1034
|
|
|
1080
|
-
static __inline__ __m256i
|
|
1081
|
-
_mm256_mask_min_epu8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B)
|
|
1082
|
-
{
|
|
1035
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1036
|
+
_mm256_mask_min_epu8(__m256i __W, __mmask32 __M, __m256i __A, __m256i __B) {
|
|
1083
1037
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__M,
|
|
1084
1038
|
(__v32qi)_mm256_min_epu8(__A, __B),
|
|
1085
1039
|
(__v32qi)__W);
|
|
1086
1040
|
}
|
|
1087
1041
|
|
|
1088
|
-
static __inline__ __m128i
|
|
1089
|
-
_mm_maskz_min_epu16(__mmask8 __M, __m128i __A, __m128i __B)
|
|
1090
|
-
{
|
|
1042
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1043
|
+
_mm_maskz_min_epu16(__mmask8 __M, __m128i __A, __m128i __B) {
|
|
1091
1044
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
1092
1045
|
(__v8hi)_mm_min_epu16(__A, __B),
|
|
1093
1046
|
(__v8hi)_mm_setzero_si128());
|
|
1094
1047
|
}
|
|
1095
1048
|
|
|
1096
|
-
static __inline__ __m128i
|
|
1097
|
-
_mm_mask_min_epu16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B)
|
|
1098
|
-
{
|
|
1049
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1050
|
+
_mm_mask_min_epu16(__m128i __W, __mmask8 __M, __m128i __A, __m128i __B) {
|
|
1099
1051
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
1100
1052
|
(__v8hi)_mm_min_epu16(__A, __B),
|
|
1101
1053
|
(__v8hi)__W);
|
|
1102
1054
|
}
|
|
1103
1055
|
|
|
1104
|
-
static __inline__ __m256i
|
|
1105
|
-
_mm256_maskz_min_epu16(__mmask16 __M, __m256i __A, __m256i __B)
|
|
1106
|
-
{
|
|
1056
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1057
|
+
_mm256_maskz_min_epu16(__mmask16 __M, __m256i __A, __m256i __B) {
|
|
1107
1058
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
1108
1059
|
(__v16hi)_mm256_min_epu16(__A, __B),
|
|
1109
1060
|
(__v16hi)_mm256_setzero_si256());
|
|
1110
1061
|
}
|
|
1111
1062
|
|
|
1112
|
-
static __inline__ __m256i
|
|
1113
|
-
_mm256_mask_min_epu16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B)
|
|
1114
|
-
{
|
|
1063
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1064
|
+
_mm256_mask_min_epu16(__m256i __W, __mmask16 __M, __m256i __A, __m256i __B) {
|
|
1115
1065
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
1116
1066
|
(__v16hi)_mm256_min_epu16(__A, __B),
|
|
1117
1067
|
(__v16hi)__W);
|
|
1118
1068
|
}
|
|
1119
1069
|
|
|
1120
|
-
static __inline__ __m128i
|
|
1121
|
-
_mm_mask_shuffle_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
1122
|
-
{
|
|
1070
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1071
|
+
_mm_mask_shuffle_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {
|
|
1123
1072
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
1124
1073
|
(__v16qi)_mm_shuffle_epi8(__A, __B),
|
|
1125
1074
|
(__v16qi)__W);
|
|
1126
1075
|
}
|
|
1127
1076
|
|
|
1128
|
-
static __inline__ __m128i
|
|
1129
|
-
_mm_maskz_shuffle_epi8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
1130
|
-
{
|
|
1077
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1078
|
+
_mm_maskz_shuffle_epi8(__mmask16 __U, __m128i __A, __m128i __B) {
|
|
1131
1079
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
1132
1080
|
(__v16qi)_mm_shuffle_epi8(__A, __B),
|
|
1133
1081
|
(__v16qi)_mm_setzero_si128());
|
|
1134
1082
|
}
|
|
1135
1083
|
|
|
1136
|
-
static __inline__ __m256i
|
|
1137
|
-
_mm256_mask_shuffle_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
1138
|
-
{
|
|
1084
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1085
|
+
_mm256_mask_shuffle_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {
|
|
1139
1086
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
1140
1087
|
(__v32qi)_mm256_shuffle_epi8(__A, __B),
|
|
1141
1088
|
(__v32qi)__W);
|
|
1142
1089
|
}
|
|
1143
1090
|
|
|
1144
|
-
static __inline__ __m256i
|
|
1145
|
-
_mm256_maskz_shuffle_epi8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
1146
|
-
{
|
|
1091
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1092
|
+
_mm256_maskz_shuffle_epi8(__mmask32 __U, __m256i __A, __m256i __B) {
|
|
1147
1093
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
1148
1094
|
(__v32qi)_mm256_shuffle_epi8(__A, __B),
|
|
1149
1095
|
(__v32qi)_mm256_setzero_si256());
|
|
1150
1096
|
}
|
|
1151
1097
|
|
|
1152
|
-
static __inline__ __m128i
|
|
1098
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1153
1099
|
_mm_mask_subs_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
1154
1100
|
{
|
|
1155
1101
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -1157,7 +1103,7 @@ _mm_mask_subs_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
|
1157
1103
|
(__v16qi)__W);
|
|
1158
1104
|
}
|
|
1159
1105
|
|
|
1160
|
-
static __inline__ __m128i
|
|
1106
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1161
1107
|
_mm_maskz_subs_epi8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
1162
1108
|
{
|
|
1163
1109
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -1165,7 +1111,7 @@ _mm_maskz_subs_epi8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
|
1165
1111
|
(__v16qi)_mm_setzero_si128());
|
|
1166
1112
|
}
|
|
1167
1113
|
|
|
1168
|
-
static __inline__ __m256i
|
|
1114
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1169
1115
|
_mm256_mask_subs_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
1170
1116
|
{
|
|
1171
1117
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -1173,7 +1119,7 @@ _mm256_mask_subs_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
|
1173
1119
|
(__v32qi)__W);
|
|
1174
1120
|
}
|
|
1175
1121
|
|
|
1176
|
-
static __inline__ __m256i
|
|
1122
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1177
1123
|
_mm256_maskz_subs_epi8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
1178
1124
|
{
|
|
1179
1125
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -1181,7 +1127,7 @@ _mm256_maskz_subs_epi8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
|
1181
1127
|
(__v32qi)_mm256_setzero_si256());
|
|
1182
1128
|
}
|
|
1183
1129
|
|
|
1184
|
-
static __inline__ __m128i
|
|
1130
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1185
1131
|
_mm_mask_subs_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
1186
1132
|
{
|
|
1187
1133
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1189,7 +1135,7 @@ _mm_mask_subs_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
|
1189
1135
|
(__v8hi)__W);
|
|
1190
1136
|
}
|
|
1191
1137
|
|
|
1192
|
-
static __inline__ __m128i
|
|
1138
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1193
1139
|
_mm_maskz_subs_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
1194
1140
|
{
|
|
1195
1141
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1197,7 +1143,7 @@ _mm_maskz_subs_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
|
1197
1143
|
(__v8hi)_mm_setzero_si128());
|
|
1198
1144
|
}
|
|
1199
1145
|
|
|
1200
|
-
static __inline__ __m256i
|
|
1146
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1201
1147
|
_mm256_mask_subs_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
1202
1148
|
{
|
|
1203
1149
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1205,7 +1151,7 @@ _mm256_mask_subs_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
|
1205
1151
|
(__v16hi)__W);
|
|
1206
1152
|
}
|
|
1207
1153
|
|
|
1208
|
-
static __inline__ __m256i
|
|
1154
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1209
1155
|
_mm256_maskz_subs_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
1210
1156
|
{
|
|
1211
1157
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1213,7 +1159,7 @@ _mm256_maskz_subs_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
1213
1159
|
(__v16hi)_mm256_setzero_si256());
|
|
1214
1160
|
}
|
|
1215
1161
|
|
|
1216
|
-
static __inline__ __m128i
|
|
1162
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1217
1163
|
_mm_mask_subs_epu8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
1218
1164
|
{
|
|
1219
1165
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -1221,7 +1167,7 @@ _mm_mask_subs_epu8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B)
|
|
|
1221
1167
|
(__v16qi)__W);
|
|
1222
1168
|
}
|
|
1223
1169
|
|
|
1224
|
-
static __inline__ __m128i
|
|
1170
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1225
1171
|
_mm_maskz_subs_epu8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
1226
1172
|
{
|
|
1227
1173
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
@@ -1229,7 +1175,7 @@ _mm_maskz_subs_epu8(__mmask16 __U, __m128i __A, __m128i __B)
|
|
|
1229
1175
|
(__v16qi)_mm_setzero_si128());
|
|
1230
1176
|
}
|
|
1231
1177
|
|
|
1232
|
-
static __inline__ __m256i
|
|
1178
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1233
1179
|
_mm256_mask_subs_epu8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
1234
1180
|
{
|
|
1235
1181
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -1237,7 +1183,7 @@ _mm256_mask_subs_epu8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B)
|
|
|
1237
1183
|
(__v32qi)__W);
|
|
1238
1184
|
}
|
|
1239
1185
|
|
|
1240
|
-
static __inline__ __m256i
|
|
1186
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1241
1187
|
_mm256_maskz_subs_epu8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
1242
1188
|
{
|
|
1243
1189
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
@@ -1245,7 +1191,7 @@ _mm256_maskz_subs_epu8(__mmask32 __U, __m256i __A, __m256i __B)
|
|
|
1245
1191
|
(__v32qi)_mm256_setzero_si256());
|
|
1246
1192
|
}
|
|
1247
1193
|
|
|
1248
|
-
static __inline__ __m128i
|
|
1194
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1249
1195
|
_mm_mask_subs_epu16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
1250
1196
|
{
|
|
1251
1197
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1253,7 +1199,7 @@ _mm_mask_subs_epu16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
|
1253
1199
|
(__v8hi)__W);
|
|
1254
1200
|
}
|
|
1255
1201
|
|
|
1256
|
-
static __inline__ __m128i
|
|
1202
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1257
1203
|
_mm_maskz_subs_epu16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
1258
1204
|
{
|
|
1259
1205
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1261,7 +1207,7 @@ _mm_maskz_subs_epu16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
|
1261
1207
|
(__v8hi)_mm_setzero_si128());
|
|
1262
1208
|
}
|
|
1263
1209
|
|
|
1264
|
-
static __inline__ __m256i
|
|
1210
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1265
1211
|
_mm256_mask_subs_epu16(__m256i __W, __mmask16 __U, __m256i __A,
|
|
1266
1212
|
__m256i __B) {
|
|
1267
1213
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1269,7 +1215,7 @@ _mm256_mask_subs_epu16(__m256i __W, __mmask16 __U, __m256i __A,
|
|
|
1269
1215
|
(__v16hi)__W);
|
|
1270
1216
|
}
|
|
1271
1217
|
|
|
1272
|
-
static __inline__ __m256i
|
|
1218
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1273
1219
|
_mm256_maskz_subs_epu16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
1274
1220
|
{
|
|
1275
1221
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1277,89 +1223,81 @@ _mm256_maskz_subs_epu16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
1277
1223
|
(__v16hi)_mm256_setzero_si256());
|
|
1278
1224
|
}
|
|
1279
1225
|
|
|
1280
|
-
static __inline__ __m128i
|
|
1281
|
-
_mm_permutex2var_epi16(__m128i __A, __m128i __I, __m128i __B)
|
|
1282
|
-
{
|
|
1226
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1227
|
+
_mm_permutex2var_epi16(__m128i __A, __m128i __I, __m128i __B) {
|
|
1283
1228
|
return (__m128i)__builtin_ia32_vpermi2varhi128((__v8hi)__A, (__v8hi)__I,
|
|
1284
1229
|
(__v8hi) __B);
|
|
1285
1230
|
}
|
|
1286
1231
|
|
|
1287
|
-
static __inline__ __m128i
|
|
1232
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1288
1233
|
_mm_mask_permutex2var_epi16(__m128i __A, __mmask8 __U, __m128i __I,
|
|
1289
|
-
__m128i __B)
|
|
1290
|
-
{
|
|
1234
|
+
__m128i __B) {
|
|
1291
1235
|
return (__m128i)__builtin_ia32_selectw_128(__U,
|
|
1292
1236
|
(__v8hi)_mm_permutex2var_epi16(__A, __I, __B),
|
|
1293
1237
|
(__v8hi)__A);
|
|
1294
1238
|
}
|
|
1295
1239
|
|
|
1296
|
-
static __inline__ __m128i
|
|
1240
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1297
1241
|
_mm_mask2_permutex2var_epi16(__m128i __A, __m128i __I, __mmask8 __U,
|
|
1298
|
-
__m128i __B)
|
|
1299
|
-
{
|
|
1242
|
+
__m128i __B) {
|
|
1300
1243
|
return (__m128i)__builtin_ia32_selectw_128(__U,
|
|
1301
1244
|
(__v8hi)_mm_permutex2var_epi16(__A, __I, __B),
|
|
1302
1245
|
(__v8hi)__I);
|
|
1303
1246
|
}
|
|
1304
1247
|
|
|
1305
|
-
static __inline__ __m128i
|
|
1306
|
-
_mm_maskz_permutex2var_epi16
|
|
1307
|
-
|
|
1308
|
-
{
|
|
1248
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1249
|
+
_mm_maskz_permutex2var_epi16(__mmask8 __U, __m128i __A, __m128i __I,
|
|
1250
|
+
__m128i __B) {
|
|
1309
1251
|
return (__m128i)__builtin_ia32_selectw_128(__U,
|
|
1310
1252
|
(__v8hi)_mm_permutex2var_epi16(__A, __I, __B),
|
|
1311
1253
|
(__v8hi)_mm_setzero_si128());
|
|
1312
1254
|
}
|
|
1313
1255
|
|
|
1314
|
-
static __inline__ __m256i
|
|
1315
|
-
_mm256_permutex2var_epi16(__m256i __A, __m256i __I, __m256i __B)
|
|
1316
|
-
{
|
|
1256
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1257
|
+
_mm256_permutex2var_epi16(__m256i __A, __m256i __I, __m256i __B) {
|
|
1317
1258
|
return (__m256i)__builtin_ia32_vpermi2varhi256((__v16hi)__A, (__v16hi)__I,
|
|
1318
1259
|
(__v16hi)__B);
|
|
1319
1260
|
}
|
|
1320
1261
|
|
|
1321
|
-
static __inline__ __m256i
|
|
1262
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1322
1263
|
_mm256_mask_permutex2var_epi16(__m256i __A, __mmask16 __U, __m256i __I,
|
|
1323
|
-
__m256i __B)
|
|
1324
|
-
{
|
|
1264
|
+
__m256i __B) {
|
|
1325
1265
|
return (__m256i)__builtin_ia32_selectw_256(__U,
|
|
1326
1266
|
(__v16hi)_mm256_permutex2var_epi16(__A, __I, __B),
|
|
1327
1267
|
(__v16hi)__A);
|
|
1328
1268
|
}
|
|
1329
1269
|
|
|
1330
|
-
static __inline__ __m256i
|
|
1270
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1331
1271
|
_mm256_mask2_permutex2var_epi16(__m256i __A, __m256i __I, __mmask16 __U,
|
|
1332
|
-
__m256i __B)
|
|
1333
|
-
{
|
|
1272
|
+
__m256i __B) {
|
|
1334
1273
|
return (__m256i)__builtin_ia32_selectw_256(__U,
|
|
1335
1274
|
(__v16hi)_mm256_permutex2var_epi16(__A, __I, __B),
|
|
1336
1275
|
(__v16hi)__I);
|
|
1337
1276
|
}
|
|
1338
1277
|
|
|
1339
|
-
static __inline__ __m256i
|
|
1340
|
-
_mm256_maskz_permutex2var_epi16
|
|
1341
|
-
|
|
1342
|
-
{
|
|
1278
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1279
|
+
_mm256_maskz_permutex2var_epi16(__mmask16 __U, __m256i __A, __m256i __I,
|
|
1280
|
+
__m256i __B) {
|
|
1343
1281
|
return (__m256i)__builtin_ia32_selectw_256(__U,
|
|
1344
1282
|
(__v16hi)_mm256_permutex2var_epi16(__A, __I, __B),
|
|
1345
1283
|
(__v16hi)_mm256_setzero_si256());
|
|
1346
1284
|
}
|
|
1347
1285
|
|
|
1348
|
-
static __inline__ __m128i
|
|
1286
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1349
1287
|
_mm_mask_maddubs_epi16(__m128i __W, __mmask8 __U, __m128i __X, __m128i __Y) {
|
|
1350
1288
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1351
1289
|
(__v8hi)_mm_maddubs_epi16(__X, __Y),
|
|
1352
1290
|
(__v8hi)__W);
|
|
1353
1291
|
}
|
|
1354
1292
|
|
|
1355
|
-
static __inline__ __m128i
|
|
1293
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1356
1294
|
_mm_maskz_maddubs_epi16(__mmask8 __U, __m128i __X, __m128i __Y) {
|
|
1357
1295
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1358
1296
|
(__v8hi)_mm_maddubs_epi16(__X, __Y),
|
|
1359
1297
|
(__v8hi)_mm_setzero_si128());
|
|
1360
1298
|
}
|
|
1361
1299
|
|
|
1362
|
-
static __inline__ __m256i
|
|
1300
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1363
1301
|
_mm256_mask_maddubs_epi16(__m256i __W, __mmask16 __U, __m256i __X,
|
|
1364
1302
|
__m256i __Y) {
|
|
1365
1303
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1367,35 +1305,35 @@ _mm256_mask_maddubs_epi16(__m256i __W, __mmask16 __U, __m256i __X,
|
|
|
1367
1305
|
(__v16hi)__W);
|
|
1368
1306
|
}
|
|
1369
1307
|
|
|
1370
|
-
static __inline__ __m256i
|
|
1308
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1371
1309
|
_mm256_maskz_maddubs_epi16(__mmask16 __U, __m256i __X, __m256i __Y) {
|
|
1372
1310
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1373
1311
|
(__v16hi)_mm256_maddubs_epi16(__X, __Y),
|
|
1374
1312
|
(__v16hi)_mm256_setzero_si256());
|
|
1375
1313
|
}
|
|
1376
1314
|
|
|
1377
|
-
static __inline__ __m128i
|
|
1315
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1378
1316
|
_mm_mask_madd_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
1379
1317
|
return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,
|
|
1380
1318
|
(__v4si)_mm_madd_epi16(__A, __B),
|
|
1381
1319
|
(__v4si)__W);
|
|
1382
1320
|
}
|
|
1383
1321
|
|
|
1384
|
-
static __inline__ __m128i
|
|
1322
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1385
1323
|
_mm_maskz_madd_epi16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
1386
1324
|
return (__m128i)__builtin_ia32_selectd_128((__mmask8)__U,
|
|
1387
1325
|
(__v4si)_mm_madd_epi16(__A, __B),
|
|
1388
1326
|
(__v4si)_mm_setzero_si128());
|
|
1389
1327
|
}
|
|
1390
1328
|
|
|
1391
|
-
static __inline__ __m256i
|
|
1329
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1392
1330
|
_mm256_mask_madd_epi16(__m256i __W, __mmask8 __U, __m256i __A, __m256i __B) {
|
|
1393
1331
|
return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,
|
|
1394
1332
|
(__v8si)_mm256_madd_epi16(__A, __B),
|
|
1395
1333
|
(__v8si)__W);
|
|
1396
1334
|
}
|
|
1397
1335
|
|
|
1398
|
-
static __inline__ __m256i
|
|
1336
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1399
1337
|
_mm256_maskz_madd_epi16(__mmask8 __U, __m256i __A, __m256i __B) {
|
|
1400
1338
|
return (__m256i)__builtin_ia32_selectd_256((__mmask8)__U,
|
|
1401
1339
|
(__v8si)_mm256_madd_epi16(__A, __B),
|
|
@@ -1486,8 +1424,8 @@ _mm256_maskz_cvtusepi16_epi8 (__mmask16 __M, __m256i __A) {
|
|
|
1486
1424
|
__M);
|
|
1487
1425
|
}
|
|
1488
1426
|
|
|
1489
|
-
static __inline__ __m128i
|
|
1490
|
-
_mm_cvtepi16_epi8
|
|
1427
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1428
|
+
_mm_cvtepi16_epi8(__m128i __A) {
|
|
1491
1429
|
return (__m128i)__builtin_shufflevector(
|
|
1492
1430
|
__builtin_convertvector((__v8hi)__A, __v8qi),
|
|
1493
1431
|
(__v8qi){0, 0, 0, 0, 0, 0, 0, 0}, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11,
|
|
@@ -1527,20 +1465,20 @@ _mm_mask_cvtusepi16_storeu_epi8 (void * __P, __mmask8 __M, __m128i __A)
|
|
|
1527
1465
|
__builtin_ia32_pmovuswb128mem_mask ((__v16qi *) __P, (__v8hi) __A, __M);
|
|
1528
1466
|
}
|
|
1529
1467
|
|
|
1530
|
-
static __inline__ __m128i
|
|
1531
|
-
_mm256_cvtepi16_epi8
|
|
1468
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1469
|
+
_mm256_cvtepi16_epi8(__m256i __A) {
|
|
1532
1470
|
return (__m128i)__builtin_convertvector((__v16hi) __A, __v16qi);
|
|
1533
1471
|
}
|
|
1534
1472
|
|
|
1535
|
-
static __inline__ __m128i
|
|
1536
|
-
_mm256_mask_cvtepi16_epi8
|
|
1473
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1474
|
+
_mm256_mask_cvtepi16_epi8(__m128i __O, __mmask16 __M, __m256i __A) {
|
|
1537
1475
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
1538
1476
|
(__v16qi)_mm256_cvtepi16_epi8(__A),
|
|
1539
1477
|
(__v16qi)__O);
|
|
1540
1478
|
}
|
|
1541
1479
|
|
|
1542
|
-
static __inline__ __m128i
|
|
1543
|
-
_mm256_maskz_cvtepi16_epi8
|
|
1480
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1481
|
+
_mm256_maskz_cvtepi16_epi8(__mmask16 __M, __m256i __A) {
|
|
1544
1482
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__M,
|
|
1545
1483
|
(__v16qi)_mm256_cvtepi16_epi8(__A),
|
|
1546
1484
|
(__v16qi)_mm_setzero_si128());
|
|
@@ -1564,203 +1502,198 @@ _mm256_mask_cvtusepi16_storeu_epi8 (void * __P, __mmask16 __M, __m256i __A)
|
|
|
1564
1502
|
__builtin_ia32_pmovuswb256mem_mask ((__v16qi*) __P, (__v16hi) __A, __M);
|
|
1565
1503
|
}
|
|
1566
1504
|
|
|
1567
|
-
static __inline__ __m128i
|
|
1505
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1568
1506
|
_mm_mask_mulhrs_epi16(__m128i __W, __mmask8 __U, __m128i __X, __m128i __Y) {
|
|
1569
1507
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1570
1508
|
(__v8hi)_mm_mulhrs_epi16(__X, __Y),
|
|
1571
1509
|
(__v8hi)__W);
|
|
1572
1510
|
}
|
|
1573
1511
|
|
|
1574
|
-
static __inline__ __m128i
|
|
1512
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1575
1513
|
_mm_maskz_mulhrs_epi16(__mmask8 __U, __m128i __X, __m128i __Y) {
|
|
1576
1514
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1577
1515
|
(__v8hi)_mm_mulhrs_epi16(__X, __Y),
|
|
1578
1516
|
(__v8hi)_mm_setzero_si128());
|
|
1579
1517
|
}
|
|
1580
1518
|
|
|
1581
|
-
static __inline__ __m256i
|
|
1519
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1582
1520
|
_mm256_mask_mulhrs_epi16(__m256i __W, __mmask16 __U, __m256i __X, __m256i __Y) {
|
|
1583
1521
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1584
1522
|
(__v16hi)_mm256_mulhrs_epi16(__X, __Y),
|
|
1585
1523
|
(__v16hi)__W);
|
|
1586
1524
|
}
|
|
1587
1525
|
|
|
1588
|
-
static __inline__ __m256i
|
|
1526
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1589
1527
|
_mm256_maskz_mulhrs_epi16(__mmask16 __U, __m256i __X, __m256i __Y) {
|
|
1590
1528
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1591
1529
|
(__v16hi)_mm256_mulhrs_epi16(__X, __Y),
|
|
1592
1530
|
(__v16hi)_mm256_setzero_si256());
|
|
1593
1531
|
}
|
|
1594
1532
|
|
|
1595
|
-
static __inline__ __m128i
|
|
1533
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1596
1534
|
_mm_mask_mulhi_epu16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
1597
|
-
return (__m128i)__builtin_ia32_selectw_128(
|
|
1598
|
-
|
|
1599
|
-
(__v8hi)__W);
|
|
1535
|
+
return (__m128i)__builtin_ia32_selectw_128(
|
|
1536
|
+
(__mmask8)__U, (__v8hi)_mm_mulhi_epu16(__A, __B), (__v8hi)__W);
|
|
1600
1537
|
}
|
|
1601
1538
|
|
|
1602
|
-
static __inline__ __m128i
|
|
1539
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1603
1540
|
_mm_maskz_mulhi_epu16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
1604
1541
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1605
1542
|
(__v8hi)_mm_mulhi_epu16(__A, __B),
|
|
1606
1543
|
(__v8hi)_mm_setzero_si128());
|
|
1607
1544
|
}
|
|
1608
1545
|
|
|
1609
|
-
static __inline__ __m256i
|
|
1546
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1610
1547
|
_mm256_mask_mulhi_epu16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
1611
|
-
return (__m256i)__builtin_ia32_selectw_256(
|
|
1612
|
-
|
|
1613
|
-
(__v16hi)__W);
|
|
1548
|
+
return (__m256i)__builtin_ia32_selectw_256(
|
|
1549
|
+
(__mmask16)__U, (__v16hi)_mm256_mulhi_epu16(__A, __B), (__v16hi)__W);
|
|
1614
1550
|
}
|
|
1615
1551
|
|
|
1616
|
-
static __inline__ __m256i
|
|
1552
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1617
1553
|
_mm256_maskz_mulhi_epu16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
1618
|
-
return (__m256i)__builtin_ia32_selectw_256(
|
|
1619
|
-
|
|
1620
|
-
|
|
1554
|
+
return (__m256i)__builtin_ia32_selectw_256(
|
|
1555
|
+
(__mmask16)__U, (__v16hi)_mm256_mulhi_epu16(__A, __B),
|
|
1556
|
+
(__v16hi)_mm256_setzero_si256());
|
|
1621
1557
|
}
|
|
1622
1558
|
|
|
1623
|
-
static __inline__ __m128i
|
|
1559
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1624
1560
|
_mm_mask_mulhi_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
1625
|
-
return (__m128i)__builtin_ia32_selectw_128(
|
|
1626
|
-
|
|
1627
|
-
(__v8hi)__W);
|
|
1561
|
+
return (__m128i)__builtin_ia32_selectw_128(
|
|
1562
|
+
(__mmask8)__U, (__v8hi)_mm_mulhi_epi16(__A, __B), (__v8hi)__W);
|
|
1628
1563
|
}
|
|
1629
1564
|
|
|
1630
|
-
static __inline__ __m128i
|
|
1565
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1631
1566
|
_mm_maskz_mulhi_epi16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
1632
1567
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1633
1568
|
(__v8hi)_mm_mulhi_epi16(__A, __B),
|
|
1634
1569
|
(__v8hi)_mm_setzero_si128());
|
|
1635
1570
|
}
|
|
1636
1571
|
|
|
1637
|
-
static __inline__ __m256i
|
|
1572
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1638
1573
|
_mm256_mask_mulhi_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
1639
|
-
return (__m256i)__builtin_ia32_selectw_256(
|
|
1640
|
-
|
|
1641
|
-
(__v16hi)__W);
|
|
1574
|
+
return (__m256i)__builtin_ia32_selectw_256(
|
|
1575
|
+
(__mmask16)__U, (__v16hi)_mm256_mulhi_epi16(__A, __B), (__v16hi)__W);
|
|
1642
1576
|
}
|
|
1643
1577
|
|
|
1644
|
-
static __inline__ __m256i
|
|
1578
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1645
1579
|
_mm256_maskz_mulhi_epi16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
1646
|
-
return (__m256i)__builtin_ia32_selectw_256(
|
|
1647
|
-
|
|
1648
|
-
|
|
1580
|
+
return (__m256i)__builtin_ia32_selectw_256(
|
|
1581
|
+
(__mmask16)__U, (__v16hi)_mm256_mulhi_epi16(__A, __B),
|
|
1582
|
+
(__v16hi)_mm256_setzero_si256());
|
|
1649
1583
|
}
|
|
1650
1584
|
|
|
1651
|
-
static __inline__ __m128i
|
|
1585
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1652
1586
|
_mm_mask_unpackhi_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {
|
|
1653
|
-
return (__m128i)__builtin_ia32_selectb_128(
|
|
1654
|
-
|
|
1655
|
-
(__v16qi)__W);
|
|
1587
|
+
return (__m128i)__builtin_ia32_selectb_128(
|
|
1588
|
+
(__mmask16)__U, (__v16qi)_mm_unpackhi_epi8(__A, __B), (__v16qi)__W);
|
|
1656
1589
|
}
|
|
1657
1590
|
|
|
1658
|
-
static __inline__ __m128i
|
|
1591
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1659
1592
|
_mm_maskz_unpackhi_epi8(__mmask16 __U, __m128i __A, __m128i __B) {
|
|
1660
1593
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
1661
1594
|
(__v16qi)_mm_unpackhi_epi8(__A, __B),
|
|
1662
1595
|
(__v16qi)_mm_setzero_si128());
|
|
1663
1596
|
}
|
|
1664
1597
|
|
|
1665
|
-
static __inline__ __m256i
|
|
1598
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1666
1599
|
_mm256_mask_unpackhi_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {
|
|
1667
1600
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
1668
1601
|
(__v32qi)_mm256_unpackhi_epi8(__A, __B),
|
|
1669
1602
|
(__v32qi)__W);
|
|
1670
1603
|
}
|
|
1671
1604
|
|
|
1672
|
-
static __inline__ __m256i
|
|
1605
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1673
1606
|
_mm256_maskz_unpackhi_epi8(__mmask32 __U, __m256i __A, __m256i __B) {
|
|
1674
1607
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
1675
1608
|
(__v32qi)_mm256_unpackhi_epi8(__A, __B),
|
|
1676
1609
|
(__v32qi)_mm256_setzero_si256());
|
|
1677
1610
|
}
|
|
1678
1611
|
|
|
1679
|
-
static __inline__ __m128i
|
|
1612
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1680
1613
|
_mm_mask_unpackhi_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
1681
1614
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1682
1615
|
(__v8hi)_mm_unpackhi_epi16(__A, __B),
|
|
1683
1616
|
(__v8hi)__W);
|
|
1684
1617
|
}
|
|
1685
1618
|
|
|
1686
|
-
static __inline__ __m128i
|
|
1619
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1687
1620
|
_mm_maskz_unpackhi_epi16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
1688
1621
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1689
1622
|
(__v8hi)_mm_unpackhi_epi16(__A, __B),
|
|
1690
1623
|
(__v8hi) _mm_setzero_si128());
|
|
1691
1624
|
}
|
|
1692
1625
|
|
|
1693
|
-
static __inline__ __m256i
|
|
1626
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1694
1627
|
_mm256_mask_unpackhi_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
1695
1628
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1696
1629
|
(__v16hi)_mm256_unpackhi_epi16(__A, __B),
|
|
1697
1630
|
(__v16hi)__W);
|
|
1698
1631
|
}
|
|
1699
1632
|
|
|
1700
|
-
static __inline__ __m256i
|
|
1633
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1701
1634
|
_mm256_maskz_unpackhi_epi16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
1702
1635
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1703
1636
|
(__v16hi)_mm256_unpackhi_epi16(__A, __B),
|
|
1704
1637
|
(__v16hi)_mm256_setzero_si256());
|
|
1705
1638
|
}
|
|
1706
1639
|
|
|
1707
|
-
static __inline__ __m128i
|
|
1640
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1708
1641
|
_mm_mask_unpacklo_epi8(__m128i __W, __mmask16 __U, __m128i __A, __m128i __B) {
|
|
1709
1642
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
1710
1643
|
(__v16qi)_mm_unpacklo_epi8(__A, __B),
|
|
1711
1644
|
(__v16qi)__W);
|
|
1712
1645
|
}
|
|
1713
1646
|
|
|
1714
|
-
static __inline__ __m128i
|
|
1647
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1715
1648
|
_mm_maskz_unpacklo_epi8(__mmask16 __U, __m128i __A, __m128i __B) {
|
|
1716
1649
|
return (__m128i)__builtin_ia32_selectb_128((__mmask16)__U,
|
|
1717
1650
|
(__v16qi)_mm_unpacklo_epi8(__A, __B),
|
|
1718
1651
|
(__v16qi)_mm_setzero_si128());
|
|
1719
1652
|
}
|
|
1720
1653
|
|
|
1721
|
-
static __inline__ __m256i
|
|
1654
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1722
1655
|
_mm256_mask_unpacklo_epi8(__m256i __W, __mmask32 __U, __m256i __A, __m256i __B) {
|
|
1723
1656
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
1724
1657
|
(__v32qi)_mm256_unpacklo_epi8(__A, __B),
|
|
1725
1658
|
(__v32qi)__W);
|
|
1726
1659
|
}
|
|
1727
1660
|
|
|
1728
|
-
static __inline__ __m256i
|
|
1661
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1729
1662
|
_mm256_maskz_unpacklo_epi8(__mmask32 __U, __m256i __A, __m256i __B) {
|
|
1730
1663
|
return (__m256i)__builtin_ia32_selectb_256((__mmask32)__U,
|
|
1731
1664
|
(__v32qi)_mm256_unpacklo_epi8(__A, __B),
|
|
1732
1665
|
(__v32qi)_mm256_setzero_si256());
|
|
1733
1666
|
}
|
|
1734
1667
|
|
|
1735
|
-
static __inline__ __m128i
|
|
1668
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1736
1669
|
_mm_mask_unpacklo_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B) {
|
|
1737
1670
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1738
1671
|
(__v8hi)_mm_unpacklo_epi16(__A, __B),
|
|
1739
1672
|
(__v8hi)__W);
|
|
1740
1673
|
}
|
|
1741
1674
|
|
|
1742
|
-
static __inline__ __m128i
|
|
1675
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1743
1676
|
_mm_maskz_unpacklo_epi16(__mmask8 __U, __m128i __A, __m128i __B) {
|
|
1744
1677
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
1745
1678
|
(__v8hi)_mm_unpacklo_epi16(__A, __B),
|
|
1746
1679
|
(__v8hi) _mm_setzero_si128());
|
|
1747
1680
|
}
|
|
1748
1681
|
|
|
1749
|
-
static __inline__ __m256i
|
|
1682
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1750
1683
|
_mm256_mask_unpacklo_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B) {
|
|
1751
1684
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1752
1685
|
(__v16hi)_mm256_unpacklo_epi16(__A, __B),
|
|
1753
1686
|
(__v16hi)__W);
|
|
1754
1687
|
}
|
|
1755
1688
|
|
|
1756
|
-
static __inline__ __m256i
|
|
1689
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1757
1690
|
_mm256_maskz_unpacklo_epi16(__mmask16 __U, __m256i __A, __m256i __B) {
|
|
1758
1691
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1759
1692
|
(__v16hi)_mm256_unpacklo_epi16(__A, __B),
|
|
1760
1693
|
(__v16hi)_mm256_setzero_si256());
|
|
1761
1694
|
}
|
|
1762
1695
|
|
|
1763
|
-
static __inline__ __m128i
|
|
1696
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1764
1697
|
_mm_mask_cvtepi8_epi16(__m128i __W, __mmask8 __U, __m128i __A)
|
|
1765
1698
|
{
|
|
1766
1699
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1768,7 +1701,7 @@ _mm_mask_cvtepi8_epi16(__m128i __W, __mmask8 __U, __m128i __A)
|
|
|
1768
1701
|
(__v8hi)__W);
|
|
1769
1702
|
}
|
|
1770
1703
|
|
|
1771
|
-
static __inline__ __m128i
|
|
1704
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1772
1705
|
_mm_maskz_cvtepi8_epi16(__mmask8 __U, __m128i __A)
|
|
1773
1706
|
{
|
|
1774
1707
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1776,7 +1709,7 @@ _mm_maskz_cvtepi8_epi16(__mmask8 __U, __m128i __A)
|
|
|
1776
1709
|
(__v8hi)_mm_setzero_si128());
|
|
1777
1710
|
}
|
|
1778
1711
|
|
|
1779
|
-
static __inline__ __m256i
|
|
1712
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1780
1713
|
_mm256_mask_cvtepi8_epi16(__m256i __W, __mmask16 __U, __m128i __A)
|
|
1781
1714
|
{
|
|
1782
1715
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1784,7 +1717,7 @@ _mm256_mask_cvtepi8_epi16(__m256i __W, __mmask16 __U, __m128i __A)
|
|
|
1784
1717
|
(__v16hi)__W);
|
|
1785
1718
|
}
|
|
1786
1719
|
|
|
1787
|
-
static __inline__ __m256i
|
|
1720
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1788
1721
|
_mm256_maskz_cvtepi8_epi16(__mmask16 __U, __m128i __A)
|
|
1789
1722
|
{
|
|
1790
1723
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1793,7 +1726,7 @@ _mm256_maskz_cvtepi8_epi16(__mmask16 __U, __m128i __A)
|
|
|
1793
1726
|
}
|
|
1794
1727
|
|
|
1795
1728
|
|
|
1796
|
-
static __inline__ __m128i
|
|
1729
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1797
1730
|
_mm_mask_cvtepu8_epi16(__m128i __W, __mmask8 __U, __m128i __A)
|
|
1798
1731
|
{
|
|
1799
1732
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1801,7 +1734,7 @@ _mm_mask_cvtepu8_epi16(__m128i __W, __mmask8 __U, __m128i __A)
|
|
|
1801
1734
|
(__v8hi)__W);
|
|
1802
1735
|
}
|
|
1803
1736
|
|
|
1804
|
-
static __inline__ __m128i
|
|
1737
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1805
1738
|
_mm_maskz_cvtepu8_epi16(__mmask8 __U, __m128i __A)
|
|
1806
1739
|
{
|
|
1807
1740
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1809,7 +1742,7 @@ _mm_maskz_cvtepu8_epi16(__mmask8 __U, __m128i __A)
|
|
|
1809
1742
|
(__v8hi)_mm_setzero_si128());
|
|
1810
1743
|
}
|
|
1811
1744
|
|
|
1812
|
-
static __inline__ __m256i
|
|
1745
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1813
1746
|
_mm256_mask_cvtepu8_epi16(__m256i __W, __mmask16 __U, __m128i __A)
|
|
1814
1747
|
{
|
|
1815
1748
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1817,7 +1750,7 @@ _mm256_mask_cvtepu8_epi16(__m256i __W, __mmask16 __U, __m128i __A)
|
|
|
1817
1750
|
(__v16hi)__W);
|
|
1818
1751
|
}
|
|
1819
1752
|
|
|
1820
|
-
static __inline__ __m256i
|
|
1753
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1821
1754
|
_mm256_maskz_cvtepu8_epi16 (__mmask16 __U, __m128i __A)
|
|
1822
1755
|
{
|
|
1823
1756
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1868,13 +1801,13 @@ _mm256_maskz_cvtepu8_epi16 (__mmask16 __U, __m128i __A)
|
|
|
1868
1801
|
(imm)), \
|
|
1869
1802
|
(__v16hi)_mm256_setzero_si256()))
|
|
1870
1803
|
|
|
1871
|
-
static __inline__ __m256i
|
|
1804
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1872
1805
|
_mm256_sllv_epi16(__m256i __A, __m256i __B)
|
|
1873
1806
|
{
|
|
1874
1807
|
return (__m256i)__builtin_ia32_psllv16hi((__v16hi)__A, (__v16hi)__B);
|
|
1875
1808
|
}
|
|
1876
1809
|
|
|
1877
|
-
static __inline__ __m256i
|
|
1810
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1878
1811
|
_mm256_mask_sllv_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
1879
1812
|
{
|
|
1880
1813
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1882,7 +1815,7 @@ _mm256_mask_sllv_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
|
1882
1815
|
(__v16hi)__W);
|
|
1883
1816
|
}
|
|
1884
1817
|
|
|
1885
|
-
static __inline__ __m256i
|
|
1818
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1886
1819
|
_mm256_maskz_sllv_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
1887
1820
|
{
|
|
1888
1821
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1890,13 +1823,13 @@ _mm256_maskz_sllv_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
1890
1823
|
(__v16hi)_mm256_setzero_si256());
|
|
1891
1824
|
}
|
|
1892
1825
|
|
|
1893
|
-
static __inline__ __m128i
|
|
1826
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1894
1827
|
_mm_sllv_epi16(__m128i __A, __m128i __B)
|
|
1895
1828
|
{
|
|
1896
1829
|
return (__m128i)__builtin_ia32_psllv8hi((__v8hi)__A, (__v8hi)__B);
|
|
1897
1830
|
}
|
|
1898
1831
|
|
|
1899
|
-
static __inline__ __m128i
|
|
1832
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1900
1833
|
_mm_mask_sllv_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
1901
1834
|
{
|
|
1902
1835
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1904,7 +1837,7 @@ _mm_mask_sllv_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
|
1904
1837
|
(__v8hi)__W);
|
|
1905
1838
|
}
|
|
1906
1839
|
|
|
1907
|
-
static __inline__ __m128i
|
|
1840
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1908
1841
|
_mm_maskz_sllv_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
1909
1842
|
{
|
|
1910
1843
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1944,7 +1877,7 @@ _mm256_maskz_sll_epi16(__mmask16 __U, __m256i __A, __m128i __B)
|
|
|
1944
1877
|
(__v16hi)_mm256_setzero_si256());
|
|
1945
1878
|
}
|
|
1946
1879
|
|
|
1947
|
-
static __inline__ __m128i
|
|
1880
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1948
1881
|
_mm_mask_slli_epi16(__m128i __W, __mmask8 __U, __m128i __A, unsigned int __B)
|
|
1949
1882
|
{
|
|
1950
1883
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1952,7 +1885,7 @@ _mm_mask_slli_epi16(__m128i __W, __mmask8 __U, __m128i __A, unsigned int __B)
|
|
|
1952
1885
|
(__v8hi)__W);
|
|
1953
1886
|
}
|
|
1954
1887
|
|
|
1955
|
-
static __inline__ __m128i
|
|
1888
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
1956
1889
|
_mm_maskz_slli_epi16 (__mmask8 __U, __m128i __A, unsigned int __B)
|
|
1957
1890
|
{
|
|
1958
1891
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -1960,30 +1893,28 @@ _mm_maskz_slli_epi16 (__mmask8 __U, __m128i __A, unsigned int __B)
|
|
|
1960
1893
|
(__v8hi)_mm_setzero_si128());
|
|
1961
1894
|
}
|
|
1962
1895
|
|
|
1963
|
-
static __inline__ __m256i
|
|
1896
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1964
1897
|
_mm256_mask_slli_epi16(__m256i __W, __mmask16 __U, __m256i __A,
|
|
1965
|
-
unsigned int __B)
|
|
1966
|
-
{
|
|
1898
|
+
unsigned int __B) {
|
|
1967
1899
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1968
1900
|
(__v16hi)_mm256_slli_epi16(__A, (int)__B),
|
|
1969
1901
|
(__v16hi)__W);
|
|
1970
1902
|
}
|
|
1971
1903
|
|
|
1972
|
-
static __inline__ __m256i
|
|
1973
|
-
_mm256_maskz_slli_epi16(__mmask16 __U, __m256i __A, unsigned int __B)
|
|
1974
|
-
{
|
|
1904
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1905
|
+
_mm256_maskz_slli_epi16(__mmask16 __U, __m256i __A, unsigned int __B) {
|
|
1975
1906
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
1976
1907
|
(__v16hi)_mm256_slli_epi16(__A, (int)__B),
|
|
1977
1908
|
(__v16hi)_mm256_setzero_si256());
|
|
1978
1909
|
}
|
|
1979
1910
|
|
|
1980
|
-
static __inline__ __m256i
|
|
1911
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1981
1912
|
_mm256_srlv_epi16(__m256i __A, __m256i __B)
|
|
1982
1913
|
{
|
|
1983
1914
|
return (__m256i)__builtin_ia32_psrlv16hi((__v16hi)__A, (__v16hi)__B);
|
|
1984
1915
|
}
|
|
1985
1916
|
|
|
1986
|
-
static __inline__ __m256i
|
|
1917
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1987
1918
|
_mm256_mask_srlv_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
1988
1919
|
{
|
|
1989
1920
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1991,7 +1922,7 @@ _mm256_mask_srlv_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
|
1991
1922
|
(__v16hi)__W);
|
|
1992
1923
|
}
|
|
1993
1924
|
|
|
1994
|
-
static __inline__ __m256i
|
|
1925
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
1995
1926
|
_mm256_maskz_srlv_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
1996
1927
|
{
|
|
1997
1928
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -1999,13 +1930,13 @@ _mm256_maskz_srlv_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
1999
1930
|
(__v16hi)_mm256_setzero_si256());
|
|
2000
1931
|
}
|
|
2001
1932
|
|
|
2002
|
-
static __inline__ __m128i
|
|
1933
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2003
1934
|
_mm_srlv_epi16(__m128i __A, __m128i __B)
|
|
2004
1935
|
{
|
|
2005
1936
|
return (__m128i)__builtin_ia32_psrlv8hi((__v8hi)__A, (__v8hi)__B);
|
|
2006
1937
|
}
|
|
2007
1938
|
|
|
2008
|
-
static __inline__ __m128i
|
|
1939
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2009
1940
|
_mm_mask_srlv_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
2010
1941
|
{
|
|
2011
1942
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -2013,7 +1944,7 @@ _mm_mask_srlv_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
|
2013
1944
|
(__v8hi)__W);
|
|
2014
1945
|
}
|
|
2015
1946
|
|
|
2016
|
-
static __inline__ __m128i
|
|
1947
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2017
1948
|
_mm_maskz_srlv_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
2018
1949
|
{
|
|
2019
1950
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -2021,13 +1952,13 @@ _mm_maskz_srlv_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
|
2021
1952
|
(__v8hi)_mm_setzero_si128());
|
|
2022
1953
|
}
|
|
2023
1954
|
|
|
2024
|
-
static __inline__ __m256i
|
|
1955
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2025
1956
|
_mm256_srav_epi16(__m256i __A, __m256i __B)
|
|
2026
1957
|
{
|
|
2027
1958
|
return (__m256i)__builtin_ia32_psrav16hi((__v16hi)__A, (__v16hi)__B);
|
|
2028
1959
|
}
|
|
2029
1960
|
|
|
2030
|
-
static __inline__ __m256i
|
|
1961
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2031
1962
|
_mm256_mask_srav_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
2032
1963
|
{
|
|
2033
1964
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -2035,7 +1966,7 @@ _mm256_mask_srav_epi16(__m256i __W, __mmask16 __U, __m256i __A, __m256i __B)
|
|
|
2035
1966
|
(__v16hi)__W);
|
|
2036
1967
|
}
|
|
2037
1968
|
|
|
2038
|
-
static __inline__ __m256i
|
|
1969
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2039
1970
|
_mm256_maskz_srav_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
2040
1971
|
{
|
|
2041
1972
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
@@ -2043,13 +1974,13 @@ _mm256_maskz_srav_epi16(__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
2043
1974
|
(__v16hi)_mm256_setzero_si256());
|
|
2044
1975
|
}
|
|
2045
1976
|
|
|
2046
|
-
static __inline__ __m128i
|
|
1977
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2047
1978
|
_mm_srav_epi16(__m128i __A, __m128i __B)
|
|
2048
1979
|
{
|
|
2049
1980
|
return (__m128i)__builtin_ia32_psrav8hi((__v8hi)__A, (__v8hi)__B);
|
|
2050
1981
|
}
|
|
2051
1982
|
|
|
2052
|
-
static __inline__ __m128i
|
|
1983
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2053
1984
|
_mm_mask_srav_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
2054
1985
|
{
|
|
2055
1986
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -2057,7 +1988,7 @@ _mm_mask_srav_epi16(__m128i __W, __mmask8 __U, __m128i __A, __m128i __B)
|
|
|
2057
1988
|
(__v8hi)__W);
|
|
2058
1989
|
}
|
|
2059
1990
|
|
|
2060
|
-
static __inline__ __m128i
|
|
1991
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2061
1992
|
_mm_maskz_srav_epi16(__mmask8 __U, __m128i __A, __m128i __B)
|
|
2062
1993
|
{
|
|
2063
1994
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
@@ -2097,34 +2028,30 @@ _mm256_maskz_sra_epi16(__mmask16 __U, __m256i __A, __m128i __B)
|
|
|
2097
2028
|
(__v16hi)_mm256_setzero_si256());
|
|
2098
2029
|
}
|
|
2099
2030
|
|
|
2100
|
-
static __inline__ __m128i
|
|
2101
|
-
_mm_mask_srai_epi16(__m128i __W, __mmask8 __U, __m128i __A, unsigned int __B)
|
|
2102
|
-
{
|
|
2031
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2032
|
+
_mm_mask_srai_epi16(__m128i __W, __mmask8 __U, __m128i __A, unsigned int __B) {
|
|
2103
2033
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
2104
2034
|
(__v8hi)_mm_srai_epi16(__A, (int)__B),
|
|
2105
2035
|
(__v8hi)__W);
|
|
2106
2036
|
}
|
|
2107
2037
|
|
|
2108
|
-
static __inline__ __m128i
|
|
2109
|
-
_mm_maskz_srai_epi16(__mmask8 __U, __m128i __A, unsigned int __B)
|
|
2110
|
-
{
|
|
2038
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2039
|
+
_mm_maskz_srai_epi16(__mmask8 __U, __m128i __A, unsigned int __B) {
|
|
2111
2040
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
2112
2041
|
(__v8hi)_mm_srai_epi16(__A, (int)__B),
|
|
2113
2042
|
(__v8hi)_mm_setzero_si128());
|
|
2114
2043
|
}
|
|
2115
2044
|
|
|
2116
|
-
static __inline__ __m256i
|
|
2045
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2117
2046
|
_mm256_mask_srai_epi16(__m256i __W, __mmask16 __U, __m256i __A,
|
|
2118
|
-
unsigned int __B)
|
|
2119
|
-
{
|
|
2047
|
+
unsigned int __B) {
|
|
2120
2048
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
2121
2049
|
(__v16hi)_mm256_srai_epi16(__A, (int)__B),
|
|
2122
2050
|
(__v16hi)__W);
|
|
2123
2051
|
}
|
|
2124
2052
|
|
|
2125
|
-
static __inline__ __m256i
|
|
2126
|
-
_mm256_maskz_srai_epi16(__mmask16 __U, __m256i __A, unsigned int __B)
|
|
2127
|
-
{
|
|
2053
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2054
|
+
_mm256_maskz_srai_epi16(__mmask16 __U, __m256i __A, unsigned int __B) {
|
|
2128
2055
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
2129
2056
|
(__v16hi)_mm256_srai_epi16(__A, (int)__B),
|
|
2130
2057
|
(__v16hi)_mm256_setzero_si256());
|
|
@@ -2162,104 +2089,91 @@ _mm256_maskz_srl_epi16(__mmask16 __U, __m256i __A, __m128i __B)
|
|
|
2162
2089
|
(__v16hi)_mm256_setzero_si256());
|
|
2163
2090
|
}
|
|
2164
2091
|
|
|
2165
|
-
static __inline__ __m128i
|
|
2166
|
-
_mm_mask_srli_epi16(__m128i __W, __mmask8 __U, __m128i __A, int __B)
|
|
2167
|
-
{
|
|
2092
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2093
|
+
_mm_mask_srli_epi16(__m128i __W, __mmask8 __U, __m128i __A, int __B) {
|
|
2168
2094
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
2169
2095
|
(__v8hi)_mm_srli_epi16(__A, __B),
|
|
2170
2096
|
(__v8hi)__W);
|
|
2171
2097
|
}
|
|
2172
2098
|
|
|
2173
|
-
static __inline__ __m128i
|
|
2174
|
-
_mm_maskz_srli_epi16
|
|
2175
|
-
{
|
|
2099
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2100
|
+
_mm_maskz_srli_epi16(__mmask8 __U, __m128i __A, int __B) {
|
|
2176
2101
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__U,
|
|
2177
2102
|
(__v8hi)_mm_srli_epi16(__A, __B),
|
|
2178
2103
|
(__v8hi)_mm_setzero_si128());
|
|
2179
2104
|
}
|
|
2180
2105
|
|
|
2181
|
-
static __inline__ __m256i
|
|
2182
|
-
_mm256_mask_srli_epi16(__m256i __W, __mmask16 __U, __m256i __A, int __B)
|
|
2183
|
-
{
|
|
2106
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2107
|
+
_mm256_mask_srli_epi16(__m256i __W, __mmask16 __U, __m256i __A, int __B) {
|
|
2184
2108
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
2185
2109
|
(__v16hi)_mm256_srli_epi16(__A, __B),
|
|
2186
2110
|
(__v16hi)__W);
|
|
2187
2111
|
}
|
|
2188
2112
|
|
|
2189
|
-
static __inline__ __m256i
|
|
2190
|
-
_mm256_maskz_srli_epi16(__mmask16 __U, __m256i __A, int __B)
|
|
2191
|
-
{
|
|
2113
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2114
|
+
_mm256_maskz_srli_epi16(__mmask16 __U, __m256i __A, int __B) {
|
|
2192
2115
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__U,
|
|
2193
2116
|
(__v16hi)_mm256_srli_epi16(__A, __B),
|
|
2194
2117
|
(__v16hi)_mm256_setzero_si256());
|
|
2195
2118
|
}
|
|
2196
2119
|
|
|
2197
|
-
static __inline__ __m128i
|
|
2198
|
-
_mm_mask_mov_epi16
|
|
2199
|
-
{
|
|
2120
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2121
|
+
_mm_mask_mov_epi16(__m128i __W, __mmask8 __U, __m128i __A) {
|
|
2200
2122
|
return (__m128i) __builtin_ia32_selectw_128 ((__mmask8) __U,
|
|
2201
2123
|
(__v8hi) __A,
|
|
2202
2124
|
(__v8hi) __W);
|
|
2203
2125
|
}
|
|
2204
2126
|
|
|
2205
|
-
static __inline__ __m128i
|
|
2206
|
-
_mm_maskz_mov_epi16
|
|
2207
|
-
{
|
|
2127
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2128
|
+
_mm_maskz_mov_epi16(__mmask8 __U, __m128i __A) {
|
|
2208
2129
|
return (__m128i) __builtin_ia32_selectw_128 ((__mmask8) __U,
|
|
2209
2130
|
(__v8hi) __A,
|
|
2210
2131
|
(__v8hi) _mm_setzero_si128 ());
|
|
2211
2132
|
}
|
|
2212
2133
|
|
|
2213
|
-
static __inline__ __m256i
|
|
2214
|
-
_mm256_mask_mov_epi16
|
|
2215
|
-
{
|
|
2134
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2135
|
+
_mm256_mask_mov_epi16(__m256i __W, __mmask16 __U, __m256i __A) {
|
|
2216
2136
|
return (__m256i) __builtin_ia32_selectw_256 ((__mmask16) __U,
|
|
2217
2137
|
(__v16hi) __A,
|
|
2218
2138
|
(__v16hi) __W);
|
|
2219
2139
|
}
|
|
2220
2140
|
|
|
2221
|
-
static __inline__ __m256i
|
|
2222
|
-
_mm256_maskz_mov_epi16
|
|
2223
|
-
{
|
|
2141
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2142
|
+
_mm256_maskz_mov_epi16(__mmask16 __U, __m256i __A) {
|
|
2224
2143
|
return (__m256i) __builtin_ia32_selectw_256 ((__mmask16) __U,
|
|
2225
2144
|
(__v16hi) __A,
|
|
2226
2145
|
(__v16hi) _mm256_setzero_si256 ());
|
|
2227
2146
|
}
|
|
2228
2147
|
|
|
2229
|
-
static __inline__ __m128i
|
|
2230
|
-
_mm_mask_mov_epi8
|
|
2231
|
-
{
|
|
2148
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2149
|
+
_mm_mask_mov_epi8(__m128i __W, __mmask16 __U, __m128i __A) {
|
|
2232
2150
|
return (__m128i) __builtin_ia32_selectb_128 ((__mmask16) __U,
|
|
2233
2151
|
(__v16qi) __A,
|
|
2234
2152
|
(__v16qi) __W);
|
|
2235
2153
|
}
|
|
2236
2154
|
|
|
2237
|
-
static __inline__ __m128i
|
|
2238
|
-
_mm_maskz_mov_epi8
|
|
2239
|
-
{
|
|
2155
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2156
|
+
_mm_maskz_mov_epi8(__mmask16 __U, __m128i __A) {
|
|
2240
2157
|
return (__m128i) __builtin_ia32_selectb_128 ((__mmask16) __U,
|
|
2241
2158
|
(__v16qi) __A,
|
|
2242
2159
|
(__v16qi) _mm_setzero_si128 ());
|
|
2243
2160
|
}
|
|
2244
2161
|
|
|
2245
|
-
static __inline__ __m256i
|
|
2246
|
-
_mm256_mask_mov_epi8
|
|
2247
|
-
{
|
|
2162
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2163
|
+
_mm256_mask_mov_epi8(__m256i __W, __mmask32 __U, __m256i __A) {
|
|
2248
2164
|
return (__m256i) __builtin_ia32_selectb_256 ((__mmask32) __U,
|
|
2249
2165
|
(__v32qi) __A,
|
|
2250
2166
|
(__v32qi) __W);
|
|
2251
2167
|
}
|
|
2252
2168
|
|
|
2253
|
-
static __inline__ __m256i
|
|
2254
|
-
_mm256_maskz_mov_epi8
|
|
2255
|
-
{
|
|
2169
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2170
|
+
_mm256_maskz_mov_epi8(__mmask32 __U, __m256i __A) {
|
|
2256
2171
|
return (__m256i) __builtin_ia32_selectb_256 ((__mmask32) __U,
|
|
2257
2172
|
(__v32qi) __A,
|
|
2258
2173
|
(__v32qi) _mm256_setzero_si256 ());
|
|
2259
2174
|
}
|
|
2260
2175
|
|
|
2261
|
-
|
|
2262
|
-
static __inline__ __m128i __DEFAULT_FN_ATTRS128
|
|
2176
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2263
2177
|
_mm_mask_set1_epi8 (__m128i __O, __mmask16 __M, char __A)
|
|
2264
2178
|
{
|
|
2265
2179
|
return (__m128i) __builtin_ia32_selectb_128(__M,
|
|
@@ -2267,7 +2181,7 @@ _mm_mask_set1_epi8 (__m128i __O, __mmask16 __M, char __A)
|
|
|
2267
2181
|
(__v16qi) __O);
|
|
2268
2182
|
}
|
|
2269
2183
|
|
|
2270
|
-
static __inline__ __m128i
|
|
2184
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2271
2185
|
_mm_maskz_set1_epi8 (__mmask16 __M, char __A)
|
|
2272
2186
|
{
|
|
2273
2187
|
return (__m128i) __builtin_ia32_selectb_128(__M,
|
|
@@ -2275,7 +2189,7 @@ _mm_maskz_set1_epi8 (__mmask16 __M, char __A)
|
|
|
2275
2189
|
(__v16qi) _mm_setzero_si128());
|
|
2276
2190
|
}
|
|
2277
2191
|
|
|
2278
|
-
static __inline__ __m256i
|
|
2192
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2279
2193
|
_mm256_mask_set1_epi8 (__m256i __O, __mmask32 __M, char __A)
|
|
2280
2194
|
{
|
|
2281
2195
|
return (__m256i) __builtin_ia32_selectb_256(__M,
|
|
@@ -2283,7 +2197,7 @@ _mm256_mask_set1_epi8 (__m256i __O, __mmask32 __M, char __A)
|
|
|
2283
2197
|
(__v32qi) __O);
|
|
2284
2198
|
}
|
|
2285
2199
|
|
|
2286
|
-
static __inline__ __m256i
|
|
2200
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2287
2201
|
_mm256_maskz_set1_epi8 (__mmask32 __M, char __A)
|
|
2288
2202
|
{
|
|
2289
2203
|
return (__m256i) __builtin_ia32_selectb_256(__M,
|
|
@@ -2463,22 +2377,19 @@ _mm256_mask_storeu_epi8 (void *__P, __mmask32 __U, __m256i __A)
|
|
|
2463
2377
|
(__mmask32) __U);
|
|
2464
2378
|
}
|
|
2465
2379
|
|
|
2466
|
-
static __inline__ __mmask16
|
|
2467
|
-
_mm_test_epi8_mask
|
|
2468
|
-
{
|
|
2380
|
+
static __inline__ __mmask16 __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2381
|
+
_mm_test_epi8_mask(__m128i __A, __m128i __B) {
|
|
2469
2382
|
return _mm_cmpneq_epi8_mask (_mm_and_si128(__A, __B), _mm_setzero_si128());
|
|
2470
2383
|
}
|
|
2471
2384
|
|
|
2472
|
-
static __inline__ __mmask16
|
|
2473
|
-
_mm_mask_test_epi8_mask
|
|
2474
|
-
{
|
|
2385
|
+
static __inline__ __mmask16 __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2386
|
+
_mm_mask_test_epi8_mask(__mmask16 __U, __m128i __A, __m128i __B) {
|
|
2475
2387
|
return _mm_mask_cmpneq_epi8_mask (__U, _mm_and_si128 (__A, __B),
|
|
2476
2388
|
_mm_setzero_si128());
|
|
2477
2389
|
}
|
|
2478
2390
|
|
|
2479
|
-
static __inline__ __mmask32
|
|
2480
|
-
_mm256_test_epi8_mask
|
|
2481
|
-
{
|
|
2391
|
+
static __inline__ __mmask32 __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2392
|
+
_mm256_test_epi8_mask(__m256i __A, __m256i __B) {
|
|
2482
2393
|
return _mm256_cmpneq_epi8_mask (_mm256_and_si256(__A, __B),
|
|
2483
2394
|
_mm256_setzero_si256());
|
|
2484
2395
|
}
|
|
@@ -2517,9 +2428,8 @@ _mm256_mask_test_epi16_mask (__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
2517
2428
|
_mm256_setzero_si256());
|
|
2518
2429
|
}
|
|
2519
2430
|
|
|
2520
|
-
static __inline__ __mmask16
|
|
2521
|
-
_mm_testn_epi8_mask
|
|
2522
|
-
{
|
|
2431
|
+
static __inline__ __mmask16 __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2432
|
+
_mm_testn_epi8_mask(__m128i __A, __m128i __B) {
|
|
2523
2433
|
return _mm_cmpeq_epi8_mask (_mm_and_si128 (__A, __B), _mm_setzero_si128());
|
|
2524
2434
|
}
|
|
2525
2435
|
|
|
@@ -2570,55 +2480,47 @@ _mm256_mask_testn_epi16_mask (__mmask16 __U, __m256i __A, __m256i __B)
|
|
|
2570
2480
|
_mm256_setzero_si256());
|
|
2571
2481
|
}
|
|
2572
2482
|
|
|
2573
|
-
static __inline__ __mmask16
|
|
2574
|
-
_mm_movepi8_mask
|
|
2575
|
-
{
|
|
2483
|
+
static __inline__ __mmask16 __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2484
|
+
_mm_movepi8_mask(__m128i __A) {
|
|
2576
2485
|
return (__mmask16) __builtin_ia32_cvtb2mask128 ((__v16qi) __A);
|
|
2577
2486
|
}
|
|
2578
2487
|
|
|
2579
|
-
static __inline__ __mmask32
|
|
2580
|
-
_mm256_movepi8_mask
|
|
2581
|
-
{
|
|
2488
|
+
static __inline__ __mmask32 __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2489
|
+
_mm256_movepi8_mask(__m256i __A) {
|
|
2582
2490
|
return (__mmask32) __builtin_ia32_cvtb2mask256 ((__v32qi) __A);
|
|
2583
2491
|
}
|
|
2584
2492
|
|
|
2585
|
-
static __inline__ __mmask8
|
|
2586
|
-
_mm_movepi16_mask
|
|
2587
|
-
{
|
|
2493
|
+
static __inline__ __mmask8 __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2494
|
+
_mm_movepi16_mask(__m128i __A) {
|
|
2588
2495
|
return (__mmask8) __builtin_ia32_cvtw2mask128 ((__v8hi) __A);
|
|
2589
2496
|
}
|
|
2590
2497
|
|
|
2591
|
-
static __inline__ __mmask16
|
|
2592
|
-
_mm256_movepi16_mask
|
|
2593
|
-
{
|
|
2498
|
+
static __inline__ __mmask16 __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2499
|
+
_mm256_movepi16_mask(__m256i __A) {
|
|
2594
2500
|
return (__mmask16) __builtin_ia32_cvtw2mask256 ((__v16hi) __A);
|
|
2595
2501
|
}
|
|
2596
2502
|
|
|
2597
|
-
static __inline__ __m128i
|
|
2598
|
-
_mm_movm_epi8
|
|
2599
|
-
{
|
|
2503
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2504
|
+
_mm_movm_epi8(__mmask16 __A) {
|
|
2600
2505
|
return (__m128i) __builtin_ia32_cvtmask2b128 (__A);
|
|
2601
2506
|
}
|
|
2602
2507
|
|
|
2603
|
-
static __inline__ __m256i
|
|
2604
|
-
_mm256_movm_epi8
|
|
2605
|
-
{
|
|
2508
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2509
|
+
_mm256_movm_epi8(__mmask32 __A) {
|
|
2606
2510
|
return (__m256i) __builtin_ia32_cvtmask2b256 (__A);
|
|
2607
2511
|
}
|
|
2608
2512
|
|
|
2609
|
-
static __inline__ __m128i
|
|
2610
|
-
_mm_movm_epi16
|
|
2611
|
-
{
|
|
2513
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2514
|
+
_mm_movm_epi16(__mmask8 __A) {
|
|
2612
2515
|
return (__m128i) __builtin_ia32_cvtmask2w128 (__A);
|
|
2613
2516
|
}
|
|
2614
2517
|
|
|
2615
|
-
static __inline__ __m256i
|
|
2616
|
-
_mm256_movm_epi16
|
|
2617
|
-
{
|
|
2518
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2519
|
+
_mm256_movm_epi16(__mmask16 __A) {
|
|
2618
2520
|
return (__m256i) __builtin_ia32_cvtmask2w256 (__A);
|
|
2619
2521
|
}
|
|
2620
2522
|
|
|
2621
|
-
static __inline__ __m128i
|
|
2523
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2622
2524
|
_mm_mask_broadcastb_epi8 (__m128i __O, __mmask16 __M, __m128i __A)
|
|
2623
2525
|
{
|
|
2624
2526
|
return (__m128i)__builtin_ia32_selectb_128(__M,
|
|
@@ -2626,7 +2528,7 @@ _mm_mask_broadcastb_epi8 (__m128i __O, __mmask16 __M, __m128i __A)
|
|
|
2626
2528
|
(__v16qi) __O);
|
|
2627
2529
|
}
|
|
2628
2530
|
|
|
2629
|
-
static __inline__ __m128i
|
|
2531
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2630
2532
|
_mm_maskz_broadcastb_epi8 (__mmask16 __M, __m128i __A)
|
|
2631
2533
|
{
|
|
2632
2534
|
return (__m128i)__builtin_ia32_selectb_128(__M,
|
|
@@ -2634,7 +2536,7 @@ _mm_maskz_broadcastb_epi8 (__mmask16 __M, __m128i __A)
|
|
|
2634
2536
|
(__v16qi) _mm_setzero_si128());
|
|
2635
2537
|
}
|
|
2636
2538
|
|
|
2637
|
-
static __inline__ __m256i
|
|
2539
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2638
2540
|
_mm256_mask_broadcastb_epi8 (__m256i __O, __mmask32 __M, __m128i __A)
|
|
2639
2541
|
{
|
|
2640
2542
|
return (__m256i)__builtin_ia32_selectb_256(__M,
|
|
@@ -2642,7 +2544,7 @@ _mm256_mask_broadcastb_epi8 (__m256i __O, __mmask32 __M, __m128i __A)
|
|
|
2642
2544
|
(__v32qi) __O);
|
|
2643
2545
|
}
|
|
2644
2546
|
|
|
2645
|
-
static __inline__ __m256i
|
|
2547
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2646
2548
|
_mm256_maskz_broadcastb_epi8 (__mmask32 __M, __m128i __A)
|
|
2647
2549
|
{
|
|
2648
2550
|
return (__m256i)__builtin_ia32_selectb_256(__M,
|
|
@@ -2650,7 +2552,7 @@ _mm256_maskz_broadcastb_epi8 (__mmask32 __M, __m128i __A)
|
|
|
2650
2552
|
(__v32qi) _mm256_setzero_si256());
|
|
2651
2553
|
}
|
|
2652
2554
|
|
|
2653
|
-
static __inline__ __m128i
|
|
2555
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2654
2556
|
_mm_mask_broadcastw_epi16 (__m128i __O, __mmask8 __M, __m128i __A)
|
|
2655
2557
|
{
|
|
2656
2558
|
return (__m128i)__builtin_ia32_selectw_128(__M,
|
|
@@ -2658,7 +2560,7 @@ _mm_mask_broadcastw_epi16 (__m128i __O, __mmask8 __M, __m128i __A)
|
|
|
2658
2560
|
(__v8hi) __O);
|
|
2659
2561
|
}
|
|
2660
2562
|
|
|
2661
|
-
static __inline__ __m128i
|
|
2563
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2662
2564
|
_mm_maskz_broadcastw_epi16 (__mmask8 __M, __m128i __A)
|
|
2663
2565
|
{
|
|
2664
2566
|
return (__m128i)__builtin_ia32_selectw_128(__M,
|
|
@@ -2666,7 +2568,7 @@ _mm_maskz_broadcastw_epi16 (__mmask8 __M, __m128i __A)
|
|
|
2666
2568
|
(__v8hi) _mm_setzero_si128());
|
|
2667
2569
|
}
|
|
2668
2570
|
|
|
2669
|
-
static __inline__ __m256i
|
|
2571
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2670
2572
|
_mm256_mask_broadcastw_epi16 (__m256i __O, __mmask16 __M, __m128i __A)
|
|
2671
2573
|
{
|
|
2672
2574
|
return (__m256i)__builtin_ia32_selectw_256(__M,
|
|
@@ -2674,7 +2576,7 @@ _mm256_mask_broadcastw_epi16 (__m256i __O, __mmask16 __M, __m128i __A)
|
|
|
2674
2576
|
(__v16hi) __O);
|
|
2675
2577
|
}
|
|
2676
2578
|
|
|
2677
|
-
static __inline__ __m256i
|
|
2579
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2678
2580
|
_mm256_maskz_broadcastw_epi16 (__mmask16 __M, __m128i __A)
|
|
2679
2581
|
{
|
|
2680
2582
|
return (__m256i)__builtin_ia32_selectw_256(__M,
|
|
@@ -2682,7 +2584,7 @@ _mm256_maskz_broadcastw_epi16 (__mmask16 __M, __m128i __A)
|
|
|
2682
2584
|
(__v16hi) _mm256_setzero_si256());
|
|
2683
2585
|
}
|
|
2684
2586
|
|
|
2685
|
-
static __inline__ __m256i
|
|
2587
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2686
2588
|
_mm256_mask_set1_epi16 (__m256i __O, __mmask16 __M, short __A)
|
|
2687
2589
|
{
|
|
2688
2590
|
return (__m256i) __builtin_ia32_selectw_256 (__M,
|
|
@@ -2690,7 +2592,7 @@ _mm256_mask_set1_epi16 (__m256i __O, __mmask16 __M, short __A)
|
|
|
2690
2592
|
(__v16hi) __O);
|
|
2691
2593
|
}
|
|
2692
2594
|
|
|
2693
|
-
static __inline__ __m256i
|
|
2595
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2694
2596
|
_mm256_maskz_set1_epi16 (__mmask16 __M, short __A)
|
|
2695
2597
|
{
|
|
2696
2598
|
return (__m256i) __builtin_ia32_selectw_256(__M,
|
|
@@ -2698,7 +2600,7 @@ _mm256_maskz_set1_epi16 (__mmask16 __M, short __A)
|
|
|
2698
2600
|
(__v16hi) _mm256_setzero_si256());
|
|
2699
2601
|
}
|
|
2700
2602
|
|
|
2701
|
-
static __inline__ __m128i
|
|
2603
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2702
2604
|
_mm_mask_set1_epi16 (__m128i __O, __mmask8 __M, short __A)
|
|
2703
2605
|
{
|
|
2704
2606
|
return (__m128i) __builtin_ia32_selectw_128(__M,
|
|
@@ -2706,7 +2608,7 @@ _mm_mask_set1_epi16 (__m128i __O, __mmask8 __M, short __A)
|
|
|
2706
2608
|
(__v8hi) __O);
|
|
2707
2609
|
}
|
|
2708
2610
|
|
|
2709
|
-
static __inline__ __m128i
|
|
2611
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2710
2612
|
_mm_maskz_set1_epi16 (__mmask8 __M, short __A)
|
|
2711
2613
|
{
|
|
2712
2614
|
return (__m128i) __builtin_ia32_selectw_128(__M,
|
|
@@ -2714,48 +2616,41 @@ _mm_maskz_set1_epi16 (__mmask8 __M, short __A)
|
|
|
2714
2616
|
(__v8hi) _mm_setzero_si128());
|
|
2715
2617
|
}
|
|
2716
2618
|
|
|
2717
|
-
static __inline__ __m128i
|
|
2718
|
-
_mm_permutexvar_epi16
|
|
2719
|
-
{
|
|
2619
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2620
|
+
_mm_permutexvar_epi16(__m128i __A, __m128i __B) {
|
|
2720
2621
|
return (__m128i)__builtin_ia32_permvarhi128((__v8hi) __B, (__v8hi) __A);
|
|
2721
2622
|
}
|
|
2722
2623
|
|
|
2723
|
-
static __inline__ __m128i
|
|
2724
|
-
_mm_maskz_permutexvar_epi16
|
|
2725
|
-
{
|
|
2624
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2625
|
+
_mm_maskz_permutexvar_epi16(__mmask8 __M, __m128i __A, __m128i __B) {
|
|
2726
2626
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
2727
2627
|
(__v8hi)_mm_permutexvar_epi16(__A, __B),
|
|
2728
2628
|
(__v8hi) _mm_setzero_si128());
|
|
2729
2629
|
}
|
|
2730
2630
|
|
|
2731
|
-
static __inline__ __m128i
|
|
2732
|
-
_mm_mask_permutexvar_epi16
|
|
2733
|
-
|
|
2734
|
-
{
|
|
2631
|
+
static __inline__ __m128i __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2632
|
+
_mm_mask_permutexvar_epi16(__m128i __W, __mmask8 __M, __m128i __A,
|
|
2633
|
+
__m128i __B) {
|
|
2735
2634
|
return (__m128i)__builtin_ia32_selectw_128((__mmask8)__M,
|
|
2736
2635
|
(__v8hi)_mm_permutexvar_epi16(__A, __B),
|
|
2737
2636
|
(__v8hi)__W);
|
|
2738
2637
|
}
|
|
2739
2638
|
|
|
2740
|
-
static __inline__ __m256i
|
|
2741
|
-
_mm256_permutexvar_epi16
|
|
2742
|
-
{
|
|
2639
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2640
|
+
_mm256_permutexvar_epi16(__m256i __A, __m256i __B) {
|
|
2743
2641
|
return (__m256i)__builtin_ia32_permvarhi256((__v16hi) __B, (__v16hi) __A);
|
|
2744
2642
|
}
|
|
2745
2643
|
|
|
2746
|
-
static __inline__ __m256i
|
|
2747
|
-
_mm256_maskz_permutexvar_epi16
|
|
2748
|
-
__m256i __B)
|
|
2749
|
-
{
|
|
2644
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2645
|
+
_mm256_maskz_permutexvar_epi16(__mmask16 __M, __m256i __A, __m256i __B) {
|
|
2750
2646
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
2751
2647
|
(__v16hi)_mm256_permutexvar_epi16(__A, __B),
|
|
2752
2648
|
(__v16hi)_mm256_setzero_si256());
|
|
2753
2649
|
}
|
|
2754
2650
|
|
|
2755
|
-
static __inline__ __m256i
|
|
2756
|
-
_mm256_mask_permutexvar_epi16
|
|
2757
|
-
|
|
2758
|
-
{
|
|
2651
|
+
static __inline__ __m256i __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2652
|
+
_mm256_mask_permutexvar_epi16(__m256i __W, __mmask16 __M, __m256i __A,
|
|
2653
|
+
__m256i __B) {
|
|
2759
2654
|
return (__m256i)__builtin_ia32_selectw_256((__mmask16)__M,
|
|
2760
2655
|
(__v16hi)_mm256_permutexvar_epi16(__A, __B),
|
|
2761
2656
|
(__v16hi)__W);
|
|
@@ -2809,353 +2704,353 @@ _mm256_mask_permutexvar_epi16 (__m256i __W, __mmask16 __M, __m256i __A,
|
|
|
2809
2704
|
(__v16hi)_mm256_dbsad_epu8((A), (B), (imm)), \
|
|
2810
2705
|
(__v16hi)_mm256_setzero_si256()))
|
|
2811
2706
|
|
|
2812
|
-
static __inline__ short
|
|
2707
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2813
2708
|
_mm_reduce_add_epi16(__m128i __W) {
|
|
2814
2709
|
return __builtin_reduce_add((__v8hi)__W);
|
|
2815
2710
|
}
|
|
2816
2711
|
|
|
2817
|
-
static __inline__ short
|
|
2712
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2818
2713
|
_mm_reduce_mul_epi16(__m128i __W) {
|
|
2819
2714
|
return __builtin_reduce_mul((__v8hi)__W);
|
|
2820
2715
|
}
|
|
2821
2716
|
|
|
2822
|
-
static __inline__ short
|
|
2717
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2823
2718
|
_mm_reduce_and_epi16(__m128i __W) {
|
|
2824
2719
|
return __builtin_reduce_and((__v8hi)__W);
|
|
2825
2720
|
}
|
|
2826
2721
|
|
|
2827
|
-
static __inline__ short
|
|
2722
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2828
2723
|
_mm_reduce_or_epi16(__m128i __W) {
|
|
2829
2724
|
return __builtin_reduce_or((__v8hi)__W);
|
|
2830
2725
|
}
|
|
2831
2726
|
|
|
2832
|
-
static __inline__ short
|
|
2833
|
-
_mm_mask_reduce_add_epi16(
|
|
2727
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2728
|
+
_mm_mask_reduce_add_epi16(__mmask8 __M, __m128i __W) {
|
|
2834
2729
|
__W = _mm_maskz_mov_epi16(__M, __W);
|
|
2835
2730
|
return __builtin_reduce_add((__v8hi)__W);
|
|
2836
2731
|
}
|
|
2837
2732
|
|
|
2838
|
-
static __inline__ short
|
|
2839
|
-
_mm_mask_reduce_mul_epi16(
|
|
2733
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2734
|
+
_mm_mask_reduce_mul_epi16(__mmask8 __M, __m128i __W) {
|
|
2840
2735
|
__W = _mm_mask_mov_epi16(_mm_set1_epi16(1), __M, __W);
|
|
2841
2736
|
return __builtin_reduce_mul((__v8hi)__W);
|
|
2842
2737
|
}
|
|
2843
2738
|
|
|
2844
|
-
static __inline__ short
|
|
2845
|
-
_mm_mask_reduce_and_epi16(
|
|
2739
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2740
|
+
_mm_mask_reduce_and_epi16(__mmask8 __M, __m128i __W) {
|
|
2846
2741
|
__W = _mm_mask_mov_epi16(_mm_set1_epi16(-1), __M, __W);
|
|
2847
2742
|
return __builtin_reduce_and((__v8hi)__W);
|
|
2848
2743
|
}
|
|
2849
2744
|
|
|
2850
|
-
static __inline__ short
|
|
2745
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2851
2746
|
_mm_mask_reduce_or_epi16(__mmask8 __M, __m128i __W) {
|
|
2852
2747
|
__W = _mm_maskz_mov_epi16(__M, __W);
|
|
2853
2748
|
return __builtin_reduce_or((__v8hi)__W);
|
|
2854
2749
|
}
|
|
2855
2750
|
|
|
2856
|
-
static __inline__ short
|
|
2751
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2857
2752
|
_mm_reduce_max_epi16(__m128i __V) {
|
|
2858
2753
|
return __builtin_reduce_max((__v8hi)__V);
|
|
2859
2754
|
}
|
|
2860
2755
|
|
|
2861
|
-
static __inline__ unsigned short
|
|
2756
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2862
2757
|
_mm_reduce_max_epu16(__m128i __V) {
|
|
2863
2758
|
return __builtin_reduce_max((__v8hu)__V);
|
|
2864
2759
|
}
|
|
2865
2760
|
|
|
2866
|
-
static __inline__ short
|
|
2761
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2867
2762
|
_mm_reduce_min_epi16(__m128i __V) {
|
|
2868
2763
|
return __builtin_reduce_min((__v8hi)__V);
|
|
2869
2764
|
}
|
|
2870
2765
|
|
|
2871
|
-
static __inline__ unsigned short
|
|
2766
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2872
2767
|
_mm_reduce_min_epu16(__m128i __V) {
|
|
2873
2768
|
return __builtin_reduce_min((__v8hu)__V);
|
|
2874
2769
|
}
|
|
2875
2770
|
|
|
2876
|
-
static __inline__ short
|
|
2771
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2877
2772
|
_mm_mask_reduce_max_epi16(__mmask16 __M, __m128i __V) {
|
|
2878
2773
|
__V = _mm_mask_mov_epi16(_mm_set1_epi16(-32767-1), __M, __V);
|
|
2879
2774
|
return __builtin_reduce_max((__v8hi)__V);
|
|
2880
2775
|
}
|
|
2881
2776
|
|
|
2882
|
-
static __inline__ unsigned short
|
|
2777
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2883
2778
|
_mm_mask_reduce_max_epu16(__mmask16 __M, __m128i __V) {
|
|
2884
2779
|
__V = _mm_maskz_mov_epi16(__M, __V);
|
|
2885
2780
|
return __builtin_reduce_max((__v8hu)__V);
|
|
2886
2781
|
}
|
|
2887
2782
|
|
|
2888
|
-
static __inline__ short
|
|
2783
|
+
static __inline__ short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2889
2784
|
_mm_mask_reduce_min_epi16(__mmask16 __M, __m128i __V) {
|
|
2890
2785
|
__V = _mm_mask_mov_epi16(_mm_set1_epi16(32767), __M, __V);
|
|
2891
2786
|
return __builtin_reduce_min((__v8hi)__V);
|
|
2892
2787
|
}
|
|
2893
2788
|
|
|
2894
|
-
static __inline__ unsigned short
|
|
2789
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2895
2790
|
_mm_mask_reduce_min_epu16(__mmask16 __M, __m128i __V) {
|
|
2896
2791
|
__V = _mm_mask_mov_epi16(_mm_set1_epi16(-1), __M, __V);
|
|
2897
2792
|
return __builtin_reduce_min((__v8hu)__V);
|
|
2898
2793
|
}
|
|
2899
2794
|
|
|
2900
|
-
static __inline__ short
|
|
2795
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2901
2796
|
_mm256_reduce_add_epi16(__m256i __W) {
|
|
2902
2797
|
return __builtin_reduce_add((__v16hi)__W);
|
|
2903
2798
|
}
|
|
2904
2799
|
|
|
2905
|
-
static __inline__ short
|
|
2800
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2906
2801
|
_mm256_reduce_mul_epi16(__m256i __W) {
|
|
2907
2802
|
return __builtin_reduce_mul((__v16hi)__W);
|
|
2908
2803
|
}
|
|
2909
2804
|
|
|
2910
|
-
static __inline__ short
|
|
2805
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2911
2806
|
_mm256_reduce_and_epi16(__m256i __W) {
|
|
2912
2807
|
return __builtin_reduce_and((__v16hi)__W);
|
|
2913
2808
|
}
|
|
2914
2809
|
|
|
2915
|
-
static __inline__ short
|
|
2810
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2916
2811
|
_mm256_reduce_or_epi16(__m256i __W) {
|
|
2917
2812
|
return __builtin_reduce_or((__v16hi)__W);
|
|
2918
2813
|
}
|
|
2919
2814
|
|
|
2920
|
-
static __inline__ short
|
|
2921
|
-
_mm256_mask_reduce_add_epi16(
|
|
2815
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2816
|
+
_mm256_mask_reduce_add_epi16(__mmask16 __M, __m256i __W) {
|
|
2922
2817
|
__W = _mm256_maskz_mov_epi16(__M, __W);
|
|
2923
2818
|
return __builtin_reduce_add((__v16hi)__W);
|
|
2924
2819
|
}
|
|
2925
2820
|
|
|
2926
|
-
static __inline__ short
|
|
2927
|
-
_mm256_mask_reduce_mul_epi16(
|
|
2821
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2822
|
+
_mm256_mask_reduce_mul_epi16(__mmask16 __M, __m256i __W) {
|
|
2928
2823
|
__W = _mm256_mask_mov_epi16(_mm256_set1_epi16(1), __M, __W);
|
|
2929
2824
|
return __builtin_reduce_mul((__v16hi)__W);
|
|
2930
2825
|
}
|
|
2931
2826
|
|
|
2932
|
-
static __inline__ short
|
|
2933
|
-
_mm256_mask_reduce_and_epi16(
|
|
2827
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2828
|
+
_mm256_mask_reduce_and_epi16(__mmask16 __M, __m256i __W) {
|
|
2934
2829
|
__W = _mm256_mask_mov_epi16(_mm256_set1_epi16(-1), __M, __W);
|
|
2935
2830
|
return __builtin_reduce_and((__v16hi)__W);
|
|
2936
2831
|
}
|
|
2937
2832
|
|
|
2938
|
-
static __inline__ short
|
|
2833
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2939
2834
|
_mm256_mask_reduce_or_epi16(__mmask16 __M, __m256i __W) {
|
|
2940
2835
|
__W = _mm256_maskz_mov_epi16(__M, __W);
|
|
2941
2836
|
return __builtin_reduce_or((__v16hi)__W);
|
|
2942
2837
|
}
|
|
2943
2838
|
|
|
2944
|
-
static __inline__ short
|
|
2839
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2945
2840
|
_mm256_reduce_max_epi16(__m256i __V) {
|
|
2946
2841
|
return __builtin_reduce_max((__v16hi)__V);
|
|
2947
2842
|
}
|
|
2948
2843
|
|
|
2949
|
-
static __inline__ unsigned short
|
|
2844
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2950
2845
|
_mm256_reduce_max_epu16(__m256i __V) {
|
|
2951
2846
|
return __builtin_reduce_max((__v16hu)__V);
|
|
2952
2847
|
}
|
|
2953
2848
|
|
|
2954
|
-
static __inline__ short
|
|
2849
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2955
2850
|
_mm256_reduce_min_epi16(__m256i __V) {
|
|
2956
2851
|
return __builtin_reduce_min((__v16hi)__V);
|
|
2957
2852
|
}
|
|
2958
2853
|
|
|
2959
|
-
static __inline__ unsigned short
|
|
2854
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2960
2855
|
_mm256_reduce_min_epu16(__m256i __V) {
|
|
2961
2856
|
return __builtin_reduce_min((__v16hu)__V);
|
|
2962
2857
|
}
|
|
2963
2858
|
|
|
2964
|
-
static __inline__ short
|
|
2859
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2965
2860
|
_mm256_mask_reduce_max_epi16(__mmask16 __M, __m256i __V) {
|
|
2966
2861
|
__V = _mm256_mask_mov_epi16(_mm256_set1_epi16(-32767-1), __M, __V);
|
|
2967
2862
|
return __builtin_reduce_max((__v16hi)__V);
|
|
2968
2863
|
}
|
|
2969
2864
|
|
|
2970
|
-
static __inline__ unsigned short
|
|
2865
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2971
2866
|
_mm256_mask_reduce_max_epu16(__mmask16 __M, __m256i __V) {
|
|
2972
2867
|
__V = _mm256_maskz_mov_epi16(__M, __V);
|
|
2973
2868
|
return __builtin_reduce_max((__v16hu)__V);
|
|
2974
2869
|
}
|
|
2975
2870
|
|
|
2976
|
-
static __inline__ short
|
|
2871
|
+
static __inline__ short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2977
2872
|
_mm256_mask_reduce_min_epi16(__mmask16 __M, __m256i __V) {
|
|
2978
2873
|
__V = _mm256_mask_mov_epi16(_mm256_set1_epi16(32767), __M, __V);
|
|
2979
2874
|
return __builtin_reduce_min((__v16hi)__V);
|
|
2980
2875
|
}
|
|
2981
2876
|
|
|
2982
|
-
static __inline__ unsigned short
|
|
2877
|
+
static __inline__ unsigned short __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
2983
2878
|
_mm256_mask_reduce_min_epu16(__mmask16 __M, __m256i __V) {
|
|
2984
2879
|
__V = _mm256_mask_mov_epi16(_mm256_set1_epi16(-1), __M, __V);
|
|
2985
2880
|
return __builtin_reduce_min((__v16hu)__V);
|
|
2986
2881
|
}
|
|
2987
2882
|
|
|
2988
|
-
static __inline__ signed char
|
|
2883
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2989
2884
|
_mm_reduce_add_epi8(__m128i __W) {
|
|
2990
2885
|
return __builtin_reduce_add((__v16qs)__W);
|
|
2991
2886
|
}
|
|
2992
2887
|
|
|
2993
|
-
static __inline__ signed char
|
|
2888
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2994
2889
|
_mm_reduce_mul_epi8(__m128i __W) {
|
|
2995
2890
|
return __builtin_reduce_mul((__v16qs)__W);
|
|
2996
2891
|
}
|
|
2997
2892
|
|
|
2998
|
-
static __inline__ signed char
|
|
2893
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
2999
2894
|
_mm_reduce_and_epi8(__m128i __W) {
|
|
3000
2895
|
return __builtin_reduce_and((__v16qs)__W);
|
|
3001
2896
|
}
|
|
3002
2897
|
|
|
3003
|
-
static __inline__ signed char
|
|
2898
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3004
2899
|
_mm_reduce_or_epi8(__m128i __W) {
|
|
3005
2900
|
return __builtin_reduce_or((__v16qs)__W);
|
|
3006
2901
|
}
|
|
3007
2902
|
|
|
3008
|
-
static __inline__ signed char
|
|
2903
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3009
2904
|
_mm_mask_reduce_add_epi8(__mmask16 __M, __m128i __W) {
|
|
3010
2905
|
__W = _mm_maskz_mov_epi8(__M, __W);
|
|
3011
2906
|
return __builtin_reduce_add((__v16qs)__W);
|
|
3012
2907
|
}
|
|
3013
2908
|
|
|
3014
|
-
static __inline__ signed char
|
|
2909
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3015
2910
|
_mm_mask_reduce_mul_epi8(__mmask16 __M, __m128i __W) {
|
|
3016
2911
|
__W = _mm_mask_mov_epi8(_mm_set1_epi8(1), __M, __W);
|
|
3017
2912
|
return __builtin_reduce_mul((__v16qs)__W);
|
|
3018
2913
|
}
|
|
3019
2914
|
|
|
3020
|
-
static __inline__ signed char
|
|
2915
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3021
2916
|
_mm_mask_reduce_and_epi8(__mmask16 __M, __m128i __W) {
|
|
3022
2917
|
__W = _mm_mask_mov_epi8(_mm_set1_epi8(-1), __M, __W);
|
|
3023
2918
|
return __builtin_reduce_and((__v16qs)__W);
|
|
3024
2919
|
}
|
|
3025
2920
|
|
|
3026
|
-
static __inline__ signed char
|
|
2921
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3027
2922
|
_mm_mask_reduce_or_epi8(__mmask16 __M, __m128i __W) {
|
|
3028
2923
|
__W = _mm_maskz_mov_epi8(__M, __W);
|
|
3029
2924
|
return __builtin_reduce_or((__v16qs)__W);
|
|
3030
2925
|
}
|
|
3031
2926
|
|
|
3032
|
-
static __inline__ signed char
|
|
2927
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3033
2928
|
_mm_reduce_max_epi8(__m128i __V) {
|
|
3034
2929
|
return __builtin_reduce_max((__v16qs)__V);
|
|
3035
2930
|
}
|
|
3036
2931
|
|
|
3037
|
-
static __inline__ unsigned char
|
|
2932
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3038
2933
|
_mm_reduce_max_epu8(__m128i __V) {
|
|
3039
2934
|
return __builtin_reduce_max((__v16qu)__V);
|
|
3040
2935
|
}
|
|
3041
2936
|
|
|
3042
|
-
static __inline__ signed char
|
|
2937
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3043
2938
|
_mm_reduce_min_epi8(__m128i __V) {
|
|
3044
2939
|
return __builtin_reduce_min((__v16qs)__V);
|
|
3045
2940
|
}
|
|
3046
2941
|
|
|
3047
|
-
static __inline__ unsigned char
|
|
2942
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3048
2943
|
_mm_reduce_min_epu8(__m128i __V) {
|
|
3049
2944
|
return __builtin_reduce_min((__v16qu)__V);
|
|
3050
2945
|
}
|
|
3051
2946
|
|
|
3052
|
-
static __inline__ signed char
|
|
2947
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3053
2948
|
_mm_mask_reduce_max_epi8(__mmask16 __M, __m128i __V) {
|
|
3054
2949
|
__V = _mm_mask_mov_epi8(_mm_set1_epi8(-127-1), __M, __V);
|
|
3055
2950
|
return __builtin_reduce_max((__v16qs)__V);
|
|
3056
2951
|
}
|
|
3057
2952
|
|
|
3058
|
-
static __inline__ unsigned char
|
|
2953
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3059
2954
|
_mm_mask_reduce_max_epu8(__mmask16 __M, __m128i __V) {
|
|
3060
2955
|
__V = _mm_maskz_mov_epi8(__M, __V);
|
|
3061
2956
|
return __builtin_reduce_max((__v16qu)__V);
|
|
3062
2957
|
}
|
|
3063
2958
|
|
|
3064
|
-
static __inline__ signed char
|
|
2959
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3065
2960
|
_mm_mask_reduce_min_epi8(__mmask16 __M, __m128i __V) {
|
|
3066
2961
|
__V = _mm_mask_mov_epi8(_mm_set1_epi8(127), __M, __V);
|
|
3067
2962
|
return __builtin_reduce_min((__v16qs)__V);
|
|
3068
2963
|
}
|
|
3069
2964
|
|
|
3070
|
-
static __inline__ unsigned char
|
|
2965
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3071
2966
|
_mm_mask_reduce_min_epu8(__mmask16 __M, __m128i __V) {
|
|
3072
2967
|
__V = _mm_mask_mov_epi8(_mm_set1_epi8(-1), __M, __V);
|
|
3073
2968
|
return __builtin_reduce_min((__v16qu)__V);
|
|
3074
2969
|
}
|
|
3075
2970
|
|
|
3076
|
-
static __inline__ signed char
|
|
2971
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3077
2972
|
_mm256_reduce_add_epi8(__m256i __W) {
|
|
3078
2973
|
return __builtin_reduce_add((__v32qs)__W);
|
|
3079
2974
|
}
|
|
3080
2975
|
|
|
3081
|
-
static __inline__ signed char
|
|
2976
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3082
2977
|
_mm256_reduce_mul_epi8(__m256i __W) {
|
|
3083
2978
|
return __builtin_reduce_mul((__v32qs)__W);
|
|
3084
2979
|
}
|
|
3085
2980
|
|
|
3086
|
-
static __inline__ signed char
|
|
2981
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3087
2982
|
_mm256_reduce_and_epi8(__m256i __W) {
|
|
3088
2983
|
return __builtin_reduce_and((__v32qs)__W);
|
|
3089
2984
|
}
|
|
3090
2985
|
|
|
3091
|
-
static __inline__ signed char
|
|
2986
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3092
2987
|
_mm256_reduce_or_epi8(__m256i __W) {
|
|
3093
2988
|
return __builtin_reduce_or((__v32qs)__W);
|
|
3094
2989
|
}
|
|
3095
2990
|
|
|
3096
|
-
static __inline__ signed char
|
|
2991
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3097
2992
|
_mm256_mask_reduce_add_epi8(__mmask32 __M, __m256i __W) {
|
|
3098
2993
|
__W = _mm256_maskz_mov_epi8(__M, __W);
|
|
3099
2994
|
return __builtin_reduce_add((__v32qs)__W);
|
|
3100
2995
|
}
|
|
3101
2996
|
|
|
3102
|
-
static __inline__ signed char
|
|
2997
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3103
2998
|
_mm256_mask_reduce_mul_epi8(__mmask32 __M, __m256i __W) {
|
|
3104
2999
|
__W = _mm256_mask_mov_epi8(_mm256_set1_epi8(1), __M, __W);
|
|
3105
3000
|
return __builtin_reduce_mul((__v32qs)__W);
|
|
3106
3001
|
}
|
|
3107
3002
|
|
|
3108
|
-
static __inline__ signed char
|
|
3003
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3109
3004
|
_mm256_mask_reduce_and_epi8(__mmask32 __M, __m256i __W) {
|
|
3110
3005
|
__W = _mm256_mask_mov_epi8(_mm256_set1_epi8(-1), __M, __W);
|
|
3111
3006
|
return __builtin_reduce_and((__v32qs)__W);
|
|
3112
3007
|
}
|
|
3113
3008
|
|
|
3114
|
-
static __inline__ signed char
|
|
3009
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3115
3010
|
_mm256_mask_reduce_or_epi8(__mmask32 __M, __m256i __W) {
|
|
3116
3011
|
__W = _mm256_maskz_mov_epi8(__M, __W);
|
|
3117
3012
|
return __builtin_reduce_or((__v32qs)__W);
|
|
3118
3013
|
}
|
|
3119
3014
|
|
|
3120
|
-
static __inline__ signed char
|
|
3015
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3121
3016
|
_mm256_reduce_max_epi8(__m256i __V) {
|
|
3122
3017
|
return __builtin_reduce_max((__v32qs)__V);
|
|
3123
3018
|
}
|
|
3124
3019
|
|
|
3125
|
-
static __inline__ unsigned char
|
|
3020
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3126
3021
|
_mm256_reduce_max_epu8(__m256i __V) {
|
|
3127
3022
|
return __builtin_reduce_max((__v32qu)__V);
|
|
3128
3023
|
}
|
|
3129
3024
|
|
|
3130
|
-
static __inline__ signed char
|
|
3025
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3131
3026
|
_mm256_reduce_min_epi8(__m256i __V) {
|
|
3132
3027
|
return __builtin_reduce_min((__v32qs)__V);
|
|
3133
3028
|
}
|
|
3134
3029
|
|
|
3135
|
-
static __inline__ unsigned char
|
|
3030
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3136
3031
|
_mm256_reduce_min_epu8(__m256i __V) {
|
|
3137
3032
|
return __builtin_reduce_min((__v32qu)__V);
|
|
3138
3033
|
}
|
|
3139
3034
|
|
|
3140
|
-
static __inline__ signed char
|
|
3035
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3141
3036
|
_mm256_mask_reduce_max_epi8(__mmask32 __M, __m256i __V) {
|
|
3142
3037
|
__V = _mm256_mask_mov_epi8(_mm256_set1_epi8(-127-1), __M, __V);
|
|
3143
3038
|
return __builtin_reduce_max((__v32qs)__V);
|
|
3144
3039
|
}
|
|
3145
3040
|
|
|
3146
|
-
static __inline__ unsigned char
|
|
3041
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3147
3042
|
_mm256_mask_reduce_max_epu8(__mmask32 __M, __m256i __V) {
|
|
3148
3043
|
__V = _mm256_maskz_mov_epi8(__M, __V);
|
|
3149
3044
|
return __builtin_reduce_max((__v32qu)__V);
|
|
3150
3045
|
}
|
|
3151
3046
|
|
|
3152
|
-
static __inline__ signed char
|
|
3047
|
+
static __inline__ signed char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3153
3048
|
_mm256_mask_reduce_min_epi8(__mmask32 __M, __m256i __V) {
|
|
3154
3049
|
__V = _mm256_mask_mov_epi8(_mm256_set1_epi8(127), __M, __V);
|
|
3155
3050
|
return __builtin_reduce_min((__v32qs)__V);
|
|
3156
3051
|
}
|
|
3157
3052
|
|
|
3158
|
-
static __inline__ unsigned char
|
|
3053
|
+
static __inline__ unsigned char __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3159
3054
|
_mm256_mask_reduce_min_epu8(__mmask32 __M, __m256i __V) {
|
|
3160
3055
|
__V = _mm256_mask_mov_epi8(_mm256_set1_epi8(-1), __M, __V);
|
|
3161
3056
|
return __builtin_reduce_min((__v32qu)__V);
|
|
@@ -3163,5 +3058,7 @@ _mm256_mask_reduce_min_epu8(__mmask32 __M, __m256i __V) {
|
|
|
3163
3058
|
|
|
3164
3059
|
#undef __DEFAULT_FN_ATTRS128
|
|
3165
3060
|
#undef __DEFAULT_FN_ATTRS256
|
|
3061
|
+
#undef __DEFAULT_FN_ATTRS128_CONSTEXPR
|
|
3062
|
+
#undef __DEFAULT_FN_ATTRS256_CONSTEXPR
|
|
3166
3063
|
|
|
3167
3064
|
#endif /* __AVX512VLBWINTRIN_H */
|