vsimd/
mask.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
use crate::isa::{AVX2, NEON, SSE2, WASM128};
use crate::vector::{V128, V256};
use crate::{SIMD128, SIMD256};

use core::ops::Not;

/// Reports whether all 16 byte lanes of the mask `x` are set.
///
/// The check is selected by the instruction set `S`:
/// * SSE2 / WASM128: the 16-bit result of `u8x16_bitmask` must equal `u16::MAX`.
/// * NEON on 32-bit ARM: `u8x16_any_zero` must report `false`.
/// * NEON on AArch64: `u8x16_reduce_min` must be non-zero.
///
/// NOTE(review): these strategies only agree when every lane of `x` is either
/// all-ones or all-zeros (a proper comparison mask) -- confirm with callers.
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above,
/// or when `S` is NEON and the target architecture is neither `arm` nor
/// `aarch64`.
#[inline(always)]
pub fn mask8x16_all<S: SIMD128>(s: S, x: V128) -> bool {
    if matches_isa!(S, SSE2 | WASM128) {
        let bits = s.u8x16_bitmask(x);
        bits == u16::MAX
    } else if matches_isa!(S, NEON) {
        if cfg!(target_arch = "arm") {
            s.u8x16_any_zero(x).not()
        } else if cfg!(target_arch = "aarch64") {
            let smallest = s.u8x16_reduce_min(x);
            smallest != 0
        } else {
            unreachable!()
        }
    } else {
        unreachable!()
    }
}

/// Reports whether all 32 byte lanes of the mask `x` are set.
///
/// * AVX2: the 32-bit result of `u8x32_bitmask` must equal `u32::MAX`.
/// * SSE2 / WASM128 / NEON: the two 128-bit halves of `x` are combined with a
///   bitwise AND and the result is handed to [`mask8x16_all`].
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above.
#[inline(always)]
pub fn mask8x32_all<S: SIMD256>(s: S, x: V256) -> bool {
    if matches_isa!(S, AVX2) {
        let bits = s.u8x32_bitmask(x);
        bits == u32::MAX
    } else if matches_isa!(S, SSE2 | WASM128 | NEON) {
        // A lane survives the AND only if it is set in both halves.
        let halves = x.to_v128x2();
        let merged = s.v128_and(halves.0, halves.1);
        mask8x16_all(s, merged)
    } else {
        unreachable!()
    }
}

/// Reports whether at least one of the 16 byte lanes of the mask `x` is set.
///
/// * SSE2 / WASM128: the result of `u8x16_bitmask` must be non-zero.
/// * NEON: `v128_all_zero` must report `false`.
///
/// NOTE(review): the two strategies only agree when every lane of `x` is
/// either all-ones or all-zeros (a proper comparison mask) -- confirm with
/// callers.
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above.
#[inline(always)]
pub fn mask8x16_any<S: SIMD128>(s: S, x: V128) -> bool {
    if matches_isa!(S, SSE2 | WASM128) {
        let bits = s.u8x16_bitmask(x);
        bits != 0
    } else if matches_isa!(S, NEON) {
        s.v128_all_zero(x).not()
    } else {
        unreachable!()
    }
}

/// Reports whether at least one of the 32 byte lanes of the mask `x` is set.
///
/// * AVX2: the result of `u8x32_bitmask` must be non-zero.
/// * SSE2 / WASM128 / NEON: the two 128-bit halves of `x` are combined with a
///   bitwise OR and the result is handed to [`mask8x16_any`].
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above.
#[inline(always)]
pub fn mask8x32_any<S: SIMD256>(s: S, x: V256) -> bool {
    if matches_isa!(S, AVX2) {
        let bits = s.u8x32_bitmask(x);
        bits != 0
    } else if matches_isa!(S, SSE2 | WASM128 | NEON) {
        // A lane shows up in the OR if it is set in either half.
        let halves = x.to_v128x2();
        let merged = s.v128_or(halves.0, halves.1);
        mask8x16_any(s, merged)
    } else {
        unreachable!()
    }
}

/// Reports whether every one of the 16 bytes in `x` is `>= 0x80`, i.e. has
/// its most significant bit set.
///
/// * SSE2 / WASM128: the 16-bit result of `u8x16_bitmask` must equal `u16::MAX`.
/// * NEON on 32-bit ARM: the lanes are compared against zero with `i8x16_lt`
///   and the comparison result is checked by [`mask8x16_all`].
/// * NEON on AArch64: `u8x16_reduce_min` must be at least `0x80`.
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above,
/// or when `S` is NEON and the target architecture is neither `arm` nor
/// `aarch64`.
#[inline(always)]
pub fn u8x16_highbit_all<S: SIMD128>(s: S, x: V128) -> bool {
    if matches_isa!(S, SSE2 | WASM128) {
        let bits = s.u8x16_bitmask(x);
        bits == u16::MAX
    } else if matches_isa!(S, NEON) {
        if cfg!(target_arch = "arm") {
            // Presumably a signed "< 0" test, which holds exactly for bytes
            // whose top bit is set.
            let zero = s.v128_create_zero();
            let negative = s.i8x16_lt(x, zero);
            mask8x16_all(s, negative)
        } else if cfg!(target_arch = "aarch64") {
            let smallest = s.u8x16_reduce_min(x);
            smallest >= 0x80
        } else {
            unreachable!()
        }
    } else {
        unreachable!()
    }
}

/// Reports whether every one of the 32 bytes in `x` has its most significant
/// bit set.
///
/// * AVX2: the 32-bit result of `u8x32_bitmask` must equal `u32::MAX`.
/// * SSE2 / WASM128 / NEON: the two 128-bit halves of `x` are combined with a
///   bitwise AND and the result is handed to [`u8x16_highbit_all`].
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above.
#[inline(always)]
pub fn u8x32_highbit_all<S: SIMD256>(s: S, x: V256) -> bool {
    if matches_isa!(S, AVX2) {
        let bits = s.u8x32_bitmask(x);
        bits == u32::MAX
    } else if matches_isa!(S, SSE2 | WASM128 | NEON) {
        // The top bit of an AND-ed byte is set only if it is set in both halves.
        let halves = x.to_v128x2();
        let merged = s.v128_and(halves.0, halves.1);
        u8x16_highbit_all(s, merged)
    } else {
        unreachable!()
    }
}

/// Reports whether at least one of the 16 bytes in `x` is `>= 0x80`, i.e. has
/// its most significant bit set.
///
/// * SSE2 / WASM128: the result of `u8x16_bitmask` must be non-zero.
/// * NEON on 32-bit ARM: the lanes are compared against zero with `i8x16_lt`
///   and the comparison result is checked by [`mask8x16_any`].
/// * NEON on AArch64: `u8x16_reduce_max` must be at least `0x80`.
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above,
/// or when `S` is NEON and the target architecture is neither `arm` nor
/// `aarch64`.
#[inline(always)]
pub fn u8x16_highbit_any<S: SIMD128>(s: S, x: V128) -> bool {
    if matches_isa!(S, SSE2 | WASM128) {
        let bits = s.u8x16_bitmask(x);
        bits != 0
    } else if matches_isa!(S, NEON) {
        if cfg!(target_arch = "arm") {
            // Presumably a signed "< 0" test, which holds exactly for bytes
            // whose top bit is set.
            let zero = s.v128_create_zero();
            let negative = s.i8x16_lt(x, zero);
            mask8x16_any(s, negative)
        } else if cfg!(target_arch = "aarch64") {
            let largest = s.u8x16_reduce_max(x);
            largest >= 0x80
        } else {
            unreachable!()
        }
    } else {
        unreachable!()
    }
}

/// Reports whether at least one of the 32 bytes in `x` has its most
/// significant bit set.
///
/// * AVX2: the result of `u8x32_bitmask` must be non-zero.
/// * SSE2 / WASM128 / NEON: the two 128-bit halves of `x` are combined with a
///   bitwise OR and the result is handed to [`u8x16_highbit_any`].
///
/// # Panics
///
/// Hits `unreachable!()` when `S` matches none of the instruction sets above.
#[inline(always)]
pub fn u8x32_highbit_any<S: SIMD256>(s: S, x: V256) -> bool {
    if matches_isa!(S, AVX2) {
        let bits = s.u8x32_bitmask(x);
        bits != 0
    } else if matches_isa!(S, SSE2 | WASM128 | NEON) {
        // The top bit of an OR-ed byte is set if it is set in either half.
        let halves = x.to_v128x2();
        let merged = s.v128_or(halves.0, halves.1);
        u8x16_highbit_any(s, merged)
    } else {
        unreachable!()
    }
}