Skip to content

Commit 723122a

Browse files
committed
add inlines
Signed-off-by: Connor Tsui <[email protected]>
1 parent 6d7b18e commit 723122a

File tree

2 files changed

+12
-2
lines changed

2 files changed

+12
-2
lines changed

vortex-compute/benches/avx512.rs

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,7 @@ fn in_place_scalar(bencher: divan::Bencher, (size, probability): (usize, f64)) {
5353
.bench_refs(|(data, mask)| filter_in_place_scalar(data, mask))
5454
}
5555

56-
#[cfg(any(target_arch = "x86", target_arch = "x86_64"))]
56+
#[cfg(all(any(target_arch = "x86", target_arch = "x86_64"), not(codspeed)))]
5757
#[divan::bench(sample_size = SAMPLE_SIZE, args = SIZES.iter().copied().cartesian_product(PROBABILITIES.iter().copied()))]
5858
fn in_place_avx512(bencher: divan::Bencher, (size, probability): (usize, f64)) {
5959
let mask = divan::black_box(create_random_mask(size, probability));
@@ -75,7 +75,7 @@ fn out_scalar(bencher: divan::Bencher, (size, probability): (usize, f64)) {
7575
.bench_refs(|(src, dest, mask)| filter_into_scalar(src, dest, mask))
7676
}
7777

78-
#[cfg(any(target_arch = "x86", target_arch = "x86_64"))]
78+
#[cfg(all(any(target_arch = "x86", target_arch = "x86_64"), not(codspeed)))]
7979
#[divan::bench(sample_size = SAMPLE_SIZE, args = SIZES.iter().copied().cartesian_product(PROBABILITIES.iter().copied()))]
8080
fn out_avx512(bencher: divan::Bencher, (size, probability): (usize, f64)) {
8181
let mask = divan::black_box(create_random_mask(size, probability));

vortex-compute/src/filter/slice/simd_compress.rs

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -55,6 +55,7 @@ impl SimdCompress for i32 {
5555
type MaskType = u16;
5656

5757
#[target_feature(enable = "avx512f")]
58+
#[inline]
5859
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
5960
_mm512_maskz_compress_epi32(mask, vec)
6061
}
@@ -76,6 +77,7 @@ impl SimdCompress for u32 {
7677
type MaskType = u16;
7778

7879
#[target_feature(enable = "avx512f")]
80+
#[inline]
7981
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
8082
_mm512_maskz_compress_epi32(mask, vec)
8183
}
@@ -97,6 +99,7 @@ impl SimdCompress for f32 {
9799
type MaskType = u16;
98100

99101
#[target_feature(enable = "avx512f")]
102+
#[inline]
100103
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
101104
unsafe {
102105
let float_vec = std::mem::transmute::<__m512i, __m512>(vec);
@@ -126,6 +129,7 @@ impl SimdCompress for i64 {
126129
type MaskType = u8;
127130

128131
#[target_feature(enable = "avx512f")]
132+
#[inline]
129133
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
130134
_mm512_maskz_compress_epi64(mask, vec)
131135
}
@@ -147,6 +151,7 @@ impl SimdCompress for u64 {
147151
type MaskType = u8;
148152

149153
#[target_feature(enable = "avx512f")]
154+
#[inline]
150155
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
151156
_mm512_maskz_compress_epi64(mask, vec)
152157
}
@@ -168,6 +173,7 @@ impl SimdCompress for f64 {
168173
type MaskType = u8;
169174

170175
#[target_feature(enable = "avx512f")]
176+
#[inline]
171177
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
172178
unsafe {
173179
let double_vec = std::mem::transmute::<__m512i, __m512d>(vec);
@@ -197,6 +203,7 @@ impl SimdCompress for i16 {
197203
type MaskType = u32;
198204

199205
#[target_feature(enable = "avx512vbmi2")]
206+
#[inline]
200207
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
201208
_mm512_maskz_compress_epi16(mask, vec)
202209
}
@@ -218,6 +225,7 @@ impl SimdCompress for u16 {
218225
type MaskType = u32;
219226

220227
#[target_feature(enable = "avx512vbmi2")]
228+
#[inline]
221229
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
222230
_mm512_maskz_compress_epi16(mask, vec)
223231
}
@@ -243,6 +251,7 @@ impl SimdCompress for i8 {
243251
type MaskType = u64;
244252

245253
#[target_feature(enable = "avx512vbmi2")]
254+
#[inline]
246255
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
247256
_mm512_maskz_compress_epi8(mask, vec)
248257
}
@@ -264,6 +273,7 @@ impl SimdCompress for u8 {
264273
type MaskType = u64;
265274

266275
#[target_feature(enable = "avx512vbmi2")]
276+
#[inline]
267277
unsafe fn compress_vector(mask: Self::MaskType, vec: __m512i) -> __m512i {
268278
_mm512_maskz_compress_epi8(mask, vec)
269279
}

0 commit comments

Comments
 (0)