Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
56 changes: 41 additions & 15 deletions benches/destride.rs
Original file line number Diff line number Diff line change
@@ -1,12 +1,14 @@
#![feature(stdsimd, test)]

#[cfg(test)] extern crate test;
#[macro_use] extern crate faster;
#[cfg(test)]
extern crate test;
#[macro_use]
extern crate faster;

#[cfg(test)]
mod destride {
use faster::prelude::*;
use test::{Bencher, black_box};
use test::{black_box, Bencher};

#[bench]
#[cfg(feature = "std")]
Expand Down Expand Up @@ -79,8 +81,12 @@ mod destride {
/// Benchmarks `stride_four(..).zip().simd_do_each(..)` over a zero-filled
/// `[u8; 4096]`.
///
/// Every value produced by the pipeline is passed to `black_box` so the
/// optimizer cannot discard the work being measured.
fn destride_four_naiive(b: &mut Bencher) {
    let a = [0u8; 4096];
    b.iter(|| {
        // Exactly one pass per iteration; a second copy of this pipeline
        // would double the measured time.
        (&a[..])
            .stride_four(tuplify!(4, u8s(0)))
            .zip()
            .simd_do_each(|x| {
                black_box(x);
            });
    })
}

Expand All @@ -89,8 +95,12 @@ mod destride {
/// Benchmarks `stride_two(..).zip().simd_do_each(..)` over a zero-filled
/// `[u8; 4096]`.
///
/// Every value produced by the pipeline is passed to `black_box` so the
/// optimizer cannot discard the work being measured.
fn destride_two_naiive(b: &mut Bencher) {
    let a = [0u8; 4096];
    b.iter(|| {
        // Exactly one pass per iteration; a second copy of this pipeline
        // would double the measured time.
        (&a[..])
            .stride_two(tuplify!(2, u8s(0)))
            .zip()
            .simd_do_each(|x| {
                black_box(x);
            });
    })
}

Expand All @@ -99,8 +109,12 @@ mod destride {
/// Benchmarks `stride_four(..).zip().simd_do_each(..)` over a zero-filled
/// `[u16; 4096]`.
///
/// Every value produced by the pipeline is passed to `black_box` so the
/// optimizer cannot discard the work being measured.
fn destride_four_naiive_16(b: &mut Bencher) {
    let a = [0u16; 4096];
    b.iter(|| {
        // Exactly one pass per iteration; a second copy of this pipeline
        // would double the measured time.
        (&a[..])
            .stride_four(tuplify!(4, u16s(0)))
            .zip()
            .simd_do_each(|x| {
                black_box(x);
            });
    })
}

Expand All @@ -109,8 +123,12 @@ mod destride {
/// Benchmarks `stride_two(..).zip().simd_do_each(..)` over a zero-filled
/// `[u16; 4096]`.
///
/// Every value produced by the pipeline is passed to `black_box` so the
/// optimizer cannot discard the work being measured.
fn destride_two_naiive_16(b: &mut Bencher) {
    let a = [0u16; 4096];
    b.iter(|| {
        // Exactly one pass per iteration; a second copy of this pipeline
        // would double the measured time.
        (&a[..])
            .stride_two(tuplify!(2, u16s(0)))
            .zip()
            .simd_do_each(|x| {
                black_box(x);
            });
    })
}

Expand All @@ -119,8 +137,12 @@ mod destride {
/// Benchmarks `stride_four(..).zip().simd_do_each(..)` over a zero-filled
/// `[u32; 4096]`.
///
/// Every value produced by the pipeline is passed to `black_box` so the
/// optimizer cannot discard the work being measured.
fn destride_four_naiive_32(b: &mut Bencher) {
    let a = [0u32; 4096];
    b.iter(|| {
        // Exactly one pass per iteration; a second copy of this pipeline
        // would double the measured time.
        (&a[..])
            .stride_four(tuplify!(4, u32s(0)))
            .zip()
            .simd_do_each(|x| {
                black_box(x);
            });
    })
}

Expand All @@ -129,8 +151,12 @@ mod destride {
/// Benchmarks `stride_two(..).zip().simd_do_each(..)` over a zero-filled
/// `[u32; 4096]`.
///
/// Every value produced by the pipeline is passed to `black_box` so the
/// optimizer cannot discard the work being measured.
fn destride_two_naiive_32(b: &mut Bencher) {
    let a = [0u32; 4096];
    b.iter(|| {
        // Exactly one pass per iteration; a second copy of this pipeline
        // would double the measured time.
        (&a[..])
            .stride_two(tuplify!(2, u32s(0)))
            .zip()
            .simd_do_each(|x| {
                black_box(x);
            });
    })
}
}
70 changes: 49 additions & 21 deletions benches/intrin.rs
Original file line number Diff line number Diff line change
@@ -1,7 +1,8 @@
#![feature(test, stdsimd)]

#[cfg(test)] extern crate test;
extern crate faster;
#[cfg(test)]
extern crate test;

/// Input shared by the intrinsic benchmarks: 1024 copies of `-123.456`.
const ARRAY_F32: &[f32] = &[-123.456_f32; 1024];

Expand All @@ -10,54 +11,81 @@ macro_rules! bench_intrin_1 {
#[bench]
#[cfg(feature = "std")]
fn $scalar_name(b: &mut Bencher) {
b.iter(|| { black_box(
crate::ARRAY_F32.iter().map(|v| { $scalar_fn(*v) }).collect::<Vec<f32>>()
)})
b.iter(|| {
black_box(
crate::ARRAY_F32
.iter()
.map(|v| $scalar_fn(*v))
.collect::<Vec<f32>>(),
)
})
}

#[bench]
#[cfg(feature = "std")]
fn $simd_name(b: &mut Bencher) {
b.iter(|| { black_box(
crate::ARRAY_F32.simd_iter(f32s(0.0)).simd_map(|v| { $simd_fn(v) }).scalar_collect()
)});
b.iter(|| {
black_box(
crate::ARRAY_F32
.simd_iter(f32s(0.0))
.simd_map(|v| $simd_fn(v))
.scalar_collect(),
)
});
}
}
};
}

/// Generates a pair of `#[bench]` functions for a binary `f32` method.
///
/// * `$simd_name` / `$simd_fn` - name of the generated SIMD benchmark and the
///   method called as `v.$simd_fn(v)` inside `simd_map`.
/// * `$scalar_name` / `$scalar_fn` - name of the generated scalar benchmark
///   and the method called as `v.$scalar_fn(*v)` inside `map`.
///
/// Both benchmarks read `crate::ARRAY_F32` and wrap the collected result in
/// `black_box` so the computation is not optimized away. The expansion site
/// must have `Bencher`, `black_box`, and `f32s` in scope.
macro_rules! bench_intrin_2 {
    ($simd_name:ident, $simd_fn:ident, $scalar_name:ident, $scalar_fn:ident) => {
        #[bench]
        #[cfg(feature = "std")]
        fn $scalar_name(b: &mut Bencher) {
            b.iter(|| {
                black_box(
                    crate::ARRAY_F32
                        .iter()
                        .map(|v| v.$scalar_fn(*v))
                        .collect::<Vec<f32>>(),
                )
            })
        }

        #[bench]
        #[cfg(feature = "std")]
        fn $simd_name(b: &mut Bencher) {
            b.iter(|| {
                black_box(
                    crate::ARRAY_F32
                        .simd_iter(f32s(0.0))
                        .simd_map(|v| v.$simd_fn(v))
                        .scalar_collect(),
                )
            });
        }
    };
}


/// Scalar-vs-SIMD benchmarks for individual `f32` intrinsics.
///
/// Each macro invocation expands to one SIMD and one scalar `#[bench]`
/// function, so every benchmark name may be declared only once here.
#[cfg(test)]
mod intrin {
    use faster::prelude::*;
    use test::{black_box, Bencher};

    bench_intrin_1!(abs_simd, |x: f32s| x.abs(), abs_scala, |x: f32| x.abs());
    bench_intrin_1!(ceil_simd, |x: f32s| x.ceil(), ceil_scala, |x: f32| x.ceil());
    bench_intrin_1!(floor_simd, |x: f32s| x.floor(), floor_scala, |x: f32| x.floor());
    bench_intrin_2!(min_simd, min, min_scala, min);
    bench_intrin_2!(max_simd, max, max_scala, max);
    // The scalar side has no `recip` call here; it divides 1.0 by the value.
    bench_intrin_1!(recip_simd, |x: f32s| x.recip(), recip_scala, |x: f32| 1.0f32 / x);
    bench_intrin_1!(round_simd, |x: f32s| x.round(), round_scala, |x: f32| x.round());
    bench_intrin_1!(sqrt_simd, |x: f32s| x.sqrt(), sqrt_scala, |x: f32| x.sqrt());
    bench_intrin_1!(trunc_simd, |x: f32s| x.trunc(), trunc_scala, |x: f32| x.trunc());
}
Loading