You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
320 lines
7.9 KiB
320 lines
7.9 KiB
use criterion::{criterion_group, criterion_main, Bencher, Criterion};
|
|
use half::prelude::*;
|
|
use std::{f32, f64, iter};
|
|
|
|
const SIMD_LARGE_BENCH_SLICE_LEN: usize = 1024;
|
|
|
|
fn bench_f32_to_f16(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"f16::from_f32",
|
|
|b: &mut Bencher<'_>, i: &f32| b.iter(|| f16::from_f32(*i)),
|
|
vec![
|
|
0.,
|
|
-0.,
|
|
1.,
|
|
f32::MIN,
|
|
f32::MAX,
|
|
f32::MIN_POSITIVE,
|
|
f32::NEG_INFINITY,
|
|
f32::INFINITY,
|
|
f32::NAN,
|
|
f32::consts::E,
|
|
f32::consts::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
fn bench_f64_to_f16(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"f16::from_f64",
|
|
|b: &mut Bencher<'_>, i: &f64| b.iter(|| f16::from_f64(*i)),
|
|
vec![
|
|
0.,
|
|
-0.,
|
|
1.,
|
|
f64::MIN,
|
|
f64::MAX,
|
|
f64::MIN_POSITIVE,
|
|
f64::NEG_INFINITY,
|
|
f64::INFINITY,
|
|
f64::NAN,
|
|
f64::consts::E,
|
|
f64::consts::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
fn bench_f16_to_f32(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"f16::to_f32",
|
|
|b: &mut Bencher<'_>, i: &f16| b.iter(|| i.to_f32()),
|
|
vec![
|
|
f16::ZERO,
|
|
f16::NEG_ZERO,
|
|
f16::ONE,
|
|
f16::MIN,
|
|
f16::MAX,
|
|
f16::MIN_POSITIVE,
|
|
f16::NEG_INFINITY,
|
|
f16::INFINITY,
|
|
f16::NAN,
|
|
f16::E,
|
|
f16::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
fn bench_f16_to_f64(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"f16::to_f64",
|
|
|b: &mut Bencher<'_>, i: &f16| b.iter(|| i.to_f64()),
|
|
vec![
|
|
f16::ZERO,
|
|
f16::NEG_ZERO,
|
|
f16::ONE,
|
|
f16::MIN,
|
|
f16::MAX,
|
|
f16::MIN_POSITIVE,
|
|
f16::NEG_INFINITY,
|
|
f16::INFINITY,
|
|
f16::NAN,
|
|
f16::E,
|
|
f16::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
criterion_group!(
|
|
f16_sisd,
|
|
bench_f32_to_f16,
|
|
bench_f64_to_f16,
|
|
bench_f16_to_f32,
|
|
bench_f16_to_f64
|
|
);
|
|
|
|
fn bench_slice_f32_to_f16(c: &mut Criterion) {
|
|
let mut constant_buffer = [f16::ZERO; 11];
|
|
let constants = [
|
|
0.,
|
|
-0.,
|
|
1.,
|
|
f32::MIN,
|
|
f32::MAX,
|
|
f32::MIN_POSITIVE,
|
|
f32::NEG_INFINITY,
|
|
f32::INFINITY,
|
|
f32::NAN,
|
|
f32::consts::E,
|
|
f32::consts::PI,
|
|
];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_from_f32_slice/constants",
|
|
|b: &mut Bencher<'_>| b.iter(|| constant_buffer.convert_from_f32_slice(&constants)),
|
|
);
|
|
|
|
let large: Vec<_> = iter::repeat(0)
|
|
.enumerate()
|
|
.map(|(i, _)| i as f32)
|
|
.take(SIMD_LARGE_BENCH_SLICE_LEN)
|
|
.collect();
|
|
let mut large_buffer = [f16::ZERO; SIMD_LARGE_BENCH_SLICE_LEN];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_from_f32_slice/large",
|
|
|b: &mut Bencher<'_>| b.iter(|| large_buffer.convert_from_f32_slice(&large)),
|
|
);
|
|
}
|
|
|
|
fn bench_slice_f64_to_f16(c: &mut Criterion) {
|
|
let mut constant_buffer = [f16::ZERO; 11];
|
|
let constants = [
|
|
0.,
|
|
-0.,
|
|
1.,
|
|
f64::MIN,
|
|
f64::MAX,
|
|
f64::MIN_POSITIVE,
|
|
f64::NEG_INFINITY,
|
|
f64::INFINITY,
|
|
f64::NAN,
|
|
f64::consts::E,
|
|
f64::consts::PI,
|
|
];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_from_f64_slice/constants",
|
|
|b: &mut Bencher<'_>| b.iter(|| constant_buffer.convert_from_f64_slice(&constants)),
|
|
);
|
|
|
|
let large: Vec<_> = iter::repeat(0)
|
|
.enumerate()
|
|
.map(|(i, _)| i as f64)
|
|
.take(SIMD_LARGE_BENCH_SLICE_LEN)
|
|
.collect();
|
|
let mut large_buffer = [f16::ZERO; SIMD_LARGE_BENCH_SLICE_LEN];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_from_f64_slice/large",
|
|
|b: &mut Bencher<'_>| b.iter(|| large_buffer.convert_from_f64_slice(&large)),
|
|
);
|
|
}
|
|
|
|
fn bench_slice_f16_to_f32(c: &mut Criterion) {
|
|
let mut constant_buffer = [0f32; 11];
|
|
let constants = [
|
|
f16::ZERO,
|
|
f16::NEG_ZERO,
|
|
f16::ONE,
|
|
f16::MIN,
|
|
f16::MAX,
|
|
f16::MIN_POSITIVE,
|
|
f16::NEG_INFINITY,
|
|
f16::INFINITY,
|
|
f16::NAN,
|
|
f16::E,
|
|
f16::PI,
|
|
];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_to_f32_slice/constants",
|
|
|b: &mut Bencher<'_>| b.iter(|| constants.convert_to_f32_slice(&mut constant_buffer)),
|
|
);
|
|
|
|
let large: Vec<_> = iter::repeat(0)
|
|
.enumerate()
|
|
.map(|(i, _)| f16::from_f32(i as f32))
|
|
.take(SIMD_LARGE_BENCH_SLICE_LEN)
|
|
.collect();
|
|
let mut large_buffer = [0f32; SIMD_LARGE_BENCH_SLICE_LEN];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_to_f32_slice/large",
|
|
|b: &mut Bencher<'_>| b.iter(|| large.convert_to_f32_slice(&mut large_buffer)),
|
|
);
|
|
}
|
|
|
|
fn bench_slice_f16_to_f64(c: &mut Criterion) {
|
|
let mut constant_buffer = [0f64; 11];
|
|
let constants = [
|
|
f16::ZERO,
|
|
f16::NEG_ZERO,
|
|
f16::ONE,
|
|
f16::MIN,
|
|
f16::MAX,
|
|
f16::MIN_POSITIVE,
|
|
f16::NEG_INFINITY,
|
|
f16::INFINITY,
|
|
f16::NAN,
|
|
f16::E,
|
|
f16::PI,
|
|
];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_to_f64_slice/constants",
|
|
|b: &mut Bencher<'_>| b.iter(|| constants.convert_to_f64_slice(&mut constant_buffer)),
|
|
);
|
|
|
|
let large: Vec<_> = iter::repeat(0)
|
|
.enumerate()
|
|
.map(|(i, _)| f16::from_f64(i as f64))
|
|
.take(SIMD_LARGE_BENCH_SLICE_LEN)
|
|
.collect();
|
|
let mut large_buffer = [0f64; SIMD_LARGE_BENCH_SLICE_LEN];
|
|
c.bench_function(
|
|
"HalfFloatSliceExt::convert_to_f64_slice/large",
|
|
|b: &mut Bencher<'_>| b.iter(|| large.convert_to_f64_slice(&mut large_buffer)),
|
|
);
|
|
}
|
|
|
|
criterion_group!(
|
|
f16_simd,
|
|
bench_slice_f32_to_f16,
|
|
bench_slice_f64_to_f16,
|
|
bench_slice_f16_to_f32,
|
|
bench_slice_f16_to_f64
|
|
);
|
|
|
|
fn bench_f32_to_bf16(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"bf16::from_f32",
|
|
|b: &mut Bencher<'_>, i: &f32| b.iter(|| bf16::from_f32(*i)),
|
|
vec![
|
|
0.,
|
|
-0.,
|
|
1.,
|
|
f32::MIN,
|
|
f32::MAX,
|
|
f32::MIN_POSITIVE,
|
|
f32::NEG_INFINITY,
|
|
f32::INFINITY,
|
|
f32::NAN,
|
|
f32::consts::E,
|
|
f32::consts::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
fn bench_f64_to_bf16(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"bf16::from_f64",
|
|
|b: &mut Bencher<'_>, i: &f64| b.iter(|| bf16::from_f64(*i)),
|
|
vec![
|
|
0.,
|
|
-0.,
|
|
1.,
|
|
f64::MIN,
|
|
f64::MAX,
|
|
f64::MIN_POSITIVE,
|
|
f64::NEG_INFINITY,
|
|
f64::INFINITY,
|
|
f64::NAN,
|
|
f64::consts::E,
|
|
f64::consts::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
fn bench_bf16_to_f32(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"bf16::to_f32",
|
|
|b: &mut Bencher<'_>, i: &bf16| b.iter(|| i.to_f32()),
|
|
vec![
|
|
bf16::ZERO,
|
|
bf16::NEG_ZERO,
|
|
bf16::ONE,
|
|
bf16::MIN,
|
|
bf16::MAX,
|
|
bf16::MIN_POSITIVE,
|
|
bf16::NEG_INFINITY,
|
|
bf16::INFINITY,
|
|
bf16::NAN,
|
|
bf16::E,
|
|
bf16::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
fn bench_bf16_to_f64(c: &mut Criterion) {
|
|
c.bench_function_over_inputs(
|
|
"bf16::to_f64",
|
|
|b: &mut Bencher<'_>, i: &bf16| b.iter(|| i.to_f64()),
|
|
vec![
|
|
bf16::ZERO,
|
|
bf16::NEG_ZERO,
|
|
bf16::ONE,
|
|
bf16::MIN,
|
|
bf16::MAX,
|
|
bf16::MIN_POSITIVE,
|
|
bf16::NEG_INFINITY,
|
|
bf16::INFINITY,
|
|
bf16::NAN,
|
|
bf16::E,
|
|
bf16::PI,
|
|
],
|
|
);
|
|
}
|
|
|
|
criterion_group!(
|
|
bf16_sisd,
|
|
bench_f32_to_bf16,
|
|
bench_f64_to_bf16,
|
|
bench_bf16_to_f32,
|
|
bench_bf16_to_f64
|
|
);
|
|
|
|
criterion_main!(f16_sisd, bf16_sisd, f16_simd);
|