1 #![feature(portable_simd)]
2 extern crate std_float;
4 /// Benchmarks game nbody code
5 /// Taken from the `packed_simd` crate
6 /// Run this benchmark with `cargo test --example nbody`
8 use core_simd::simd::*;
9 #[allow(unused)] // False positive?
10 use std_float::StdFloat;
12 use std::f64::consts::PI;
13 const SOLAR_MASS: f64 = 4.0 * PI * PI;
14 const DAYS_PER_YEAR: f64 = 365.24;
16 #[derive(Debug, Clone, Copy)]
23 const N_BODIES: usize = 5;
24 const BODIES: [Body; N_BODIES] = [
27 x: f64x4::from_array([0., 0., 0., 0.]),
28 v: f64x4::from_array([0., 0., 0., 0.]),
33 x: f64x4::from_array([
34 4.84143144246472090e+00,
35 -1.16032004402742839e+00,
36 -1.03622044471123109e-01,
39 v: f64x4::from_array([
40 1.66007664274403694e-03 * DAYS_PER_YEAR,
41 7.69901118419740425e-03 * DAYS_PER_YEAR,
42 -6.90460016972063023e-05 * DAYS_PER_YEAR,
45 mass: 9.54791938424326609e-04 * SOLAR_MASS,
49 x: f64x4::from_array([
50 8.34336671824457987e+00,
51 4.12479856412430479e+00,
52 -4.03523417114321381e-01,
55 v: f64x4::from_array([
56 -2.76742510726862411e-03 * DAYS_PER_YEAR,
57 4.99852801234917238e-03 * DAYS_PER_YEAR,
58 2.30417297573763929e-05 * DAYS_PER_YEAR,
61 mass: 2.85885980666130812e-04 * SOLAR_MASS,
65 x: f64x4::from_array([
66 1.28943695621391310e+01,
67 -1.51111514016986312e+01,
68 -2.23307578892655734e-01,
71 v: f64x4::from_array([
72 2.96460137564761618e-03 * DAYS_PER_YEAR,
73 2.37847173959480950e-03 * DAYS_PER_YEAR,
74 -2.96589568540237556e-05 * DAYS_PER_YEAR,
77 mass: 4.36624404335156298e-05 * SOLAR_MASS,
81 x: f64x4::from_array([
82 1.53796971148509165e+01,
83 -2.59193146099879641e+01,
84 1.79258772950371181e-01,
87 v: f64x4::from_array([
88 2.68067772490389322e-03 * DAYS_PER_YEAR,
89 1.62824170038242295e-03 * DAYS_PER_YEAR,
90 -9.51592254519715870e-05 * DAYS_PER_YEAR,
93 mass: 5.15138902046611451e-05 * SOLAR_MASS,
97 fn offset_momentum(bodies: &mut [Body; N_BODIES]) {
98 let (sun, rest) = bodies.split_at_mut(1);
99 let sun = &mut sun[0];
101 let m_ratio = body.mass / SOLAR_MASS;
102 sun.v -= body.v * Simd::splat(m_ratio);
106 fn energy(bodies: &[Body; N_BODIES]) -> f64 {
108 for i in 0..N_BODIES {
110 e += bi.mass * (bi.v * bi.v).reduce_sum() * 0.5;
111 for bj in bodies.iter().take(N_BODIES).skip(i + 1) {
112 let dx = bi.x - bj.x;
113 e -= bi.mass * bj.mass / (dx * dx).reduce_sum().sqrt()
119 fn advance(bodies: &mut [Body; N_BODIES], dt: f64) {
120 const N: usize = N_BODIES * (N_BODIES - 1) / 2;
122 // compute distance between bodies:
123 let mut r = [f64x4::splat(0.); N];
126 for j in 0..N_BODIES {
127 for k in j + 1..N_BODIES {
128 r[i] = bodies[j].x - bodies[k].x;
134 let mut mag = [0.0; N];
135 for i in (0..N).step_by(2) {
136 let d2s = f64x2::from_array([
137 (r[i] * r[i]).reduce_sum(),
138 (r[i + 1] * r[i + 1]).reduce_sum(),
140 let dmags = f64x2::splat(dt) / (d2s * d2s.sqrt());
142 mag[i + 1] = dmags[1];
146 for j in 0..N_BODIES {
147 for k in j + 1..N_BODIES {
148 let f = r[i] * Simd::splat(mag[i]);
149 bodies[j].v -= f * Simd::splat(bodies[k].mass);
150 bodies[k].v += f * Simd::splat(bodies[j].mass);
155 body.x += Simd::splat(dt) * body.v
159 pub fn run(n: usize) -> (f64, f64) {
160 let mut bodies = BODIES;
161 offset_momentum(&mut bodies);
162 let energy_before = energy(&bodies);
164 advance(&mut bodies, 0.01);
166 let energy_after = energy(&bodies);
168 (energy_before, energy_after)
174 // Good enough for demonstration purposes, not going for strictness here.
175 fn approx_eq_f64(a: f64, b: f64) -> bool {
176 (a - b).abs() < 0.00001
180 const OUTPUT: [f64; 2] = [-0.169075164, -0.169087605];
181 let (energy_before, energy_after) = super::nbody::run(1000);
182 assert!(approx_eq_f64(energy_before, OUTPUT[0]));
183 assert!(approx_eq_f64(energy_after, OUTPUT[1]));
189 let (energy_before, energy_after) = nbody::run(1000);
190 println!("Energy before: {energy_before}");
191 println!("Energy after: {energy_after}");