From 2167abcf72d978b4ac2f08fa7cbbddaada01f165 Mon Sep 17 00:00:00 2001 From: metamuffin Date: Tue, 7 Mar 2023 08:00:00 +0100 Subject: a --- lvc/src/diff.rs | 105 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 105 insertions(+) create mode 100644 lvc/src/diff.rs (limited to 'lvc/src/diff.rs') diff --git a/lvc/src/diff.rs b/lvc/src/diff.rs new file mode 100644 index 0000000..5c65c29 --- /dev/null +++ b/lvc/src/diff.rs @@ -0,0 +1,105 @@ +use crate::{Frame, Ref, View, P2}; +use std::simd::{i32x16, SimdInt}; + +// 4ms +pub fn diff([frame1, frame2]: [&Frame; 2], view: View, rp: Ref) -> u32 { + let mut k = 0; + for y in view.a.y..view.b.y { + for x in view.a.x..view.b.x { + let p1 = frame1[P2 { x, y }] + rp.color_off; + let p2 = frame2[P2 { x, y }]; + k += p1.r.abs_diff(p2.r) as u32 + + p1.g.abs_diff(p2.g) as u32 + + p1.b.abs_diff(p2.b) as u32; + } + } + k +} + +pub fn fast_diff([frame1, frame2]: [&Frame; 2], view: View, rp: Ref) -> u32 { + let mut k = 0; + + let mut diff_lanes = i32x16::from_array([0; 16]); + let mut k1 = [0; 16]; + let mut k2 = [0; 16]; + + let next_line = frame1.size.x as usize - view.size().x as usize; + let index_start = view.a.x as usize + view.a.y as usize * frame1.size.x as usize; + let index_end = view.b.x as usize + (view.b.y as usize - 1) * frame1.size.x as usize; + + let mut i = index_start; + let mut x = view.a.x; + let mut kfill = 0; + + while i < index_end { + k1[kfill] = frame1.pixels[i].r as i32; + k2[kfill] = frame2.pixels[i].r as i32; + kfill += 1; + k1[kfill] = frame1.pixels[i].g as i32; + k2[kfill] = frame2.pixels[i].g as i32; + kfill += 1; + k1[kfill] = frame1.pixels[i].b as i32; + k2[kfill] = frame2.pixels[i].b as i32; + kfill += 1; + + i += 1; + x += 1; + if x > view.b.x { + i += next_line; + x = view.a.x + } + + if kfill == 15 { + let pl1 = i32x16::from_array(k1); + let pl2 = i32x16::from_array(k2); + diff_lanes += (pl1 - pl2).abs(); + kfill = 0; + } + } + + return diff_lanes.reduce_sum() as u32; +} + +// pub fn fast_diff([frame1, frame2]: [&Frame; 2], view: View, rp: Ref) -> u32 { +// let mut k = 0; + +// let mut diff_lanes = i32x16::from_array([0; 16]); +// let mut k1 = [0; 16]; +// let mut k2 = [0; 16]; + +// let next_line = frame1.size.x as usize - view.size().x as usize; +// let index_start = view.a.x as usize + view.a.y as usize * frame1.size.x as usize; +// let index_end = view.b.x as usize + (view.b.y as usize - 1) * frame1.size.x as usize; + +// let mut i = index_start; +// let mut x = view.a.x; +// let mut kfill = 0; + +// while i < index_end { +// k1[kfill] = frame1.pixels[i].r as i32; +// k2[kfill] = frame2.pixels[i].r as i32; +// kfill += 1; +// k1[kfill] = frame1.pixels[i].g as i32; +// k2[kfill] = frame2.pixels[i].g as i32; +// kfill += 1; +// k1[kfill] = frame1.pixels[i].b as i32; +// k2[kfill] = frame2.pixels[i].b as i32; +// kfill += 1; + +// i += 1; +// x += 1; +// if x > view.b.x { +// i += next_line; +// x = view.a.x +// } + +// if kfill == 15 { +// let pl1 = i32x16::from_array(k1); +// let pl2 = i32x16::from_array(k2); +// diff_lanes += (pl1 - pl2).abs(); +// kfill = 0; +// } +// } + +// return diff_lanes.reduce_sum() as u32; +// } -- cgit v1.2.3-70-g09d2