From d0ce1d9134968a15d37135622138f6b8b7667454 Mon Sep 17 00:00:00 2001 From: metamuffin Date: Wed, 20 Sep 2023 21:40:05 +0200 Subject: replace cosinesim with L2-norm euclidean --- src/embedders/vecmetric.rs | 13 ++++++------- 1 file changed, 6 insertions(+), 7 deletions(-) (limited to 'src') diff --git a/src/embedders/vecmetric.rs b/src/embedders/vecmetric.rs index 0c63911..1bda3a8 100644 --- a/src/embedders/vecmetric.rs +++ b/src/embedders/vecmetric.rs @@ -19,15 +19,14 @@ impl VecMetric for ManhattenDistance {} impl MetricElem for CosineSimilarity { fn dist(&self, other: &Self) -> f64 { - let x = self - .0 + let len_a = self.0.iter().map(|x| x.powi(2)).sum::<f32>().sqrt(); + let len_b = other.0.iter().map(|x| x.powi(2)).sum::<f32>().sqrt(); + self.0 .iter() .zip(other.0.iter()) - .map(|(a, b)| *a * *b) - .sum::<f32>(); - let mag_a = self.0.iter().map(|x| x.powi(2)).sum::<f32>(); - let mag_b = other.0.iter().map(|x| x.powi(2)).sum::<f32>(); - (x / (mag_a * mag_b).sqrt()) as f64 + .map(|(a, b)| (*a / len_a - *b / len_b).powi(2)) + .sum::<f32>() + .sqrt() as f64 } } impl MetricElem for EuclidianDistance { -- cgit v1.2.3-70-g09d2