
Commit 5c83b84

perf: add SIMD-accelerated u8 L2 and cosine distance kernels (#6517)
## Summary

- Add hand-written AVX2 and AVX-512 VNNI backends for u8 squared L2 distance (`Σ(a-b)²`) in new `l2_u8.rs`
- Add fused single-pass u8 cosine distance kernel in new `cosine_u8.rs` — computes `dot(a,b)`, `‖a‖²`, `‖b‖²` simultaneously, halving memory traffic vs the previous 2–3-pass approach
- Wire both into the `L2 for u8` and `Cosine for u8` trait impls
- Add benchmarks comparing scalar vs SIMD for both kernels

### Algorithmic approach (adapted from [NumKong](https://github.com/ashvardanian/NumKong))

**L2 (AVX2):** Saturating subtraction for `|a-b|`, zero-extend u8→i16, `VPMADDWD(diff, diff)` to square and accumulate into i32. 32 elements/iter.

**L2 (AVX-512 VNNI):** Same abs-diff approach with `VPDPWSSD` for fused square-accumulate. 64 elements/iter.

**Cosine (AVX2):** Zero-extend both vectors to i16, triple `VPMADDWD` per half (a·b, a·a, b·b). 32 elements/iter, single pass.

**Cosine (AVX-512 VNNI):** Same three-accumulator approach with `VPDPWSSD`. 64 elements/iter.

Both kernels use `OnceLock`-based runtime CPU dispatch, falling back to portable scalar on non-x86 platforms.

### Benchmarks

*1M × 1024-dim u8 vectors.*

**x86_64 — AMD Ryzen 5 4500 6-Core (AVX2, no AVX-512)**

| Kernel | Scalar | SIMD | Speedup |
|--------|--------|------|---------|
| L2(u8) | 73.5 ms | 58.2 ms | **1.26x** |
| Cosine(u8) | 122.2 ms | 82.1 ms | **1.49x** |

The L2 auto-vectorization baseline was 91.5 ms, so SIMD is 1.57x faster than that path.

**aarch64 — Apple Silicon M3 Max (no AVX2, scalar fallback)**

| Kernel | Scalar | SIMD (dispatch) |
|--------|--------|-----------------|
| L2(u8) | 26.8 ms | 27.3 ms |
| Cosine(u8) | 90.1 ms | 90.4 ms |

On aarch64 the SIMD path falls through to scalar (no AVX2), so times are identical — this confirms no regression on non-x86 platforms. AVX-512 VNNI systems (Ice Lake+, Zen 4+) should see larger gains.
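The fused single-pass cosine accumulation and the `OnceLock` dispatch described above can be sketched in portable Rust. This is a minimal illustration, not the crate's actual code: the names mirror the PR's `cosine_u8`/`cosine_u8_scalar`, but the bodies are assumptions, and the dispatch here simply falls back to the scalar kernel where a real build would install the AVX2 one.

```rust
use std::sync::OnceLock;

type CosineFn = fn(&[u8], &[u8]) -> f32;

/// Portable scalar fallback: fused single pass that accumulates
/// dot(a,b), ||a||^2 and ||b||^2 together, so each input byte is
/// loaded exactly once (u32 accumulators are safe up to ~66k dims).
fn cosine_u8_scalar(a: &[u8], b: &[u8]) -> f32 {
    assert_eq!(a.len(), b.len());
    let (mut dot, mut aa, mut bb) = (0u32, 0u32, 0u32);
    for (&x, &y) in a.iter().zip(b) {
        let (x, y) = (x as u32, y as u32);
        dot += x * y;
        aa += x * x;
        bb += y * y;
    }
    if aa == 0 || bb == 0 {
        return 1.0; // convention for a zero vector
    }
    1.0 - dot as f32 / ((aa as f32).sqrt() * (bb as f32).sqrt())
}

/// OnceLock-based dispatch: probe CPU features once, then route every
/// call through the cached function pointer.
fn cosine_u8(a: &[u8], b: &[u8]) -> f32 {
    static KERNEL: OnceLock<CosineFn> = OnceLock::new();
    let f = KERNEL.get_or_init(|| {
        #[cfg(target_arch = "x86_64")]
        if is_x86_feature_detected!("avx2") {
            // a real build would return the AVX2 kernel here
            return cosine_u8_scalar;
        }
        cosine_u8_scalar
    });
    f(a, b)
}

fn main() {
    let a = vec![3u8; 1024];
    println!("{:.3}", cosine_u8(&a, &a)); // identical vectors -> 0.000
}
```

The three-accumulator loop is what the AVX2 kernel vectorizes with three `VPMADDWD` issues per half-register; the scalar form already shows why one pass halves memory traffic versus computing the norms separately.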
## Test plan

- [x] All 11 new tests pass: SIMD backends verified against scalar reference across 18 vector sizes (0–4097), boundary values (0/255), alternating patterns, random seeds
- [x] All 63 existing lance-linalg tests pass (no regressions)
- [x] Clippy clean, fmt clean
- [x] Benchmarked on x86_64 AVX2 (AMD Ryzen 5 4500) — L2 1.26x, Cosine 1.49x faster
- [ ] Verify on AVX-512 VNNI system for additional speedup data

🤖 Generated with [Claude Code](https://claude.com/claude-code)

---------

Co-authored-by: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
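The scalar-reference verification in the test plan rests on the saturating-subtraction identity the L2 kernels use. Here is a minimal sketch (hypothetical helper names, not the crate's API) cross-checking the branch-free formulation against a direct widened subtraction, including the 0/255 boundary values:

```rust
/// Direct scalar reference: widen to i32, subtract, square, accumulate.
fn l2_u8_reference(a: &[u8], b: &[u8]) -> u32 {
    a.iter()
        .zip(b)
        .map(|(&x, &y)| {
            let d = x as i32 - y as i32;
            (d * d) as u32
        })
        .sum()
}

/// Branch-free |a-b| via two saturating subtractions. This is the
/// per-lane identity the AVX2 kernel (VPSUBUSB, then VPMADDWD) relies
/// on: exactly one of the two saturating subtractions is nonzero, so
/// OR-ing them yields the absolute difference.
fn l2_u8_satsub(a: &[u8], b: &[u8]) -> u32 {
    a.iter()
        .zip(b)
        .map(|(&x, &y)| {
            let d = (x.saturating_sub(y) | y.saturating_sub(x)) as u32;
            d * d
        })
        .sum()
}

fn main() {
    // boundary values (0/255) and mixed magnitudes, as in the test plan
    let a = [0u8, 255, 7, 200];
    let b = [255u8, 0, 9, 100];
    assert_eq!(l2_u8_reference(&a, &b), l2_u8_satsub(&a, &b));
    println!("{}", l2_u8_satsub(&a, &b)); // prints 140054
}
```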
1 parent 65ac541 commit 5c83b84

7 files changed

Lines changed: 699 additions & 2 deletions


rust/lance-linalg/benches/cosine.rs

Lines changed: 37 additions & 0 deletions
```diff
@@ -8,6 +8,7 @@ use arrow_array::{
 use criterion::{Criterion, black_box, criterion_group, criterion_main};
 use lance_arrow::{ArrowFloatType, FloatArray, bfloat16::BFloat16Type};
 use lance_linalg::distance::cosine::{Cosine, cosine_distance_batch};
+use lance_linalg::distance::cosine_u8::{cosine_u8, cosine_u8_scalar};
 use num_traits::Float;

 #[cfg(target_os = "linux")]
@@ -76,6 +77,42 @@ fn bench_distance(c: &mut Criterion) {
             black_box(cosine_distance_batch(key.values(), target.values(), 8).collect::<Vec<_>>())
         })
     });
+
+    // u8 cosine benchmarks
+    {
+        use rand::Rng;
+        use std::iter::repeat_with;
+
+        const DIMENSION: usize = 1024;
+        const TOTAL: usize = 1024 * 1024;
+        let mut rng = rand::rng();
+        let key_u8: Vec<u8> = repeat_with(|| rng.random()).take(DIMENSION).collect();
+        let target_u8: Vec<u8> = repeat_with(|| rng.random())
+            .take(TOTAL * DIMENSION)
+            .collect();
+
+        c.bench_function("Cosine(u8, scalar)", |b| {
+            b.iter(|| {
+                black_box(
+                    target_u8
+                        .chunks_exact(DIMENSION)
+                        .map(|tgt| cosine_u8_scalar(&key_u8, tgt))
+                        .fold(0.0, |acc: f32, v| acc + v),
+                );
+            });
+        });
+
+        c.bench_function("Cosine(u8, SIMD)", |b| {
+            b.iter(|| {
+                black_box(
+                    target_u8
+                        .chunks_exact(DIMENSION)
+                        .map(|tgt| cosine_u8(&key_u8, tgt))
+                        .fold(0.0, |acc: f32, v| acc + v),
+                );
+            });
+        });
+    }
 }

 #[cfg(target_os = "linux")]
```

rust/lance-linalg/benches/l2.rs

Lines changed: 12 additions & 0 deletions
```diff
@@ -15,6 +15,7 @@ use rand::Rng;
 use pprof::criterion::{Output, PProfProfiler};

 use lance_arrow::{ArrowFloatType, FloatArray};
+use lance_linalg::distance::l2_u8::l2_u8;
 use lance_linalg::distance::{L2, l2::l2, l2_distance_batch, l2_distance_uint_scalar};
 use lance_testing::datagen::generate_random_array_with_seed;

@@ -157,6 +158,17 @@ fn bench_uint_distance(c: &mut Criterion) {
            );
        });
    });
+
+    c.bench_function("L2(u8, SIMD)", |b| {
+        b.iter(|| {
+            black_box(
+                target
+                    .chunks_exact(DIMENSION)
+                    .map(|tgt| l2_u8(&key, tgt) as f32)
+                    .fold(0.0, |acc, v| acc + v),
+            );
+        });
+    });
 }

 #[cfg(target_os = "linux")]
```

rust/lance-linalg/src/distance.rs

Lines changed: 2 additions & 0 deletions
```diff
@@ -17,9 +17,11 @@ use arrow_array::{Array, ArrowPrimitiveType, FixedSizeListArray, Float32Array, L
 use arrow_schema::{ArrowError, DataType};

 pub mod cosine;
+pub mod cosine_u8;
 pub mod dot;
 pub mod hamming;
 pub mod l2;
+pub mod l2_u8;
 pub mod norm_l2;

 pub use cosine::*;
```

rust/lance-linalg/src/distance/cosine.rs

Lines changed: 6 additions & 1 deletion
```diff
@@ -65,7 +65,12 @@ pub trait Cosine: Dot + Normalize {
     }
 }

-impl Cosine for u8 {}
+impl Cosine for u8 {
+    #[inline]
+    fn cosine(x: &[Self], other: &[Self]) -> f32 {
+        super::cosine_u8::cosine_u8(x, other)
+    }
+}

 impl Cosine for bf16 {}
```