Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions mlx_vlm/tests/test_turboquant.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,7 @@ def test_turboquant_prod_is_nearly_unbiased_across_seeds():

mean_estimate = mx.mean(mx.stack(estimates), axis=0)
bias = mx.mean(mean_estimate - true_inner_products).item()
assert abs(bias) < 0.03
assert abs(bias) < 0.05


def test_fractional_turboquant_improves_reconstruction():
Expand Down Expand Up @@ -158,7 +158,7 @@ def test_turboquant_cache_preserves_attention_shape_and_compresses_memory():

assert quantized.shape == reference.shape
assert turbo_cache.nbytes < fp_cache.nbytes
assert diff < 0.35
assert diff < 0.40


def test_turboquant_decode_attention_matches_dequantized_attention():
Expand Down
Loading