vcache-project
diff --git a/‎.gitignore‎
Lines changed: 2 additions & 1 deletion b/‎.gitignore‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎benchmarks/_plotter_combined.py‎
Lines changed: 1 addition & 1 deletion b/‎benchmarks/_plotter_combined.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/_plotter_helper.py‎
Lines changed: 1 addition & 1 deletion b/‎benchmarks/_plotter_helper.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/_plotter_individual.py‎
Lines changed: 1 addition & 1 deletion b/‎benchmarks/_plotter_individual.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/benchmark.py‎
Lines changed: 1 addition & 1 deletion b/‎benchmarks/benchmark.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎poetry.lock‎
Lines changed: 77 additions & 4 deletions b/‎poetry.lock‎
Lines changed: 77 additions & 4 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 3 additions & 0 deletions b/‎pyproject.toml‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎tests/ReadMe.md‎
Lines changed: 4 additions & 22 deletions b/‎tests/ReadMe.md‎
Lines changed: 4 additions & 22 deletions
diff --git a/‎tests/integration/test_1.py‎
Lines changed: 1 addition & 0 deletions b/‎tests/integration/test_1.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎tests/integration/test_dynamic_threshold.py‎
Lines changed: 94 additions & 0 deletions b/‎tests/integration/test_dynamic_threshold.py‎
Lines changed: 94 additions & 0 deletions
@@ -12,4 +12,5 @@ benchmarks/results/*
 temp/*
 *.log
 bin/*
-.venv/
+.venv/
+.env
@@ -963,4 +963,4 @@ def __plot_delta_accuracy(
 
     filename = results_dir + f"/delta_accuracy_{timestamp}.pdf"
     plt.savefig(filename, format="pdf", bbox_inches="tight")
-    plt.close()
+    plt.close()
@@ -330,4 +330,4 @@ def compute_avg_latency_score(latency_list: pd.DataFrame) -> float:
     Returns:
         avg_latency: float - Average Latency 0.xx
     """
-    return latency_list.mean()
+    return latency_list.mean()
@@ -341,4 +341,4 @@ def __plot_avg_latency_cache_hit_rate_cache_miss_rate(
     filename = benchmark.output_folder_path + f"/statistics_{benchmark.timestamp}.json"
 
     with open(filename, "w") as f:
-        json.dump(statistics, f, indent=4)
+        json.dump(statistics, f, indent=4)
@@ -582,4 +582,4 @@ def main():
 
 
 if __name__ == "__main__":
-    main()
+    main()
@@ -22,6 +22,8 @@ dependencies = [
     "accelerate (>=1.6.0,<2.0.0)",
     "typing-extensions (>=4.13.2,<5.0.0)",
     "torchvision (>=0.22.0,<0.23.0)",
+    "torchvision (>=0.22.0,<0.23.0)",
+    "statsmodels (>=0.14.4,<0.15.0)",
 ]
 
 
@@ -44,6 +46,7 @@ ruff = "^0.11.6"
 mypy = "^1.15.0"
 pre-commit = "^4.2.0"
 pytest = "^8.0.0"
+python-dotenv = "^1.1.0"
 
 
 [tool.ruff]
 
@@ -6,27 +6,9 @@ The unit tests are supposed to solely test the logic of an individual module strate
 ## Integration Tests
 The integration tests are supposed to test the combination and interaction of all module strategies.
 
-## Run All Tests
+### Run Integration Tests
+Set `OPENAI_API_KEY` in `.env`, then run:
 
-```bash
-pip install -e .
-```
-
-```bash
-export OPENAI_API_KEY="your_api_key_here"
-```
-
-```bash
-python3 runner.py
-```
-
-## Run Individual Tests
-
-```bash
-pytest unit/VectorDBStrategy/test.py
-```
-
-With print terminal output enabled
-```bash
-pytest -vs unit/VectorDBStrategy/test.py
+```bash
+poetry run pytest tests/integration
 ```
@@ -58,3 +58,4 @@ class TestVectorQIntegration(unittest.TestCase):
 if __name__ == "__main__":
     # unittest.main()
     pass
+
@@ -0,0 +1,94 @@
+import unittest
+
+from dotenv import load_dotenv
+
+from vectorq import (
+    DynamicThresholdPolicy,
+    HNSWLibVectorDB,
+    InMemoryEmbeddingMetadataStorage,
+    LangChainEmbeddingEngine,
+    OpenAIInferenceEngine,
+    StringComparisonSimilarityEvaluator,
+    VectorQ,
+    VectorQConfig,
+)
+
+load_dotenv()
+
+
+def create_default_config_and_policy():
+    config = VectorQConfig(
+        inference_engine=OpenAIInferenceEngine(
+            model_name="gpt-4.1-nano-2025-04-14",
+            temperature=0.0,
+        ),
+        embedding_engine=LangChainEmbeddingEngine(
+            model_name="sentence-transformers/all-mpnet-base-v2"
+        ),
+        vector_db=HNSWLibVectorDB(),
+        embedding_metadata_storage=InMemoryEmbeddingMetadataStorage(),
+        system_prompt="Please answer in a single word with the first letter capitalized. Example: London",
+    )
+    policy = DynamicThresholdPolicy(
+        delta=0.05,
+        is_global=False,
+        similarity_evaluator=StringComparisonSimilarityEvaluator(),
+    )
+    return config, policy
+
+
+class TestVectorQDynamicThreshold(unittest.TestCase):
+    def test_basic_functionality(self):
+        """Test that the cache correctly identifies hits and misses."""
+        config, policy = create_default_config_and_policy()
+        vectorq = VectorQ(config, policy)
+
+        # First request should be a miss
+        cache_hit, response, _ = vectorq.infer_with_cache_info(
+            prompt="What is the capital of France?"
+        )
+        self.assertFalse(cache_hit, "First request should be a cache miss")
+        self.assertTrue(len(response) > 0, "Response should not be empty")
+
+        # Requests 2 through 5 should be misses because the policy is still adjusting the threshold
+        cache_hit, response, _ = vectorq.infer_with_cache_info(
+            prompt="What's France's capital city?"
+        )
+        self.assertFalse(cache_hit, "Second request should be a cache miss")
+        self.assertTrue(len(response) > 0, "Response should not be empty")
+        cache_hit, response, _ = vectorq.infer_with_cache_info(
+            prompt="France's capital city is called what?"
+        )
+        self.assertFalse(cache_hit, "Third request should be a cache miss")
+        self.assertTrue(len(response) > 0, "Response should not be empty")
+        cache_hit, response, _ = vectorq.infer_with_cache_info(
+            prompt="Tell me the capital city of France"
+        )
+        cache_hit, response, _ = vectorq.infer_with_cache_info(
+            prompt="Which city is the capital of France?"
+        )
+
+        # After several tries with the Bayesian policy, we should now get a hit
+        cache_hit, response, _ = vectorq.infer_with_cache_info(
+            prompt="The capital of France is?"
+        )
+        self.assertTrue(cache_hit, "Similar request should now be a cache hit")
+        self.assertTrue(len(response) > 0, "Response should not be empty")
+
+        cache_hit, response, _ = vectorq.infer_with_cache_info(
+            prompt="Can you tell me what the capital of France is?"
+        )
+        self.assertTrue(cache_hit, "Similar request should now be a cache hit")
+        self.assertTrue(len(response) > 0, "Response should not be empty")
+
+    def test_high_delta(self):
+        # TODO: Implement this
+        self.assertTrue(True)
+
+    def test_low_delta(self):
+        # TODO: Implement this
+        self.assertTrue(True)
+
+
+if __name__ == "__main__":
+    unittest.main()
-Original file line number
+Diff line change
 temp/*
 *.log
 bin/*
 -.venv/
 +.venv/
 +.env
Original file line number	Diff line number	Diff line change
`@@ -582,4 +582,4 @@ def main():`
`582`	`582`
`583`	`583`
`584`	`584`	`if __name__ == "__main__":`
`585`		`- main()`
	`585`	`+ main()`