Skip to content

Commit 09954c9

Browse files
tests: add tests for new runner
1 parent 6bd6009 commit 09954c9

File tree

7 files changed

+223
-34
lines changed

7 files changed

+223
-34
lines changed

docs/docs/03-hooks/01-natural-language-processing/useLLM.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -563,4 +563,4 @@ const handleGenerate = async () => {
563563
| [SmolLM 2](https://huggingface.co/software-mansion/react-native-executorch-smolLm-2) | 135M, 360M, 1.7B | ✅ | - |
564564
| [LLaMA 3.2](https://huggingface.co/software-mansion/react-native-executorch-llama-3.2) | 1B, 3B | ✅ | - |
565565
| [LFM2.5-1.2B-Instruct](https://huggingface.co/software-mansion/react-native-executorch-lfm2.5-1.2B-instruct) | 1.2B | ✅ | - |
566-
| [LFM2.5-VL-1.6B](https://huggingface.co/nklockiewicz/lfm2-vl-et) | 1.6B | ✅ | vision |
566+
| [LFM2.5-VL-1.6B](https://huggingface.co/software-mansion/react-native-executorch-lfm2.5-VL-1.6B) | 1.6B | ✅ | vision |

packages/react-native-executorch/common/rnexecutorch/tests/CMakeLists.txt

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -135,6 +135,14 @@ function(add_rn_test TEST_TARGET TEST_FILENAME)
135135
endfunction()
136136

137137
add_rn_test(NumericalTests unit/NumericalTest.cpp)
138+
add_rn_test(RunnerTests unit/RunnerTest.cpp
139+
SOURCES
140+
${COMMON_DIR}/runner/base_llm_runner.cpp
141+
${COMMON_DIR}/runner/sampler.cpp
142+
${COMMON_DIR}/runner/arange_util.cpp
143+
integration/stubs/jsi_stubs.cpp
144+
LIBS tokenizers_deps
145+
)
138146
add_rn_test(LogTests unit/LogTest.cpp)
139147
add_rn_test(FileUtilsTest unit/FileUtilsTest.cpp)
140148
add_rn_test(ImageProcessingTest unit/ImageProcessingTest.cpp

packages/react-native-executorch/common/rnexecutorch/tests/integration/LLMTest.cpp

Lines changed: 84 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -161,54 +161,106 @@ TEST_F(LLMTest, EmptyPromptThrows) {
161161
EXPECT_THROW((void)model.generate("", nullptr), RnExecutorchError);
162162
}
163163

164+
TEST_F(LLMTest, CountTextTokensPositive) {
165+
LLM model(kValidModelPath, kValidTokenizerPath, {}, mockInvoker_);
166+
EXPECT_GT(model.countTextTokens("hello world"), 0);
167+
}
168+
169+
TEST_F(LLMTest, CountTextTokensEmptyString) {
170+
LLM model(kValidModelPath, kValidTokenizerPath, {}, mockInvoker_);
171+
EXPECT_GE(model.countTextTokens(""), 0);
172+
}
173+
174+
TEST_F(LLMTest, GetMaxContextLengthPositive) {
175+
LLM model(kValidModelPath, kValidTokenizerPath, {}, mockInvoker_);
176+
EXPECT_GT(model.getMaxContextLength(), 0);
177+
}
178+
179+
TEST_F(LLMTest, ResetZerosGeneratedTokenCount) {
180+
LLM model(kValidModelPath, kValidTokenizerPath, {}, mockInvoker_);
181+
model.generate(formatChatML(kSystemPrompt, "Hi"), nullptr);
182+
EXPECT_GT(model.getGeneratedTokenCount(), 0);
183+
model.reset();
184+
EXPECT_EQ(model.getGeneratedTokenCount(), 0);
185+
}
186+
187+
TEST_F(LLMTest, PromptTokenCountNonZeroAfterGenerate) {
188+
LLM model(kValidModelPath, kValidTokenizerPath, {}, mockInvoker_);
189+
model.generate(formatChatML(kSystemPrompt, "Hi"), nullptr);
190+
EXPECT_GT(model.getPromptTokenCount(), 0);
191+
}
192+
164193
TEST(VisionEncoderTest, LoadFailsWithClearErrorWhenMethodMissing) {
165194
// smolLm2_135M_8da4w.pte has no vision_encoder method
166195
auto module = std::make_unique<::executorch::extension::Module>(
167196
"smolLm2_135M_8da4w.pte",
168197
::executorch::extension::Module::LoadMode::File);
169198

170199
auto encoder =
171-
std::make_unique<executorch::extension::llm::VisionEncoder>(module.get());
200+
std::make_unique<executorch::extension::llm::VisionEncoder>(*module);
172201

173202
EXPECT_THROW(encoder->load(), rnexecutorch::RnExecutorchError);
174203
}
175204

176-
#include <runner/base_llm_runner.h>
205+
// ============================================================================
206+
// VLM-specific tests
207+
// ============================================================================
208+
constexpr auto kVlmModelPath = "lfm2_5_vl_quantized_xnnpack_v2.pte";
209+
constexpr auto kVlmTokenizerPath = "lfm2_vl_tokenizer.json";
210+
constexpr auto kVlmImageToken = "<image>";
211+
constexpr auto kTestImagePath =
212+
"file:///data/local/tmp/rnexecutorch_tests/test_image.jpg";
213+
214+
TEST_F(LLMTest, TextModelIsNotMultimodal) {
215+
LLM model(kValidModelPath, kValidTokenizerPath, {}, mockInvoker_);
216+
EXPECT_EQ(model.getVisualTokenCount(), 0);
217+
}
218+
219+
TEST_F(LLMTest, GenerateMultimodalOnTextModelThrows) {
220+
LLM model(kValidModelPath, kValidTokenizerPath, {}, mockInvoker_);
221+
EXPECT_THROW(model.generateMultimodal("hello", {}, "<image>", nullptr),
222+
RnExecutorchError);
223+
}
177224

178-
// Minimal concrete subclass — only used in tests to verify base class behavior
179-
class StubRunner : public rnexecutorch::llm::runner::BaseLLMRunner {
180-
public:
181-
using BaseLLMRunner::BaseLLMRunner;
182-
bool is_loaded() const override { return loaded_; }
183-
::executorch::runtime::Error load_subcomponents() override {
184-
loaded_ = true;
185-
return ::executorch::runtime::Error::Ok;
225+
// Fixture that loads the VLM model once for all VLM tests
226+
class VLMTest : public ::testing::Test {
227+
protected:
228+
static void SetUpTestSuite() {
229+
invoker_ = createMockCallInvoker();
230+
model_ =
231+
std::make_unique<LLM>(kVlmModelPath, kVlmTokenizerPath,
232+
std::vector<std::string>{"vision"}, invoker_);
186233
}
187-
::executorch::runtime::Error generate_internal(
188-
const std::vector<::executorch::extension::llm::MultimodalInput> &,
189-
std::function<void(const std::string &)>) override {
190-
return ::executorch::runtime::Error::Ok;
234+
235+
static void TearDownTestSuite() {
236+
model_.reset();
237+
invoker_.reset();
191238
}
192-
void stop_impl() override {}
193-
void set_temperature_impl(float t) override { last_temp_ = t; }
194-
void set_topp_impl(float) override {}
195-
void set_count_interval_impl(size_t) override {}
196-
void set_time_interval_impl(size_t) override {}
197-
198-
bool loaded_ = false;
199-
float last_temp_ = -1.f;
239+
240+
static std::shared_ptr<facebook::react::CallInvoker> invoker_;
241+
static std::unique_ptr<LLM> model_;
200242
};
201243

202-
TEST(BaseLLMRunnerTest, SetTemperatureWritesConfigAndCallsImpl) {
203-
StubRunner runner(nullptr, "dummy_tokenizer.json");
204-
runner.set_temperature(0.5f);
205-
EXPECT_FLOAT_EQ(runner.config_.temperature, 0.5f);
206-
EXPECT_FLOAT_EQ(runner.last_temp_, 0.5f);
244+
std::shared_ptr<facebook::react::CallInvoker> VLMTest::invoker_;
245+
std::unique_ptr<LLM> VLMTest::model_;
246+
247+
TEST_F(VLMTest, GenerateMultimodalEmptyImageTokenThrows) {
248+
EXPECT_THROW(
249+
model_->generateMultimodal("hello", {kTestImagePath}, "", nullptr),
250+
RnExecutorchError);
207251
}
208252

209-
TEST(BaseLLMRunnerTest, ResetZerosPos) {
210-
StubRunner runner(nullptr, "dummy_tokenizer.json");
211-
runner.pos_ = 42;
212-
runner.reset();
213-
EXPECT_EQ(runner.pos_, 0);
253+
TEST_F(VLMTest, GenerateMultimodalMorePlaceholdersThanImagePaths) {
254+
std::string prompt = std::string(kVlmImageToken) + " and " + kVlmImageToken;
255+
EXPECT_THROW(model_->generateMultimodal(prompt, {kTestImagePath},
256+
kVlmImageToken, nullptr),
257+
RnExecutorchError);
258+
}
259+
260+
TEST_F(VLMTest, GenerateMultimodalMoreImagePathsThanPlaceholders) {
261+
std::string prompt = std::string(kVlmImageToken) + " describe";
262+
EXPECT_THROW(model_->generateMultimodal(prompt,
263+
{kTestImagePath, kTestImagePath},
264+
kVlmImageToken, nullptr),
265+
RnExecutorchError);
214266
}
Lines changed: 33 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,33 @@
1+
#pragma once
2+
3+
#include <runner/base_llm_runner.h>
4+
5+
// Minimal concrete subclass of BaseLLMRunner — only used in tests to verify
6+
// base class behavior without a full runner implementation.
7+
class StubRunner : public ::executorch::extension::llm::BaseLLMRunner {
8+
public:
9+
using BaseLLMRunner::BaseLLMRunner;
10+
bool is_loaded() const override { return loaded_; }
11+
::executorch::runtime::Error load_subcomponents() override {
12+
loaded_ = true;
13+
return ::executorch::runtime::Error::Ok;
14+
}
15+
::executorch::runtime::Error generate_internal(
16+
const std::vector<::executorch::extension::llm::MultimodalInput> &,
17+
std::function<void(const std::string &)>) override {
18+
return ::executorch::runtime::Error::Ok;
19+
}
20+
void stop_impl() override {}
21+
void set_temperature_impl(float t) override { last_temp_ = t; }
22+
void set_topp_impl(float) override {}
23+
void set_count_interval_impl(size_t) override {}
24+
void set_time_interval_impl(size_t) override {}
25+
26+
int32_t resolve_max(int32_t prompt, int32_t seq_len, int32_t ctx_len,
27+
int32_t max_new = -1) const {
28+
return resolve_max_new_tokens(prompt, seq_len, ctx_len, max_new);
29+
}
30+
31+
bool loaded_ = false;
32+
float last_temp_ = -1.f;
33+
};

packages/react-native-executorch/common/rnexecutorch/tests/run_tests.sh

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@ MODELS_DIR="$SCRIPT_DIR/integration/assets/models"
1616
# ============================================================================
1717
TEST_EXECUTABLES=(
1818
"NumericalTests"
19+
"RunnerTests"
1920
"LogTests"
2021
"FileUtilsTest"
2122
"ImageProcessingTest"
@@ -67,6 +68,9 @@ MODELS=(
6768
"t2i_encoder.pte|https://huggingface.co/software-mansion/react-native-executorch-bk-sdm-tiny/resolve/v0.6.0/text_encoder/model.pte"
6869
"t2i_unet.pte|https://huggingface.co/software-mansion/react-native-executorch-bk-sdm-tiny/resolve/v0.6.0/unet/model.256.pte"
6970
"t2i_decoder.pte|https://huggingface.co/software-mansion/react-native-executorch-bk-sdm-tiny/resolve/v0.6.0/vae/model.256.pte"
71+
"lfm2_5_vl_quantized_xnnpack_v2.pte|https://huggingface.co/software-mansion/react-native-executorch-lfm2.5-VL-1.6B/resolve/main/quantized/lfm2_5_vl_1_6b_8da4w_xnnpack.pte"
72+
"lfm2_vl_tokenizer.json|https://huggingface.co/software-mansion/react-native-executorch-lfm2.5-VL-1.6B/resolve/main/tokenizer.json"
73+
"lfm2_vl_tokenizer_config.json|https://huggingface.co/software-mansion/react-native-executorch-lfm2.5-VL-1.6B/resolve/main/tokenizer_config.json"
7074
)
7175

7276
# ============================================================================
Lines changed: 91 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,91 @@
1+
#include "../integration/stubs/StubRunner.h"
2+
#include <gtest/gtest.h>
3+
#include <runner/irunner.h>
4+
#include <runner/multimodal_input.h>
5+
6+
using namespace executorch::extension::llm;
7+
8+
// ============================================================================
9+
// resolve_max_new_tokens tests
10+
// ============================================================================
11+
12+
class ResolveMaxNewTokensTest : public ::testing::Test {
13+
protected:
14+
StubRunner runner{nullptr, "dummy"};
15+
};
16+
17+
TEST_F(ResolveMaxNewTokensTest, BothMinusOne_UsesContextMinusPrompt) {
18+
EXPECT_EQ(runner.resolve_max(10, -1, 128, -1), 118);
19+
}
20+
21+
TEST_F(ResolveMaxNewTokensTest, OnlySeqLenMinusOne_CapsAtMaxNew) {
22+
EXPECT_EQ(runner.resolve_max(10, -1, 128, 50), 50);
23+
EXPECT_EQ(runner.resolve_max(10, -1, 128, 200), 118);
24+
}
25+
26+
TEST_F(ResolveMaxNewTokensTest, OnlyMaxNewMinusOne_CapsAtSeqLen) {
27+
EXPECT_EQ(runner.resolve_max(10, 64, 128, -1), 54);
28+
EXPECT_EQ(runner.resolve_max(10, 200, 128, -1), 118);
29+
}
30+
31+
TEST_F(ResolveMaxNewTokensTest, NeitherMinusOne_TakesSmallest) {
32+
EXPECT_EQ(runner.resolve_max(10, 64, 128, 30), 30);
33+
EXPECT_EQ(runner.resolve_max(10, 64, 128, 100), 54);
34+
}
35+
36+
TEST_F(ResolveMaxNewTokensTest, ClampedToZeroWhenPromptExceedsContext) {
37+
EXPECT_EQ(runner.resolve_max(200, -1, 128, -1), 0);
38+
EXPECT_EQ(runner.resolve_max(200, 64, 128, -1), 0);
39+
}
40+
41+
// ============================================================================
42+
// MultimodalInput edge cases
43+
// ============================================================================
44+
45+
TEST(MultimodalInputTest, GetTextOnImageThrows) {
46+
auto input = make_image_input("/some/path.jpg");
47+
EXPECT_THROW(input.get_text(), std::bad_variant_access);
48+
}
49+
50+
TEST(MultimodalInputTest, GetImagePathOnTextThrows) {
51+
MultimodalInput input(std::string("hello"));
52+
EXPECT_THROW(input.get_image_path(), std::bad_variant_access);
53+
}
54+
55+
TEST(MultimodalInputTest, EmptyStringIsStillText) {
56+
MultimodalInput input(std::string(""));
57+
EXPECT_TRUE(input.is_text());
58+
EXPECT_EQ(input.get_text(), "");
59+
}
60+
61+
// ============================================================================
62+
// BaseLLMRunner via StubRunner
63+
// ============================================================================
64+
65+
TEST(BaseLLMRunnerTest, SetTemperatureUpdatesConfigAndCallsImpl) {
66+
StubRunner runner(nullptr, "dummy");
67+
runner.set_temperature(0.42f);
68+
EXPECT_FLOAT_EQ(runner.config_.temperature, 0.42f);
69+
EXPECT_FLOAT_EQ(runner.last_temp_, 0.42f);
70+
}
71+
72+
TEST(BaseLLMRunnerTest, SetToppUpdatesConfig) {
73+
StubRunner runner(nullptr, "dummy");
74+
runner.set_topp(0.7f);
75+
EXPECT_FLOAT_EQ(runner.config_.topp, 0.7f);
76+
}
77+
78+
TEST(BaseLLMRunnerTest, ResetZerosPosAndStats) {
79+
StubRunner runner(nullptr, "dummy");
80+
runner.pos_ = 99;
81+
runner.stats_.num_generated_tokens = 5;
82+
runner.reset();
83+
EXPECT_EQ(runner.pos_, 0);
84+
EXPECT_EQ(runner.stats_.num_generated_tokens, 0);
85+
}
86+
87+
TEST(BaseLLMRunnerTest, GenerateEmptyStringReturnsError) {
88+
StubRunner runner(nullptr, "dummy");
89+
auto err = runner.generate("", {}, {}, {});
90+
EXPECT_NE(err, ::executorch::runtime::Error::Ok);
91+
}

packages/react-native-executorch/common/runner/base_llm_runner.cpp

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -86,7 +86,8 @@ Error BaseLLMRunner::generate(
8686
std::function<void(const std::string &)> token_callback,
8787
std::function<void(const Stats &)> stats_callback) {
8888

89-
ET_CHECK_MSG(!prompt.empty(), "Prompt cannot be null");
89+
ET_CHECK_OR_RETURN_ERROR(!prompt.empty(), InvalidArgument,
90+
"Prompt cannot be null");
9091

9192
std::vector<MultimodalInput> inputs = {make_text_input(prompt)};
9293
auto err = generate_internal(inputs, token_callback);

0 commit comments

Comments
 (0)