Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 7 additions & 2 deletions common/download.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -511,9 +511,14 @@ static hf_cache::hf_files get_split_files(const hf_cache::hf_files & files,
if (split.count <= 1) {
return {file};
}
hf_cache::hf_files result;

for (const auto & f : files) {
hf_cache::hf_files sorted_files = files;
std::sort(sorted_files.begin(), sorted_files.end(), [](const hf_cache::hf_file & a, const hf_cache::hf_file & b) {
return a.path < b.path;
});

hf_cache::hf_files result;
for (const auto & f : sorted_files) {
auto split_f = get_gguf_split_info(f.path);
if (split_f.count == split.count && split_f.prefix == split.prefix) {
result.push_back(f);
Expand Down
55 changes: 55 additions & 0 deletions tests/test-gguf-model-data.cpp
Original file line number Diff line number Diff line change
@@ -1,6 +1,11 @@
#include "gguf-model-data.h"
#include "common.h"
#include "download.h"
#include "hf-cache.h"

#include <cstdio>
#include <cstdlib>
#include <filesystem>
#include <fstream>

#define TEST_ASSERT(cond, msg) \
do { \
Expand All @@ -10,9 +15,54 @@
} \
} while (0)

static common_download_model_result get_cached_split_files_reverse_order() {
    // Offline split GGUF must return files in sequential order, not filesystem order.
    //
    // Builds a minimal fake HF cache (models--<owner>--<repo>/refs/main pointing at
    // a snapshot directory) containing a 2-way split model whose shards are created
    // in REVERSE order, points LLAMA_CACHE at it, and resolves the model offline.
    // Returns the resolution result for the caller to assert on.
    namespace fs = std::filesystem;

    auto tmp = fs::temp_directory_path() / "llama-test-gguf-model-data";
    fs::remove_all(tmp);
    fs::create_directories(tmp);

    const std::string commit(40, 'a');
    fs::path repo_dir = tmp / "models--testowner--testrepo";
    fs::path snap_dir = repo_dir / "snapshots" / commit;

    fs::create_directories(repo_dir / "refs");
    { std::ofstream f(repo_dir / "refs" / "main"); f << commit; }

    // Create files out of order to confirm sort works
    fs::create_directories(snap_dir);
    { std::ofstream f(snap_dir / "model-Q4_K_M-00002-of-00002.gguf"); }
    { std::ofstream f(snap_dir / "model-Q4_K_M-00001-of-00002.gguf"); }

    // Remember any pre-existing LLAMA_CACHE so we can restore it afterwards
    // instead of unconditionally unsetting it - this test must not leak a
    // changed environment to code that runs after it in the same process.
    const char * prev_cache = std::getenv("LLAMA_CACHE");
    const std::string prev_cache_val = prev_cache ? prev_cache : "";

#ifdef _WIN32
    _putenv_s("LLAMA_CACHE", tmp.string().c_str());
#else
    setenv("LLAMA_CACHE", tmp.string().c_str(), 1);
#endif

    common_params_model model;
    model.hf_repo = "testowner/testrepo";

    common_download_model_opts opts;
    opts.offline = true; // must resolve purely from the local cache, no network

    auto split_result = common_download_model(model, "", opts);

    // Clean up the temp cache and restore LLAMA_CACHE to its pre-test state.
    fs::remove_all(tmp);
#ifdef _WIN32
    // On Windows, setting an empty value removes the variable.
    _putenv_s("LLAMA_CACHE", prev_cache ? prev_cache_val.c_str() : "");
#else
    if (prev_cache) {
        setenv("LLAMA_CACHE", prev_cache_val.c_str(), 1);
    } else {
        unsetenv("LLAMA_CACHE");
    }
#endif

    return split_result;
}

int main() {
fprintf(stderr, "=== test-gguf-model-data ===\n");


// Fetch Qwen3-0.6B Q8_0 metadata
auto result = gguf_fetch_model_meta("ggml-org/Qwen3-0.6B-GGUF", "Q8_0");

Expand Down Expand Up @@ -149,6 +199,11 @@ int main() {
TEST_ASSERT(model4.n_vocab == 128896, "expected n_vocab == 128896");
TEST_ASSERT(model4.tensors.size() == 754, "expected tensor count == 754");

auto split_result = get_cached_split_files_reverse_order();

TEST_ASSERT(!split_result.model_path.empty(), "expected non-empty model path");
TEST_ASSERT(split_result.model_path.find("00001-of-00002") != std::string::npos, "expected first file 00001");

fprintf(stderr, "=== ALL TESTS PASSED ===\n");
return 0;
}