-package org.beehive.gpullama3.cli;
-
-import org.beehive.gpullama3.Options;
-import org.beehive.gpullama3.auxiliary.LastRunMetrics;
-import org.beehive.gpullama3.inference.sampler.Sampler;
-import org.beehive.gpullama3.model.Model;
-
-import java.io.IOException;
-
-import static org.beehive.gpullama3.inference.sampler.Sampler.createSampler;
-import static org.beehive.gpullama3.model.loader.ModelLoader.loadModel;
-
-/**
- * LlamaTornadoCli - Pure Java CLI for running llama-tornado models
- *
- * This class provides a standalone command-line interface for running LLaMA models
- * with TornadoVM acceleration. This version is compiled as part of the Maven build.
- *
- * For JBang usage, use the LlamaTornadoCli.java file in the root directory.
- *
- * Usage as compiled application:
- *   java --enable-preview --add-modules jdk.incubator.vector \
- *        -cp target/gpu-llama3-0.3.1.jar \
- *        org.beehive.gpullama3.cli.LlamaTornadoCli \
- *        --model path/to/model.gguf --prompt "Your prompt here"
- *
- * Examples:
- *   # Interactive chat mode
- *   java -cp target/gpu-llama3-0.3.1.jar \
- *        org.beehive.gpullama3.cli.LlamaTornadoCli \
- *        -m model.gguf --interactive
- *
- *   # Single instruction mode
- *   java -cp target/gpu-llama3-0.3.1.jar \
- *        org.beehive.gpullama3.cli.LlamaTornadoCli \
- *        -m model.gguf -p "Explain quantum computing"
- *
- *   # With TornadoVM acceleration (requires TornadoVM runtime setup)
- *   java -cp target/gpu-llama3-0.3.1.jar \
- *        org.beehive.gpullama3.cli.LlamaTornadoCli \
- *        -m model.gguf -p "Hello" --use-tornadovm true
- */
-public class LlamaTornadoCli {
-
-    // Configuration flags
-    public static final boolean USE_VECTOR_API = Boolean.parseBoolean(
-            System.getProperty("llama.VectorAPI", "true"));
-    public static final boolean SHOW_PERF_INTERACTIVE = Boolean.parseBoolean(
-            System.getProperty("llama.ShowPerfInteractive", "true"));
-
-    /**
-     * Run a single instruction and display the response
-     */
-    private static void runSingleInstruction(Model model, Sampler sampler, Options options) {
-        String response = model.runInstructOnce(sampler, options);
-        System.out.println(response);
-        if (SHOW_PERF_INTERACTIVE) {
-            LastRunMetrics.printMetrics();
-        }
-    }
-
-    /**
-     * Main entry point for the CLI application
-     *
-     * @param args command-line arguments (see Options.parseOptions for details)
-     * @throws IOException if model loading fails
-     */
-    public static void main(String[] args) throws IOException {
-        // Print banner
-        printBanner();
-
-        // Check if help requested
-        if (args.length == 0 || hasHelpFlag(args)) {
-            Options.printUsage(System.out);
-            System.exit(0);
-        }
-
-        try {
-            // Parse options
-            Options options = Options.parseOptions(args);
-
-            // Load model
-            System.out.println("Loading model from: " + options.modelPath());
-            Model model = loadModel(options);
-            System.out.println("Model loaded successfully!");
-
-            // Create sampler
-            Sampler sampler = createSampler(model, options);
-
-            // Run in interactive or single-instruction mode
-            if (options.interactive()) {
-                System.out.println("Starting interactive chat mode...");
-                System.out.println("Type your messages below (Ctrl+C to exit):");
-                System.out.println();
-                model.runInteractive(sampler, options);
-            } else {
-                runSingleInstruction(model, sampler, options);
-            }
-        } catch (Exception e) {
-            System.err.println("Error: " + e.getMessage());
-            e.printStackTrace();
-            System.exit(1);
-        }
-    }
-
-    /**
-     * Check if help flag is present in arguments
-     */
-    private static boolean hasHelpFlag(String[] args) {
-        for (String arg : args) {
-            if (arg.equals("--help") || arg.equals("-h")) {
-                return true;
-            }
-        }
-        return false;
-    }
-
-    /**
-     * Print ASCII banner
-     */
-    private static void printBanner() {
-        System.out.println("""
-                ╔══════════════════════════════════════════════════════════╗
-                ║     Llama-Tornado CLI - GPU-Accelerated LLM              ║
-                ║     Powered by TornadoVM & Java 21                       ║
-                ╚══════════════════════════════════════════════════════════╝
-                """);
-    }
-}
+//package org.beehive.gpullama3.cli;
+//
+//import org.beehive.gpullama3.Options;
+//import org.beehive.gpullama3.auxiliary.LastRunMetrics;
+//import org.beehive.gpullama3.inference.sampler.Sampler;
+//import org.beehive.gpullama3.model.Model;
+//
+//import java.io.IOException;
+//
+//import static org.beehive.gpullama3.inference.sampler.Sampler.createSampler;
+//import static org.beehive.gpullama3.model.loader.ModelLoader.loadModel;
+//
+///**
+// * LlamaTornadoCli - Pure Java CLI for running llama-tornado models
+// *
+// * This class provides a standalone command-line interface for running LLaMA models
+// * with TornadoVM acceleration. This version is compiled as part of the Maven build.
+// *
+// * For JBang usage, use the LlamaTornadoCli.java file in the root directory.
+// *
+// * Usage as compiled application:
+// *   java --enable-preview --add-modules jdk.incubator.vector \
+// *        -cp target/gpu-llama3-0.3.1.jar \
+// *        org.beehive.gpullama3.cli.LlamaTornadoCli \
+// *        --model path/to/model.gguf --prompt "Your prompt here"
+// *
+// * Examples:
+// *   # Interactive chat mode
+// *   java -cp target/gpu-llama3-0.3.1.jar \
+// *        org.beehive.gpullama3.cli.LlamaTornadoCli \
+// *        -m model.gguf --interactive
+// *
+// *   # Single instruction mode
+// *   java -cp target/gpu-llama3-0.3.1.jar \
+// *        org.beehive.gpullama3.cli.LlamaTornadoCli \
+// *        -m model.gguf -p "Explain quantum computing"
+// *
+// *   # With TornadoVM acceleration (requires TornadoVM runtime setup)
+// *   java -cp target/gpu-llama3-0.3.1.jar \
+// *        org.beehive.gpullama3.cli.LlamaTornadoCli \
+// *        -m model.gguf -p "Hello" --use-tornadovm true
+// */
+//public class LlamaTornadoCli {
+//
+//    // Configuration flags
+//    public static final boolean USE_VECTOR_API = Boolean.parseBoolean(
+//            System.getProperty("llama.VectorAPI", "true"));
+//    public static final boolean SHOW_PERF_INTERACTIVE = Boolean.parseBoolean(
+//            System.getProperty("llama.ShowPerfInteractive", "true"));
+//
+//    /**
+//     * Run a single instruction and display the response
+//     */
+//    private static void runSingleInstruction(Model model, Sampler sampler, Options options) {
+//        String response = model.runInstructOnce(sampler, options);
+//        System.out.println(response);
+//        if (SHOW_PERF_INTERACTIVE) {
+//            LastRunMetrics.printMetrics();
+//        }
+//    }
+//
+//    /**
+//     * Main entry point for the CLI application
+//     *
+//     * @param args command-line arguments (see Options.parseOptions for details)
+//     * @throws IOException if model loading fails
+//     */
+//    public static void main(String[] args) throws IOException {
+//        // Print banner
+//        printBanner();
+//
+//        // Check if help requested
+//        if (args.length == 0 || hasHelpFlag(args)) {
+////            Options.printUsage(System.out);
+//            System.exit(0);
+//        }
+//
+//        try {
+//            // Parse options
+//            Options options = Options.parseOptions(args);
+//
+//            // Load model
+//            System.out.println("Loading model from: " + options.modelPath());
+//            Model model = loadModel(options);
+//            System.out.println("Model loaded successfully!");
+//
+//            // Create sampler
+//            Sampler sampler = createSampler(model, options);
+//
+//            // Run in interactive or single-instruction mode
+//            if (options.interactive()) {
+//                System.out.println("Starting interactive chat mode...");
+//                System.out.println("Type your messages below (Ctrl+C to exit):");
+//                System.out.println();
+//                model.runInteractive(sampler, options);
+//            } else {
+//                runSingleInstruction(model, sampler, options);
+//            }
+//        } catch (Exception e) {
+//            System.err.println("Error: " + e.getMessage());
+//            e.printStackTrace();
+//            System.exit(1);
+//        }
+//    }
+//
+//    /**
+//     * Check if help flag is present in arguments
+//     */
+//    private static boolean hasHelpFlag(String[] args) {
+//        for (String arg : args) {
+//            if (arg.equals("--help") || arg.equals("-h")) {
+//                return true;
+//            }
+//        }
+//        return false;
+//    }
+//
+//    /**
+//     * Print ASCII banner
+//     */
+//    private static void printBanner() {
+//        System.out.println("""
+//                ╔══════════════════════════════════════════════════════════╗
+//                ║     Llama-Tornado CLI - GPU-Accelerated LLM              ║
+//                ║     Powered by TornadoVM & Java 21                       ║
+//                ╚══════════════════════════════════════════════════════════╝
+//                """);
+//    }
+//}
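
For context, the two configuration flags at the top of the class are read from plain JVM system properties (llama.VectorAPI and llama.ShowPerfInteractive, both defaulting to "true"), so before this change commented the class out they could be toggled at launch without recompiling. A minimal sketch, reusing the jar, class name, and CLI flags from the Javadoc above; the model path and property values are illustrative:

    java -Dllama.VectorAPI=false -Dllama.ShowPerfInteractive=false \
         --enable-preview --add-modules jdk.incubator.vector \
         -cp target/gpu-llama3-0.3.1.jar \
         org.beehive.gpullama3.cli.LlamaTornadoCli \
         -m model.gguf -p "Hello"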