Reformat TornadoVMMasterPlan by re-organizing line breaks, updating parameter annotations, and consolidating documentation for improved readability and consistency.
src/main/java/com/example/tornadovm/TornadoVMMasterPlan.java
29 additions, 34 deletions
@@ -39,14 +39,13 @@ public TornadoVMMasterPlan(State state, Model model) {
     }

     /**
-     * Initializes the TornadoVM plan for GPU acceleration with optional timing.
-     * This method handles:
-     * 1. Creation of the TornadoVM master plan
-     * 2. Warming up the JIT compiler for better performance
-     * 3. Copying read-only model weights to the GPU
+     * Initializes the TornadoVM plan for GPU acceleration with optional timing. This method handles: 1. Creation of the TornadoVM master plan 2. Warming up the JIT compiler for better performance 3.
+     * Copying read-only model weights to the GPU
      *
-     * @param state The model state containing KV cache
-     * @param model The Llama model instance
+     * @param state
+     *            The model state containing KV cache
+     * @param model
+     *            The Llama model instance
      * @return The initialized TornadoVMMasterPlan ready for inference
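For orientation, here is a minimal usage sketch of the initialization step documented above. Only the (state, model) parameters and the TornadoVMMasterPlan return type are fixed by the Javadoc; the factory method name is an assumption made for illustration.

    // Hypothetical call site: build the plan once before decoding starts.
    // initializeTornadoVMPlan is an assumed name; the Javadoc only fixes the
    // parameters and the return type.
    TornadoVMMasterPlan plan = TornadoVMMasterPlan.initializeTornadoVMPlan(state, model);
    // After this call the JIT-compiled kernels are warmed up and the read-only
    // model weights already reside on the GPU.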
@@ … @@ case UNKNOWN -> throw new UnsupportedOperationException("Unknown model type");
-        };
-    }
-
-    /**
-     * Determines whether the NVIDIA-specific scheduler should be used based on the current
-     * hardware backend and the model type.
+     * Determines whether the NVIDIA-specific scheduler should be used based on the current hardware backend and the model type.
      * <p>
-     * The scheduler is used only if the runtime is targeting an NVIDIA backend and the model
-     * is not of type {@code MISTRAL}. If either the hardware is not NVIDIA or the model is
-     * {@code MISTRAL}, the NVIDIA-specific scheduler should not be used.
+     * The scheduler is used only if the runtime is targeting an NVIDIA backend and the model is not of type {@code MISTRAL}. If either the hardware is not NVIDIA or the model is {@code MISTRAL}, the
+     * NVIDIA-specific scheduler should not be used.
      *
-     * @param model the model whose type may affect the scheduler decision
+     * @param model
+     *            the model whose type may affect the scheduler decision
      * @return {@code true} if the NVIDIA-specific scheduler should be used; {@code false} otherwise
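The decision described in this Javadoc reduces to a single conjunction. A minimal sketch, assuming a hypothetical isNvidiaBackend() helper and a getModelType() accessor; the diff confirms only the method signature and the rule itself:

    public static boolean shouldUseNvidiaScheduler(Model model) {
        // How the active backend is detected is an assumption; the diff does not
        // show the TornadoVM runtime call used for this check.
        boolean nvidiaBackend = isNvidiaBackend();
        // Even on NVIDIA hardware, the NVIDIA-specific scheduler is skipped for MISTRAL.
        return nvidiaBackend && model.getModelType() != ModelType.MISTRAL;
    }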
@@ … @@ case UNKNOWN -> throw new UnsupportedOperationException("Unknown model type");
+        };
+    }
+
+    /**
+     * Executes the forward pass of a LLaMA transformer model using TornadoVM acceleration. This method processes the transformer layers in sequence for a particular token position in the context
      * window.
      *
      * <p>The execution happens in three phases:
@@ -140,7 +137,6 @@ public static boolean shouldUseNvidiaScheduler(Model model) {
      * <li>Final projection to logits using TornadoVM</li>
      * </ol>
      *
-     *
      * @param position
      *            The current position in the sequence being processed
      * @return FloatTensor containing the output logits for token prediction
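A hedged sketch of how this forward pass is typically driven from a decode loop. The int position parameter and the FloatTensor return value come from the Javadoc; the method name tornadoForward, the sampler, and the stop-token check are assumptions for illustration:

    // Hypothetical decode loop: one accelerated forward pass per context position.
    for (int position = startPosition; position < maxTokens; position++) {
        FloatTensor logits = plan.tornadoForward(position); // method name assumed
        int nextToken = sampler.sampleToken(logits);         // sampler is hypothetical
        if (nextToken == stopTokenId) {                      // stop id is hypothetical
            break;
        }
        // the sampled token becomes the model input for the next position
    }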
@@ -183,7 +179,9 @@ private int getPreprocessingGraphIndex() {

     /**
      * Returns the graph index for the given transformer layer.
-     * @param layerIndex Index of the transformer layer (0-based)
+     *
+     * @param layerIndex
+     *            Index of the transformer layer (0-based)
      */
     private int getLayerGraphIndex(int layerIndex) {
         return 1 + layerIndex;
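The offset of one encodes the overall task-graph layout: graph 0 holds preprocessing, graphs 1..N hold the N transformer layers, and the last entry produces the final logits (taskGraphs.size() - 1, as the next hunk shows). A quick illustration for a hypothetical 32-layer model; the value returned by getPreprocessingGraphIndex() is inferred from its name and not shown in the diff:

    // Hypothetical 32-layer model, so taskGraphs.size() == 34
    // getPreprocessingGraphIndex() -> 0   (assumed from the method name)
    // getLayerGraphIndex(0)        -> 1
    // getLayerGraphIndex(31)       -> 32
    // getFinalLogitsGraphIndex()   -> 33  (taskGraphs.size() - 1)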
@@ -196,8 +194,7 @@ private int getFinalLogitsGraphIndex() {
         return taskGraphs.size() - 1;
     }

-    /// Execute the forward pass of the LLaMA transformer model using TornadoVM acceleration
-    /// just once to copy the data into the read-only data layer.
+    /// Execute the forward pass of the LLaMA transformer model using TornadoVM acceleration just once to copy the data into the read-only data layer.
     public void forceCopyInReadOnlyDataLayered() {
         // Execute all TornadoVM graphs
         state.wrapX.init(0.0f);
@@ -216,9 +213,7 @@ public void forceCopyInReadOnlyDataLayered() {
     }

     /**
-     * Frees the device memory allocated for the TornadoVM execution plan.
-     * This method should be called when the execution plan is no longer needed
-     * to release resources and avoid memory leaks.
+     * Frees the device memory allocated for the TornadoVM execution plan. This method should be called when the execution plan is no longer needed to release resources and avoid memory leaks.
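Taken together, the documented methods imply the following plan lifecycle. In this sketch only TornadoVMMasterPlan and forceCopyInReadOnlyDataLayered are names confirmed by the diff; initializeTornadoVMPlan and freeTornadoExecutionPlan are assumptions used for illustration:

    // 1. Build the plan: warms up the JIT compiler and copies read-only weights to the GPU.
    TornadoVMMasterPlan plan = TornadoVMMasterPlan.initializeTornadoVMPlan(state, model); // name assumed
    // 2. Optionally run every graph once so the read-only data layer is populated up front.
    plan.forceCopyInReadOnlyDataLayered();
    // 3. ... per-token forward passes during inference ...
    // 4. Release device memory once the plan is no longer needed.
    plan.freeTornadoExecutionPlan(); // name assumed; the Javadoc only requires that device memory be freed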