Finalize review comments

orionpapadakis · orionpapadakis · commit 16f5114b23bc · 2025-07-31T16:36:31.000+03:00
diff --git a/src/main/java/com/example/model/Configuration.java b/src/main/java/com/example/model/Configuration.java
@@ -34,7 +34,6 @@ public interface Configuration {
     /** Base value for RoPE (Rotary Position Embedding) calculations */
     float ropeTheta();
 
-    /** Size of each attention head (derived from dim / numberOfHeads) */
     int headSize();
 
     int kvDim();
diff --git a/src/main/java/com/example/model/llama/LlamaConfiguration.java b/src/main/java/com/example/model/llama/LlamaConfiguration.java
@@ -15,6 +15,7 @@ public int contextLengthModel() {
         throw new UnsupportedOperationException("Not supported for Llama.");
     }
 
+    /** Size of each attention head (derived from dim / numberOfHeads) */
     public int headSize() {
         return dim / numberOfHeads;
     }
diff --git a/src/main/java/com/example/model/loader/ModelLoader.java b/src/main/java/com/example/model/loader/ModelLoader.java
@@ -38,9 +38,9 @@ public abstract class ModelLoader {
     private static final String TOKENIZER_MISTRAL_MODEL = "llama";
 
     protected FileChannel fileChannel;
-    GGUF gguf;
-    int contextLength;
-    boolean loadWeights;
+    protected GGUF gguf;
+    protected int contextLength;
+    protected boolean loadWeights;
 
     public ModelLoader(FileChannel fileChannel, GGUF gguf, int contextLength, boolean loadWeights) {
         this.fileChannel = fileChannel;
diff --git a/src/main/java/com/example/tornadovm/Qwen3TornadoVMLayerPlanner.java b/src/main/java/com/example/tornadovm/Qwen3TornadoVMLayerPlanner.java
@@ -18,14 +18,13 @@
 
 public class Qwen3TornadoVMLayerPlanner extends TornadoVMLayerPlanner<Qwen3State, Qwen3Configuration, Qwen3TornadoWeights> {
 
-    int nHeadKv;
-    int nEmbdHeadK;
-    int nEmbdHeadV;
-    int nEmbdVGqa;
-    int nEmbdHead;
-    int nEmbdGqa;
-    int gqa;
-    float sqrtHeadSize;
+    private final int nHeadKv;
+    private final int nEmbdHeadK;
+    private final int nEmbdHeadV;
+    private final int nEmbdVGqa;
+    private final int nEmbdHead;
+    private final int nEmbdGqa;
+    private final int gqa;
 
     public Qwen3TornadoVMLayerPlanner(Qwen3State state, Model model) {
         super(state, model);
@@ -37,7 +36,6 @@ public Qwen3TornadoVMLayerPlanner(Qwen3State state, Model model) {
         this.nEmbdHead = nEmbdHeadV;
         this.nEmbdGqa = nEmbdVGqa;
         this.gqa = config.numberOfHeads() / config.numberOfKeyValueHeads(); // integer multiplier of the kv sharing in multiquery
-        this.sqrtHeadSize = (float) Math.sqrt(nEmbdHead);
     }
 
     // @formatter:off

Original file line number	Diff line number	Diff line change
`@@ -15,6 +15,7 @@ public int contextLengthModel() {`
`15`	`15`	`throw new UnsupportedOperationException("Not supported for Llama.");`
`16`	`16`	`}`
`17`	`17`
	`18`	`+ /** Size of each attention head (derived from dim / numberOfHeads) */`
`18`	`19`	`public int headSize() {`
`19`	`20`	`return dim / numberOfHeads;`
`20`	`21`	`}`