Skip to content

Commit 27a764b

Browse files
Move Qwen2Q8_0TornadoVMLayerPlanner to tornadovm package and weights to corresponding subpackages (fp16 & q8)
1 parent 851bb07 commit 27a764b

18 files changed

+20 -18 lines changed

src/main/java/org/beehive/gpullama3/inference/weights/tornado/FP16Weights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/fp16/FP16Weights.java

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.fp16;
 
 import org.beehive.gpullama3.core.model.GGMLType;
+import org.beehive.gpullama3.inference.weights.tornado.TornadoWeights;
 import uk.ac.manchester.tornado.api.types.arrays.FloatArray;
 import uk.ac.manchester.tornado.api.types.arrays.HalfFloatArray;
 

src/main/java/org/beehive/gpullama3/inference/weights/tornado/LlamaTornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/fp16/LlamaTornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.fp16;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Phi3TornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/fp16/Phi3TornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.fp16;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Qwen2TornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/fp16/Qwen2TornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.fp16;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Qwen3TornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/fp16/Qwen3TornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.fp16;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Phi3TornadoWeightsQ8_0.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/q8_0/Phi3TornadoWeightsQ8_0.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.q8_0;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import org.beehive.gpullama3.core.model.tensor.Q8_0QuantizedTensor;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Q8_0Weights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/q8_0/Q8_0Weights.java

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,8 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.q8_0;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import org.beehive.gpullama3.core.model.tensor.Q8_0QuantizedTensor;
+import org.beehive.gpullama3.inference.weights.tornado.TornadoWeights;
 import uk.ac.manchester.tornado.api.types.arrays.FloatArray;
 
 public class Q8_0Weights implements TornadoWeights {

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Qwen2TornadoWeightsQ8_0.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/q8_0/Qwen2TornadoWeightsQ8_0.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.q8_0;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import org.beehive.gpullama3.core.model.tensor.Q8_0QuantizedTensor;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Qwen3Q8_0TornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/q8_0/Qwen3Q8_0TornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-package org.beehive.gpullama3.inference.weights.tornado;
+package org.beehive.gpullama3.inference.weights.tornado.q8_0;
 
 import org.beehive.gpullama3.core.model.GGMLType;
 import org.beehive.gpullama3.core.model.tensor.Q8_0QuantizedTensor;

src/main/java/org/beehive/gpullama3/tornadovm/Phi3TornadoVMLayerPlanner.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
 
 import org.beehive.gpullama3.auxiliary.Tuple2;
 import org.beehive.gpullama3.inference.state.Phi3State;
-import org.beehive.gpullama3.inference.weights.tornado.Phi3TornadoWeights;
+import org.beehive.gpullama3.inference.weights.tornado.fp16.Phi3TornadoWeights;
 import org.beehive.gpullama3.model.Model;
 import org.beehive.gpullama3.model.phi3.Phi3Configuration;
 import uk.ac.manchester.tornado.api.GridScheduler;

0 commit comments

Comments (0)