Skip to content

Commit 3ead7e4

Browse files
committed
[WIP] refactoring
1 parent ba4abdc commit 3ead7e4

54 files changed

Lines changed: 910 additions & 820 deletions

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

src/main/java/org/beehive/gpullama3/LlamaApp.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,5 @@
11
package org.beehive.gpullama3;
22

3-
import org.beehive.gpullama3.aot.AOT;
43
import org.beehive.gpullama3.auxiliary.LastRunMetrics;
54
import org.beehive.gpullama3.inference.sampler.Sampler;
65
import org.beehive.gpullama3.model.Model;

src/main/java/org/beehive/gpullama3/aot/AOT.java

Lines changed: 0 additions & 85 deletions
This file was deleted.

src/main/java/org/beehive/gpullama3/inference/InferenceEngine.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,7 @@
55
import org.beehive.gpullama3.inference.state.State;
66
import org.beehive.gpullama3.model.Configuration;
77
import org.beehive.gpullama3.model.Model;
8-
import org.beehive.gpullama3.tokenizer.impl.Tokenizer;
8+
import org.beehive.gpullama3.tokenizer.Tokenizer;
99
import org.beehive.gpullama3.tornadovm.TornadoVMMasterPlan;
1010
import uk.ac.manchester.tornado.api.types.arrays.FloatArray;
1111

src/main/java/org/beehive/gpullama3/inference/weights/tornado/FP16Weights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/FP16Weights/FP16Weights.java

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,7 @@
1-
package org.beehive.gpullama3.inference.weights.tornado;
1+
package org.beehive.gpullama3.inference.weights.tornado.FP16Weights;
22

33
import org.beehive.gpullama3.core.model.GGMLType;
4+
import org.beehive.gpullama3.inference.weights.tornado.TornadoWeights;
45
import uk.ac.manchester.tornado.api.types.arrays.FloatArray;
56
import uk.ac.manchester.tornado.api.types.arrays.HalfFloatArray;
67

src/main/java/org/beehive/gpullama3/inference/weights/tornado/LlamaTornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/FP16Weights/LlamaTornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
package org.beehive.gpullama3.inference.weights.tornado;
1+
package org.beehive.gpullama3.inference.weights.tornado.FP16Weights;
22

33
import org.beehive.gpullama3.core.model.GGMLType;
44
import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Phi3TornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/FP16Weights/Phi3TornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
package org.beehive.gpullama3.inference.weights.tornado;
1+
package org.beehive.gpullama3.inference.weights.tornado.FP16Weights;
22

33
import org.beehive.gpullama3.core.model.GGMLType;
44
import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Qwen2TornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/FP16Weights/Qwen2TornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
package org.beehive.gpullama3.inference.weights.tornado;
1+
package org.beehive.gpullama3.inference.weights.tornado.FP16Weights;
22

33
import org.beehive.gpullama3.core.model.GGMLType;
44
import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Qwen3TornadoWeights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/FP16Weights/Qwen3TornadoWeights.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
package org.beehive.gpullama3.inference.weights.tornado;
1+
package org.beehive.gpullama3.inference.weights.tornado.FP16Weights;
22

33
import org.beehive.gpullama3.core.model.GGMLType;
44
import uk.ac.manchester.tornado.api.types.arrays.FloatArray;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Phi3TornadoWeightsQ8_0.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/Q8_0Weights/Phi3TornadoWeightsQ8_0.java

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
package org.beehive.gpullama3.inference.weights.tornado;
1+
package org.beehive.gpullama3.inference.weights.tornado.Q8_0Weights;
22

33
import org.beehive.gpullama3.core.model.GGMLType;
44
import org.beehive.gpullama3.core.model.tensor.Q8_0QuantizedTensor;

src/main/java/org/beehive/gpullama3/inference/weights/tornado/Q8_0Weights.java renamed to src/main/java/org/beehive/gpullama3/inference/weights/tornado/Q8_0Weights/Q8_0Weights.java

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,8 @@
1-
package org.beehive.gpullama3.inference.weights.tornado;
1+
package org.beehive.gpullama3.inference.weights.tornado.Q8_0Weights;
22

33
import org.beehive.gpullama3.core.model.GGMLType;
44
import org.beehive.gpullama3.core.model.tensor.Q8_0QuantizedTensor;
5+
import org.beehive.gpullama3.inference.weights.tornado.TornadoWeights;
56
import uk.ac.manchester.tornado.api.types.arrays.FloatArray;
67

78
public class Q8_0Weights implements TornadoWeights {

0 commit comments

Comments
 (0)