Skip to content

Commit a26f2a9

Browse files
[refactor] Move FP16LayerPlanner and Q8_0LayerPlanner to quantized-specific subpackages
1 parent 170db11 commit a26f2a9

14 files changed

Lines changed: 4 additions & 32 deletions

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/quantization/FP16LayerPlanner.java renamed to src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/fp16/FP16LayerPlanner.java

Lines changed: 2 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -1,19 +1,11 @@
1-
package org.beehive.gpullama3.tornadovm.layerplanner.quantization;
1+
package org.beehive.gpullama3.tornadovm.layerplanner.model.fp16;
22

33
import org.beehive.gpullama3.tensor.GGMLType;
44
import org.beehive.gpullama3.inference.state.State;
55
import org.beehive.gpullama3.inference.weights.tornado.TornadoWeights;
66
import org.beehive.gpullama3.model.Configuration;
77
import org.beehive.gpullama3.model.Model;
8-
import org.beehive.gpullama3.tornadovm.layerplanner.base.QuantizedLayerPlanner;
9-
import org.beehive.gpullama3.tornadovm.layers.AbstractFFNLayers;
10-
import org.beehive.gpullama3.tornadovm.layers.Activation;
11-
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LogitsFP16Layer;
12-
import uk.ac.manchester.tornado.api.GridScheduler;
13-
import uk.ac.manchester.tornado.api.ImmutableTaskGraph;
14-
15-
import java.util.ArrayList;
16-
import java.util.List;
8+
import org.beehive.gpullama3.tornadovm.layerplanner.QuantizedLayerPlanner;
17 9

18 10
/**
19 11
* Base for all FP16-quantized layer planners.

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/fp16/GraniteFP16LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.GraniteTornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.granite.GraniteConfiguration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.FP16LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.ActivationGranite;
98
import org.beehive.gpullama3.tornadovm.layers.type.fp16.GraniteFP16FFNLayers;
109
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LogitsGraniteFP16Layer;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/fp16/LlamaFP16LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.LlamaTornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.llama.LlamaConfiguration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.FP16LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.Activation;
98
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LlamaFP16FFNLayers;
109
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LogitsFP16Layer;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/fp16/MistralFP16LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.LlamaTornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.mistral.MistralConfiguration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.FP16LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.Activation;
98
import org.beehive.gpullama3.tornadovm.layers.type.fp16.MistralFP16FFNLayers;
109
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LogitsFP16Layer;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/fp16/Phi3FP16LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.Phi3TornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.phi3.Phi3Configuration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.FP16LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.Activation;
98
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LogitsFP16Layer;
109
import org.beehive.gpullama3.tornadovm.layers.type.fp16.Phi3FP16FFNLayers;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/fp16/Qwen2FP16LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.Qwen2TornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.qwen2.Qwen2Configuration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.FP16LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.Activation;
98
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LogitsFP16Layer;
109
import org.beehive.gpullama3.tornadovm.layers.type.fp16.Qwen2FP16FFNLayers;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/fp16/Qwen3FP16LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.Qwen3TornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.qwen3.Qwen3Configuration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.FP16LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.Activation;
98
import org.beehive.gpullama3.tornadovm.layers.type.fp16.LogitsFP16Layer;
109
import org.beehive.gpullama3.tornadovm.layers.type.fp16.Qwen3FP16FFNLayers;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/q8_0/GraniteQ8_0LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.GraniteTornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.granite.GraniteConfiguration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.Q8_0LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.ActivationGranite;
98
import org.beehive.gpullama3.tornadovm.layers.type.q8_0.GraniteQ8_0FFNLayers;
109
import org.beehive.gpullama3.tornadovm.layers.type.q8_0.LogitsGraniteQ8_0Layer;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/q8_0/LlamaQ8_0LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.LlamaTornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.llama.LlamaConfiguration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.Q8_0LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.Activation;
98
import org.beehive.gpullama3.tornadovm.layers.type.q8_0.LlamaQ8_0FFNLayers;
109
import org.beehive.gpullama3.tornadovm.layers.type.q8_0.LogitsQ8_0Layer;

src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model/q8_0/MistralQ8_0LayerPlanner.java

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,6 @@
44
import org.beehive.gpullama3.inference.weights.tornado.LlamaTornadoWeights;
55
import org.beehive.gpullama3.model.Model;
66
import org.beehive.gpullama3.model.mistral.MistralConfiguration;
7-
import org.beehive.gpullama3.tornadovm.layerplanner.quantization.Q8_0LayerPlanner;
87
import org.beehive.gpullama3.tornadovm.layers.Activation;
98
import org.beehive.gpullama3.tornadovm.layers.type.q8_0.MistralQ8_0FFNLayers;
109
import org.beehive.gpullama3.tornadovm.layers.type.q8_0.LogitsQ8_0Layer;

0 commit comments

Comments
 (0)