File tree Expand file tree Collapse file tree
src/main/java/org/beehive/gpullama3/tornadovm/layerplanner/model Expand file tree Collapse file tree Original file line number Diff line number Diff line change 1- package org .beehive .gpullama3 .tornadovm .layerplanner .quantization ;
1+ package org .beehive .gpullama3 .tornadovm .layerplanner .model . fp16 ;
22
33import org .beehive .gpullama3 .tensor .GGMLType ;
44import org .beehive .gpullama3 .inference .state .State ;
55import org .beehive .gpullama3 .inference .weights .tornado .TornadoWeights ;
66import org .beehive .gpullama3 .model .Configuration ;
77import org .beehive .gpullama3 .model .Model ;
8- import org .beehive .gpullama3 .tornadovm .layerplanner .base .QuantizedLayerPlanner ;
9- import org .beehive .gpullama3 .tornadovm .layers .AbstractFFNLayers ;
10- import org .beehive .gpullama3 .tornadovm .layers .Activation ;
11- import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LogitsFP16Layer ;
12- import uk .ac .manchester .tornado .api .GridScheduler ;
13- import uk .ac .manchester .tornado .api .ImmutableTaskGraph ;
14-
15- import java .util .ArrayList ;
16- import java .util .List ;
8+ import org .beehive .gpullama3 .tornadovm .layerplanner .QuantizedLayerPlanner ;
179
1810/**
1911 * Base for all FP16-quantized layer planners.
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .GraniteTornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .granite .GraniteConfiguration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .FP16LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .ActivationGranite ;
98import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .GraniteFP16FFNLayers ;
109import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LogitsGraniteFP16Layer ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .LlamaTornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .llama .LlamaConfiguration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .FP16LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .Activation ;
98import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LlamaFP16FFNLayers ;
109import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LogitsFP16Layer ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .LlamaTornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .mistral .MistralConfiguration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .FP16LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .Activation ;
98import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .MistralFP16FFNLayers ;
109import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LogitsFP16Layer ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .Phi3TornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .phi3 .Phi3Configuration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .FP16LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .Activation ;
98import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LogitsFP16Layer ;
109import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .Phi3FP16FFNLayers ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .Qwen2TornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .qwen2 .Qwen2Configuration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .FP16LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .Activation ;
98import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LogitsFP16Layer ;
109import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .Qwen2FP16FFNLayers ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .Qwen3TornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .qwen3 .Qwen3Configuration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .FP16LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .Activation ;
98import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .LogitsFP16Layer ;
109import org .beehive .gpullama3 .tornadovm .layers .type .fp16 .Qwen3FP16FFNLayers ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .GraniteTornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .granite .GraniteConfiguration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .Q8_0LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .ActivationGranite ;
98import org .beehive .gpullama3 .tornadovm .layers .type .q8_0 .GraniteQ8_0FFNLayers ;
109import org .beehive .gpullama3 .tornadovm .layers .type .q8_0 .LogitsGraniteQ8_0Layer ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .LlamaTornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .llama .LlamaConfiguration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .Q8_0LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .Activation ;
98import org .beehive .gpullama3 .tornadovm .layers .type .q8_0 .LlamaQ8_0FFNLayers ;
109import org .beehive .gpullama3 .tornadovm .layers .type .q8_0 .LogitsQ8_0Layer ;
Original file line number Diff line number Diff line change 44import org .beehive .gpullama3 .inference .weights .tornado .LlamaTornadoWeights ;
55import org .beehive .gpullama3 .model .Model ;
66import org .beehive .gpullama3 .model .mistral .MistralConfiguration ;
7- import org .beehive .gpullama3 .tornadovm .layerplanner .quantization .Q8_0LayerPlanner ;
87import org .beehive .gpullama3 .tornadovm .layers .Activation ;
98import org .beehive .gpullama3 .tornadovm .layers .type .q8_0 .MistralQ8_0FFNLayers ;
109import org .beehive .gpullama3 .tornadovm .layers .type .q8_0 .LogitsQ8_0Layer ;
You can’t perform that action at this time.
0 commit comments