We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 2e91650, commit 5c7ec7a (Copy full SHA for 5c7ec7a)
1 file changed
compute/gpu_engine.go
@@ -484,8 +484,7 @@ func (e *GPUEngine[T]) UploadWeights(tensors []*tensor.TensorNumeric[float32]) e
484
if _, ok := any(t.GetStorage()).(*tensor.Q8Storage); ok {
485
continue
486
}
487
- // Skip Q4Storage — already uploaded as raw Q4 bytes by the Q4 handler
488
- // above (line ~272). Q4 GEMV reads quantized data directly (0.5 bytes/weight).
+ // Skip Q4_0: already uploaded as raw Q4 bytes by the Q4 handler above.
489
if _, ok := any(t.GetStorage()).(*tensor.Q4Storage); ok {
490
491
0 commit comments