From 599335c63330787d4908e02c8d7e8093b63be298 Mon Sep 17 00:00:00 2001
From: Mustafa Cavus
Date: Tue, 13 Jan 2026 12:27:33 -0800
Subject: [PATCH] Update ggml/src/ggml-openvino/ggml-openvino-extra.cpp

---
 .../src/ggml-openvino/ggml-openvino-extra.cpp | 19 +++++++++----------
 1 file changed, 9 insertions(+), 10 deletions(-)

diff --git a/ggml/src/ggml-openvino/ggml-openvino-extra.cpp b/ggml/src/ggml-openvino/ggml-openvino-extra.cpp
index bc0362ee46..76871cc4be 100644
--- a/ggml/src/ggml-openvino/ggml-openvino-extra.cpp
+++ b/ggml/src/ggml-openvino/ggml-openvino-extra.cpp
@@ -268,34 +268,33 @@ ggml_openvino_extracted_layout ggml_openvino_get_extracted_layout(const ggml_ten
     }
 
     // Normal extraction (no requant) - determine format based on tensor type
+    layout.is_u4 = false;
+    layout.weights_per_block = 32;
+    layout.is_symmetric = false;
+
     switch (tensor->type) {
         case GGML_TYPE_Q4_0:
             layout.is_u4 = true;
-            layout.weights_per_block = 32;
             layout.is_symmetric = true;
             break;
+
         case GGML_TYPE_Q4_1:
-            layout.is_u4 = true;
-            layout.weights_per_block = 32;
-            break;
         case GGML_TYPE_Q4_K:
             layout.is_u4 = true;
-            layout.weights_per_block = 32;
             break;
+
         case GGML_TYPE_Q8_0:
-            layout.is_u4 = false;
-            layout.weights_per_block = 32;
             layout.is_symmetric = true;
             break;
+
         case GGML_TYPE_Q6_K:
-            layout.is_u4 = false;
             layout.weights_per_block = 16;
             layout.is_symmetric = true;
             break;
+
         case GGML_TYPE_Q5_K:
-            layout.is_u4 = false;
-            layout.weights_per_block = 32;
             break;
+
         default:
             // Unsupported quantization type
             return layout;