From 469325c6dab3ad5bb0feb4ea9074d36783983ba0 Mon Sep 17 00:00:00 2001 From: "Yu, Zijun" Date: Mon, 8 Dec 2025 16:17:40 +0800 Subject: [PATCH] GPU remove Q6_K requantization --- ggml/src/ggml-openvino/utils.cpp | 6 ------ 1 file changed, 6 deletions(-) diff --git a/ggml/src/ggml-openvino/utils.cpp b/ggml/src/ggml-openvino/utils.cpp index 1f94d4bad6..ad99447f30 100644 --- a/ggml/src/ggml-openvino/utils.cpp +++ b/ggml/src/ggml-openvino/utils.cpp @@ -422,12 +422,6 @@ std::map get_types_to_requant(const std::string & dev {GGML_TYPE_Q5_K, ExtraQuantType::F16 }, }; } - if (device == "GPU") { - return { - // gs16 will be supported on openvino-2025.4 - {GGML_TYPE_Q6_K, ExtraQuantType::Q8_0_32}, - }; - } return {}; }