GPU remove Q6_K requantization
This commit is contained in:
parent
28da9a9adc
commit
469325c6da
|
|
@ -422,12 +422,6 @@ std::map<ggml_type, ExtraQuantType> get_types_to_requant(const std::string & dev
|
|||
{GGML_TYPE_Q5_K, ExtraQuantType::F16 },
|
||||
};
|
||||
}
|
||||
if (device == "GPU") {
|
||||
return {
|
||||
// gs16 will be supported on openvino-2025.4
|
||||
{GGML_TYPE_Q6_K, ExtraQuantType::Q8_0_32},
|
||||
};
|
||||
}
|
||||
return {};
|
||||
}
|
||||
|
||||
|
|
|
|||
Loading…
Reference in New Issue