Always apply the EliminateZeroPoints pass to fix a GPU compile issue on some platforms
This commit is contained in:
parent
fdadca1e89
commit
973a80fd02
|
|
@ -80,6 +80,7 @@ EliminateZeroPoints::EliminateZeroPoints() {
|
||||||
|
|
||||||
std::shared_ptr<ov::op::v0::Constant> new_constant;
|
std::shared_ptr<ov::op::v0::Constant> new_constant;
|
||||||
|
|
||||||
|
// TODO improve performance
|
||||||
if (data_type == ov::element::u4) {
|
if (data_type == ov::element::u4) {
|
||||||
auto data_values = data_constant->cast_vector<uint8_t>();
|
auto data_values = data_constant->cast_vector<uint8_t>();
|
||||||
std::vector<int8_t> adjusted_values(total_elements);
|
std::vector<int8_t> adjusted_values(total_elements);
|
||||||
|
|
|
||||||
|
|
@ -233,9 +233,9 @@ std::shared_ptr<Model> TranslateSession::apply_transformations(std::shared_ptr<M
|
||||||
manager.register_pass<ov::pass::MakeStateful>(kv_param_res_pairs);
|
manager.register_pass<ov::pass::MakeStateful>(kv_param_res_pairs);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (ggml_model_decoder->is_static()) {
|
// if (ggml_model_decoder->is_static()) {
|
||||||
manager.register_pass<pass::EliminateZeroPoints>();
|
manager.register_pass<pass::EliminateZeroPoints>();
|
||||||
}
|
// }
|
||||||
manager.run_passes(model);
|
manager.run_passes(model);
|
||||||
}
|
}
|
||||||
return model;
|
return model;
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue