From 1a19566b23b097a84f30ccd86319eca72e8bcff6 Mon Sep 17 00:00:00 2001
From: Cavus Mustafa
Date: Tue, 29 Jul 2025 21:37:57 -0700
Subject: [PATCH] add mark decomp pass

---
 ...decompression_convert_constant_folding.hpp | 36 +++++++++++++++++++
 .../openvino/translate_session.cpp            |  5 +++-
 2 files changed, 40 insertions(+), 1 deletion(-)
 create mode 100644 ggml/src/ggml-openvino/openvino/pass/mark_decompression_convert_constant_folding.hpp

diff --git a/ggml/src/ggml-openvino/openvino/pass/mark_decompression_convert_constant_folding.hpp b/ggml/src/ggml-openvino/openvino/pass/mark_decompression_convert_constant_folding.hpp
new file mode 100644
index 0000000000..163422bf33
--- /dev/null
+++ b/ggml/src/ggml-openvino/openvino/pass/mark_decompression_convert_constant_folding.hpp
@@ -0,0 +1,36 @@
+#pragma once
+
+#include "openvino/pass/matcher_pass.hpp"
+#include "openvino/core/visibility.hpp"
+
+// TRANSFORMATIONS_API is declared locally so this header carries its own
+// import/export decoration. The #ifndef guard keeps this definition from
+// clashing when the macro is already defined earlier in the translation unit.
+#ifndef TRANSFORMATIONS_API
+#    ifdef OPENVINO_STATIC_LIBRARY
+#        define TRANSFORMATIONS_API
+#    else
+#        ifdef IMPLEMENT_OPENVINO_API
+#            define TRANSFORMATIONS_API OPENVINO_CORE_EXPORTS
+#        else
+#            define TRANSFORMATIONS_API OPENVINO_CORE_IMPORTS
+#        endif  // IMPLEMENT_OPENVINO_API
+#    endif  // OPENVINO_STATIC_LIBRARY
+#endif  // TRANSFORMATIONS_API
+
+namespace ov {
+namespace pass {
+
+class TRANSFORMATIONS_API MarkCompressedFloatConstants;
+
+}  // namespace pass
+}  // namespace ov
+
+// Matcher pass declaration made visible to translate_session.cpp. Only the
+// constructor is declared; this header provides no definition, so it presumably
+// resolves against the OpenVINO library at link time (TODO confirm).
+class ov::pass::MarkCompressedFloatConstants : public MatcherPass {
+public:
+    OPENVINO_MATCHER_PASS_RTTI("MarkCompressedFloatConstants");
+    MarkCompressedFloatConstants();
+};
diff --git a/ggml/src/ggml-openvino/openvino/translate_session.cpp b/ggml/src/ggml-openvino/openvino/translate_session.cpp
index c4fe8c88ee..ed7db61414 100644
--- a/ggml/src/ggml-openvino/openvino/translate_session.cpp
+++ b/ggml/src/ggml-openvino/openvino/translate_session.cpp
@@ -28,6 +28,7 @@
 #include "ggml-openvino/openvino/utils.hpp"
 #include "input_model.hpp"
 #include "pass/fuse_to_sdpa.hpp"
+#include
"pass/mark_decompression_convert_constant_folding.hpp" namespace ov { namespace frontend { @@ -259,6 +260,8 @@ std::shared_ptr TranslateSession::apply_transformations(std::shared_ptr(); + manager.register_pass(); if (!ggml_model_decoder->is_static()) { const auto kv_param_res_names = ggml_model_decoder->get_kv_param_res_names(); @@ -267,7 +270,7 @@ std::shared_ptr TranslateSession::apply_transformations(std::shared_ptr(); + manager.register_pass(); manager.run_passes(model); } auto preprocessor = ov::preprocess::PrePostProcessor(model);