Add GGML_OV_FRONTEND option. Add readme.

2024-11-23 06:03:08 +08:00 · 2024-11-23 06:03:08 +08:00 · 31bd816426
parent 9b7b63d12c
commit 31bd816426
2 changed files with 0 additions and 114 deletions
--- a/ggml/src/ggml-openvino/ggml-ov-frontend-utils.cpp
+++ b/ggml/src/ggml-openvino/ggml-ov-frontend-utils.cpp
@ -1,108 +0,0 @@
-#include "ggml-ov-frontend-utils.h"
-#include "ggml-backend-impl.h"
-#include <openvino/frontend/manager.hpp>
-#include <openvino/openvino.hpp>
-
-using ov::frontend::tensorflow::ggml::GgmlOvGraphIterator;
-
-std::shared_ptr<GgmlOvGraphIterator> get_ggml_graph_iterator(struct ggml_cgraph * cgraph) {
-    return std::make_shared<GgmlOvGraphIterator>(cgraph);
-}
-
-std::vector<ov::Tensor> get_ggml_graph_input_tensors(std::shared_ptr<GgmlOvGraphIterator> ggml_graph_iterator) {
-    std::vector<ov::Tensor> input_tensors;
-    auto input_names = ggml_graph_iterator->get_input_names();
-    ggml_graph_iterator->reset();
-    for (; !ggml_graph_iterator->is_end(); ggml_graph_iterator->next()) {
-        auto decoder = std::dynamic_pointer_cast<GgmlOvDecoder>(ggml_graph_iterator->get_decoder()); 
-        for (size_t inp = 0; inp < decoder->get_input_size(); ++inp) {
-            if (std::find(input_names.begin(), input_names.end(), decoder->get_input_name(inp)) != input_names.end()) {
-                auto input_data = decoder->get_input_ggml_tensor(inp)->data;
-                ov::Tensor input_tensor = ov::Tensor(decoder->get_input_type(inp), decoder->get_input_shape(inp).to_shape(), input_data);
-                input_tensors.push_back(input_tensor);
-            }
-        }
-    }
-    return input_tensors;
-}
-
-static ov::frontend::FrontEnd::Ptr get_ggml_frontend() {
-    ov::frontend::FrontEnd::Ptr front_end = nullptr;
-    auto fem = ov::frontend::FrontEndManager();
-    // std::string fe_so_path = "/home/yumeng/Code/test/openvino/bin/intel64/Release/libopenvino_ggml_frontend.so";
-    std::string fe_so_path = "/home/yumeng/Code/ov-ggml-frontend/openvino/bin/intel64/Release/libopenvino_ggml_frontend.so";
-    fem.register_front_end("ggml", fe_so_path);
-    front_end = fem.load_by_framework("ggml");
-    return front_end;
-}
-
-enum ggml_status openvino_frontend_compute (ggml_backend_t backend, struct ggml_cgraph * cgraph) {
-    ov::Core core;
-    auto devices = core.get_available_devices();
-    #ifdef GGML_OPENVINO_DEBUG
-        GGML_LOG_INFO("Device numbers: %d\n", devices.size());
-    #endif
-    // Get GGML Frontend 
-    auto front_end = get_ggml_frontend();
-    if (!front_end) {
-        GGML_LOG_ERROR("GGML FrontEnd is not initialized \n");
-        return GGML_STATUS_FAILED;
-    } else {
-        #ifdef GGML_OPENVINO_DEBUG
-            GGML_LOG_INFO("GGML FrontEnd is initialized \n");
-        #endif
-    }
-
-    auto ggml_graph_iterator = get_ggml_graph_iterator(cgraph);
-    std::shared_ptr<ov::frontend::tensorflow::GraphIterator> graph_iterator = ggml_graph_iterator;
-    
-    // Load GraphIterator -> InputModel
-    ov::frontend::InputModel::Ptr input_model = front_end->load(graph_iterator);
-    if (!input_model) {
-        GGML_LOG_ERROR("Input Model is not loaded \n");
-        return GGML_STATUS_FAILED;
-    } else {
-        #ifdef GGML_OPENVINO_DEBUG
-            GGML_LOG_INFO("Input Model loaded \n");
-        #endif
-    }
-
-    // TODO: Convert InputModel -> ov::Model 
-    std::shared_ptr<ov::Model> model = front_end->convert(input_model);
-    if (!model) {
-        GGML_LOG_ERROR("Model is not converted \n");
-    } else {
-        #ifdef GGML_OPENVINO_DEBUG
-            GGML_LOG_INFO("Model converted \n");
-        #endif
-    }
-
-
-    //  Loading a model to the device
-    ov::CompiledModel compiled_model = core.compile_model(model);
-
-    // Create infer request
-    ov::InferRequest infer_request = compiled_model.create_infer_request();
-
-    // Get input tensor
-    auto input_tensor = get_ggml_graph_input_tensors(ggml_graph_iterator);
-
-    // Set input tensor
-    for (size_t i = 0; i < input_tensor.size(); i++) {
-        infer_request.set_input_tensor(i, input_tensor[i]);
-    }
-
-    infer_request.infer();
-
-    ov::Tensor output_tensor = infer_request.get_output_tensor();
-    // Put data in output tensor to the last node -> data in cgraph
-    // Get output type
-    ggml_tensor* dst = cgraph->nodes[cgraph->n_nodes - 1];
-    std::memcpy(dst->data, output_tensor.data(), output_tensor.get_byte_size());
-    #ifdef GGML_OPENVINO_DEBUG
-        GGML_LOG_INFO("%f\n", *output_tensor.data<float>());
-    #endif
-    
-    return GGML_STATUS_SUCCESS;
-    GGML_UNUSED(backend);
-}
--- a/ggml/src/ggml-openvino/ggml-ov-frontend-utils.h
+++ b/ggml/src/ggml-openvino/ggml-ov-frontend-utils.h
@ -1,6 +0,0 @@
-#include "ggml-graph-iterator.h"
-#include "ggml-backend-impl.h"
-
-std::shared_ptr<ov::frontend::tensorflow::ggml::GgmlOvGraphIterator> get_ggml_graph_iterator(struct ggml_cgraph * cgraph);
-
-enum ggml_status openvino_frontend_compute (ggml_backend_t backend, struct ggml_cgraph * cgraph);