From 4ccbfe43763bfd6965dab2e00f96b0be5c14c074 Mon Sep 17 00:00:00 2001 From: Xuejun Zhai Date: Thu, 4 Dec 2025 22:14:05 -0800 Subject: [PATCH] Fix error for decoder cache --- ggml/src/ggml-openvino/ggml-decoder.h | 2 +- ggml/src/ggml-openvino/utils.cpp | 6 ++++-- 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/ggml/src/ggml-openvino/ggml-decoder.h b/ggml/src/ggml-openvino/ggml-decoder.h index 1e51a7e1a8d..111eb7200b8 100644 --- a/ggml/src/ggml-openvino/ggml-decoder.h +++ b/ggml/src/ggml-openvino/ggml-decoder.h @@ -210,10 +210,10 @@ class GgmlOvDecoder : public ov::frontend::ggml::GgmlDecoder { static std::vector get_stride(const ggml_tensor * tensor); static ov::element::Type get_ov_type(const ggml_tensor * tensor); static std::string compute_op_type(const ggml_tensor * node); + void add_extra_inputs(); private: void set_input_output(ggml_tensor * node, bool naive = false); - void add_extra_inputs(); int compute_op_case(const ggml_tensor * node) const; void validate_cgraph() const; diff --git a/ggml/src/ggml-openvino/utils.cpp b/ggml/src/ggml-openvino/utils.cpp index 018199def58..935404136c4 100644 --- a/ggml/src/ggml-openvino/utils.cpp +++ b/ggml/src/ggml-openvino/utils.cpp @@ -102,8 +102,10 @@ enum ggml_status ov_graph_compute_dynamic(ggml_cgraph * cgraph, const std::strin if (cache_hit) { std::map> model_weights; - ggml_decoder = std::make_shared(cgraph, m_params, c_params, model_weights, is_static); - decoder_cache[key] = ggml_decoder; + ggml_decoder = decoder_cache[key]; + ggml_decoder->set_compute_params(c_params); + ggml_decoder->set_model_params(m_params); + ggml_decoder->add_extra_inputs(); infer_request = infer_request_cache[key]; decoder_end_time = ggml_time_us();