File tree Expand file tree Collapse file tree 2 files changed +4
-3
lines changed
ggml/src/ggml-openvino/openvino Expand file tree Collapse file tree 2 files changed +4
-3
lines changed Original file line number Diff line number Diff line change @@ -19,6 +19,7 @@ namespace ggml {
1919namespace pass {
2020
2121FuseToSDPA::FuseToSDPA () {
22+ // Not maintained since FLASH_ATTN_EXT has replaced this pattern
2223 const auto m_k = ov::pass::pattern::any_input ();
2324 const auto m_q = ov::pass::pattern::any_input ();
2425 const auto m_qk = ov::pass::pattern::wrap_type<ov::op::v0::MatMul>({m_q, m_k});
Original file line number Diff line number Diff line change 2727#include " ggml-openvino/openvino/utils.hpp"
2828#include " input_model.hpp"
2929#include " pass/eliminate_zp.hpp"
30- #include " pass/fuse_to_sdpa.hpp"
3130#include " pass/mark_decompression_convert_constant_folding.hpp"
3231
3332namespace ov {
@@ -220,8 +219,9 @@ std::shared_ptr<Model> TranslateSession::apply_transformations(std::shared_ptr<M
220219 manager.register_pass <ov::pass::MakeStateful>(kv_param_res_pairs);
221220 }
222221
223- manager.register_pass <pass::EliminateZeroPoints>();
224- manager.register_pass <pass::FuseToSDPA>();
222+ if (ggml_model_decoder->is_static ()) {
223+ manager.register_pass <pass::EliminateZeroPoints>();
224+ }
225225 manager.run_passes (model);
226226 }
227227 return model;
You can’t perform that action at this time.
0 commit comments