Skip to content

Commit 5708bda

Browse files
committed
support GQA
1 parent 2d82713 commit 5708bda

File tree

2 files changed

+2
-0
lines changed

2 files changed

+2
-0
lines changed

onnxruntime/core/providers/openvino/backends/basic_backend.h

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -57,6 +57,7 @@ struct OnnxToOvNetworkBindings {
57 | 57 |   "beam_idx",
58 | 58 |   "past_key_values",
59 | 59 |   "present",
   | 60 | + "total_seq_len",
60 | 61 |   };
61 | 62 |
62 | 63 |   OnnxToOvNetworkBindings(OVExeNetwork& exec_network, SubGraphContext& subgraph_context, SessionContext& session_context) {

onnxruntime/core/providers/openvino/ov_versions/data_ops.cc

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -96,6 +96,7 @@ std::vector<SupportedOp> supported_op_mode = {
 96 |  96 |   {"Atanh", V_2020_4, {"CPU"}},
 97 |  97 |   {"Atanh", V_2022_1, {"GPU"}},
 98 |  98 |   {"Attention", V_2023_0, {"CPU", "GPU"}},
    |  99 | + {"GroupQueryAttention", V_2025_1, {"CPU", "GPU"}},
 99 | 100 |   {"AveragePool", V_2020_4, {"CPU", "GPU"}},
100 | 101 |   {"BatchNormalization", V_2020_4, {"CPU", "GPU"}},
101 | 102 |   {"BiasGelu", V_2023_0, {"CPU", "GPU"}},

0 commit comments

Comments (0)