diff --git a/cmake/onnxruntime_providers_openvino.cmake b/cmake/onnxruntime_providers_openvino.cmake index f149030c15702..03f67983c70ab 100644 --- a/cmake/onnxruntime_providers_openvino.cmake +++ b/cmake/onnxruntime_providers_openvino.cmake @@ -46,7 +46,7 @@ set_target_properties(onnxruntime_providers_openvino PROPERTIES FOLDER "ONNXRuntime") target_compile_options(onnxruntime_providers_openvino PRIVATE - $<$>:-DNOT_RELEASE> + $<$:-DRELEASE> ) if(NOT MSVC) diff --git a/onnxruntime/core/providers/openvino/backend_manager.cc b/onnxruntime/core/providers/openvino/backend_manager.cc index d758430f39108..13f09b9d9acdb 100644 --- a/onnxruntime/core/providers/openvino/backend_manager.cc +++ b/onnxruntime/core/providers/openvino/backend_manager.cc @@ -13,13 +13,13 @@ #include #include "core/providers/shared_library/provider_api.h" -#include "core/providers/openvino/ov_versions/capability.h" -#include "core/providers/openvino/contexts.h" #include "core/providers/openvino/backend_manager.h" -#include "core/providers/openvino/ibackend.h" #include "core/providers/openvino/backend_utils.h" -#include "core/providers/openvino/qdq_transformations/qdq_stripping.h" +#include "core/providers/openvino/contexts.h" +#include "core/providers/openvino/ibackend.h" #include "core/providers/openvino/ov_interface.h" +#include "core/providers/openvino/ov_versions/capability.h" +#include "core/providers/openvino/qdq_transformations/qdq_stripping.h" namespace onnxruntime { namespace openvino_ep { @@ -324,7 +324,7 @@ static bool IsQDQGraph(const onnxruntime::GraphViewer& graph_viewer) { static void DumpOpenVINOEPModel([[maybe_unused]] const std::filesystem::path& onnx_model_path_name, [[maybe_unused]] ONNX_NAMESPACE::ModelProto* model_proto, [[maybe_unused]] const onnxruntime::Node& fused_node) { -#ifdef NOT_RELEASE +#ifndef RELEASE if (openvino_ep::backend_utils::IsDebugEnabled()) { auto model_name = onnx_model_path_name.empty() ? "unknown.onnx" : onnx_model_path_name.filename(); @@ -384,7 +384,7 @@ BackendManager::GetModelProtoFromFusedNode(const onnxruntime::Node& fused_node, if (session_context_.device_type.find("NPU") != std::string::npos && (enable_ovep_qdq_optimizer || session_context_.so_share_ep_contexts)) { std::unique_ptr model; - Status status = CreateModelWithStrippedQDQNodes(subgraph, logger, session_context_.so_share_ep_contexts, model, shared_context_.shared_weights, enable_ovep_qdq_optimizer); + Status status = CreateModelWithStrippedQDQNodes(subgraph, logger, session_context_.so_share_ep_contexts, enable_ovep_qdq_optimizer, model, shared_context_.shared_weights); auto model_proto = model->ToProto(); model_proto->set_ir_version(ONNX_NAMESPACE::Version::IR_VERSION); print_model_proto_duration(); diff --git a/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.cc b/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.cc index c071db9c3a4fb..860cfb5713903 100644 --- a/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.cc +++ b/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.cc @@ -448,8 +448,8 @@ static bool HandleDoubleQDQ(onnxruntime::Graph& dst_graph, const onnxruntime::Gr static void AddStandaloneNodeUnit(onnxruntime::Graph& dst_graph, const onnxruntime::GraphViewer& src_graph, const NodeUnit& node_unit, std::set& initializers_to_keep, - const logging::Logger& /* logger */, - bool IsWeightSharingWithoutOVEPQDQStripping) { + bool IsWeightSharingWithoutOVEPQDQStripping, + const logging::Logger& /* logger */) { assert(node_unit.UnitType() == NodeUnit::Type::SingleNode); // this is the scenario where WAI is enabled and ovep stripping is disabled @@ -520,8 +520,8 @@ static void AddQDQNodeUnit(onnxruntime::Graph& dst_graph, const onnxruntime::GraphViewer& src_graph, const NodeUnit& node_unit, std::set& initializers_to_keep, - const logging::Logger& /* logger */, - bool IsWeightSharingWithoutOVEPQDQStripping) { + bool IsWeightSharingWithoutOVEPQDQStripping, + const logging::Logger& /* logger */) { assert(node_unit.UnitType() == NodeUnit::Type::QDQGroup); // Collect inputs coming into the node unit. @@ -684,9 +684,9 @@ static void AddInitializerAsInput(onnxruntime::Graph& dst_graph, Status CreateModelWithStrippedQDQNodes(const GraphViewer& src_graph, const logging::Logger& logger, bool enable_ovep_weight_sharing, + bool enable_ovep_qdq_optimizer, /*out*/ std::unique_ptr& model, - /*out*/ sw& shared_weights, - bool enable_ovep_qdq_optimizer) { + /*out*/ sw& shared_weights) { // NOTE: This function is a re-implementation of GraphViewerToProto() in core/graph/graph_proto_serializer.cc // with the following differences: // - Uses onnxruntime::Graph APIs instead of onnx::GraphProto APIs. @@ -780,9 +780,9 @@ Status CreateModelWithStrippedQDQNodes(const GraphViewer& src_graph, bool IsWeightSharingWithoutOVEPQDQStripping = enable_ovep_weight_sharing && !enable_ovep_qdq_optimizer; if (node_unit->UnitType() == NodeUnit::Type::SingleNode) { - AddStandaloneNodeUnit(dst_graph, src_graph, *node_unit, initializers_to_keep, logger, IsWeightSharingWithoutOVEPQDQStripping); + AddStandaloneNodeUnit(dst_graph, src_graph, *node_unit, initializers_to_keep, IsWeightSharingWithoutOVEPQDQStripping, logger); } else { - AddQDQNodeUnit(dst_graph, src_graph, *node_unit, initializers_to_keep, logger, IsWeightSharingWithoutOVEPQDQStripping); + AddQDQNodeUnit(dst_graph, src_graph, *node_unit, initializers_to_keep, IsWeightSharingWithoutOVEPQDQStripping, logger); } seen_node_units.insert(node_unit); diff --git a/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.h b/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.h index 4b5696f4411bd..53de0fd019311 100644 --- a/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.h +++ b/onnxruntime/core/providers/openvino/qdq_transformations/qdq_stripping.h @@ -16,9 +16,9 @@ using sw = SharedContext::SharedWeights; Status CreateModelWithStrippedQDQNodes(const GraphViewer& src_graph, const logging::Logger& logger, bool enable_ovep_weight_sharing, + bool enable_ovep_qdq_optimizer, /*out*/ std::unique_ptr& model, - /*out*/ sw& shared_weights, - bool enable_ovep_qdq_optimizer); + /*out*/ sw& shared_weights); bool dumpMetaDataMapToBinary(const sw::Metadata::Map& shared_weights, const std::string& filename); } // namespace openvino_ep