Skip to content

Commit

Permalink
support Qnn 2 28 (microsoft#22724)
Browse files Browse the repository at this point in the history
### Description
support Qnn 2.28
update default qnn vesion to 2.28 in build pipeline
  • Loading branch information
HectorSVC authored and ankitm3k committed Dec 11, 2024
1 parent 685f5a5 commit d00a2fa
Show file tree
Hide file tree
Showing 19 changed files with 77 additions and 40 deletions.
11 changes: 8 additions & 3 deletions onnxruntime/core/providers/qnn/builder/qnn_backend_manager.cc
Original file line number Diff line number Diff line change
Expand Up @@ -641,12 +641,17 @@ Status QnnBackendManager::LoadCachedQnnContextFromBuffer(char* buffer, uint64_t
ORT_RETURN_IF(nullptr == binary_info, "Qnn cached binary info is nullptr.");
uint32_t graph_count = 0;
QnnSystemContext_GraphInfo_t* graphs_info = nullptr;
if (binary_info->version == QNN_SYSTEM_CONTEXT_BINARY_INFO_VERSION_1) {
graph_count = binary_info->contextBinaryInfoV1.numGraphs;
graphs_info = binary_info->contextBinaryInfoV1.graphs;
if (binary_info->version == QNN_SYSTEM_CONTEXT_BINARY_INFO_VERSION_3) {
graph_count = binary_info->contextBinaryInfoV3.numGraphs;
graphs_info = binary_info->contextBinaryInfoV3.graphs;
} else if (binary_info->version == QNN_SYSTEM_CONTEXT_BINARY_INFO_VERSION_2) {
graph_count = binary_info->contextBinaryInfoV2.numGraphs;
graphs_info = binary_info->contextBinaryInfoV2.graphs;
} else if (binary_info->version == QNN_SYSTEM_CONTEXT_BINARY_INFO_VERSION_1) {
graph_count = binary_info->contextBinaryInfoV1.numGraphs;
graphs_info = binary_info->contextBinaryInfoV1.graphs;
} else {
return ORT_MAKE_STATUS(ONNXRUNTIME, FAIL, "Unsupported context binary info version.");
}

ORT_RETURN_IF(graph_count < 1 || graphs_info == nullptr, "Failed to get graph info from Qnn cached context.");
Expand Down
61 changes: 41 additions & 20 deletions onnxruntime/core/providers/qnn/builder/qnn_model.cc
Original file line number Diff line number Diff line change
Expand Up @@ -321,29 +321,50 @@ Status QnnModel::DeserializeGraphInfoFromBinaryInfo(const QnnSystemContext_Graph
std::vector<QnnTensorWrapper> output_tensor_wrappers;

std::string graph_name;
if (qnn_sys_ctx_graph_info.version == QNN_SYSTEM_CONTEXT_GRAPH_INFO_VERSION_1) {
Qnn_Tensor_t* input_tensors = nullptr;
Qnn_Tensor_t* output_tensors = nullptr;
uint32_t graph_input_num = 0;
uint32_t graph_output_num = 0;
if (qnn_sys_ctx_graph_info.version == QNN_SYSTEM_CONTEXT_GRAPH_INFO_VERSION_3) {
graph_name.assign(qnn_sys_ctx_graph_info.graphInfoV3.graphName);
graph_input_num = qnn_sys_ctx_graph_info.graphInfoV3.numGraphInputs;
graph_output_num = qnn_sys_ctx_graph_info.graphInfoV3.numGraphOutputs;

input_tensors = qnn_sys_ctx_graph_info.graphInfoV3.graphInputs;
output_tensors = qnn_sys_ctx_graph_info.graphInfoV3.graphOutputs;
} else if (qnn_sys_ctx_graph_info.version == QNN_SYSTEM_CONTEXT_GRAPH_INFO_VERSION_2) {
graph_name.assign(qnn_sys_ctx_graph_info.graphInfoV2.graphName);
graph_input_num = qnn_sys_ctx_graph_info.graphInfoV2.numGraphInputs;
graph_output_num = qnn_sys_ctx_graph_info.graphInfoV2.numGraphOutputs;

input_tensors = qnn_sys_ctx_graph_info.graphInfoV2.graphInputs;
output_tensors = qnn_sys_ctx_graph_info.graphInfoV2.graphOutputs;
} else if (qnn_sys_ctx_graph_info.version == QNN_SYSTEM_CONTEXT_GRAPH_INFO_VERSION_1) {
graph_name.assign(qnn_sys_ctx_graph_info.graphInfoV1.graphName);
auto graph_input_num = qnn_sys_ctx_graph_info.graphInfoV1.numGraphInputs;
auto graph_output_num = qnn_sys_ctx_graph_info.graphInfoV1.numGraphOutputs;
ORT_RETURN_IF(nullptr == qnn_sys_ctx_graph_info.graphInfoV1.graphInputs, "Graph from cached context doesn't have any inputs.");
ORT_RETURN_IF(nullptr == qnn_sys_ctx_graph_info.graphInfoV1.graphOutputs, "Graph from cached context doesn't have any outputs.");

// Copy graph input
Qnn_Tensor_t* input_tensors = qnn_sys_ctx_graph_info.graphInfoV1.graphInputs;
for (size_t i = 0; i < graph_input_num; ++i) {
QnnTensorWrapper tensorwrapper;
ORT_RETURN_IF_ERROR(tensorwrapper.Init(input_tensors[i]));
input_tensor_wrappers.push_back(std::move(tensorwrapper));
}
graph_input_num = qnn_sys_ctx_graph_info.graphInfoV1.numGraphInputs;
graph_output_num = qnn_sys_ctx_graph_info.graphInfoV1.numGraphOutputs;

// Copy graph output
Qnn_Tensor_t* output_tensors = qnn_sys_ctx_graph_info.graphInfoV1.graphOutputs;
for (size_t i = 0; i < graph_output_num; ++i) {
QnnTensorWrapper tensorwrapper;
ORT_RETURN_IF_ERROR(tensorwrapper.Init(output_tensors[i]));
output_tensor_wrappers.push_back(std::move(tensorwrapper));
}
input_tensors = qnn_sys_ctx_graph_info.graphInfoV1.graphInputs;
output_tensors = qnn_sys_ctx_graph_info.graphInfoV1.graphOutputs;
} else {
return ORT_MAKE_STATUS(ONNXRUNTIME, FAIL, "Unsupported context graph info version.");
}
ORT_RETURN_IF(nullptr == input_tensors, "Graph from cached context doesn't have any inputs.");
ORT_RETURN_IF(nullptr == output_tensors, "Graph from cached context doesn't have any outputs.");

// Copy graph input
for (size_t i = 0; i < graph_input_num; ++i) {
QnnTensorWrapper tensorwrapper;
ORT_RETURN_IF_ERROR(tensorwrapper.Init(input_tensors[i]));
input_tensor_wrappers.push_back(std::move(tensorwrapper));
}
// Copy graph output
for (size_t i = 0; i < graph_output_num; ++i) {
QnnTensorWrapper tensorwrapper;
ORT_RETURN_IF_ERROR(tensorwrapper.Init(output_tensors[i]));
output_tensor_wrappers.push_back(std::move(tensorwrapper));
}

Qnn_GraphHandle_t graph;
auto qnn_interface = qnn_backend_manager_->GetQnnInterface();
auto rt = qnn_interface.graphRetrieve(context, graph_name.c_str(), &graph);
Expand Down
6 changes: 5 additions & 1 deletion onnxruntime/test/providers/qnn/gather_op_htp_test.cc
Original file line number Diff line number Diff line change
Expand Up @@ -131,11 +131,15 @@ TEST_F(QnnHTPBackendTests, GatherOp_IndicesDynamicInt32_Axis0) {
ExpectedEPNodeAssignment::All);
}

// disabled for QNN 2.28.0.241029 failed for accuracy validation
// qdq@QNN_EP val: 3.6094117164611816 (err: 1.3094117641448975, err/output_range: 22.19342041015625%)
// qdq@CPU_EP val: 2.2905881404876709 (err: 0.0094118118286132812, err/output_range: 0.15952222049236298%)
// abs(qdq@QNN_EP - qdq@CPU_EP) / output_range = 22.033897399902344%
// Test creates a DQ -> Gather -> Q -> DQ graph, and checks that all
// nodes are supported by the QNN EP, and that the inference results are as accurate as CPU EP.
//
// Static int32 indices with axis = 1
TEST_F(QnnHTPBackendTests, GatherOp_IndicesStaticInt32_Axis1) {
TEST_F(QnnHTPBackendTests, DISABLED_GatherOp_IndicesStaticInt32_Axis1) {
RunQDQGatherOpTest<uint8_t, int32_t>(TestInputDef<float>({3, 3}, false, {1.0f, 1.2f, 1.9f, 2.3f, 3.4f, 3.9f, 4.5f, 5.7f, 5.9f}),
TestInputDef<int32_t>({1, 2}, true, {0, 2}),
{utils::MakeAttribute("axis", static_cast<int64_t>(1))},
Expand Down
9 changes: 8 additions & 1 deletion onnxruntime/test/providers/qnn/simple_op_htp_test.cc
Original file line number Diff line number Diff line change
Expand Up @@ -229,8 +229,15 @@ TEST_F(QnnHTPBackendTests, UnaryOp_Tanh) {
ExpectedEPNodeAssignment::All);
}

// disabled for QNN 2.28.0.241029 backendValidateOpConfig failed
// QnnDsp <E> [4294967295] has incorrect Value -32768, expected equal to 0.
// QnnDsp <V> validateNativeOps node_token_6:qti.aisw:Tanh htp op validator failed 3110
// QnnDsp <V> registered validator failed => 3110
// QnnDsp <E> QnnBackend_validateOpConfig failed 3110
// QnnDsp <V> Wake up free backend (id: 1)'s thread(s)
// QnnDsp <E> Failed to validate op node_token_6 with error 0xc26
// Tests accuracy of 16-bit QDQ Tanh.
TEST_F(QnnHTPBackendTests, UnaryOp_Tanh_U16) {
TEST_F(QnnHTPBackendTests, DISABLED_UnaryOp_Tanh_U16) {
RunQDQOpTest<uint16_t>("Tanh",
{TestInputDef<float>({1, 2, 3}, false, GetFloatDataInRange(-10.0f, 10.0f, 6))},
{},
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -32,7 +32,7 @@ parameters:
- name: QnnSdk
displayName: QNN SDK version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

jobs:
- job: Build_QNN_EP
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -62,7 +62,7 @@ parameters:
- name: QnnSdk
displayName: QNN SDK Version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

resources:
repositories:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,7 @@ parameters:
- name: QnnSdk
displayName: QNN SDK version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

jobs:
- job: Build_QNN_EP
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -59,7 +59,7 @@ parameters:
- name: qnn_sdk_version
type: string
displayName: 'QNN SDK version. Only for QNN packages.'
default: 2.27.0.240926
default: 2.28.0.241029

trigger: none

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@ parameters:
- name: QnnSdk
displayName: QNN SDK Version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

- name: build_config
displayName: Build Configuration
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -59,7 +59,7 @@ parameters:
- name: qnn_sdk_version
type: string
displayName: 'QNN SDK version. Only for QNN packages.'
default: 2.27.0.240926
default: 2.28.0.241029

stages:
- ${{ if eq(parameters.enable_windows_cpu, true) }}:
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
parameters:
- name: QnnSDKVersion
type: string
default: '2.27.0.240926'
default: '2.28.0.241029'

steps:
- script: |
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
parameters:
- name: QnnSDKVersion
type: string
default: '2.27.0.240926'
default: '2.28.0.241029'

steps:
- powershell: |
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@ parameters:
- name: QnnSdk
displayName: QNN SDK version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

jobs:
- job: Linux_py_qnn_Wheels_x64
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ parameters:
- name: QNN_SDK
displayName: QNN SDK Version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

- name: ENV_SETUP_SCRIPT
type: string
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ parameters:
- name: QNN_SDK
displayName: QNN SDK Version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

- name: ENV_SETUP_SCRIPT
type: string
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@ parameters:
- name: QNN_SDK
displayName: QNN SDK Version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

- name: ENV_SETUP_SCRIPT
type: string
Expand Down
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
parameters:
QnnSdk: '2.27.0.240926'
QnnSdk: '2.28.0.241029'
build_config: 'RelWithDebInfo'
IsReleaseBuild: false
DoEsrp: false
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,7 @@ parameters:
- name: QnnSdk
displayName: QNN SDK version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

jobs:
- job: 'build'
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -33,7 +33,7 @@ parameters:
- name: QnnSdk
displayName: QNN SDK version
type: string
default: 2.27.0.240926
default: 2.28.0.241029

jobs:
- job: 'build'
Expand Down

0 comments on commit d00a2fa

Please sign in to comment.