
Commit 50a3f7f

DannyYuyang-quic authored and yuyazhua committed
Qualcomm AI Engine Direct - Support Qnn IR backend in online preparation
- Support Qnn IR backend
- Replace QCir with Dlc in online prepare flow
- Fix SDK version checking
- Add config for Saver backend
1 parent 542480c · commit 50a3f7f

26 files changed: +632 −189 lines
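For orientation, a rough export-time sketch of where these options enter the flow. This is not part of the commit: generate_htp_compiler_spec and generate_qnn_executorch_compiler_spec are existing helpers in executorch.backends.qualcomm.utils.utils, but the online_prepare and saver keyword names below are assumptions about how the new config is surfaced, not something this diff shows.

# Hypothetical export-time usage (keyword names are assumptions):
# online_prepare defers graph compilation to the device via the Qnn IR (Dlc)
# flow touched below; saver records QNN API calls instead of producing a
# context binary.
from executorch.backends.qualcomm.utils.utils import (
    generate_htp_compiler_spec,
    generate_qnn_executorch_compiler_spec,
)
from executorch.backends.qualcomm.serialization.qc_schema import QcomChipset

backend_options = generate_htp_compiler_spec(use_fp16=True)
compile_specs = generate_qnn_executorch_compiler_spec(
    soc_model=QcomChipset.SM8650,   # assumed target SoC
    backend_options=backend_options,
    online_prepare=True,            # compile from Qnn IR / Dlc at runtime
    saver=False,                    # assumed flag for the new Saver backend config
)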

backends/qualcomm/CMakeLists.txt

Lines changed: 9 additions & 1 deletion
@@ -73,6 +73,7 @@ endif()
 
 include_directories(
   BEFORE ${_common_include_directories} ${QNN_SDK_ROOT}/include/QNN
+  ${QNN_SDK_ROOT}/share/QNN/converter/jni
   ${EXECUTORCH_SOURCE_DIR}/third-party/flatbuffers/include
   ${EXECUTORCH_SOURCE_DIR}/runtime/core/portable_type/c10
 )
@@ -183,8 +184,15 @@ target_link_libraries(
   PRIVATE qnn_schema qnn_backend qnn_device qnn_context qnn_graph
           qnn_mem_manager qnn_custom_protocol
 )
+
+target_include_directories(qnn_manager PUBLIC
+  ${QNN_SDK_ROOT}/include/QNN
+  ${QNN_SDK_ROOT}/share/QNN/converter/jni/
+  ${PROJECT_SOURCE_DIR})
+target_link_directories(qnn_manager PUBLIC ${QNN_SDK_ROOT}/lib/${ARCHITECTURE}/)
+
 target_link_libraries(
-  qnn_manager PRIVATE qnn_factory wrappers qnn_schema utils shared_buffer
+  qnn_manager PRIVATE qnn_factory wrappers qnn_schema utils shared_buffer QnnModelDlc
 )
 target_link_libraries(
   qnn_executorch_backend PRIVATE qnn_executorch_header qnn_schema qnn_manager

backends/qualcomm/aot/python/PyQnnManagerAdaptor.h

Lines changed: 9 additions & 6 deletions
@@ -34,7 +34,7 @@ class PyQnnManager {
     auto qnn_executorch_options = GetQnnExecuTorchOptions(
         qnn_executorch_option_ptr_.cast<std::string_view>().data());
     qnn_manager_ = std::make_shared<QnnManager>(
-        qnn_executorch_options, qnn_executorch_context_binary_);
+        qnn_executorch_options, qnn_executorch_context_binary_, false);
   }
 
   // used for loading context binary directly
@@ -47,7 +47,7 @@ class PyQnnManager {
     qnn_executorch_context_binary_.buffer = info.ptr;
     qnn_executorch_context_binary_.nbytes = info.size * info.itemsize;
     qnn_manager_ = std::make_shared<QnnManager>(
-        qnn_executorch_options, qnn_executorch_context_binary_);
+        qnn_executorch_options, qnn_executorch_context_binary_, false);
   }
 
   // used during stage 2 of multi-graph mode
@@ -160,7 +160,7 @@ class PyQnnManager {
     qnn_executorch_context_binary_ =
         MakeQcirCustomBinaryInfo(qcir_bin, tensor_data);
     qnn_manager_ = std::make_shared<QnnManager>(
-        qnn_executorch_options, qnn_executorch_context_binary_);
+        qnn_executorch_options, qnn_executorch_context_binary_, false);
   }
 
   executorch::runtime::Error Init() {
@@ -195,7 +195,7 @@ class PyQnnManager {
       std::vector<std::shared_ptr<OpWrapper>>& op_wrappers) {
     QnnExecuTorchContextBinary binary_info;
 
-    if (qnn_manager_->IsOnlinePrepare() || qnn_manager_->IsMultipleGraphs()) {
+    if (qnn_manager_->IsMultipleGraphs()) {
       builder_.Reset();
       std::vector<uint8_t> tensor_data;
       std::vector<uint64_t> offsets;
@@ -305,8 +305,11 @@ class PyQnnManager {
       QNN_EXECUTORCH_LOG_ERROR("Fail to compile QNN graph");
       return py::array_t<char>(0);
     }
-    if (qnn_manager_->GetContextBinary(binary_info) !=
-        executorch::runtime::Error::Ok) {
+    auto qnn_executorch_options = GetQnnExecuTorchOptions(
+        qnn_executorch_option_ptr_.cast<std::string_view>().data());
+    if (qnn_executorch_options->saver() ||
+        qnn_manager_->GetContextBinary(binary_info) !=
+            executorch::runtime::Error::Ok) {
       return py::array_t<char>(0);
     }
   }
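Note that all three constructor call sites above keep the same Python-facing signature; the new trailing boolean is hard-coded to false on the AOT side (and to true in the runtime backend below), so Python callers are untouched. A minimal sketch of the unchanged AOT call site, assuming the existing PyQnnManagerAdaptor binding and the generate_qnn_executorch_option helper imported in qnn_preprocess.py:

# Sketch only (import path and flow assumed from the existing AOT code);
# the binding supplies the new third QnnManager constructor argument internally.
import executorch.backends.qualcomm.python.PyQnnManagerAdaptor as PyQnnManager
from executorch.backends.qualcomm.partition.utils import generate_qnn_executorch_option

def make_qnn_manager(compile_specs):
    # compile_specs: the list of CompileSpec produced at export time
    option = generate_qnn_executorch_option(compile_specs)
    qnn_manager = PyQnnManager.QnnManager(option)
    qnn_manager.Init()
    return qnn_manager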

backends/qualcomm/qnn_preprocess.py

Lines changed: 9 additions & 0 deletions
@@ -20,6 +20,9 @@
 from executorch.backends.qualcomm.builders.node_visitor import get_node_visitors
 from executorch.backends.qualcomm.builders.qnn_constants import OpContextLoader
 from executorch.backends.qualcomm.partition.utils import generate_qnn_executorch_option
+from executorch.backends.qualcomm.serialization.qc_schema_serialize import (
+    flatbuffer_to_option,
+)
 from executorch.exir.backend.backend_details import (
     BackendDetails,
     CompileSpec,
@@ -107,6 +110,12 @@ def preprocess(
             qnn_manager.GetGraphNames()[0],
             [py_op_wrapper.GetOpWrapper() for py_op_wrapper in py_op_wrapper_list],
         )
+
+        obj_options = flatbuffer_to_option(option)
+        if obj_options.saver:
+            exit(
+                f"Records all QNN API calls from saver backend at: {obj_options.saver_output_dir}"
+            )
         assert len(qnn_context_binary) != 0, "Failed to generate Qnn context binary."
         qnn_manager.Destroy()
         # For now, debug_handle_map is not used by QNN ExecuTorch
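The new check runs before the context-binary assertion on purpose: when the saver config is enabled, Compile() returns an empty buffer (see the qnn_executorch_options->saver() guard added in PyQnnManagerAdaptor.h above), so preprocess() exits here with a pointer to the recorded output instead of failing the assert. A condensed restatement of that flow, using only names that appear in the hunks above:

# Condensed view of the new control flow in preprocess(); `option`,
# `qnn_manager`, and `py_op_wrapper_list` are as in the hunk above.
qnn_context_binary = qnn_manager.Compile(
    qnn_manager.GetGraphNames()[0],
    [w.GetOpWrapper() for w in py_op_wrapper_list],
)

obj_options = flatbuffer_to_option(option)
if obj_options.saver:
    # Saver backend: QNN API calls were recorded instead of a context binary,
    # so stop lowering and report where the recording lives.
    exit(
        f"Records all QNN API calls from saver backend at: {obj_options.saver_output_dir}"
    )

# Otherwise a non-empty context binary is required.
assert len(qnn_context_binary) != 0, "Failed to generate Qnn context binary."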

backends/qualcomm/runtime/QnnExecuTorchBackend.cpp

Lines changed: 4 additions & 5 deletions
@@ -36,7 +36,6 @@ Result<DelegateHandle*> QnnExecuTorchBackend::init(
   // covert SizedBuffer to qnn ExecuTorch option
   QnnExecuTorchContextBinary qnn_context_blob;
   const qnn_delegate::QnnExecuTorchOptions* qnn_executorch_options = nullptr;
-
   auto [status, signature, ctx_size, ctx_bin] =
       QnnContextCustomProtocol().DeserializeContextCustomBuffer(
           const_cast<void*>(processed->data()));
@@ -49,6 +48,7 @@ Result<DelegateHandle*> QnnExecuTorchBackend::init(
     qnn_context_blob.buffer = ctx_bin;
   } else {
     // This buffer will be verified again in QnnBackendCache.
+
     QNN_EXECUTORCH_LOG_INFO(
         "Deserializing processed data using QnnQcirCustomProtocol");
     qnn_context_blob.buffer = const_cast<void*>(processed->data());
@@ -71,8 +71,7 @@ Result<DelegateHandle*> QnnExecuTorchBackend::init(
 
   // NOTE: Since we use placement new and since this type is not trivially
   // destructible, we must call the destructor manually in destroy().
-  new (qnn_manager) QnnManager(qnn_executorch_options, qnn_context_blob);
-
+  new (qnn_manager) QnnManager(qnn_executorch_options, qnn_context_blob, true);
   // TODO: this is a temporal solution for multi-graph support, will be
   // removed once framework starts to accept runtime configuration
   // ---
@@ -94,9 +93,9 @@ Result<DelegateHandle*> QnnExecuTorchBackend::init(
 
   if (qnn_manager->IsOnlinePrepare()) {
     ET_CHECK_OR_RETURN_ERROR(
-        qnn_manager->CompileQcir() == Error::Ok,
+        qnn_manager->CompileGraphsFromDlc() == Error::Ok,
         Internal,
-        "Fail to compile binary in qcir format");
+        "Fail to compile binary in Dlc format");
   } else {
     for (const std::string& graph_name : qnn_manager->GetGraphNames()) {
       ET_CHECK_OR_RETURN_ERROR(
