Extend MTK dispatch API to support DMA-BUF buffers

PiperOrigin-RevId: 713677908
Author:       A. Unique TensorFlower
Date:         2025-01-09 08:14:08 -08:00
Committed by: TensorFlower Gardener
Parent:       765be4d43e
Commit:       7fab320b49
6 changed files with 377 additions and 28 deletions
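
In outline, the change teaches the MediaTek dispatch backend to accept DMA-BUF-backed tensor buffers in addition to AHardwareBuffer-backed ones. Below is a condensed, hypothetical sketch of the new path, using only APIs that appear in the diffs in this commit; error handling is omitted, and kInputTensorType, kBufferSize, and device_context are illustrative placeholders rather than names from the change.

// Allocate a managed tensor buffer backed by DMA-BUF.
LiteRtTensorBuffer buffer;
LiteRtCreateManagedTensorBuffer(kLiteRtTensorBufferTypeDmaBuf,
                                &kInputTensorType, kBufferSize, &buffer);

// Inspect the underlying DMA-BUF; this is the C API wrapped by the new
// TensorBuffer::GetDmaBuf() accessor added below.
void* addr = nullptr;
int fd = -1;
LiteRtGetTensorBufferDmaBufBuffer(buffer, &addr, &fd);

// Register with the dispatch device context; the MediaTek backend now wraps
// the fd via NeuronMemory_createFromFd instead of rejecting non-AHWB buffers.
LiteRtTensorBufferHandle handle;
LiteRtDispatchRegisterTensorBuffer(device_context, buffer, &handle);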


@@ -136,6 +136,27 @@ class TensorBuffer
#endif
}
  struct DmaBuf {
    void* addr;
    int fd;
  };

  litert::Expected<DmaBuf> GetDmaBuf() const {
#if LITERT_HAS_DMABUF_SUPPORT
    DmaBuf dma_buf;
    if (LiteRtGetTensorBufferDmaBufBuffer(Get(), &dma_buf.addr, &dma_buf.fd) ==
        kLiteRtStatusOk) {
      return dma_buf;
    } else {
      return litert::Unexpected(kLiteRtStatusErrorRuntimeFailure,
                                "Failed to get DMA-BUF from tensor buffer");
    }
#else
    return litert::Unexpected(kLiteRtStatusErrorRuntimeFailure,
                              "DMA-BUF is not supported on this platform");
#endif
  }
Expected<LiteRtTensorBufferType> BufferType() const {
LiteRtTensorBufferType tensor_buffer_type;
if (auto status = LiteRtGetTensorBufferType(Get(), &tensor_buffer_type);
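
For context, a hypothetical caller of the new accessor could look like the sketch below; the helper name and the litert:: qualification of TensorBuffer are assumptions, while BufferType(), GetDmaBuf(), and the status and Expected types all appear in this change.

// Hypothetical helper (not part of this commit): extract the DMA-BUF file
// descriptor from a tensor buffer, failing cleanly for other backing types.
litert::Expected<int> GetDmaBufFd(const litert::TensorBuffer& buffer) {
  auto type = buffer.BufferType();
  if (!type) {
    return type.Error();
  }
  if (*type != kLiteRtTensorBufferTypeDmaBuf) {
    return litert::Unexpected(kLiteRtStatusErrorUnsupported,
                              "Tensor buffer is not DMA-BUF backed");
  }
  auto dma_buf = buffer.GetDmaBuf();
  if (!dma_buf) {
    return dma_buf.Error();
  }
  // dma_buf->addr is the host mapping; dma_buf->fd is what a vendor backend
  // can hand to NeuronMemory_createFromFd.
  return dma_buf->fd;
}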


@@ -30,7 +30,7 @@
using ::testing::Pointwise;
-TEST(DispatchApi, MediaTek) {
+TEST(MediaTek, DispatchApiWithAhwb) {
#if !defined(__ANDROID__)
GTEST_SKIP()
<< "This test is specific to Android devices with a MediaTek NPU";
@@ -331,3 +331,305 @@ TEST(DispatchApi, MediaTek) {
EXPECT_EQ(LiteRtDispatchDeviceContextDestroy(device_context),
kLiteRtStatusOk);
}
TEST(MediaTek, DispatchApiWithDmaBuf) {
#if !defined(__ANDROID__)
GTEST_SKIP()
<< "This test is specific to Android devices with a MediaTek NPU";
#endif
EXPECT_EQ(LiteRtDispatchInitialize(/*options=*/nullptr, /*num_options=*/0),
kLiteRtStatusOk);
const char* vendor_id;
EXPECT_EQ(LiteRtDispatchGetVendorId(&vendor_id), kLiteRtStatusOk);
ABSL_LOG(INFO) << "vendor_id: " << vendor_id;
const char* build_id;
EXPECT_EQ(LiteRtDispatchGetBuildId(&build_id), kLiteRtStatusOk);
ABSL_LOG(INFO) << "build_id: " << build_id;
LiteRtApiVersion api_version;
EXPECT_EQ(LiteRtDispatchGetApiVersion(&api_version), kLiteRtStatusOk);
ABSL_LOG(INFO) << "api_version: " << api_version.major << "."
<< api_version.minor << "." << api_version.patch;
int capabilities;
EXPECT_EQ(LiteRtDispatchGetCapabilities(&capabilities), kLiteRtStatusOk);
ABSL_LOG(INFO) << "capabilities: " << capabilities;
LiteRtDispatchDeviceContext device_context = nullptr;
EXPECT_EQ(LiteRtDispatchDeviceContextCreate(&device_context),
kLiteRtStatusOk);
ABSL_LOG(INFO) << "device_context: " << device_context;
auto model_file_name =
litert::testing::GetTestFilePath(kMediaTekModelFileName);
auto model = litert::internal::LoadBinaryFile(model_file_name);
EXPECT_TRUE(model) << model.Error();
ABSL_LOG(INFO) << "Loaded model " << model_file_name << ", " << model->Size()
<< " bytes";
// ///////////////////////////////////////////////////////////////////////////
// Set up an invocation context for a given model.
// ///////////////////////////////////////////////////////////////////////////
LiteRtDispatchInvocationContext invocation_context = nullptr;
EXPECT_EQ(LiteRtDispatchInvocationContextCreate(
device_context, kLiteRtDispatchExecutableTypeMlModel,
model->Data(), model->Size(), /*function_name=*/nullptr,
/*num_inputs=*/2, /*num_outputs=*/1, &invocation_context),
kLiteRtStatusOk);
ABSL_LOG(INFO) << "Invocation context: " << invocation_context;
// ///////////////////////////////////////////////////////////////////////////
// Determine tensor buffer requirements.
// ///////////////////////////////////////////////////////////////////////////
int num_tensor_buffer_types;
LiteRtTensorBufferRequirements input_0_tensor_buffer_requirements;
EXPECT_EQ(LiteRtDispatchGetInputRequirements(
invocation_context, /*input_index=*/0, &kInput0TensorType,
&input_0_tensor_buffer_requirements),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtGetNumTensorBufferRequirementsSupportedBufferTypes(
input_0_tensor_buffer_requirements, &num_tensor_buffer_types),
kLiteRtStatusOk);
EXPECT_GE(num_tensor_buffer_types, 2);
LiteRtTensorBufferType input_0_tensor_buffer_type;
EXPECT_EQ(LiteRtGetTensorBufferRequirementsSupportedTensorBufferType(
input_0_tensor_buffer_requirements, /*type_index=*/1,
&input_0_tensor_buffer_type),
kLiteRtStatusOk);
EXPECT_EQ(input_0_tensor_buffer_type, kLiteRtTensorBufferTypeDmaBuf);
size_t input_0_tensor_buffer_size;
EXPECT_EQ(
LiteRtGetTensorBufferRequirementsBufferSize(
input_0_tensor_buffer_requirements, &input_0_tensor_buffer_size),
kLiteRtStatusOk);
EXPECT_GE(input_0_tensor_buffer_size, sizeof(kTestInput0Tensor));
LiteRtTensorBufferRequirements input_1_tensor_buffer_requirements;
EXPECT_EQ(LiteRtDispatchGetInputRequirements(
invocation_context, /*input_index=*/1, &kInput1TensorType,
&input_1_tensor_buffer_requirements),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtGetNumTensorBufferRequirementsSupportedBufferTypes(
input_1_tensor_buffer_requirements, &num_tensor_buffer_types),
kLiteRtStatusOk);
EXPECT_GE(num_tensor_buffer_types, 2);
LiteRtTensorBufferType input_1_tensor_buffer_type;
EXPECT_EQ(LiteRtGetTensorBufferRequirementsSupportedTensorBufferType(
input_1_tensor_buffer_requirements, /*type_index=*/1,
&input_1_tensor_buffer_type),
kLiteRtStatusOk);
EXPECT_EQ(input_1_tensor_buffer_type, kLiteRtTensorBufferTypeDmaBuf);
size_t input_1_tensor_buffer_size;
EXPECT_EQ(
LiteRtGetTensorBufferRequirementsBufferSize(
input_1_tensor_buffer_requirements, &input_1_tensor_buffer_size),
kLiteRtStatusOk);
EXPECT_GE(input_1_tensor_buffer_size, sizeof(kTestInput1Tensor));
LiteRtTensorBufferRequirements output_tensor_buffer_requirements;
EXPECT_EQ(LiteRtDispatchGetOutputRequirements(
invocation_context, /*output_index=*/0, &kOutputTensorType,
&output_tensor_buffer_requirements),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtGetNumTensorBufferRequirementsSupportedBufferTypes(
output_tensor_buffer_requirements, &num_tensor_buffer_types),
kLiteRtStatusOk);
EXPECT_GE(num_tensor_buffer_types, 2);
LiteRtTensorBufferType output_tensor_buffer_type;
EXPECT_EQ(LiteRtGetTensorBufferRequirementsSupportedTensorBufferType(
output_tensor_buffer_requirements, /*type_index=*/1,
&output_tensor_buffer_type),
kLiteRtStatusOk);
EXPECT_EQ(output_tensor_buffer_type, kLiteRtTensorBufferTypeDmaBuf);
size_t output_tensor_buffer_size;
EXPECT_EQ(LiteRtGetTensorBufferRequirementsBufferSize(
output_tensor_buffer_requirements, &output_tensor_buffer_size),
kLiteRtStatusOk);
EXPECT_GE(output_tensor_buffer_size, sizeof(kTestOutputTensor));
// ///////////////////////////////////////////////////////////////////////////
// Allocate tensor buffers.
// ///////////////////////////////////////////////////////////////////////////
LiteRtTensorBuffer input_0_tensor_buffer;
EXPECT_EQ(LiteRtCreateManagedTensorBuffer(
input_0_tensor_buffer_type, &kInput0TensorType,
input_0_tensor_buffer_size, &input_0_tensor_buffer),
kLiteRtStatusOk);
LiteRtTensorBuffer input_1_tensor_buffer;
EXPECT_EQ(LiteRtCreateManagedTensorBuffer(
input_1_tensor_buffer_type, &kInput1TensorType,
input_1_tensor_buffer_size, &input_1_tensor_buffer),
kLiteRtStatusOk);
LiteRtTensorBuffer output_tensor_buffer;
EXPECT_EQ(LiteRtCreateManagedTensorBuffer(
output_tensor_buffer_type, &kOutputTensorType,
output_tensor_buffer_size, &output_tensor_buffer),
kLiteRtStatusOk);
// ///////////////////////////////////////////////////////////////////////////
// Register tensor buffers.
// ///////////////////////////////////////////////////////////////////////////
LiteRtTensorBufferHandle input_1_handle;
EXPECT_EQ(LiteRtDispatchRegisterTensorBuffer(
device_context, input_1_tensor_buffer, &input_1_handle),
kLiteRtStatusOk);
LiteRtTensorBufferHandle input_0_handle;
EXPECT_EQ(LiteRtDispatchRegisterTensorBuffer(
device_context, input_0_tensor_buffer, &input_0_handle),
kLiteRtStatusOk);
LiteRtTensorBufferHandle output_handle;
EXPECT_EQ(LiteRtDispatchRegisterTensorBuffer(
device_context, output_tensor_buffer, &output_handle),
kLiteRtStatusOk);
// ///////////////////////////////////////////////////////////////////////////
// Attach tensor buffers.
// ///////////////////////////////////////////////////////////////////////////
EXPECT_EQ(LiteRtDispatchAttachInput(invocation_context,
/*graph_input_index=*/0, input_0_handle),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtDispatchAttachInput(invocation_context,
/*graph_input_index=*/1, input_1_handle),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtDispatchAttachOutput(invocation_context,
/*graph_output_index=*/0, output_handle),
kLiteRtStatusOk);
// ///////////////////////////////////////////////////////////////////////////
// Fill the input buffers with data.
// ///////////////////////////////////////////////////////////////////////////
{
ABSL_LOG(INFO) << "Filling inputs with data";
void* host_mem_addr;
ASSERT_EQ(LiteRtLockTensorBuffer(input_0_tensor_buffer, &host_mem_addr,
/*event=*/nullptr),
kLiteRtStatusOk);
std::memcpy(host_mem_addr, kTestInput0Tensor, sizeof(kTestInput0Tensor));
ASSERT_EQ(LiteRtUnlockTensorBuffer(input_0_tensor_buffer), kLiteRtStatusOk);
ASSERT_EQ(LiteRtLockTensorBuffer(input_1_tensor_buffer, &host_mem_addr,
/*event=*/nullptr),
kLiteRtStatusOk);
std::memcpy(host_mem_addr, kTestInput1Tensor, sizeof(kTestInput1Tensor));
ASSERT_EQ(LiteRtUnlockTensorBuffer(input_1_tensor_buffer), kLiteRtStatusOk);
}
// ///////////////////////////////////////////////////////////////////////////
// Execute model.
// ///////////////////////////////////////////////////////////////////////////
ABSL_LOG(INFO) << "Invoking execution...";
EXPECT_EQ(LiteRtDispatchInvoke(invocation_context), kLiteRtStatusOk);
// ///////////////////////////////////////////////////////////////////////////
// Check output for correctness.
// ///////////////////////////////////////////////////////////////////////////
{
ABSL_LOG(INFO) << "Checking output...";
void* host_mem_addr;
ASSERT_EQ(LiteRtLockTensorBuffer(output_tensor_buffer, &host_mem_addr,
/*event=*/nullptr),
kLiteRtStatusOk);
auto output = absl::MakeSpan(static_cast<const float*>(host_mem_addr),
kTestOutputSize);
for (auto i = 0; i < kTestOutputSize; ++i) {
ABSL_LOG(INFO) << output[i] << "\t" << kTestOutputTensor[i];
}
EXPECT_THAT(output, Pointwise(testing::FloatNear(1e-3), kTestOutputTensor));
ASSERT_EQ(LiteRtUnlockTensorBuffer(output_tensor_buffer), kLiteRtStatusOk);
}
// ///////////////////////////////////////////////////////////////////////////
// Fill the input buffers with more data.
// ///////////////////////////////////////////////////////////////////////////
{
ABSL_LOG(INFO) << "Filling inputs with data";
void* host_mem_addr;
ASSERT_EQ(LiteRtLockTensorBuffer(input_0_tensor_buffer, &host_mem_addr,
/*event=*/nullptr),
kLiteRtStatusOk);
std::memcpy(host_mem_addr, kTestInput0Tensor_2,
sizeof(kTestInput0Tensor_2));
ASSERT_EQ(LiteRtUnlockTensorBuffer(input_0_tensor_buffer), kLiteRtStatusOk);
ASSERT_EQ(LiteRtLockTensorBuffer(input_1_tensor_buffer, &host_mem_addr,
/*event=*/nullptr),
kLiteRtStatusOk);
std::memcpy(host_mem_addr, kTestInput1Tensor_2,
sizeof(kTestInput1Tensor_2));
ASSERT_EQ(LiteRtUnlockTensorBuffer(input_1_tensor_buffer), kLiteRtStatusOk);
}
// ///////////////////////////////////////////////////////////////////////////
// Execute model once more.
// ///////////////////////////////////////////////////////////////////////////
ABSL_LOG(INFO) << "Invoking second execution...";
EXPECT_EQ(LiteRtDispatchInvoke(invocation_context), kLiteRtStatusOk);
// ///////////////////////////////////////////////////////////////////////////
// Check output for correctness.
// ///////////////////////////////////////////////////////////////////////////
{
ABSL_LOG(INFO) << "Checking output...";
void* host_mem_addr;
ASSERT_EQ(LiteRtLockTensorBuffer(output_tensor_buffer, &host_mem_addr,
/*event=*/nullptr),
kLiteRtStatusOk);
auto output = absl::MakeSpan(static_cast<const float*>(host_mem_addr),
kTestOutputSize);
for (auto i = 0; i < kTestOutputSize; ++i) {
ABSL_LOG(INFO) << output[i] << "\t" << kTestOutputTensor_2[i];
}
EXPECT_THAT(output,
Pointwise(testing::FloatNear(1e-3), kTestOutputTensor_2));
ASSERT_EQ(LiteRtUnlockTensorBuffer(output_tensor_buffer), kLiteRtStatusOk);
}
// ///////////////////////////////////////////////////////////////////////////
// Clean up resources.
// ///////////////////////////////////////////////////////////////////////////
EXPECT_EQ(LiteRtDispatchDetachInput(invocation_context,
/*graph_input_index=*/0, input_0_handle),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtDispatchDetachInput(invocation_context,
/*graph_input_index=*/1, input_1_handle),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtDispatchDetachOutput(invocation_context,
/*graph_output_index=*/0, output_handle),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtDispatchUnregisterTensorBuffer(device_context, output_handle),
kLiteRtStatusOk);
EXPECT_EQ(
LiteRtDispatchUnregisterTensorBuffer(device_context, input_1_handle),
kLiteRtStatusOk);
EXPECT_EQ(
LiteRtDispatchUnregisterTensorBuffer(device_context, input_0_handle),
kLiteRtStatusOk);
LiteRtDestroyTensorBuffer(output_tensor_buffer);
LiteRtDestroyTensorBuffer(input_1_tensor_buffer);
LiteRtDestroyTensorBuffer(input_0_tensor_buffer);
EXPECT_EQ(LiteRtDispatchInvocationContextDestroy(invocation_context),
kLiteRtStatusOk);
EXPECT_EQ(LiteRtDispatchDeviceContextDestroy(device_context),
kLiteRtStatusOk);
}


@@ -14,6 +14,8 @@
#include "tensorflow/lite/experimental/litert/vendors/mediatek/dispatch/litert_dispatch_device_context.h"
#include <sys/mman.h>
#include <cstddef>
#include <memory>
@@ -46,12 +48,6 @@ LiteRtDispatchDeviceContextT::RegisterTensorBuffer(
return tensor_buffer_type.Error();
}
-  if (*tensor_buffer_type != kLiteRtTensorBufferTypeAhwb) {
-    LITERT_LOG(LITERT_ERROR, "Unsupported buffer type: %d",
-               *tensor_buffer_type);
-    return litert::Unexpected(kLiteRtStatusErrorUnsupported);
-  }
auto tensor_buffer_size = tensor_buffer.Size();
if (!tensor_buffer_size) {
return tensor_buffer_size.Error();
@@ -62,26 +58,52 @@ LiteRtDispatchDeviceContextT::RegisterTensorBuffer(
return tensor_buffer_offset.Error();
}
-  auto ahwb = tensor_buffer.GetAhwb();
-  if (!ahwb) {
-    return ahwb.Error();
-  }
+  switch (*tensor_buffer_type) {
+    case kLiteRtTensorBufferTypeAhwb:
+      if (auto ahwb = tensor_buffer.GetAhwb(); ahwb) {
#ifdef __ANDROID__
-  NeuronMemory* neuron_memory;
-  if (neuron_adapter_.api().memory_create_from_ahwb(*ahwb, &neuron_memory) !=
-      NEURON_NO_ERROR) {
-    return litert::Unexpected(kLiteRtStatusErrorRuntimeFailure,
-                              "Failed to create NeuronMemory from AHWB");
-  }
-  return neuron_memory_registry_.Register(neuron_memory, *tensor_buffer_size,
-                                          *tensor_buffer_offset);
+        NeuronMemory* neuron_memory;
+        if (neuron_adapter_.api().memory_create_from_ahwb(
+                *ahwb, &neuron_memory) != NEURON_NO_ERROR) {
+          return litert::Unexpected(kLiteRtStatusErrorRuntimeFailure,
+                                    "Failed to create NeuronMemory from AHWB");
+        }
+        return neuron_memory_registry_.Register(
+            neuron_memory, *tensor_buffer_size, *tensor_buffer_offset);
#else
-  (void)neuron_adapter_;
-  return litert::Unexpected(
-      kLiteRtStatusErrorRuntimeFailure,
-      "AHardwareBuffer is not supported on this platform");
+        (void)neuron_adapter_;
+        return litert::Unexpected(
+            kLiteRtStatusErrorRuntimeFailure,
+            "AHardwareBuffer is not supported on this platform");
#endif
+      } else {
+        return ahwb.Error();
+      }
+      break;
+    case kLiteRtTensorBufferTypeDmaBuf:
+      if (auto dma_buf = tensor_buffer.GetDmaBuf(); dma_buf) {
+        NeuronMemory* neuron_memory;
+        if (neuron_adapter_.api().memory_create_from_fd(
+                *tensor_buffer_size, /*protect*/ PROT_READ | PROT_WRITE,
+                dma_buf->fd, *tensor_buffer_offset,
+                &neuron_memory) != NEURON_NO_ERROR) {
+          return litert::Unexpected(
+              kLiteRtStatusErrorRuntimeFailure,
+              "Failed to create NeuronMemory from DMA-BUF");
+        }
+        return neuron_memory_registry_.Register(
+            neuron_memory, *tensor_buffer_size, *tensor_buffer_offset);
+      } else {
+        return dma_buf.Error();
+      }
+      break;
+    default:
+      LITERT_LOG(LITERT_ERROR, "Unsupported buffer type: %d",
+                 *tensor_buffer_type);
+      return litert::Unexpected(kLiteRtStatusErrorUnsupported);
+  }
}
LiteRtDispatchDeviceContextT::NeuronMemoryRegistry::~NeuronMemoryRegistry() {


@@ -288,10 +288,10 @@ LiteRtDispatchInvocationContextT::IoRequirementsBuilder::IoRequirementsBuilder(
Expected<LiteRtTensorBufferRequirements>
LiteRtDispatchInvocationContextT::IoRequirementsBuilder::Create() {
-  static constexpr std::array<LiteRtTensorBufferType, 1>
-      kSupportedTensorBufferTypes = {
-          kLiteRtTensorBufferTypeAhwb,
-      };
+  static constexpr std::array kSupportedTensorBufferTypes = {
+      kLiteRtTensorBufferTypeAhwb,
+      kLiteRtTensorBufferTypeDmaBuf,
+  };
LiteRtTensorBufferRequirements requirements;
if (auto status = LiteRtCreateTensorBufferRequirements(


@@ -107,6 +107,7 @@ litert::Expected<void> NeuronAdapter::LoadSymbols(
api_->execution_set_output_from_memory);
LOAD_SYMB(NeuronMemory_createFromAHardwareBuffer,
api_->memory_create_from_ahwb);
LOAD_SYMB(NeuronMemory_createFromFd, api_->memory_create_from_fd);
LOAD_SYMB(NeuronMemory_free, api_->memory_free);
LOAD_SYMB(NeuronModel_addOperand, api_->model_add_operand);
LOAD_SYMB(NeuronModel_addOperation, api_->model_add_operation);


@@ -114,6 +114,8 @@ int NeuronExecution_setOutputFromMemory(NeuronExecution* execution,
size_t offset, size_t length);
int NeuronMemory_createFromAHardwareBuffer(const AHardwareBuffer* ahwb,
NeuronMemory** memory);
int NeuronMemory_createFromFd(size_t size, int protect, int fd, size_t offset,
NeuronMemory** memory);
int NeuronModel_addOperand(NeuronModel* model, const NeuronOperandType* type);
int NeuronModel_addOperation(NeuronModel* model, NeuronOperationType type,
uint32_t inputCount, const uint32_t* inputs,
@@ -232,6 +234,7 @@ struct NeuronAdapter::Api {
execution_set_output_from_memory = nullptr;
decltype(&NeuronMemory_createFromAHardwareBuffer) memory_create_from_ahwb =
nullptr;
decltype(&NeuronMemory_createFromFd) memory_create_from_fd = nullptr;
decltype(&NeuronMemory_free) memory_free = nullptr;
decltype(&NeuronModel_addOperand) model_add_operand = nullptr;
decltype(&NeuronModel_addOperation) model_add_operation = nullptr;