diff --git a/binaries/dnn_benchmark.cpp b/binaries/dnn_benchmark.cpp
index 1a834a6..304d438 100644
--- a/binaries/dnn_benchmark.cpp
+++ b/binaries/dnn_benchmark.cpp
@@ -39,7 +39,7 @@ bool hasEnding(std::string const &fullString, std::string const &ending) {
 }
 
 auto GetModel(css &daqName, const bool allow_fp16,
-              const PreferenceCode &compile_preference) {
+              const int compile_preference) {
     std::unique_ptr<Model> model;
     ModelBuilder builder;
     if (hasEnding(daqName, ".daq")) {
@@ -64,7 +64,7 @@ auto GetModel(css &daqName, const bool allow_fp16,
     return model;
 }
 
-auto PrefCodeToStr(const PreferenceCode &preference_code) {
+auto PrefCodeToStr(const int &preference_code) {
     if (preference_code == ANEURALNETWORKS_PREFER_FAST_SINGLE_ANSWER) {
         return "fast single";
     }
@@ -129,13 +129,13 @@ int main(int argc, char **argv) {
         }                                                                      \
     }
 
-    const std::vector<PreferenceCode> preference_candidates{
+    const std::vector<int> preference_candidates{
         ANEURALNETWORKS_PREFER_FAST_SINGLE_ANSWER,
         ANEURALNETWORKS_PREFER_SUSTAINED_SPEED,
         ANEURALNETWORKS_PREFER_LOW_POWER};
     if (quant) {
         uint8_t data[input_len];
-        uint8_t output[output_len];
+        float output[output_len];
         WARM_UP;
         const std::vector<bool> fp16_candidates{false};
         BENCHMARK(fp16_candidates, preference_candidates);
@@ -149,7 +149,7 @@ int main(int argc, char **argv) {
         WARM_UP;
 
         const std::vector<bool> fp16_candidates =
-            ModelBuilder::GetAndroidSdkVersion() >= __ANDROID_API_P__
+            GetAndroidSdkVersion() >= __ANDROID_API_P__
                 ? std::vector<bool>{false, true}
                 : std::vector<bool>{false};
         BENCHMARK(fp16_candidates, preference_candidates);
diff --git a/dnnlibrary/CMakeLists.txt b/dnnlibrary/CMakeLists.txt
index bb6adf8..0042cc0 100644
--- a/dnnlibrary/CMakeLists.txt
+++ b/dnnlibrary/CMakeLists.txt
@@ -4,7 +4,7 @@ set(dnnlibrary_src
     ${PROJECT_SOURCE_DIR}/include/dnnlibrary/ModelBuilder.h
     ${PROJECT_SOURCE_DIR}/include/dnnlibrary/Model.h
     ${PROJECT_SOURCE_DIR}/include/dnnlibrary/DaqReader.h
-    ${PROJECT_SOURCE_DIR}/include/dnnlibrary/NeuralNetworksWrapper.h
+    ${PROJECT_SOURCE_DIR}/include/dnnlibrary/nnapi_implementation.h
     android_log_helper.h
     operand_helper.h
     flatbuffers_helper.h
@@ -12,6 +12,7 @@ set(dnnlibrary_src
     Model.cpp
     DaqReader.cpp 
     NeuralNetworksWrapper.cpp
+    nnapi_implementation.cc
     ${PROJECT_SOURCE_DIR}/include/common/Shaper.h
     ${PROJECT_SOURCE_DIR}/common/Shaper.cpp
     ${PROJECT_SOURCE_DIR}/include/common/StrKeyMap.h 
diff --git a/dnnlibrary/DaqReader.cpp b/dnnlibrary/DaqReader.cpp
index fd7869b..abbae5f 100644
--- a/dnnlibrary/DaqReader.cpp
+++ b/dnnlibrary/DaqReader.cpp
@@ -59,13 +59,13 @@ std::string layer_type_to_str(DNN::LayerType type) {
 int convert_fuse_code_to_nnapi(const DNN::FuseCode fuse_code) {
     switch (fuse_code) {
         case DNN::FuseCode::None:
-            return FuseCode::ANEURALNETWORKS_FUSED_NONE;
+            return ANEURALNETWORKS_FUSED_NONE;
         case DNN::FuseCode::Relu:
-            return FuseCode::ANEURALNETWORKS_FUSED_RELU;
+            return ANEURALNETWORKS_FUSED_RELU;
         case DNN::FuseCode::Relu1:
-            return FuseCode::ANEURALNETWORKS_FUSED_RELU1;
+            return ANEURALNETWORKS_FUSED_RELU1;
         case DNN::FuseCode::Relu6:
-            return FuseCode::ANEURALNETWORKS_FUSED_RELU6;
+            return ANEURALNETWORKS_FUSED_RELU6;
     }
     throw std::invalid_argument("Invalid fuse_code");
 }
diff --git a/dnnlibrary/Model.cpp b/dnnlibrary/Model.cpp
index 299790a..be564b4 100644
--- a/dnnlibrary/Model.cpp
+++ b/dnnlibrary/Model.cpp
@@ -29,15 +29,19 @@ void Model::PrepareForExecution() {
         throw std::invalid_argument(
             "Error in PrepareForExecution, compilation_ == nullptr");
     }
-    THROW_ON_ERROR(ANeuralNetworksExecution_create(compilation_, &execution_));
+    THROW_ON_ERROR(
+        nnapi_->ANeuralNetworksExecution_create(compilation_, &execution_));
     prepared_for_exe_ = true;
 }
 
+Model::Model() : nnapi_(NnApiImplementation()) {
+}
+
 Model::~Model() {
     munmap(data_, data_size_);
-    ANeuralNetworksModel_free(model_);
-    ANeuralNetworksCompilation_free(compilation_);
-    ANeuralNetworksMemory_free(memory_);
+    nnapi_->ANeuralNetworksModel_free(model_);
+    nnapi_->ANeuralNetworksCompilation_free(compilation_);
+    nnapi_->ANeuralNetworksMemory_free(memory_);
 }
 
 void Model::SetInputBuffer(const int32_t index, const float *buffer) {
@@ -52,8 +56,8 @@ void Model::SetInputBuffer(const int32_t index, const void *buffer,
                            const size_t elemsize) {
     if (!prepared_for_exe_) PrepareForExecution();
     auto size = shaper_.GetSize(input_names_[index]) * elemsize;
-    THROW_ON_ERROR(ANeuralNetworksExecution_setInput(execution_, index, nullptr,
-                                                     buffer, size))
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksExecution_setInput(
+        execution_, index, nullptr, buffer, size))
 }
 
 void Model::SetOutputBuffer(const int32_t index, float *buffer) {
@@ -72,17 +76,18 @@ void Model::SetOutputBuffer(const int32_t index, void *buffer,
                             const size_t elemsize) {
     if (!prepared_for_exe_) PrepareForExecution();
     auto size = shaper_.GetSize(output_names_[index]) * elemsize;
-    THROW_ON_ERROR(ANeuralNetworksExecution_setOutput(execution_, index,
-                                                      nullptr, buffer, size))
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksExecution_setOutput(
+        execution_, index, nullptr, buffer, size))
 }
 
 void Model::PredictAfterSetInputBuffer() {
     ANeuralNetworksEvent *event = nullptr;
-    THROW_ON_ERROR(ANeuralNetworksExecution_startCompute(execution_, &event));
-    THROW_ON_ERROR(ANeuralNetworksEvent_wait(event));
+    THROW_ON_ERROR(
+        nnapi_->ANeuralNetworksExecution_startCompute(execution_, &event));
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksEvent_wait(event));
 
-    ANeuralNetworksEvent_free(event);
-    ANeuralNetworksExecution_free(execution_);
+    nnapi_->ANeuralNetworksEvent_free(event);
+    nnapi_->ANeuralNetworksExecution_free(execution_);
     prepared_for_exe_ = false;
 }
 
diff --git a/dnnlibrary/ModelBuilder.cpp b/dnnlibrary/ModelBuilder.cpp
index 728c18e..09ba49e 100644
--- a/dnnlibrary/ModelBuilder.cpp
+++ b/dnnlibrary/ModelBuilder.cpp
@@ -30,41 +30,6 @@ using std::stringstream;
 using std::vector;
 using namespace android::nn::wrapper;
 
-// Copy from
-// https://github.com/tensorflow/tensorflow/blob/master/tensorflow/lite/nnapi/nnapi_implementation.cc
-int32_t ModelBuilder::GetAndroidSdkVersion() {
-    const char *sdkProp = "ro.build.version.sdk";
-    char sdkVersion[PROP_VALUE_MAX];
-    int length = __system_property_get(sdkProp, sdkVersion);
-    if (length != 0) {
-        int32_t result = 0;
-        for (int i = 0; i < length; ++i) {
-            int digit = sdkVersion[i] - '0';
-            if (digit < 0 || digit > 9) {
-                // Non-numeric SDK version, assume it's higher than expected;
-                return 0xffff;
-            }
-            result = result * 10 + digit;
-        }
-        // TODO(levp): remove once SDK gets updated to 29th level
-        // Upgrade SDK version for pre-release Q to be able to test
-        // functionality available from SDK level 29.
-        if (result == 28) {
-            char versionCodename[PROP_VALUE_MAX];
-            const char *versionCodenameProp = "ro.build.version.codename";
-            length =
-                __system_property_get(versionCodenameProp, versionCodename);
-            if (length != 0) {
-                if (versionCodename[0] == 'Q') {
-                    return 29;
-                }
-            }
-        }
-        return result;
-    }
-    return 0;
-}
-
 void ModelBuilder::RegisterOperand(const std::string &name,
                                    ModelBuilder::Index index,
                                    const OperandType &operand_type) {
@@ -539,7 +504,7 @@ ModelBuilder::Index ModelBuilder::AddDequantize(const std::string &input,
     input_indexes.push_back(input_idx);
     shaper_.Identity(input, output);
     const OperandType operand_type =
-        GetOperandType(Type::FLOAT32, shaper_[output]);
+        GetOperandType(Type::TENSOR_FLOAT32, shaper_[output]);
     const auto output_idx = AddOperation(ANEURALNETWORKS_DEQUANTIZE,
                                          input_indexes, operand_type)[0];
     RegisterOperand(output, output_idx, operand_type);
@@ -696,7 +661,7 @@ OperandType ModelBuilder::GetOperandType(const QuantInfo &quant_info,
             map_type##_operand_map_.end()) {                                 \
             const auto index = AddNewOperand({Type::op_type});               \
             THROW_ON_ERROR_WITH_NOTE(                                        \
-                ANeuralNetworksModel_setOperandValue(                        \
+                nnapi_->ANeuralNetworksModel_setOperandValue(                \
                     dnn_model_->model_, index, &value, sizeof(value)),       \
                 "value: " + std::to_string(value));                          \
             map_type##_operand_map_[value] = index;                          \
@@ -713,15 +678,15 @@ DEFINE_OPERAND_FROM_SCALAR(float, float32, FLOAT32);
 ModelBuilder::Index ModelBuilder::AddMissingOperand(
     const OperandType &operand_type) {
     const auto index = AddNewOperand(operand_type);
-    THROW_ON_ERROR(ANeuralNetworksModel_setOperandValue(dnn_model_->model_,
-                                                        index, nullptr, 0));
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksModel_setOperandValue(
+        dnn_model_->model_, index, nullptr, 0));
     return index;
 }
 
 ModelBuilder::Index ModelBuilder::AddNewOperand(
     const OperandType &operand_type) {
-    THROW_ON_ERROR(ANeuralNetworksModel_addOperand(dnn_model_->model_,
-                                                   &operand_type.operandType));
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksModel_addOperand(
+        dnn_model_->model_, &operand_type.operandType));
     return next_index_++;
 }
 
@@ -732,7 +697,7 @@ ModelBuilder::Index ModelBuilder::AddTensorFromMemory(const string &name,
     throw std::invalid_argument("");
     DNN_ASSERT(!dimen.empty(), "");
     const auto index = AddNewOperand({Type::TENSOR_FLOAT32, dimen});
-    THROW_ON_ERROR(ANeuralNetworksModel_setOperandValueFromMemory(
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksModel_setOperandValueFromMemory(
         dnn_model_->model_, index, dnn_model_->memory_,
         addr - dnn_model_->data_, Product(dimen) * sizeof(float)));
     shaper_.AddShape(name, dimen);
@@ -775,7 +740,7 @@ ModelBuilder::Index ModelBuilder::AddTensorFromBuffer(
                                         typeToStr(operand_type.type));
     }
     uint32_t index = AddNewOperand(operand_type);
-    THROW_ON_ERROR(ANeuralNetworksModel_setOperandValue(
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksModel_setOperandValue(
         dnn_model_->model_, index, buffer,
         Product(operand_type.dimensions) * element_size));
     shaper_.AddShape(name, operand_type.dimensions);
@@ -797,27 +762,28 @@ std::unique_ptr<Model> ModelBuilder::Compile(uint32_t preference) {
         }
     }
     THROW_ON_ERROR_WITH_NOTE(
-        ANeuralNetworksModel_identifyInputsAndOutputs(
+        nnapi_->ANeuralNetworksModel_identifyInputsAndOutputs(
             dnn_model_->model_, static_cast<uint32_t>(input_index_vec_.size()),
             &input_index_vec_[0],
             static_cast<uint32_t>(output_index_vec_.size()),
             &output_index_vec_[0]),
         "on identifyInputsAndOutputs");
 
-    THROW_ON_ERROR_WITH_NOTE(ANeuralNetworksModel_finish(dnn_model_->model_),
-                             "on model finish");
+    THROW_ON_ERROR_WITH_NOTE(
+        nnapi_->ANeuralNetworksModel_finish(dnn_model_->model_),
+        "on model finish");
 
     ;
-    THROW_ON_ERROR_WITH_NOTE(ANeuralNetworksCompilation_create(
+    THROW_ON_ERROR_WITH_NOTE(nnapi_->ANeuralNetworksCompilation_create(
                                  dnn_model_->model_, &dnn_model_->compilation_),
                              "on create");
 
-    THROW_ON_ERROR_WITH_NOTE(ANeuralNetworksCompilation_setPreference(
+    THROW_ON_ERROR_WITH_NOTE(nnapi_->ANeuralNetworksCompilation_setPreference(
                                  dnn_model_->compilation_, preference),
                              "on setPreference");
 
     THROW_ON_ERROR_WITH_NOTE(
-        ANeuralNetworksCompilation_finish(dnn_model_->compilation_),
+        nnapi_->ANeuralNetworksCompilation_finish(dnn_model_->compilation_),
         "on compilation finish");
 
     VLOG(5) << "Finishing.. Here are operands in the model:";
@@ -904,7 +870,7 @@ ModelBuilder::IndexSeq ModelBuilder::AddOperation(
     }
 
     THROW_ON_ERROR_WITH_NOTE(
-        ANeuralNetworksModel_addOperation(
+        nnapi_->ANeuralNetworksModel_addOperation(
             dnn_model_->model_, op, input_indexes.size(), &input_indexes[0],
             output_indexes.size(), &output_indexes[0]),
         "op = " + std::to_string(op));
@@ -914,7 +880,7 @@ ModelBuilder::IndexSeq ModelBuilder::AddOperation(
 
 void ModelBuilder::Prepare() {
     dnn_model_ = std::unique_ptr<Model>(new Model());
-    const auto ret = ANeuralNetworksModel_create(&dnn_model_->model_);
+    const auto ret = nnapi_->ANeuralNetworksModel_create(&dnn_model_->model_);
     if (ret == ANEURALNETWORKS_OUT_OF_MEMORY) {
         throw std::bad_alloc();
     }
@@ -922,8 +888,8 @@ void ModelBuilder::Prepare() {
 
 void ModelBuilder::SetMemory(int fd, size_t size, size_t offset) {
     ANeuralNetworksMemory *mem = nullptr;
-    THROW_ON_ERROR(
-        ANeuralNetworksMemory_createFromFd(size, PROT_READ, fd, offset, &mem));
+    THROW_ON_ERROR(nnapi_->ANeuralNetworksMemory_createFromFd(
+        size, PROT_READ, fd, offset, &mem));
     dnn_model_->memory_ = mem;
 }
 
@@ -938,10 +904,14 @@ ModelBuilder &ModelBuilder::AddOutput(const std::string &name) {
 }
 
 ModelBuilder &ModelBuilder::AllowFp16(const bool allowed) {
-    if (GetAndroidSdkVersion() >= __ANDROID_API_P__) {
-        ANeuralNetworksModel_relaxComputationFloat32toFloat16(
+    if (nnapi_->ANeuralNetworksModel_relaxComputationFloat32toFloat16 !=
+        nullptr) {
+        nnapi_->ANeuralNetworksModel_relaxComputationFloat32toFloat16(
             dnn_model_->model_, allowed);
     }
     return *this;
 }
+
+ModelBuilder::ModelBuilder() : nnapi_(NnApiImplementation()) {
+}
 }  // namespace dnn
diff --git a/dnnlibrary/NeuralNetworksWrapper.cpp b/dnnlibrary/NeuralNetworksWrapper.cpp
index 5638539..57be2c9 100644
--- a/dnnlibrary/NeuralNetworksWrapper.cpp
+++ b/dnnlibrary/NeuralNetworksWrapper.cpp
@@ -14,7 +14,7 @@ OperandType::OperandType(Type type, std::vector<uint32_t> d, float scale,
             dimensions = {1};
         }
     } else {
-        DNN_ASSERT(!isScalarType(type), typeToStr(type));
+        DNN_ASSERT(!isScalarType(type), typeToStr(type), " ", dimensions);
     }
     operandType = {
         .type = static_cast<int32_t>(type),
diff --git a/dnnlibrary/nnapi_helper.h b/dnnlibrary/nnapi_helper.h
index 0d07aaf..a85c2ec 100644
--- a/dnnlibrary/nnapi_helper.h
+++ b/dnnlibrary/nnapi_helper.h
@@ -3,7 +3,7 @@
 
 #include <string>
 
-#include <dnnlibrary/NeuralNetworksWrapper.h>
+#include <dnnlibrary/NeuralNetworksTypes.h>
 
 #define THROW_ON_ERROR(val)                                                   \
     {                                                                         \
diff --git a/dnnlibrary/nnapi_implementation.cc b/dnnlibrary/nnapi_implementation.cc
new file mode 100644
index 0000000..f5a4d8a
--- /dev/null
+++ b/dnnlibrary/nnapi_implementation.cc
@@ -0,0 +1,225 @@
+/* Copyright 2017 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+#include <dnnlibrary/nnapi_implementation.h>
+
+#include <dlfcn.h>
+#include <fcntl.h>
+#include <sys/mman.h>
+#include <sys/stat.h>
+#include <unistd.h>
+
+#include <cstdlib>
+
+#ifdef __ANDROID__
+#include <sys/system_properties.h>
+#endif  // __ANDROID__
+
+#define NNAPI_LOG(format, ...) fprintf(stderr, format "\n", __VA_ARGS__);
+
+#ifdef __ANDROID__
+int32_t GetAndroidSdkVersion() {
+  const char* sdkProp = "ro.build.version.sdk";
+  char sdkVersion[PROP_VALUE_MAX];
+  int length = __system_property_get(sdkProp, sdkVersion);
+  if (length != 0) {
+    int32_t result = 0;
+    for (int i = 0; i < length; ++i) {
+      int digit = sdkVersion[i] - '0';
+      if (digit < 0 || digit > 9) {
+        // Non-numeric SDK version, assume it's higher than expected;
+        return 0xffff;
+      }
+      result = result * 10 + digit;
+    }
+    // TODO(levp): remove once SDK gets updated to 29th level
+    // Upgrade SDK version for pre-release Q to be able to test functionality
+    // available from SDK level 29.
+    if (result == 28) {
+      char versionCodename[PROP_VALUE_MAX];
+      const char* versionCodenameProp = "ro.build.version.codename";
+      length = __system_property_get(versionCodenameProp, versionCodename);
+      if (length != 0) {
+        if (versionCodename[0] == 'Q') {
+          return 29;
+        }
+      }
+    }
+    return result;
+  }
+  return 0;
+}
+#endif  // __ANDROID__
+
+namespace {
+
+void* LoadFunction(void* handle, const char* name, bool optional) {
+  if (handle == nullptr) {
+    return nullptr;
+  }
+  void* fn = dlsym(handle, name);
+  if (fn == nullptr && !optional) {
+    NNAPI_LOG("nnapi error: unable to open function %s", name);
+  }
+  return fn;
+}
+
+#ifndef __ANDROID__
+// Add /dev/shm implementation of shared memory for non-Android platforms
+int ASharedMemory_create(const char* name, size_t size) {
+  int fd = shm_open(name, O_RDWR | O_CREAT, 0644);
+  if (fd < 0) {
+    return fd;
+  }
+  int result = ftruncate(fd, size);
+  if (result < 0) {
+    close(fd);
+    return -1;
+  }
+  return fd;
+}
+#endif  // __ANDROID__
+
+#define LOAD_FUNCTION(handle, name)         \
+  nnapi.name = reinterpret_cast<name##_fn>( \
+      LoadFunction(handle, #name, /*optional*/ false));
+
+#define LOAD_FUNCTION_OPTIONAL(handle, name) \
+  nnapi.name = reinterpret_cast<name##_fn>(  \
+      LoadFunction(handle, #name, /*optional*/ true));
+
+#define LOAD_FUNCTION_RENAME(handle, name, symbol) \
+  nnapi.name = reinterpret_cast<name##_fn>(        \
+      LoadFunction(handle, symbol, /*optional*/ false));
+
+const NnApi LoadNnApi() {
+  NnApi nnapi = {};
+  nnapi.android_sdk_version = 0;
+
+#ifdef __ANDROID__
+  nnapi.android_sdk_version = GetAndroidSdkVersion();
+  if (nnapi.android_sdk_version < 27) {
+    NNAPI_LOG("nnapi error: requires android sdk version to be at least %d",
+              27);
+    nnapi.nnapi_exists = false;
+    return nnapi;
+  }
+#endif  // __ANDROID__
+
+  void* libneuralnetworks = nullptr;
+  // TODO(b/123243014): change RTLD_LOCAL? Assumes there can be multiple
+  // instances of nn api RT
+  libneuralnetworks = dlopen("libneuralnetworks.so", RTLD_LAZY | RTLD_LOCAL);
+  if (libneuralnetworks == nullptr) {
+    NNAPI_LOG("nnapi error: unable to open library %s", "libneuralnetworks.so");
+  }
+
+  nnapi.nnapi_exists = libneuralnetworks != nullptr;
+
+  // API 27 (NN 1.0) methods.
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksMemory_createFromFd);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksMemory_free);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksModel_create);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksModel_free);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksModel_finish);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksModel_addOperand);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksModel_setOperandValue);
+  LOAD_FUNCTION_OPTIONAL(
+      libneuralnetworks,
+      ANeuralNetworksModel_setOperandSymmPerChannelQuantParams);
+  LOAD_FUNCTION(libneuralnetworks,
+                ANeuralNetworksModel_setOperandValueFromMemory);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksModel_addOperation);
+  LOAD_FUNCTION(libneuralnetworks,
+                ANeuralNetworksModel_identifyInputsAndOutputs);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksCompilation_create);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksCompilation_free);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksCompilation_setPreference);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksCompilation_finish);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksExecution_create);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksExecution_free);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksExecution_setInput);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksExecution_setInputFromMemory);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksExecution_setOutput);
+  LOAD_FUNCTION(libneuralnetworks,
+                ANeuralNetworksExecution_setOutputFromMemory);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksExecution_startCompute);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksEvent_wait);
+  LOAD_FUNCTION(libneuralnetworks, ANeuralNetworksEvent_free);
+
+  // ASharedMemory_create has different implementations in Android depending on
+  // the partition. Generally it can be loaded from libandroid.so but in vendor
+  // partition (e.g. if a HAL wants to use NNAPI) it is only accessible through
+  // libcutils.
+#ifdef __ANDROID__
+  void* libandroid = nullptr;
+  libandroid = dlopen("libandroid.so", RTLD_LAZY | RTLD_LOCAL);
+  if (libandroid != nullptr) {
+    LOAD_FUNCTION(libandroid, ASharedMemory_create);
+  } else {
+    void* cutils_handle = dlopen("libcutils.so", RTLD_LAZY | RTLD_LOCAL);
+    if (cutils_handle != nullptr) {
+      LOAD_FUNCTION_RENAME(cutils_handle, ASharedMemory_create,
+                           "ashmem_create_region");
+    } else {
+      NNAPI_LOG("nnapi error: unable to open neither libraries %s and %s",
+                "libandroid.so", "libcutils.so");
+    }
+  }
+#else
+  nnapi.ASharedMemory_create = ASharedMemory_create;
+#endif  // __ANDROID__
+
+  // API 28 (NN 1.1) methods.
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksModel_relaxComputationFloat32toFloat16);
+
+  // API 29 (NN 1.2) methods.
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworks_getDeviceCount);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworks_getDevice);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworksDevice_getName);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworksDevice_getVersion);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksDevice_getFeatureLevel);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworksDevice_getType);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksModel_getSupportedOperationsForDevices);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksCompilation_createForDevices);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksCompilation_setCaching);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworksExecution_compute);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksExecution_getOutputOperandRank);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksExecution_getOutputOperandDimensions);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworksBurst_create);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks, ANeuralNetworksBurst_free);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksExecution_burstCompute);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksMemory_createFromAHardwareBuffer);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksExecution_setMeasureTiming);
+  LOAD_FUNCTION_OPTIONAL(libneuralnetworks,
+                         ANeuralNetworksExecution_getDuration);
+  return nnapi;
+}
+
+}  // namespace
+
+const NnApi* NnApiImplementation() {
+  static const NnApi nnapi = LoadNnApi();
+  return &nnapi;
+}
diff --git a/include/dnnlibrary/Model.h b/include/dnnlibrary/Model.h
index 3b320b4..91761a2 100644
--- a/include/dnnlibrary/Model.h
+++ b/include/dnnlibrary/Model.h
@@ -18,12 +18,12 @@ class Model {
     friend class ModelBuilder;
 
    private:
-    ANeuralNetworksModel *model_;
-    ANeuralNetworksCompilation *compilation_;
-    ANeuralNetworksExecution *execution_;
-    ANeuralNetworksMemory *memory_;
-    unsigned char *data_;
-    size_t data_size_;
+    ANeuralNetworksModel *model_ = nullptr;
+    ANeuralNetworksCompilation *compilation_ = nullptr;
+    ANeuralNetworksExecution *execution_ = nullptr;
+    ANeuralNetworksMemory *memory_ = nullptr;
+    unsigned char *data_ = nullptr;
+    size_t data_size_ = 0;
     std::vector<std::unique_ptr<uint8_t[]>> uint8_buf_pointers_;
     std::vector<std::unique_ptr<int8_t[]>> int8_buf_pointers_;
     std::vector<std::unique_ptr<float[]>> float_buf_pointers_;
@@ -39,8 +39,9 @@ class Model {
                         const size_t elemsize);
     void PrepareForExecution();
     void PredictAfterSetInputBuffer();
-    bool prepared_for_exe_;
-    Model() = default;
+    bool prepared_for_exe_ = false;
+    const NnApi *nnapi_ = nullptr;
+    Model();
 
    public:
     template <typename T>
diff --git a/include/dnnlibrary/ModelBuilder.h b/include/dnnlibrary/ModelBuilder.h
index fd04699..2cdc92c 100644
--- a/include/dnnlibrary/ModelBuilder.h
+++ b/include/dnnlibrary/ModelBuilder.h
@@ -86,7 +86,11 @@ class ModelBuilder {
     android::nn::wrapper::OperandType GetOperandType(
         const QuantInfo &quant_info, const Shape &dims);
 
+
+    const NnApi* nnapi_ = nullptr;
+
    public:
+    ModelBuilder();
     enum class PoolingType { MAX_POOL, AVE_POOL };
 
     static const int32_t ACTIVATION_NONE = ANEURALNETWORKS_FUSED_NONE;
diff --git a/include/dnnlibrary/NeuralNetworksMock.h b/include/dnnlibrary/NeuralNetworksMock.h
deleted file mode 100644
index fe253cc..0000000
--- a/include/dnnlibrary/NeuralNetworksMock.h
+++ /dev/null
@@ -1,5820 +0,0 @@
-/*
- * Copyright (C) 2017 The Android Open Source Project
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *      http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-/**
- * @addtogroup NeuralNetworks
- * @{
- */
-/**
- * @file NeuralNetworks.h
- */
-#ifndef ANDROID_ML_NN_RUNTIME_NEURAL_NETWORKS_MOCK_H
-#define ANDROID_ML_NN_RUNTIME_NEURAL_NETWORKS_MOCK_H
-/******************************************************************
- *
- * IMPORTANT NOTICE:
- *
- *   This file is part of Android's set of stable system headers
- *   exposed by the Android NDK (Native Development Kit).
- *
- *   Third-party source AND binary code relies on the definitions
- *   here to be FROZEN ON ALL UPCOMING PLATFORM RELEASES.
- *
- *   - DO NOT MODIFY ENUMS (EXCEPT IF YOU ADD NEW 32-BIT VALUES)
- *   - DO NOT MODIFY CONSTANTS OR FUNCTIONAL MACROS
- *   - DO NOT CHANGE THE SIGNATURE OF FUNCTIONS IN ANY WAY
- *   - DO NOT CHANGE THE LAYOUT OR SIZE OF STRUCTURES
- */
-#include <android/hardware_buffer.h>
-#include <stddef.h>
-#include <stdint.h>
-#include <sys/cdefs.h>
-__BEGIN_DECLS
-/**
- * Operand types.
- *
- * The type of operands that can be added to a model.
- *
- * Although we define many types, most operators accept just a few
- * types. Most used are {@link ANEURALNETWORKS_TENSOR_FLOAT32},
- * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
- * and {@link ANEURALNETWORKS_INT32}.
- *
- * Available since API level 27.
- */
-typedef enum {
-    /** A 32 bit floating point scalar value. */
-    ANEURALNETWORKS_FLOAT32 = 0,
-    /** A signed 32 bit integer scalar value. */
-    ANEURALNETWORKS_INT32 = 1,
-    /** An unsigned 32 bit integer scalar value. */
-    ANEURALNETWORKS_UINT32 = 2,
-    /** A tensor of 32 bit floating point values. */
-    ANEURALNETWORKS_TENSOR_FLOAT32 = 3,
-    /** A tensor of 32 bit integer values. */
-    ANEURALNETWORKS_TENSOR_INT32 = 4,
-    /**
-     * A tensor of 8 bit unsigned integers that represent real numbers.
-     *
-     * Attached to this tensor are two numbers that be used to convert the
-     * 8 bit integer to the real value and vice versa. These two numbers are:
-     * - scale: a 32 bit floating point value greater than zero.
-     * - zeroPoint: a 32 bit integer, in range [0, 255].
-     *
-     * The formula is:
-     *   real_value = (integer_value - zeroPoint) * scale.
-     */
-    ANEURALNETWORKS_TENSOR_QUANT8_ASYMM = 5,
-    /**
-     * An 8 bit boolean scalar value.
-     *
-     * Values of this operand type are either true or false. A zero value
-     * represents false; any other value represents true.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_BOOL = 6,
-    /**
-     * A tensor of 16 bit signed integers that represent real numbers.
-     *
-     * Attached to this tensor is a number representing real value scale that is
-     * used to convert the 16 bit number to a real value in the following way:
-     * realValue = integerValue * scale.
-     *
-     * scale is a 32 bit floating point with value greater then zero.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TENSOR_QUANT16_SYMM = 7,
-    /**
-     * A tensor of IEEE 754 16 bit floating point values.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TENSOR_FLOAT16 = 8,
-    /**
-     * A tensor of 8 bit boolean values.
-     *
-     * Values of this operand type are either true or false. A zero value
-     * represents false; any other value represents true.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TENSOR_BOOL8 = 9,
-    /**
-     * An IEEE 754 16 bit floating point scalar value.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_FLOAT16 = 10,
-    /**
-     * A tensor of 8 bit signed integers that represent real numbers.
-     *
-     * This tensor is associated with additional fields that can
-     * be used to convert the 8 bit signed integer to the real value and vice versa.
-     * These fields are:
-     * - channelDim: a 32 bit unsigned integer indicating channel dimension.
-     * - scales: an array of positive 32 bit floating point values.
-     * The size of the scales array must be equal to dimensions[channelDim].
-     *
-     * {@link ANeuralNetworksModel_setOperandSymmPerChannelQuantParams} must be used
-     * to set the parameters for an Operand of this type.
-     *
-     * The channel dimension of this tensor must not be unknown (dimensions[channelDim] != 0).
-     *
-     * The formula is:
-     * realValue[..., C, ...] =
-     *     integerValue[..., C, ...] * scales[C]
-     * where C is an index in the Channel dimension.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL = 11,
-    /**
-     * A tensor of 16 bit unsigned integers that represent real numbers.
-     *
-     * Attached to this tensor are two numbers that can be used to convert the
-     * 16 bit integer to the real value and vice versa. These two numbers are:
-     * - scale: a 32 bit floating point value greater than zero.
-     * - zeroPoint: a 32 bit integer, in range [0, 65535].
-     *
-     * The formula is:
-     * real_value = (integer_value - zeroPoint) * scale.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TENSOR_QUANT16_ASYMM = 12,
-    /**
-     * A tensor of 8 bit signed integers that represent real numbers.
-     *
-     * Attached to this tensor is a number representing real value scale that is
-     * used to convert the 8 bit number to a real value in the following way:
-     * realValue = integerValue * scale.
-     *
-     * scale is a 32 bit floating point with value greater then zero.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TENSOR_QUANT8_SYMM = 13,
-} OperandCode;
-/**
- * Operation types.
- *
- * The type of operations that can be added to a model.
- *
- * Available since API level 27.
- */
-typedef enum {
-    // Operations below are available since API level 27.
-    /**
-     * Adds two tensors, element-wise.
-     *
-     * Takes two input tensors of identical {@link OperandCode} and compatible
-     * dimensions. The output is the sum of both input tensors, optionally
-     * modified by an activation function.
-     *
-     * Two dimensions are compatible when:
-     *     1. they are equal, or
-     *     2. one of them is 1
-     *
-     * The size of the output is the maximum size along each dimension of the
-     * input operands. It starts with the trailing dimensions, and works its
-     * way forward.
-     *
-     * Example:
-     *
-     *     input1.dimension = {4, 1, 2}
-     *     input2.dimension = {5, 4, 3, 1}
-     *     output.dimension = {5, 4, 3, 2}
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode}, and compatible dimensions
-     *      as input0.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     *
-     * Outputs:
-     * * 0: The sum, a tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_ADD = 0,
-    /**
-     * Performs a 2-D average pooling operation.
-     *
-     * The output dimensions are functions of the filter dimensions, stride, and
-     * padding.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[b, i, j, channel] =
-     *         sum_{di, dj}(
-     *             input[b, strides[1] * i + di, strides[2] * j + dj, channel]
-     *         ) / sum(1)
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Both explicit padding and implicit padding are supported.
-     *
-     * Inputs (explicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the left, in the ‘width’ dimension.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the right, in the ‘width’ dimension.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the top, in the ‘height’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the bottom, in the ‘height’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      width.
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      height.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 10: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *       Set to true to specify NCHW data layout for input0 and output0.
-     *       Available since API level 29.
-     *
-     * Inputs (implicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the implicit
-     *      padding scheme, has to be one of the
-     *      {@link PaddingCode} values.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      width.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      height.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 7: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, out_height, out_width, depth].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_AVERAGE_POOL_2D = 1,
-    /**
-     * Concatenates the input tensors along the given dimension.
-     *
-     * The input tensors must have identical {@link OperandCode} and the same
-     * dimensions except the dimension along the concatenation axis.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} (full support since API
-     *   level 29, see the input section)
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0 ~ n-1: The list of n input tensors, of shape
-     *            [D0, D1, ..., Daxis(i), ..., Dm].
-     *            Before API level 29, all input tensors of
-     *            {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *            must have the same scale and zeroPoint as the output tensor.
-     * * n: An {@link ANEURALNETWORKS_INT32} scalar, specifying the
-     *      concatenation axis.
-     *
-     * Outputs:
-     * * 0: The output, a tensor of the same {@link OperandCode} as the input
-     *      tensors. The output shape is [D0, D1, ..., sum(Daxis(i)), ..., Dm].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_CONCATENATION = 2,
-    /**
-     * Performs an 2-D convolution operation.
-     *
-     * The CONV_2D op sweeps a 2-D filter that can mix channels together over a
-     * batch of images, applying the filter to each window of each image of the
-     * appropriate size.
-     *
-     * The output dimensions are functions of the filter dimensions, stride, and
-     * padding.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[b, i, j, channel] =
-     *         sum_{di, dj, k} (
-     *             input[b, strides[1] * i + di, strides[2] * j + dj, k] *
-     *             filter[channel, di, dj, k]
-     *         ) + bias[channel]
-     *
-     * Supported tensor {@link OperandCode} configurations:
-     * * 32 bit Floating point :
-     * * * {@link ANEURALNETWORKS_TENSOR_FLOAT32} for input, filter, output, and bias.
-     *
-     * * Quantized:
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} for input, filter, and output.
-     * * * {@link ANEURALNETWORKS_TENSOR_INT32} for bias (with scale set to
-     * * * input.scale * filter.scale).
-     *
-     * Available since API level 29:
-     * * Quantized with symetric per channel quantization for the filter:
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} for input, and output.
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} for filter.
-     * * * {@link ANEURALNETWORKS_TENSOR_INT32} for bias (scale set to 0.0,
-     * * * each value scaling is separate and equal to input.scale * filter.scales[channel]).
-     *
-     * * 16 bit Floating point:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} for input, filter, output, and bias.
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Both explicit padding and implicit padding are supported.
-     *
-     * Inputs (explicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: A 4-D tensor, of shape
-     *      [depth_out, filter_height, filter_width, depth_in], specifying the
-     *      filter. For tensor of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} the channel
-     *      dimension (extraParams.channelQuant.channelDim) must be set to 0.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias must be of the same
-     *      type. For filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the bias should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint
-     *      of 0 and bias_scale == input_scale * filter_scale. For filter tensor
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}, the bias
-     *      should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of
-     *      0 and bias_scale of 0. The actual scale of each value 'i' is equal to
-     *      bias_scale[i] = input_scale * filter_scale[i].
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the left, in the ‘width’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the right, in the ‘width’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the top, in the ‘height’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the bottom, in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 10: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     * * 11: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for width. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on width dimension. If this input is set,
-     *      input 12 (dilation factor for height) must be specified as well.
-     *      Available since API level 29.
-     * * 12: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for height. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on height dimension. If this input is set,
-     *      input 11 (dilation factor for width) must be specified as well.
-     *      Available since API level 29.
-     *
-     * Inputs (implicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: A 4-D tensor, of shape
-     *      [depth_out, filter_height, filter_width, depth_in], specifying the
-     *      filter. For tensor of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} the channel
-     *      dimension (extraParams.channelQuant.channelDim) must be set to 0.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias must be of the same
-     *      type. For filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the bias should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint
-     *      of 0 and bias_scale == input_scale * filter_scale. For filter tensor
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}, the bias
-     *      should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of
-     *      0 and bias_scale of 0. The actual scale of each value 'i' is equal to
-     *      bias_scale[i] = input_scale * filter_scale[i].
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the implicit
-     *      padding scheme, has to be one of the
-     *      {@link PaddingCode} values.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 7: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     * * 8: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for width. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on width dimension. If this input is set,
-     *      input 9 (dilation factor for height) must be specified as well.
-     *      Available since API level 29.
-     * * 9: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for height. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on height dimension. If this input is set,
-     *      input 8 (dilation factor for width) must be specified as well.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, out_height, out_width, depth_out]. For output tensor of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the following condition
-     *      must be satisfied: output_scale > input_scale * filter_scale (for
-     *      filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}
-     *      this condition must be true for all filter scales).
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_CONV_2D = 3,
-    /**
-     * Performs a depthwise 2-D convolution operation.
-     *
-     * Given an input tensor of shape [batches, height, width, depth_in] and a
-     * filter tensor of shape [1, filter_height, filter_width, depth_out]
-     * containing depth_out convolutional filters of depth 1, DEPTHWISE_CONV
-     * applies a different filter to each input channel (expanding from 1
-     * channel to channel_multiplier channels for each), then concatenates the
-     * results together.
-     *
-     * The output has depth_out = depth_in * depth_multiplier channels.
-     * The output dimensions are functions of the filter dimensions, stride, and
-     * padding.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[b, i, j, k * channel_multiplier + q] =
-     *         sum_{di, dj} (
-     *             input[b, strides[1] * i + di, strides[2] * j + dj, k] *
-     *             filter[1, di, dj, k * channel_multiplier + q]
-     *         ) + bias[k * channel_multiplier + q]
-     *
-     * Supported tensor {@link OperandCode} configurations:
-     * * 32 bit Floating point :
-     * * * {@link ANEURALNETWORKS_TENSOR_FLOAT32} for input, filter, output, and bias.
-     *
-     * * Quantized:
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} for input, filter, and output.
-     * * * {@link ANEURALNETWORKS_TENSOR_INT32} for bias (with scale set to
-     * * * input.scale * filter.scale).
-     *
-     * Available since API level 29:
-     * * Quantized with symetric per channel quantization for the filter:
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} for input, and output.
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} for filter.
-     * * * {@link ANEURALNETWORKS_TENSOR_INT32} for bias (scale set to 0.0,
-     * * * each value scaling is separate and equal to input.scale * filter.scales[channel]).
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Both explicit padding and implicit padding are supported.
-     *
-     * Inputs (explicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: A 4-D tensor, of shape [1, filter_height, filter_width, depth_out],
-     *      specifying the filter. For tensor of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} the channel
-     *      dimension (extraParams.channelQuant.channelDim) must be set to 3.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias must be of the same
-     *      type. For filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the bias should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint
-     *      of 0 and bias_scale == input_scale * filter_scale. For filter tensor
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}, the bias
-     *      should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of
-     *      0 and bias_scale of 0. The actual scale of each value 'i' is equal to
-     *      bias_scale[i] = input_scale * filter_scale[i].
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the left, in the ‘width’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the right, in the ‘width’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the top, in the ‘height’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the bottom, in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, specifying the depthwise
-     *      multiplier.
-     * * 10: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *       {@link FuseCode} values. Specifies the activation to
-     *       invoke on the result.
-     * * 11: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *       Set to true to specify NCHW data layout for input0 and output0.
-     *       Available since API level 29.
-     * * 12: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for width. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on width dimension. If this input is set,
-     *      input 13 (dilation factor for height) must be specified as well.
-     *      Available since API level 29.
-     * * 13: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for height. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on height dimension. If this input is set,
-     *      input 12 (dilation factor for width) must be specified as well.
-     *      Available since API level 29.
-     *
-     * Inputs (implicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: A 4-D tensor, of shape [1, filter_height, filter_width, depth_out],
-     *      specifying the filter.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias must be of the same
-     *      type. For filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the bias should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint
-     *      of 0 and bias_scale == input_scale * filter_scale. For filter tensor
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}, the bias
-     *      should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of
-     *      0 and bias_scale of 0. The actual scale of each value 'i' is equal to
-     *      bias_scale[i] = input_scale * filter_scale[i].
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the implicit
-     *      padding scheme, has to be one of the
-     *      {@link PaddingCode} values.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the depthwise
-     *      multiplier.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 8: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     * * 9: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for width. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on width dimension. If this input is set,
-     *      input 10 (dilation factor for height) must be specified as well.
-     *      Available since API level 29.
-     * * 10: An optional {@link ANEURALNETWORKS_INT32} scalar, specifying the dilation
-     *      factor for height. Defaults to 1. If set to k > 1, there will be k-1 skipped
-     *      cells between each filter element on height dimension. If this input is set,
-     *      input 9 (dilation factor for width) must be specified as well.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, out_height, out_width, depth_out]. For output tensor of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the following condition
-     *      must be satisfied: output_scale > input_scale * filter_scale (for
-     *      filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}
-     *      this condition must be true for all filter scales).
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_DEPTHWISE_CONV_2D = 4,
-    /**
-     * Rearranges data from depth into blocks of spatial data.
-     *
-     * More specifically, this op outputs a copy of the input tensor where
-     * values from the depth dimension are moved in spatial blocks to the height
-     * and width dimensions. The value block_size indicates the input block size
-     * and how the data is moved.
-     *
-     * Chunks of data of size block_size * block_size from depth are rearranged
-     * into non-overlapping blocks of size block_size x block_size.
-     *
-     * The width of the output tensor is input_depth * block_size, whereas the
-     * height is input_height * block_size. The depth of the input tensor must
-     * be divisible by block_size * block_size
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the block_size.
-     *      block_size must be >=1 and block_size * block_size must be a divisor
-     *      of the input depth.
-     * * 2: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape [batch, height*block_size,
-     *      width*block_size, depth/(block_size*block_size)].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_DEPTH_TO_SPACE = 5,
-    /**
-     * Dequantizes the input tensor.
-     *
-     * The formula is:
-     *
-     *     output = (input - zeroPoint) * scale.
-     *
-     * Supported input tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} (since API level 29)
-     *
-     * Supported output tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}.
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: A tensor with the same shape as input0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_DEQUANTIZE = 6,
-    /**
-     * Looks up sub-tensors in the input tensor.
-     *
-     * This operator takes for input a tensor of values (Values) and
-     * a one-dimensional tensor of selection indices (Lookups).
-     * The output tensor is the concatenation of sub-tensors of Values as
-     * selected by Lookups.
-     *
-     * Think of Values as being sliced along its first dimension:
-     * The entries in Lookups select which slices are concatenated together
-     * to create the output tensor.
-     *
-     * For example, if Values has shape of [40, 200, 300] and
-     * Lookups has shape of [3], all three values found in Lookups are
-     * expected to be between 0 and 39. The resulting tensor must
-     * have shape of [3, 200, 300].
-     *
-     * If a value in Lookups is out of bounds, the operation must fail
-     * and an error must be reported.
-     *
-     * Supported value tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported value tensor rank: from 2
-     *
-     * Inputs:
-     * * 0: Lookups. A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}.
-     *      The values are indices into the first dimension of Values.
-     * * 1: Values. An n-D tensor, where n >= 2, from which sub-tensors are
-     *      extracted.
-     *
-     * Output:
-     * * 0: A n-D tensor with the same rank and shape as the Values
-     *      tensor, except for the first dimension which has the same size
-     *      as Lookups' only dimension.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_EMBEDDING_LOOKUP = 7,
-    /**
-     * Computes element-wise floor() on the input tensor.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor, of the same {@link OperandCode} and dimensions as
-     *      the input tensor.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_FLOOR = 8,
-    /**
-     * Denotes a fully (densely) connected layer, which connects all elements
-     * in the input tensor with each element in the output tensor.
-     *
-     * This layer implements the operation:
-     *
-     *     outputs = activation(inputs * weights’ + bias)
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4.
-     *
-     * Inputs:
-     * * 0: A tensor of at least rank 2, specifying the input. If rank is
-     *      greater than 2, then it gets flattened to a 2-D Tensor. The
-     *      (flattened) 2-D Tensor is reshaped (if necessary) to
-     *      [batch_size, input_size], where "input_size" corresponds to the
-     *      number of inputs to the layer, matching the second dimension of
-     *      weights, and "batch_size" is calculated by dividing the number of
-     *      elements by "input_size".
-     * * 1: A 2-D tensor, specifying the weights, of shape
-     *      [num_units, input_size], where "num_units" corresponds to the number
-     *      of output nodes.
-     * * 2: A 1-D tensor, of shape [num_units], specifying the bias. For input
-     *      tensor of {@link ANEURALNETWORKS_TENSOR_FLOAT32}, the bias should
-     *      also be of {@link ANEURALNETWORKS_TENSOR_FLOAT32}. For input tensor
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the bias should be
-     *      of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of 0 and
-     *      bias_scale == input_scale * filter_scale.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     *
-     * Outputs:
-     * * 0: The output tensor, of shape [batch_size, num_units]. For output
-     *      tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the following
-     *      condition must be satisfied:
-     *      output_scale > input_scale * filter_scale.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_FULLY_CONNECTED = 9,
-    /**
-     * Looks up sub-tensors in the input tensor using a key-value map.
-     *
-     * This operator takes for input a tensor of values (Values),
-     * a one-dimensional tensor of selection values (Lookups) and
-     * a one-dimensional tensor that maps these values to Values
-     * indexes. The output tensor is the concatenation of sub-tensors of
-     * Values as selected by Lookups via Keys.
-     *
-     * Think of Values as being sliced along its outer-most dimension.
-     * The output is a concatenation of selected slices, with one slice
-     * for each entry of Lookups. The slice selected is the one at the
-     * same index as the Maps entry that matches the value in Lookups.
-     *
-     * For a hit, the corresponding sub-tensor of Values is included
-     * in the Output tensor. For a miss, the corresponding sub-tensor in
-     * Output must have zero values.
-     *
-     * For example, if Values has shape of [40, 200, 300],
-     * Keys should have a shape of [40]. If Lookups tensor has shape
-     * of [3], three slices are being concatenated, so the resulting tensor
-     * must have the shape of [3, 200, 300]. If the first entry in Lookups
-     * has the value 123456, that value must be located in Keys tensor.
-     * If the sixth entry of Keys contains 123456, the sixth slice of Values
-     * must be selected. If no entry in Keys has 123456, a slice of zeroes
-     * must be concatenated.
-     *
-     * Supported value tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported value tensor rank: from 2
-     *
-     * Inputs:
-     * * 0: Lookups. A 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor with
-     *      shape [ k ].
-     * * 1: Keys. A 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor with shape
-     *      [ n ]; Keys and Values pair represent a map, i.e., the ith element
-     *      in Keys (Keys[i]) is the key to select the ith sub-tensor in Values
-     *      (Values[i]), where 0 <= i <= n-1. Keys tensor *MUST* be sorted in
-     *      ascending order.
-     * * 2: Values. A tensor with shape of [ n, … ]; i.e., the first dimension
-     *      must be n.
-     *
-     * Outputs:
-     * * 0: Output. A tensor with shape [ k …].
-     * * 1: Hits. A boolean tensor with shape [ k ] indicates whether the lookup
-     *      hits (True) or not (False).
-     *      Stored as {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} with offset 0
-     *      and scale 1.0f.
-     *      A non-zero byte represents True, a hit. A zero indicates otherwise.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_HASHTABLE_LOOKUP = 10,
-    /**
-     * Applies L2 normalization along the depth dimension.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[batch, row, col, channel] =
-     *         input[batch, row, col, channel] /
-     *         sqrt(sum_{c} pow(input[batch, row, col, c], 2))
-     *
-     * For input tensor with rank less than 4, independently normalizes each
-     * 1-D slice along dimension dim.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: up to 4
-     * Tensors with rank less than 4 are only supported since API level 29.
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be normalized.
-     * * 1: An optional {@link ANEURALNETWORKS_INT32} scalar, default to -1,
-     *      specifying the dimension normalization would be performed on.
-     *      Negative index is used to specify axis from the end (e.g. -1 for
-     *      the last axis). Must be in the range [-n, n).
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} and same shape as input0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_L2_NORMALIZATION = 11,
-    /**
-     * Performs an 2-D L2 pooling operation.
-     *
-     * The output dimensions are functions of the filter dimensions, stride, and
-     * padding.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[b, i, j, c] =
-     *         sqrt(sum_{di, dj} pow(input[b, strides[1] * i + di, strides[2] * j + dj, c], 2) /
-     *              sum(1))
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Both explicit padding and implicit padding are supported.
-     *
-     * Inputs (explicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the left, in the ‘width’ dimension.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the right, in the ‘width’ dimension.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the top, in the ‘height’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the bottom, in the ‘height’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      width.
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      height.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 10: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *       Set to true to specify NCHW data layout for input0 and output0.
-     *       Available since API level 29.
-     *
-     * Inputs (implicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the implicit
-     *      padding scheme, has to be one of the
-     *      {@link PaddingCode} values.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      width.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      height.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 7: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, out_height, out_width, depth].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_L2_POOL_2D = 12,
-    /**
-     * Applies Local Response Normalization along the depth dimension.
-     *
-     * The 4-D input tensor is treated as a 3-D array of 1-D vectors (along the
-     * last dimension), and each vector is normalized independently. Within a
-     * given vector, each component is divided by the weighted, squared sum of
-     * inputs within depth_radius.
-     *
-     * The output is calculated using this formula:
-     *
-     *     sqr_sum[a, b, c, d] = sum(
-     *         pow(input[a, b, c, d - depth_radius : d + depth_radius + 1], 2))
-     *     output = input / pow((bias + alpha * sqr_sum), beta)
-     *
-     * For input tensor with rank less than 4, independently normalizes each
-     * 1-D slice along specified dimension.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: up to 4
-     * Tensors with rank less than 4 are only supported since API level 29.
-     *
-     * Inputs:
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the radius of
-     *      the normalization window.
-     * * 2: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the bias, must
-     *      not be zero.
-     * * 3: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the scale
-     *      factor, alpha.
-     * * 4: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the exponent,
-     *      beta.
-     * * 5: An optional {@link ANEURALNETWORKS_INT32} scalar, default to -1,
-     *      specifying the dimension normalization would be performed on.
-     *      Negative index is used to specify axis from the end (e.g. -1 for
-     *      the last axis). Must be in the range [-n, n).
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_LOCAL_RESPONSE_NORMALIZATION = 13,
-    /**
-     * Computes sigmoid activation on the input tensor element-wise.
-     *
-     * The output is calculated using this formula:
-     *
-     *     output = 1 / (1 + exp(-input))
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4.
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the input.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *      For {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the scale must be 1.f / 256 and the zeroPoint must be 0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_LOGISTIC = 14,
-    /**
-     * Projects an input to a bit vector via locality senstive hashing.
-     *
-     * Supported input tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported input tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: Hash functions. Dim.size == 2, DataType: Float.
-     *      Tensor[0].Dim[0]: Number of hash functions.
-     *      Tensor[0].Dim[1]: Number of projected output bits generated by each
-     *      hash function.
-     *      If the projection type is Sparse:
-     *      Tensor[0].Dim[1] + ceil(log2(Tensor[0].Dim[0])) <= 32
-     *
-     * * 1: Input. Dim.size >= 1, no restriction on DataType.
-     * * 2: Weight. Optional. Dim.size == 1, DataType: Float.
-     *      If not set, each input element is considered to have the same weight
-     *      of 1.0.
-     *      Tensor[1].Dim[0] == Tensor[2].Dim[0]
-     * * 3: Type:
-     *        Sparse:
-     *          Value LSHProjectionType_SPARSE(=3) (since API level 29).
-     *          Computed bit vector is considered to be sparse.
-     *          Each output element is an int32 made up of multiple bits
-     *          computed from hash functions.
-     *
-     *          NOTE: To avoid collisions across hash functions, an offset value
-     *          of k * (1 << Tensor[0].Dim[1]) will be added to each signature,
-     *          where k is the index of the hash function.
-     *
-     *          Value LSHProjectionType_SPARSE_DEPRECATED(=1).
-     *          Legacy behavior that does not include the offset value.
-     *
-     *        Dense:
-     *          Value LSHProjectionType_DENSE(=2).
-     *          Computed bit vector is considered to be dense. Each output
-     *          element represents a bit and can take the value of either
-     *          0 or 1.
-     *
-     * Outputs:
-     * * 0: If the projection type is Sparse:
-     *      Output.Dim == { Tensor[0].Dim[0] }
-     *      A tensor of int32 that represents hash signatures,
-     *
-     *      If the projection type is Dense:
-     *      Output.Dim == { Tensor[0].Dim[0] * Tensor[0].Dim[1] }
-     *      A flattened tensor that represents projected bit vectors.
-     *
-     * Available since API level 27.
-     * The offset value for sparse projections was added in API level 29.
-     */
-    ANEURALNETWORKS_LSH_PROJECTION = 15,
-    /**
-     * Performs a single time step in a Long Short-Term Memory (LSTM) layer
-     *
-     * The LSTM operation is described by the following equations.
-     *
-     * \f{eqnarray*}{
-     * i_t =& \sigma(W_{xi}x_t+W_{hi}h_{t-1}+W_{ci}C_{t-1}+b_i) & \\
-     * f_t =& \sigma(W_{xf}x_t+W_{hf}h_{t-1}+W_{cf}C_{t-1}+b_f) & \\
-     * C_t =& clip(f_t \odot C_{t-1} + i_t \odot
-     *        g(W_{xc}x_t+W_{hc}h_{t-1}+b_c),\ t_{cell}) & \\
-     * o_t =& \sigma(W_{xo}x_t+W_{ho}h_{t-1}+W_{co}C_t+b_o) & \\
-     *      & & \\
-     *      & clip(W_{proj}(o_t \odot g(C_t))+b_{proj},\ t_{proj})
-     *      & if\ there\ is\ a\ projection; \\
-     * h_t =& & \\
-     *      & o_t \odot g(C_t) & otherwise. \\
-     * \f}
-     * Where:
-     * * \f$x_t\f$ is the input,
-     * * \f$i_t\f$ is the input gate,
-     * * \f$f_t\f$ is the forget gate,
-     * * \f$C_t\f$ is the cell state,
-     * * \f$o_t\f$ is the output,
-     * * \f$h_t\f$ is the output state,
-     * * \f$\sigma\f$ is the logistic sigmoid function,
-     * * \f$g\f$ is the cell input and cell output activation function, usually
-     *   \f$tahn\f$,
-     * * \f$W_{xi}\f$ is the input-to-input weight matrix,
-     * * \f$W_{hi}\f$ is the recurrent to input weight matrix,
-     * * \f$W_{ci}\f$ is the cell-to-input weight matrix,
-     * * \f$b_i\f$ is the input gate bias,
-     * * \f$W_{xf}\f$ is the input-to-forget weight matrix,
-     * * \f$W_{hf}\f$ is the recurrent-to-forget weight matrix,
-     * * \f$W_{cf}\f$ is the cell-to-forget weight matrix,
-     * * \f$b_f\f$ is the forget gate bias,
-     * * \f$W_{xc}\f$ is the input-to-cell weight matrix,
-     * * \f$W_{hc}\f$ is the recurrent-to-cell weight matrix,
-     * * \f$b_c\f$ is the cell bias,
-     * * \f$W_{xo}\f$ is the input-to-output weight matrix,
-     * * \f$W_{ho}\f$ is the recurrent-to-output weight matrix,
-     * * \f$W_{co}\f$ is the cell-to-output weight matrix,
-     * * \f$b_o\f$ is the output gate bias,
-     * * \f$W_{proj}\f$ is the projection weight matrix,
-     * * \f$b_{proj}\f$ is the projection bias,
-     * * \f$t_{cell}\f$ is the threshold for clipping the cell state, and
-     * * \f$t_{proj}\f$ is the threshold for clipping the projected output.
-     * * \f$\odot\f$ is the
-     *   <a href="https://en.wikipedia.org/wiki/Hadamard_product_(matrices)">
-     *   Hadamard product</a> that takes two matrices and produces another
-     *   matrix, each element of which is the product of the corresponding
-     *   elements of the input matrices.
-     *
-     * Since API level 29 LSTM supports layer normalization.
-     * In case layer normalization is used, the inputs to internal activation
-     * functions (sigmoid and \f$g\f$) are normalized, rescaled and recentered
-     * following an approach from section 3.1 from
-     * https://arxiv.org/pdf/1607.06450.pdf
-     *
-     * The operation has the following independently optional inputs:
-     * * The input-to-input weights (\f$W_{xi}\f$), recurrent-to-input weights
-     *   (\f$W_{hi}\f$), cell-to-input (\f$W_{ci}\f$) weights, and input gate
-     *   bias (\f$b_i\f$) either all have values, or none of them have values
-     *   (i.e., all set to null). If they have no values, coupling of input and
-     *   forget gates (CIFG) is used, in which case the input gate (\f$i_t\f$)
-     *   is calculated using the following equation instead.
-     *   \f{eqnarray*}{
-     *   i_t = 1 - f_t
-     *   \f}
-     * * The cell-to-forget weights (\f$W_{cf}\f$) and cell-to-output weights
-     *   (\f$W_{co}\f$) either both have values or neither of them have values.
-     *   If they have values, the peephole optimization is used. Additionally,
-     *   if CIFG is not used, cell-to-input weights (\f$W_{ci}\f$) is also
-     *   required to have values for peephole optimization.
-     * * The projection weights (\f$W_{proj}\f$) is required only for the
-     *   recurrent projection layer, and should otherwise have no value.
-     * * The projection bias (\f$b_{proj}\f$) may (but not required to) have a
-     *   value if the recurrent projection layer exists, and should otherwise
-     *   have no value.
-     * * (API level >= 29) The four layer normalization weights either all have
-     *   values or none of them have values. Layer normalization is used when
-     *   values are present.
-     *
-     * References:
-     *
-     * The default non-peephole non-CIFG implementation is based on:
-     * http://www.bioinf.jku.at/publications/older/2604.pdf
-     * S. Hochreiter and J. Schmidhuber. "Long Short-Term Memory". Neural
-     * Computation, 9(8):1735-1780, 1997.
-     *
-     * The peephole implementation and projection layer is based on:
-     * https://research.google.com/pubs/archive/43905.pdf
-     * Hasim Sak, Andrew Senior, and Francoise Beaufays. "Long short-term memory
-     * recurrent neural network architectures for large scale acoustic
-     * modeling." INTERSPEECH, 2014.
-     * (However, the concept of peephole optimization was introduced in work
-     * prior to this paper.)
-     *
-     * The coupling of input and forget gate (CIFG) is based on:
-     * http://arxiv.org/pdf/1503.04069.pdf
-     * Greff et al. "LSTM: A Search Space Odyssey"
-     *
-     * The layer normalization is based on:
-     * https://arxiv.org/pdf/1607.06450.pdf
-     * Jimmy Ba et al. "Layer Normalization"
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * All input and output tensors must be of the same type.
-     *
-     * Inputs:
-     * * 0: The input (\f$x_t\f$).
-     *      A 2-D tensor of shape [batch_size, input_size], where “batch_size”
-     *      corresponds to the batching dimension, and “input_size” is the size
-     *      of the input.
-     * * 1: The input-to-input weights (\f$W_{xi}\f$). Optional.
-     *      A 2-D tensor of shape [num_units, input_size], where “num_units”
-     *      corresponds to the number of cell units.
-     * * 2: The input-to-forget weights (\f$W_{xf}\f$).
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 3: The input-to-cell weights (\f$W_{xc}\f$).
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 4: The input-to-output weights (\f$W_{xo}\f$).
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 5: The recurrent-to-input weights (\f$W_{hi}\f$). Optional.
-     *      A 2-D tensor of shape [num_units, output_size], where “output_size”
-     *      corresponds to either the number of cell units (i.e., “num_units”),
-     *      or the second dimension of the “projection_weights”, if defined.
-     * * 6: The recurrent-to-forget weights (\f$W_{hf}\f$).
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 7: The recurrent-to-cell weights (\f$W_{hc}\f$).
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 8: The recurrent-to-output weights (\f$W_{ho}\f$).
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 9: The cell-to-input weights (\f$W_{ci}\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 10:The cell-to-forget weights (\f$W_{cf}\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 11:The cell-to-output weights (\f$W_{co}\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 12:The input gate bias (\f$b_i\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 13:The forget gate bias (\f$b_f\f$).
-     *      A 1-D tensor of shape [num_units].
-     * * 14:The cell bias (\f$b_c\f$).
-     *      A 1-D tensor of shape [num_units].
-     * * 15:The output gate bias (\f$b_o\f$).
-     *      A 1-D tensor of shape [num_units].
-     * * 16:The projection weights (\f$W_{proj}\f$). Optional.
-     *      A 2-D tensor of shape [output_size, num_units].
-     * * 17:The projection bias (\f$b_{proj}\f$). Optional.
-     *      A 1-D tensor of shape [output_size].
-     * * 18:The output state (in) (\f$h_{t-1}\f$).
-     *      A 2-D tensor of shape [batch_size, output_size].
-     * * 19:The cell state (in) (\f$C_{t-1}\f$).
-     *      A 2-D tensor of shape [batch_size, num_units].
-     * * 20:The activation function (\f$g\f$).
-     *      A value indicating the activation function:
-     *      <ul>
-     *      <li>0: None;
-     *      <li>1: Relu;
-     *      <li>3: Relu6;
-     *      <li>4: Tanh;
-     *      <li>6: Sigmoid.
-     *      </ul>
-     * * 21:The clipping threshold (\f$t_{cell}\f$) for the cell state, such
-     *      that values are bound within [-cell_clip, cell_clip]. If set to 0.0
-     *      then clipping is disabled.
-     *      Until API level 29 this scalar must be of type {@link
-     *      ANEURALNETWORKS_FLOAT32}. Since API level 29, if all the input
-     *      tensors have type {@link ANEURALNETWORKS_TENSOR_FLOAT32}, this
-     *      scalar must be of the type {@link ANEURALNETWORKS_FLOAT32},
-     *      otherwise if all the input tensors have the type {@link
-     *      ANEURALNETWORKS_TENSOR_FLOAT16}, this scalar must be of type {@link
-     *      ANEURALNETWORKS_FLOAT16}.
-     * * 22:The clipping threshold (\f$t_{proj}\f$) for the output from the
-     *      projection layer, such that values are bound within
-     *      [-proj_clip, proj_clip]. If set to 0.0 then clipping is disabled.
-     *      Until API level 29 this scalar must be of type {@link
-     *      ANEURALNETWORKS_FLOAT32}. Since API level 29, if all the input
-     *      tensors have type {@link ANEURALNETWORKS_TENSOR_FLOAT32}, this
-     *      scalar must be of the type {@link ANEURALNETWORKS_FLOAT32},
-     *      otherwise if all the input tensors have the type {@link
-     *      ANEURALNETWORKS_TENSOR_FLOAT16}, this scalar must be of type {@link
-     *      ANEURALNETWORKS_FLOAT16}.
-     * Since API level 29 there are additional inputs to this op:
-     * * 23:The input layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at input gate.
-     * * 24:The forget layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at forget gate.
-     * * 25:The cell layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at cell gate.
-     * * 26:The output layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at output gate.
-     *
-     * Outputs:
-     * * 0: The scratch buffer.
-     *      A 2-D tensor of shape [batch_size, num_units * 3] with CIFG, or
-     *      [batch_size, num_units * 4] without CIFG.
-     * * 1: The output state (out) (\f$h_t\f$).
-     *      A 2-D tensor of shape [batch_size, output_size].
-     * * 2: The cell state (out) (\f$C_t\f$).
-     *      A 2-D tensor of shape [batch_size, num_units].
-     * * 3: The output (\f$o_t\f$).
-     *      A 2-D tensor of shape [batch_size, output_size]. This is effectively
-     *      the same as the current “output state (out)” value.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_LSTM = 16,
-    /**
-     * Performs an 2-D max pooling operation.
-     *
-     * The output dimensions are functions of the filter dimensions, stride, and
-     * padding.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[b, i, j, channel] =
-     *         max_{di, dj} (
-     *             input[b, strides[1] * i + di, strides[2] * j + dj, channel]
-     *         )
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Both explicit padding and implicit padding are supported.
-     *
-     * Inputs (explicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the left, in the ‘width’ dimension.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the right, in the ‘width’ dimension.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the top, in the ‘height’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the bottom, in the ‘height’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      width.
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      height.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 10: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *       Set to true to specify NCHW data layout for input0 and output0.
-     *       Available since API level 29.
-     *
-     * Inputs (implicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the implicit
-     *      padding scheme, has to be one of the
-     *      {@link PaddingCode} values.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      width.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the filter
-     *      height.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 7: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, out_height, out_width, depth].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_MAX_POOL_2D = 17,
-    /**
-     * Multiplies two tensors, element-wise.
-     *
-     * Takes two input tensors of identical {@link OperandCode} and compatible
-     * dimensions. The output is the product of both input tensors, optionally
-     * modified by an activation function.
-     *
-     * Two dimensions are compatible when:
-     *     1. they are equal, or
-     *     2. one of them is 1
-     *
-     * The size of the resulting output is the maximum size along each dimension
-     * of the input operands. It starts with the trailing dimensions, and works
-     * its way forward.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode}, and compatible dimensions
-     *      as input0.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     *
-     * Outputs:
-     * * 0: The product, a tensor of the same {@link OperandCode} as input0.
-     *      For output tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the following condition must be satisfied:
-     *      output_scale > input1_scale * input2_scale.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_MUL = 18,
-    /**
-     * Computes rectified linear activation on the input tensor element-wise.
-     *
-     * The output is calculated using this formula:
-     *
-     *     output = max(0, input)
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4.
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the input.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_RELU = 19,
-    /**
-     * Computes rectified linear 1 activation on the input tensor element-wise.
-     *
-     * The output is calculated using this formula:
-     *
-     *     output = min(1.f, max(-1.f, input))
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4.
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the input.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_RELU1 = 20,
-    /**
-     * Computes rectified linear 6 activation on the input tensor element-wise.
-     *
-     * The output is calculated using this formula:
-     *
-     *     output = min(6, max(0, input))
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4.
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the input.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_RELU6 = 21,
-    /**
-     * Reshapes a tensor.
-     *
-     * Given tensor, this operation returns a tensor that has the same values as
-     * tensor, but with a newly specified shape.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4.
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the tensor to be reshaped.
-     * * 1: A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}, defining the
-     *      shape of the output tensor. The number of elements implied by shape
-     *      must be the same as the number of elements in the input tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor, of shape specified by the input shape.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_RESHAPE = 22,
-    /**
-     * Resizes images to given size using the bilinear interpretation.
-     *
-     * Resized images must be distorted if their output aspect ratio is not the
-     * same as input aspect ratio. The corner pixels of output may not be the
-     * same as corner pixels of input.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth], specifying
-     *      the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the output
-     *      height of the output tensor.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the output
-     *      width of the output tensor.
-     * * 3: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, new_height, new_width, depth].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_RESIZE_BILINEAR = 23,
-    /**
-     * A basic recurrent neural network layer.
-     *
-     * This layer implements the operation:
-     * outputs = state = activation(inputs * input_weights +
-     *                              state * recurrent_weights + bias)
-     *
-     * Where:
-     * * “input_weights” is a weight matrix that multiplies the inputs;
-     * * “recurrent_weights” is a weight matrix that multiplies the current
-     *    “state” which itself is the output from the previous time step
-     *    computation;
-     * * “bias” is a bias vector (added to each output vector in the batch);
-     * * “activation” is the function passed as the “fused_activation_function”
-     *   argument (if not “NONE”).
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * The input tensors must all be the same type.
-     *
-     * Inputs:
-     * * 0: input.
-     *      A 2-D tensor of shape [batch_size, input_size], where “batch_size”
-     *      corresponds to the batching dimension, and “input_size” is the size
-     *      of the input.
-     * * 1: weights.
-     *      A 2-D tensor of shape [num_units, input_size], where “num_units”
-     *      corresponds to the number of units.
-     * * 2: recurrent_weights.
-     *      A 2-D tensor of shape [num_units, num_units], with columns
-     *      corresponding to the weights from each unit.
-     * * 3: bias.
-     *      A 1-D tensor of shape [num_units].
-     * * 4: hidden state (in).
-     *      A 2-D tensor of shape [batch_size, num_units].
-     * * 5: fused_activation_function.
-     *      An optional {@link FuseCode} value indicating the
-     *      activation function. If “NONE” is specified then it results in a
-     *      linear activation.
-     *
-     * Outputs:
-     * * 0: hidden state (out).
-     *      A 2-D tensor of shape [batch_size, num_units].
-     *
-     * * 1: output.
-     *      A 2-D tensor of shape [batch_size, num_units]. This is effectively
-     *      the same as the current state value.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_RNN = 24,
-    /**
-     * Computes the softmax activation on the input tensor element-wise, per
-     * batch, by normalizing the input vector so the maximum coefficient is
-     * zero.
-     *
-     * The output is calculated using this formula:
-     *
-     *     output[batch, i] =
-     *         exp((input[batch, i] - max(input[batch, :])) * beta) /
-     *         sum_{k}{exp((input[batch, k] - max(input[batch, :])) * beta)}
-     *
-     * For input tensor with rank other than 2, the activation will be applied
-     * independently on each 1-D slice along specified dimension.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4.
-     * Tensors with rank other than 2 or 4 are only supported since API level 29.
-     *
-     * Inputs:
-     * * 0: A 2-D or 4-D tensor, specifying the tensor to be reshaped.
-     * * 1: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the positive
-     *      scaling factor for the exponent, beta.
-     * * 2: An optional {@link ANEURALNETWORKS_INT32} scalar, default to -1,
-     *      specifying the dimension the activation would be performed on.
-     *      Negative index is used to specify axis from the end (e.g. -1 for
-     *      the last axis). Must be in the range [-n, n).
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *      For {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the scale must be 1.f / 256 and the zeroPoint must be 0.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_SOFTMAX = 25,
-    /**
-     * Rearranges blocks of spatial data, into depth.
-     *
-     * More specifically, this op outputs a copy of the input tensor where
-     * values from the height and width dimensions are moved to the depth
-     * dimension. The value block_size indicates the input block size and how
-     * the data is moved.
-     *
-     * Chunks of data of size block_size * block_size from depth are rearranged
-     * into non-overlapping blocks of size block_size x block_size.
-     *
-     * The depth of the output tensor is input_depth * block_size * block_size.
-     * The input tensor's height and width must be divisible by block_size.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the block_size.
-     *      block_size must be >=1 and block_size must be a divisor of both the
-     *      input height and width.
-     * * 2: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape [batches, height/block_size,
-     *      width/block_size, depth_in*block_size*block_size].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_SPACE_TO_DEPTH = 26,
-    /**
-     * SVDF op is a kind of stateful layer derived from the notion that a
-     * densely connected layer that's processing a sequence of input frames can
-     * be approximated by using a singular value decomposition of each of its
-     * nodes. The implementation is based on:
-     *
-     * https://research.google.com/pubs/archive/43813.pdf
-     *
-     * P. Nakkiran, R. Alvarez, R. Prabhavalkar, C. Parada.
-     * “Compressing Deep Neural Networks using a Rank-Constrained Topology”.
-     * INTERSPEECH, 2015.
-     *
-     * It processes the incoming input using a 2-stage filtering mechanism:
-     * * stage 1 performs filtering on the "features" dimension, whose outputs
-     *   get pushed into a memory of fixed-size memory_size.
-     * * stage 2 performs filtering on the "time" dimension of the memory_size
-     *   memoized outputs of stage 1.
-     *
-     * Specifically, for rank 1, this layer implements the operation:
-     *
-     *     memory = push(conv1d(inputs, weights_feature, feature_dim,
-     *                          "ANEURALNETWORKS_PADDING_VALID"));
-     *     outputs = activation(memory * weights_time + bias);
-     *
-     * Where:
-     * * “weights_feature” is a weights matrix that processes the inputs (by
-     *   convolving the input with every “feature filter”), and whose outputs
-     *   get pushed, stacked in order, into the fixed-size “memory” (the oldest
-     *   entry gets dropped);
-     * * “weights_time” is a weights matrix that processes the “memory” (by a
-     *   batched matrix multiplication on the num_units);
-     * * “bias” is an optional bias vector (added to each output vector in the
-     *   batch); and
-     * * “activation” is the function passed as the “fused_activation_function”
-     *   argument (if not “NONE”).
-     *
-     * Each rank adds a dimension to the weights matrices by means of stacking
-     * the filters.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * All input tensors must be the same type.
-     *
-     * Inputs:
-     * * 0: input.
-     *      A 2-D tensor of shape [batch_size, input_size], where “batch_size”
-     *      corresponds to the batching dimension, and “input_size” is the size
-     *      of the input.
-     * * 1: weights_feature.
-     *      A 2-D tensor of shape [num_units, input_size], where “num_units”
-     *      corresponds to the number of units.
-     * * 2: weights_time.
-     *      A 2-D tensor of shape [num_units, memory_size], where “memory_size”
-     *      corresponds to the fixed-size of the memory.
-     * * 3: bias.
-     *      An optional 1-D tensor of shape [num_units].
-     * * 4: state (in).
-     *      A 2-D tensor of shape [batch_size, (memory_size - 1) * num_units * rank].
-     * * 5: rank.
-     *      The rank of the SVD approximation.
-     * * 6: fused_activation_function.
-     *      An optional {@link FuseCode} value indicating the
-     *      activation function. If “NONE” is specified then it results in a
-     *      linear activation.
-     *
-     * Outputs:
-     * * 0: state (out).
-     *      A 2-D tensor of the same {@link OperandCode} as the inputs, with shape
-     *      [batch_size, (memory_size - 1) * num_units * rank].
-     * * 1: output.
-     *      A 2-D tensor of the same {@link OperandCode} as the inputs, with shape
-     *      [batch_size, num_units].
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_SVDF = 27,
-    /**
-     * Computes hyperbolic tangent of input tensor element-wise.
-     *
-     * The output is calculated using this formula:
-     *
-     *     output = tanh(input)
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} (since API level 29)
-     *
-     * Supported tensor rank: up to 4.
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the input.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *      For {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the scale must be 1.f / 128 and the zeroPoint must be 128.
-     *
-     * Available since API level 27.
-     */
-    ANEURALNETWORKS_TANH = 28,
-    // Operations below are available since API level 28.
-    // TODO: make the description easier to understand.
-    /**
-     * BatchToSpace for N-dimensional tensors.
-     *
-     * This operation reshapes the batch dimension (dimension 0) into M + 1
-     * dimensions of shape block_shape + [batch], interleaves these blocks back
-     * into the grid defined by the spatial dimensions [1, ..., M], to obtain a
-     * result with the same rank as the input.
-     *
-     * This is the reverse of SpaceToBatch.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be reshaped
-     * * 1: A 1-D Tensor of {@link ANEURALNETWORKS_TENSOR_INT32}, the block
-     *      sizes for each spatial dimension of the input tensor. All values
-     *      must be >= 1.
-     * * 2: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_BATCH_TO_SPACE_ND = 29,
-    /**
-     * Element-wise division of two tensors.
-     *
-     * Takes two input tensors of identical {@link OperandCode} and compatible
-     * dimensions. The output is the result of dividing the first input tensor
-     * by the second, optionally modified by an activation function.
-     *
-     * Two dimensions are compatible when:
-     *     1. they are equal, or
-     *     2. one of them is 1
-     *
-     * The size of the output is the maximum size along each dimension of the
-     * input operands. It starts with the trailing dimensions, and works its way
-     * forward.
-     *
-     * Example:
-     *     input1.dimension =    {4, 1, 2}
-     *     input2.dimension = {5, 4, 3, 1}
-     *     output.dimension = {5, 4, 3, 2}
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the first input.
-     * * 1: A tensor of the same {@link OperandCode}, and compatible dimensions
-     *      as input0.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_DIV = 30,
-    /**
-     * Computes the mean of elements across dimensions of a tensor.
-     *
-     * Reduces the input tensor along the given dimensions to reduce. Unless
-     * keep_dims is true, the rank of the tensor is reduced by 1 for each entry
-     * in axis. If keep_dims is true, the reduced dimensions are retained with
-     * length 1.
-     *
-     * If dimensions to reduce have no entries, all dimensions are reduced, and
-     * a tensor with a single element is returned.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the input.
-     * * 1: A 1-D Tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The dimensions
-     *      to reduce. If None (the default), reduces all dimensions. Must be in
-     *      the range [-rank(input_tensor), rank(input_tensor)).
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, keep_dims. If positive,
-     *      retains reduced dimensions with length 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_MEAN = 31,
-    /**
-     * Pads a tensor with zeros.
-     *
-     * This operation pads a tensor according to the specified paddings.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be padded.
-     * * 1: A 2-D Tensor of {@link ANEURALNETWORKS_TENSOR_INT32}, the paddings
-     *      for each spatial dimension of the input tensor. The shape of the
-     *      tensor must be {rank(input0), 2}.
-     *      padding[i, 0] specifies the number of elements to be padded in the
-     *      front of dimension i.
-     *      padding[i, 1] specifies the number of elements to be padded after the
-     *      end of dimension i.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0. The
-     *      output tensor has the same rank as input0, and each
-     *      dimension of the output tensor has the same size as the
-     *      corresponding dimension of the input tensor plus the size
-     *      of the padding:
-     *          output0.dimension[i] =
-     *              padding[i, 0] + input0.dimension[i] + padding[i, 1]
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_PAD = 32,
-    // TODO: make the description easier to understand.
-    /**
-     * SpaceToBatch for N-Dimensional tensors.
-     *
-     * This operation divides "spatial" dimensions [1, ..., M] of the input into
-     * a grid of blocks of shape block_shape, and interleaves these blocks with
-     * the "batch" dimension (0) such that in the output, the spatial dimensions
-     * [1, ..., M] correspond to the position within the grid, and the batch
-     * dimension combines both the position within a spatial block and the
-     * original batch position. Prior to division into blocks, the spatial
-     * dimensions of the input are optionally zero padded according to paddings.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the input.
-     * * 1: A 1-D Tensor of {@link ANEURALNETWORKS_TENSOR_INT32}, the block
-     *      sizes for each spatial dimension of the input tensor. All values
-     *      must be >= 1.
-     * * 2: A 2-D Tensor of {@link ANEURALNETWORKS_TENSOR_INT32}, the paddings
-     *      for each spatial dimension of the input tensor. All values must be
-     *      >= 0. The shape of the tensor must be {rank(input0), 2}.
-     *      padding[i, 0] specifies the number of element to be padded in the
-     *      front of dimension i.
-     *      padding[i, 1] specifies the number of element to be padded after the
-     *      end of dimension i.
-     * * 3: An optional {@link ANEURALNETWORKS_BOOL} scalar, default to false.
-     *      Set to true to specify NCHW data layout for input0 and output0.
-     *      Available since API level 29.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_SPACE_TO_BATCH_ND = 33,
-    /**
-     * Removes dimensions of size 1 from the shape of a tensor.
-     *
-     * Given a tensor input, this operation returns a tensor of the same
-     * {@link OperandCode} with all dimensions of size 1 removed. If you don't
-     * want to remove all size 1 dimensions, you can remove specific size 1
-     * dimensions by specifying the axes (input1).
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, the tensor to be squeezed.
-     * * 1: An optional 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The
-     *      dimensions to squeeze. If specified only squeezes the dimensions
-     *      listed. Otherwise, squeezes all dimensions. The dimension index
-     *      starts at 0. An error must be reported if squeezing a dimension that
-     *      is not 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0. Contains the
-     *      same data as input, but has one or more dimensions of size 1
-     *      removed.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_SQUEEZE = 34,
-    /**
-     * Extracts a strided slice of a tensor.
-     *
-     * Roughly speaking, this op extracts a slice of size (end - begin) / stride
-     * from the given input tensor. Starting at the location specified by begin
-     * the slice continues by adding stride to the index until all dimensions
-     * are not less than end. Note that a stride can be negative, which causes a
-     * reverse slice.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be sliced.
-     * * 1: begin, a 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The
-     *      starts of the dimensions of the input tensor to be sliced. The
-     *      length must be of rank(input0).
-     * * 2: end, a 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The
-     *      ends of the dimensions of the input tensor to be sliced. The length
-     *      must be of rank(input0).
-     * * 3: strides, a 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The
-     *      strides of the dimensions of the input tensor to be sliced. The
-     *      length must be of rank(input0). The entries must be non-zero.
-     * * 4: begin_mask, an {@link ANEURALNETWORKS_INT32} scalar. If the ith bit
-     *      of begin_mask is set, begin[i] is ignored and the fullest possible
-     *      range in that dimension is used instead.
-     * * 5: end_mask, an {@link ANEURALNETWORKS_INT32} scalar. If the ith bit of
-     *      end_mask is set, end[i] is ignored and the fullest possible range in
-     *      that dimension is used instead.
-     * * 6: shrink_axis_mask, an {@link ANEURALNETWORKS_INT32} scalar. If the
-     *      ith bit of shrink_axis_mask is set, the ith dimension specification
-     *      shrinks the dimensionality by 1, taking on the value at index
-     *      begin[i]. In this case, the ith specification must define a
-     *      slice of size 1, e.g. begin[i] = x, end[i] = x + 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0 and rank (n - k),
-     *      where k is the number of bits set in shrink_axis_mask.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_STRIDED_SLICE = 35,
-    /**
-     * Element-wise subtraction of two tensors.
-     *
-     * Takes two input tensors of identical {@link OperandCode} and compatible
-     * dimensions. The output is the result of subtracting the second input
-     * tensor from the first one, optionally modified by an activation function.
-     *
-     * Two dimensions are compatible when:
-     *     1. they are equal, or
-     *     2. one of them is 1
-     *
-     * The size of the output is the maximum size along each dimension of the
-     * input operands. It starts with the trailing dimensions, and works its way
-     * forward.
-     *
-     * Example:
-     *     input1.dimension =    {4, 1, 2}
-     *     input2.dimension = {5, 4, 3, 1}
-     *     output.dimension = {5, 4, 3, 2}
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} (since API level 29)
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the first input.
-     * * 1: A tensor of the same {@link OperandCode}, and compatible dimensions
-     *      as input0.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_SUB = 36,
-    /**
-     * Transposes the input tensor, permuting the dimensions according to the
-     * perm tensor.
-     *
-     * The returned tensor's dimension i corresponds to the input dimension
-     * perm[i]. If perm is not given, it is set to (n-1...0), where n is the
-     * rank of the input tensor. Hence by default, this operation performs a
-     * regular matrix transpose on 2-D input Tensors.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be transposed.
-     * * 1: An optional 1-D Tensor of {@link ANEURALNETWORKS_TENSOR_INT32},
-     *      the permutation of the dimensions of the input tensor.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 28.
-     */
-    ANEURALNETWORKS_TRANSPOSE = 37,
-    // Operations below are available since API level 29.
-    /**
-     * Computes the absolute value of a tensor, element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_ABS = 38,
-    /**
-     * Returns the index of the largest element along an axis.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: An n-D tensor specifying the input. Must be non-empty.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar specifying the axis to
-     *      reduce across. Negative index is used to specify axis from the
-     *      end (e.g. -1 for the last axis). Must be in the range [-n, n).
-     *
-     * Outputs:
-     * * 0: An (n - 1)-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor.
-     *
-     * Available since API level 29.
-     */
-    // There is no underscore in ARG_MAX to avoid name conflict with
-    // the macro defined in libc/kernel/uapi/linux/limits.h.
-    ANEURALNETWORKS_ARGMAX = 39,
-    /**
-     * Returns the index of the smallest element along an axis.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: An n-D tensor specifying the input. Must be non-empty.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar specifying the axis to
-     *      reduce across. Negative index is used to specify axis from the
-     *      end (e.g. -1 for the last axis). Must be in the range [-n, n).
-     *
-     * Outputs:
-     * * 0: An (n - 1)-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_ARGMIN = 40,  // See ARGMAX for naming discussion.
-    /**
-     * Transform axis-aligned bounding box proposals using bounding box deltas.
-     *
-     * Given the positions of bounding box proposals and the corresponding
-     * bounding box deltas for each class, return the refined bounding box
-     * regions. The resulting bounding boxes are cliped against the edges of
-     * the image.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Inputs:
-     * * 0: A 2-D Tensor of shape [num_rois, 4], specifying the locations of the
-     *      bounding box proposals, each line with format [x1, y1, x2, y2].
-     *      For tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM},
-     *      the zeroPoint must be 0 and the scale must be 0.125.
-     * * 1: A 2-D Tensor of shape [num_rois, num_classes * 4], specifying the
-     *      bounding box delta for each region of interest and each class. The
-     *      bounding box deltas are organized in the following order
-     *      [dx, dy, dw, dh], where dx and dy is the relative correction factor
-     *      for the center position of the bounding box with respect to the width
-     *      and height, dw and dh is the log-scale relative correction factor
-     *      for the width and height. For input0 of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM}, this tensor should be
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}.
-     * * 2: An 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape
-     *      [batches], specifying the number of output boxes for each batch.
-     * * 3: A 2-D Tensor of shape [batches, 2], specifying the information of
-     *      each image in the batch, each line with format
-     *      [image_height, image_width].
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0, with shape
-     *      [num_rois, num_classes * 4], specifying the coordinates of each
-     *      output bounding box for each class, with format [x1, y1, x2, y2].
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_AXIS_ALIGNED_BBOX_TRANSFORM = 41,
-    /**
-     * Performs a forward LSTM on the input followed by a backward LSTM.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: 3, either time-major or batch-major.
-     *
-     * All input and output tensors must be of the same type.
-     *
-     *
-     * Inputs:
-     * * 0: The input.
-     *      A 3-D tensor of shape:
-     *        If time-major: [max_time, batch_size, output_size]
-     *        If batch-major: [batch_size, max_time, output_size]
-     *      where "max_time" is the number of timesteps (sequence length),
-     *      "batch_size" corresponds to the batching dimension, and
-     *      "input_size" is the size of the input.
-     * * 1: The forward input-to-input weights. Optional.
-     *      A 2-D tensor of shape [num_units, input_size], where “num_units”
-     *      corresponds to the number of cell units.
-     * * 2: The forward input-to-forget weights.
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 3: The forward input-to-cell weights.
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 4: The forward input-to-output weights.
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 5: The forward recurrent-to-input weights. Optional.
-     *      A 2-D tensor of shape [num_units, output_size], where “output_size”
-     *      corresponds to either the number of cell units (i.e., “num_units”),
-     *      or the second dimension of the “projection_weights”, if defined.
-     * * 6: The forward recurrent-to-forget weights.
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 7: The forward recurrent-to-cell weights.
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 8: The forward recurrent-to-output weights.
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 9: The forward cell-to-input weights. Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 10: The forward cell-to-forget weights. Optional.
-     *       A 1-D tensor of shape [num_units].
-     * * 11: The forward cell-to-output weights. Optional.
-     *       A 1-D tensor of shape [num_units].
-     * * 12: The forward input gate bias. Optional.
-     *       A 1-D tensor of shape [num_units].
-     * * 13: The forward forget gate bias.
-     *       A 1-D tensor of shape [num_units].
-     * * 14: The forward cell gate bias.
-     *       A 1-D tensor of shape [num_units].
-     * * 15: The forward output gate bias.
-     *       A 1-D tensor of shape [num_units].
-     * * 16: The forward projection weights. Optional.
-     *       A 2-D tensor of shape [output_size, num_units].
-     * * 17: The forward projection bias. Optional.
-     *       A 1-D tensor of shape [output_size].
-     * * 18: The backward input-to-input weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size], where “num_units”
-     *       corresponds to the number of cell units.
-     * * 19: The backward input-to-forget weights.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 20: The backward input-to-cell weights.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 21: The backward input-to-output weights.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 22: The backward recurrent-to-input weights. Optional.
-     *       A 2-D tensor of shape [num_units, output_size], where “output_size”
-     *       corresponds to either the number of cell units (i.e., “num_units”),
-     *       or the second dimension of the “projection_weights”, if defined.
-     * * 23: The backward recurrent-to-forget weights.
-     *       A 2-D tensor of shape [num_units, output_size].
-     * * 24: The backward recurrent-to-cell weights.
-     *       A 2-D tensor of shape [num_units, output_size].
-     * * 25: The backward recurrent-to-output weights.
-     *       A 2-D tensor of shape [num_units, output_size].
-     * * 26: The backward cell-to-input weights. Optional.
-     *       A 1-D tensor of shape [num_units].
-     * * 27: The backward cell-to-forget weights. Optional.
-     *       A 1-D tensor of shape [num_units].
-     * * 28: The backward cell-to-output weights. Optional.
-     *       A 1-D tensor of shape [num_units].
-     * * 29: The backward input gate bias. Optional.
-     *       A 1-D tensor of shape [num_units].
-     * * 30: The backward forget gate bias.
-     *       A 1-D tensor of shape [num_units].
-     * * 31: The backward cell gate bias.
-     *       A 1-D tensor of shape [num_units].
-     * * 32: The backward output gate bias.
-     *       A 1-D tensor of shape [num_units].
-     * * 33: The backward projection weights. Optional.
-     *       A 2-D tensor of shape [output_size, num_units].
-     * * 34: The backward projection bias. Optional.
-     *       A 1-D tensor of shape [output_size].
-     * * 35: The forward input activation state.
-     *       A 2-D tensor of shape [batch_size, output_size].
-     * * 36: The forward input cell state.
-     *       A 2-D tensor of shape [batch_size, num_units].
-     * * 37: The backward input activation state.
-     *       A 2-D tensor of shape [batch_size, output_size].
-     * * 38: The backward input cell state.
-     *       A 2-D tensor of shape [batch_size, num_units].
-     * * 39: The auxiliary input. Optional.
-     *       A 3-D tensor of shape [max_time, batch_size, input_size], where “batch_size”
-     *       corresponds to the batching dimension, and “input_size” is the size
-     *       of the input.
-     * * 40: The forward auxiliary input-to-input weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 41: The forward auxiliary input-to-forget weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 42: The forward auxiliary input-to-cell weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 43: The forward auxiliary input-to-output weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 44: The backward auxiliary input-to-input weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 45: The backward auxiliary input-to-forget weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 46: The backward auxiliary input-to-cell weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 47: The backward auxiliary input-to-output weights. Optional.
-     *       A 2-D tensor of shape [num_units, input_size].
-     * * 48: The activation function.
-     *       A value indicating the activation function:
-     *       <ul>
-     *       <li>0: None;
-     *       <li>1: Relu;
-     *       <li>3: Relu6;
-     *       <li>4: Tanh;
-     *       <li>6: Sigmoid.
-     *       </ul>
-     * * 49: The clipping threshold for the cell state, such
-     *       that values are bound within [-cell_clip, cell_clip]. If set to 0.0
-     *       then clipping is disabled.
-     *       If all the input tensors have type {@link ANEURALNETWORKS_TENSOR_FLOAT32},
-     *       this scalar must be of the type {@link ANEURALNETOWORKS_FLOAT32},
-     *       otherwise if all the input tensors have the type {@link
-     *       ANEURALNETWORKS_TENSOR_FLOAT16}, this scalar must be of type {@link
-     *       ANEURALNETWORKS_FLOAT16}.
-     * * 50: The clipping threshold for the output from the
-     *       projection layer, such that values are bound within
-     *       [-proj_clip, proj_clip]. If set to 0.0 then clipping is disabled.
-     *       If all the input tensors have type {@link ANEURALNETWORKS_TENSOR_FLOAT32},
-     *       this scalar must be of the type {@link ANEURALNETOWORKS_FLOAT32},
-     *       otherwise if all the input tensors have the type {@link
-     *       ANEURALNETWORKS_TENSOR_FLOAT16}, this scalar must be of type {@link
-     *       ANEURALNETWORKS_FLOAT16}.
-     * * 51: merge_outputs
-     *       An {@link ANEURALNETWORKS_BOOL} scalar specifying if the outputs
-     *       from forward and backward cells should be merged.
-     * * 52: time_major
-     *       An {@link ANEURALNETWORKS_BOOL} scalar specifying the shape format
-     *       of input and output tensors.
-     *
-     * Outputs:
-     * * 0: The forward output.
-     *      A 3-D tensor of shape:
-     *        If time-major: [max_time, batch_size, output_size]
-     *        If batch-major: [batch_size, max_time, output_size]
-     * * 1: The backward output.  Unused if merge_outputs is true.
-     *      A 3-D tensor of shape:
-     *        If time-major: [max_time, batch_size, output_size]
-     *        If batch-major: [batch_size, max_time, output_size]
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_BIDIRECTIONAL_SEQUENCE_LSTM = 42,
-    /**
-     * A recurrent neural network layer that applies a basic RNN cell to a
-     * sequence of inputs in forward and backward directions.
-     *
-     * This Op unrolls the input along the sequence dimension, and implements
-     * the following operation for each element in the sequence s =
-     * 1...sequence_length:
-     *   fw_outputs[s] = fw_state = activation(inputs[s] * fw_input_weights’ +
-     *          fw_state * fw_recurrent_weights’ + fw_bias)
-     *
-     * And for each element in sequence t = sequence_length : 1
-     *   bw_outputs[t] = bw_state = activation(inputs[t] * bw_input_weights’ +
-     *          bw_state * bw_recurrent_weights’ + bw_bias)
-     *
-     * Where:
-     * * “{fw,bw}_input_weights” is a weight matrix that multiplies the inputs;
-     * * “{fw,bw}_recurrent_weights” is a weight matrix that multiplies the
-     *    current “state” which itself is the output from the previous time step
-     *    computation;
-     * * “{fw,bw}_bias” is a bias vector (added to each output vector in the
-     *    batch);
-     * * “activation” is the function passed as the “fused_activation_function”
-     *   argument (if not “NONE”).
-     *
-     * The op also supports an auxiliary input. Regular cell feeds one input
-     * into the two RNN cells in the following way:
-     *
-     *       INPUT  (INPUT_REVERSED)
-     *         |         |
-     *    ---------------------
-     *    | FW_RNN     BW_RNN |
-     *    ---------------------
-     *         |         |
-     *      FW_OUT     BW_OUT
-     *
-     * An op with an auxiliary input takes two inputs and feeds them into the
-     * RNN cells in the following way:
-     *
-     *       AUX_INPUT   (AUX_INPUT_REVERSED)
-     *           |             |
-     *     INPUT | (INPUT_R'D.)|
-     *       |   |       |     |
-     *    -----------------------
-     *    |  \  /        \    / |
-     *    | FW_RNN       BW_RNN |
-     *    -----------------------
-     *         |           |
-     *      FW_OUT      BW_OUT
-     *
-     * While stacking this op on top of itself, this allows to connect both
-     * forward and backward outputs from previous cell to the next cell's
-     * inputs.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * The input tensors must all be the same type.
-     *
-     * Inputs:
-     * * 0: input.
-     *      A 3-D tensor. The shape is defined by the input 6 (timeMajor). If
-     *      it is set to true, then the input has a shape [maxTime, batchSize,
-     *      inputSize], otherwise the input has a shape [batchSize, maxTime,
-     *      inputSize].
-     * * 1: fwWeights.
-     *      A 2-D tensor of shape [fwNumUnits, inputSize].
-     * * 2: fwRecurrentWeights.
-     *      A 2-D tensor of shape [fwNumUnits, fwNumUnits].
-     * * 3: fwBias.
-     *      A 1-D tensor of shape [fwNumUnits].
-     * * 4: fwHiddenState.
-     *      A 2-D tensor of shape [batchSize, fwNumUnits]. Specifies a hidden
-     *      state input for the first time step of the computation.
-     * * 5: bwWeights.
-     *      A 2-D tensor of shape [bwNumUnits, inputSize].
-     * * 6: bwRecurrentWeights.
-     *      A 2-D tensor of shape [bwNumUnits, bwNumUnits].
-     * * 7: bwBias.
-     *      A 1-D tensor of shape [bwNumUnits].
-     * * 8: bwHiddenState
-     *      A 2-D tensor of shape [batchSize, bwNumUnits]. Specifies a hidden
-     *      state input for the first time step of the computation.
-     * * 9: auxInput.
-     *      A 3-D tensor. The shape is the same as of the input 0.
-     * * 10:fwAuxWeights.
-     *      A 2-D tensor of shape [fwNumUnits, inputSize].
-     * * 11:bwAuxWeights.
-     *      A 2-D tensor of shape [bwNumUnits, inputSize].
-     * * 12:fusedActivationFunction.
-     *      A {@link FuseCode} value indicating the activation function. If
-     *      “NONE” is specified then it results in a linear activation.
-     * * 13:timeMajor
-     *      An {@link ANEURALNETWORKS_BOOL} scalar specifying the shape format
-     *      of input and output tensors.
-     * * 14:mergeOutputs
-     *      An {@link ANEURALNETWORKS_BOOL} scalar specifying if the outputs
-     *      from forward and backward cells are separate (if set to false) or
-     *      concatenated (if set to true).
-     * Outputs:
-     * * 0: fwOutput.
-     *      A 3-D tensor. The first two dimensions of the shape are defined by
-     *      the input 6 (timeMajor) and the third dimension is defined by the
-     *      input 14 (mergeOutputs). If timeMajor is set to true, then the first
-     *      two dimensions are [maxTime, batchSize], otherwise they are set to
-     *      [batchSize, maxTime]. If mergeOutputs is set to true, then the third
-     *      dimension is equal to (fwNumUnits + bwNumUnits), otherwise it is set
-     *      to fwNumUnits.
-     * * 1: bwOutput.
-     *      A 3-D tensor. If the input 14 (mergeOutputs) is set to true, then
-     *      this tensor is not produced. The shape is defined by the input 6
-     *      (timeMajor). If it is set to true, then the shape is set to
-     *      [maxTime, batchSize, bwNumUnits], otherwise the shape is set to
-     *      [batchSize, maxTime, bwNumUnits].
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_BIDIRECTIONAL_SEQUENCE_RNN = 43,
-    /**
-     * Greedily selects a subset of bounding boxes in descending order of score.
-     *
-     * This op applies hard NMS algorithm to each class. In each loop of
-     * execution, the box with maximum score gets selected, and any boxes with
-     * the intersection-over-union (IOU) greater than a threshold are removed
-     * from the pending set.
-     *
-     * Axis-aligned bounding boxes are represented by its upper-left corner
-     * coordinate (x1,y1) and lower-right corner coordinate (x2,y2). A valid
-     * bounding box should satisfy x1 <= x2 and y1 <= y2.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Inputs:
-     * * 0: A 2-D Tensor of shape [num_rois, num_classes], specifying the score
-     *      of each bounding box proposal. The boxes are grouped by batches in the
-     *      first dimension.
-     * * 1: A 2-D Tensor specifying the bounding boxes of shape
-     *      [num_rois, num_classes * 4], organized in the order [x1, y1, x2, y2].
-     *      The boxes are grouped by batches in the first dimension. The sequential
-     *      order of the boxes corresponds with input0. For input0 of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, this tensor should be of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM}, with zeroPoint of 0 and
-     *      scale of 0.125.
-     * * 2: A 1-D Tensor of shape [batches], specifying the number of boxes
-     *      for each image in the batch.
-     * * 3: An {@link ANEURALNETWORKS_FLOAT32} scalar, score_threshold. Boxes
-     *      with scores lower than the threshold are filtered before sending
-     *      to the NMS algorithm.
-     * * 4: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the IoU
-     *      threshold.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the maximum
-     *      number of selected bounding boxes for each image. Set to a negative
-     *      value for unlimited number of output bounding boxes.
-     *
-     * Outputs:
-     * * 0: A 1-D Tensor of the same {@link OperandCode} as input0, with shape
-     *      [num_output_rois], specifying the score of each output box. The boxes
-     *      are grouped by batches, but the sequential order in each batch is not
-     *      guaranteed. For type of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the scale and zero point must be the same as input0.
-     * * 1: A 2-D Tensor of the same {@link OperandCode} as input1, with shape
-     *      [num_output_rois, 4], specifying the coordinates of each
-     *      output bounding box with the same format as input1. The sequential
-     *      order of the boxes corresponds with output0. For type of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM}, the scale must be
-     *      0.125 and the zero point must be 0.
-     * * 2: A 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape
-     *      [num_output_rois], specifying the class of each output box. The
-     *      sequential order of the boxes corresponds with output0.
-     * * 3: A 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape
-     *      [batches], specifying the number of output boxes for each image.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_BOX_WITH_NMS_LIMIT = 44,
-    /**
-     * Casts a tensor to a new type.
-     *
-     * This operation ignores the scale and zeroPoint of quanized tensors,
-     * e.g. it treats a {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} input
-     * as a tensor of uint8 values.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: A tensor with the same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_CAST = 45,
-    /**
-     * Shuffle the channels of the input tensor.
-     *
-     * Given an input tensor and a integer value of num_groups, CHANNEL_SHUFFLE
-     * divide the channel dimension into num_groups groups, and reorganize the
-     * channels by grouping channels with the same index in each group.
-     *
-     * Along the channel dimension, the output is calculated using this formula:
-     *
-     *     output_channel[k * num_groups + g] = input_channel[g * group_size + k]
-     *
-     * where group_size = num_channels / num_groups
-     *
-     * The number of channels must be divisible by num_groups.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be shuffled.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar, specifying the number of
-     *      groups.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar, specifying the dimension
-     *      channel shuffle would be performed on. Negative index is used to
-     *      specify axis from the end (e.g. -1 for the last axis). Must be in
-     *      the range [-n, n).
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} and same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_CHANNEL_SHUFFLE = 46,
-    /**
-     * Apply postprocessing steps to bounding box detections.
-     *
-     * Bounding box detections are generated by applying transformation on a set
-     * of predefined anchors with the bounding box deltas from bounding box
-     * regression. A final step of hard NMS is applied to limit the number of
-     * returned boxes.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Inputs:
-     * * 0: A 3-D Tensor of shape [batches, num_anchors, num_classes], specifying
-     *      the score of each anchor with each class. Class 0 for each
-     *      [batches, num_anchors, 0] is background and will be ignored.
-     * * 1: A 3-D Tensor of shape [batches, num_anchors, length_box_encoding], with
-     *      the first four values in length_box_encoding specifying the bounding
-     *      box deltas. The box deltas are encoded in the order of [dy, dx, dh, dw],
-     *      where dy and dx is the linear-scale relative correction factor for the
-     *      center position of the bounding box with respect to the width and height,
-     *      dh and dw is the log-scale relative correction factor for the width and
-     *      height. All the entries in length_box_encoding beyond the first four
-     *      values are ignored in this operation.
-     * * 2: A 2-D Tensor of shape [num_anchors, 4], specifying the shape of each
-     *      predefined anchor, with format [ctr_y, ctr_x, h, w], where ctr_y and
-     *      ctr_x are the center position of the box, and h and w are the height
-     *      and the width.
-     * * 3: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the scaling
-     *      factor for dy in bounding box deltas.
-     * * 4: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the scaling
-     *      factor for dx in bounding box deltas.
-     * * 5: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the scaling
-     *      factor for dh in bounding box deltas.
-     * * 6: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the scaling
-     *      factor for dw in bounding box deltas.
-     * * 7: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to use regular
-     *      multi-class NMS algorithm that do NMS separately for each class,
-     *      set to false for a faster algorithm that only do one single NMS
-     *      using the highest class score..
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, max_num_detections, specifying
-     *      the maximum number of boxes for the output. Boxes with the lowest
-     *      scores are discarded to meet the limit.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, only used when input7 is
-     *      set to false, specifying the maximum number of classes per detection.
-     * * 10: An {@link ANEURALNETWORKS_INT32} scalar, only used when input7 is
-     *       set to true, specifying the maximum number of detections when
-     *       applying NMS algorithm for each single class.
-     * * 11: An {@link ANEURALNETWORKS_FLOAT32} scalar, score_threshold. Boxes
-     *       with scores lower than the threshold are filtered before sending
-     *       to the NMS algorithm.
-     * * 12: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the IoU
-     *       threshold for hard NMS.
-     * * 13: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to include
-     *       background class in the list of label map for the output, set
-     *       to false to not include the background. When the background
-     *       class is included, it has label 0 and the output classes start
-     *       at 1 in the label map, otherwise, the output classes start at 0.
-     *
-     * Outputs:
-     * * 0: A 2-D tensor of the same {@link OperandCode} as input0, with shape
-     *      [batches, max_num_detections], specifying the score of each output
-     *      detections.
-     * * 1: A 3-D tensor of shape [batches, max_num_detections, 4], specifying the
-     *      coordinates of each output bounding box, with format
-     *      [y1, x1, y2, x2].
-     * * 2: A 2-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape
-     *      [batches, max_num_detections], specifying the class label for each
-     *      output detection.
-     * * 3: An 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape [batches],
-     *      specifying the number of valid output detections for each batch.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_DETECTION_POSTPROCESSING = 47,
-    /**
-     * For input tensors x and y, computes x == y elementwise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and dimensions compatible
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_EQUAL = 48,
-    /**
-     * Computes exponential of x element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_EXP = 49,
-    /**
-     * Inserts a dimension of 1 into a tensor's shape.
-     *
-     * Given a tensor input, this operation inserts a dimension of 1 at the
-     * given dimension index of input's shape. The dimension index starts at
-     * zero; if you specify a negative dimension index, it is counted backward
-     * from the end.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: An n-D tensor.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar specifying the dimension
-     *      index to expand. Must be in the range [-(n + 1), (n + 1)).
-     *
-     * Outputs:
-     * * 0: An (n + 1)-D tensor with the same {@link OperandCode} and data as
-     *      input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_EXPAND_DIMS = 50,
-    /**
-     * Gathers values along an axis.
-     *
-     * Produces an output tensor with shape
-     *     input0.dimension[:axis] + indices.dimension + input0.dimension[axis + 1:]
-     * where:
-     *     # Vector indices (output is rank(input0)).
-     *     output[a_0, ..., a_n, i, b_0, ..., b_n] =
-     *       input0[a_0, ..., a_n, indices[i], b_0, ..., b_n]
-     *
-     *     # Higher rank indices (output is rank(input0) + rank(indices) - 1).
-     *     output[a_0, ..., a_n, i, ..., j, b_0, ... b_n] =
-     *       input0[a_0, ..., a_n, indices[i, ..., j], b_0, ..., b_n]
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: An n-D tensor from which to gather values.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar specifying the axis.
-     *      Negative index is used to specify axis from the end
-     *      (e.g. -1 for the last axis). Must be in the range [-n, n).
-     * * 2: A k-D tensor {@link ANEURALNETWORKS_TENSOR_INT32} of indices.
-     *      The values must be in the bounds of the corresponding dimensions
-     *      of input0.
-     *
-     * Outputs:
-     * * 0: An (n + k - 1)-D tensor with the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_GATHER = 51,
-    /**
-     * Generate aixs-aligned bounding box proposals.
-     *
-     * Bounding box proposals are generated by applying transformation on a set
-     * of predefined anchors with the bounding box deltas from bounding box
-     * regression. A final step of hard NMS is applied to limit the number of
-     * returned boxes.
-     *
-     * Axis-aligned bounding boxes are represented by its upper-left corner
-     * coordinate (x1,y1) and lower-right corner coordinate (x2,y2). A valid
-     * bounding box should satisfy x1 <= x2 and y1 <= y2.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Inputs:
-     * * 0: A 4-D Tensor specifying the score of each anchor at each
-     *      location. With "NHWC" data layout, the tensor shape is
-     *      [batches, height, width, num_anchors]. With "NCHW" data layout,
-     *      the tensor shape is [batches, num_anchors, height, width].
-     * * 1: A 4-D Tensor specifying the bounding box deltas. With "NHWC" data
-     *      layout, the tensor shape is [batches, height, width, num_anchors * 4].
-     *      With "NCHW" data layout, the tensor shape is
-     *      [batches, num_anchors * 4, height, width]. The box deltas are encoded
-     *      in the order of [dx, dy, dw, dh], where dx and dy is the linear-scale
-     *      relative correction factor for the center position of the bounding box
-     *      with respect to the width and height, dw and dh is the log-scale
-     *      relative correction factor for the width and height. The last
-     *      dimensions is the channel dimension.
-     * * 2: A 2-D Tensor of shape [num_anchors, 4], specifying the shape of each
-     *      predefined anchor, with format [x1, y1, x2, y2]. For input0 of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, this tensor should be of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT16_SYMM}, with scale of 0.125.
-     * * 3: A 2-D Tensor of shape [batches, 2], specifying the size of
-     *      each image in the batch, with format [image_height, image_width].
-     * * 4: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the ratio
-     *      from the height of original image to the height of feature map.
-     * * 5: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the ratio
-     *      from the width of original image to the width of feature map.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the maximum
-     *      number of boxes before going into the hard NMS algorithm. Boxes
-     *      with the lowest scores are discarded to meet the limit. Set to
-     *      a non-positive value for unlimited number.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the maximum
-     *      number of boxes returning from the hard NMS algorithm. Boxes
-     *      with the lowest scores are discarded to meet the limit. Set to
-     *      a non-positive value for unlimited number.
-     * * 8: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the IoU
-     *      threshold for hard NMS.
-     * * 9: An {@link ANEURALNETWORKS_FLOAT32} scalar, min_size. Boxes with
-     *      height or width lower than the absolute threshold are filtered out.
-     * * 10: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *       NCHW data layout for input0 and input1. Set to false for NHWC.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0, of shape
-     *      [num_output_rois], specifying the score of each output box.
-     *      The boxes are grouped by batches, but the sequential order in
-     *      each batch is not guaranteed. For type of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the scale and zero
-     *      point must be the same as input0.
-     * * 1: A tensor of the same {@link OperandCode} as input1, of shape
-     *      [num_output_rois, 4], specifying the coordinates of each output
-     *      bounding box for each class, with format [x1, y1, x2, y2].
-     *      The sequential order of the boxes corresponds with output0.
-     *      For type of {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM}, the
-     *      scale must be 0.125 and the zero point must be 0.
-     * * 2: A 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape
-     *      [batches], specifying the number of output boxes for each image.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_GENERATE_PROPOSALS = 52,
-    /**
-     * For input tensors x and y, computes x > y elementwise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and dimensions compatible
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_GREATER = 53,
-    /**
-     * For input tensors x and y, computes x >= y elementwise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and dimensions compatible
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_GREATER_EQUAL = 54,
-    /**
-     * Performs a grouped 2-D convolution operation.
-     *
-     * Given an input tensor of shape [batches, height, width, depth_in] and a
-     * filter tensor of shape [depth_out, filter_height, filter_width, depth_group]
-     * containing depth_out convolutional filters of depth depth_group, GROUPED_CONV
-     * applies a group of different filters to each input channel group, then
-     * concatenates the results together.
-     *
-     * Specifically, the input channels are divided into num_groups groups, each with
-     * depth depth_group, i.e. depth_in = num_groups * depth_group. The convolutional
-     * filters are also divided into num_groups groups, i.e. depth_out is divisible
-     * by num_groups. GROUPED_CONV applies each group of filters to the corresponding
-     * input channel group, and the result are concatenated together.
-     *
-     * The output dimensions are functions of the filter dimensions, stride, and
-     * padding.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[b, i, j, g * channel_multiplier + q] =
-     *         sum_{di, dj, dk} (
-     *             input[b, strides[1] * i + di, strides[2] * j + dj,
-     *                   g * depth_group + dk] *
-     *             filter[g * channel_multiplier + q, di, dj, dk]
-     *         ) + bias[channel]
-     *
-     * where channel_multiplier = depth_out / num_groups
-     *
-     * Supported tensor {@link OperandCode} configurations:
-     * * 32 bit Floating point :
-     * * * {@link ANEURALNETWORKS_TENSOR_FLOAT32} for input, filter, output, and bias.
-     *
-     * * 16 bit Floating point:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} for input, filter, output, and bias.
-     *
-     * * Quantized:
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} for input, filter, and output.
-     * * * {@link ANEURALNETWORKS_TENSOR_INT32} for bias (with scale set to
-     * * * input.scale * filter.scale).
-     *
-     * * Quantized with symetric per channel quantization for the filter:
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM} for input, and output.
-     * * * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} for filter.
-     * * * {@link ANEURALNETWORKS_TENSOR_INT32} for bias (scale set to 0.0,
-     * * * each value scaling is separate and equal to input.scale * filter.scales[channel]).
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Both explicit padding and implicit padding are supported.
-     *
-     * Inputs (explicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input, where depth_in = num_groups * depth_group.
-     * * 1: A 4-D tensor, of shape
-     *      [depth_out, filter_height, filter_width, depth_group], specifying
-     *      the filter, where depth_out must be divisible by num_groups.  For
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}
-     *      the channel dimension (channelDim at
-     *      {@link ANeuralNetworksSymmPerChannelQuantParams}) must be set to 0.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias must be of the same
-     *      type. For filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the bias should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint
-     *      of 0 and bias_scale == input_scale * filter_scale. For filter tensor
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}, the bias
-     *      should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of
-     *      0 and bias_scale of 0. The actual scale of each value 'i' is equal to
-     *      bias_scale[i] = input_scale * filter_scale[i].
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the left, in the ‘width’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the right, in the ‘width’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the top, in the ‘height’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the bottom, in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, specifying the number of
-            groups.
-     * * 10: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *       {@link FuseCode} values. Specifies the activation to
-     *       invoke on the result.
-     * * 11: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *       NCHW data layout for input0 and output0. Set to false for NHWC.
-     *
-     * Inputs (implicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input, where depth_in = num_groups * depth_group.
-     * * 1: A 4-D tensor, of shape
-     *      [depth_out, filter_height, filter_width, depth_group], specifying
-     *      the filter, where depth_out must be divisible by num_groups.  For
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}
-     *      the channel dimension (channelDim at
-     *      {@link ANeuralNetworksSymmPerChannelQuantParams}) must be set to 0.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias must be of the same
-     *      type. For filter tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the bias should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint
-     *      of 0 and bias_scale == input_scale * filter_scale. For filter tensor
-     *      of {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}, the bias
-     *      should be of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of
-     *      0 and bias_scale of 0. The actual scale of each value 'i' is equal to
-     *      bias_scale[i] = input_scale * filter_scale[i].
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the implicit
-     *      padding scheme, has to be one of the
-     *      {@link PaddingCode} values.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the number of
-     *      groups.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 8: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *      NCHW data layout for input0 and output0. Set to false for NHWC.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, out_height, out_width, depth_out]. For output tensor of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the following condition
-     *      must be satisfied: output_scale > input_scale * filter_scale (for
-     *      filter tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}
-     *      this condition must be true for all filter scales).
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_GROUPED_CONV_2D = 55,
-    /**
-     * Localize the maximum keypoints from heatmaps.
-     *
-     * This operation approximates the accurate maximum keypoint scores and
-     * indices after bicubic upscaling by using Taylor expansion up to the
-     * quadratic term.
-     *
-     * The bounding box is represented by its upper-left corner coordinate
-     * (x1,y1) and lower-right corner coordinate (x2,y2) in the original image.
-     * A valid bounding box should satisfy x1 <= x2 and y1 <= y2.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: A 4-D Tensor of shape
-     *      [num_boxes, heatmap_size, heatmap_size, num_keypoints],
-     *      specifying the heatmaps, the height and width of heatmaps should
-     *      be the same, and must be greater than or equal to 2.
-     * * 1: A 2-D Tensor of shape [num_boxes, 4], specifying the bounding boxes,
-     *      each with format [x1, y1, x2, y2]. For input0 of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, this tensor should
-     *      be of {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM}, with zeroPoint
-     *      of 0 and scale of 0.125.
-     * * 2: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *      NCHW data layout for input0. Set to false for NHWC.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0, with shape
-     *      [num_boxes, num_keypoints], specifying score of the keypoints.
-     * * 1: A tensor of the same {@link OperandCode} as input1, with shape
-     *      [num_boxes, num_keypoints, 2], specifying the location of
-     *      the keypoints, the second dimension is organized as
-     *      [keypoint_x, keypoint_y].
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_HEATMAP_MAX_KEYPOINT = 56,
-    /**
-     * Applies instance normalization to the input tensor.
-     *
-     * The values in the output tensor are computed as:
-     *
-     *     output[b, h, w, c] =
-     *         (input[b, h, w, c] - mean[b, c]) * gamma /
-     *         sqrt(var[b, c] + epsilon) + beta
-     *
-     * Where the mean and variance are computed across the spatial dimensions:
-     *
-     *     mean[b, c] =
-     *         sum_{h, w}(input[b, h, w, c]) / sum(1)
-     *
-     *     var[b, c] =
-     *         sum_{h, w}(pow(input[b, h, w, c] - mean[b, c], 2)) / sum(1)
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be normalized.
-     * * 1: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying gamma, the
-     *      scale applied to the normalized tensor.
-     * * 2: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying beta, the
-     *      offset applied to the normalized tensor.
-     * * 3: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying epsilon, the
-     *      small value added to variance to avoid dividing by zero.
-     * * 4: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *      NCHW data layout for input0 and output0. Set to false for NHWC.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} and same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_INSTANCE_NORMALIZATION = 57,
-    /**
-     * For input tensors x and y, computes x < y elementwise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and dimensions compatible
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_LESS = 58,
-    /**
-     * For input tensors x and y, computes x <= y elementwise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and dimensions compatible
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_LESS_EQUAL = 59,
-    /**
-     * Computes natural logarithm of x element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_LOG = 60,
-    /**
-     * Returns the truth value of x AND y element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     * * 1: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8} and dimensions
-     *      compatible with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_LOGICAL_AND = 61,
-    /**
-     * Computes the truth value of NOT x element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_LOGICAL_NOT = 62,
-    /**
-     * Returns the truth value of x OR y element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     * * 1: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8} and dimensions
-     *      compatible with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_LOGICAL_OR = 63,
-    /**
-     * Computes the log softmax activations given logits.
-     *
-     * The output is calculated using this formula:
-     *
-     *     output = logits * beta - log(reduce_sum(exp(logits * beta), axis))
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor specifying the input logits.
-     * * 1: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the positive
-     *      scaling factor for the exponent, beta.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar specifying the axis to
-     *      reduce across. Negative index is used to specify axis from the
-     *      end (e.g. -1 for the last axis). Must be in the range [-n, n).
-     *
-     * Outputs:
-     * * 0: The output tensor of the same {@link OperandCode} and shape as
-     *      input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_LOG_SOFTMAX = 64,
-    /**
-     * Returns the element-wise maximum of two tensors.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and compatible dimensions
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: The sum, a tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_MAXIMUM = 65,
-    /**
-     * Returns the element-wise minimum of two tensors.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and compatible dimensions
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: The sum, a tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_MINIMUM = 66,
-    /**
-     * Computes numerical negative value element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_NEG = 67,
-    /**
-     * For input tensors x and y, computes x != y elementwise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * This operation supports broadcasting.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     * * 1: A tensor of the same {@link OperandCode} and dimensions compatible
-     *      with input0.
-     *
-     * Outputs:
-     * * 0: A tensor of {@link ANEURALNETWORKS_TENSOR_BOOL8}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_NOT_EQUAL = 68,
-    /**
-     * Pads a tensor with the given constant value according to the specified
-     * paddings.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor, specifying the tensor to be padded.
-     * * 1: A 2-D Tensor of {@link ANEURALNETWORKS_TENSOR_INT32}, the paddings
-     *      for each spatial dimension of the input tensor. The shape of the
-     *      tensor must be {rank(input0), 2}.
-     *      padding[i, 0] specifies the number of elements to be padded in the
-     *      front of dimension i.
-     *      padding[i, 1] specifies the number of elements to be padded after
-     *      the end of dimension i.
-     * * 2: An scalar specifying the value to use for padding input0.
-     *      For input tensor of {@link ANEURALNETWORKS_TENSOR_FLOAT32}, the
-     *      pad value should be of {@link ANEURALNETWORKS_FLOAT32}.
-     *      For input tensor of {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      the pad value should be of {@link ANEURALNETWORKS_INT32}. The
-     *      scale and zeroPoint are assumed to be the same as in input0.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0. The
-     *      output tensor has the same rank as input0, and each
-     *      dimension of the output tensor has the same size as the
-     *      corresponding dimension of the input tensor plus the size
-     *      of the padding:
-     *          output0.dimension[i] =
-     *              padding[i, 0] + input0.dimension[i] + padding[i, 1]
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_PAD_V2 = 69,
-    /**
-     * Computes the power of one value to another.
-     *
-     * Given a tensor base and a tensor exponent, this operation computes
-     * base^exponent elementwise.
-     *
-     * This operations supports broadcasting. The size of the output is the
-     * maximum size along each dimension of the input operands. It starts with
-     * the trailing dimensions, and works its way forward.
-     *
-     * For example:
-     *     base.dimension     =    {4, 1, 2}
-     *     exponent.dimension = {5, 4, 3, 1}
-     *     output.dimension   = {5, 4, 3, 2}
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: A tensor specifying the base.
-     * * 1: A tensor specifying the exponent.
-     *
-     * Outputs:
-     * * 0: An output tensor.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_POW = 70,
-    /**
-     * Parametric Rectified Linear Unit.
-     *
-     * It follows: f(x) = alpha * x for x < 0, f(x) = x for x >= 0, where alpha
-     * is a learned array with the same {@link OperandCode} and compatible
-     * dimensions as input x.
-     *
-     * Two dimensions are compatible when:
-     *     1. they are equal, or
-     *     2. one of them is 1
-     *
-     * The size of the output is the maximum size along each dimension of the
-     * input operands. It starts with the trailing dimensions, and works its way
-     * forward.
-     *
-     * Example:
-     *     input.dimension  =    {4, 1, 2}
-     *     alpha.dimension  = {5, 4, 3, 1}
-     *     output.dimension = {5, 4, 3, 2}
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: A tensor, specifying the input.
-     * * 1: A tensor of the same {@link OperandCode}, and compatible dimensions
-     *      as input0, specifying the alpha.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_PRELU = 71,
-    /**
-     * Quantizes the input tensor.
-     *
-     * The formula is:
-     *
-     *     output = max(0, min(255, round(input / scale) + zeroPoint)
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0, but with
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_QUANTIZE = 72,
-    /**
-     * A version of quantized LSTM, using 16 bit quantization for internal
-     * state.
-     *
-     * There is no projection layer, so cell state size is equal to the output
-     * size.
-     *
-     * Inputs:
-     * * 0: A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [numBatches, inputSize] specifying the input to the LSTM
-     *      cell. Tensor is quantized with a fixed quantization range of
-     *      [-1, 127/128] (scale = 1/128, zeroPoint = 128).
-     * * 1: The input-to-input weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying input-to-input part of
-     *      weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 2: The input-to-forget weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying input-to-forget part of
-     *      weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 3: The input-to-cell weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying input-to-cell part of
-     *      weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 4: The input-to-output weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying input-to-output part of
-     *      weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 5: The recurrent-to-input weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying recurrent-to-input part
-     *      of weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 6: The recurrent-to-forget weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying recurrent-to-forget
-     *      part of weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 7: The recurrent-to-cell weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying recurrent-to-cell part
-     *      of weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 8: The recurrent-to-output weights.
-     *      A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [outputSize, inputSize] specifying recurrent-to-output
-     *      part of weights for fully-connected layer inside the LSTM cell.
-     *      Quantization zero point and scale must be the same across all the
-     *      weights.
-     * * 9: The input gate bias.
-     *      A 1-D tensor of type {@link ANEURALNETWORKS_TENSOR_INT32} and shape
-     *      [outputSize] specifying the bias for the fully-connected layer
-     *      inside the LSTM cell. Bias is quantized with scale being a product
-     *      of input and weights scales and zeroPoint equal to 0.
-     * * 10:The forget gate bias.
-     *      A 1-D tensor of type {@link ANEURALNETWORKS_TENSOR_INT32} and shape
-     *      [outputSize] specifying the bias for the fully-connected layer
-     *      inside the LSTM cell. Bias is quantized with scale being a product
-     *      of input and weights scales and zeroPoint equal to 0.
-     * * 11:The cell bias.
-     *      A 1-D tensor of type {@link ANEURALNETWORKS_TENSOR_INT32} and shape
-     *      [outputSize] specifying the bias for the fully-connected layer
-     *      inside the LSTM cell. Bias is quantized with scale being a product
-     *      of input and weights scales and zeroPoint equal to 0.
-     * * 12:The output gate bias.
-     *      A 1-D tensor of type {@link ANEURALNETWORKS_TENSOR_INT32} and shape
-     *      [outputSize] specifying the bias for the fully-connected layer
-     *      inside the LSTM cell. Bias is quantized with scale being a product
-     *      of input and weights scales and zeroPoint equal to 0.
-     * * 13: A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT16_SYMM}
-     *       and shape [numBatches, outputSize] specifying the cell state from the
-     *       previous time step of the LSTM cell. It is quantized using a
-     *       quantization range of [-2^4, 2^4 * 32767/32768] (scale = 2^4 /
-     *       32768, zeroPoint = 0).
-     * * 14: A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *       and shape [numBathes, outputSize] specifying the output of the LSTM
-     *       cell from previous time-step. Tensor is quantized with a fixed
-     *       quantization range of [-1, 127/128] (scale = 1/128, zeroPoint =
-     *       128).
-     *
-     *
-     * Outputs:
-     * * 0: A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT16_SYMM}
-     *      and shape [numBatches, outputSize] which contains a cell state from
-     *      the current time step. Tensor is quantized using a quantization
-     *      range of [-2^4, 2^4 * 32767/32768] (scale = 2^4 / 32768, zeroPoint =
-     *      0).
-     * * 1: A 2-D tensor of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *      and shape [numBathes, outputSize] which contains the output value.
-     *      Tensor is quantized with a fixed quantization range of [-1, 127/128]
-     *      (scale = 1/128, zeroPoint = 128).
-     */
-    ANEURALNETWORKS_QUANTIZED_16BIT_LSTM = 73,
-    /**
-     * Draws samples from a multinomial distribution.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Inputs:
-     * * 0: A 2-D tensor with shape [batches, classes], specifying the
-     *      unnormalized log-probabilities for all classes.
-     * * 1: A scalar {@link ANEURALNETWORKS_INT32}, specifying the number of
-     *      independent samples to draw for each row slice.
-     * * 2: A 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor with shape [2],
-     *      specifying seeds used to initialize the random distribution.
-     * Outputs:
-     * * 0: A 2-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor with shape
-     *      [batches, samples], containing the drawn samples.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_RANDOM_MULTINOMIAL = 74,
-    /**
-     * Reduces a tensor by computing the "logical and" of elements along given
-     * dimensions.
-     *
-     * If keep_dims is true, the reduced dimensions are
-     * retained with length 1. Otherwise, the rank of the tensor is reduced by
-     * 1 for each entry in dimensions.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor.
-     * * 1: A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The dimensions
-     *      to reduce. Dimension values must be in the range [-n, n).
-     * * 2: An {@link ANEURALNETWORKS_BOOL} scalar, keep_dims. If true,
-     *      retains reduced dimensions with length 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_REDUCE_ALL = 75,
-    /**
-     * Reduces a tensor by computing the "logical or" of elements along given
-     * dimensions.
-     *
-     * If keep_dims is true, the reduced dimensions are
-     * retained with length 1. Otherwise, the rank of the tensor is reduced by
-     * 1 for each entry in dimensions.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_BOOL8}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor.
-     * * 1: A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The dimensions
-     *      to reduce. Dimension values must be in the range [-n, n).
-     * * 2: An {@link ANEURALNETWORKS_BOOL} scalar, keep_dims. If true,
-     *      retains reduced dimensions with length 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_REDUCE_ANY = 76,
-    /**
-     * Reduces a tensor by computing the maximum of elements along given
-     * dimensions.
-     *
-     * If keep_dims is true, the reduced dimensions are
-     * retained with length 1. Otherwise, the rank of the tensor is reduced by
-     * 1 for each entry in dimensions.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor.
-     * * 1: A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The dimensions
-     *      to reduce. Dimension values must be in the range [-n, n).
-     * * 2: An {@link ANEURALNETWORKS_BOOL} scalar, keep_dims. If true,
-     *      retains reduced dimensions with length 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_REDUCE_MAX = 77,
-    /**
-     * Reduces a tensor by computing the minimum of elements along given
-     * dimensions.
-     *
-     * If keep_dims is true, the reduced dimensions are
-     * retained with length 1. Otherwise, the rank of the tensor is reduced by
-     * 1 for each entry in dimensions.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor.
-     * * 1: A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The dimensions
-     *      to reduce. Dimension values must be in the range [-n, n).
-     * * 2: An {@link ANEURALNETWORKS_BOOL} scalar, keep_dims. If true,
-     *      retains reduced dimensions with length 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_REDUCE_MIN = 78,
-    /**
-     * Reduces a tensor by multiplying elements along given dimensions.
-     *
-     * If keep_dims is true, the reduced dimensions are
-     * retained with length 1. Otherwise, the rank of the tensor is reduced by
-     * 1 for each entry in dimensions.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor.
-     * * 1: A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The dimensions
-     *      to reduce. Dimension values must be in the range [-n, n).
-     * * 2: An {@link ANEURALNETWORKS_BOOL} scalar, keep_dims. If true,
-     *      retains reduced dimensions with length 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_REDUCE_PROD = 79,
-    /**
-     * Reduces a tensor by summing elements along given dimensions.
-     *
-     * If keep_dims is true, the reduced dimensions are
-     * retained with length 1. Otherwise, the rank of the tensor is reduced by
-     * 1 for each entry in dimensions.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: up to 4
-     *
-     * Inputs:
-     * * 0: An n-D tensor.
-     * * 1: A 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}. The dimensions
-     *      to reduce. Dimension values must be in the range [-n, n).
-     * * 2: An {@link ANEURALNETWORKS_BOOL} scalar, keep_dims. If true,
-     *      retains reduced dimensions with length 1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_REDUCE_SUM = 80,
-    /**
-     * Select and scale the feature map of each region of interest to a unified
-     * output size by average pooling sampling points from bilinear interpolation.
-     *
-     * The region of interest is represented by its upper-left corner coordinate
-     * (x1,y1) and lower-right corner coordinate (x2,y2) in the original image.
-     * A spatial scaling factor is applied to map into feature map coordinate.
-     * A valid region of interest should satisfy x1 <= x2 and y1 <= y2.
-     *
-     * No rounding is applied in this operation. The sampling points are unified
-     * distributed in the pooling bin and their values are calculated by bilinear
-     * interpolation.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16} (since API level 29)
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: A 4-D tensor, specifying the feature map.
-     * * 1: A 2-D Tensor of shape [num_rois, 4], specifying the locations of
-     *      the regions of interest, each line with format [x1, y1, x2, y2].
-     *      For input0 of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      this tensor should be of {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM},
-     *      with zeroPoint of 0 and scale of 0.125.
-     * * 2: An 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape
-     *      [batches], specifying the number of output boxes for each batch.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the output
-     *      height of the output tensor.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the output
-     *      width of the output tensor.
-     * * 5: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the ratio
-     *      from the height of original image to the height of feature map.
-     * * 6: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the ratio
-     *      from the width of original image to the width of feature map.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the number of
-     *      sampling points in height dimension used to compute the output.
-     *      Set to 0 for adaptive value of ceil(roi_height/out_height).
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the number of
-     *      sampling points in width dimension used to compute the output.
-     *      Set to 0 for adaptive value of ceil(roi_width/out_width).
-     * * 9: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *      NCHW data layout for input0 and output0. Set to false for NHWC.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0. The output
-     *      shape is [num_rois, out_height, out_width, depth].
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_ROI_ALIGN = 81,
-    /**
-     * Select and scale the feature map of each region of interest to a unified
-     * output size by max-pooling.
-     *
-     * The region of interest is represented by its upper-left corner coordinate
-     * (x1,y1) and lower-right corner coordinate (x2,y2) in the original image.
-     * A spatial scaling factor is applied to map into feature map coordinate.
-     * A valid region of interest should satisfy x1 <= x2 and y1 <= y2.
-     *
-     * Rounding is applied in this operation to ensure integer boundary for
-     * regions of interest and pooling bins.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Inputs:
-     * * 0: A 4-D tensor, specifying the feature map.
-     * * 1: A 2-D Tensor of shape [num_rois, 4], specifying the locations of
-     *      the regions of interest, each line with format [x1, y1, x2, y2].
-     *      For input0 of type {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM},
-     *      this tensor should be of {@link ANEURALNETWORKS_TENSOR_QUANT16_ASYMM},
-     *      with zeroPoint of 0 and scale of 0.125.
-     * * 2: An 1-D {@link ANEURALNETWORKS_TENSOR_INT32} tensor, of shape
-     *      [batches], specifying the number of output boxes for each batch.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the output
-     *      height of the output tensor.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the output
-     *      width of the output tensor.
-     * * 5: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the ratio
-     *      from the height of original image to the height of feature map.
-     * * 6: An {@link ANEURALNETWORKS_FLOAT32} scalar, specifying the ratio
-     *      from the width of original image to the width of feature map.
-     * * 7: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *      NCHW data layout for input0 and output0. Set to false for NHWC.
-     *
-     * Outputs:
-     * * 0: A tensor of the same {@link OperandCode} as input0. The output
-     *      shape is [num_rois, out_height, out_width, depth].
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_ROI_POOLING = 82,
-    /**
-     * Computes reciprocal of square root of x element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_RSQRT = 83,
-    /**
-     * Using a tensor of booleans c and input tensors x and y select values
-     * elementwise from both input tensors:
-     *
-     * O[i] = C[i] ? x[i] : y[i].
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: A tensor of type {@link ANEURALNETWORKS_TENSOR_BOOL8} acting as a
-     *      mask that chooses, based on the value at each element, whether the
-     *      corresponding element in the output should be taken from input1 (if
-     *      true) or input2 (if false).
-     * * 1: An input tensor of the same shape as input0.
-     * * 2: An input tensor of the same shape and type as input1.
-     *
-     * Outputs:
-     * * 0: A tensor of the same type and shape as input1 and input2.
-     *
-     */
-    ANEURALNETWORKS_SELECT = 84,
-    /**
-     * Computes sin of x element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_SIN = 85,
-    /**
-     * Extracts a slice of specified size from the input tensor starting at a
-     * specified location.
-     *
-     * The starting location is specified as a 1-D tensor containing offsets
-     * for each dimension. The size is specified as a 1-D tensor containing
-     * either size of a slice along corresponding dimension or -1. In the latter
-     * case, all the remaining elements in dimension are included in the slice.
-     * Slice size in each dimension cannot be zero.
-     *
-     * A sum of begin offset and a size of a slice must not exceed size of a
-     * corresponding dimension.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: An n-D tensor to take slice from.
-     * * 1: A 1-D tensor of type {@link ANEURALNETWORKS_TENSOR_INT32} specifying
-     *      the beginning indices of the slice in each dimension.
-     * * 2: A 1-D tensor of type {@link ANEURALNETWORKS_TENSOR_INT32} specifying
-     *      the size of the slice in each dimension.
-     *
-     * Outputs:
-     * * 0: An n-D tensor of the same type as the input containing the slice.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_SLICE = 86,
-    /**
-     * Splits a tensor along a given axis into num_splits subtensors.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: An n-D tensor to split.
-     * * 1: An {@link ANEURALNETWORKS_INT32} scalar specifying the axis along
-     *      which to split.
-     * * 2: An {@link ANEURALNETWORKS_INT32} scalar indicating the number of
-     *      splits along given axis. Must evenly divide axis size.
-     *
-     * Outputs:
-     * * 0 ~ (num_splits - 1): Resulting subtensors.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_SPLIT = 87,
-    /**
-     * Computes square root of x element-wise.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: from 1.
-     *
-     * Inputs:
-     * * 0: A tensor.
-     *
-     * Outputs:
-     * * 0: The output tensor of same shape as input0.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_SQRT = 88,
-    /**
-     * Constructs a tensor by tiling a given tensor.
-     *
-     * This operation creates a new tensor by replicating `input` `multiples`
-     * times. The output tensor's i-th dimension has `input.dims(i) * multiples[i]`
-     * elements, and the values of `input` are replicated `multiples[i]` times
-     * along the i-th dimension.
-     * For example, tiling `[a b c d]` by `[2]` produces `[a b c d a b c d]`.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: input, an n-D tensor specifying the input.
-     * * 1: multiples, a 1-D tensor of {@link ANEURALNETWORKS_TENSOR_INT32}.
-     *      The length of multiples must be n.
-     *
-     * Outputs:
-     * * 0: A tiled tensor of the same {@link OperandCode} and rank as `input`.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TILE = 89,
-    /**
-     * Finds values and indices of the k largest entries for the last dimension.
-     *
-     * Resulting values in each dimensions are sorted in descending order. If
-     * two values are equal, the one with larger index appears first.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_INT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: from 1
-     *
-     * Inputs:
-     * * 0: input, an n-D tensor specifying the input.
-     * * 1: k, an {@link ANEURALNETWORKS_INT32} scalar, specifying the number of
-     *      top elements to look for along the last dimension.
-     *
-     * Outputs:
-     * * 0: An n-D tensor of the same type as the input, containing the k
-     *      largest elements along each last dimensional slice.
-     * * 1: An n-D tensor of type {@link ANEURALNETWORKS_TENSOR_INT32}
-     *      containing the indices of values within the last dimension of input.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TOPK_V2 = 90,
-    /**
-     * Performs the tranpose of 2-D convolution operation.
-     *
-     * This operation is sometimes called "deconvolution" after Deconvolutional
-     * Networks, but is actually the transpose (gradient) of
-     * {@link ANEURALNETWORKS_CONV_2D} rather than an actual deconvolution.
-     *
-     * The output dimensions are functions of the filter dimensions, stride, and
-     * padding.
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     * * {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}
-     *
-     * Supported tensor rank: 4, with "NHWC" or "NCHW" data layout.
-     * With the default data layout NHWC, the data is stored in the order of:
-     * [batch, height, width, channels]. Alternatively, the data layout could
-     * be NCHW, the data storage order of: [batch, channels, height, width].
-     *
-     * Both explicit padding and implicit padding are supported.
-     *
-     * Inputs (explicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: A 4-D tensor, of shape
-     *      [depth_out, filter_height, filter_width, depth_in], specifying the
-     *      filter.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias should be of the
-     *      same type. For input tensor of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the bias should be
-     *      of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of 0 and
-     *      bias_scale == input_scale * filter_scale.
-     * * 3: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the left, in the ‘width’ dimension.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the right, in the ‘width’ dimension.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the top, in the ‘height’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the padding on
-     *      the bottom, in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 8: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 9: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 10: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *       NCHW data layout for input0 and output0. Set to false for NHWC.
-     *
-     * Inputs (implicit padding):
-     * * 0: A 4-D tensor, of shape [batches, height, width, depth_in],
-     *      specifying the input.
-     * * 1: A 4-D tensor, of shape
-     *      [depth_out, filter_height, filter_width, depth_in], specifying the
-     *      filter.
-     * * 2: A 1-D tensor, of shape [depth_out], specifying the bias. For input
-     *      tensor of type {@link ANEURALNETWORKS_TENSOR_FLOAT32} or
-     *      {@link ANEURALNETWORKS_TENSOR_FLOAT16}, the bias should be of the
-     *      same type. For input tensor of type
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the bias should be
-     *      of {@link ANEURALNETWORKS_TENSOR_INT32}, with zeroPoint of 0 and
-     *      bias_scale == input_scale * filter_scale.
-     * * 3: An {@link ANEURALNETWORKS_TENSOR_INT32} tensor, specifying the output
-     *      tensor shape.
-     * * 4: An {@link ANEURALNETWORKS_INT32} scalar, specifying the implicit
-     *      padding scheme, has to be one of the
-     *      {@link PaddingCode} values.
-     * * 5: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘width’ dimension.
-     * * 6: An {@link ANEURALNETWORKS_INT32} scalar, specifying the stride when
-     *      walking through input in the ‘height’ dimension.
-     * * 7: An {@link ANEURALNETWORKS_INT32} scalar, and has to be one of the
-     *      {@link FuseCode} values. Specifies the activation to
-     *      invoke on the result.
-     * * 8: An {@link ANEURALNETWORKS_BOOL} scalar, set to true to specify
-     *      NCHW data layout for input0 and output0. Set to false for NHWC.
-     *
-     * Outputs:
-     * * 0: The output 4-D tensor, of shape
-     *      [batches, out_height, out_width, depth_out]. For output tensor of
-     *      {@link ANEURALNETWORKS_TENSOR_QUANT8_ASYMM}, the following condition
-     *      must be satisfied: output_scale > input_scale * filter_scale.
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_TRANSPOSE_CONV_2D = 91,
-    /**
-     * A recurrent neural network specified by an LSTM cell.
-     *
-     * Performs (fully) dynamic unrolling of input.
-     *
-     * This Op unrolls the input along the time dimension, and implements the
-     * following operation for each element in the sequence
-     * s = 1...sequence_length:
-     *   outputs[s] = projection(state = activation(LSTMOp(inputs[s])))
-     *
-     * Where LSTMOp is the LSTM op as in {@link ANEURALNETWORKS_LSTM},
-     * the "projection" is an optional projection layer from state and output
-     * and the “activation” is the function passed as the
-     * “fused_activation_function” argument (if not “NONE”).
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * Supported tensor rank: 3, either time-major or batch-major.
-     *
-     * All input and output tensors must be of the same type.
-     *
-     * Inputs:
-     * * 0: The input (\f$x_t\f$).
-     *      A 3-D tensor of shape:
-     *        If time-major: [max_time, batch_size, output_size]
-     *        If batch-major: [batch_size, max_time, output_size]
-     *      where “max_size” is the number of timesteps (sequence length),
-     *      “batch_size” corresponds to the batching dimension, and
-     *      “input_size” is the size of the input.
-     * * 1: The input-to-input weights (\f$W_{xi}\f$). Optional.
-     *      A 2-D tensor of shape [num_units, input_size], where “num_units”
-     *      corresponds to the number of cell units.
-     * * 2: The input-to-forget weights (\f$W_{xf}\f$).
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 3: The input-to-cell weights (\f$W_{xc}\f$).
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 4: The input-to-output weights (\f$W_{xo}\f$).
-     *      A 2-D tensor of shape [num_units, input_size].
-     * * 5: The recurrent-to-input weights (\f$W_{hi}\f$). Optional.
-     *      A 2-D tensor of shape [num_units, output_size], where “output_size”
-     *      corresponds to either the number of cell units (i.e., “num_units”),
-     *      or the second dimension of the “projection_weights”, if defined.
-     * * 6: The recurrent-to-forget weights (\f$W_{hf}\f$).
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 7: The recurrent-to-cell weights (\f$W_{hc}\f$).
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 8: The recurrent-to-output weights (\f$W_{ho}\f$).
-     *      A 2-D tensor of shape [num_units, output_size].
-     * * 9: The cell-to-input weights (\f$W_{ci}\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 10:The cell-to-forget weights (\f$W_{cf}\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 11:The cell-to-output weights (\f$W_{co}\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 12:The input gate bias (\f$b_i\f$). Optional.
-     *      A 1-D tensor of shape [num_units].
-     * * 13:The forget gate bias (\f$b_f\f$).
-     *      A 1-D tensor of shape [num_units].
-     * * 14:The cell bias (\f$b_c\f$).
-     *      A 1-D tensor of shape [num_units].
-     * * 15:The output gate bias (\f$b_o\f$).
-     *      A 1-D tensor of shape [num_units].
-     * * 16:The projection weights (\f$W_{proj}\f$). Optional.
-     *      A 2-D tensor of shape [output_size, num_units].
-     * * 17:The projection bias (\f$b_{proj}\f$). Optional.
-     *      A 1-D tensor of shape [output_size].
-     * * 18:The output state (in) (\f$h_{t-1}\f$).
-     *      A 2-D tensor of shape [batch_size, output_size].
-     * * 19:The cell state (in) (\f$C_{t-1}\f$).
-     *      A 2-D tensor of shape [batch_size, num_units].
-     * * 20:The activation function (\f$g\f$).
-     *      A value indicating the activation function:
-     *      <ul>
-     *      <li>0: None;
-     *      <li>1: Relu;
-     *      <li>3: Relu6;
-     *      <li>4: Tanh;
-     *      <li>6: Sigmoid.
-     *      </ul>
-     * * 21:The clipping threshold (\f$t_{cell}\f$) for the cell state, such
-     *      that values are bound within [-cell_clip, cell_clip]. If set to 0.0
-     *      then clipping is disabled.
-     * * 22:The clipping threshold (\f$t_{proj}\f$) for the output from the
-     *      projection layer, such that values are bound within
-     *      [-proj_clip, proj_clip]. If set to 0.0 then clipping is disabled.
-     * * 23:Time-major if true, batch-major if false.
-     * * 24:The input layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at input gate.
-     * * 25:The forget layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at forget gate.
-     * * 26:The cell layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at cell gate.
-     * * 27:The output layer normalization weights.
-     *      A 1-D tensor of shape [num_units]. Used to rescale normalized inputs
-     *      to activation at output gate.
-     *
-     * Outputs:
-     * * 0: The output (\f$o_t\f$).
-     *      A 3-D tensor of shape:
-     *        If time-major: [max_time, batch_size, output_size]
-     *        If batch-major: [batch_size, max_time, output_size]
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_UNIDIRECTIONAL_SEQUENCE_LSTM = 92,
-    /**
-     * A recurrent neural network layer that applies a basic RNN cell to a
-     * sequence of inputs.
-     *
-     * This layer unrolls the input along the sequence dimension, and implements
-     * the following operation
-     * for each element in the sequence s = 1...sequence_length:
-     *   outputs[s] = state = activation(inputs[s] * input_weights’ + state *
-     *   recurrent_weights’ + bias)
-     *
-     * Where:
-     * * “input_weights” is a weight matrix that multiplies the inputs;
-     * * “recurrent_weights” is a weight matrix that multiplies the current
-     *    “state” which itself is the output from the previous time step
-     *    computation;
-     * * “bias” is a bias vector (added to each output vector in the batch);
-     * * “activation” is the function passed as the “fused_activation_function”
-     *   argument (if not “NONE”).
-     *
-     * Supported tensor {@link OperandCode}:
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT16}
-     * * {@link ANEURALNETWORKS_TENSOR_FLOAT32}
-     *
-     * The input tensors must all be the same type.
-     *
-     * Inputs:
-     * * 0: input.
-     *      A 3-D tensor. The shape is defined by the input 6 (timeMajor). If
-     *      it is set to 1, then the input has a shape [maxTime, batchSize,
-     *      inputSize], otherwise the input has a shape [batchSize, maxTime,
-     *      inputSize].
-     * * 1: weights.
-     *      A 2-D tensor of shape [numUnits, inputSize].
-     * * 2: recurrent_weights.
-     *      A 2-D tensor of shape [numUnits, numUnits].
-     * * 3: bias.
-     *      A 1-D tensor of shape [numUnits].
-     * * 4: hidden state
-     *      A 2-D tensor of shape [batchSize, numUnits]. Specifies a hidden
-     *      state input for the first time step of the computation.
-     * * 5: fusedActivationFunction.
-     *      A {@link FuseCode} value indicating the activation function. If
-     *      “NONE” is specified then it results in a linear activation.
-     * * 6: timeMajor
-     *      An {@link ANEURALNETWORKS_INT32} scalar specifying the shape format
-     *      of input and output tensors. Must be set to either 0 or 1.
-     * Outputs:
-     * * 0: output.
-     *      A 3-D tensor. The shape is defined by the input 6 (timeMajor). If
-     *      it is set to 1, then the output has a shape [maxTime, batchSize,
-     *      numUnits], otherwise the output has a shape [batchSize, maxTime,
-     *      numUnits].
-     *
-     * Available since API level 29.
-     */
-    ANEURALNETWORKS_UNIDIRECTIONAL_SEQUENCE_RNN = 93,
-} OperationCode;
-/**
- * Fused activation function types.
- *
- *
- * Available since API level 27.
- */
-typedef enum {
-    /** NO fused activation function. */
-    ANEURALNETWORKS_FUSED_NONE = 0,
-    /** Fused ReLU activation function. */
-    ANEURALNETWORKS_FUSED_RELU = 1,
-    /** Fused ReLU1 activation function. */
-    ANEURALNETWORKS_FUSED_RELU1 = 2,
-    /** Fused ReLU6 activation function. */
-    ANEURALNETWORKS_FUSED_RELU6 = 3,
-} FuseCode;
-/**
- * Implicit padding algorithms.
- *
- *
- * Available since API level 27.
- */
-typedef enum {
-    /**
-     * SAME padding.
-     * Padding on both ends are the "same":
-     *     padding_to_beginning =  total_padding / 2
-     *     padding_to_end       = (total_padding + 1)/2.
-     * i.e., for even number of padding, padding to both ends are exactly
-     * the same; for odd number of padding, padding to the ending is bigger
-     * than the padding to the beginning by 1.
-     *
-     * total_padding is a function of input, stride and filter size.
-     * It could be computed as follows:
-     *    out_size = (input + stride - 1) / stride;
-     *    needed_input = (out_size - 1) * stride + filter_size
-     *    total_padding = max(0, needed_input - input_size)
-     *  The computation is the same for the horizontal and vertical directions.
-     */
-    ANEURALNETWORKS_PADDING_SAME = 1,
-    /**
-     * VALID padding.
-     * No padding. When the input size is not evenly divisible by
-     * the filter size, the input at the end that could not fill
-     * the whole filter tile will simply be ignored.
-     */
-    ANEURALNETWORKS_PADDING_VALID = 2,
-} PaddingCode;
-/**
- * Execution preferences.
- *
- * Available since API level 27.
- */
-typedef enum {
-    /**
-     * Prefer executing in a way that minimizes battery drain.
-     * This is desirable for compilations that will be executed often.
-     */
-    ANEURALNETWORKS_PREFER_LOW_POWER = 0,
-    /**
-     * Prefer returning a single answer as fast as possible, even if this causes
-     * more power consumption.
-     */
-    ANEURALNETWORKS_PREFER_FAST_SINGLE_ANSWER = 1,
-    /**
-     * Prefer maximizing the throughput of successive frames, for example when
-     * processing successive frames coming from the camera.
-     */
-    ANEURALNETWORKS_PREFER_SUSTAINED_SPEED = 2,
-} PreferenceCode;
-/**
- * Device types.
- *
- * The type of NNAPI device.
- */
-typedef enum {
-    /** The device type cannot be provided. */
-    ANEURALNETWORKS_DEVICE_UNKNOWN = 0,
-    /** The device does not fall into any category below. */
-    ANEURALNETWORKS_DEVICE_OTHER = 1,
-    /** The device runs NNAPI models on single or multi-core CPU. */
-    ANEURALNETWORKS_DEVICE_CPU = 2,
-    /** The device can run NNAPI models and also accelerate graphics APIs such
-     * as OpenGL ES and Vulkan. */
-    ANEURALNETWORKS_DEVICE_GPU = 3,
-    /** Dedicated accelerator for Machine Learning workloads. */
-    ANEURALNETWORKS_DEVICE_ACCELERATOR = 4,
-} DeviceTypeCode;
-/**
- * Result codes.
- *
- * <p>Any NNAPI function can return any result code, including result codes not
- * currently documented. Any value other than {@link ANEURALNETWORKS_NO_ERROR}
- * indicates a failure of some kind.</p>
- *
- * <p>Additional information about the nature of a failure can be obtained from
- * the device log after enabling NNAPI debugging by setting the debug.nn.vlog
- * property to 1, e.g., by calling "adb shell setprop debug.nn.vlog 1".</p>
- *
- * Available since API level 27.
- */
-typedef enum {
-    /**
-     * Operation was succesful.
-     */
-    ANEURALNETWORKS_NO_ERROR = 0,
-    /**
-     * Failure caused by not enough available memory.
-     */
-    ANEURALNETWORKS_OUT_OF_MEMORY = 1,
-    ANEURALNETWORKS_INCOMPLETE = 2,
-    /**
-     * Failure caused by unexpected null argument.
-     */
-    ANEURALNETWORKS_UNEXPECTED_NULL = 3,
-    /**
-     * Failure caused by invalid function arguments, invalid model definition,
-     * invalid execution definition or invalid data at execution time.
-     */
-    ANEURALNETWORKS_BAD_DATA = 4,
-    /**
-     * Failure caused by failed model execution.
-     */
-    ANEURALNETWORKS_OP_FAILED = 5,
-    /**
-     * Failure caused by object being in the wrong state.
-     */
-    ANEURALNETWORKS_BAD_STATE = 6,
-    /**
-     * Failure caused by not being able to map a file into memory.
-     * This may be caused by a file descriptor not being mappable, or an AHardwareBuffer
-     * not supported by the device.
-     * Mitigate by reading its content into memory.
-     */
-    ANEURALNETWORKS_UNMAPPABLE = 7,
-    /**
-     * Failure caused by insufficient buffer size provided to a model output.
-     */
-    ANEURALNETWORKS_OUTPUT_INSUFFICIENT_SIZE = 8,
-    /**
-     * Failure caused by a device not being available.
-     */
-    ANEURALNETWORKS_UNAVAILABLE_DEVICE = 9,
-} ResultCode;
-/**
- * For {@link ANeuralNetworksModel_setOperandValue}, values with a
- * length smaller or equal to this will be immediately copied into
- * the model. The size is in bytes.
- *
- * Available since API level 27.
- */
-enum { ANEURALNETWORKS_MAX_SIZE_OF_IMMEDIATELY_COPIED_VALUES = 128 };
-/**
- * For {@link ANeuralNetworksCompilation_setCaching}, specify the size
- * of the cache token required from the application. The size is in bytes.
- *
- * Available since API level 29.
- */
-enum { ANEURALNETWORKS_BYTE_SIZE_OF_CACHE_TOKEN = 32 };
-/**
- * ANeuralNetworksMemory is an opaque type that represents memory.
- *
- * This type is used to represent shared memory, memory mapped files,
- * and similar memories.
- *
- * By using shared memory, a program can efficiently communicate to the
- * runtime and drivers the tensors that define a model. See
- * {@link ANeuralNetworksModel_setOperandValueFromMemory}. An application
- * should typically create one shared memory object that contains every constant tensor
- * needed to define a model. {@link ANeuralNetworksMemory_createFromFd} can be
- * used to create shared memory from a file handle.
- * {@link ANeuralNetworksMemory_createFromAHardwareBuffer} can be used to
- * create shared memory from an AHardwareBuffer handle.
- *
- * Memory objects can also be used to specify the input and output arguments of
- * an execution. See {@link ANeuralNetworksExecution_setInputFromMemory}
- * and {@link ANeuralNetworksExecution_setOutputFromMemory}.
- *
- * Available since API level 27.
- */
-typedef struct ANeuralNetworksMemory ANeuralNetworksMemory;
-/**
- * ANeuralNetworksModel is an opaque type that contains a description of the
- * mathematical operations that constitute the model.
- *
- * <p>Build the model by calling<ul>
- * <li>{@link ANeuralNetworksModel_create}</li>
- * <li>{@link ANeuralNetworksModel_addOperation}</li>
- * <li>{@link ANeuralNetworksModel_addOperand}</li>
- * </ul>
- *
- * This forms a graph in which each operation and operand is a node, a
- * directed edge from an operand to an operation indicates that the
- * operand is an input to the operation, and a directed edge from an
- * operation to an operand indicates that the operand is an output
- * from the operation. This graph must be acyclic.
- *
- * A model is completed by calling {@link ANeuralNetworksModel_finish}.
- * A model is destroyed by calling {@link ANeuralNetworksModel_free}.
- *
- * <p>A model cannot be modified once {@link ANeuralNetworksModel_finish}
- * has been called on it.</p>
- *
- * <p>It is the application's responsibility to make sure that only one thread
- * modifies a model at a given time. It is however safe for more than one
- * thread to use the model once {@link ANeuralNetworksModel_finish} has returned.</p>
- *
- * <p>It is also the application's responsibility to ensure that there are no other
- * uses of the model after calling {@link ANeuralNetworksModel_free}.
- * This includes any compilation or execution object created using the model.</p>
- *
- * Available since API level 27.
- */
-typedef struct ANeuralNetworksModel ANeuralNetworksModel;
-/**
- * ANeuralNetworksCompilation is an opaque type that can be used to compile
- * a machine learning model.
- *
- * <p>To use:<ul>
- *    <li>Create a new compilation instance by calling the
- *        {@link ANeuralNetworksCompilation_create} function or
- *        {@link ANeuralNetworksCompilation_createForDevices}.</li>
- *    <li>Set any desired properties on the compilation (for example,
- *        {@link ANeuralNetworksCompilation_setPreference}).</li>
- *    <li>Optionally, set the caching signature and the cache directory on the
- *        compilation by calling {@link ANeuralNetworksCompilation_setCaching}.</li>
- *    <li>Complete the compilation with {@link ANeuralNetworksCompilation_finish}.</li>
- *    <li>Use the compilation as many times as needed
- *        with {@link ANeuralNetworksExecution_create} and
- *        {@link ANeuralNetworksBurst_create}.</li>
- *    <li>Destroy the compilation with {@link ANeuralNetworksCompilation_free}
- *        once all executions using the compilation have completed.</li></ul></p>
- *
- * A compilation is completed by calling {@link ANeuralNetworksCompilation_finish}.
- * A compilation is destroyed by calling {@link ANeuralNetworksCompilation_free}.
- *
- * <p>A compilation cannot be modified once {@link ANeuralNetworksCompilation_finish}
- * has been called on it.</p>
- *
- * <p>It is the application's responsibility to make sure that only
- * one thread modifies a compilation at a given time. It is however
- * safe for more than one thread to use the compilation once
- * {@link ANeuralNetworksCompilation_finish} has returned.</p>
- *
- * <p>It is also the application's responsibility to ensure that there are no other
- * uses of the compilation after calling {@link ANeuralNetworksCompilation_free}.
- * This includes any execution object created using the compilation.</p>
- *
- * Available since API level 27.
- */
-typedef struct ANeuralNetworksCompilation ANeuralNetworksCompilation;
-/**
- * ANeuralNetworksExecution is an opaque type that can be used to apply a machine
- * learning model to a set of inputs.
- *
- * <p>To use:<ul>
- *    <li>Create a new execution instance by calling the
- *        {@link ANeuralNetworksExecution_create} function.</li>
- *    <li>Associate input buffers or memory regions to the model inputs with
- *        {@link ANeuralNetworksExecution_setInput} or
- *        {@link ANeuralNetworksExecution_setInputFromMemory}.</li>
- *    <li>Associate output buffers or memory regions to the model outputs with
- *        {@link ANeuralNetworksExecution_setOutput} or
- *        {@link ANeuralNetworksExecution_setOutputFromMemory}.</li>
- *    <li>Apply the model with one of the following:</li><ul>
- *        <li>Asynchronously with {@link ANeuralNetworksExecution_startCompute},
- *            waiting for the execution to complete with
- *            {@link ANeuralNetworksEvent_wait}.</li>
- *        <li>Synchronously with {@link ANeuralNetworksExecution_compute}.</li>
- *        <li>Synchronously as part of an execution burst with
- *            {@link ANeuralNetworksExecution_burstCompute}.</li></ul>
- *    <li>Destroy the execution with
- *        {@link ANeuralNetworksExecution_free}.</li></ul></p>
- *
- * <p>An output buffer or memory region must not overlap with any
- * other output buffer or memory region, with an input buffer or
- * memory region, or with an operand value in a memory object
- * ({@link ANeuralNetworksModel_setOperandValueFromMemory}).</p>
- *
- * <p>An execution cannot be modified once
- * {@link ANeuralNetworksExecution_compute} or
- * {@link ANeuralNetworksExecution_startCompute} has been called on it.</p>
- *
- * <p>An execution can be applied to a model with
- * {@link ANeuralNetworksExecution_compute} or
- * {@link ANeuralNetworksExecution_startCompute} only once. Create new
- * executions to do new evaluations of the model.</p>
- *
- * <p>It is the application's responsibility to make sure that only one thread
- * modifies an execution at a given time. It is however safe for more than one
- * thread to use {@link ANeuralNetworksEvent_wait} at the same time.</p>
- *
- * <p>It is also the application's responsibility to ensure that there are no other
- * uses of the execution after calling {@link ANeuralNetworksExecution_free}.</p>
- *
- * <p>Multiple executions can be scheduled and evaluated concurrently, either by
- * means of {@link ANeuralNetworksExecution_compute} (which is synchronous) in
- * different threads or by means of
- * {@link ANeuralNetworksExecution_startCompute} (which is asynchronous). The
- * runtime makes no guarantee on the ordering of completion of executions. If
- * it's important to the application, the application should enforce the
- * ordering by ensuring that one execution completes before the next is
- * scheduled (for example, by scheduling all executions synchronously within a
- * single thread, or by scheduling all executions asynchronously and using
- * {@link ANeuralNetworksEvent_wait} between calls to
- * {@link ANeuralNetworksExecution_startCompute}).</p>
- *
- * Available since API level 27.
- */
-typedef struct ANeuralNetworksExecution ANeuralNetworksExecution;
-/**
- * Parameters for ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL operand.
- */
-typedef struct ANeuralNetworksSymmPerChannelQuantParams {
-    /* The index of the channel dimension. */
-    uint32_t channelDim;
-    /** The size of the scale array. Should be equal to dimension[channelDim] of the Operand. */
-    uint32_t scaleCount;
-    /** The array of scaling values for each channel. Each value must be greater than zero. */
-    const float* scales;
-} ANeuralNetworksSymmPerChannelQuantParams;
-/**
- * ANeuralNetworksBurst is an opaque type that can be used to reduce the latency
- * of a rapid sequence of executions. It will likely cause overhead if only used
- * for a single execution.
- *
- * ANeuralNetworksBurst serves as a context object for any number of inferences
- * using {@link ANeuralNetworksExecution} objects. An ANeuralNetworksBurst
- * object and the {@link ANeuralNetworksExecution} objects used with it must all
- * have been created from the same {@link ANeuralNetworksCompilation} object.
- *
- * This object is also used as a hint to drivers, providing insight to the
- * lifetime of a rapid sequence of executions. For example, a driver may choose
- * to increase the clock frequency of its accelerator for the lifetime of a
- * burst object.
- *
- * <p>To use:<ul>
- *    <li>Create a new burst object by calling the
- *        {@link ANeuralNetworksBurst_create} function.</li>
- *    <li>For each execution:</li><ul>
- *        <li>Create {@link ANeuralNetworksExecution} and configure its
- *            properties (see {@link ANeuralNetworksExecution} for details).</li>
- *        <li>Apply the model synchronously with
- *            {@link ANeuralNetworksExecution_burstCompute}, reusing the same
- *            {@link ANeuralNetworksBurst} with the new
- *            {@link ANeuralNetworksExecution}.</li>
- *        <li>Use and free the {@link ANeuralNetworksExecution}.</li></ul>
- *    <li>Destroy the burst with
- *        {@link ANeuralNetworksBurst_free}.</li></ul></p>
- *
- * Available since API level 29.
- */
-typedef struct ANeuralNetworksBurst ANeuralNetworksBurst;
-/**
- * ANeuralNetworksOperandType describes the type of an operand.
- * This structure is used to describe both scalars and tensors.
- *
- * A tensor operand type must have a specified rank (number of
- * dimensions) but may have any of its dimensions unspecified.
- *
- * A tensor operand type with all dimensions specified is "fully
- * specified".  Whenever possible (i.e., whenever the dimensions are
- * known at model construction time), a tensor operand type should be
- * (but is not required to be) fully specified, in order to enable the
- * best possible performance.
- *
- * If a tensor operand's type is not fully specified, the dimensions
- * of the operand are deduced from the operand types and values of the
- * operation for which that operand is an output.
- *
- * <p>In the following situations, a tensor operand type must be fully
- * specified:<ul>
- *     <li>The operand has a constant value, set by
- *         {@link ANeuralNetworksModel_setOperandValue} (with a
- *         non-nullptr buffer) or
- *         {@link ANeuralNetworksModel_setOperandValueFromMemory}.</li>
- *     <li>The operand is a model input or model output (see
- *         {@link ANeuralNetworksModel_identifyInputsAndOutputs}).  A
- *         fully specified tensor operand type must either be provided
- *         to {@link ANeuralNetworksModel_addOperand}; or it must be
- *         provided to the corresponding
- *         {@link ANeuralNetworksExecution_setInput},
- *         {@link ANeuralNetworksExecution_setInputFromMemory},
- *         {@link ANeuralNetworksExecution_setOutput}, or
- *         {@link ANeuralNetworksModel_setOperandValueFromMemory}.
- *         EXCEPTION: If the input or output is optional and omitted
- *         (by passing nullptr for buffer to
- *         {@link ANeuralNetworksExecution_setInput} or
- *         {@link ANeuralNetworksExecution_setOutput}) then it need
- *         not have a fully specified tensor operand type.</li></ul>
- *
- * A tensor operand type with some number of unspecified dimensions is
- * represented by setting each unspecified dimension to 0.
- *
- * Available since API level 27.
- */
-typedef struct ANeuralNetworksOperandType {
-    /** The data type, e.g ANEURALNETWORKS_INT8. */
-    int32_t type;
-    /** The number of dimensions (rank). It should be 0 for scalars. */
-    uint32_t dimensionCount;
-    /** The dimensions of the tensor. It should be nullptr for scalars. */
-    const uint32_t* dimensions;
-    /** These two fields are only used for quantized tensors.
-     * They should be zero for scalars and non-fixed point tensors.
-     * The dequantized value of each entry is (value - zeroPoint) * scale.
-     */
-    float scale;
-    int32_t zeroPoint;
-} ANeuralNetworksOperandType;
-typedef int32_t ANeuralNetworksOperationType;
-/**
- * ANeuralNetworksEvent is an opaque type that represents an event
- * that will be signaled once an execution completes.
- *
- * Available since API level 27.
- */
-typedef struct ANeuralNetworksEvent ANeuralNetworksEvent;
-/**
- * ANeuralNetworksDevice is an opaque type that represents a device.
- *
- * This type is used to query basic properties and supported operations of the corresponding
- * device, and control which device(s) a model is to be run on.
- *
- * Available since API level 29.
- */
-typedef struct ANeuralNetworksDevice ANeuralNetworksDevice;
-/**
- * Get the number of available devices.
- *
- * @param numDevices Used to return the number of devices.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworks_getDeviceCount(uint32_t* numDevices);
-/**
- * Get the representation of the specified device.
- *
- * @param devIndex The index of the specified device. Must be less than the
-                   number of available devices.
- * @param device The representation of the specified device.
- *               The same representation will always be returned for the specified
- *               device.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworks_getDevice(uint32_t devIndex, ANeuralNetworksDevice** device);
-/**
- * Get the name of the specified device.
- *
- * @param device The representation of the specified device.
- * @param name   The returned name of the specified device. The name will be in UTF-8
- *               and will be null-terminated. It will be recognizable as a known device name
- *               rather than a cryptic string. For devices with feature level 29 and above, the
- *               format of the name is {VENDOR}-{DEVICE}, e.g. “google-ipu”. For devices with
- *               feature level 28 or lower, the name will always be “unknown-device”.
- *               The name will remain valid for the duration of the application.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksDevice_getName(const ANeuralNetworksDevice* device, const char** name);
-/**
- * Get the type of a given device.
- *
- * The device type can be used to help application developers to distribute Machine Learning
- * workloads and other workloads such as graphical rendering.
- * E.g., for an app which renders AR scenes based on real time object detection results,
- * the developer could choose an ACCELERATOR type device for ML workloads, and reserve GPU
- * for graphical rendering.
- *
- * @param device The representation of the specified device.
- * @param type The returned {@link DeviceTypeCode} of the specified device.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksDevice_getType(const ANeuralNetworksDevice* device, int32_t* type);
-/**
- * Get the version of the driver implementation of the specified device.
- *
- * It’s the responsibility of the driver implementor to insure that this version string
- * uniquely distinguishes this implementation from all previous implementations.
- *
- * This version string must not be confused with the feature level which is solely defined
- * by {@link ANeuralNetworksDevice_getFeatureLevel}. There is no implicit ordering of the versions.
- * For example, it is not possible to filter all drivers older than a certain version.
- *
- * Application developers may use this version string to avoid or prefer specific driver
- * implementations. For example, an application may want to do so because:
- *     - A specific version of the driver does not provide the required performance,
- *       perhaps because of a performance regression.
- *     - A specific version of the driver has a bug or returns results that don’t match
- *       the minimum precision requirement for the application.
- *
- * @param device The representation of the specified device.
- * @param version The returned version string of the driver for the specified device. The
- *                string will be in UTF-8 and will be null-terminated. For devices with feature
- *                level 28 or lower, "UNKOWN" will be returned. The version string will remain
- *                valid for the duration of the application.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksDevice_getVersion(const ANeuralNetworksDevice* device, const char** version);
-/**
- * Get the supported NNAPI version of the specified device.
- *
- * Each device has a supported feature level, which is the most advanced feature this driver
- * implements. For example, if the driver implements the features introduced in Android P,
- * but does not implement the features introduced after Android P, the value would be 28.
- * Developers could decide whether or not the specified device should be used for a Model that
- * has certain feature requirements.
- *
- * @param device The representation of the specified device.
- * @param featureLevel The API level of the most advanced feature this driver implements.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksDevice_getFeatureLevel(const ANeuralNetworksDevice* device,
-                                          int64_t* featureLevel);
-/**
- * Get the supported operations for a specified set of devices. If multiple devices
- * are selected, the supported operation list is a union of supported operations of all
- * selected devices.
- *
- * @param model The model to be queried.
- * @param devices The set of devices. Must not contain duplicates.
- * @param numDevices The number of devices in the set.
- * @param supportedOps The boolean array to be filled. True means supported. The size of the
- *                     boolean array must be at least as large as the number of operations
- *                     in the model. The order of elements in the supportedOps array matches
- *                     the order in which the corresponding operations were added to the model.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksModel_getSupportedOperationsForDevices(
-        const ANeuralNetworksModel* model, const ANeuralNetworksDevice* const* devices,
-        uint32_t numDevices, bool* supportedOps);
-/**
- * Create a {@link ANeuralNetworksCompilation} to compile the given model for a specified set
- * of devices. If more than one device is specified, the compilation will
- * distribute the workload automatically across the devices. The model must be fully
- * supported by the specified set of devices. This means that
- * ANeuralNetworksModel_getSupportedOperationsForDevices() must have returned true for every
- * operation for that model/devices pair.
- *
- * @param model The {@link ANeuralNetworksModel} to be compiled.
- * @param devices The set of devices. Must not contain duplicates.
- * @param numDevices The number of devices in the set.
- * @param compilation The newly created object or NULL if unsuccessful.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
- *         if the model is invalid.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksCompilation_createForDevices(ANeuralNetworksModel* model,
-                                                const ANeuralNetworksDevice* const* devices,
-                                                uint32_t numDevices,
-                                                ANeuralNetworksCompilation** compilation);
-/**
- * Sets the compilation caching signature and the cache directory.
- *
- * Provides optional caching information to the runtime for faster repeated
- * compilation.
- *
- * See {@link ANeuralNetworksCompilation} for information on multithreaded usage.
- *
- * @param compilation The compilation to be modified.
- * @param cacheDir The cache directory for the runtime to store and retrieve caching
- *                 data. It is recommended to use the code cache directory provided
- *                 by the Android runtime. If not using the code cache directory, the
- *                 user should choose a directory local to the application, and is
- *                 responsible to managing the cache entries.
- * @param token The token provided by the user to specify a model must be of length
- *              ANEURALNETWORKS_BYTE_SIZE_OF_CACHE_TOKEN. The user should ensure that
- *              the token is unique to a model within the application. The NNAPI
- *              runtime cannot detect token collisions; a collision will result in a
- *              failed execution or in a successful execution that produces incorrect
- *              output values.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksCompilation_setCaching(ANeuralNetworksCompilation* compilation,
-                                          const char* cacheDir, const uint8_t* token);
-/**
- * Schedule synchronous evaluation of the execution.
- *
- * <p>Schedules synchronous evaluation of the execution. Returns once the
- * execution has completed and the outputs are ready to be consumed.
- * </p>
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * See {@link ANeuralNetworksExecution_startCompute} for asynchronous execution.
- * Synchronous execution incurs lower overhead than asynchronous execution.
- *
- * Available since API level 29.
- *
- * @param execution The execution to be scheduled and executed.
- *
- * @return ANEURALNETWORKS_NO_ERROR if the execution completed normally.
- *         ANEURALNETWORKS_UNMAPPABLE if the execution input or output memory cannot
- *         be properly mapped.
- */
-int ANeuralNetworksExecution_compute(ANeuralNetworksExecution* execution);
-/**
- * Get the dimensional information of the specified output operand of the model of the
- * {@link ANeuralNetworksExecution}.
- *
- * On asynchronous execution initiated by {@link ANeuralNetworksExecution_startCompute},
- * {@link ANeuralNetworksEvent_wait} must be called prior to this function to recuperate
- * the resources used by the execution.
- *
- * @param execution The execution to be queried.
- * @param index The index of the output argument we are querying. It is
- *              an index into the lists passed to
- *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is not
- *              the index associated with {@link ANeuralNetworksModel_addOperand}.
- * @param rank The rank of the output operand.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_OUTPUT_INSUFFICIENT_SIZE
- *         if the target output is provided an insufficient buffer at execution time,
- *         ANEURALNETWORKS_BAD_DATA if the index is invalid.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksExecution_getOutputOperandRank(ANeuralNetworksExecution* execution,
-                                                  int32_t index, uint32_t* rank);
-/**
- * Get the dimensional information of the specified output operand of the model of the
- * {@link ANeuralNetworksExecution}. The target output operand cannot be a scalar.
- *
- * On asynchronous execution initiated by {@link ANeuralNetworksExecution_startCompute},
- * {@link ANeuralNetworksEvent_wait} must be called prior to this function to recuperate
- * the resources used by the execution.
- *
- * @param execution The execution to be queried.
- * @param index The index of the output argument we are querying. It is an index into the lists
- *              passed to {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is not
- *              the index associated with {@link ANeuralNetworksModel_addOperand}.
- * @param dimensions The dimension array to be filled. The size of the array must be exactly as
- *                   large as the rank of the output operand to be queried in the model.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_OUTPUT_INSUFFICIENT_SIZE
- *         if the target output is provided an insufficient buffer at execution time,
- *         ANEURALNETWORKS_BAD_DATA if the index is invalid or if the target is a scalar.
- *
- * Available since API level 29.
- */
-int ANeuralNetworksExecution_getOutputOperandDimensions(ANeuralNetworksExecution* execution,
-                                                        int32_t index, uint32_t* dimensions);
-/**
- * Create a {@link ANeuralNetworksBurst} to apply the given compilation.
- * This only creates the burst object. Computation is only performed once
- * {@link ANeuralNetworksExecution_burstCompute} is invoked with a valid
- * {@link ANeuralNetworksExecution} and {@link ANeuralNetworksBurst}.
- *
- * <p>The provided compilation must outlive the burst object.</p>
- *
- * Available since API level 29.
- *
- * @param compilation The {@link ANeuralNetworksCompilation} to be evaluated.
- * @param burst The newly created object or NULL if unsuccessful.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
- *         if the compilation is invalid.
- */
-int ANeuralNetworksBurst_create(ANeuralNetworksCompilation* compilation,
-                                ANeuralNetworksBurst** burst) __INTRODUCED_IN(29);
-/**
- * Destroys the burst object.
- *
- * Available since API level 29.
- *
- * @param burst The burst object to be destroyed. Passing NULL is acceptable and
- *              results in no operation.
- */
-void ANeuralNetworksBurst_free(ANeuralNetworksBurst* burst) __INTRODUCED_IN(29);
-/**
- * Schedule synchronous evaluation of the execution on a burst object.
- *
- * <p>Schedules synchronous evaluation of the execution. Returns once the
- * execution has completed and the outputs are ready to be consumed.</p>
- *
- * <p>There must be at most one {@link ANeuralNetworksExecution} processing at
- * any given time for any given burst object. Any
- * {@link ANeuralNetworksExecution} launched before the previous has finished
- * will result in ANEURALNETWORKS_BAD_STATE.</p>
- *
- * Available since API level 29.
- *
- * @param burst The burst object to execute on.
- * @param execution The execution to be scheduled and executed. The execution
- *                  must be created from the same {@link
- *                  ANeuralNetworksCompilation} as the burst object.
- *
- * @return ANEURALNETWORKS_NO_ERROR if the execution completed normally.
- */
-int ANeuralNetworksExecution_burstCompute(ANeuralNetworksExecution* execution,
-                                          ANeuralNetworksBurst* burst) __INTRODUCED_IN(29);
-/**
- * Creates a shared memory object from an AHardwareBuffer handle.
- *
- * If the shared memory is backed by an AHardwareBuffer of AHARDWAREBUFFER_FORMAT_BLOB
- * format, it can be used the same way as shared memory created from a file handle. See
- * {@link ANeuralNetworksMemory} for a description on how to use this shared memory.
- *
- * If the shared memory is backed by an AHardwareBuffer of a format other than
- * AHARDWAREBUFFER_FORMAT_BLOB, it can only be used for Model inputs and outputs.
- * When calling {@link ANeuralNetworksExecution_setInputFromMemory} or
- * {@link ANeuralNetworksExecution_setOutputFromMemory} with the shared memory, both
- * offset and length must be set to zero and the entire memory region will be
- * associated with the specified input or output operand. There is no guarantee
- * that an arbitrary AHardwareBuffer_Format and AHardwareBuffer_UsageFlags combination
- * can be used by arbitrary devices. The execution will fail if selected set of devices
- * cannot consume the buffer.
- *
- * Calling {@link ANeuralNetworksModel_setOperandValueFromMemory} with shared memory
- * backed by an AHardwareBuffer of a format other than AHARDWAREBUFFER_FORMAT_BLOB is
- * disallowed.
- *
- * TODO(miaowang): add documentation about intended usage with introspection API.
- *
- * Available since API level 29.
- *
- * @param ahwb The AHardwareBuffer handle.
- * @param memory The memory object to be created.
- *               Set to NULL if unsuccessful.
- *
- * @return ANEURALNETWORKS_NO_ERROR if the request completed normally.
- *
- * @see AHardwareBuffer
- */
-int ANeuralNetworksMemory_createFromAHardwareBuffer(const AHardwareBuffer* ahwb,
-                                                    ANeuralNetworksMemory** memory);
-/**
- * Specifies whether duration of the {@link ANeuralNetworksExecution} is to be measured.
- * By default, duration is not measured.
- *
- * The {@link ANeuralNetworksExecution} must have been created with
- * {@link ANeuralNetworksCompilation_createForDevices} with numDevices = 1.
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * Available since API level 29.
- *
- * @param execution The execution to be modified.
- * @param measure 'true' if duration is to be measured, 'false' if not.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksExecution_setMeasureTiming(ANeuralNetworksExecution* execution, bool measure);
-/**
- * Different duration measurements.
- *
- * Durations are measured in nanoseconds.
- *
- * Available since API level 29.
- */
-typedef enum {
-    // Execution time on hardware (not driver, which runs on host processor).
-    ANEURALNETWORKS_DURATION_ON_HARDWARE = 0,
-    // Execution time in driver (including time on hardware).  Excludes overhead
-    // such as that of the runtime itself and the IPC needed for the runtime to
-    // communicate with the driver.
-    ANEURALNETWORKS_DURATION_IN_DRIVER = 1,
-} DurationCode;
-/**
- * Get the time spent in the specified {@link ANeuralNetworksExecution}, in nanoseconds.
- * The execution must have completed.
- *
- * @param execution The execution to be queried.
- * @param durationCode The measurement to be queried, specified by {@link DurationCode}.
- * @param duration The returned duration. If no measurement was requested by
- *                 {@link ANeuralNetworksExecution_setMeasureTiming}, or for some other
- *                 reason the duration is not available, UINT64_MAX will be returned.
- *                 A particular device need not support any given measurement.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksExecution_getDuration(const ANeuralNetworksExecution* execution,
-                                         int32_t durationCode, uint64_t* duration);
-/**
- * Creates a shared memory object from a file descriptor.
- *
- * The shared memory is backed by a file descriptor via mmap.
- * See {@link ANeuralNetworksMemory} for a description on how to use
- * this shared memory.
- *
- * Available since API level 27.
- *
- * @param size The requested size in bytes.
- *             Must not be larger than the file size.
- * @param prot The desired memory protection for the mapping.
- *             It is either PROT_NONE or the bitwise OR of one or
- *             more of the following flags: PROT_READ, PROT_WRITE.
- * @param fd The requested file descriptor.
- *           The file descriptor has to be mmap-able. The file
- *           descriptor will be duplicated.
- * @param offset The offset to the beginning of the file of the area to map.
- *               The offset has to be aligned to a page size.
- * @param memory The memory object to be created.
- *               Set to NULL if unsuccessful.
- *
- * @return ANEURALNETWORKS_NO_ERROR if the request completed normally.
- */
-int ANeuralNetworksMemory_createFromFd(size_t size, int protect, int fd, size_t offset,
-                                       ANeuralNetworksMemory** memory) __INTRODUCED_IN(27);
-/**
- * Delete a memory object.
- *
- * Destroys the object used by the run time to keep track of the memory.
- * This will free the underlying actual memory if no other code has open
- * handles to this memory.
- *
- * Available since API level 27.
- *
- * @param memory The memory object to be freed.
- */
-void ANeuralNetworksMemory_free(ANeuralNetworksMemory* memory) __INTRODUCED_IN(27);
-/**
- * Create an empty {@link ANeuralNetworksModel}.
- *
- * <p>This only creates the object. Computation is performed once
- * {@link ANeuralNetworksExecution_compute} or
- * {@link ANeuralNetworksExecution_startCompute} is invoked.
- *
- * The model should be constructed with calls to
- * {@link ANeuralNetworksModel_addOperation} and
- * {@link ANeuralNetworksModel_addOperand}
- *
- * <p>{@link ANeuralNetworksModel_finish} should be called once the model
- * has been fully constructed.</p>
- *
- * <p>{@link ANeuralNetworksModel_free} should be called once the model
- * is no longer needed.</p>
- *
- * Available since API level 27.
- *
- * @param model The {@link ANeuralNetworksModel} to be created.
- *              Set to NULL if unsuccessful.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksModel_create(ANeuralNetworksModel** model) __INTRODUCED_IN(27);
-/**
- * Destroy a model.
- *
- * The model need not have been finished by a call to
- * {@link ANeuralNetworksModel_finish}.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param model The model to be destroyed. Passing NULL is acceptable and
- *              results in no operation.
- */
-void ANeuralNetworksModel_free(ANeuralNetworksModel* model) __INTRODUCED_IN(27);
-/**
- * Indicate that we have finished modifying a model. Required before
- * calling {@link ANeuralNetworksCompilation_create} and
- * {@link ANeuralNetworksCompilation_createForDevices}.
- *
- * An application is responsible to make sure that no other thread uses
- * the model at the same time.
- *
- * This function must only be called once for a given model.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param model The model to be finished.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksModel_finish(ANeuralNetworksModel* model) __INTRODUCED_IN(27);
-/**
- * Add an operand to a model.
- *
- * The order in which the operands are added is important. The first one added
- * to a model will have the index value 0, the second 1, etc. These indexes are
- * used as operand identifiers in
- * {@link ANeuralNetworksModel_addOperation},
- * {@link ANeuralNetworksModel_identifyInputsAndOutputs},
- * {@link ANeuralNetworksModel_setOperandValue},
- * {@link ANeuralNetworksModel_setOperandValueFromMemory},
- * {@link ANeuralNetworksExecution_setInput},
- * {@link ANeuralNetworksExecution_setInputFromMemory},
- * {@link ANeuralNetworksExecution_setOutput},
- * {@link ANeuralNetworksExecution_setOutputFromMemory} and
- * {@link ANeuralNetworksExecution_setOperandValue}.
- *
- * <p>Every operand must be referenced in exactly one of the following
- * ways:<ul>
- *    <li>It is identified as a model input with
- *        {@link ANeuralNetworksModel_identifyInputsAndOutputs}.</li>
- *    <li>It is identified as a constant with
- *        {@link ANeuralNetworksModel_setOperandValue} or
- *        {@link ANeuralNetworksModel_setOperandValueFromMemory}.</li>
- *    <li>It is identified as an output of exactly one operation with
- *        {@link ANeuralNetworksModel_addOperation}.</li></p>
- * <p>An operand that is identified as a model input or as a constant
- * must not also be identified as a model output with
- * {@link ANeuralNetworksModel_identifyInputsAndOutputs}.</p>
- *
- * To build a model that can accommodate inputs of various sizes, as
- * you may want to do for a CNN, leave unspecified the dimensions that
- * will vary at run time.  If you do so, fully specify dimensions
- * when calling {@link ANeuralNetworksExecution_setInput} or
- * {@link ANeuralNetworksExecution_setInputFromMemory}.
- *
- * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has been
- * called will return an error.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param model The model to be modified.
- * @param type The {@link ANeuralNetworksOperandType} that describes the shape
- *             of the operand.  Neither the {@link ANeuralNetworksOperandType}
- *             nor the dimensions it points to need to outlive the call to
- *             {@link ANeuralNetworksModel_addOperand}.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksModel_addOperand(ANeuralNetworksModel* model,
-                                    const ANeuralNetworksOperandType* type) __INTRODUCED_IN(27);
-/**
- * Sets an operand to a constant value.
- *
- * Values of length smaller or equal to
- * {@link ANEURALNETWORKS_MAX_SIZE_OF_IMMEDIATELY_COPIED_VALUES}
- * are immediately copied into the model.
- *
- * For values of length greater than {@link ANEURALNETWORKS_MAX_SIZE_OF_IMMEDIATELY_COPIED_VALUES},
- * a pointer to the buffer is stored within the model. The application is responsible
- * for not changing the content of this region until all executions using this model
- * have completed. As the data may be copied during processing, modifying the data
- * after this call yields undefined results.
- *
- * For large tensors, using {@link ANeuralNetworksModel_setOperandValueFromMemory}
- * is likely to be more efficient.
- *
- * To indicate that an optional operand should be considered missing,
- * pass nullptr for buffer and 0 for length.
- *
- * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has been
- * called will return an error.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param model The model to be modified.
- * @param index The index of the model operand we're setting.
- * @param buffer A pointer to the data to use.
- * @param length The size in bytes of the data value.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksModel_setOperandValue(ANeuralNetworksModel* model, int32_t index,
-                                         const void* buffer, size_t length) __INTRODUCED_IN(27);
-/**
- * Sets an operand's per channel quantization parameters.
- *
- * Sets parameters required by a tensor of type
- * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}.
- * This function must be called for every tensor of type
- * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} before
- * calling {@link ANeuralNetworksModel_finish}.
- *
- * Available since API level 29.
- *
- * @param model The model to be modified.
- * @param index The index of the model operand we're setting.
- * @param channelQuant The per channel quantization parameters for the operand.
- *                    No memory in this struct needs to outlive the call to
- *                    this function.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksModel_setOperandSymmPerChannelQuantParams(
-        ANeuralNetworksModel* model, int32_t index,
-        const ANeuralNetworksSymmPerChannelQuantParams* channelQuant) __INTRODUCED_IN(29);
-/**
- * Sets an operand to a value stored in a memory object.
- *
- * The content of the memory is not copied. A reference to that memory is stored
- * inside the model. The application is responsible for not changing the content
- * of the memory region until all executions using this model have completed.
- * As the data may be copied during processing, modifying the data after this call
- * yields undefined results.
- *
- * To indicate that an optional operand should be considered missing,
- * use {@link ANeuralNetworksModel_setOperandValue} instead, passing nullptr for buffer.
- *
- * Is disallowed to set an operand value with shared memory backed by an AHardwareBuffer
- * of a format other than AHARDWAREBUFFER_FORMAT_BLOB.
- *
- * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has been
- * called will return an error.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- * See {@link ANeuralNetworksMemory_createFromAHardwarBuffer} for information on
- * AHardwareBuffer usage.
- *
- * Available since API level 27.
- *
- * @param model The model to be modified.
- * @param index The index of the model operand we're setting.
- * @param buffer A pointer to the data to use.
- * @param memory The memory containing the data.
- * @param offset This specifies the location of the data within the memory.
- *               The offset is in bytes from the start of memory.
- * @param length The size in bytes of the data value.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksModel_setOperandValueFromMemory(ANeuralNetworksModel* model, int32_t index,
-                                                   const ANeuralNetworksMemory* memory,
-                                                   size_t offset, size_t length)
-        __INTRODUCED_IN(27);
-/**
- * Add an operation to a model.
- *
- * @param model The model to be modified.
- * @param type The {@link ANeuralNetworksOperationType} of the operation.
- * @param inputCount The number of entries in the inputs array.
- * @param inputs An array of indexes identifying each operand.
- * @param outputCount The number of entries in the outputs array.
- * @param outputs An array of indexes identifying each operand.
- *
- * The operands specified by inputs and outputs must have been
- * previously added by calls to {@link ANeuralNetworksModel_addOperand}.
- *
- * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has been
- * called will return an error.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksModel_addOperation(ANeuralNetworksModel* model,
-                                      ANeuralNetworksOperationType type, uint32_t inputCount,
-                                      const uint32_t* inputs, uint32_t outputCount,
-                                      const uint32_t* outputs) __INTRODUCED_IN(27);
-/**
- * Specifies which operands will be the model's inputs and
- * outputs. Every model must have at least one input and one output.
- *
- * An operand cannot be used for both input and output. Doing so will
- * return an error.
- *
- * @param model The model to be modified.
- * @param inputCount The number of entries in the inputs array.
- * @param inputs An array of indexes identifying the input operands.
- * @param outputCount The number of entries in the outputs array.
- * @param outputs An array of indexes identifying the output operands.
- *
- * The operands specified by inputs and outputs must have been
- * previously added by calls to {@link ANeuralNetworksModel_addOperand}.
- *
- * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has been
- * called will return an error.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- */
-int ANeuralNetworksModel_identifyInputsAndOutputs(ANeuralNetworksModel* model, uint32_t inputCount,
-                                                  const uint32_t* inputs, uint32_t outputCount,
-                                                  const uint32_t* outputs) __INTRODUCED_IN(27);
-/**
- * Specifies whether {@link ANEURALNETWORKS_TENSOR_FLOAT32} is allowed to be
- * calculated with range and/or precision as low as that of the IEEE 754 16-bit
- * floating-point format. By default, {@link ANEURALNETWORKS_TENSOR_FLOAT32}
- * must be calculated using at least the range and precision of the IEEE 754
- * 32-bit floating-point format.
- *
- * @param model The model to be modified.
- * @param allow 'true' indicates {@link ANEURALNETWORKS_TENSOR_FLOAT32} may be
- *              calculated with range and/or precision as low as that of the
- *              IEEE 754 16-bit floating point format. 'false' indicates
- *              {@link ANEURALNETWORKS_TENSOR_FLOAT32} must be calculated using
- *              at least the range and precision of the IEEE 754 32-bit floating
- *              point format.
- *
- * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has been
- * called will return an error.
- *
- * Available since API level 28.
- *
- * See {@link ANeuralNetworksModel} for information on multithreaded usage.
- */
-int ANeuralNetworksModel_relaxComputationFloat32toFloat16(ANeuralNetworksModel* model, bool allow)
-        __INTRODUCED_IN(28);
-/**
- * Create a {@link ANeuralNetworksCompilation} to compile the given model.
- *
- * <p>This only creates the object. Compilation is only performed once
- * {@link ANeuralNetworksCompilation_finish} is invoked.</p>
- *
- * <p>{@link ANeuralNetworksCompilation_finish} should be called once
- * all desired properties have been set on the compilation.</p>
- *
- * <p>{@link ANeuralNetworksModel_free} should be called once the compilation
- * is no longer needed.</p>
- *
- * <p>The provided model must outlive the compilation.</p>
- *
- * The model must already have been finished by a call to
- * {@link ANeuralNetworksModel_finish}.
- *
- * See {@link ANeuralNetworksCompilation} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param model The {@link ANeuralNetworksModel} to be compiled.
- * @param compilation The newly created object or NULL if unsuccessful.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
- *         if the model is invalid.
- */
-int ANeuralNetworksCompilation_create(ANeuralNetworksModel* model,
-                                      ANeuralNetworksCompilation** compilation) __INTRODUCED_IN(27);
-/**
- * Destroy a compilation.
- *
- * The compilation need not have been finished by a call to
- * {@link ANeuralNetworksModel_finish}.
- *
- * See {@link ANeuralNetworksCompilation} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param compilation The compilation to be destroyed. Passing NULL is acceptable and
- *                    results in no operation.
- */
-void ANeuralNetworksCompilation_free(ANeuralNetworksCompilation* compilation) __INTRODUCED_IN(27);
-/**
- * Sets the execution preference.
- *
- * <p>Provides guidance to the runtime when trade-offs are possible.</p>
- *
- * See {@link ANeuralNetworksCompilation} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param compilation The compilation to be modified.
- * @param preference Either {@link PREFER_LOW_POWER},
- *                  {@link PREFER_SINGLE_FAST_ANSWER}, or
- *                  {@link PREFER_SUSTAINED_SPEED}.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksCompilation_setPreference(ANeuralNetworksCompilation* compilation,
-                                             int32_t preference) __INTRODUCED_IN(27);
-/**
- * Indicate that we have finished modifying a compilation. Required before
- * calling {@link ANeuralNetworksExecution_create}.
- *
- * An application is responsible to make sure that no other thread uses
- * the compilation at the same time.
- *
- * This function must only be called once for a given compilation.
- *
- * See {@link ANeuralNetworksCompilation} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param compilation The compilation to be finished.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksCompilation_finish(ANeuralNetworksCompilation* compilation) __INTRODUCED_IN(27);
-/**
- * Create a {@link ANeuralNetworksExecution} to apply the given compilation.
- * This only creates the object. Computation is only performed once
- * {@link ANeuralNetworksExecution_compute} or
- * {@link ANeuralNetworksExecution_startCompute} is invoked.
- *
- * <p>The provided compilation must outlive the execution.</p>
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param compilation The {@link ANeuralNetworksCompilation} to be evaluated.
- * @param execution The newly created object or NULL if unsuccessful.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
- *         if the compilation is invalid.
- */
-int ANeuralNetworksExecution_create(ANeuralNetworksCompilation* compilation,
-                                    ANeuralNetworksExecution** execution) __INTRODUCED_IN(27);
-/**
- * Destroy an execution.
- *
- * <p>If called on an execution for which
- * {@link ANeuralNetworksExecution_startCompute} has been called, the
- * function will return immediately but will mark the execution to be deleted
- * once the computation completes. The related {@link ANeuralNetworksEvent}
- * will be signaled and the {@link ANeuralNetworksEvent_wait} will return
- * ANEURALNETWORKS_ERROR_DELETED.
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param execution The execution to be destroyed. Passing NULL is acceptable and
- *                  results in no operation.
- */
-void ANeuralNetworksExecution_free(ANeuralNetworksExecution* execution) __INTRODUCED_IN(27);
-/**
- * Associate a user buffer with an input of the model of the
- * {@link ANeuralNetworksExecution}.
- *
- * <p>The provided buffer must outlive the execution.</p>
- *
- * If the input is optional, you can indicate that it is omitted by
- * passing nullptr for buffer and 0 for length.
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param execution The execution to be modified.
- * @param index The index of the input argument we are setting. It is
- *              an index into the lists passed to
- *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is not
- *              the index associated with
- *              {@link ANeuralNetworksModel_addOperand}.
- * @param type The {@link ANeuralNetworksOperandType} of the
- *             operand. Unless the input is omitted, this should be
- *             used to specify the dimensions that were left
- *             unspecified when the operand was added to the
- *             model. All other properties of the type must be the
- *             same as specified in the model. If the type is the same
- *             as specified when the model was built, NULL can be
- *             passed. Neither the {@link ANeuralNetworksOperandType}
- *             nor the dimensions it points to need to outlive the call
- *             to {@link ANeuralNetworksExecution_setInput}.
- * @param buffer The buffer containing the data.
- * @param length The length in bytes of the buffer.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if the
- *         name is not recognized or the buffer is too small for the input.
- */
-int ANeuralNetworksExecution_setInput(ANeuralNetworksExecution* execution, int32_t index,
-                                      const ANeuralNetworksOperandType* type, const void* buffer,
-                                      size_t length) __INTRODUCED_IN(27);
-/**
- * Associate part of a memory object with an input of the model of the
- * {@link ANeuralNetworksExecution}.
- *
- * <p>The provided memory must outlive the execution.</p>
- *
- * If the input is optional, you can indicate that it is omitted by
- * using {@link ANeuralNetworks_setInput} instead, passing nullptr for buffer
- * and 0 for length.
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- * See {@link ANeuralNetworksMemory_createFromAHardwarBuffer} for information on
- * AHardwareBuffer usage.
- *
- * Available since API level 27.
- *
- * @param execution The execution to be modified.
- * @param index The index of the input argument we are setting. It is
- *              an index into the lists passed to
- *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is not
- *              the index associated with {@link ANeuralNetworksModel_addOperand}.
- * @param type The {@link ANeuralNetworksOperandType} of the
- *             operand. This should be used to specify the dimensions
- *             that were left unspecified when the operand was added
- *             to the model. All other properties of the type must be
- *             the same as specified in the model. If the type is the
- *             same as specified when the model was built, NULL can be
- *             passed. Neither the {@link ANeuralNetworksOperandType}
- *             nor the dimensions it points to need to outlive the call
- *             to {@link ANeuralNetworksExecution_setInputFromMemory}.
- * @param memory The memory containing the data.
- * @param offset This specifies the location of the data within the memory.
- *               The offset is in bytes from the start of memory.
- * @param length The size in bytes of the data value.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if the
- *         name is not recognized or the buffer is too small for the input.
- */
-int ANeuralNetworksExecution_setInputFromMemory(ANeuralNetworksExecution* execution, int32_t index,
-                                                const ANeuralNetworksOperandType* type,
-                                                const ANeuralNetworksMemory* memory, size_t offset,
-                                                size_t length) __INTRODUCED_IN(27);
-/**
- * Associate a user buffer with an output of the model of the
- * {@link ANeuralNetworksExecution}.
- *
- * If the output is optional, you can indicate that it is omitted by
- * passing nullptr for buffer and 0 for length.
- *
- * <p>The provided buffer must outlive the execution.</p>
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @param execution The execution to be modified.
- * @param index The index of the output argument we are setting. It is
- *              an index into the lists passed to
- *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is not
- *              the index associated with {@link ANeuralNetworksModel_addOperand}.
- * @param type The {@link ANeuralNetworksOperandType} of the
- *             operand. Unless the output is omitted, this should be
- *             used to specify the dimensions that were left
- *             unspecified when the operand was added to the
- *             model. All other properties of the type must be the
- *             same as specified in the model. If the type is the same
- *             as specified when the model was built, NULL can be
- *             passed. Neither the {@link ANeuralNetworksOperandType}
- *             nor the dimensions it points to need to outlive the call
- *             to {@link ANeuralNetworksExecution_setOutput}.
- * @param buffer The buffer where the data is to be written.
- * @param length The length in bytes of the buffer.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if the
- *         name is not recognized or the buffer is too small for the output.
- */
-int ANeuralNetworksExecution_setOutput(ANeuralNetworksExecution* execution, int32_t index,
-                                       const ANeuralNetworksOperandType* type, void* buffer,
-                                       size_t length) __INTRODUCED_IN(27);
-/**
- * Associate part of a memory object with an output of the model of the
- * {@link ANeuralNetworksExecution}.
- *
- * If the output is optional, you can indicate that it is omitted by
- * using {@link ANeuralNetworks_setOutput} instead, passing nullptr for buffer
- * and 0 for length.
- *
- * <p>The provided memory must outlive the execution.</p>
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- * See {@link ANeuralNetworksMemory_createFromAHardwarBuffer} for information on
- * AHardwareBuffer usage.
- *
- * Available since API level 27.
- *
- * @param execution The execution to be modified.
- * @param index The index of the output argument we are setting. It is
- *              an index into the lists passed to
- *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is not
- *              the index associated with {@link ANeuralNetworksModel_addOperand}.
- * @param type The {@link ANeuralNetworksOperandType} of the operand. This should be
- *             used to specify the dimensions that were left
- *             unspecified when the operand was added to the
- *             model. All other properties of the type must be the
- *             same as specified in the model. If the type is the same
- *             as specified when the model was built, NULL can be
- *             passed. Neither the {@link ANeuralNetworksOperandType}
- *             nor the dimensions it points to need to outlive the call
- *             to {@link ANeuralNetworksExecution_setOutputFromMemory}.
- * @param memory The memory where the data is to be stored.
- * @param offset This specifies the location of the data within the memory.
- *               The offset is in bytes from the start of memory.
- * @param length The length in bytes of the data value.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if the
- *         name is not recognized or the buffer is too small for the output.
- */
-int ANeuralNetworksExecution_setOutputFromMemory(ANeuralNetworksExecution* execution, int32_t index,
-                                                 const ANeuralNetworksOperandType* type,
-                                                 const ANeuralNetworksMemory* memory, size_t offset,
-                                                 size_t length) __INTRODUCED_IN(27);
-/**
- * Schedule asynchronous evaluation of the execution.
- *
- * <p>Schedules asynchronous evaluation of the execution. Once the model has
- * been applied and the outputs are ready to be consumed, the returned event
- * will be signaled. Use {@link ANeuralNetworksEvent_wait} to wait for that
- * event.
- * </p>
- *
- * ANeuralNetworksEvent_wait must be called to recuperate the resources used
- * by the execution.
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * See {@link ANeuralNetworksExecution_compute} for synchronous execution.
- * Synchronous execution incurs lower overhead than asynchronous execution.
- *
- * Available since API level 27.
- *
- * @param execution The execution to be scheduled and executed.
- * @param event The event that will be signaled on completion. event is set to
- *              NULL if there's an error.
- *
- * @return ANEURALNETWORKS_NO_ERROR if successful.
- */
-int ANeuralNetworksExecution_startCompute(ANeuralNetworksExecution* execution,
-                                          ANeuralNetworksEvent** event) __INTRODUCED_IN(27);
-/**
- * Waits until the execution completes.
- *
- * More than one thread can wait on an event. When the execution completes,
- * all threads will be released.
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * Available since API level 27.
- *
- * @return ANEURALNETWORKS_NO_ERROR if the execution completed normally.
- *         ANEURALNETWORKS_UNMAPPABLE if the execution input or output memory cannot
- *         be properly mapped.
- */
-int ANeuralNetworksEvent_wait(ANeuralNetworksEvent* event) __INTRODUCED_IN(27);
-/**
- * Destroys the event.
- *
- * See {@link ANeuralNetworksExecution} for information on multithreaded usage.
- *
- * Available since API level 27.
- */
-void ANeuralNetworksEvent_free(ANeuralNetworksEvent* event) __INTRODUCED_IN(27);
-__END_DECLS
-#endif  // ANDROID_ML_NN_RUNTIME_NEURAL_NETWORKS_MOCK_H
-/** @} */
diff --git a/include/dnnlibrary/NeuralNetworksTypes.h b/include/dnnlibrary/NeuralNetworksTypes.h
new file mode 100644
index 0000000..69253f1
--- /dev/null
+++ b/include/dnnlibrary/NeuralNetworksTypes.h
@@ -0,0 +1,552 @@
+/* Copyright 2017 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+#ifndef TENSORFLOW_LITE_NNAPI_NEURALNETWORKSTYPES_H_
+#define TENSORFLOW_LITE_NNAPI_NEURALNETWORKSTYPES_H_
+
+#include <stdint.h>
+#include <stdio.h>
+
+typedef struct AHardwareBuffer AHardwareBuffer;
+
+// NN api types based on NNAPI header file
+// https://developer.android.com/ndk/reference/group/neural-networks
+
+/**
+ * Operand types.
+ *
+ * The type of operands that can be added to a model.
+ *
+ * Although we define many types, most operators accept just a few
+ * types.  Most used are ANEURALNETWORKS_TENSOR_FLOAT32,
+ * ANEURALNETWORKS_TENSOR_QUANT8_ASYMM, and ANEURALNETWORKS_INT32.
+ */
+enum {
+  ANEURALNETWORKS_FLOAT32 = 0,
+  ANEURALNETWORKS_INT32 = 1,
+  ANEURALNETWORKS_UINT32 = 2,
+  ANEURALNETWORKS_TENSOR_FLOAT32 = 3,
+  ANEURALNETWORKS_TENSOR_INT32 = 4,
+  ANEURALNETWORKS_TENSOR_QUANT8_ASYMM = 5,
+  ANEURALNETWORKS_BOOL = 6,
+  ANEURALNETWORKS_TENSOR_QUANT16_SYMM = 7,
+  ANEURALNETWORKS_TENSOR_FLOAT16 = 8,
+  ANEURALNETWORKS_TENSOR_BOOL8 = 9,
+  ANEURALNETWORKS_FLOAT16 = 10,
+  ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL = 11,
+  ANEURALNETWORKS_TENSOR_QUANT16_ASYMM = 12,
+  ANEURALNETWORKS_TENSOR_QUANT8_SYMM = 13,
+};
+
+/**
+ * Operation types.
+ *
+ * The type of operations that can be added to a model.
+ */
+enum {
+  ANEURALNETWORKS_ADD = 0,
+  ANEURALNETWORKS_AVERAGE_POOL_2D = 1,
+  ANEURALNETWORKS_CONCATENATION = 2,
+  ANEURALNETWORKS_CONV_2D = 3,
+  ANEURALNETWORKS_DEPTHWISE_CONV_2D = 4,
+  ANEURALNETWORKS_DEPTH_TO_SPACE = 5,
+  ANEURALNETWORKS_DEQUANTIZE = 6,
+  ANEURALNETWORKS_EMBEDDING_LOOKUP = 7,
+  ANEURALNETWORKS_FLOOR = 8,
+  ANEURALNETWORKS_FULLY_CONNECTED = 9,
+  ANEURALNETWORKS_HASHTABLE_LOOKUP = 10,
+  ANEURALNETWORKS_L2_NORMALIZATION = 11,
+  ANEURALNETWORKS_L2_POOL_2D = 12,
+  ANEURALNETWORKS_LOCAL_RESPONSE_NORMALIZATION = 13,
+  ANEURALNETWORKS_LOGISTIC = 14,
+  ANEURALNETWORKS_LSH_PROJECTION = 15,
+  ANEURALNETWORKS_LSTM = 16,
+  ANEURALNETWORKS_MAX_POOL_2D = 17,
+  ANEURALNETWORKS_MUL = 18,
+  ANEURALNETWORKS_RELU = 19,
+  ANEURALNETWORKS_RELU1 = 20,
+  ANEURALNETWORKS_RELU6 = 21,
+  ANEURALNETWORKS_RESHAPE = 22,
+  ANEURALNETWORKS_RESIZE_BILINEAR = 23,
+  ANEURALNETWORKS_RNN = 24,
+  ANEURALNETWORKS_SOFTMAX = 25,
+  ANEURALNETWORKS_SPACE_TO_DEPTH = 26,
+  ANEURALNETWORKS_SVDF = 27,
+  ANEURALNETWORKS_TANH = 28,
+  ANEURALNETWORKS_BATCH_TO_SPACE_ND = 29,
+  ANEURALNETWORKS_DIV = 30,
+  ANEURALNETWORKS_MEAN = 31,
+  ANEURALNETWORKS_PAD = 32,
+  ANEURALNETWORKS_SPACE_TO_BATCH_ND = 33,
+  ANEURALNETWORKS_SQUEEZE = 34,
+  ANEURALNETWORKS_STRIDED_SLICE = 35,
+  ANEURALNETWORKS_SUB = 36,
+  ANEURALNETWORKS_TRANSPOSE = 37,
+  ANEURALNETWORKS_ABS = 38,
+  ANEURALNETWORKS_ARGMAX = 39,
+  ANEURALNETWORKS_ARGMIN = 40,
+  ANEURALNETWORKS_BIDIRECTIONAL_SEQUENCE_LSTM = 42,
+  ANEURALNETWORKS_CAST = 45,
+  ANEURALNETWORKS_EQUAL = 48,
+  ANEURALNETWORKS_EXP = 49,
+  ANEURALNETWORKS_EXPAND_DIMS = 50,
+  ANEURALNETWORKS_GATHER = 51,
+  ANEURALNETWORKS_GREATER = 53,
+  ANEURALNETWORKS_GREATER_EQUAL = 54,
+  ANEURALNETWORKS_LESS = 58,
+  ANEURALNETWORKS_LESS_EQUAL = 59,
+  ANEURALNETWORKS_LOG = 60,
+  ANEURALNETWORKS_LOGICAL_AND = 61,
+  ANEURALNETWORKS_LOGICAL_NOT = 62,
+  ANEURALNETWORKS_LOGICAL_OR = 63,
+  ANEURALNETWORKS_LOG_SOFTMAX = 64,
+  ANEURALNETWORKS_MAXIMUM = 65,
+  ANEURALNETWORKS_MINIMUM = 66,
+  ANEURALNETWORKS_NEG = 67,
+  ANEURALNETWORKS_NOT_EQUAL = 68,
+  ANEURALNETWORKS_PAD_V2 = 69,
+  ANEURALNETWORKS_POW = 70,
+  ANEURALNETWORKS_PRELU = 71,
+  ANEURALNETWORKS_QUANTIZE = 72,
+  ANEURALNETWORKS_QUANTIZED_16BIT_LSTM = 73,
+  ANEURALNETWORKS_REDUCE_ANY = 76,
+  ANEURALNETWORKS_REDUCE_MAX = 77,
+  ANEURALNETWORKS_REDUCE_MIN = 78,
+  ANEURALNETWORKS_REDUCE_PROD = 79,
+  ANEURALNETWORKS_REDUCE_SUM = 80,
+  ANEURALNETWORKS_RSQRT = 83,
+  ANEURALNETWORKS_SELECT = 84,
+  ANEURALNETWORKS_SIN = 85,
+  ANEURALNETWORKS_SLICE = 86,
+  ANEURALNETWORKS_SPLIT = 87,
+  ANEURALNETWORKS_SQRT = 88,
+  ANEURALNETWORKS_TILE = 89,
+  ANEURALNETWORKS_TOPK_V2 = 90,
+  ANEURALNETWORKS_UNIDIRECTIONAL_SEQUENCE_LSTM = 92,
+  ANEURALNETWORKS_UNIDIRECTIONAL_SEQUENCE_RNN = 93,
+};
+
+/**
+ * Fused activation function types.
+ *
+ */
+enum {
+  ANEURALNETWORKS_FUSED_NONE = 0,
+  ANEURALNETWORKS_FUSED_RELU = 1,
+  ANEURALNETWORKS_FUSED_RELU1 = 2,
+  ANEURALNETWORKS_FUSED_RELU6 = 3,
+};
+
+/**
+ * Execution preferences.
+ */
+enum {
+  ANEURALNETWORKS_PREFER_LOW_POWER = 0,
+  ANEURALNETWORKS_PREFER_FAST_SINGLE_ANSWER = 1,
+  ANEURALNETWORKS_PREFER_SUSTAINED_SPEED = 2,
+};
+
+/**
+ * Result codes.
+ */
+enum {
+  ANEURALNETWORKS_NO_ERROR = 0,
+  ANEURALNETWORKS_OUT_OF_MEMORY = 1,
+  ANEURALNETWORKS_INCOMPLETE = 2,
+  ANEURALNETWORKS_UNEXPECTED_NULL = 3,
+  ANEURALNETWORKS_BAD_DATA = 4,
+  ANEURALNETWORKS_OP_FAILED = 5,
+  ANEURALNETWORKS_BAD_STATE = 6,
+  ANEURALNETWORKS_UNMAPPABLE = 7,
+  ANEURALNETWORKS_OUTPUT_INSUFFICIENT_SIZE = 8,
+  ANEURALNETWORKS_UNAVAILABLE_DEVICE = 9,
+};
+
+/**
+ * Implicit padding algorithms.
+ */
+enum {
+  ANEURALNETWORKS_PADDING_SAME = 1,
+  ANEURALNETWORKS_PADDING_VALID = 2,
+};
+
+/**
+ * Device types.
+ *
+ * The type of NNAPI device.
+ */
+enum {
+  /** The device type cannot be provided. */
+  ANEURALNETWORKS_DEVICE_UNKNOWN = 0,
+  /** The device does not fall into any category below. */
+  ANEURALNETWORKS_DEVICE_OTHER = 1,
+  /** The device runs NNAPI models on single or multi-core CPU. */
+  ANEURALNETWORKS_DEVICE_CPU = 2,
+  /** The device can run NNAPI models and also accelerate graphics APIs such
+   * as OpenGL ES and Vulkan. */
+  ANEURALNETWORKS_DEVICE_GPU = 3,
+  /** Dedicated accelerator for Machine Learning workloads. */
+  ANEURALNETWORKS_DEVICE_ACCELERATOR = 4,
+};
+
+/**
+ * ANeuralNetworksMemory is an opaque type that represents memory.
+ *
+ * This type is used to represent shared memory, memory mapped files,
+ * and similar memories.
+ *
+ * By using shared memory, a program can efficiently communicate to the
+ * runtime and drivers the tensors that define a model. See
+ * {@link ANeuralNetworksModel_setOperandValueFromMemory}. An application
+ * should typically create one shared memory object that contains every tensor
+ * needed to define a model. {@link ANeuralNetworksMemory_createFromFd} can be
+ * used to create shared memory from a file handle. {@link
+ * ANeuralNetworksMemory_createShared} can be used to directly created shared
+ * memory.
+ *
+ * Memory objects can also be used to specify the input and output arguments of
+ * an execution. See {@link ANeuralNetworksExecution_setInputFromMemory}
+ * and {@link ANeuralNetworksExecution_setOutputFromMemory}.
+ */
+typedef struct ANeuralNetworksMemory ANeuralNetworksMemory;
+
+/**
+ * ANeuralNetworksModel is an opaque type that contains a description of the
+ * mathematical operations that constitute the model.
+ *
+ * <p>The model will be built by calling<ul>
+ * <li>{@link ANeuralNetworksModel_create},</li>
+ * <li>{@link ANeuralNetworksModel_addOperation},</li>
+ * <li>{@link ANeuralNetworksModel_addOperand},</li>
+ * </ul>
+ *
+ * A model is completed by calling {@link ANeuralNetworksModel_finish}.
+ * A model is destroyed by calling {@link ANeuralNetworksModel_free}.
+ *
+ * <p>It is the application's responsibility to make sure that only one thread
+ * modifies a model at a given time. It is however safe for more than one
+ * thread to use the model once {@link ANeuralNetworksModel_finish} has
+ * returned.</p>
+ *
+ * <p>It is also the application's responsibility to ensure that there are no
+ * other uses of the model after calling {@link ANeuralNetworksModel_free}. This
+ * includes any compilation or execution object created using the model.</p>
+ */
+typedef struct ANeuralNetworksModel ANeuralNetworksModel;
+
+/**
+ * ANeuralNetworksCompilation is an opaque type that can be used to compile
+ * a machine learning model.
+ *
+ * <p>To use:<ul>
+ *    <li>Create a new compilation instance by calling the
+ *        {@link ANeuralNetworksCompilation_create} function.</li>
+ *    <li>Perform the compilation with {@link
+ * ANeuralNetworksCompilation_start}.</li> <li>Wait for the compilation to
+ * complete with {@link ANeuralNetworksCompilation_wait}.</li> <li>Use the
+ * compilation as many times as needed with {@link
+ * ANeuralNetworksExecution_create}.</li> <li>Destroy the compilation with
+ * {@link ANeuralNetworksCompilation_free} once all executions using the
+ * compilation have completed.</li></ul></p>
+ *
+ * <p>A compilation cannot be modified once {@link
+ * ANeuralNetworksCompilation_start} has been called on it.</p>
+ *
+ * <p>It is the application's responsibility to make sure that only one thread
+ * modifies a compilation at a given time. It is however safe for more than one
+ * thread to use {@link ANeuralNetworksCompilation_wait} at the same time.
+ * It is also safe for multiple threads to use a compilation object once
+ * {@link ANeuralNetworksCompilation_wait} has completed.</p>
+ *
+ * <p>It is also the application's responsibility to ensure that there are no
+ * other uses of the compilation after calling {@link
+ * ANeuralNetworksCompilation_free}. This includes any execution object created
+ * using the compilation.</p>
+ */
+typedef struct ANeuralNetworksCompilation ANeuralNetworksCompilation;
+
+/**
+ * ANeuralNetworksExecution is an opaque type that can be used to apply a
+ * machine learning model to a set of inputs.
+ *
+ * <p>To use:<ul>
+ *    <li>Create a new execution instance by calling the
+ *        {@link ANeuralNetworksExecution_create} function.</li>
+ *    <li>Associate data to the model inputs with
+ *        {@link ANeuralNetworksExecution_setInput} or
+ *        {@link ANeuralNetworksExecution_setInputFromMemory}.</li>
+ *    <li>Associate output buffers to the model outputs with
+ *        {@link ANeuralNetworksExecution_setOutput} or
+ *        {@link ANeuralNetworksExecution_setOutputFromMemory}.</li>
+ *    <li>Apply the model with {@link
+ * ANeuralNetworksExecution_startCompute}.</li> <li>Wait for the execution to
+ * complete with {@link ANeuralNetworksExecution_wait}.</li> <li>Destroy the
+ * execution with
+ *        {@link ANeuralNetworksExecution_free}.</li></ul></p>
+ *
+ * <p>An execution cannot be modified once {@link
+ * ANeuralNetworksExecution_start} has been called on it.</p>
+ *
+ * <p>An execution can be applied to a model with
+ * {@link ANeuralNetworksExecution_startCompute} only once. Create new
+ * executions to do new evaluations of the model.</p>
+ *
+ * <p>It is the application's responsibility to make sure that only one thread
+ * modifies an execution at a given time. It is however safe for more than one
+ * thread to use {@link ANeuralNetworksExecution_wait} at the same time.</p>
+ *
+ * <p>It is also the application's responsibility to ensure that there are no
+ * other uses of the request after calling {@link
+ * ANeuralNetworksRequest_free}.</p>
+ */
+typedef struct ANeuralNetworksExecution ANeuralNetworksExecution;
+
+/**
+ * Parameters for ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL operand.
+ */
+typedef struct ANeuralNetworksSymmPerChannelQuantParams {
+  /* The index of the channel dimension. */
+  uint32_t channelDim;
+  /** The size of the scale array. Should be equal to dimension[channelDim] of
+   * the Operand. */
+  uint32_t scaleCount;
+  /** The array of scaling values for each channel. Each value must be greater
+   * than zero. */
+  const float* scales;
+} ANeuralNetworksSymmPerChannelQuantParams;
+
+/**
+ * ANeuralNetworksBurst is an opaque type that can be used to reduce the latency
+ * of a rapid sequence of executions. It will likely cause overhead if only used
+ * for a single execution.
+ *
+ * ANeuralNetworksBurst serves as a context object for any number of inferences
+ * using {@link ANeuralNetworksExecution} objects. An ANeuralNetworksBurst
+ * object and the {@link ANeuralNetworksExecution} objects used with it must all
+ * have been created from the same {@link ANeuralNetworksCompilation} object.
+ *
+ * This object is also used as a hint to drivers, providing insight to the
+ * lifetime of a rapid sequence of executions. For example, a driver may choose
+ * to increase the clock frequency of its accelerator for the lifetime of a
+ * burst object.
+ *
+ * <p>To use:<ul>
+ *    <li>Create a new burst object by calling the
+ *        {@link ANeuralNetworksBurst_create} function.</li>
+ *    <li>For each execution:</li><ul>
+ *        <li>Create {@link ANeuralNetworksExecution} and configure its
+ *            properties (see {@link ANeuralNetworksExecution} for
+ * details).</li> <li>Apply the model synchronously with
+ *            {@link ANeuralNetworksExecution_burstCompute}, reusing the same
+ *            {@link ANeuralNetworksBurst} with the new
+ *            {@link ANeuralNetworksExecution}.</li>
+ *        <li>Use and free the {@link ANeuralNetworksExecution}.</li></ul>
+ *    <li>Destroy the burst with
+ *        {@link ANeuralNetworksBurst_free}.</li></ul></p>
+ *
+ * Available since API level 29.
+ */
+typedef struct ANeuralNetworksBurst ANeuralNetworksBurst;
+
+/**
+ * ANeuralNetworksOperandType describes the type of an operand.
+ * This structure is used to describe both scalars and tensors.
+ */
+typedef struct ANeuralNetworksOperandType {
+  /** The data type, e.g ANEURALNETWORKS_INT8. */
+  int32_t type;
+  /** The number of dimensions. It should be 0 for scalars. */
+  uint32_t dimensionCount;
+  /** The dimensions of the tensor. It should be nullptr for scalars. */
+  const uint32_t* dimensions;
+  /** These two fields are only used for quantized tensors.
+   * They should be zero for scalars and non-fixed point tensors.
+   * The dequantized value of each entry is (value - offset) * scale.
+   */
+  float scale;
+  int32_t zeroPoint;
+} ANeuralNetworksOperandType;
+
+/**
+ * ANeuralNetworksEvent is an opaque type that represents an event
+ * that will be signaled once an execution completes.
+ */
+typedef struct ANeuralNetworksEvent ANeuralNetworksEvent;
+
+typedef int32_t ANeuralNetworksOperationType;
+
+/**
+ * ANeuralNetworksDevice is an opaque type that represents a device.
+ *
+ * This type is used to query basic properties and supported operations of the
+ * corresponding device, and control which device(s) a model is to be run on.
+ *
+ * Available since API level 29.
+ */
+typedef struct ANeuralNetworksDevice ANeuralNetworksDevice;
+
+// nn api function types
+
+typedef int (*ANeuralNetworksMemory_createFromFd_fn)(
+    size_t size, int protect, int fd, size_t offset,
+    ANeuralNetworksMemory** memory);
+
+typedef void (*ANeuralNetworksMemory_free_fn)(ANeuralNetworksMemory* memory);
+
+typedef int (*ANeuralNetworksModel_create_fn)(ANeuralNetworksModel** model);
+
+typedef int (*ANeuralNetworksModel_finish_fn)(ANeuralNetworksModel* model);
+
+typedef void (*ANeuralNetworksModel_free_fn)(ANeuralNetworksModel* model);
+
+typedef int (*ANeuralNetworksCompilation_create_fn)(
+    ANeuralNetworksModel* model, ANeuralNetworksCompilation** compilation);
+
+typedef void (*ANeuralNetworksCompilation_free_fn)(
+    ANeuralNetworksCompilation* compilation);
+
+typedef int (*ANeuralNetworksCompilation_setPreference_fn)(
+    ANeuralNetworksCompilation* compilation, int32_t preference);
+
+typedef int (*ANeuralNetworksCompilation_finish_fn)(
+    ANeuralNetworksCompilation* compilation);
+
+typedef int (*ANeuralNetworksModel_addOperand_fn)(
+    ANeuralNetworksModel* model, const ANeuralNetworksOperandType* type);
+
+typedef int (*ANeuralNetworksModel_setOperandValue_fn)(
+    ANeuralNetworksModel* model, int32_t index, const void* buffer,
+    size_t length);
+
+typedef int (*ANeuralNetworksModel_setOperandSymmPerChannelQuantParams_fn)(
+    ANeuralNetworksModel* model, int32_t index,
+    const ANeuralNetworksSymmPerChannelQuantParams* channelQuant);
+
+typedef int (*ANeuralNetworksModel_setOperandValueFromMemory_fn)(
+    ANeuralNetworksModel* model, int32_t index,
+    const ANeuralNetworksMemory* memory, size_t offset, size_t length);
+
+typedef int (*ANeuralNetworksModel_addOperation_fn)(
+    ANeuralNetworksModel* model, ANeuralNetworksOperationType type,
+    uint32_t inputCount, const uint32_t* inputs, uint32_t outputCount,
+    const uint32_t* outputs);
+
+typedef int (*ANeuralNetworksModel_identifyInputsAndOutputs_fn)(
+    ANeuralNetworksModel* model, uint32_t inputCount, const uint32_t* inputs,
+    uint32_t outputCount, const uint32_t* outputs);
+
+typedef int (*ANeuralNetworksModel_relaxComputationFloat32toFloat16_fn)(
+    ANeuralNetworksModel* model, bool allow);
+
+typedef int (*ANeuralNetworksExecution_create_fn)(
+    ANeuralNetworksCompilation* compilation,
+    ANeuralNetworksExecution** execution);
+
+typedef void (*ANeuralNetworksExecution_free_fn)(
+    ANeuralNetworksExecution* execution);
+
+typedef int (*ANeuralNetworksExecution_setInput_fn)(
+    ANeuralNetworksExecution* execution, int32_t index,
+    const ANeuralNetworksOperandType* type, const void* buffer, size_t length);
+
+typedef int (*ANeuralNetworksExecution_setInputFromMemory_fn)(
+    ANeuralNetworksExecution* execution, int32_t index,
+    const ANeuralNetworksOperandType* type, const ANeuralNetworksMemory* memory,
+    size_t offset, size_t length);
+
+typedef int (*ANeuralNetworksExecution_setOutput_fn)(
+    ANeuralNetworksExecution* execution, int32_t index,
+    const ANeuralNetworksOperandType* type, void* buffer, size_t length);
+
+typedef int (*ANeuralNetworksExecution_setOutputFromMemory_fn)(
+    ANeuralNetworksExecution* execution, int32_t index,
+    const ANeuralNetworksOperandType* type, const ANeuralNetworksMemory* memory,
+    size_t offset, size_t length);
+
+typedef int (*ANeuralNetworksExecution_startCompute_fn)(
+    ANeuralNetworksExecution* execution, ANeuralNetworksEvent** event);
+
+typedef int (*ANeuralNetworksEvent_wait_fn)(ANeuralNetworksEvent* event);
+
+typedef void (*ANeuralNetworksEvent_free_fn)(ANeuralNetworksEvent* event);
+
+typedef int (*ASharedMemory_create_fn)(const char* name, size_t size);
+
+typedef int (*ANeuralNetworks_getDeviceCount_fn)(uint32_t* numDevices);
+
+typedef int (*ANeuralNetworks_getDevice_fn)(uint32_t devIndex,
+                                            ANeuralNetworksDevice** device);
+
+typedef int (*ANeuralNetworksDevice_getName_fn)(
+    const ANeuralNetworksDevice* device, const char** name);
+
+typedef int (*ANeuralNetworksDevice_getType_fn)(
+    const ANeuralNetworksDevice* device, int32_t* type);
+
+typedef int (*ANeuralNetworksDevice_getVersion_fn)(
+    const ANeuralNetworksDevice* device, const char** version);
+
+typedef int (*ANeuralNetworksDevice_getFeatureLevel_fn)(
+    const ANeuralNetworksDevice* device, int64_t* featureLevel);
+
+typedef int (*ANeuralNetworksModel_getSupportedOperationsForDevices_fn)(
+    const ANeuralNetworksModel* model,
+    const ANeuralNetworksDevice* const* devices, uint32_t numDevices,
+    bool* supportedOps);
+
+typedef int (*ANeuralNetworksCompilation_createForDevices_fn)(
+    ANeuralNetworksModel* model, const ANeuralNetworksDevice* const* devices,
+    uint32_t numDevices, ANeuralNetworksCompilation** compilation);
+
+typedef int (*ANeuralNetworksCompilation_setCaching_fn)(
+    ANeuralNetworksCompilation* compilation, const char* cacheDir,
+    const uint8_t* token);
+
+typedef int (*ANeuralNetworksExecution_compute_fn)(
+    ANeuralNetworksExecution* execution);
+
+typedef int (*ANeuralNetworksExecution_getOutputOperandRank_fn)(
+    ANeuralNetworksExecution* execution, int32_t index, uint32_t* rank);
+
+typedef int (*ANeuralNetworksExecution_getOutputOperandDimensions_fn)(
+    ANeuralNetworksExecution* execution, int32_t index, uint32_t* dimensions);
+
+typedef int (*ANeuralNetworksBurst_create_fn)(
+    ANeuralNetworksCompilation* compilation, ANeuralNetworksBurst** burst);
+
+typedef void (*ANeuralNetworksBurst_free_fn)(ANeuralNetworksBurst* burst);
+
+typedef int (*ANeuralNetworksExecution_burstCompute_fn)(
+    ANeuralNetworksExecution* execution, ANeuralNetworksBurst* burst);
+
+typedef int (*ANeuralNetworksMemory_createFromAHardwareBuffer_fn)(
+    const AHardwareBuffer* ahwb, ANeuralNetworksMemory** memory);
+
+typedef int (*ANeuralNetworksExecution_setMeasureTiming_fn)(
+    ANeuralNetworksExecution* execution, bool measure);
+
+typedef enum {
+  // Execution time on hardware (not driver, which runs on host processor).
+  ANEURALNETWORKS_DURATION_ON_HARDWARE = 0,
+  // Execution time in driver (including time on hardware).  Excludes overhead
+  // such as that of the runtime itself and the IPC needed for the runtime to
+  // communicate with the driver.
+  ANEURALNETWORKS_DURATION_IN_DRIVER = 1,
+} DurationCode;
+
+typedef int (*ANeuralNetworksExecution_getDuration_fn)(
+    const ANeuralNetworksExecution* execution, int32_t durationCode,
+    uint64_t* duration);
+
+#endif  // TENSORFLOW_LITE_NNAPI_NEURALNETWORKSTYPES_H_
diff --git a/include/dnnlibrary/NeuralNetworksWrapper.h b/include/dnnlibrary/NeuralNetworksWrapper.h
index ee4cfa5..7fac537 100644
--- a/include/dnnlibrary/NeuralNetworksWrapper.h
+++ b/include/dnnlibrary/NeuralNetworksWrapper.h
@@ -16,7 +16,7 @@
 // Provides C++ classes to more easily use the Neural Networks API.
 #ifndef ANDROID_ML_NN_RUNTIME_NEURAL_NETWORKS_WRAPPER_H
 #define ANDROID_ML_NN_RUNTIME_NEURAL_NETWORKS_WRAPPER_H
-#include "NeuralNetworksMock.h"
+#include <dnnlibrary/nnapi_implementation.h>
 #include <common/data_types.h>
 #include <math.h>
 #include <string>
@@ -122,72 +122,6 @@ struct OperandType {
     }
     operator ANeuralNetworksOperandType() const {return operandType; }
 };
-class Memory {
-public:
-    Memory(size_t size, int protect, int fd, size_t offset) {
-        mValid = ANeuralNetworksMemory_createFromFd(size, protect, fd, offset, &mMemory) ==
-                 ANEURALNETWORKS_NO_ERROR;
-    }
-    Memory(AHardwareBuffer* buffer) {
-        mValid = ANeuralNetworksMemory_createFromAHardwareBuffer(buffer, &mMemory) ==
-                 ANEURALNETWORKS_NO_ERROR;
-    }
-    ~Memory() { ANeuralNetworksMemory_free(mMemory); }
-    // Disallow copy semantics to ensure the runtime object can only be freed
-    // once. Copy semantics could be enabled if some sort of reference counting
-    // or deep-copy system for runtime objects is added later.
-    Memory(const Memory&) = delete;
-    Memory& operator=(const Memory&) = delete;
-    // Move semantics to remove access to the runtime object from the wrapper
-    // object that is being moved. This ensures the runtime object will be
-    // freed only once.
-    Memory(Memory&& other) { *this = std::move(other); }
-    Memory& operator=(Memory&& other) {
-        if (this != &other) {
-            ANeuralNetworksMemory_free(mMemory);
-            mMemory = other.mMemory;
-            mValid = other.mValid;
-            other.mMemory = nullptr;
-            other.mValid = false;
-        }
-        return *this;
-    }
-    ANeuralNetworksMemory* get() const { return mMemory; }
-    bool isValid() const { return mValid; }
-private:
-    ANeuralNetworksMemory* mMemory = nullptr;
-    bool mValid = true;
-};
-class Event {
-public:
-    Event() {}
-    ~Event() { ANeuralNetworksEvent_free(mEvent); }
-    // Disallow copy semantics to ensure the runtime object can only be freed
-    // once. Copy semantics could be enabled if some sort of reference counting
-    // or deep-copy system for runtime objects is added later.
-    Event(const Event&) = delete;
-    Event& operator=(const Event&) = delete;
-    // Move semantics to remove access to the runtime object from the wrapper
-    // object that is being moved. This ensures the runtime object will be
-    // freed only once.
-    Event(Event&& other) { *this = std::move(other); }
-    Event& operator=(Event&& other) {
-        if (this != &other) {
-            ANeuralNetworksEvent_free(mEvent);
-            mEvent = other.mEvent;
-            other.mEvent = nullptr;
-        }
-        return *this;
-    }
-    Result wait() { return static_cast<Result>(ANeuralNetworksEvent_wait(mEvent)); }
-    // Only for use by Execution
-    void set(ANeuralNetworksEvent* newEvent) {
-        ANeuralNetworksEvent_free(mEvent);
-        mEvent = newEvent;
-    }
-private:
-    ANeuralNetworksEvent* mEvent = nullptr;
-};
 }  // namespace wrapper
 }  // namespace nn
 }  // namespace android
diff --git a/include/dnnlibrary/nnapi_implementation.h b/include/dnnlibrary/nnapi_implementation.h
new file mode 100644
index 0000000..0df10e2
--- /dev/null
+++ b/include/dnnlibrary/nnapi_implementation.h
@@ -0,0 +1,1022 @@
+/* Copyright 2017 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+#ifndef TENSORFLOW_LITE_NNAPI_NNAPI_IMPLEMENTATION_H_
+#define TENSORFLOW_LITE_NNAPI_NNAPI_IMPLEMENTATION_H_
+
+#include <stdint.h>
+#include <stdio.h>
+#include <stdlib.h>
+
+#include "NeuralNetworksTypes.h"
+
+struct NnApi {
+  bool nnapi_exists;
+  int32_t android_sdk_version;
+
+  /**
+   * Creates a shared memory object from a file descriptor.
+   *
+   * The shared memory is backed by a file descriptor via mmap.
+   * See {@link ANeuralNetworksMemory} for a description on how to use
+   * this shared memory.
+   *
+   * @param size The requested size in bytes.
+   *             Must not be larger than the file size.
+   * @param prot The desired memory protection for the mapping.
+   *             It is either PROT_NONE or the bitwise OR of one or
+   *             more of the following flags: PROT_READ, PROT_WRITE.
+   * @param fd The requested file descriptor.
+   *           The file descriptor has to be mmap-able. The file
+   *           descriptor will be duplicated.
+   * @param offset The offset to the beginning of the file of the area to map.
+   *               The offset has to be aligned to a page size.
+   * @param memory The memory object to be created.
+   *               Set to NULL if unsuccessful.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if the request completed normally.
+   */
+  int (*ANeuralNetworksMemory_createFromFd)(size_t size, int protect, int fd,
+                                            size_t offset,
+                                            ANeuralNetworksMemory** memory);
+
+  /**
+   * Delete a memory object.
+   *
+   * Destroys the object used by the run time to keep track of the memory.
+   * This will free the underlying actual memory if no other code has open
+   * handles to this memory.
+   *
+   * @param memory The memory object to be freed.
+   */
+  void (*ANeuralNetworksMemory_free)(ANeuralNetworksMemory* memory);
+
+  /**
+   * Create an empty {@link ANeuralNetworksModel}.
+   *
+   * <p>This only creates the object. Computation is performed once
+   * {@link ANeuralNetworksExecution_startCompute} is invoked.
+   *
+   * The model should be constructed with calls to
+   * {@link ANeuralNetworksModel_addOperation} and
+   * {@link ANeuralNetworksModel_addOperand}
+   *
+   * <p>{@link ANeuralNetworksModel_finish} should be called once the model
+   * has been fully constructed.</p>
+   *
+   * <p>{@link ANeuralNetworksModel_free} should be called once the model
+   * is no longer needed.</p>
+   *
+   * @param model The {@link ANeuralNetworksModel} to be created.
+   *              Set to NULL if unsuccessful.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksModel_create)(ANeuralNetworksModel** model);
+
+  /**
+   * Destroy a model.
+   *
+   * The model need not have been finished by a call to
+   * {@link ANeuralNetworksModel_finish}.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   *
+   * @param model The model to be destroyed. Passing NULL is acceptable and
+   *              results in no operation.
+   */
+  void (*ANeuralNetworksModel_free)(ANeuralNetworksModel* model);
+
+  /**
+   * Indicate that we have finished modifying a model. Required before
+   * calling {@link ANeuralNetworksCompilation_compile}.
+   *
+   * An application is responsible to make sure that no other thread uses
+   * the model at the same time.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   *
+   * @param model The model to be finished.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksModel_finish)(ANeuralNetworksModel* model);
+
+  /**
+   * Add an operand to a model.
+   *
+   * The order in which the operands are added is important. The first one added
+   * to a model will have the index value 0, the second 1, etc. These indexes
+   * are used as operand identifiers in
+   * {@link ANeuralNetworksModel_addOperation},
+   * {@link ANeuralNetworksExecution_setInput},
+   * {@link ANeuralNetworksExecution_setInputFromMemory},
+   * {@link ANeuralNetworksExecution_setOutput},
+   * {@link ANeuralNetworksExecution_setOutputFromMemory} and
+   * {@link ANeuralNetworksExecution_setOperandValue}.
+   *
+   * To build a model that can accommodate inputs of various sizes, as you may
+   * want to do for a CNN, set the size of the dimensions that will vary at run
+   * time to 0. If you do so, provide the full dimensions when calling
+   * {@link ANeuralNetworksExecution_setInput} or {@link
+   * ANeuralNetworksExecution_setInputFromMemory}.
+   *
+   * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has
+   * been called will return an error.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   *
+   * @param model The model to be modified.
+   * @param type The {@link ANeuralNetworksOperandType} that describes the shape
+   * of the operand.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksModel_addOperand)(
+      ANeuralNetworksModel* model, const ANeuralNetworksOperandType* type);
+
+  /**
+   * Sets an operand to a constant value.
+   *
+   * For scalar values, the content of buffer is copied into the model.
+   *
+   * For tensor values, a pointer to the buffer is stored within the model.
+   * The application is responsible for not changing the content of this region
+   * until all executions using this model have completed. As the data may
+   * be copied during processing, modifying the data after this call yields
+   * undefined results.
+   *
+   * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has
+   * been called will return an error.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   *
+   * @param model The model to be modified.
+   * @param index The index of the model operand we're setting.
+   * @param buffer A pointer to the data to use.
+   * @param length The size in bytes of the data value.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksModel_setOperandValue)(ANeuralNetworksModel* model,
+                                              int32_t index, const void* buffer,
+                                              size_t length);
+
+  /**
+   * Sets an operand's per channel quantization parameters.
+   *
+   * Sets parameters required by a tensor of type
+   * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL}.
+   * This function must be called for every tensor of type
+   * {@link ANEURALNETWORKS_TENSOR_QUANT8_SYMM_PER_CHANNEL} before
+   * calling {@link ANeuralNetworksModel_finish}.
+   *
+   * Available since API level 29.
+   *
+   * @param model The model to be modified.
+   * @param index The index of the model operand we're setting.
+   * @param channelQuant The per channel quantization parameters for the
+   *                     operand. No memory in this struct needs to outlive the
+   *                     call to this function.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksModel_setOperandSymmPerChannelQuantParams)(
+      ANeuralNetworksModel* model, int32_t index,
+      const ANeuralNetworksSymmPerChannelQuantParams* channelQuant);
+
+  /**
+   * Sets an operand to a value stored in a memory object.
+   *
+   * The content of the memory is not copied. A reference to that memory is
+   * stored inside the model. The application is responsible for not changing
+   * the content of the memory region until all executions using this model have
+   * completed.
+   * As the data may be copied during processing, modifying the data after this
+   * call yields undefined results.
+   *
+   * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has
+   * been called will return an error.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   *
+   * @param model The model to be modified.
+   * @param index The index of the model operand we're setting.
+   * @param buffer A pointer to the data to use.
+   * @param memory The memory containing the data.
+   * @param offset This specifies the location of the data within the memory.
+   *               The offset is in bytes from the start of memory.
+   * @param length The size in bytes of the data value.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksModel_setOperandValueFromMemory)(
+      ANeuralNetworksModel* model, int32_t index,
+      const ANeuralNetworksMemory* memory, size_t offset, size_t length);
+
+  /**
+   * Add an operation to a model.
+   *
+   * @param model The model to be modified.
+   * @param type The type of the operation.
+   * @param inputCount The number of entries in the inputs array.
+   * @param inputs An array of indexes identifying each operand.
+   * @param outputCount The number of entries in the outputs array.
+   * @param outputs An array of indexes identifying each operand.
+   *
+   * The operands specified by inputs and outputs must have been
+   * previously added by calls to {@link ANeuralNetworksModel_addOperand}.
+   *
+   * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has
+   * been called will return an error.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksModel_addOperation)(ANeuralNetworksModel* model,
+                                           ANeuralNetworksOperationType type,
+                                           uint32_t inputCount,
+                                           const uint32_t* inputs,
+                                           uint32_t outputCount,
+                                           const uint32_t* outputs);
+
+  /**
+   * Specifies which operands will be the model's inputs and outputs.
+   *
+   * An operand cannot be used for both input and output. Doing so will
+   * return an error.
+   *
+   * @param model The model to be modified.
+   * @param inputCount The number of entries in the inputs array.
+   * @param inputs An array of indexes identifying the input operands.
+   * @param outputCount The number of entries in the outputs array.
+   * @param outputs An array of indexes identifying the output operands.
+   *
+   * The operands specified by inputs and outputs must have been
+   * previously added by calls to {@link ANeuralNetworksModel_addOperand}.
+   *
+   * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has
+   * been called will return an error.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   *
+   */
+  int (*ANeuralNetworksModel_identifyInputsAndOutputs)(
+      ANeuralNetworksModel* model, uint32_t inputCount, const uint32_t* inputs,
+      uint32_t outputCount, const uint32_t* outputs);
+
+  /**
+   * Specifies whether {@link ANEURALNETWORKS_TENSOR_FLOAT32} is allowed to be
+   * calculated with range and/or precision as low as that of the
+   * IEEE 754 16-bit floating-point format. By default,
+   * {@link ANEURALNETWORKS_TENSOR_FLOAT32} must be calculated using at least
+   * the range and precision of the IEEE 754 32-bit floating-point format.
+   *
+   * @param model The model to be modified.
+   * @param allow 'true' indicates {@link ANEURALNETWORKS_TENSOR_FLOAT32} may be
+   *              calculated with range and/or precision as low as that of the
+   *              IEEE 754 16-bit floating point format. 'false' indicates
+   *              {@link ANEURALNETWORKS_TENSOR_FLOAT32} must be calculated
+   *              using at least the range and precision of the IEEE 754 32-bit
+   *              floating point format.
+   *
+   * Attempting to modify a model once {@link ANeuralNetworksModel_finish} has
+   * been called will return an error.
+   *
+   * Available since API level 28.
+   *
+   * See {@link ANeuralNetworksModel} for information on multithreaded usage.
+   */
+  int (*ANeuralNetworksModel_relaxComputationFloat32toFloat16)(
+      ANeuralNetworksModel* model, bool allow);
+
+  /**
+   * Create a {@link ANeuralNetworksCompilation} to compile the given model.
+   * This only creates the object. Compilation is only performed once
+   * {@link ANeuralNetworksCompilation_start} is invoked.
+   *
+   * <p>The provided model must outlive the compilation.</p>
+   *
+   * The model must already have been finished by a call to
+   * {@link ANeuralNetworksModel_finish}.
+   *
+   * See {@link ANeuralNetworksCompilation} for information on multithreaded
+   * usage.
+   *
+   * @param model The {@link ANeuralNetworksModel} to be compiled.
+   * @param compilation The newly created object or NULL if unsuccessful.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
+   *         if the model is invalid.
+   */
+  int (*ANeuralNetworksCompilation_create)(
+      ANeuralNetworksModel* model, ANeuralNetworksCompilation** compilation);
+
+  /**
+   * Destroy a compilation.
+   *
+   * <p>If called on a compilation for which
+   * {@link ANeuralNetworksCompilation_start} has been called, the
+   * function will return immediately but will mark the compilation to be
+   * deleted once the compilation completes. The
+   * {@link ANeuralNetworksCompilation_wait} will return ERROR_DELETED.
+   *
+   * See {@link ANeuralNetworksCompilation} for information on multithreaded
+   * usage.
+   *
+   * @param compilation The compilation to be destroyed. Passing NULL is
+   * acceptable and results in no operation.
+   */
+  void (*ANeuralNetworksCompilation_free)(
+      ANeuralNetworksCompilation* compilation);
+
+  /**
+   * Sets the execution preference.
+   *
+   * <p>Provides guidance to the runtime when trade-offs are possible.</p>
+   *
+   * See {@link ANeuralNetworksCompilation} for information on multithreaded
+   * usage.
+   *
+   * @param compilation The compilation to be modified.
+   * @param preference Either {@link PREFER_LOW_POWER},
+   *                  {@link PREFER_SINGLE_FAST_ANSWER}, or
+   *                  {@link PREFER_SUSTAINED_SPEED}.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksCompilation_setPreference)(
+      ANeuralNetworksCompilation* compilation, int32_t preference);
+
+  /**
+   * Waits until the compilation completes.
+   *
+   * More than one thread can wait on a compilation. When the compilation
+   * completes, all threads will be released.
+   *
+   * See {@link ANeuralNetworksCompilation} for information on multithreaded
+   * usage.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if the compilation completed normally.
+   */
+  int (*ANeuralNetworksCompilation_finish)(
+      ANeuralNetworksCompilation* compilation);
+
+  /**
+   * Create a {@link ANeuralNetworksExecution} to apply the given compilation.
+   * This only creates the object. Computation is only performed once
+   * {@link ANeuralNetworksExecution_startCompute} is invoked.
+   *
+   * <p>The provided compilation must outlive the execution.</p>
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @param compilation The {@link ANeuralNetworksCompilation} to be evaluated.
+   * @param execution The newly created object or NULL if unsuccessful.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
+   *         if the compilation is invalid.
+   */
+  int (*ANeuralNetworksExecution_create)(
+      ANeuralNetworksCompilation* compilation,
+      ANeuralNetworksExecution** execution);
+
+  /**
+   * Destroy an execution.
+   *
+   * <p>If called on an execution for which
+   * {@link ANeuralNetworksExecution_startCompute} has been called, the
+   * function will return immediately but will mark the execution to be deleted
+   * once the computation completes.   The {link ANeuralNetworksExecution_wait}
+   * will return ANEURALNETWORKS_ERROR_DELETED.
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @param execution The execution to be destroyed. Passing NULL is acceptable
+   * and results in no operation.
+   */
+  void (*ANeuralNetworksExecution_free)(ANeuralNetworksExecution* execution);
+
+  /**
+   * Associate a user buffer with an input of the model of the
+   * {@link ANeuralNetworksExecution}.
+   *
+   * <p>The provided buffer must outlive the execution.</p>
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @param execution The execution to be modified.
+   * @param index The index of the input argument we are setting. It is
+   *              an index into the lists passed to
+   *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is
+   *              not the index associated with {@link
+   * ANeuralNetworksModel_addOperand}.
+   * @param type The type of the operand. This should be used to specify the
+   *             dimensions that were set to 0 when the operand was added to the
+   *             model. All other properties of the type must be the same as
+   *             specified in the model. If the type is the same as specified
+   *             when the model was built, NULL can be passed.
+   * @param buffer The buffer containing the data.
+   * @param length The length in bytes of the buffer.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if
+   * the name is not recognized or the buffer is too small for the input.
+   */
+  int (*ANeuralNetworksExecution_setInput)(
+      ANeuralNetworksExecution* execution, int32_t index,
+      const ANeuralNetworksOperandType* type, const void* buffer,
+      size_t length);
+
+  /**
+   * Associate part of a memory object with an input of the model of the
+   * {@link ANeuralNetworksExecution}.
+   *
+   * <p>The provided memory must outlive the execution.</p>
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @param execution The execution to be modified.
+   * @param index The index of the input argument we are setting. It is
+   *              an index into the lists passed to
+   *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is
+   *              not the index associated with {@link
+   * ANeuralNetworksModel_addOperand}.
+   * @param type The type of the operand. This can be used to specify the
+   *             dimensions that were set to 0 when the operand was added to the
+   *             model. All other values must be the same as specified in the
+   *             model. If the type is the same as specified when the model
+   *             was built, NULL can be passed.
+   * @param memory The memory containing the data.
+   * @param offset This specifies the location of the data within the memory.
+   *               The offset is in bytes from the start of memory.
+   * @param length The size in bytes of the data value.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if
+   * the name is not recognized or the buffer is too small for the input.
+   */
+  int (*ANeuralNetworksExecution_setInputFromMemory)(
+      ANeuralNetworksExecution* execution, int32_t index,
+      const ANeuralNetworksOperandType* type,
+      const ANeuralNetworksMemory* memory, size_t offset, size_t length);
+
+  /**
+   * Associate a user buffer with an output of the model of the
+   * {@link ANeuralNetworksExecution}.
+   *
+   * <p>The provided buffer must outlive the execution.</p>
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @param execution The execution to be modified.
+   * @param index The index of the output argument we are setting. It is
+   *              an index into the lists passed to
+   *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is
+   *              not the index associated with {@link
+   * ANeuralNetworksModel_addOperand}.
+   * @param type The type of the operand. This can be used to specify the
+   *             dimensions that were set to 0 when the operand was added to the
+   *             model. All other values must be the same as specified in the
+   *             model. If the type is the same as specified when the model
+   *             was built, NULL can be passed.
+   * @param buffer The buffer where the data is to be written.
+   * @param length The length in bytes of the buffer.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if
+   * the name is not recognized or the buffer is too small for the output.
+   */
+  int (*ANeuralNetworksExecution_setOutput)(
+      ANeuralNetworksExecution* execution, int32_t index,
+      const ANeuralNetworksOperandType* type, void* buffer, size_t length);
+
+  /**
+   * Associate part of a memory object with an output of the model of the
+   * {@link ANeuralNetworksExecution}.
+   *
+   * <p>The provided memory must outlive the execution.</p>
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @param execution The execution to be modified.
+   * @param index The index of the output argument we are setting. It is
+   *              an index into the lists passed to
+   *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is
+   *              not the index associated with {@link
+   * ANeuralNetworksModel_addOperand}.
+   * @param type The type of the operand. This can be used to specify the
+   *             dimensions that were set to 0 when the operand was added to the
+   *             model. All other values must be the same as specified in the
+   *             model. If the type is the same as specified when the model
+   *             was built, NULL can be passed.
+   * @param memory The memory where the data is to be stored.
+   * @param offset This specifies the location of the data within the memory.
+   *               The offset is in bytes from the start of memory.
+   * @param length The length in bytes of the data value.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA if
+   * the name is not recognized or the buffer is too small for the output.
+   */
+  int (*ANeuralNetworksExecution_setOutputFromMemory)(
+      ANeuralNetworksExecution* execution, int32_t index,
+      const ANeuralNetworksOperandType* type,
+      const ANeuralNetworksMemory* memory, size_t offset, size_t length);
+
+  /**
+   * Schedule evaluation of the execution.
+   *
+   * <p>Schedules evaluation of the execution. Once the model has been
+   * applied and the outputs are ready to be consumed, the execution will be
+   * signaled. Use {@link ANeuralNetworksExecution_wait} to wait for that
+   * signal.
+   * </p>
+   *
+   * Multiple executions can be scheduled and evaluated concurrently, and
+   * compilations can be performed concurrently with executions. The runtime
+   * makes no guarantee on the ordering of the completion of compilations and
+   * executions. If it's important to the application, the application should
+   * enforce the ordering by using {@link ANeuralNetworksCompilation_wait} and
+   * {@link ANeuralNetworksExecution_wait}.
+   *
+   * ANeuralNetworksExecution_wait must be called to recuperate the resources
+   * used by the execution.
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @param execution The execution to be scheduled and executed.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksExecution_startCompute)(
+      ANeuralNetworksExecution* execution, ANeuralNetworksEvent** event);
+
+  /**
+   * Waits until the execution completes.
+   *
+   * More than one thread can wait on an event. When the execution completes,
+   * all threads will be released.
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if the execution completed normally.
+   */
+  int (*ANeuralNetworksEvent_wait)(ANeuralNetworksEvent* event);
+
+  /**
+   * Destroys the event.
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   */
+  void (*ANeuralNetworksEvent_free)(ANeuralNetworksEvent* event);
+
+  // ASharedMemory_create was added in Android 8.0, so safe to use with NNAPI
+  // which was added in 8.1.
+  int (*ASharedMemory_create)(const char* name, size_t size);
+
+  /**
+   * Get the number of available devices.
+   *
+   * @param numDevices Used to return the number of devices.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworks_getDeviceCount)(uint32_t* numDevices);
+
+  /**
+   * Get the representation of the specified device.
+   *
+   * @param devIndex The index of the specified device. Must be less than the
+   *                 number of available devices.
+   * @param device The representation of the specified device.
+   *               The same representation will always be returned for the
+   *               specified device.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+
+  int (*ANeuralNetworks_getDevice)(uint32_t devIndex,
+                                   ANeuralNetworksDevice** device);
+
+  /**
+   * Get the name of the specified device.
+   *
+   * @param device The representation of the specified device.
+   * @param name The returned name of the specified device. The name will be
+   *             in UTF-8 and will be null-terminated. It will be recognizable
+   *             as a known device name rather than a cryptic string. For
+   *             devices with API level 29 and above, the format of the name is
+   *             {VENDOR}-{DEVICE}, e.g. “google-ipu”. For devices with feature
+   *             level 28 or lower, the name will always be “unknown-device”.
+   *             The name will remain valid for the duration of the application.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksDevice_getName)(const ANeuralNetworksDevice* device,
+                                       const char** name);
+
+  /**
+   * Get the version of the driver implementation of the specified device.
+   *
+   * It’s the responsibility of the driver implementor to insure that this
+   * version string uniquely distinguishes this implementation from all previous
+   * implementations.
+   *
+   * This version string must not be confused with the feature level which is
+   * solely defined by {@link ANeuralNetworksDevice_getFeatureLevel}. There is
+   * no implicit ordering of the versions. For example, it is not possible to
+   * filter all drivers older than a certain version.
+   *
+   * Application developers may use this version string to avoid or prefer
+   * specific driver implementations. For example, an application may want to do
+   * so because:
+   *     - A specific version of the driver does not provide the required
+   * performance, perhaps because of a performance regression.
+   *     - A specific version of the driver has a bug or returns results that
+   * don’t match the minimum precision requirement for the application.
+   *
+   * @param device  The representation of the specified device.
+   * @param version The returned version string of the driver for the specified
+   *                device. The string will be in UTF-8 and will be
+   *                null-terminated. For devices with feature level 28 or lower,
+   *                "UNKNOWN" will be returned. The version string will remain
+   *                valid for the duration of the application.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksDevice_getVersion)(const ANeuralNetworksDevice* device,
+                                          const char** version);
+
+  /**
+   * Get the supported NNAPI version of the specified device.
+   *
+   * Each device has a supported feature level, which is the most advanced
+   * feature this driver implements. For example, if the driver implements the
+   * features introduced in Android P, but does not implement the features
+   * introduced after Android P, the value would be 28. Developers could decide
+   * whether or not the specified device should be used for a Model that has
+   * certain feature requirements.
+   *
+   * @param device       The representation of the specified device.
+   * @param featureLevel The API level of the most advanced feature this driver
+   *                     implements.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksDevice_getFeatureLevel)(
+      const ANeuralNetworksDevice* device, int64_t* featureLevel);
+
+  /**
+   * Get the type of a given device.
+   *
+   * The device type can be used to help application developers to distribute
+   * Machine Learning workloads and other workloads such as graphical rendering.
+   * E.g., for an app which renders AR scenes based on real time object
+   * detection results, the developer could choose an ACCELERATOR type device
+   * for ML workloads, and reserve GPU for graphical rendering.
+   *
+   * @param device The representation of the specified device.
+   * @param type The returned {@link DeviceTypeCode} of the specified device.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksDevice_getType)(const ANeuralNetworksDevice* device,
+                                       int32_t* type);
+
+  /**
+   * Get the supported operations for a specified set of devices. If multiple
+   * devices are selected, the supported operation list is a union of supported
+   * operations of all selected devices.
+   *
+   * @param model        The model to be queried.
+   * @param devices      The set of devices. Must not contain duplicates.
+   * @param numDevices   The number of devices in the set.
+   * @param supportedOps The boolean array to be filled. True means supported.
+   *                     The size of the boolean array must be at least as large
+   *                     as the number of operations in the model. The order of
+   *                     elements in the supportedOps array matches the order in
+   *                     which the corresponding operations were added to the
+   *                     model.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksModel_getSupportedOperationsForDevices)(
+      const ANeuralNetworksModel* model,
+      const ANeuralNetworksDevice* const* devices, uint32_t numDevices,
+      bool* supportedOps);
+
+  /**
+   * Create a {@link ANeuralNetworksCompilation} to compile the given model for
+   * a specified set of devices. If more than one device is specified, the
+   * compilation will distribute the workload automatically across the devices.
+   * The model must be fully supported by the specified set of devices. This
+   * means that ANeuralNetworksModel_getSupportedOperationsForDevices() must
+   * have returned true for every operation for that model/devices pair.
+   *
+   * @param model       The {@link ANeuralNetworksModel} to be compiled.
+   * @param devices     The set of devices. Must not contain duplicates.
+   * @param numDevices  The number of devices in the set.
+   * @param compilation The newly created object or NULL if unsuccessful.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
+   *         if the model is invalid.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksCompilation_createForDevices)(
+      ANeuralNetworksModel* model, const ANeuralNetworksDevice* const* devices,
+      uint32_t numDevices, ANeuralNetworksCompilation** compilation);
+
+  /**
+   * Sets the compilation caching signature and the cache directory.
+   *
+   * Provides optional caching information to the runtime for faster repeated
+   * compilation.
+   *
+   * See {@link ANeuralNetworksCompilation} for information on multithreaded
+   * usage.
+   *
+   * @param compilation The compilation to be modified.
+   * @param cacheDir The cache directory to store and retrieve caching data. It
+   *                 is recommended to use the code_cache provided by the
+   *                 Android runtime. If not using the code_cache, the user
+   *                 should choose a directory local to the application, and is
+   *                 responsible to manage and clean the cache entries.
+   * @param token The token provided by the user to specify a model, must be of
+   *              length ANEURALNETWORKS_BYTE_SIZE_OF_CACHE_TOKEN. The user
+   *              should ensure that the token is unique to a model within the
+   *              application. The NNAPI runtime will not detected token
+   *              collisions. If there is a collision, the compilation outcome
+   *              may be incorrect without notifying with error.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksCompilation_setCaching)(
+      ANeuralNetworksCompilation* compilation, const char* cacheDir,
+      const uint8_t* token);
+
+  /**
+   * Schedule synchronous evaluation of the execution.
+   *
+   * <p>Schedules synchronous evaluation of the execution. Returns once the
+   * execution has completed and the outputs are ready to be consumed.
+   * </p>
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * See {@link ANeuralNetworksExecution_startCompute} for asynchronous
+   * execution. Synchronous execution incurs lower overhead than asynchronous
+   * execution.
+   *
+   * Available since API level 29.
+   *
+   * @param execution The execution to be scheduled and executed.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if the execution completed normally.
+   *         ANEURALNETWORKS_UNMAPPABLE if the execution input or output memory
+   *         cannot be properly mapped.
+   */
+  int (*ANeuralNetworksExecution_compute)(ANeuralNetworksExecution* execution);
+
+  /**
+   * Get the dimensional information of the specified output operand of the
+   * model of the
+   * {@link ANeuralNetworksExecution}.
+   *
+   * On asynchronous execution initiated by {@link
+   * ANeuralNetworksExecution_startCompute},
+   * {@link ANeuralNetworksEvent_wait} must be called prior to this function to
+   * recuperate the resources used by the execution.
+   *
+   * @param execution The execution to be queried.
+   * @param index The index of the output argument we are querying. It is
+   *              an index into the lists passed to
+   *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is
+   *              not the index associated with
+   *              {@link ANeuralNetworksModel_addOperand}.
+   * @param rank The rank of the output operand.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful,
+   *         ANEURALNETWORKS_OUTPUT_INSUFFICIENT_SIZE if the target output is
+   *         provided an insufficient buffer at execution time,
+   *         ANEURALNETWORKS_BAD_DATA if the index is invalid.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksExecution_getOutputOperandRank)(
+      ANeuralNetworksExecution* execution, int32_t index, uint32_t* rank);
+
+  /**
+   * Get the dimensional information of the specified output operand of the
+   * model of the
+   * {@link ANeuralNetworksExecution}. The target output operand cannot be a
+   * scalar.
+   *
+   * On asynchronous execution initiated by {@link
+   * ANeuralNetworksExecution_startCompute},
+   * {@link ANeuralNetworksEvent_wait} must be called prior to this function to
+   * recuperate the resources used by the execution.
+   *
+   * @param execution The execution to be queried.
+   * @param index The index of the output argument we are querying. It is an
+   *              index into the lists passed to
+   *              {@link ANeuralNetworksModel_identifyInputsAndOutputs}. It is
+   *              not the index associated with
+   *              {@link ANeuralNetworksModel_addOperand}.
+   * @param dimensions The dimension array to be filled. The size of the array
+   *                   must be exactly as large as the rank of the output
+   *                   operand to be queried in the model.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful,
+   *         ANEURALNETWORKS_OUTPUT_INSUFFICIENT_SIZE if the target output is
+   *         provided an insufficient buffer at execution time,
+   *         ANEURALNETWORKS_BAD_DATA if the index is invalid or if the target
+   *         is a scalar.
+   *
+   * Available since API level 29.
+   */
+  int (*ANeuralNetworksExecution_getOutputOperandDimensions)(
+      ANeuralNetworksExecution* execution, int32_t index, uint32_t* dimensions);
+
+  /**
+   * Create a {@link ANeuralNetworksBurst} to apply the given compilation.
+   * This only creates the burst object. Computation is only performed once
+   * {@link ANeuralNetworksExecution_burstCompute} is invoked with a valid
+   * {@link ANeuralNetworksExecution} and {@link ANeuralNetworksBurst}.
+   *
+   * <p>The provided compilation must outlive the burst object.</p>
+   *
+   * Available since API level 29.
+   *
+   * @param compilation The {@link ANeuralNetworksCompilation} to be evaluated.
+   * @param burst The newly created object or NULL if unsuccessful.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful, ANEURALNETWORKS_BAD_DATA
+   *         if the compilation is invalid.
+   */
+  int (*ANeuralNetworksBurst_create)(ANeuralNetworksCompilation* compilation,
+                                     ANeuralNetworksBurst** burst);
+
+  /**
+   * Destroys the burst object.
+   *
+   * Available since API level 29.
+   *
+   * @param burst The burst object to be destroyed. Passing NULL is acceptable
+   * and results in no operation.
+   */
+  void (*ANeuralNetworksBurst_free)(ANeuralNetworksBurst* burst);
+
+  /**
+   * Schedule synchronous evaluation of the execution on a burst object.
+   *
+   * <p>Schedules synchronous evaluation of the execution. Returns once the
+   * execution has completed and the outputs are ready to be consumed.</p>
+   *
+   * <p>There must be at most one {@link ANeuralNetworksExecution} processing at
+   * any given time for any given burst object. Any
+   * {@link ANeuralNetworksExecution} launched before the previous has finished
+   * will result in ANEURALNETWORKS_BAD_STATE.</p>
+   *
+   * Available since API level 29.
+   *
+   * @param burst The burst object to execute on.
+   * @param execution The execution to be scheduled and executed. The execution
+   *                  must be created from the same {@link
+   *                  ANeuralNetworksCompilation} as the burst object.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if the execution completed normally.
+   */
+  int (*ANeuralNetworksExecution_burstCompute)(
+      ANeuralNetworksExecution* execution, ANeuralNetworksBurst* burst);
+
+  /**
+   * Creates a shared memory object from an AHardwareBuffer handle.
+   *
+   * If the shared memory is backed by an AHardwareBuffer of
+   * AHARDWAREBUFFER_FORMAT_BLOB format, it can be used the same way as
+   * shared memory created from a file handle. See
+   * {@link ANeuralNetworksMemory} for a description on how to use this
+   * shared memory.
+   *
+   * If the shared memory is backed by an AHardwareBuffer of a format other
+   * than AHARDWAREBUFFER_FORMAT_BLOB, it can only be used for Model inputs
+   * and outputs. When calling
+   * {@link ANeuralNetworksExecution_setInputFromMemory} or
+   * {@link ANeuralNetworksExecution_setOutputFromMemory} with the shared
+   * memory, both offset and length must be set to zero and the entire
+   * memory region will be associated with the specified input or output
+   * operand. There is no guarantee that an arbitrary AHardwareBuffer_Format
+   * and AHardwareBuffer_UsageFlags combination can be used by arbitrary
+   * devices. The execution will fail if selected set of devices cannot
+   * consume the buffer.
+   *
+   * Calling {@link ANeuralNetworksModel_setOperandValueFromMemory} with
+   * shared memory backed by an AHardwareBuffer of a format other than
+   * AHARDWAREBUFFER_FORMAT_BLOB is disallowed.
+   *
+   * TODO(miaowang): add documentation about intended usage with
+   * introspection API.
+   *
+   * Available since API level 29.
+   *
+   * @param ahwb The AHardwareBuffer handle.
+   * @param memory The memory object to be created.
+   *               Set to NULL if unsuccessful.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if the request completed normally.
+   *
+   * @see AHardwareBuffer
+   */
+  int (*ANeuralNetworksMemory_createFromAHardwareBuffer)(
+      const AHardwareBuffer* ahwb, ANeuralNetworksMemory** memory);
+
+  /**
+   * Specifies whether duration of the {@link ANeuralNetworksExecution} is to be
+   * measured. By default, duration is not measured.
+   *
+   * The {@link ANeuralNetworksExecution} must have been created with
+   * {@link ANeuralNetworksCompilation_createForDevices} with numDevices = 1.
+   *
+   * See {@link ANeuralNetworksExecution} for information on multithreaded
+   * usage.
+   *
+   * Available since API level 29.
+   *
+   * @param execution The execution to be modified.
+   * @param measure 'true' if duration is to be measured, 'false' if not.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksExecution_setMeasureTiming)(
+      ANeuralNetworksExecution* execution, bool measure);
+
+  /**
+   * Get the time spent in the specified {@link ANeuralNetworksExecution}, in
+   * nanoseconds. The execution must have completed.
+   *
+   * @param execution The execution to be queried.
+   * @param durationCode The measurement to be queried, specified by {@link
+   * DurationCode}.
+   * @param duration The returned duration. If no measurement was requested by
+   *                 {@link ANeuralNetworksExecution_setMeasureTiming}, or for
+   * some other reason the duration is not available, UINT64_MAX will be
+   * returned. A particular device need not support any given measurement.
+   *
+   * @return ANEURALNETWORKS_NO_ERROR if successful.
+   */
+  int (*ANeuralNetworksExecution_getDuration)(
+      const ANeuralNetworksExecution* execution, int32_t durationCode,
+      uint64_t* duration);
+
+  /**/
+
+};
+
+/**
+ * Load the NNAPI implementation from the shared libraries.
+ * The NnApi structure is filled with all the pointers. If one function doesn't
+ * exist, a null pointer is stored.
+ */
+const NnApi* NnApiImplementation();
+
+#ifdef __ANDROID__
+int32_t GetAndroidSdkVersion();
+#endif
+
+#endif  // TENSORFLOW_LITE_NNAPI_NNAPI_IMPLEMENTATION_H_