// nnapi_delegate_provider.cc (revision b6fb3261f9314811a0f4371741dbb8839866f948) - OpenGrok cross reference for /aosp_15_r20/external/tensorflow/tensorflow/lite/tools/delegates/nnapi_delegate_provider.cc

/* Copyright 2020 The TensorFlow Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==============================================================================*/
#include <string>
#include <utility>

#include "tensorflow/lite/delegates/nnapi/nnapi_delegate.h"
#include "tensorflow/lite/nnapi/nnapi_implementation.h"
#include "tensorflow/lite/nnapi/nnapi_util.h"
#include "tensorflow/lite/nnapi/sl/include/SupportLibrary.h"
#include "tensorflow/lite/tools/delegates/delegate_provider.h"

namespace tflite {
namespace tools {

namespace {

using nnapi::NnApiSupportLibrary;

// StatefulNnApiDelegate that holds onto an NnApiSupportLibrary instance
// passed to the constructor for later destruction.
// Note that the support library must outlive the delegate.
class NnApiSupportLibraryDelegate : public StatefulNnApiDelegate {
 public:
  NnApiSupportLibraryDelegate(const NnApiSupportLibrary* nnapi_sl,
                              Options options)
      : StatefulNnApiDelegate(nnapi_sl->getFL5(), options),
        nnapi_sl_(nnapi_sl) {}
  const NnApiSupportLibrary* get_nnapi_sl() const { return nnapi_sl_; }

 private:
  const NnApiSupportLibrary* const nnapi_sl_;
};

}  // namespace

// Delegate provider for the NNAPI delegate. The constructor registers the
// default value of every NNAPI-specific tool parameter; the remaining members
// turn those parameters into flags, log lines and a delegate instance.
class NnapiDelegateProvider : public DelegateProvider {
 public:
  NnapiDelegateProvider() {
    // Small local helpers so that each parameter is declared on one line.
    const auto add_bool_param = [this](const char* name, bool default_value) {
      default_params_.AddParam(name, ToolParam::Create<bool>(default_value));
    };
    const auto add_string_param = [this](const char* name) {
      default_params_.AddParam(name, ToolParam::Create<std::string>(""));
    };

    add_bool_param("use_nnapi", false);
    add_string_param("nnapi_execution_preference");
    add_string_param("nnapi_execution_priority");
    add_string_param("nnapi_accelerator_name");
    add_bool_param("disable_nnapi_cpu", true);
    add_bool_param("nnapi_allow_fp16", false);
    add_bool_param("nnapi_allow_dynamic_dimensions", false);
    add_bool_param("nnapi_use_burst_mode", false);
    add_string_param("nnapi_support_library_path");
  }

  // Command-line flags for the parameters registered above.
  std::vector<Flag> CreateFlags(ToolParams* params) const final;

  // Logs the NNAPI-related parameter values.
  void LogParams(const ToolParams& params, bool verbose) const final;

  // Creates the NNAPI delegate described by `params`, or a null delegate.
  TfLiteDelegatePtr CreateTfLiteDelegate(const ToolParams& params) const final;

  // Same as CreateTfLiteDelegate(), paired with the position of `use_nnapi`.
  std::pair<TfLiteDelegatePtr, int> CreateRankedTfLiteDelegate(
      const ToolParams& params) const final;

  std::string GetName() const final { return "NNAPI"; }
};
REGISTER_DELEGATE_PROVIDER(NnapiDelegateProvider);

// Builds the list of NNAPI command-line flags. Every flag is created through
// CreateFlag with `params` and the usage text shown in the tool's help.
std::vector<Flag> NnapiDelegateProvider::CreateFlags(ToolParams* params) const {
  std::vector<Flag> nnapi_flags;
  nnapi_flags.reserve(9);

  nnapi_flags.push_back(
      CreateFlag<bool>("use_nnapi", params, "use nnapi delegate api"));
  nnapi_flags.push_back(CreateFlag<std::string>(
      "nnapi_execution_preference", params,
      "execution preference for nnapi delegate. Should "
      "be one of the following: fast_single_answer, "
      "sustained_speed, low_power, undefined"));
  nnapi_flags.push_back(CreateFlag<std::string>(
      "nnapi_execution_priority", params,
      "The model execution priority in nnapi, and it "
      "should be one of the following: default, low, "
      "medium and high. This requires Android 11+."));
  nnapi_flags.push_back(CreateFlag<std::string>(
      "nnapi_accelerator_name", params,
      "the name of the nnapi accelerator to use (requires Android Q+)"));
  nnapi_flags.push_back(CreateFlag<bool>("disable_nnapi_cpu", params,
                                         "Disable the NNAPI CPU device"));
  nnapi_flags.push_back(CreateFlag<bool>(
      "nnapi_allow_fp16", params, "Allow fp32 computation to be run in fp16"));
  nnapi_flags.push_back(CreateFlag<bool>(
      "nnapi_allow_dynamic_dimensions", params,
      "Whether to allow dynamic dimension sizes without re-compilation. "
      "This requires Android 9+."));
  nnapi_flags.push_back(CreateFlag<bool>(
      "nnapi_use_burst_mode", params,
      "use NNAPI Burst mode if supported. Burst mode allows accelerators "
      "to efficiently manage resources, which would significantly reduce "
      "overhead especially if the same delegate instance is to be used for "
      "multiple inferences."));
  nnapi_flags.push_back(CreateFlag<std::string>(
      "nnapi_support_library_path", params,
      "Path from which NNAPI support library will be loaded to construct "
      "the delegate. In order to use NNAPI delegate with support library, "
      "--nnapi_accelerator_name must be specified and must be equal to one "
      "of the devices provided by the support library."));

  return nnapi_flags;
}

// Logs the NNAPI-related parameters.
//
// `use_nnapi` is always reported; the remaining parameters are only reported
// when NNAPI is enabled, since they have no effect otherwise.
void NnapiDelegateProvider::LogParams(const ToolParams& params,
                                      bool verbose) const {
  LOG_TOOL_PARAM(params, bool, "use_nnapi", "Use NNAPI", verbose);
  if (!params.Get<bool>("use_nnapi")) return;

  LOG_TOOL_PARAM(params, std::string, "nnapi_execution_preference",
                 "NNAPI execution preference", verbose);
  LOG_TOOL_PARAM(params, std::string, "nnapi_execution_priority",
                 "Model execution priority in nnapi", verbose);
  LOG_TOOL_PARAM(params, std::string, "nnapi_accelerator_name",
                 "NNAPI accelerator name", verbose);

  // Print available devices when possible as it's informative.
  // The list is queried from NnApiImplementation(), not from a support
  // library given through `nnapi_support_library_path`.
  const std::string string_device_names_list =
      nnapi::GetStringDeviceNamesList(NnApiImplementation());
  if (!string_device_names_list.empty()) {
    TFLITE_LOG(INFO) << "NNAPI accelerators available: ["
                     << string_device_names_list << "]";
  }

  LOG_TOOL_PARAM(params, bool, "disable_nnapi_cpu", "Disable NNAPI cpu",
                 verbose);
  LOG_TOOL_PARAM(params, bool, "nnapi_allow_fp16", "Allow fp16 in NNAPI",
                 verbose);
  LOG_TOOL_PARAM(params, bool, "nnapi_allow_dynamic_dimensions",
                 "Allow dynamic dimensions in NNAPI", verbose);
  LOG_TOOL_PARAM(params, bool, "nnapi_use_burst_mode",
                 "Use burst mode in NNAPI", verbose);
  // This parameter selects which NNAPI implementation backs the delegate, so
  // report it alongside the other settings.
  LOG_TOOL_PARAM(params, std::string, "nnapi_support_library_path",
                 "NNAPI support library path", verbose);
}

// Creates an NNAPI delegate configured from `params`.
//
// Returns a null delegate (see CreateNullDelegate()) when:
//   * `use_nnapi` is false,
//   * no support library path is given and NNAPI does not exist on this
//     platform, or
//   * a support library path is given but the library cannot be loaded.
//
// When `nnapi_support_library_path` is set, the returned delegate owns the
// loaded support library: its deleter destroys the delegate first and the
// library afterwards.
TfLiteDelegatePtr NnapiDelegateProvider::CreateTfLiteDelegate(
    const ToolParams& params) const {
  TfLiteDelegatePtr null_delegate = CreateNullDelegate();

  if (!params.Get<bool>("use_nnapi")) {
    // Point out NNAPI-specific settings that are ignored because the delegate
    // itself has not been enabled.
    if (!params.Get<std::string>("nnapi_accelerator_name").empty()) {
      TFLITE_LOG(WARN)
          << "`--use_nnapi=true` must be set for the provided NNAPI "
             "accelerator ("
          << params.Get<std::string>("nnapi_accelerator_name")
          << ") to be used.";
    } else if (!params.Get<std::string>("nnapi_execution_preference")
                    .empty()) {
      TFLITE_LOG(WARN)
          << "`--use_nnapi=true` must be set for the provided NNAPI "
             "execution preference ("
          << params.Get<std::string>("nnapi_execution_preference")
          << ") to be used.";
    }
    return null_delegate;
  }

  StatefulNnApiDelegate::Options options;

  // `options` only stores the c_str() pointers of the strings below, so the
  // strings are kept as locals that live until the delegate is constructed.
  // NOTE(review): assumes the delegate copies these strings during
  // construction rather than retaining the pointers - confirm.
  const std::string accelerator_name =
      params.Get<std::string>("nnapi_accelerator_name");
  if (!accelerator_name.empty()) {
    options.accelerator_name = accelerator_name.c_str();
  } else {
    // `disable_nnapi_cpu` is only applied when no accelerator was named.
    options.disallow_nnapi_cpu = params.Get<bool>("disable_nnapi_cpu");
  }

  if (params.Get<bool>("nnapi_allow_fp16")) {
    options.allow_fp16 = true;
  }

  if (params.Get<bool>("nnapi_allow_dynamic_dimensions")) {
    options.allow_dynamic_dimensions = true;
  }

  if (params.Get<bool>("nnapi_use_burst_mode")) {
    options.use_burst_computation = true;
  }

  // Only set execution preference if user explicitly passes one. Otherwise,
  // leave it as whatever NNAPI has as the default. An unrecognised value is
  // reported and mapped to kUndefined.
  const std::string string_execution_preference =
      params.Get<std::string>("nnapi_execution_preference");
  if (!string_execution_preference.empty()) {
    tflite::StatefulNnApiDelegate::Options::ExecutionPreference
        execution_preference =
            tflite::StatefulNnApiDelegate::Options::kUndefined;
    if (string_execution_preference == "low_power") {
      execution_preference = tflite::StatefulNnApiDelegate::Options::kLowPower;
    } else if (string_execution_preference == "sustained_speed") {
      execution_preference =
          tflite::StatefulNnApiDelegate::Options::kSustainedSpeed;
    } else if (string_execution_preference == "fast_single_answer") {
      execution_preference =
          tflite::StatefulNnApiDelegate::Options::kFastSingleAnswer;
    } else if (string_execution_preference == "undefined") {
      execution_preference =
          tflite::StatefulNnApiDelegate::Options::kUndefined;
    } else {
      TFLITE_LOG(WARN) << "The provided value ("
                       << string_execution_preference
                       << ") is not a valid nnapi execution preference.";
    }
    options.execution_preference = execution_preference;
  }

  // Only set execution priority if user explicitly passes a recognised one.
  // Otherwise `options.execution_priority` keeps its default-constructed
  // value; in particular an unrecognised string must not overwrite it with an
  // arbitrary number that is not one of the ANEURALNETWORKS_PRIORITY_* values.
  const std::string string_execution_priority =
      params.Get<std::string>("nnapi_execution_priority");
  if (!string_execution_priority.empty()) {
    if (string_execution_priority == "default") {
      options.execution_priority = ANEURALNETWORKS_PRIORITY_DEFAULT;
    } else if (string_execution_priority == "low") {
      options.execution_priority = ANEURALNETWORKS_PRIORITY_LOW;
    } else if (string_execution_priority == "medium") {
      options.execution_priority = ANEURALNETWORKS_PRIORITY_MEDIUM;
    } else if (string_execution_priority == "high") {
      options.execution_priority = ANEURALNETWORKS_PRIORITY_HIGH;
    } else {
      TFLITE_LOG(WARN) << "The provided value (" << string_execution_priority
                       << ") is not a valid nnapi execution priority.";
    }
  }

  // A negative value leaves the delegate's own partition limit untouched.
  const int max_delegated_partitions =
      params.Get<int>("max_delegated_partitions");
  if (max_delegated_partitions >= 0) {
    options.max_number_delegated_partitions = max_delegated_partitions;
  }

  // Serialization: both the directory and the token are required.
  const std::string serialize_dir =
      params.Get<std::string>("delegate_serialize_dir");
  const std::string serialize_token =
      params.Get<std::string>("delegate_serialize_token");
  if (!serialize_dir.empty() && !serialize_token.empty()) {
    options.cache_dir = serialize_dir.c_str();
    options.model_token = serialize_token.c_str();
  }

  const std::string sl_path =
      params.Get<std::string>("nnapi_support_library_path");
  if (sl_path.empty()) {
    // No support library requested: use NnApiImplementation().
    const auto* nnapi_impl = NnApiImplementation();
    if (!nnapi_impl->nnapi_exists) {
      TFLITE_LOG(WARN)
          << "NNAPI acceleration is unsupported on this platform.";
      return null_delegate;
    }
    return TfLiteDelegatePtr(
        new StatefulNnApiDelegate(nnapi_impl, options),
        [](TfLiteDelegate* delegate) {
          delete static_cast<StatefulNnApiDelegate*>(delegate);
        });
  }

  auto nnapi_sl = nnapi::loadNnApiSupportLibrary(sl_path);
  if (!nnapi_sl) {
    TFLITE_LOG(WARN) << "Couldn't load NNAPI support library from path: "
                     << sl_path;
    return null_delegate;
  }
  // Ownership of the support library moves to the delegate's deleter, which
  // destroys the delegate before the library it depends on.
  return TfLiteDelegatePtr(
      new NnApiSupportLibraryDelegate(nnapi_sl.release(), options),
      [](TfLiteDelegate* delegate) {
        NnApiSupportLibraryDelegate* sl_delegate =
            static_cast<NnApiSupportLibraryDelegate*>(delegate);
        const NnApiSupportLibrary* sl = sl_delegate->get_nnapi_sl();
        delete sl_delegate;
        delete sl;
      });
}

std::pair<TfLiteDelegatePtr, int>
NnapiDelegateProvider::CreateRankedTfLiteDelegate(
    const ToolParams& params) const {
  auto ptr = CreateTfLiteDelegate(params);
  return std::make_pair(std::move(ptr), params.GetPosition<bool>("use_nnapi"));
}

}  // namespace tools
}  // namespace tflite