Add Tensorflow Lite Hexagon Delegate which accelerate graph inference on Hexagon NN for Snapdragon Hexagon DSPs
PiperOrigin-RevId: 285512192 Change-Id: Id0f1887dff0c0605507495691dbccae07ce8dea9
This commit is contained in:
parent
0505a9e2cb
commit
8e7ed7ee5a
110
tensorflow/lite/experimental/delegates/hexagon/BUILD
Normal file
110
tensorflow/lite/experimental/delegates/hexagon/BUILD
Normal file
@ -0,0 +1,110 @@
|
|||||||
|
# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
# ==============================================================================
|
||||||
|
|
||||||
|
load("//tensorflow/lite:build_def.bzl", "tflite_copts", "tflite_linkopts")
|
||||||
|
|
||||||
|
package(
|
||||||
|
default_visibility = [
|
||||||
|
"//visibility:public",
|
||||||
|
],
|
||||||
|
licenses = ["notice"], # Apache 2.0
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "hexagon_implementation",
|
||||||
|
srcs = ["hexagon_implementation.cc"],
|
||||||
|
hdrs = [
|
||||||
|
"hexagon_implementation.h",
|
||||||
|
"hexagon_nn_interface.h",
|
||||||
|
],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
"//tensorflow/lite:minimal_logging",
|
||||||
|
"//tensorflow/lite/experimental/delegates/hexagon/hexagon_nn:hexagon_nn_header",
|
||||||
|
"//tensorflow/lite/kernels/internal:compatibility",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "hexagon_delegate_kernel",
|
||||||
|
srcs = [
|
||||||
|
"hexagon_delegate.h",
|
||||||
|
"hexagon_delegate_kernel.cc",
|
||||||
|
],
|
||||||
|
hdrs = ["hexagon_delegate_kernel.h"],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
":hexagon_implementation",
|
||||||
|
":utils",
|
||||||
|
"//tensorflow/lite:kernel_api",
|
||||||
|
"//tensorflow/lite/c:common",
|
||||||
|
"//tensorflow/lite/experimental/delegates/hexagon/builders:op_builder",
|
||||||
|
"//tensorflow/lite/experimental/delegates/hexagon/hexagon_nn:hexagon_nn_header",
|
||||||
|
"//tensorflow/lite/schema:schema_fbs",
|
||||||
|
"@hexagon_nn//:hexagon_nn_ops",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "hexagon_delegate",
|
||||||
|
srcs = ["hexagon_delegate.cc"],
|
||||||
|
hdrs = ["hexagon_delegate.h"],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
":hexagon_delegate_kernel",
|
||||||
|
":hexagon_implementation",
|
||||||
|
":utils",
|
||||||
|
"//tensorflow/lite:kernel_api",
|
||||||
|
"//tensorflow/lite/c:common",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "utils",
|
||||||
|
srcs = ["utils.cc"],
|
||||||
|
hdrs = ["utils.h"],
|
||||||
|
copts = tflite_copts(),
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
"//tensorflow/lite:kernel_api",
|
||||||
|
"//tensorflow/lite/c:common",
|
||||||
|
"//tensorflow/lite/kernels:kernel_util",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_test(
|
||||||
|
name = "utils_test",
|
||||||
|
srcs = ["utils_test.cc"],
|
||||||
|
linkopts = tflite_linkopts() + ["-lm"],
|
||||||
|
deps = [
|
||||||
|
":utils",
|
||||||
|
"//tensorflow/lite/c:common",
|
||||||
|
"@com_google_googletest//:gtest_main",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
exports_files(["version_script.lds"])
|
99
tensorflow/lite/experimental/delegates/hexagon/README.md
Normal file
99
tensorflow/lite/experimental/delegates/hexagon/README.md
Normal file
@ -0,0 +1,99 @@
|
|||||||
|
# Hexagon Delegate
|
||||||
|
|
||||||
|
Experimental delegate which uses Hexagon SDK to delegate the processing
|
||||||
|
to QC DSP.
|
||||||
|
Note that we only support quantized models, since the DSP is efficient
|
||||||
|
with quantized versions. So all op support is for quantized versions.
|
||||||
|
|
||||||
|
Usage:
|
||||||
|
|
||||||
|
- Add dependency on hexagon_delegate rule.
|
||||||
|
|
||||||
|
- Code change example:
|
||||||
|
|
||||||
|
```
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_delegate.h"
|
||||||
|
|
||||||
|
// Assuming shared libraries are under "/data/local/tmp/"
|
||||||
|
// If files are packaged with native lib in android App then it
|
||||||
|
// will typically be equivalent to the path provided by
|
||||||
|
// "getContext().getApplicationInfo().nativeLibraryDir"
|
||||||
|
const char[] library_directory_path = "/data/local/tmp/";
|
||||||
|
TfLiteHexagonInitWithPath(library_directory_path); // Needed once at startup.
|
||||||
|
::tflite::TfLiteHexagonDelegateOptions params = {0};
|
||||||
|
// 'delegate_ptr' Need to outlive the interpreter. For example,
|
||||||
|
// If use case will need to resize input or anything that can trigger
|
||||||
|
// re-applying delegates then 'delegate_ptr' need to outlive the interpreter.
|
||||||
|
auto* delegate_ptr = ::tflite::TfLiteHexagonDelegateCreate(¶ms);
|
||||||
|
Interpreter::TfLiteDelegatePtr delegate(delegate_ptr,
|
||||||
|
[](TfLiteDelegate* delegate) {
|
||||||
|
::tflite::TfLiteHexagonDelegateDelete(delegate);
|
||||||
|
});
|
||||||
|
interpreter->ModifyGraphWithDelegate(delegate.get());
|
||||||
|
TfLiteHexagonTearDown(); // Needed once at end of app/DSP usage.
|
||||||
|
```
|
||||||
|
|
||||||
|
* Shared libraries:
|
||||||
|
- 'libhexagon_interface.so' which holds the interface that the delegate uses.
|
||||||
|
It must be available if you linked the hexagon_delegate library to TFLite.
|
||||||
|
You can load it either from shell by overriding
|
||||||
|
LD_LIBRARY_PATH=$LD_LIBRARY_PATH:"path to the so",
|
||||||
|
or add it inside your apk in a way it is available.
|
||||||
|
- 'libhexagon_nn_skel(_v65/_v66).so' which holds the DSP code.
|
||||||
|
Use TfLiteHexagonInitWithPath(..) and provide the path to the directory
|
||||||
|
which holds the shared libraries for the Hexagon NN on device.
|
||||||
|
If you're using TfLiteHexagonInit() then
|
||||||
|
You will need to set environment variable "ADSP_LIBRARY_PATH" to
|
||||||
|
"path_to_the_lib";/system/lib/rfsa/adsp;/system/vendor/lib/rfsa/adsp;/dsp
|
||||||
|
Note that separator here is ';' not ':'
|
||||||
|
You can push all 3 files, and the library will pick the one needed based
|
||||||
|
on the runtime. Or if you are sure of what you will use on the device then
|
||||||
|
push only one of them.
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
## Supported Ops
|
||||||
|
|
||||||
|
Hexagon only supports ops that have inputs/outputs of <= 4 dimensions.
|
||||||
|
The following operations have been implemented, with a few constraints that
|
||||||
|
are verified in `IsNodeSupportedByHexagon`:
|
||||||
|
|
||||||
|
* Add
|
||||||
|
* ArgMax
|
||||||
|
* ArgMin
|
||||||
|
* AveragePool2D:
|
||||||
|
* Constraints:
|
||||||
|
- No Activation
|
||||||
|
* Concat
|
||||||
|
* Conv2D:
|
||||||
|
* Constraints:
|
||||||
|
- stride width/height <= 3
|
||||||
|
* DepthwiseConv2D:
|
||||||
|
* Constraints:
|
||||||
|
- Filter width == 3
|
||||||
|
- depth_multiplier == 1
|
||||||
|
- dilation only supported when stride == 1
|
||||||
|
- Otherwise, stride height/width <= 3
|
||||||
|
* FullyConnected (without any activation)
|
||||||
|
* L2Normalization (without any activation)
|
||||||
|
* Logistic (aka Sigmoid)
|
||||||
|
* MaxPool2D (without any activation) (b/129276536)
|
||||||
|
* Mul (without any activation) (b/129276536)
|
||||||
|
* Neg
|
||||||
|
* Pad: Only supports 0 padding (b/139277813)
|
||||||
|
* Relu
|
||||||
|
* Relu6
|
||||||
|
* Reshape
|
||||||
|
* Resize Bilinear:
|
||||||
|
* Constraints:
|
||||||
|
- Requested size <= 65 (b/143105433)
|
||||||
|
* Resize Nearest Neighbor
|
||||||
|
* SoftMax
|
||||||
|
* Split
|
||||||
|
* Sub
|
||||||
|
* Tanh
|
||||||
|
* Transpose
|
||||||
|
* TransposeConv2D:
|
||||||
|
* Constraints:
|
||||||
|
- stride height/width <= 3
|
||||||
|
- dilation height/width == 1
|
@ -0,0 +1,78 @@
|
|||||||
|
package(
|
||||||
|
default_visibility = [
|
||||||
|
"//visibility:public",
|
||||||
|
],
|
||||||
|
licenses = ["notice"], # Apache 2.0
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "op_builder",
|
||||||
|
srcs = [
|
||||||
|
"activation_builder.cc",
|
||||||
|
"arg_min_max_builder.cc",
|
||||||
|
"arithmetic_builder.cc",
|
||||||
|
"concat_builder.cc",
|
||||||
|
"conv_2d_builder.cc",
|
||||||
|
"l2_normalization_builder.cc",
|
||||||
|
"matmul_builder.cc",
|
||||||
|
"neg_op_builder.cc",
|
||||||
|
"op_builder.cc",
|
||||||
|
"pad_builder.cc",
|
||||||
|
"pool_2d_builder.cc",
|
||||||
|
"reduce_builder.cc",
|
||||||
|
"reshape_builder.cc",
|
||||||
|
"resize_bilinear_builder.cc",
|
||||||
|
"resize_nearest_neighbor_builder.cc",
|
||||||
|
"softmax_builder.cc",
|
||||||
|
"split_builder.cc",
|
||||||
|
"transpose_builder.cc",
|
||||||
|
"transpose_conv_2d_builder.cc",
|
||||||
|
],
|
||||||
|
hdrs = [
|
||||||
|
"activation_builder.h",
|
||||||
|
"arg_min_max_builder.h",
|
||||||
|
"arithmetic_builder.h",
|
||||||
|
"concat_builder.h",
|
||||||
|
"conv_2d_builder.h",
|
||||||
|
"l2_normalization_builder.h",
|
||||||
|
"matmul_builder.h",
|
||||||
|
"neg_op_builder.h",
|
||||||
|
"op_builder.h",
|
||||||
|
"pad_builder.h",
|
||||||
|
"pool_2d_builder.h",
|
||||||
|
"reduce_builder.h",
|
||||||
|
"reshape_builder.h",
|
||||||
|
"resize_bilinear_builder.h",
|
||||||
|
"resize_nearest_neighbor_builder.h",
|
||||||
|
"softmax_builder.h",
|
||||||
|
"split_builder.h",
|
||||||
|
"transpose_builder.h",
|
||||||
|
"transpose_conv_2d_builder.h",
|
||||||
|
],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
":op_factory",
|
||||||
|
"//tensorflow/lite:kernel_api",
|
||||||
|
"//tensorflow/lite/c:common",
|
||||||
|
"//tensorflow/lite/experimental/delegates/hexagon:hexagon_implementation",
|
||||||
|
"//tensorflow/lite/experimental/delegates/hexagon/hexagon_nn:hexagon_nn_header",
|
||||||
|
"//tensorflow/lite/kernels:kernel_util",
|
||||||
|
"//tensorflow/lite/kernels:padding",
|
||||||
|
"//tensorflow/lite/kernels/internal:optimized_base",
|
||||||
|
"@hexagon_nn//:hexagon_nn_ops",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "op_factory",
|
||||||
|
hdrs = ["op_factory.h"],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
],
|
||||||
|
)
|
@ -0,0 +1,87 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/activation_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
TfLiteStatus ActivationOpBuilder::PopulateSubGraph(
|
||||||
|
const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
static int scalar_shape[] = {1, 1, 1, 1};
|
||||||
|
int tensor_id;
|
||||||
|
|
||||||
|
// Input data tensor.
|
||||||
|
tensor_id = inputs->data[0];
|
||||||
|
const auto& input_tensor = context->tensors[tensor_id];
|
||||||
|
AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
|
||||||
|
ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max());
|
||||||
|
auto* input_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
scalar_shape, reinterpret_cast<char*>(&input_min_), sizeof(input_min_));
|
||||||
|
auto* input_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
scalar_shape, reinterpret_cast<char*>(&input_max_), sizeof(input_max_));
|
||||||
|
AddInput(TensorID(input_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(input_max_const->GetID(), 0));
|
||||||
|
|
||||||
|
if (op_node_.op_type == OP_QuantizedReluX_8) {
|
||||||
|
auto* relu_value_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
scalar_shape, reinterpret_cast<char*>(&relu_value_),
|
||||||
|
sizeof(relu_value_));
|
||||||
|
AddInput(TensorID(relu_value_const->GetID(), 0));
|
||||||
|
}
|
||||||
|
|
||||||
|
// Hexagon outputs for this node.
|
||||||
|
int output_batch_size, output_height_size, output_width_size,
|
||||||
|
output_depth_size;
|
||||||
|
GetDims(&output_batch_size, &output_height_size, &output_width_size,
|
||||||
|
&output_depth_size, context->tensors[outputs->data[0]].dims);
|
||||||
|
node_output_ = AddOutput(sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size, output_height_size,
|
||||||
|
output_width_size, output_depth_size});
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
TfLiteStatus ActivationOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
// Should be only 1 output.
|
||||||
|
graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
|
||||||
|
node_output_.second);
|
||||||
|
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
ActivationOpBuilder::~ActivationOpBuilder() {}
|
||||||
|
|
||||||
|
OpBuilder* CreateActivationBuilder(GraphBuilder* graph_builder, int op_type) {
|
||||||
|
return new ActivationOpBuilder(graph_builder, op_type);
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,52 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ACTIVATION_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ACTIVATION_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class ActivationOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit ActivationOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
explicit ActivationOpBuilder(GraphBuilder* graph_builder, int op_type,
|
||||||
|
int relu_value)
|
||||||
|
: OpBuilder(graph_builder, op_type), relu_value_(relu_value) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~ActivationOpBuilder() override;
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
float input_min_, input_max_;
|
||||||
|
float relu_value_ = 6;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ACTIVATION_BUILDER_H_
|
@ -0,0 +1,98 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/arg_min_max_builder.h"
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
TfLiteStatus ArgMinMaxOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
static int quant_bound_shape[] = {1, 1, 1, 1};
|
||||||
|
|
||||||
|
if (inputs->size != 2) {
|
||||||
|
context->ReportError(context, "Expecting 2 inputs %d != 2\n", inputs->size);
|
||||||
|
return kTfLiteError;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Input data tensor.
|
||||||
|
int input_tensor_id = inputs->data[0];
|
||||||
|
const auto& input_tensor = context->tensors[input_tensor_id];
|
||||||
|
AddInput(graph_builder_->GetHexagonTensorId(input_tensor_id));
|
||||||
|
|
||||||
|
// Axis tensor.
|
||||||
|
const int axis_tensor_id = inputs->data[1];
|
||||||
|
const auto& axis = context->tensors[axis_tensor_id];
|
||||||
|
if (axis.allocation_type != kTfLiteMmapRo) {
|
||||||
|
context->ReportError(context,
|
||||||
|
"Axis tensor doesn't have correct allocation type: %s",
|
||||||
|
axis.name);
|
||||||
|
return kTfLiteError;
|
||||||
|
}
|
||||||
|
|
||||||
|
int axis_value = axis.data.i32[0];
|
||||||
|
if (axis_value < 0) {
|
||||||
|
axis_value += input_tensor.dims->size;
|
||||||
|
}
|
||||||
|
auto* input_axis_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&axis_value), sizeof(int32_t));
|
||||||
|
AddInput(TensorID(input_axis_const->GetID(), 0));
|
||||||
|
|
||||||
|
// Compute Min/Max
|
||||||
|
TF_LITE_ENSURE_STATUS(
|
||||||
|
ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
auto* input_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input_min_),
|
||||||
|
sizeof(input_min_));
|
||||||
|
auto* input_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input_max_),
|
||||||
|
sizeof(input_max_));
|
||||||
|
|
||||||
|
AddInput(TensorID(input_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(input_max_const->GetID(), 0));
|
||||||
|
|
||||||
|
// Output Node
|
||||||
|
int output_batch_size, output_height_size, output_width_size,
|
||||||
|
output_depth_size;
|
||||||
|
GetDims(&output_batch_size, &output_height_size, &output_width_size,
|
||||||
|
&output_depth_size, context->tensors[outputs->data[0]].dims);
|
||||||
|
node_output_ = AddOutput(sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size, output_height_size,
|
||||||
|
output_width_size, output_depth_size});
|
||||||
|
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
TfLiteStatus ArgMinMaxOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
// Should be only 1 output.
|
||||||
|
graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
|
||||||
|
node_output_.second);
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
ArgMinMaxOpBuilder::~ArgMinMaxOpBuilder() {}
|
||||||
|
|
||||||
|
OpBuilder* CreateArgMinMaxOpBuilder(GraphBuilder* graph_builder, int op_type) {
|
||||||
|
return new ArgMinMaxOpBuilder(graph_builder, op_type);
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,46 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ARG_MIN_MAX_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ARG_MIN_MAX_BUILDER_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class ArgMinMaxOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit ArgMinMaxOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~ArgMinMaxOpBuilder() override;
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
float input_min_, input_max_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ARG_MIN_MAX_BUILDER_H_
|
@ -0,0 +1,127 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/arithmetic_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
TfLiteStatus ArithmeticOpBuilder::PopulateSubGraph(
|
||||||
|
const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
static int quant_bound_shape[] = {1, 1, 1, 1};
|
||||||
|
int tensor_id;
|
||||||
|
|
||||||
|
// First input data tensor.
|
||||||
|
tensor_id = inputs->data[0];
|
||||||
|
const auto& input1_tensor = context->tensors[tensor_id];
|
||||||
|
AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
|
||||||
|
TF_LITE_ENSURE_STATUS(
|
||||||
|
ComputeMinAndMaxQuantValues(input1_tensor, &input1_min_, &input1_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
auto* input1_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input1_min_),
|
||||||
|
sizeof(input1_min_));
|
||||||
|
auto* input1_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input1_max_),
|
||||||
|
sizeof(input1_max_));
|
||||||
|
|
||||||
|
// Second input data tensor.
|
||||||
|
tensor_id = inputs->data[1];
|
||||||
|
const auto& input2_tensor = context->tensors[tensor_id];
|
||||||
|
// TODO(karimnosseir): Have this as util to generalize to all ops.
|
||||||
|
if (input2_tensor.allocation_type == kTfLiteMmapRo) {
|
||||||
|
auto* const_input_node =
|
||||||
|
graph_builder_->AddConstNodeWithData(tensor_id, input2_tensor);
|
||||||
|
graph_builder_->AddTensorWithID(tensor_id, const_input_node->GetID(), 0);
|
||||||
|
}
|
||||||
|
AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
|
||||||
|
TF_LITE_ENSURE_STATUS(
|
||||||
|
ComputeMinAndMaxQuantValues(input2_tensor, &input2_min_, &input2_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
auto* input2_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input2_min_),
|
||||||
|
sizeof(input2_min_));
|
||||||
|
auto* input2_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input2_max_),
|
||||||
|
sizeof(input2_max_));
|
||||||
|
|
||||||
|
// Min/max values for input tensors.
|
||||||
|
AddInput(TensorID(input1_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(input1_max_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(input2_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(input2_max_const->GetID(), 0));
|
||||||
|
|
||||||
|
// Output min/max as inputs, only if it's an Add node.
|
||||||
|
if (op_node_.op_type == OP_QuantizedAdd_8p8to8) {
|
||||||
|
output_min_ = 0;
|
||||||
|
output_max_ = 0;
|
||||||
|
TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
|
||||||
|
context->tensors[outputs->data[0]], &output_min_, &output_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
if (output_max_ != 0) {
|
||||||
|
auto* output_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&output_min_),
|
||||||
|
sizeof(output_min_));
|
||||||
|
auto* output_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&output_max_),
|
||||||
|
sizeof(output_max_));
|
||||||
|
AddInput(TensorID(output_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(output_max_const->GetID(), 0));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Hexagon outputs for this node.
|
||||||
|
int output_batch_size, output_height_size, output_width_size,
|
||||||
|
output_depth_size;
|
||||||
|
GetDims(&output_batch_size, &output_height_size, &output_width_size,
|
||||||
|
&output_depth_size, context->tensors[outputs->data[0]].dims);
|
||||||
|
node_output_ = AddOutput(sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size, output_height_size,
|
||||||
|
output_width_size, output_depth_size});
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
TfLiteStatus ArithmeticOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
// Should be only 1 output.
|
||||||
|
graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
|
||||||
|
node_output_.second);
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
ArithmeticOpBuilder::~ArithmeticOpBuilder() {}
|
||||||
|
|
||||||
|
OpBuilder* CreateArithmeticBuilder(GraphBuilder* graph_builder, int op_type) {
|
||||||
|
return new ArithmeticOpBuilder(graph_builder, op_type);
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,49 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ARITHMETIC_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ARITHMETIC_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class ArithmeticOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit ArithmeticOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~ArithmeticOpBuilder() override;
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
float input1_min_, input1_max_, input2_min_, input2_max_, output_min_,
|
||||||
|
output_max_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_ARITHMETIC_BUILDER_H_
|
@ -0,0 +1,133 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/concat_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
TfLiteStatus ConcatOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
static int quant_bound_shape[] = {1, 1, 1, 1};
|
||||||
|
|
||||||
|
// Only axis 3 is supported.
|
||||||
|
const TfLiteConcatenationParams* concat_params =
|
||||||
|
reinterpret_cast<const TfLiteConcatenationParams*>(builtin_data_);
|
||||||
|
auto* axis_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, (char*)&concat_params->axis,
|
||||||
|
sizeof(concat_params->axis));
|
||||||
|
AddInput(TensorID(axis_const->GetID(), 0));
|
||||||
|
|
||||||
|
int tensor_id;
|
||||||
|
|
||||||
|
// Input data tensors.
|
||||||
|
input_minima_.reserve(inputs->size);
|
||||||
|
input_maxima_.reserve(inputs->size);
|
||||||
|
for (int i = 0; i < inputs->size; ++i) {
|
||||||
|
tensor_id = inputs->data[i];
|
||||||
|
float data_min, data_max;
|
||||||
|
const auto& data_tensor = context->tensors[tensor_id];
|
||||||
|
AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
|
||||||
|
TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
|
||||||
|
data_tensor, &data_min, &data_max, std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
input_minima_.push_back(data_min);
|
||||||
|
input_maxima_.push_back(data_max);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Minima tensors.
|
||||||
|
for (int i = 0; i < input_minima_.size(); ++i) {
|
||||||
|
auto* data_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input_minima_[i]),
|
||||||
|
sizeof(input_minima_[i]));
|
||||||
|
AddInput(TensorID(data_min_const->GetID(), 0));
|
||||||
|
}
|
||||||
|
|
||||||
|
// Maxima tensors.
|
||||||
|
for (int i = 0; i < input_minima_.size(); ++i) {
|
||||||
|
auto* data_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, reinterpret_cast<char*>(&input_maxima_[i]),
|
||||||
|
sizeof(input_maxima_[i]));
|
||||||
|
AddInput(TensorID(data_max_const->GetID(), 0));
|
||||||
|
}
|
||||||
|
|
||||||
|
// Hexagon outputs for this node.
|
||||||
|
int output_batch_size, output_height_size, output_width_size,
|
||||||
|
output_depth_size;
|
||||||
|
GetDims(&output_batch_size, &output_height_size, &output_width_size,
|
||||||
|
&output_depth_size, context->tensors[outputs->data[0]].dims);
|
||||||
|
|
||||||
|
// We requantize the output from concat to the range expected by TFLite.
|
||||||
|
// Otherwise, we see accuracy issues for cases where the inputs have different
|
||||||
|
// min/max bounds.
|
||||||
|
TensorID concat_out = AddOutput(sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size, output_height_size,
|
||||||
|
output_width_size, output_depth_size});
|
||||||
|
const auto& concat_out_min = AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
const auto& concat_out_max = AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
|
||||||
|
// Output min/max for requantization.
|
||||||
|
TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
|
||||||
|
context->tensors[outputs->data[0]], &output_min_, &output_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
auto* output_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, (char*)&output_min_, sizeof(output_min_));
|
||||||
|
auto* output_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape, (char*)&output_max_, sizeof(output_max_));
|
||||||
|
|
||||||
|
auto* requantize_op = graph_builder_->AddNode();
|
||||||
|
requantize_op->SetOpType(OP_Requantize_8to8);
|
||||||
|
requantize_op->AddInput(concat_out);
|
||||||
|
requantize_op->AddInput(concat_out_min);
|
||||||
|
requantize_op->AddInput(concat_out_max);
|
||||||
|
requantize_op->AddInput(TensorID(output_min_const->GetID(), 0));
|
||||||
|
requantize_op->AddInput(TensorID(output_max_const->GetID(), 0));
|
||||||
|
node_output_ =
|
||||||
|
requantize_op->AddOutput(sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size, output_height_size,
|
||||||
|
output_width_size, output_depth_size});
|
||||||
|
requantize_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
requantize_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
TfLiteStatus ConcatOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
// Should be only 1 output.
|
||||||
|
graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
|
||||||
|
node_output_.second);
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
ConcatOpBuilder::~ConcatOpBuilder() {}
|
||||||
|
|
||||||
|
OpBuilder* CreateConcatBuilder(GraphBuilder* graph_builder, int op_type) {
|
||||||
|
return new ConcatOpBuilder(graph_builder, op_type);
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,50 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_CONCAT_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_CONCAT_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class ConcatOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit ConcatOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~ConcatOpBuilder() override;
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
std::vector<float> input_minima_;
|
||||||
|
std::vector<float> input_maxima_;
|
||||||
|
float output_min_, output_max_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_CONCAT_BUILDER_H_
|
@ -0,0 +1,378 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/conv_2d_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/optimized/optimized_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
namespace {
|
||||||
|
|
||||||
|
// Dilated Depthwise Convolution performs SpaceToBatchND & BatchToSpaceND before
|
||||||
|
// and after the op respectively.
|
||||||
|
// This helper computes the paddings param for SpaceToBatchND and crops param
|
||||||
|
// for BatchToSpaceND.
|
||||||
|
//
|
||||||
|
// Inspired by tf.nn.with_space_to_batch & tf.required_space_to_batch_paddings.
|
||||||
|
void ComputeSpaceToBatchParams(int input_height, int input_width,
|
||||||
|
int weights_height, int weights_width,
|
||||||
|
const std::vector<int>& dilation_factors_h_w,
|
||||||
|
const TfLitePadding padding_type,
|
||||||
|
std::vector<int>* paddings,
|
||||||
|
std::vector<int>* crops) {
|
||||||
|
// Base paddings depend on padding applied to the Depthwise Conv op.
|
||||||
|
// 4-element array: {top, bottom, left, right}.
|
||||||
|
std::vector<int> base_paddings(4, 0);
|
||||||
|
if (padding_type == kTfLitePaddingSame) {
|
||||||
|
const int dilated_weights_h =
|
||||||
|
dilation_factors_h_w[0] * (weights_height - 1) + 1;
|
||||||
|
const int dilated_weights_w =
|
||||||
|
dilation_factors_h_w[1] * (weights_width - 1) + 1;
|
||||||
|
base_paddings[0] = (dilated_weights_h - 1) / 2;
|
||||||
|
base_paddings[1] = dilated_weights_h - 1 - (dilated_weights_h - 1) / 2;
|
||||||
|
base_paddings[2] = (dilated_weights_w - 1) / 2;
|
||||||
|
base_paddings[3] = dilated_weights_w - 1 - (dilated_weights_w - 1) / 2;
|
||||||
|
}
|
||||||
|
|
||||||
|
// paddings represents {pad_top, pad_bottom, pad_left, pad_right}.
|
||||||
|
paddings->resize(4, 0);
|
||||||
|
// crops represents {crop_top, crop_bottom, crop_left, crop_right}.
|
||||||
|
crops->resize(4, 0);
|
||||||
|
|
||||||
|
// Logic for computing paddings & crops follows.
|
||||||
|
// Taken from tf.required_space_to_batch_paddings, but without array
|
||||||
|
// operations since we only deal with 2 dimensions.
|
||||||
|
int pad_start_h = base_paddings[0];
|
||||||
|
int pad_start_w = base_paddings[2];
|
||||||
|
int orig_pad_end_h = base_paddings[1];
|
||||||
|
int orig_pad_end_w = base_paddings[3];
|
||||||
|
int full_input_h = input_height + pad_start_h + orig_pad_end_h;
|
||||||
|
int full_input_w = input_width + pad_start_w + orig_pad_end_w;
|
||||||
|
int pad_end_extra_h =
|
||||||
|
(dilation_factors_h_w[0] - full_input_h % dilation_factors_h_w[0]) %
|
||||||
|
dilation_factors_h_w[0];
|
||||||
|
int pad_end_extra_w =
|
||||||
|
(dilation_factors_h_w[1] - full_input_w % dilation_factors_h_w[1]) %
|
||||||
|
dilation_factors_h_w[1];
|
||||||
|
int pad_end_h = orig_pad_end_h + pad_end_extra_h;
|
||||||
|
int pad_end_w = orig_pad_end_w + pad_end_extra_w;
|
||||||
|
|
||||||
|
// Assign values.
|
||||||
|
(*paddings)[0] = pad_start_h;
|
||||||
|
(*paddings)[1] = pad_end_h;
|
||||||
|
(*paddings)[2] = pad_start_w;
|
||||||
|
(*paddings)[3] = pad_end_w;
|
||||||
|
(*crops)[0] = 0;
|
||||||
|
(*crops)[1] = pad_end_extra_h;
|
||||||
|
(*crops)[2] = 0;
|
||||||
|
(*crops)[3] = pad_end_extra_w;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Computes output dimensions for the SpaceToBatchND op used in the dilated
|
||||||
|
// Depthwise Conv case.
|
||||||
|
// space_to_batch_paddings should be in format {top, bottom, left, right}.
|
||||||
|
// These are computed from the documentation for SpaceToBatchND_8's output.
|
||||||
|
void PopulateSpaceToBatchOutputDims(
|
||||||
|
int input_batch_size, int input_height_size, int input_width_size,
|
||||||
|
int input_depth_size, const std::vector<int>& dilation_factors_h_w,
|
||||||
|
const std::vector<int>& space_to_batch_paddings,
|
||||||
|
std::vector<int>* space_to_batch_output_dims) {
|
||||||
|
// Batches.
|
||||||
|
space_to_batch_output_dims->push_back(
|
||||||
|
input_batch_size * dilation_factors_h_w[0] * dilation_factors_h_w[1]);
|
||||||
|
// Height.
|
||||||
|
space_to_batch_output_dims->push_back((space_to_batch_paddings[0] +
|
||||||
|
input_height_size +
|
||||||
|
space_to_batch_paddings[1]) /
|
||||||
|
dilation_factors_h_w[0]);
|
||||||
|
// Width.
|
||||||
|
space_to_batch_output_dims->push_back((space_to_batch_paddings[2] +
|
||||||
|
input_width_size +
|
||||||
|
space_to_batch_paddings[3]) /
|
||||||
|
dilation_factors_h_w[1]);
|
||||||
|
// Depth.
|
||||||
|
space_to_batch_output_dims->push_back(input_depth_size);
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
TfLiteStatus Conv2dOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
static std::vector<int> quant_bound_shape = {1, 1, 1, 1};
|
||||||
|
static std::vector<int> dilation_factors_shape = {1, 1, 1, 2};
|
||||||
|
static std::vector<int> paddings_shape = {1, 1, 2, 2};
|
||||||
|
|
||||||
|
// Input data tensor.
|
||||||
|
const auto& data_tensor = context->tensors[inputs->data[0]];
|
||||||
|
TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
|
||||||
|
data_tensor, &data_min_, &data_max_, std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
auto* data_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&data_min_, sizeof(data_min_));
|
||||||
|
auto* data_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&data_max_, sizeof(data_max_));
|
||||||
|
|
||||||
|
// Gather information about the Convolution operations.
|
||||||
|
TfLitePadding padding_type = kTfLitePaddingUnknown;
|
||||||
|
int stride_height = 0;
|
||||||
|
int stride_width = 0;
|
||||||
|
bool is_dilated_depthwise_conv = false;
|
||||||
|
if (op_node_.op_type == OP_Supernode_8x8p32to8) {
|
||||||
|
const TfLiteConvParams* conv_params =
|
||||||
|
reinterpret_cast<const TfLiteConvParams*>(builtin_data_);
|
||||||
|
stride_height = conv_params->stride_height;
|
||||||
|
stride_width = conv_params->stride_width;
|
||||||
|
padding_type = conv_params->padding;
|
||||||
|
} else if (op_node_.op_type == OP_DepthwiseSupernode_8x8p32to8) {
|
||||||
|
const TfLiteDepthwiseConvParams* conv_params =
|
||||||
|
reinterpret_cast<const TfLiteDepthwiseConvParams*>(builtin_data_);
|
||||||
|
stride_height = conv_params->stride_height;
|
||||||
|
stride_width = conv_params->stride_width;
|
||||||
|
padding_type = conv_params->padding;
|
||||||
|
// We only support dilation for DepthwiseConv.
|
||||||
|
if (conv_params->dilation_height_factor > 1 ||
|
||||||
|
conv_params->dilation_width_factor > 1) {
|
||||||
|
is_dilated_depthwise_conv = true;
|
||||||
|
dilation_factors_h_w_.push_back(conv_params->dilation_height_factor);
|
||||||
|
dilation_factors_h_w_.push_back(conv_params->dilation_width_factor);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Weights tensor
|
||||||
|
const auto& weights_tensor = context->tensors[inputs->data[1]];
|
||||||
|
if (weights_tensor.allocation_type != kTfLiteMmapRo) {
|
||||||
|
context->ReportError(
|
||||||
|
context, "Weights tensor doesn't have correct allocation type: %s",
|
||||||
|
weights_tensor.name);
|
||||||
|
return kTfLiteError;
|
||||||
|
}
|
||||||
|
int weights_batch_size, weights_height_size, weights_width_size,
|
||||||
|
weights_depth_size;
|
||||||
|
// Hexagon lib expects the weight tensor in HWCN, TFLite uses NHWC.
|
||||||
|
// Transpose NHWC -> HWCN
|
||||||
|
GetDims(&weights_batch_size, &weights_height_size, &weights_width_size,
|
||||||
|
&weights_depth_size, weights_tensor.dims);
|
||||||
|
weight_shape_ = {weights_height_size, weights_width_size, weights_depth_size,
|
||||||
|
weights_batch_size};
|
||||||
|
RuntimeShape nhwc_shape({weights_batch_size, weights_height_size,
|
||||||
|
weights_width_size, weights_depth_size});
|
||||||
|
RuntimeShape hwcn_shape({weights_height_size, weights_width_size,
|
||||||
|
weights_depth_size, weights_batch_size});
|
||||||
|
std::vector<uint8_t> hwcn(NumElements(&weights_tensor));
|
||||||
|
TransposeParams transpose_params;
|
||||||
|
transpose_params.perm_count = 4;
|
||||||
|
transpose_params.perm[0] = 1;
|
||||||
|
transpose_params.perm[1] = 2;
|
||||||
|
transpose_params.perm[2] = 3;
|
||||||
|
transpose_params.perm[3] = 0;
|
||||||
|
optimized_ops::Transpose<uint8_t>(transpose_params, nhwc_shape,
|
||||||
|
weights_tensor.data.uint8, hwcn_shape,
|
||||||
|
hwcn.data());
|
||||||
|
// Quantization params for Weights tensor.
|
||||||
|
TF_LITE_ENSURE_STATUS(
|
||||||
|
ComputeMinAndMaxQuantValues(weights_tensor, &weights_min_, &weights_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
auto* weights_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&weights_min_, sizeof(weights_min_));
|
||||||
|
auto* weights_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&weights_max_, sizeof(weights_max_));
|
||||||
|
auto* const_weights_node = graph_builder_->AddConstNodeWithData(
|
||||||
|
weight_shape_.data(), (char*)hwcn.data(), hwcn.size() * sizeof(hwcn[0]));
|
||||||
|
graph_builder_->AddTensorWithID(inputs->data[1], const_weights_node->GetID(),
|
||||||
|
0);
|
||||||
|
|
||||||
|
// Stride node.
|
||||||
|
static int dummy = 0;
|
||||||
|
stride_shape_ = {1, stride_height, stride_width, 1};
|
||||||
|
auto* stride_node = graph_builder_->AddConstNodeWithData(
|
||||||
|
stride_shape_.data(), (char*)&dummy, sizeof(dummy));
|
||||||
|
|
||||||
|
// Output dimensions.
|
||||||
|
int output_batch_size, output_height_size, output_width_size,
|
||||||
|
output_depth_size;
|
||||||
|
GetDims(&output_batch_size, &output_height_size, &output_width_size,
|
||||||
|
&output_depth_size, context->tensors[outputs->data[0]].dims);
|
||||||
|
// Output min/max.
|
||||||
|
// TODO(b/129276536): Add support for other activations here. Current
|
||||||
|
// implementation assumes None/Relu.
|
||||||
|
TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
|
||||||
|
context->tensors[outputs->data[0]], &output_min_, &output_max_,
|
||||||
|
std::numeric_limits<uint8_t>::min(),
|
||||||
|
std::numeric_limits<uint8_t>::max()));
|
||||||
|
auto* output_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&output_min_, sizeof(output_min_));
|
||||||
|
auto* output_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&output_max_, sizeof(output_max_));
|
||||||
|
|
||||||
|
// Bias node.
|
||||||
|
const auto& bias_tensor = context->tensors[inputs->data[2]];
|
||||||
|
auto* bias_data_node =
|
||||||
|
graph_builder_->AddConstNodeWithData(inputs->data[2], bias_tensor);
|
||||||
|
TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
|
||||||
|
bias_tensor, &bias_min_, &bias_max_, std::numeric_limits<int32_t>::min(),
|
||||||
|
std::numeric_limits<int32_t>::max()));
|
||||||
|
auto* bias_min_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&bias_min_, sizeof(bias_min_));
|
||||||
|
auto* bias_max_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
quant_bound_shape.data(), (char*)&bias_max_, sizeof(bias_max_));
|
||||||
|
|
||||||
|
if (is_dilated_depthwise_conv) {
|
||||||
|
// For dilated Depthwise Conv, we convert this node into SpaceToBatchND, and
|
||||||
|
// then chain Supernode & BatchToSpaceND after it.
|
||||||
|
int input_batch_size, input_height_size, input_width_size, input_depth_size;
|
||||||
|
GetDims(&input_batch_size, &input_height_size, &input_width_size,
|
||||||
|
&input_depth_size, data_tensor.dims);
|
||||||
|
ComputeSpaceToBatchParams(
|
||||||
|
input_height_size, input_width_size, weights_height_size,
|
||||||
|
weights_width_size, dilation_factors_h_w_, padding_type,
|
||||||
|
&space_to_batch_paddings_, &batch_to_space_crops_);
|
||||||
|
auto* dilation_factors_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
dilation_factors_shape.data(), (char*)dilation_factors_h_w_.data(),
|
||||||
|
dilation_factors_h_w_.size() * sizeof(stride_height));
|
||||||
|
auto* paddings_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
paddings_shape.data(), (char*)space_to_batch_paddings_.data(),
|
||||||
|
space_to_batch_paddings_.size() * sizeof(stride_height));
|
||||||
|
auto* crops_const = graph_builder_->AddConstNodeWithData(
|
||||||
|
paddings_shape.data(), (char*)batch_to_space_crops_.data(),
|
||||||
|
batch_to_space_crops_.size() * sizeof(stride_height));
|
||||||
|
|
||||||
|
// 1. SpaceToBatch.
|
||||||
|
SetOpType(OP_SpaceToBatchND_8);
|
||||||
|
AddInput(graph_builder_->GetHexagonTensorId(inputs->data[0]));
|
||||||
|
AddInput(TensorID(dilation_factors_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(paddings_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(data_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(data_max_const->GetID(), 0));
|
||||||
|
std::vector<int> space_to_batch_output_dims;
|
||||||
|
PopulateSpaceToBatchOutputDims(
|
||||||
|
input_batch_size, input_height_size, input_width_size, input_depth_size,
|
||||||
|
dilation_factors_h_w_, space_to_batch_paddings_,
|
||||||
|
&space_to_batch_output_dims);
|
||||||
|
TensorID space_to_batch_op_out =
|
||||||
|
AddOutput(sizeof(uint8_t), 4, space_to_batch_output_dims);
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
|
||||||
|
// 2. Depthwise Conv.
|
||||||
|
auto* conv_op = graph_builder_->AddNode();
|
||||||
|
conv_op->SetOpType(OP_DepthwiseSupernode_8x8p32to8);
|
||||||
|
conv_op->AddInput(space_to_batch_op_out);
|
||||||
|
conv_op->AddInput(TensorID(const_weights_node->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(data_min_const->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(data_max_const->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(weights_min_const->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(weights_max_const->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(stride_node->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(bias_data_node->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(bias_min_const->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(bias_max_const->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(output_min_const->GetID(), 0));
|
||||||
|
conv_op->AddInput(TensorID(output_max_const->GetID(), 0));
|
||||||
|
// The padding is handled by the SpaceToBatch/BatchToSpace ops surrounding
|
||||||
|
// this node. Hence, this op's padding remains VALID only.
|
||||||
|
// tf.nn.with_space_to_batch's docs state the following pattern:
|
||||||
|
// """
|
||||||
|
// batch_to_space_nd(
|
||||||
|
// op(space_to_batch_nd(input, adjusted_dilation_rate, adjusted_paddings),
|
||||||
|
// num_spatial_dims,
|
||||||
|
// "VALID")
|
||||||
|
// adjusted_dilation_rate,
|
||||||
|
// adjusted_crops)
|
||||||
|
// """
|
||||||
|
conv_op->SetPaddingType(NN_PAD_VALID);
|
||||||
|
// These dimensions are probably a little excessive, but they upper-bound
|
||||||
|
// the possible output from DepthwiseConv.
|
||||||
|
// TODO(b/139955809): Find better bounds?
|
||||||
|
TensorID conv_output = conv_op->AddOutput(
|
||||||
|
sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size * dilation_factors_h_w_[0] *
|
||||||
|
dilation_factors_h_w_[1],
|
||||||
|
output_height_size, output_width_size, output_depth_size});
|
||||||
|
conv_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
conv_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
|
||||||
|
// 3. BatchToSpace.
|
||||||
|
auto* batch_to_space_op = graph_builder_->AddNode();
|
||||||
|
batch_to_space_op->SetOpType(OP_BatchToSpaceND_8);
|
||||||
|
batch_to_space_op->AddInput(conv_output);
|
||||||
|
batch_to_space_op->AddInput(TensorID(dilation_factors_const->GetID(), 0));
|
||||||
|
batch_to_space_op->AddInput(TensorID(crops_const->GetID(), 0));
|
||||||
|
batch_to_space_op->AddInput(TensorID(output_min_const->GetID(), 0));
|
||||||
|
batch_to_space_op->AddInput(TensorID(output_max_const->GetID(), 0));
|
||||||
|
node_output_ =
|
||||||
|
batch_to_space_op->AddOutput(sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size, output_height_size,
|
||||||
|
output_width_size, output_depth_size});
|
||||||
|
batch_to_space_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
batch_to_space_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
} else {
|
||||||
|
// Standard case.
|
||||||
|
// Padding type.
|
||||||
|
if (padding_type == kTfLitePaddingSame) {
|
||||||
|
SetPaddingType(NN_PAD_SAME);
|
||||||
|
} else if (padding_type == kTfLitePaddingValid) {
|
||||||
|
SetPaddingType(NN_PAD_VALID);
|
||||||
|
}
|
||||||
|
// Inputs
|
||||||
|
AddInput(graph_builder_->GetHexagonTensorId(inputs->data[0]));
|
||||||
|
AddInput(TensorID(const_weights_node->GetID(), 0));
|
||||||
|
AddInput(TensorID(data_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(data_max_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(weights_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(weights_max_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(stride_node->GetID(), 0));
|
||||||
|
AddInput(TensorID(bias_data_node->GetID(), 0));
|
||||||
|
AddInput(TensorID(bias_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(bias_max_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(output_min_const->GetID(), 0));
|
||||||
|
AddInput(TensorID(output_max_const->GetID(), 0));
|
||||||
|
// Outputs
|
||||||
|
node_output_ = AddOutput(sizeof(uint8_t), 4,
|
||||||
|
{output_batch_size, output_height_size,
|
||||||
|
output_width_size, output_depth_size});
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
AddOutput(sizeof(float), 4, {1, 1, 1, 1});
|
||||||
|
}
|
||||||
|
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
TfLiteStatus Conv2dOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) {
|
||||||
|
// Should be only 1 output.
|
||||||
|
graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
|
||||||
|
node_output_.second);
|
||||||
|
return kTfLiteOk;
|
||||||
|
}
|
||||||
|
|
||||||
|
Conv2dOpBuilder::~Conv2dOpBuilder() {}
|
||||||
|
|
||||||
|
OpBuilder* CreateConv2DBuilder(GraphBuilder* graph_builder, int op_type) {
|
||||||
|
return new Conv2dOpBuilder(graph_builder, op_type);
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,57 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_CONV_2D_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_CONV_2D_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class Conv2dOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit Conv2dOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~Conv2dOpBuilder();
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
std::vector<float> transposed_weights_;
|
||||||
|
std::vector<int> stride_shape_;
|
||||||
|
std::vector<int> weight_shape_;
|
||||||
|
float data_min_, data_max_, weights_min_, weights_max_, bias_min_, bias_max_,
|
||||||
|
output_min_, output_max_;
|
||||||
|
|
||||||
|
// Only used for dilated Depthwise Conv.
|
||||||
|
std::vector<int> dilation_factors_h_w_;
|
||||||
|
std::vector<int> space_to_batch_paddings_;
|
||||||
|
std::vector<int> batch_to_space_crops_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_CONV_2D_BUILDER_H_
|
@ -0,0 +1,83 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/l2_normalization_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
TfLiteStatus L2NormalizationOpBuilder::PopulateSubGraph(
    const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
    TfLiteContext* context) {
  // Shape used for all single-value (min/max) const nodes below.
  static int scalar_shape[] = {1, 1, 1, 1};

  // Input data tensor and its quantization range.
  const int input_tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[input_tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(input_tensor_id));
  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  auto* min_const_node = graph_builder_->AddConstNodeWithData(
      scalar_shape, reinterpret_cast<char*>(&input_min_), sizeof(input_min_));
  auto* max_const_node = graph_builder_->AddConstNodeWithData(
      scalar_shape, reinterpret_cast<char*>(&input_max_), sizeof(input_max_));
  AddInput(TensorID(min_const_node->GetID(), 0));
  AddInput(TensorID(max_const_node->GetID(), 0));

  // Hexagon outputs for this node: data plus its min/max.
  int out_batch, out_height, out_width, out_depth;
  GetDims(&out_batch, &out_height, &out_width, &out_depth,
          context->tensors[outputs->data[0]].dims);
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {out_batch, out_height, out_width, out_depth});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TfLiteStatus L2NormalizationOpBuilder::RegisterOutputs(
    const TfLiteIntArray* outputs, TfLiteContext* context) {
  // This op produces exactly one TFLite output; map it to the Hexagon
  // tensor recorded during PopulateSubGraph.
  const auto& hexagon_output = node_output_;
  graph_builder_->AddTensorWithID(outputs->data[0], hexagon_output.first,
                                  hexagon_output.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
L2NormalizationOpBuilder::~L2NormalizationOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory for L2-normalization builders; the caller takes ownership of the
// returned object.
OpBuilder* CreateL2NormalizationBuilder(GraphBuilder* graph_builder,
                                        int op_type) {
  return new L2NormalizationOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,48 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_L2_NORMALIZATION_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_L2_NORMALIZATION_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Builds a Hexagon node for the TFLite L2_NORMALIZATION op (mapped to
// OP_L2Normalize_8 by the graph builder).
class L2NormalizationOpBuilder : public OpBuilder {
 public:
  explicit L2NormalizationOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  // Adds the input tensor plus min/max const nodes, and the op's outputs.
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  // Registers the single TFLite output tensor with the graph builder.
  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

  ~L2NormalizationOpBuilder() override;

 private:
  // Hexagon tensor id of this node's data output.
  TensorID node_output_;
  // Quantization range of the input tensor.
  float input_min_, input_max_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_L2_NORMALIZATION_BUILDER_H_
|
@ -0,0 +1,211 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/matmul_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/optimized/optimized_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// The TFLite 'Fully-connected' quantized op corresponds to the following
|
||||||
|
// subgraph in Hexagon:
|
||||||
|
// Data (uint8), Weights (const, uint8) => MatMul => MatMul out (int32)
|
||||||
|
// Bias (const, int32) => Quantize => Bias (uint8)
|
||||||
|
// MatMul out (int32) => Quantize => MatMul out (uint8)
|
||||||
|
// MatMul out (uint8), Bias (uint8) => QuantizedAdd => Output (uint8)
|
||||||
|
// TODO(b/129276536): Add activation support.
|
||||||
|
TfLiteStatus MatMulOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                               const TfLiteIntArray* outputs,
                                               TfLiteContext* context) {
  // Shape for all single-value (min/max) const nodes below.
  static int quant_bound_shape[] = {1, 1, 1, 1};

  // Data tensor.
  int data_tensor_id = inputs->data[0];
  const auto& data_tensor = context->tensors[data_tensor_id];
  TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
      data_tensor, &data_min_, &data_max_, std::numeric_limits<uint8_t>::min(),
      std::numeric_limits<uint8_t>::max()));
  auto* data_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&data_min_),
      sizeof(data_min_));
  auto* data_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&data_max_),
      sizeof(data_max_));

  // Weights vector. Must be constant data, since it is transposed and
  // uploaded as a const node at delegate-preparation time.
  // TODO(srjoglekar): Abstract out.
  int weights_tensor_id = inputs->data[1];
  const auto& weights_tensor = context->tensors[weights_tensor_id];
  if (weights_tensor.allocation_type != kTfLiteMmapRo) {
    context->ReportError(
        context, "Weights tensor doesn't have correct allocation type: %s",
        weights_tensor.name);
    return kTfLiteError;
  }
  int batch_size, height_size, width_size, depth_size;
  // Hexagon lib expects the weight tensor in NHCW, TFLite uses NHWC.
  // Transpose NHWC -> NHCW
  GetDims(&batch_size, &height_size, &width_size, &depth_size,
          weights_tensor.dims);
  weights_shape_ = {batch_size, height_size, depth_size, width_size};
  RuntimeShape nhwc_shape({batch_size, height_size, width_size, depth_size});
  RuntimeShape nhcw_shape({batch_size, height_size, depth_size, width_size});
  std::vector<uint8_t> nhcw(NumElements(&weights_tensor));
  TransposeParams transpose_params;
  transpose_params.perm_count = 4;
  transpose_params.perm[0] = 0;
  transpose_params.perm[1] = 1;
  transpose_params.perm[2] = 3;
  transpose_params.perm[3] = 2;
  optimized_ops::Transpose<uint8_t>(transpose_params, nhwc_shape,
                                    weights_tensor.data.uint8, nhcw_shape,
                                    nhcw.data());
  auto* const_weights_node = graph_builder_->AddConstNodeWithData(
      weights_shape_.data(), reinterpret_cast<char*>(nhcw.data()),
      weights_tensor.bytes);
  graph_builder_->AddTensorWithID(weights_tensor_id,
                                  const_weights_node->GetID(), 0);
  // Propagate failures instead of ignoring the returned status
  // (consistent with the data-tensor call above).
  TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
      weights_tensor, &weights_min_, &weights_max_,
      std::numeric_limits<uint8_t>::min(),
      std::numeric_limits<uint8_t>::max()));
  auto* weights_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&weights_min_),
      sizeof(weights_min_));
  auto* weights_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&weights_max_),
      sizeof(weights_max_));

  // Data and weight tensors in required order.
  AddInput(graph_builder_->GetHexagonTensorId(data_tensor_id));
  AddInput(graph_builder_->GetHexagonTensorId(weights_tensor_id));
  AddInput(TensorID(data_min_const->GetID(), 0));
  AddInput(TensorID(data_max_const->GetID(), 0));
  AddInput(TensorID(weights_min_const->GetID(), 0));
  AddInput(TensorID(weights_max_const->GetID(), 0));

  // Outputs for the MatMul node, which are in int32 format.
  // Output shape should still be the same.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  const auto& matmul_out = AddOutput(sizeof(int32_t), 4,
                                     {output_batch_size, output_height_size,
                                      output_width_size, output_depth_size});
  const auto& matmul_out_min = AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  const auto& matmul_out_max = AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  // Quantize the MatMul output to quint8.
  auto* quantize_matmul_op = graph_builder_->AddNode();
  quantize_matmul_op->SetOpType(OP_QuantizeDownAndShrinkRange_32to8);
  quantize_matmul_op->AddInput(matmul_out);
  quantize_matmul_op->AddInput(matmul_out_min);
  quantize_matmul_op->AddInput(matmul_out_max);
  const auto& quantized_matmul_out =
      quantize_matmul_op->AddOutput(sizeof(uint8_t), 4,
                                    {output_batch_size, output_height_size,
                                     output_width_size, output_depth_size});
  const auto& quantized_matmul_out_min =
      quantize_matmul_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  const auto& quantized_matmul_out_max =
      quantize_matmul_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  // Bias tensor (int32), uploaded as a const node.
  int bias_tensor_id = inputs->data[2];
  const auto& bias_tensor = context->tensors[bias_tensor_id];
  auto* const_bias_node =
      graph_builder_->AddConstNodeWithData(bias_tensor_id, bias_tensor);
  graph_builder_->AddTensorWithID(bias_tensor_id, const_bias_node->GetID(), 0);
  TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
      bias_tensor, &bias_min_, &bias_max_,
      std::numeric_limits<int32_t>::min(),
      std::numeric_limits<int32_t>::max()));
  auto* bias_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&bias_min_),
      sizeof(bias_min_));
  auto* bias_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&bias_max_),
      sizeof(bias_max_));
  // Quantize bias
  auto* quantize_bias_op = graph_builder_->AddNode();
  quantize_bias_op->SetOpType(OP_QuantizeDownAndShrinkRange_32to8);
  quantize_bias_op->AddInput(
      graph_builder_->GetHexagonTensorId(bias_tensor_id));
  quantize_bias_op->AddInput(TensorID(bias_min_const->GetID(), 0));
  quantize_bias_op->AddInput(TensorID(bias_max_const->GetID(), 0));
  const auto& quantized_bias_out =
      quantize_bias_op->AddOutput(sizeof(uint8_t), 4,
                                  {output_batch_size, output_height_size,
                                   output_width_size, output_depth_size});
  const auto& quantized_bias_out_min =
      quantize_bias_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  const auto& quantized_bias_out_max =
      quantize_bias_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  // Output min/max.
  TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
      context->tensors[outputs->data[0]], &output_min_, &output_max_,
      std::numeric_limits<uint8_t>::min(),
      std::numeric_limits<uint8_t>::max()));

  auto* output_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&output_min_),
      sizeof(output_min_));
  auto* output_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&output_max_),
      sizeof(output_max_));

  // MatMul + Bias.
  auto* bias_add_op = graph_builder_->AddNode();
  bias_add_op->SetOpType(OP_QuantizedAdd_8p8to8);
  bias_add_op->AddInput(quantized_matmul_out);
  bias_add_op->AddInput(quantized_bias_out);
  bias_add_op->AddInput(quantized_matmul_out_min);
  bias_add_op->AddInput(quantized_matmul_out_max);
  bias_add_op->AddInput(quantized_bias_out_min);
  bias_add_op->AddInput(quantized_bias_out_max);
  bias_add_op->AddInput(TensorID(output_min_const->GetID(), 0));
  bias_add_op->AddInput(TensorID(output_max_const->GetID(), 0));
  node_output_ = bias_add_op->AddOutput(sizeof(uint8_t), 4,
                                        {output_batch_size, output_height_size,
                                         output_width_size,
                                         output_depth_size});
  bias_add_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  bias_add_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TfLiteStatus MatMulOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                              TfLiteContext* context) {
  // Fully-connected produces exactly one TFLite output; map it to the
  // Hexagon tensor recorded during PopulateSubGraph.
  const auto& hexagon_output = node_output_;
  graph_builder_->AddTensorWithID(outputs->data[0], hexagon_output.first,
                                  hexagon_output.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
MatMulOpBuilder::~MatMulOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory for fully-connected (MatMul) builders; the caller takes ownership
// of the returned object.
OpBuilder* CreateMatMulBuilder(GraphBuilder* graph_builder, int op_type) {
  return new MatMulOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,51 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_MATMUL_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_MATMUL_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Builds the Hexagon subgraph for a TFLite FULLY_CONNECTED op
// (MatMul + bias-add; see the comment above PopulateSubGraph in the .cc).
class MatMulOpBuilder : public OpBuilder {
 public:
  explicit MatMulOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  // Adds data/weights/bias inputs (weights transposed NHWC->NHCW and
  // uploaded as const nodes) and the quantize/add nodes.
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  // Registers the single TFLite output tensor with the graph builder.
  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

  ~MatMulOpBuilder() override;

 private:
  // Hexagon tensor id of the final (bias-added) output.
  TensorID node_output_;
  std::vector<int> weights_shape_, bias_shape_;
  std::vector<float> transposed_weights_;
  // Quantization ranges for the data/weights/bias/output tensors.
  float data_min_, data_max_, weights_min_, weights_max_, bias_min_, bias_max_,
      output_min_, output_max_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_MATMUL_BUILDER_H_
|
@ -0,0 +1,69 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/neg_op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
TfLiteStatus NegOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                            const TfLiteIntArray* outputs,
                                            TfLiteContext* context) {
  // Shape used for all single-value (min/max) const nodes below.
  static int scalar_shape[] = {1, 1, 1, 1};
  int tensor_id;

  // Input data tensor.
  tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  // Propagate failures instead of ignoring the returned status
  // (consistent with the other op builders, e.g. L2Normalization).
  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      scalar_shape, reinterpret_cast<char*>(&input_min_), sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      scalar_shape, reinterpret_cast<char*>(&input_max_), sizeof(input_max_));
  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));

  // Hexagon outputs for this node: data plus its min/max.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {output_batch_size, output_height_size,
                            output_width_size, output_depth_size});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TfLiteStatus NegOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                           TfLiteContext* context) {
  // Neg produces exactly one TFLite output; map it to the Hexagon tensor
  // recorded during PopulateSubGraph.
  const int output_tensor_id = outputs->data[0];
  graph_builder_->AddTensorWithID(output_tensor_id, node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Factory for Neg builders; the caller takes ownership of the returned
// object.
OpBuilder* CreateNegOpBuilder(GraphBuilder* graph_builder, int op_type) {
  return new NegOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,44 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_NEG_OP_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_NEG_OP_BUILDER_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Builds a Hexagon node for the TFLite NEG op (mapped to OP_QuantizedNeg_8
// by the graph builder).
class NegOpBuilder : public OpBuilder {
 public:
  explicit NegOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  // Adds the input tensor plus min/max const nodes, and the op's outputs.
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  // Registers the single TFLite output tensor with the graph builder.
  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

 private:
  // Hexagon tensor id of this node's data output.
  TensorID node_output_;
  // Quantization range of the input tensor.
  float input_min_, input_max_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_NEG_OP_BUILDER_H_
|
@ -0,0 +1,207 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
#include "tensorflow/lite/builtin_ops.h"
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_factory.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Maps a TFLite builtin op code to the matching Hexagon op builder.
// Returns nullptr (after reporting an error) for unsupported ops.
OpBuilder* GraphBuilder::CreateOpBuilderFromTfLiteOp(int op_type) {
  switch (op_type) {
    case kTfLiteBuiltinAdd:
      return CreateArithmeticBuilder(this, OP_QuantizedAdd_8p8to8);
    case kTfLiteBuiltinArgMax:
      return CreateArgMinMaxOpBuilder(this, OP_ArgMax_8toInt32);
    case kTfLiteBuiltinArgMin:
      return CreateArgMinMaxOpBuilder(this, OP_ArgMin_8);
    case kTfLiteBuiltinMul:
      return CreateArithmeticBuilder(this, OP_QuantizedMul_8x8to8);
    case kTfLiteBuiltinSub:
      return CreateArithmeticBuilder(this, OP_QuantizedSub_8p8to8);
    case kTfLiteBuiltinMean:
      return CreateReduceBuilder(this, OP_QuantizedMean_8);
    case kTfLiteBuiltinSum:
      return CreateReduceBuilder(this, OP_QuantizedSum_8to32);
    case kTfLiteBuiltinPad:
      return CreatePadBuilder(this, OP_QuantizedPad_8);
    case kTfLiteBuiltinFullyConnected:
      return CreateMatMulBuilder(this, OP_QuantizedMatMul_8x8to32);
    case kTfLiteBuiltinAveragePool2d:
      return CreatePool2DBuilder(this, OP_QuantizedAvgPool_8);
    case kTfLiteBuiltinMaxPool2d:
      return CreatePool2DBuilder(this, OP_QuantizedMaxPool_8);
    case kTfLiteBuiltinConcatenation:
      return CreateConcatBuilder(this, OP_QuantizedConcat_8);
    // Regular and depthwise convolutions share Conv2dOpBuilder; the
    // Hexagon op type distinguishes them.
    case kTfLiteBuiltinConv2d:
      return CreateConv2DBuilder(this, OP_Supernode_8x8p32to8);
    case kTfLiteBuiltinTransposeConv:
      return CreateTransposeConv2DBuilder(
          this, OP_QuantizedTransposeConv2d_8x8p32to8);
    case kTfLiteBuiltinDepthwiseConv2d:
      return CreateConv2DBuilder(this, OP_DepthwiseSupernode_8x8p32to8);
    case kTfLiteBuiltinReshape:
      return CreateReshapeBuilder(this, OP_Reshape);
    case kTfLiteBuiltinSoftmax:
      return CreateSoftmaxBuilder(this, OP_QuantizedSoftmax_8);
    case kTfLiteBuiltinResizeNearestNeighbor:
      return CreateResizeNearestNeighborBuilder(this,
                                                OP_ResizeNearestNeighbor_8);
    case kTfLiteBuiltinL2Normalization:
      return CreateL2NormalizationBuilder(this, OP_L2Normalize_8);
    case kTfLiteBuiltinRelu:
      return CreateActivationBuilder(this, OP_QuantizedRelu_8);
    case kTfLiteBuiltinRelu6:
      return CreateActivationBuilder(this, OP_QuantizedReluX_8);
    case kTfLiteBuiltinTanh:
      return CreateActivationBuilder(this, OP_QuantizedTanh_8);
    case kTfLiteBuiltinLogistic:
      return CreateActivationBuilder(this, OP_QuantizedSigmoid_8);
    case kTfLiteBuiltinSplit:
      return CreateSplitBuilder(this, OP_QuantizedSplit_8);
    case kTfLiteBuiltinResizeBilinear:
      return CreateResizeBilinearOpBuilder(this, OP_QuantizedResizeBilinear_8);
    case kTfLiteBuiltinNeg:
      return CreateNegOpBuilder(this, OP_QuantizedNeg_8);
    case kTfLiteBuiltinTranspose:
      return CreateTransposeBuilder(this, OP_Transpose_8);
    default:
      context_->ReportError(context_, "Op not supported: %d", op_type);
      return nullptr;
  }
}
|
||||||
|
|
||||||
|
// Adds an OP_Const node holding 'data' with the given 4-D 'shape'.
// Returns the new builder, or nullptr if the Hexagon call fails.
// Note: the node id is builders_.size() after the emplace, so ids are
// 1-based and unique within this graph.
OpBuilder* GraphBuilder::AddConstNodeWithData(const int shape[], char* data,
                                              int data_size) {
  builders_.emplace_back(new OpBuilder(this, OP_Const));
  builders_.back()->SetConstNode();
  builders_.back()->SetNodeId(builders_.size());
  int error = hexagon_nn_->hexagon_nn_append_const_node(
      graph_id_, builders_.size(), shape[0], shape[1], shape[2], shape[3],
      reinterpret_cast<const uint8_t*>(data), data_size);
  if (error != 0) {
    // static_cast replaces the original C-style '(int)' cast.
    context_->ReportError(context_,
                          "Error adding const node with shape id: %d",
                          static_cast<int>(builders_.size()));
    return nullptr;
  }
  return builders_.back().get();
}
|
||||||
|
|
||||||
|
// Adds an OP_Const node holding the contents of 'tensor' and registers the
// TFLite tensor id -> Hexagon node mapping. Returns the new builder, or
// nullptr if the Hexagon call fails.
OpBuilder* GraphBuilder::AddConstNodeWithData(int tensor_id,
                                              const TfLiteTensor& tensor) {
  builders_.emplace_back(new OpBuilder(this, OP_Const));
  const int node_id = builders_.size();
  builders_.back()->SetConstNode();
  builders_.back()->SetNodeId(node_id);
  int batch_size, height_size, width_size, depth_size;
  GetDims(&batch_size, &height_size, &width_size, &depth_size, tensor.dims);
  int error = hexagon_nn_->hexagon_nn_append_const_node(
      graph_id_, node_id, batch_size, height_size, width_size, depth_size,
      reinterpret_cast<const uint8_t*>(tensor.data.raw), tensor.bytes);
  // Treat any non-zero code as failure (was 'error > 0', which would have
  // ignored negative error codes; the other overload checks '!= 0').
  if (error != 0) {
    context_->ReportError(
        context_, "Failed to add const node for tensor with id: %d", tensor_id);
    return nullptr;
  }
  AddTensorWithID(tensor_id, node_id, 0);
  return builders_.back().get();
}
|
||||||
|
|
||||||
|
void delegates::hexagon::GraphBuilder::AddInputTensors(
|
||||||
|
const TfLiteIntArray* input_tensors, TfLiteContext* context) {
|
||||||
|
builders_.emplace_back(new OpBuilder(this, OP_INPUT));
|
||||||
|
builders_.back()->SetNodeId(builders_.size());
|
||||||
|
// We need to track num_inputs since not all input_tensors are actual input
|
||||||
|
// data. Some are constants.
|
||||||
|
int num_inputs = 0;
|
||||||
|
for (int i = 0; i < input_tensors->size; ++i) {
|
||||||
|
const int tensor_id = input_tensors->data[i];
|
||||||
|
const auto& tensor = context->tensors[tensor_id];
|
||||||
|
if (tensor.allocation_type != kTfLiteMmapRo) {
|
||||||
|
AddTensorWithID(tensor_id, builders_.size(), num_inputs);
|
||||||
|
builders_.back()->AddOutput(tensor.dims);
|
||||||
|
++num_inputs;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void delegates::hexagon::GraphBuilder::AddOutputTensors(
|
||||||
|
const TfLiteIntArray* output_tensors, TfLiteContext* context) {
|
||||||
|
builders_.emplace_back(new OpBuilder(this, OP_OUTPUT));
|
||||||
|
builders_.back()->SetNodeId(builders_.size());
|
||||||
|
for (int i = 0; i < output_tensors->size; ++i) {
|
||||||
|
const int tensor_id = output_tensors->data[i];
|
||||||
|
builders_.back()->AddInput(GetHexagonTensorId(tensor_id));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Appends a rank-4 float output to this node, with max sizes taken from
// the TFLite dims (padded with leading 1s up to rank 4 by GetDims).
// Returns the (node_id, output index) pair identifying the new output.
OpBuilder::TensorID OpBuilder::AddOutput(const TfLiteIntArray* dims) {
  op_node_.outputs.push_back(hexagon_nn_output());
  hexagon_nn_output& output = op_node_.outputs.back();
  output.elementsize = sizeof(float);
  output.rank = 4;
  // TODO(karimnosseir): What is a good to estimate the max size ?
  int batch_size, height_size, width_size, depth_size;
  GetDims(&batch_size, &height_size, &width_size, &depth_size, dims);
  output.max_sizes[0] = batch_size;
  output.max_sizes[1] = height_size;
  output.max_sizes[2] = width_size;
  output.max_sizes[3] = depth_size;
  return TensorID(GetID(), op_node_.outputs.size() - 1);
}
|
||||||
|
|
||||||
|
// Appends an output with explicit element size, rank, and max sizes.
// Returns the (node_id, output index) pair identifying the new output.
OpBuilder::TensorID OpBuilder::AddOutput(
    int elementsize, int rank, const std::vector<int>& max_sizes_vect) {
  op_node_.outputs.push_back(hexagon_nn_output());
  op_node_.outputs.back().elementsize = elementsize;
  op_node_.outputs.back().rank = rank;
  auto& max_sizes = op_node_.outputs.back().max_sizes;
  // NOTE(review): max_sizes is a fixed-size array inside hexagon_nn_output;
  // this assumes max_sizes_vect.size() never exceeds its capacity — confirm
  // against hexagon_nn.h. size_t loop index avoids the signed/unsigned
  // comparison in the original.
  for (size_t i = 0; i < max_sizes_vect.size(); ++i) {
    max_sizes[i] = max_sizes_vect[i];
  }
  return TensorID(GetID(), op_node_.outputs.size() - 1);
}
|
||||||
|
|
||||||
|
// Materializes the accumulated input ids into hexagon_nn_input entries and
// returns the finished node description. The returned pointer aliases this
// builder's internal state.
const OpNode* OpBuilder::Build() {
  for (const TensorID& input : input_ids_) {
    hexagon_nn_input hexagon_input = hexagon_nn_input();
    hexagon_input.src_id = input.first;
    hexagon_input.output_idx = input.second;
    op_node_.inputs.push_back(hexagon_input);
  }
  return &op_node_;
}
|
||||||
|
|
||||||
|
// Appends a fresh OP_Nop builder to the graph (caller sets the real op data
// afterwards). Ownership stays with builders_; the raw pointer is a borrow.
OpBuilder* GraphBuilder::AddNode() {
  builders_.emplace_back(new OpBuilder(this, OP_Nop));
  OpBuilder* node = builders_.back().get();
  node->SetNodeId(builders_.size());
  return node;
}
|
||||||
|
|
||||||
|
// Creates the per-op builder for a TFLite builtin op, registers it in the
// graph, and attaches the TFLite node's builtin data for later use.
// Ownership stays with builders_; the raw pointer is a borrow.
OpBuilder* GraphBuilder::AddNodeFromTfLiteOp(int op_type, TfLiteNode* node) {
  builders_.emplace_back(CreateOpBuilderFromTfLiteOp(op_type));
  OpBuilder* op = builders_.back().get();
  op->SetNodeId(builders_.size());
  op->SetBuiltinData(node->builtin_data);
  op->SetTfLiteNode(node);
  return op;
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,277 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_OP_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_OP_BUILDER_H_
|
||||||
|
|
||||||
|
#include <memory>
|
||||||
|
#include <string>
|
||||||
|
#include <utility>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "hexagon/hexagon_nn_ops.h"
|
||||||
|
#include "tensorflow/lite/builtin_ops.h"
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_implementation.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
struct OpNode {
|
||||||
|
std::vector<hexagon_nn_input> inputs;
|
||||||
|
std::vector<hexagon_nn_output> outputs;
|
||||||
|
// Value from the Enum of Ops in hexagon_nn_ops
|
||||||
|
int op_type;
|
||||||
|
hexagon_nn_padding_type padding_type = NN_PAD_NA;
|
||||||
|
// Id of node in the Hexagon graph.
|
||||||
|
int node_id = -1;
|
||||||
|
};
|
||||||
|
|
||||||
|
class GraphBuilder;
|
||||||
|
|
||||||
|
// Base class for a single Hexagon graph node under construction. Concrete
// per-op subclasses override PopulateSubGraph()/RegisterOutputs(); the base
// collects inputs/outputs and produces the final OpNode via Build().
class OpBuilder {
 public:
  // 'hexagon_op_type' is a value from the hexagon_nn ops enum.
  OpBuilder(GraphBuilder* graph_builder, int hexagon_op_type)
      : graph_builder_(graph_builder) {
    op_node_.op_type = hexagon_op_type;
  }
  // A tensor is identified in the graph using a pair of IDs
  // (Node ID, output Tensor ID)
  // Node producing this tensor, and the index of the tensor in this
  // node output list.
  using TensorID = std::pair<int, int>;

  virtual ~OpBuilder() {}

  // TODO(karimnosseir): Do we need to have builder pattern, or they are few not
  // worth it ?
  // Overwrites the Hexagon op type set at construction.
  void SetOpType(int op_type) { op_node_.op_type = op_type; }

  // Sets this node's id inside the Hexagon graph.
  void SetNodeId(int node_id) { op_node_.node_id = node_id; }

  // Marks this node as a constant-data node.
  void SetConstNode() { op_node_.op_type = OP_Const; }

  void SetPaddingType(hexagon_nn_padding_type padding_type) {
    op_node_.padding_type = padding_type;
  }

  // Stores the TFLite builtin params pointer (not owned).
  void SetBuiltinData(void* builtin_data) { builtin_data_ = builtin_data; }

  bool IsConstNode() const { return op_node_.op_type == OP_Const; }

  void print() {}

  // Finalizes and returns the node description; the result aliases this
  // builder's internal state.
  const OpNode* Build();

  // Records one input tensor reference (producer node id, output index).
  void AddInput(const TensorID& tensor_id) { input_ids_.push_back(tensor_id); }

  // Adds a rank-4 float output sized from the TFLite dims.
  TensorID AddOutput(const TfLiteIntArray* dims);

  // Adds an output with explicit element size, rank, and max sizes.
  TensorID AddOutput(int elementsize, int rank,
                     const std::vector<int>& max_sizes);

  int GetID() const { return op_node_.node_id; }

  int GetOpType() const { return op_node_.op_type; }

  void SetTfLiteNode(const TfLiteNode* node) { tflite_node_ = node; }

  // Subclasses translate the TFLite op into Hexagon inputs/outputs here.
  // The base implementation is a no-op that succeeds.
  virtual TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                        const TfLiteIntArray* outputs,
                                        TfLiteContext* context) {
    return kTfLiteOk;
  }

  // Subclasses register their Hexagon outputs with the GraphBuilder here.
  virtual TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                                       TfLiteContext* context) {
    return kTfLiteOk;
  }

 protected:
  // Helper method to fetch dimensions.
  // Expands 'dims' into exactly four sizes, padding missing leading
  // dimensions with 1 (e.g. a 2-D tensor becomes 1 x 1 x d0 x d1).
  // TODO(karimnosseir): Move to a shared place.
  void GetDims(int* batch_size, int* height_size, int* width_size,
               int* depth_size, const TfLiteIntArray* dims) {
    int* dim[] = {batch_size, height_size, width_size, depth_size};
    for (int i = 0; i < 4; ++i) *(dim[i]) = 1;
    for (int i = 4 - dims->size; i < 4; ++i) {
      *dim[i] = dims->data[i - (4 - dims->size)];
    }
  }

  // Computes the real-valued range [min, max] represented by a uint8/int8
  // affine-quantized tensor, i.e. scale * (q - zero_point) at the type's
  // extreme quantized values. Fails (kTfLiteError) for tensors that are not
  // affine-quantized or use per-channel (quantized_dimension != 0) params.
  template <typename T>
  TfLiteStatus ComputeMinAndMaxQuantValues(const TfLiteTensor& tensor,
                                           float* min, float* max, T min_value,
                                           T max_value) {
    *min = 0;
    *max = 0;
    const TfLiteQuantization& quant = tensor.quantization;
    if (quant.type != TfLiteQuantizationType::kTfLiteAffineQuantization) {
      printf("Tensor not quantized: %s\n", tensor.name);
      return kTfLiteError;
    }
    const TfLiteAffineQuantization* params =
        static_cast<const TfLiteAffineQuantization*>(quant.params);
    if (params->quantized_dimension != 0) {
      printf("Quantized dimensions not 0 for tensor: %s\n", tensor.name);
      return kTfLiteError;
    }
    float scale = params->scale->data[0];
    float zero_point = static_cast<float>(params->zero_point->data[0]);
    *min = scale * (static_cast<float>(min_value) - zero_point);
    *max = scale * (static_cast<float>(max_value) - zero_point);

    return kTfLiteOk;
  }

  // Node description accumulated by this builder.
  OpNode op_node_;
  // inputs to the current op. Each pair identifies a single output from
  // another node (node_id, output_id).
  std::vector<TensorID> input_ids_;
  // Pointer to the graph builder.
  GraphBuilder* graph_builder_ = nullptr;
  // Data needed by this node.
  void* builtin_data_ = nullptr;
  // TODO(karimnosseir): Currently we only use it for getting output
  // size. Can we avoid passing it ?
  const TfLiteNode* tflite_node_ = nullptr;
};
|
||||||
|
|
||||||
|
// Builds a Hexagon NN graph out of per-op OpBuilders and tracks the mapping
// from TFLite tensor indices to Hexagon (node_id, output_idx) pairs.
// Node ids are 1-based positions in builders_; id 0 is reserved.
class GraphBuilder {
 public:
  // 'hexagon_nn' and 'context' are borrowed, not owned; 'graph_id' is the
  // id of an already-created Hexagon graph.
  GraphBuilder(const HexagonNN* hexagon_nn, TfLiteContext* context,
               int graph_id)
      : hexagon_nn_(hexagon_nn), context_(context), graph_id_(graph_id) {}

  // Returns per OP builder. 'op_type' is the TfLite builtinOperator.
  OpBuilder* AddNodeFromTfLiteOp(int op_type, TfLiteNode* node);

  // Add node to the graph. The caller responsible for setting correct
  // data in the Op.
  OpBuilder* AddNode();

  // Add const node that provides the data held by 'tensor'.
  OpBuilder* AddConstNodeWithData(int tensor_id, const TfLiteTensor& tensor);

  // Same as above but takes shape of the tensor that will holds the data.
  OpBuilder* AddConstNodeWithData(const int shape[], char* data, int data_size);

  OpBuilder* CreateOpBuilderFromTfLiteOp(int op_type);

  // Construct Input node with 'input_tensors' as output.
  void AddInputTensors(const TfLiteIntArray* input_tensors,
                       TfLiteContext* context);

  // Construct Output node with 'output_tensors' as input.
  void AddOutputTensors(const TfLiteIntArray* output_tensors,
                        TfLiteContext* context);

  // Returns tensor id inside Hexagon graph.
  // Returns (-1, -1) if the tensor was never registered.
  OpBuilder::TensorID GetHexagonTensorId(int tflite_tensor_index) {
    if (!HasTensor(tflite_tensor_index)) {
      printf("Could not find tensor id: %d\n", tflite_tensor_index);
      // Return invalid ID.
      return OpBuilder::TensorID(-1, -1);
    }
    return tensors_[tflite_tensor_index];
  }

  // Return true if this tensor was added before to the graph.
  bool HasTensor(int tflite_tensor_index) {
    if (tensors_.size() <= tflite_tensor_index) {
      return false;
    }
    // the first field is node ID and id = 0 is reserved
    // so anything > 0 is correctly initialized.
    return tensors_[tflite_tensor_index].first != 0;
  }

  void AddDebugNode() {}

  // Appends every non-const node to the Hexagon graph via
  // hexagon_nn_append_node. Errors are logged but not propagated.
  void Build() {
    for (int i = 0; i < builders_.size(); ++i) {
      if (builders_[i]->IsConstNode()) {
        continue;
      }
      const OpNode* op_node = builders_[i]->Build();
      int error = hexagon_nn_->hexagon_nn_append_node(
          graph_id_, op_node->node_id, op_node->op_type, op_node->padding_type,
          op_node->inputs.data(), op_node->inputs.size(),
          op_node->outputs.data(), op_node->outputs.size());
      if (error != 0) {
        printf("Error adding node: id:%d, op_type:%d\n", op_node->node_id,
               op_node->op_type);
      }
    }
  }

  // Dumps a textual rendering of the Hexagon graph to stdout (debug only).
  // NOTE(review): output longer than the 10000-byte buffer is truncated by
  // hexagon_nn_snpprint -- presumably acceptable for debugging; confirm.
  void print() {
    printf("------------------------------\n");
    std::vector<unsigned char> buf(10000);
    hexagon_nn_->hexagon_nn_snpprint(graph_id_, buf.data(), buf.size());
    printf("%s", buf.data());
    printf("------------------------------\n");
    fflush(stdout);
  }

  // Add new tensor mapping to the tensor list.
  // Returns false (and leaves the map unchanged) if the tensor is already
  // registered; first registration wins.
  bool AddTensorWithID(int tflite_tensor_id, int hexagon_node_id,
                       int hexagon_node_output_id) {
    if (HasTensor(tflite_tensor_id)) {
      return false;
    }
    if (tensors_.size() <= tflite_tensor_id) {
      tensors_.resize(tflite_tensor_id + 1);
    }
    tensors_[tflite_tensor_id] =
        OpBuilder::TensorID(hexagon_node_id, hexagon_node_output_id);
    return true;
  }

  // Returns the Hexagon op type of the node with the given (1-based) id,
  // or -1 if the id is out of range.
  // NOTE(review): node_id <= 0 is not rejected here and would index
  // builders_ out of bounds -- callers must pass valid ids.
  int GetOpTypeId(int node_id) {
    if (node_id > builders_.size()) {
      return -1;
    }
    return builders_[node_id - 1]->GetOpType();
  }

 private:
  // Helper method to fetch dimensions.
  // Expands 'dims' into exactly four sizes, padding missing leading
  // dimensions with 1 (duplicated from OpBuilder::GetDims).
  // TODO(karimnosseir): Move this method to shared place.
  void GetDims(int* batch_size, int* height_size, int* width_size,
               int* depth_size, const TfLiteIntArray* dims) {
    int* dim[] = {batch_size, height_size, width_size, depth_size};
    for (int i = 0; i < 4; ++i) *(dim[i]) = 1;
    for (int i = 4 - dims->size; i < 4; ++i) {
      *dim[i] = dims->data[i - (4 - dims->size)];
    }
  }

  // Borrowed Hexagon NN API table; not owned.
  const HexagonNN* hexagon_nn_ = nullptr;
  // Borrowed TFLite context; not owned.
  TfLiteContext* context_ = nullptr;
  int graph_id_ = -1;
  // Owns every OpBuilder; index i holds the node with id i + 1.
  std::vector<std::unique_ptr<OpBuilder>> builders_;
  // Index in the vector is the tflite_tensor_index, the value
  // is the ID in the hexgon graph.
  std::vector<OpBuilder::TensorID> tensors_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_OP_BUILDER_H_
|
@ -0,0 +1,51 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_OP_FACTORY_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_OP_FACTORY_H_
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
class GraphBuilder;
|
||||||
|
class OpBuilder;
|
||||||
|
|
||||||
|
// Factory functions, one per supported op category. Each returns a newly
// allocated OpBuilder subclass bound to 'graph_builder'; 'op_type' is the
// Hexagon op enum value forwarded to the OpBuilder constructor (see the
// Create*Builder definitions, e.g. CreatePadBuilder). The returned pointer
// is typically stored in GraphBuilder's owning builders_ list.
OpBuilder* CreateArgMinMaxOpBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateActivationBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateArithmeticBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateMatMulBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateConcatBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateConv2DBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateTransposeConv2DBuilder(GraphBuilder* graph_builder,
                                        int op_type);
OpBuilder* CreatePool2DBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateReshapeBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateSoftmaxBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateReduceBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreatePadBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateResizeNearestNeighborBuilder(GraphBuilder* graph_builder,
                                              int op_type);
OpBuilder* CreateL2NormalizationBuilder(GraphBuilder* graph_builder,
                                        int op_type);
OpBuilder* CreateSplitBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateResizeBilinearOpBuilder(GraphBuilder* graph_builder,
                                         int op_type);
OpBuilder* CreateNegOpBuilder(GraphBuilder* graph_builder, int op_type);
OpBuilder* CreateTransposeBuilder(GraphBuilder* graph_builder, int op_type);
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_OP_FACTORY_H_
|
@ -0,0 +1,97 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/pad_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Translates a quantized TFLite Pad op into Hexagon node inputs/outputs.
// Input order built here: data tensor, data min, data max, paddings.
// Output order: padded uint8 data, then its float min and max.
TfLiteStatus PadOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                            const TfLiteIntArray* outputs,
                                            TfLiteContext* context) {
  // Shape for the scalar min/max const nodes (1x1x1x1).
  static int quant_bound_shape[] = {1, 1, 1, 1};
  int tensor_id;

  // Input data tensor.
  tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  // Derive the real-valued [min, max] range of the uint8 input; stored in
  // members so the const nodes below can point at stable storage.
  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_min_),
      sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_max_),
      sizeof(input_max_));

  // Min/max values for input tensor.
  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));

  // Padding tensor.
  tensor_id = inputs->data[1];
  const auto& padding_tensor = context->tensors[tensor_id];
  if (padding_tensor.allocation_type == kTfLiteMmapRo) {
    // If the padding input is a constant, bake it into the Hexagon graph as a
    // Const node.
    auto* const_padding_node =
        graph_builder_->AddConstNodeWithData(tensor_id, padding_tensor);
    AddInput(TensorID(const_padding_node->GetID(), 0));
  } else {
    AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  }

  // Hexagon outputs for this node.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  // Main output: uint8 data with the padded shape; kept in node_output_ so
  // RegisterOutputs() can map it back to the TFLite tensor.
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {output_batch_size, output_height_size,
                            output_width_size, output_depth_size});
  // Scalar float min/max outputs accompanying the quantized data.
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Maps the op's single TFLite output tensor to the Hexagon tensor produced
// in PopulateSubGraph().
TfLiteStatus PadOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                           TfLiteContext* context) {
  // Should be only 1 output.
  const int output_tensor_id = outputs->data[0];
  graph_builder_->AddTensorWithID(output_tensor_id, node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Nothing to release; defaulted (modernize-use-equals-default) instead of
// an empty body.
PadOpBuilder::~PadOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory for the Pad op builder; 'op_type' is the Hexagon op enum value
// forwarded to the OpBuilder constructor. Returns a newly allocated object;
// ownership passes to the caller (typically GraphBuilder's builders_ list).
OpBuilder* CreatePadBuilder(GraphBuilder* graph_builder, int op_type) {
  return new PadOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,48 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_PAD_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_PAD_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class PadOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit PadOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~PadOpBuilder() override;
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
float input_min_, input_max_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_PAD_BUILDER_H_
|
@ -0,0 +1,136 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/pool_2d_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Translates a quantized TFLite Pool2D op (max or average) into Hexagon
// node inputs/outputs. Input order built here: data tensor, data min, data
// max, filter shape, stride shape. For average pooling, a Requantize node
// is appended to map Hexagon's output range onto the range TFLite expects.
// C-style casts replaced with reinterpret_cast for consistency with
// pad_builder.cc (behavior unchanged).
TfLiteStatus Pool2dOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                               const TfLiteIntArray* outputs,
                                               TfLiteContext* context) {
  // Shape for the scalar min/max const nodes (1x1x1x1).
  static std::vector<int> quant_bound_shape = {1, 1, 1, 1};

  // Input data tensor.
  int tensor_id = inputs->data[0];
  const auto& data_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  // Real-valued range of the uint8 input; stored in members so the const
  // nodes below point at stable storage.
  TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
      data_tensor, &data_min_, &data_max_, std::numeric_limits<uint8_t>::min(),
      std::numeric_limits<uint8_t>::max()));
  auto* data_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), reinterpret_cast<char*>(&data_min_),
      sizeof(data_min_));
  auto* data_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), reinterpret_cast<char*>(&data_max_),
      sizeof(data_max_));
  AddInput(TensorID(data_min_const->GetID(), 0));
  AddInput(TensorID(data_max_const->GetID(), 0));

  const TfLitePoolParams* pool_params =
      reinterpret_cast<const TfLitePoolParams*>(builtin_data_);

  // Padding type.
  if (pool_params->padding == kTfLitePaddingSame) {
    SetPaddingType(NN_PAD_SAME);
  } else if (pool_params->padding == kTfLitePaddingValid) {
    SetPaddingType(NN_PAD_VALID);
  }

  // Pooling window (filter) width/height as inputs. Only the const node's
  // shape matters to Hexagon, so a dummy payload is used for the data.
  static int dummy = 0;
  filter_shape_ = {1, pool_params->filter_height, pool_params->filter_width, 1};
  auto* filter_node = graph_builder_->AddConstNodeWithData(
      filter_shape_.data(), reinterpret_cast<char*>(&dummy), sizeof(dummy));
  AddInput(TensorID(filter_node->GetID(), 0));
  // Stride width/height as inputs.
  stride_shape_ = {1, pool_params->stride_height, pool_params->stride_width, 1};
  auto* stride_node = graph_builder_->AddConstNodeWithData(
      stride_shape_.data(), reinterpret_cast<char*>(&dummy), sizeof(dummy));
  AddInput(TensorID(stride_node->GetID(), 0));

  // Hexagon outputs for this node.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);

  if (op_node_.op_type == OP_QuantizedMaxPool_8) {
    // Max pooling: the output range equals the input range, so the raw
    // Hexagon output is the final result.
    node_output_ = AddOutput(sizeof(uint8_t), 4,
                             {output_batch_size, output_height_size,
                              output_width_size, output_depth_size});
    AddOutput(sizeof(float), 4, {1, 1, 1, 1});
    AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  } else {
    // Hexagon's AvgPool output has different min/max bounds than what TFLite
    // expects. Therefore, we add a Requantize op to correct the ranges.
    TensorID pool_out = AddOutput(sizeof(uint8_t), 4,
                                  {output_batch_size, output_height_size,
                                   output_width_size, output_depth_size});
    const auto& pool_out_min = AddOutput(sizeof(float), 4, {1, 1, 1, 1});
    const auto& pool_out_max = AddOutput(sizeof(float), 4, {1, 1, 1, 1});

    // Output min/max for requantization.
    TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
        context->tensors[outputs->data[0]], &output_min_, &output_max_,
        std::numeric_limits<uint8_t>::min(),
        std::numeric_limits<uint8_t>::max()));
    auto* output_min_const = graph_builder_->AddConstNodeWithData(
        quant_bound_shape.data(), reinterpret_cast<char*>(&output_min_),
        sizeof(output_min_));
    auto* output_max_const = graph_builder_->AddConstNodeWithData(
        quant_bound_shape.data(), reinterpret_cast<char*>(&output_max_),
        sizeof(output_max_));

    auto* requantize_op = graph_builder_->AddNode();
    requantize_op->SetOpType(OP_Requantize_8to8);
    requantize_op->AddInput(pool_out);
    requantize_op->AddInput(pool_out_min);
    requantize_op->AddInput(pool_out_max);
    requantize_op->AddInput(TensorID(output_min_const->GetID(), 0));
    requantize_op->AddInput(TensorID(output_max_const->GetID(), 0));
    node_output_ =
        requantize_op->AddOutput(sizeof(uint8_t), 4,
                                 {output_batch_size, output_height_size,
                                  output_width_size, output_depth_size});
    requantize_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
    requantize_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  }

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Maps the op's single TFLite output tensor to the Hexagon tensor produced
// in PopulateSubGraph().
TfLiteStatus Pool2dOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                              TfLiteContext* context) {
  // Should be only 1 output.
  const int output_tensor_id = outputs->data[0];
  graph_builder_->AddTensorWithID(output_tensor_id, node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Nothing to release; defaulted (modernize-use-equals-default) instead of
// an empty body.
Pool2dOpBuilder::~Pool2dOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory for the Pool2D op builder; 'op_type' is the Hexagon op enum value
// forwarded to the OpBuilder constructor. Returns a newly allocated object;
// ownership passes to the caller (typically GraphBuilder's builders_ list).
OpBuilder* CreatePool2DBuilder(GraphBuilder* graph_builder, int op_type) {
  return new Pool2dOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,50 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_POOL_2D_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_POOL_2D_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class Pool2dOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit Pool2dOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~Pool2dOpBuilder();
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
std::vector<int> stride_shape_;
|
||||||
|
std::vector<int> filter_shape_;
|
||||||
|
float data_min_, data_max_, output_min_, output_max_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_POOL_2D_BUILDER_H_
|
@ -0,0 +1,119 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/reduce_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
TfLiteStatus ReduceOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                               const TfLiteIntArray* outputs,
                                               TfLiteContext* context) {
  // Shape used for every scalar (min/max) const node below.
  static int quant_bound_shape[] = {1, 1, 1, 1};
  int tensor_id;

  // Input data tensor.
  tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  // Fix: propagate quantization-range failures instead of silently ignoring
  // the return value (matches the sibling builders, e.g. resize ops).
  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_min_),
      sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_max_),
      sizeof(input_max_));

  // Min/max values for input tensor.
  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));

  // Axes tensor must be compile-time constant for Hexagon.
  tensor_id = inputs->data[1];
  const auto& axes_tensor = context->tensors[tensor_id];
  if (axes_tensor.allocation_type == kTfLiteMmapRo) {
    // If the axes input is a constant, bake it into the Hexagon graph as a
    // Const node.
    auto* const_axes_node =
        graph_builder_->AddConstNodeWithData(tensor_id, axes_tensor);
    AddInput(TensorID(const_axes_node->GetID(), 0));
  } else {
    context->ReportError(context, "Reduction op doesn't have constant axis");
    return kTfLiteError;
  }

  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);

  // Hexagon's sum-reduction outputs int32, so we shrink it down to UInt8
  // with an extra QuantizeDownAndShrinkRange node.
  if (op_node_.op_type == OP_QuantizedSum_8to32) {
    const auto& reduce_out = AddOutput(sizeof(int32_t), 4,
                                       {output_batch_size, output_height_size,
                                        output_width_size, output_depth_size});
    const auto& reduce_out_min = AddOutput(sizeof(float), 4, {1, 1, 1, 1});
    const auto& reduce_out_max = AddOutput(sizeof(float), 4, {1, 1, 1, 1});

    auto* quantize_output_op = graph_builder_->AddNode();
    quantize_output_op->SetOpType(OP_QuantizeDownAndShrinkRange_32to8);
    quantize_output_op->AddInput(reduce_out);
    quantize_output_op->AddInput(reduce_out_min);
    quantize_output_op->AddInput(reduce_out_max);
    node_output_ =
        quantize_output_op->AddOutput(sizeof(uint8_t), 4,
                                      {output_batch_size, output_height_size,
                                       output_width_size, output_depth_size});
    quantize_output_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
    quantize_output_op->AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  } else {
    node_output_ = AddOutput(sizeof(uint8_t), 4,
                             {output_batch_size, output_height_size,
                              output_width_size, output_depth_size});
    AddOutput(sizeof(float), 4, {1, 1, 1, 1});
    AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  }

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TfLiteStatus ReduceOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                              TfLiteContext* context) {
  // A reduction op has exactly one TFLite output; alias it to the Hexagon
  // node output recorded by PopulateSubGraph.
  const int out_id = outputs->data[0];
  graph_builder_->AddTensorWithID(out_id, node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Out-of-line default destructor keeps the vtable anchored in this TU.
ReduceOpBuilder::~ReduceOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory hook used by the op-builder registry; the caller takes ownership.
OpBuilder* CreateReduceBuilder(GraphBuilder* graph_builder, int op_type) {
  auto* reduce_builder = new ReduceOpBuilder(graph_builder, op_type);
  return reduce_builder;
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,48 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_REDUCE_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_REDUCE_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Builds Hexagon NN nodes for TFLite quantized reduction ops. Requires the
// axes input to be a compile-time constant tensor.
class ReduceOpBuilder : public OpBuilder {
 public:
  explicit ReduceOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

  ~ReduceOpBuilder() override;

 private:
  // Hexagon tensor carrying the quantized reduction result.
  TensorID node_output_;
  // Quantization bounds computed from the TFLite tensors.
  // NOTE(review): output_min_/output_max_ are not referenced in the visible
  // implementation — presumably reserved for future use; confirm before use.
  float input_min_, input_max_, output_min_, output_max_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_REDUCE_BUILDER_H_
|
@ -0,0 +1,122 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/reshape_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
namespace {
|
||||||
|
|
||||||
|
void PopulateOutputShapeFromTensor(const TfLiteTensor* shape_tensor,
|
||||||
|
std::vector<int>* output_shape) {
|
||||||
|
for (int i = 0; i < shape_tensor->dims->data[0]; ++i) {
|
||||||
|
output_shape->push_back(shape_tensor->data.i32[i]);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Reads the target shape from the `TfLiteReshapeParams` builtin data.
// Used when no usable shape tensor is available (see PopulateSubGraph).
void PopulateShapeFromParam(const TfLiteReshapeParams* params,
                            std::vector<int>* output_shape) {
  int num_dimensions = params->num_dimensions;
  if (num_dimensions == 1 && params->shape[0] == 0) {
    // Legacy tflite models use a shape parameter of [0] to indicate scalars,
    // so adjust accordingly. TODO(b/111614235): Allow zero-sized buffers during
    // toco conversion.
    num_dimensions = 0;
  }
  for (int i = 0; i < num_dimensions; ++i) {
    output_shape->push_back(params->shape[i]);
  }
}
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
TfLiteStatus ReshapeOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                                const TfLiteIntArray* outputs,
                                                TfLiteContext* context) {
  // Input data tensor.
  AddInput(graph_builder_->GetHexagonTensorId(inputs->data[0]));

  // Output shape: either a (possibly dynamic) shape tensor, or the shape
  // baked into TfLiteReshapeParams.
  // Fix: initialize to nullptr — when inputs->size != 2 the pointer was
  // previously read uninitialized in the `if (shape_tensor)` branch below.
  TfLiteTensor* shape_tensor = nullptr;
  bool output_shape_is_dynamic = false;
  if (inputs->size == 2) {
    shape_tensor = &context->tensors[inputs->data[1]];
    bool is_shape_tensor =
        (shape_tensor->dims->size == 1 && shape_tensor->type == kTfLiteInt32);
    // If tensor shape is dynamic, pass it along directly.
    if (shape_tensor->allocation_type != kTfLiteMmapRo && is_shape_tensor) {
      output_shape_is_dynamic = true;
      AddInput(graph_builder_->GetHexagonTensorId(inputs->data[1]));
    }
    if (!is_shape_tensor) {
      shape_tensor = nullptr;
    }
  }
  if (!output_shape_is_dynamic) {
    if (shape_tensor) {
      PopulateOutputShapeFromTensor(shape_tensor, &output_shape_);
    } else {
      const TfLiteReshapeParams* reshape_params =
          reinterpret_cast<const TfLiteReshapeParams*>(builtin_data_);
      PopulateShapeFromParam(reshape_params, &output_shape_);
    }
    // Bake the static output shape into the Hexagon graph as a const node.
    int num_elements_in_shape = static_cast<int>(output_shape_.size());
    output_shape_shape_ = {1, 1, 1, num_elements_in_shape};
    auto* shape_node = graph_builder_->AddConstNodeWithData(
        output_shape_shape_.data(),
        reinterpret_cast<char*>(output_shape_.data()),
        sizeof(int) * num_elements_in_shape);
    AddInput(TensorID(shape_node->GetID(), 0));
  }

  // Hexagon output for this node.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {output_batch_size, output_height_size,
                            output_width_size, output_depth_size});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TfLiteStatus ReshapeOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                               TfLiteContext* context) {
  // Reshape has a single TFLite output; map it to the Hexagon node output.
  const int out_id = outputs->data[0];
  graph_builder_->AddTensorWithID(out_id, node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Out-of-line default destructor keeps the vtable anchored in this TU.
ReshapeOpBuilder::~ReshapeOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory hook used by the op-builder registry; the caller takes ownership.
OpBuilder* CreateReshapeBuilder(GraphBuilder* graph_builder, int op_type) {
  auto* reshape_builder = new ReshapeOpBuilder(graph_builder, op_type);
  return reshape_builder;
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,49 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESHAPE_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESHAPE_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Builds a Hexagon NN reshape node. The target shape may come from a second
// (int32, 1-D) shape tensor — static or dynamic — or from the builtin
// TfLiteReshapeParams.
class ReshapeOpBuilder : public OpBuilder {
 public:
  explicit ReshapeOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

  ~ReshapeOpBuilder() override;

 private:
  // Hexagon tensor holding the reshaped output.
  TensorID node_output_;
  // Static output shape values and the 4-D shape of the const node that
  // carries them; kept as members so the data outlives graph construction.
  std::vector<int> output_shape_;
  std::vector<int> output_shape_shape_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESHAPE_BUILDER_H_
|
@ -0,0 +1,106 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/resize_bilinear_builder.h"

#include <stdint.h>

#include <limits>

#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Builds the Hexagon resize-bilinear node. Hexagon input order is:
// data, new-dims const, input min/max consts, align_corners const.
TfLiteStatus ResizeBilinearOpBuilder::PopulateSubGraph(
    const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
    TfLiteContext* context) {
  // Shape used for every scalar const node below.
  static int quant_bound_shape[] = {1, 1, 1, 1};

  if (inputs->size != 2) {
    context->ReportError(context, "Expecting 2 inputs %d != 2\n", inputs->size);
    return kTfLiteError;
  }

  // Input data tensor.
  int input_tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[input_tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(input_tensor_id));

  // The target size must be a compile-time constant for Hexagon.
  const auto& size_tensor = context->tensors[inputs->data[1]];
  if (!IsConstantTensor(&size_tensor)) {
    context->ReportError(context,
                         "Hexagon Delegate doesn't support dynamic shape.\n");
    return kTfLiteError;
  }
  // dims tensor: {new_height, new_width} baked in as a const node.
  const int dims_shape[] = {1, 1, 1, 2};
  std::vector<int> dims = {size_tensor.data.i32[0], size_tensor.data.i32[1]};
  auto* dims_const = graph_builder_->AddConstNodeWithData(
      dims_shape, reinterpret_cast<char*>(dims.data()),
      sizeof(int) * dims.size());
  AddInput(TensorID(dims_const->GetID(), 0));

  // Input quantization bounds, each a scalar const node.
  TF_LITE_ENSURE_OK(context, ComputeMinAndMaxQuantValues(
                                 input_tensor, &input_min_, &input_max_,
                                 std::numeric_limits<uint8_t>::min(),
                                 std::numeric_limits<uint8_t>::max()));
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_min_),
      sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_max_),
      sizeof(input_max_));

  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));
  // Align-corners flag, converted to a 4-byte int scalar const node.
  const TfLiteResizeBilinearParams* params =
      reinterpret_cast<const TfLiteResizeBilinearParams*>(builtin_data_);
  int align_corners = params->align_corners ? 1 : 0;
  auto* align_corners_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&align_corners),
      sizeof(align_corners));
  AddInput(TensorID(align_corners_const->GetID(), 0));

  // Outputs: quantized data, then its min/max scalars.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  auto resize_bilinear_out = AddOutput(sizeof(uint8_t), 4,
                                       {output_batch_size, output_height_size,
                                        output_width_size, output_depth_size});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  node_output_ = resize_bilinear_out;

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TfLiteStatus ResizeBilinearOpBuilder::RegisterOutputs(
    const TfLiteIntArray* outputs, TfLiteContext* context) {
  // Resize-bilinear has a single TFLite output; map it to the Hexagon
  // node output recorded in PopulateSubGraph.
  const int out_id = outputs->data[0];
  graph_builder_->AddTensorWithID(out_id, node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Out-of-line default destructor keeps the vtable anchored in this TU.
ResizeBilinearOpBuilder::~ResizeBilinearOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory hook used by the op-builder registry; the caller takes ownership.
OpBuilder* CreateResizeBilinearOpBuilder(GraphBuilder* graph_builder,
                                         int op_type) {
  auto* resize_builder = new ResizeBilinearOpBuilder(graph_builder, op_type);
  return resize_builder;
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,46 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESIZE_BILINEAR_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESIZE_BILINEAR_BUILDER_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Builds a Hexagon NN resize-bilinear node for a quantized uint8 input.
// Requires the target size to be a constant tensor.
class ResizeBilinearOpBuilder : public OpBuilder {
 public:
  explicit ResizeBilinearOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

  ~ResizeBilinearOpBuilder() override;

 private:
  // Hexagon tensor holding the resized quantized output.
  TensorID node_output_;
  // Input quantization bounds; members so they outlive graph construction.
  float input_min_, input_max_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESIZE_BILINEAR_BUILDER_H_
|
@ -0,0 +1,107 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/resize_nearest_neighbor_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Builds the Hexagon resize-nearest-neighbor node. Hexagon input order is:
// data, output-dims (const or dynamic), input min/max consts, align_corners.
TfLiteStatus ResizeNearestNeighborOpBuilder::PopulateSubGraph(
    const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
    TfLiteContext* context) {
  // Shape used for every scalar const node below.
  static int quant_bound_shape[] = {1, 1, 1, 1};
  int tensor_id;

  // Input data tensor.
  tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_min_),
      sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_max_),
      sizeof(input_max_));

  // Output dimensions tensor.
  tensor_id = inputs->data[1];
  const auto& output_dim_tensor = context->tensors[tensor_id];
  if (output_dim_tensor.allocation_type == kTfLiteMmapRo) {
    // If the output dimensions input is a constant, bake it into the Hexagon
    // graph as a Const node.
    auto* const_output_dim_node =
        graph_builder_->AddConstNodeWithData(tensor_id, output_dim_tensor);
    AddInput(TensorID(const_output_dim_node->GetID(), 0));
  } else {
    // Dynamic output size: pass the tensor through directly.
    AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  }

  // Min/max values for input tensor.
  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));

  // Align corners.
  // NOTE(review): align_corners_ is a bool, so this const node is
  // sizeof(bool) (typically 1 byte), whereas the resize-bilinear builder
  // passes a 4-byte int for the same flag — confirm Hexagon accepts a
  // 1-byte scalar here.
  const TfLiteResizeNearestNeighborParams* params =
      reinterpret_cast<const TfLiteResizeNearestNeighborParams*>(builtin_data_);
  align_corners_ = params->align_corners;
  auto* align_corners_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&align_corners_),
      sizeof(align_corners_));
  AddInput(TensorID(align_corners_const->GetID(), 0));

  // Hexagon outputs for this node: quantized data plus min/max scalars.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {output_batch_size, output_height_size,
                            output_width_size, output_depth_size});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TfLiteStatus ResizeNearestNeighborOpBuilder::RegisterOutputs(
    const TfLiteIntArray* outputs, TfLiteContext* context) {
  // Resize-nearest-neighbor has a single TFLite output; bind it to the
  // Hexagon node output.
  const int out_id = outputs->data[0];
  graph_builder_->AddTensorWithID(out_id, node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Out-of-line default destructor keeps the vtable anchored in this TU.
ResizeNearestNeighborOpBuilder::~ResizeNearestNeighborOpBuilder() = default;
|
||||||
|
|
||||||
|
// Factory hook used by the op-builder registry; the caller takes ownership.
OpBuilder* CreateResizeNearestNeighborBuilder(GraphBuilder* graph_builder,
                                              int op_type) {
  auto* resize_nn_builder =
      new ResizeNearestNeighborOpBuilder(graph_builder, op_type);
  return resize_nn_builder;
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,50 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESIZE_NEAREST_NEIGHBOR_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESIZE_NEAREST_NEIGHBOR_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Builds a Hexagon NN resize-nearest-neighbor node for a quantized uint8
// input. The output-size input may be constant or dynamic.
class ResizeNearestNeighborOpBuilder : public OpBuilder {
 public:
  explicit ResizeNearestNeighborOpBuilder(GraphBuilder* graph_builder,
                                          int op_type)
      : OpBuilder(graph_builder, op_type) {}
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

  ~ResizeNearestNeighborOpBuilder() override;

 private:
  // Hexagon tensor holding the resized quantized output.
  TensorID node_output_;
  // Input quantization bounds; members so they outlive graph construction.
  float input_min_, input_max_;
  // Align-corners flag copied from the builtin params and fed to Hexagon
  // as a const node.
  bool align_corners_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_RESIZE_NEAREST_NEIGHBOR_BUILDER_H_
|
@ -0,0 +1,89 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/softmax_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Lowers a TFLite SOFTMAX op to a Hexagon node.
// Hexagon input order: data tensor, input min, input max, beta.
// Hexagon output order: quantized result, output min, output max.
TfLiteStatus SoftmaxOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                                const TfLiteIntArray* outputs,
                                                TfLiteContext* context) {
  // Shape shared by every scalar const node (min/max/beta): [1,1,1,1].
  static std::vector<int> quant_bound_shape = {1, 1, 1, 1};
  int tensor_id;

  // Input data tensor.
  tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  // NOTE: reinterpret_cast (not C-style casts) for consistency with the
  // split/transpose builders in this delegate.
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), reinterpret_cast<char*>(&input_min_),
      sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), reinterpret_cast<char*>(&input_max_),
      sizeof(input_max_));
  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));

  // Beta value, taken from the op's builtin params.
  const TfLiteSoftmaxParams* softmax_params =
      reinterpret_cast<const TfLiteSoftmaxParams*>(builtin_data_);
  beta_value_ = softmax_params->beta;
  auto* beta_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), reinterpret_cast<char*>(&beta_value_),
      sizeof(beta_value_));
  AddInput(TensorID(beta_const->GetID(), 0));

  // Hexagon outputs for this node.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {output_batch_size, output_height_size,
                            output_width_size, output_depth_size});
  // Two scalar float outputs carrying the output quantization min/max.
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Registers the single TFLite output tensor against the Hexagon tensor
// produced in PopulateSubGraph.
TfLiteStatus SoftmaxOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                               TfLiteContext* context) {
  // Should be only 1 output.
  graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
                                  node_output_.second);

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
SoftmaxOpBuilder::~SoftmaxOpBuilder() {}

// Factory used by the delegate's op-builder registry. Caller takes ownership
// of the returned pointer.
OpBuilder* CreateSoftmaxBuilder(GraphBuilder* graph_builder, int op_type) {
  return new SoftmaxOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,49 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_SOFTMAX_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_SOFTMAX_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class SoftmaxOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit SoftmaxOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~SoftmaxOpBuilder();
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
float beta_value_ = 1.0f;
|
||||||
|
float input_min_, input_max_, output_min_, output_max_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_SOFTMAX_BUILDER_H_
|
@ -0,0 +1,107 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/split_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Lowers a TFLite SPLIT op to a Hexagon node.
// TFLite input order: [axis tensor, data tensor]. Hexagon input order:
// axis const, data tensor, input min, input max.
TfLiteStatus SplitOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                              const TfLiteIntArray* outputs,
                                              TfLiteContext* context) {
  // Shape shared by every scalar const node: [1,1,1,1].
  static int quant_bound_shape[] = {1, 1, 1, 1};

  const int input_tensor_id = inputs->data[1];
  const auto& input_tensor = context->tensors[input_tensor_id];

  // Axis tensor. Must be a compile-time constant (mmap'd read-only) since
  // its value is baked into a Hexagon const node below.
  const int axis_tensor_id = inputs->data[0];
  const auto& axis = context->tensors[axis_tensor_id];
  if (axis.allocation_type != kTfLiteMmapRo) {
    context->ReportError(context,
                         "Axis tensor doesn't have correct allocation type: %s",
                         axis.name);
    return kTfLiteError;
  }
  // We pad Hexagon tensor dimensions with 1 if dims.size < 4.
  // (4 - input_tensor.dims->size) helps maps the input axis value in such
  // cases.
  int axis_value = axis.data.i32[0] + (4 - input_tensor.dims->size);
  if (axis_value < 0) {
    // Negative axis wraps around, TFLite-style.
    axis_value += input_tensor.dims->size;
  }
  auto* input_axis_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&axis_value), sizeof(int32_t));
  AddInput(TensorID(input_axis_const->GetID(), 0));

  // Input data tensor & min/max.
  AddInput(graph_builder_->GetHexagonTensorId(input_tensor_id));
  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_min_),
      sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_max_),
      sizeof(input_max_));
  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));

  // Output data tensors: one Hexagon output per TFLite split output,
  // remembered in node_outputs_ for RegisterOutputs.
  for (int i = 0; i < outputs->size; ++i) {
    int output_batch_size, output_height_size, output_width_size,
        output_depth_size;
    GetDims(&output_batch_size, &output_height_size, &output_width_size,
            &output_depth_size, context->tensors[outputs->data[i]].dims);
    TensorID output = AddOutput(sizeof(uint8_t), 4,
                                {output_batch_size, output_height_size,
                                 output_width_size, output_depth_size});
    node_outputs_.push_back(output);
  }
  // For Hexagon output min/max.
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Maps each TFLite output tensor of the split to the corresponding Hexagon
// output recorded in PopulateSubGraph (same order).
TfLiteStatus SplitOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                             TfLiteContext* context) {
  // size_t avoids the signed/unsigned comparison warning against
  // std::vector::size().
  for (size_t i = 0; i < node_outputs_.size(); ++i) {
    graph_builder_->AddTensorWithID(outputs->data[i], node_outputs_[i].first,
                                    node_outputs_[i].second);
  }
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
SplitOpBuilder::~SplitOpBuilder() {}

// Factory used by the delegate's op-builder registry. Caller takes ownership
// of the returned pointer.
OpBuilder* CreateSplitBuilder(GraphBuilder* graph_builder, int op_type) {
  return new SplitOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,49 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_SPLIT_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_SPLIT_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Op builder that lowers a TFLite SPLIT op into a Hexagon NN graph node.
class SplitOpBuilder : public OpBuilder {
 public:
  explicit SplitOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  // Wires the axis const, data input, input min/max, and one Hexagon output
  // per split output.
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  // Maps each TFLite output tensor to its Hexagon counterpart.
  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

  ~SplitOpBuilder() override;

 private:
  // Hexagon output tensors, in the same order as the TFLite outputs.
  std::vector<TensorID> node_outputs_;
  // Quantization range of the input tensor.
  float input_min_;
  float input_max_;
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_SPLIT_BUILDER_H_
|
@ -0,0 +1,85 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/transpose_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Lowers a TFLite TRANSPOSE op to a Hexagon node.
// Hexagon input order: data tensor, permutation tensor, input min, input max.
TfLiteStatus TransposeOpBuilder::PopulateSubGraph(const TfLiteIntArray* inputs,
                                                  const TfLiteIntArray* outputs,
                                                  TfLiteContext* context) {
  // Shape shared by the scalar min/max const nodes: [1,1,1,1].
  static int quant_bound_shape[] = {1, 1, 1, 1};
  int tensor_id;

  // Input data tensor.
  tensor_id = inputs->data[0];
  const auto& input_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  // permutation tensor. If it is a compile-time constant it becomes a
  // Hexagon const node; otherwise it is wired as a regular graph input.
  tensor_id = inputs->data[1];
  const auto& control_tensor = context->tensors[tensor_id];
  if (control_tensor.allocation_type == kTfLiteMmapRo) {
    auto* const_control_tensor_node =
        graph_builder_->AddConstNodeWithData(tensor_id, control_tensor);
    AddInput(TensorID(const_control_tensor_node->GetID(), 0));
  } else {
    AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  }

  TF_LITE_ENSURE_STATUS(
      ComputeMinAndMaxQuantValues(input_tensor, &input_min_, &input_max_,
                                  std::numeric_limits<uint8_t>::min(),
                                  std::numeric_limits<uint8_t>::max()));
  auto* input_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_min_),
      sizeof(input_min_));
  auto* input_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape, reinterpret_cast<char*>(&input_max_),
      sizeof(input_max_));
  // Min/max values for input tensor.
  AddInput(TensorID(input_min_const->GetID(), 0));
  AddInput(TensorID(input_max_const->GetID(), 0));

  // Hexagon outputs for this node.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {output_batch_size, output_height_size,
                            output_width_size, output_depth_size});
  // Two scalar float outputs carrying the output quantization min/max.
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Registers the single TFLite output tensor against the Hexagon tensor
// produced in PopulateSubGraph.
TfLiteStatus TransposeOpBuilder::RegisterOutputs(const TfLiteIntArray* outputs,
                                                 TfLiteContext* context) {
  graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Factory used by the delegate's op-builder registry. Caller takes ownership
// of the returned pointer.
OpBuilder* CreateTransposeBuilder(GraphBuilder* graph_builder, int op_type) {
  return new TransposeOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,43 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_TRANSPOSE_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_TRANSPOSE_BUILDER_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
// Op builder that lowers a TFLite TRANSPOSE op into a Hexagon NN graph node.
class TransposeOpBuilder : public OpBuilder {
 public:
  explicit TransposeOpBuilder(GraphBuilder* graph_builder, int op_type)
      : OpBuilder(graph_builder, op_type) {}
  // Wires data input, permutation tensor (const or dynamic), and input
  // min/max const nodes, plus the three Hexagon outputs.
  TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
                                const TfLiteIntArray* outputs,
                                TfLiteContext* context) override;

  // Maps the single TFLite output tensor to the Hexagon output tensor.
  TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
                               TfLiteContext* context) override;

 private:
  // Hexagon tensor holding this node's quantized output.
  TensorID node_output_;
  // Quantization range of the input tensor.
  float input_min_, input_max_;
};
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_TRANSPOSE_BUILDER_H_
|
@ -0,0 +1,169 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/transpose_conv_2d_builder.h"
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <limits>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/reference/reference_ops.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
#include "tensorflow/lite/kernels/padding.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
// Lowers a TFLite TRANSPOSE_CONV op to a Hexagon node.
// TFLite input order: [output shape, weights, data]. Hexagon needs the data,
// weights, their min/max ranges, explicit padding, strides, a (zero) bias
// with its range, and the output range — wired below in that order.
TfLiteStatus TransposeConv2dOpBuilder::PopulateSubGraph(
    const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
    TfLiteContext* context) {
  // Shape shared by every scalar const node: [1,1,1,1].
  static std::vector<int> quant_bound_shape = {1, 1, 1, 1};
  int tensor_id;

  // Input data tensor.
  tensor_id = inputs->data[2];
  const auto& data_tensor = context->tensors[tensor_id];
  AddInput(graph_builder_->GetHexagonTensorId(tensor_id));
  TF_LITE_ENSURE_STATUS(ComputeMinAndMaxQuantValues(
      data_tensor, &data_min_, &data_max_, std::numeric_limits<uint8_t>::min(),
      std::numeric_limits<uint8_t>::max()));
  auto* data_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&data_min_, sizeof(data_min_));
  auto* data_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&data_max_, sizeof(data_max_));

  // Weights tensor. Must be a compile-time constant (mmap'd read-only)
  // since its contents are baked into a Hexagon const node.
  tensor_id = inputs->data[1];
  const auto& weights_tensor = context->tensors[tensor_id];
  if (weights_tensor.allocation_type != kTfLiteMmapRo) {
    context->ReportError(
        context, "Weights tensor doesn't have correct allocation type: %s",
        weights_tensor.name);
    return kTfLiteError;
  }
  int filter_batch_size, filter_height_size, filter_width_size,
      filter_depth_size;
  GetDims(&filter_batch_size, &filter_height_size, &filter_width_size,
          &filter_depth_size, weights_tensor.dims);
  weight_shape_ = {filter_batch_size, filter_height_size, filter_width_size,
                   filter_depth_size};
  auto* const_weights_node = graph_builder_->AddConstNodeWithData(
      weight_shape_.data(), (char*)weights_tensor.data.raw,
      weights_tensor.bytes);
  graph_builder_->AddTensorWithID(tensor_id, const_weights_node->GetID(), 0);
  AddInput(TensorID(const_weights_node->GetID(), 0));
  ComputeMinAndMaxQuantValues(weights_tensor, &weights_min_, &weights_max_,
                              std::numeric_limits<uint8_t>::min(),
                              std::numeric_limits<uint8_t>::max());
  auto* weights_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&weights_min_, sizeof(weights_min_));
  auto* weights_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&weights_max_, sizeof(weights_max_));

  // Min/max inputs for data & weights tensors.
  AddInput(TensorID(data_min_const->GetID(), 0));
  AddInput(TensorID(data_max_const->GetID(), 0));
  AddInput(TensorID(weights_min_const->GetID(), 0));
  AddInput(TensorID(weights_max_const->GetID(), 0));

  // Output dims are required to compute padding.
  int output_batch_size, output_height_size, output_width_size,
      output_depth_size;
  GetDims(&output_batch_size, &output_height_size, &output_width_size,
          &output_depth_size, context->tensors[outputs->data[0]].dims);

  // Hexagon TransposeConv requires an explicit padding tensor. So we compute
  // the same using stride, input & output info.
  const TfLiteTransposeConvParams* params =
      reinterpret_cast<const TfLiteTransposeConvParams*>(builtin_data_);
  int unused_output_height, unused_output_width;
  TfLitePaddingValues padding = ComputePaddingHeightWidth(
      params->stride_height, params->stride_width, 1, 1, output_height_size,
      output_width_size, filter_height_size, filter_width_size, params->padding,
      &unused_output_height, &unused_output_width);
  // Padding laid out as [[top, bottom], [left, right]] in a 1x1x2x2 tensor.
  std::vector<int> padding_tensor = {padding.height, padding.height,
                                     padding.width, padding.width};
  std::vector<int> padding_tensor_shape = {1, 1, 2, 2};
  auto* padding_const = graph_builder_->AddConstNodeWithData(
      padding_tensor_shape.data(), (char*)padding_tensor.data(),
      (sizeof(int) * 4));
  AddInput(TensorID(padding_const->GetID(), 0));

  // Stride shape. Only the const node's *shape* carries the stride values;
  // the payload is a dummy scalar — presumably Hexagon reads the shape, not
  // the data, for this input (confirm against Hexagon NN op docs).
  int stride_height = params->stride_height;
  int stride_width = params->stride_width;
  static int dummy = 0;
  stride_shape_ = {1, stride_height, stride_width, 1};
  auto* stride_node = graph_builder_->AddConstNodeWithData(
      stride_shape_.data(), (char*)&dummy, sizeof(dummy));
  AddInput(TensorID(stride_node->GetID(), 0));

  // TFLite's TransposeConv doesn't have a bias input, so we just feed in 0s.
  // (vector<int> value-initializes, so all entries are zero.)
  std::vector<int> bias_data(output_depth_size);
  // Hexagon's conv ops require bias as a [1, 1, 1, dout] tensor.
  bias_shape_ = {1, 1, 1, output_depth_size};
  auto* bias_const = graph_builder_->AddConstNodeWithData(
      bias_shape_.data(), (char*)bias_data.data(),
      sizeof(bias_data[0]) * bias_data.size());
  bias_min_ = 0;
  bias_max_ = 0;
  auto* bias_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&bias_min_, sizeof(bias_min_));
  auto* bias_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&bias_max_, sizeof(bias_max_));
  AddInput(TensorID(bias_const->GetID(), 0));
  AddInput(TensorID(bias_min_const->GetID(), 0));
  AddInput(TensorID(bias_max_const->GetID(), 0));

  // Output min/max.
  ComputeMinAndMaxQuantValues(context->tensors[outputs->data[0]], &output_min_,
                              &output_max_, std::numeric_limits<uint8_t>::min(),
                              std::numeric_limits<uint8_t>::max());
  auto* output_min_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&output_min_, sizeof(output_min_));
  auto* output_max_const = graph_builder_->AddConstNodeWithData(
      quant_bound_shape.data(), (char*)&output_max_, sizeof(output_max_));
  AddInput(TensorID(output_min_const->GetID(), 0));
  AddInput(TensorID(output_max_const->GetID(), 0));

  // Hexagon outputs for this node.
  node_output_ = AddOutput(sizeof(uint8_t), 4,
                           {output_batch_size, output_height_size,
                            output_width_size, output_depth_size});
  // Two scalar float outputs carrying the output quantization min/max.
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});
  AddOutput(sizeof(float), 4, {1, 1, 1, 1});

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Registers the single TFLite output tensor against the Hexagon tensor
// produced in PopulateSubGraph.
TfLiteStatus TransposeConv2dOpBuilder::RegisterOutputs(
    const TfLiteIntArray* outputs, TfLiteContext* context) {
  // Should be only 1 output.
  graph_builder_->AddTensorWithID(outputs->data[0], node_output_.first,
                                  node_output_.second);
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
TransposeConv2dOpBuilder::~TransposeConv2dOpBuilder() {}

// Factory used by the delegate's op-builder registry. Caller takes ownership
// of the returned pointer.
OpBuilder* CreateTransposeConv2DBuilder(GraphBuilder* graph_builder,
                                        int op_type) {
  return new TransposeConv2dOpBuilder(graph_builder, op_type);
}
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,53 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_TRANSPOSE_CONV_2D_BUILDER_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_TRANSPOSE_CONV_2D_BUILDER_H_
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace delegates {
|
||||||
|
namespace hexagon {
|
||||||
|
|
||||||
|
class TransposeConv2dOpBuilder : public OpBuilder {
|
||||||
|
public:
|
||||||
|
explicit TransposeConv2dOpBuilder(GraphBuilder* graph_builder, int op_type)
|
||||||
|
: OpBuilder(graph_builder, op_type) {}
|
||||||
|
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
|
||||||
|
const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
|
||||||
|
TfLiteContext* context) override;
|
||||||
|
|
||||||
|
~TransposeConv2dOpBuilder();
|
||||||
|
|
||||||
|
private:
|
||||||
|
TensorID node_output_;
|
||||||
|
std::vector<float> transposed_weights_;
|
||||||
|
std::vector<int> stride_shape_;
|
||||||
|
std::vector<int> weight_shape_, bias_shape_;
|
||||||
|
std::vector<int> bias_data_;
|
||||||
|
float data_min_, data_max_, weights_min_, weights_max_, bias_min_, bias_max_,
|
||||||
|
output_min_, output_max_;
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace hexagon
|
||||||
|
} // namespace delegates
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_BUILDERS_TRANSPOSE_CONV_2D_BUILDER_H_
|
@ -0,0 +1,184 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_delegate.h"
|
||||||
|
|
||||||
|
#include <memory>
|
||||||
|
#include <string>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
#include "tensorflow/lite/context_util.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_delegate_kernel.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_implementation.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/utils.h"
|
||||||
|
#include "tensorflow/lite/minimal_logging.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace {
|
||||||
|
// Should be > 0. > 16 causes problems.
|
||||||
|
constexpr int kMaxHexagonGraphs = 4;
|
||||||
|
|
||||||
|
// Builds the TfLiteRegistration for the delegate node that replaces each
// delegated subgraph in the TFLite execution plan. The registration behaves
// like a regular op, except:
//   init    -> constructs and initializes a HexagonDelegateKernel.
//   prepare -> prepares the underlying Hexagon graph.
//   invoke  -> executes the Hexagon graph.
//   free    -> destroys the HexagonDelegateKernel.
TfLiteRegistration GetHexagonKernelRegistration() {
  TfLiteRegistration registration;
  registration.builtin_code = kTfLiteBuiltinDelegate;
  registration.custom_name = "TfLiteHexagonDelegate";
  registration.init = [](TfLiteContext* context, const char* buffer,
                         size_t length) -> void* {
    // 'buffer' carries the delegate params describing the replaced subgraph.
    auto* params = reinterpret_cast<const TfLiteDelegateParams*>(buffer);
    auto kernel = std::make_unique<HexagonDelegateKernel>();
    if (kernel->Init(context, params) != kTfLiteOk) {
      return nullptr;
    }
    // Ownership transfers to the node's user_data; reclaimed in 'free'.
    return kernel.release();
  };
  registration.prepare = [](TfLiteContext* context,
                            TfLiteNode* node) -> TfLiteStatus {
    if (node->user_data == nullptr) {
      context->ReportError(context, "Hexagon Kernel was not initialized");
      return kTfLiteError;
    }
    return reinterpret_cast<HexagonDelegateKernel*>(node->user_data)
        ->Prepare(context, node);
  };
  registration.invoke = [](TfLiteContext* context,
                           TfLiteNode* node) -> TfLiteStatus {
    auto* kernel = reinterpret_cast<HexagonDelegateKernel*>(node->user_data);
    if (!kernel) {
      context->ReportError(context, "Hexagon Kernel was not initialized");
      return kTfLiteError;
    }
    return kernel->Invoke(context, node);
  };
  registration.free = [](TfLiteContext* context, void* buffer) -> void {
    delete reinterpret_cast<HexagonDelegateKernel*>(buffer);
  };
  return registration;
}
|
||||||
|
|
||||||
|
// Delegate Prepare callback: scans the execution plan, collects the nodes
// Hexagon can run (limited to kMaxHexagonGraphs contiguous runs), and asks
// TFLite to replace them with the Hexagon delegate kernel.
TfLiteStatus DelegatePrepare(TfLiteContext* context, TfLiteDelegate* delegate) {
  // Reserve 1 element, since we need first element to be size, will be updated
  // later. The vector is laid out as {count, idx0, idx1, ...} so its data()
  // can be reinterpreted as a TfLiteIntArray below.
  std::vector<int> supported_nodes(1);
  TfLiteIntArray* plan;
  TF_LITE_ENSURE_STATUS(context->GetExecutionPlan(context, &plan));
  TfLiteNode* node;
  TfLiteRegistration* registration;

  // Rudimentary mechanism to check how many Hexagon graphs we initialize.
  int num_components = 1;
  int last_index = -1;
  for (int node_index : TfLiteIntArrayView(plan)) {
    TF_LITE_ENSURE_STATUS(context->GetNodeAndRegistration(
        context, node_index, &node, &registration));
    if (IsNodeSupportedByHexagon(registration, node, context)) {
      // If there is a 'break' in node indices, a new subgraph (and therefore, a
      // new Hexagon graph) will be created.
      if (last_index != -1 && node_index != last_index + 1) {
        // Stop delegating once the graph budget is exhausted; remaining
        // supported nodes stay on CPU.
        if (num_components == kMaxHexagonGraphs) {
          break;
        }
        ++num_components;
      }
      supported_nodes.push_back(node_index);
      last_index = node_index;
    }
  }
  // Set first element to the number of nodes to replace.
  supported_nodes[0] = supported_nodes.size() - 1;
  TFLITE_LOG_PROD(tflite::TFLITE_LOG_INFO,
                  "Hexagon delegate: %d nodes delegated out of %d nodes.\n",
                  supported_nodes[0], plan->size);
  TfLiteRegistration hexagon_kernel_registration =
      GetHexagonKernelRegistration();

  // TfLiteIntArray is {size, data[]}, matching the vector layout built above.
  return context->ReplaceNodeSubsetsWithDelegateKernels(
      context, hexagon_kernel_registration,
      reinterpret_cast<TfLiteIntArray*>(supported_nodes.data()), delegate);
}
|
||||||
|
|
||||||
|
// Concrete delegate object returned to clients. Extends the C TfLiteDelegate
// struct with a copy of the user-provided options.
class HexagonDelegate : public TfLiteDelegate {
 public:
  // Copies '*params' if given; otherwise uses value-initialized (all-zero)
  // default options.
  explicit HexagonDelegate(const TfLiteHexagonDelegateOptions* params)
      : params_(params != nullptr ? *params : TfLiteHexagonDelegateOptions()) {}

  // Returns a pointer to the stored options (exposed via delegate->data_).
  TfLiteHexagonDelegateOptions* params() { return &params_; }

  // Returns true iff the Hexagon NN library is loadable and reports that
  // this device's DSP is supported.
  bool VerifyDelegate() {
    auto* hexagon_nn = HexagonNNImplementation();
    if (hexagon_nn == nullptr) {
      return false;
    }
    // Guard against the symbol itself failing to load before calling it.
    return hexagon_nn->hexagon_nn_is_device_supported &&
           hexagon_nn->hexagon_nn_is_device_supported();
  }

 private:
  TfLiteHexagonDelegateOptions params_;
};
|
||||||
|
|
||||||
|
// Creates and wires up a HexagonDelegate for the given options.
// Returns nullptr (after logging) when the device/library is unsupported.
TfLiteDelegate* CreateDelegate(const TfLiteHexagonDelegateOptions* params) {
  // Keep the pointer typed as HexagonDelegate*: deleting through the
  // TfLiteDelegate base (which has no virtual destructor) would be undefined
  // behavior, and it avoids repeated static_casts below.
  auto* hexagon_delegate = new HexagonDelegate(params);
  if (!hexagon_delegate->VerifyDelegate()) {
    delete hexagon_delegate;
    TFLITE_LOG_PROD_ONCE(tflite::TFLITE_LOG_INFO,
                         "Hexagon Delegate is not supported.\n");
    return nullptr;
  }

  // data_ exposes the options to the delegate kernel (read back in
  // HexagonDelegateKernel::Init via params->delegate->data_).
  hexagon_delegate->data_ = hexagon_delegate->params();
  hexagon_delegate->flags = kTfLiteDelegateFlagsNone;
  hexagon_delegate->Prepare = &DelegatePrepare;
  // Buffer-handle support is not implemented.
  hexagon_delegate->CopyFromBufferHandle = nullptr;
  hexagon_delegate->CopyToBufferHandle = nullptr;
  hexagon_delegate->FreeBufferHandle = nullptr;

  TFLITE_LOG_PROD_ONCE(tflite::TFLITE_LOG_INFO,
                       "Created TensorFlow Lite delegate for Hexagon.");

  return hexagon_delegate;
}
|
||||||
|
|
||||||
|
} // namespace
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
// C API entry point: creates a Hexagon delegate with the given options
// (nullptr -> defaults). Returns nullptr if Hexagon is unsupported.
TfLiteDelegate* TfLiteHexagonDelegateCreate(
    const TfLiteHexagonDelegateOptions* options) {
  return tflite::CreateDelegate(options);
}
|
||||||
|
|
||||||
|
void TfLiteHexagonDelegateDelete(TfLiteDelegate* delegate) { delete delegate; }
|
||||||
|
|
||||||
|
void TfLiteHexagonInit() { tflite::HexagonDelegateKernel::InitState(); }
|
||||||
|
|
||||||
|
// C API entry point: points ADSP_LIBRARY_PATH at 'lib_directory_path'
// (followed by the standard on-device DSP library locations), then
// initializes the DSP connection. A null path skips the env setup.
void TfLiteHexagonInitWithPath(const char* lib_directory_path) {
  if (lib_directory_path != nullptr) {
    const std::string adsp_library_path =
        std::string(lib_directory_path) +
        ";/system/lib/rfsa/adsp;/system/vendor/lib/rfsa/adsp;/dsp";
    setenv("ADSP_LIBRARY_PATH", adsp_library_path.c_str(), /*overwrite=*/1);
  }
  tflite::HexagonDelegateKernel::InitState();
}
|
||||||
|
void TfLiteHexagonTearDown() { tflite::HexagonDelegateKernel::Teardown(); }
|
@ -0,0 +1,81 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_DELEGATE_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_DELEGATE_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
|
||||||
|
#ifdef SWIG
|
||||||
|
#define TFL_CAPI_EXPORT
|
||||||
|
#else
|
||||||
|
#if defined(_WIN32)
|
||||||
|
#ifdef TFL_COMPILE_LIBRARY
|
||||||
|
#define TFL_CAPI_EXPORT __declspec(dllexport)
|
||||||
|
#else
|
||||||
|
#define TFL_CAPI_EXPORT __declspec(dllimport)
|
||||||
|
#endif // TFL_COMPILE_LIBRARY
|
||||||
|
#else
|
||||||
|
#define TFL_CAPI_EXPORT __attribute__((visibility("default")))
|
||||||
|
#endif // _WIN32
|
||||||
|
#endif // SWIG
|
||||||
|
|
||||||
|
#ifdef __cplusplus
|
||||||
|
extern "C" {
|
||||||
|
#endif // __cplusplus
|
||||||
|
// Options controlling the Hexagon delegate. Plain C struct (used through the
// extern "C" API), so it carries no member initializers.
// NOTE(review): callers constructing this on the stack from C get
// indeterminate fields unless they zero it; the C++ side value-initializes
// when a null options pointer is passed — confirm C callers memset/zero it.
struct TFL_CAPI_EXPORT TfLiteHexagonDelegateOptions {
  // This corresponds to the debug level in the hexagon SDK. 0 (default)
  // means no debug.
  int debug_level;
  // This corresponds to powersave_level in the hexagon SDK.
  // where 0 (default) means high performance which means more power
  // consumption.
  int powersave_level;
  // If set to true, performance information about the graph will be dumped
  // to Standard output, this includes cpu cycles.
  // WARNING: Experimental and subject to change anytime.
  bool print_graph_profile;
  // If set to true, graph structure will be dumped to Standard output.
  // This is usually beneficial to see what actual nodes executed on
  // the DSP. Combining with 'debug_level' more information will be printed.
  // WARNING: Experimental and subject to change anytime.
  bool print_graph_debug;
};
|
||||||
|
|
||||||
|
// Return a delegate that uses Hexagon SDK for ops execution.
|
||||||
|
// Must outlive the interpreter.
|
||||||
|
TfLiteDelegate* TFL_CAPI_EXPORT
|
||||||
|
TfLiteHexagonDelegateCreate(const TfLiteHexagonDelegateOptions* options);
|
||||||
|
|
||||||
|
// Do any needed cleanup and delete 'delegate'.
|
||||||
|
void TFL_CAPI_EXPORT TfLiteHexagonDelegateDelete(TfLiteDelegate* delegate);
|
||||||
|
|
||||||
|
// Initializes the DSP connection.
|
||||||
|
// This should be called before doing any usage of the delegate.
|
||||||
|
// "lib_directory_path": Path to the directory which holds the
|
||||||
|
// shared libraries for the Hexagon NN libraries on the device.
|
||||||
|
void TFL_CAPI_EXPORT TfLiteHexagonInitWithPath(const char* lib_directory_path);
|
||||||
|
|
||||||
|
// Same as above method but doesn't accept the path params.
|
||||||
|
// Assumes the environment setup is already done. Only initialize Hexagon.
|
||||||
|
void TFL_CAPI_EXPORT TfLiteHexagonInit();
|
||||||
|
|
||||||
|
// Clean up and switch off the DSP connection.
|
||||||
|
// This should be called after all processing is done and delegate is deleted.
|
||||||
|
void TFL_CAPI_EXPORT TfLiteHexagonTearDown();
|
||||||
|
#ifdef __cplusplus
|
||||||
|
}
|
||||||
|
#endif // __cplusplus
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_DELEGATE_H_
|
@ -0,0 +1,357 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_delegate_kernel.h"
|
||||||
|
|
||||||
|
#include <algorithm>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/builtin_ops.h"
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
#include "tensorflow/lite/context_util.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_implementation.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/utils.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
|
||||||
|
namespace {
|
||||||
|
// Returns a human-readable name for 'state', used when reporting errors.
inline const char* StateToString(
    HexagonDelegateKernel::HexagonKernelState state) {
  switch (state) {
    case HexagonDelegateKernel::HexagonKernelState::HEALTHY:
      return "HEALTHY";
    case HexagonDelegateKernel::HexagonKernelState::FAST_RPC_SETUP_FAILED:
      return "FAST_RPC_SETUP_FAILED";
    case HexagonDelegateKernel::HexagonKernelState::FAILED_TO_INIT_GRAPH:
      return "FAILED_TO_INIT_GRAPH";
    case HexagonDelegateKernel::HexagonKernelState::FAILED_TO_PREPARE_GRAPH:
      return "FAILED_TO_PREPARE_GRAPH";
    case HexagonDelegateKernel::HexagonKernelState::MULTIPLE_INPUTS:
      return "MULTIPLE_INPUTS";
    case HexagonDelegateKernel::HexagonKernelState::INPUT_RANK_NOT_SUPPORTED:
      return "INPUT_RANK_NOT_SUPPORTED";
    case HexagonDelegateKernel::HexagonKernelState::MULTIPLE_OUTPUTS:
      return "MULTIPLE_OUTPUTS";
    case HexagonDelegateKernel::HexagonKernelState::FAILED_TO_EXECUTE_GRAPH:
      return "FAILED_TO_EXECUTE_GRAPH";
  }
  // All enumerators are handled above; this fallback keeps the function
  // well-defined (and silences -Wreturn-type) if an out-of-range integer is
  // ever cast to the enum.
  return "UNKNOWN_STATE";
}
|
||||||
|
|
||||||
|
// Returns uint64 representing total cycles in 'perf_info' by
|
||||||
|
// combining lo and hi counters.
|
||||||
|
inline uint64_t GetCycles(const hexagon_nn_perfinfo& perf_info) {
|
||||||
|
uint64_t res = perf_info.counter_hi;
|
||||||
|
res <<= 32;
|
||||||
|
res |= perf_info.counter_lo;
|
||||||
|
return res;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Comparator for hexagon_nn_perfinfo in descending order based on
|
||||||
|
// total cycles consumed.
|
||||||
|
// Comparator for hexagon_nn_perfinfo in descending order based on
// total cycles consumed, so the most expensive nodes sort first.
struct PerfInfoCmp {
  bool operator()(const hexagon_nn_perfinfo& a,
                  const hexagon_nn_perfinfo& b) const {
    return GetCycles(a) > GetCycles(b);
  }
};
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
// Reports a delegate failure: dumps the Hexagon NN log for debugging, then
// forwards a formatted message (with the kernel state name) to TFLite's
// error reporter.
void HexagonDelegateKernel::ReportError(TfLiteContext* context,
                                        HexagonKernelState state,
                                        const std::string& msg) {
  PrintLog();
  context->ReportError(context, "Failed: %s. STATE: %s", msg.c_str(),
                       StateToString(state));
}
|
||||||
|
|
||||||
|
// Initializes the kernel for one delegated subgraph: loads the Hexagon NN
// interface, reads options from the owning delegate, creates and configures
// an empty Hexagon graph, then builds it from the nodes in 'params'.
TfLiteStatus HexagonDelegateKernel::Init(TfLiteContext* context,
                                         const TfLiteDelegateParams* params) {
  hexagon_nn_ = HexagonNNImplementation();
  if (hexagon_nn_ == nullptr) {
    context->ReportError(context, "Hexagon interface not available.");
    return kTfLiteError;
  }
  // Options were stashed in delegate->data_ by CreateDelegate; fall back to
  // defaults if absent.
  if (params != nullptr && params->delegate != nullptr) {
    const ::TfLiteHexagonDelegateOptions* options_ptr =
        reinterpret_cast<const ::TfLiteHexagonDelegateOptions*>(
            params->delegate->data_);
    params_ = (options_ptr == nullptr ? ::TfLiteHexagonDelegateOptions()
                                      : *options_ptr);
  }

  // Ensure Hexagon NNLib is ready to start working.
  int error = hexagon_nn_->hexagon_nn_config();
  if (error != 0) {
    context->ReportError(context, "hexagon_nn_config failed. Error: %d", error);
    return kTfLiteError;
  }

  // Initialize an empty graph.
  error = hexagon_nn_->hexagon_nn_init(&graph_id_);
  if (error != 0) {
    state_ = HexagonKernelState::FAILED_TO_INIT_GRAPH;
    ReportError(context, state_, "failed to init");
    return kTfLiteError;
  }
  error =
      hexagon_nn_->hexagon_nn_set_debug_level(graph_id_, params_.debug_level);
  if (error != 0) {
    context->ReportError(context, "Failed to set debug level, error: %d",
                         error);
    return kTfLiteError;
  }
  // NOTE: powersave level is a global (non-per-graph) setting in the SDK.
  error = hexagon_nn_->hexagon_nn_set_powersave_level(params_.powersave_level);
  if (error != 0) {
    context->ReportError(context, "Failed to set powersave level, error %d",
                         error);
    return kTfLiteError;
  }

  // Remember which TFLite nodes this kernel replaces; BuildGraph walks them.
  for (auto node_index : TfLiteIntArrayView(params->nodes_to_replace)) {
    nodes_.push_back(node_index);
  }

  TF_LITE_ENSURE_STATUS(
      BuildGraph(context, params->input_tensors, params->output_tensors));
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Executes the prepared Hexagon graph: wraps the node's non-const TFLite
// input/output tensors into hexagon_nn_tensordef descriptors (data pointers
// are shared, not copied) and runs hexagon_nn_execute_new.
TfLiteStatus HexagonDelegateKernel::Invoke(TfLiteContext* context,
                                           TfLiteNode* node) {
  if (hexagon_nn_ == nullptr) {
    context->ReportError(context, "Hexagon interface not available.");
    return kTfLiteError;
  }
  // Allocate inputs.
  std::vector<hexagon_nn_tensordef> input_tensors;
  for (auto tensor_index : TfLiteIntArrayView(node->inputs)) {
    if (tensor_index == kTfLiteOptionalTensor) {
      continue;
    }
    TfLiteTensor* tensor = &context->tensors[tensor_index];
    // Const tensors should be added as const nodes during graph construction.
    if (tensor->allocation_type != kTfLiteMmapRo) {
      // Hexagon tensordefs describe at most 4 dimensions (B, H, W, D).
      if (tensor->dims->size > 4) {
        ReportError(context, HexagonKernelState::INPUT_RANK_NOT_SUPPORTED,
                    "Only up to 4d tensor are supported.");
        return kTfLiteError;
      }
      input_tensors.emplace_back();
      auto& input_tensor = input_tensors.back();
      input_tensor.data = reinterpret_cast<unsigned char*>(tensor->data.raw);
      input_tensor.dataLen = tensor->bytes;
      input_tensor.data_valid_len = tensor->bytes;
      TF_LITE_ENSURE_STATUS(
          Get4DShape(&input_tensor.batches, &input_tensor.height,
                     &input_tensor.width, &input_tensor.depth, tensor->dims));
    }
  }

  // Allocate outputs.
  std::vector<hexagon_nn_tensordef> output_tensors;
  for (auto tensor_index : TfLiteIntArrayView(node->outputs)) {
    if (tensor_index == kTfLiteOptionalTensor) {
      continue;
    }
    TfLiteTensor* tensor = &context->tensors[tensor_index];
    if (tensor->allocation_type != kTfLiteMmapRo) {
      if (tensor->dims->size > 4) {
        // NOTE(review): reuses INPUT_RANK_NOT_SUPPORTED for an *output*
        // tensor — no output-specific state exists in the enum.
        ReportError(context, HexagonKernelState::INPUT_RANK_NOT_SUPPORTED,
                    "Only up to 4d tensor are supported.");
        return kTfLiteError;
      }
      output_tensors.emplace_back();
      auto& output_tensor = output_tensors.back();
      output_tensor.data = reinterpret_cast<unsigned char*>(tensor->data.raw);
      output_tensor.dataLen = tensor->bytes;
    }
  }

  // Reset the per-node performance counters so the dump below covers only
  // this invocation.
  if (params_.print_graph_profile) {
    hexagon_nn_->hexagon_nn_reset_perfinfo(graph_id_, 0);
  }

  // Execute.
  int error = hexagon_nn_->hexagon_nn_execute_new(
      graph_id_, input_tensors.data(), input_tensors.size(),
      output_tensors.data(), output_tensors.size());
  if (error != 0) {
    ReportError(context, HexagonKernelState::FAILED_TO_EXECUTE_GRAPH,
                "Failed to execute graph.");
    return kTfLiteError;
  }
  if (params_.print_graph_profile) {
    PrintPerformanceData();
  }
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Prepares the Hexagon graph (hexagon_nn_prepare) and validates that every
// non-const I/O tensor of the delegate node has rank <= 4.
TfLiteStatus HexagonDelegateKernel::Prepare(TfLiteContext* context,
                                            TfLiteNode* node) {
  if (hexagon_nn_ == nullptr) {
    context->ReportError(context, "Hexagon interface not available. prepare");
    return kTfLiteError;
  }
  int status = hexagon_nn_->hexagon_nn_prepare(graph_id_);
  if (status != 0) {
    state_ = HexagonKernelState::FAILED_TO_PREPARE_GRAPH;
    ReportError(context, state_, "Failed to prepare graph.\n");
    return kTfLiteError;
  }

  // Check input/output tensors.
  std::vector<int> tensors;
  for (auto tensor_index : TfLiteIntArrayView(node->inputs)) {
    tensors.push_back(tensor_index);
  }
  for (auto tensor_index : TfLiteIntArrayView(node->outputs)) {
    tensors.push_back(tensor_index);
  }
  for (auto tensor_index : tensors) {
    if (tensor_index == kTfLiteOptionalTensor) {
      continue;
    }
    TfLiteTensor* tensor = &context->tensors[tensor_index];
    // Const tensors should be added as const nodes during graph construction.
    if (tensor->allocation_type != kTfLiteMmapRo && tensor->dims->size > 4) {
      ReportError(context, HexagonKernelState::INPUT_RANK_NOT_SUPPORTED,
                  "Only up to 4d tensor are supported.");
      return kTfLiteError;
    }
  }

  // Optionally dump the constructed Hexagon graph for debugging.
  if (params_.print_graph_debug) {
    PrintDebuggingGraph();
  }

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Translates the delegated TFLite subgraph into the Hexagon graph: adds the
// graph inputs, one Hexagon node (or more) per TFLite node in nodes_, then
// the graph outputs, and finalizes the builder.
TfLiteStatus HexagonDelegateKernel::BuildGraph(
    TfLiteContext* context, const TfLiteIntArray* input_tensors,
    const TfLiteIntArray* output_tensors) {
  builder_.reset(
      new delegates::hexagon::GraphBuilder(hexagon_nn_, context, graph_id_));
  // Add inputs to the graph.
  // NOTE(review): the return values of AddInputTensors/AddOutputTensors/Build
  // are ignored here — confirm they cannot fail, or propagate their status.
  builder_->AddInputTensors(input_tensors, context);

  // Add all ops.
  TfLiteNode* node;
  TfLiteRegistration* reg;
  for (int node_index : nodes_) {
    TF_LITE_ENSURE_STATUS(
        context->GetNodeAndRegistration(context, node_index, &node, &reg));
    auto* op_builder = builder_->AddNodeFromTfLiteOp(reg->builtin_code, node);
    TF_LITE_ENSURE_STATUS(
        op_builder->PopulateSubGraph(node->inputs, node->outputs, context));
    TF_LITE_ENSURE_STATUS(op_builder->RegisterOutputs(node->outputs, context));
  }

  // Add Outputs.
  builder_->AddOutputTensors(output_tensors, context);

  builder_->Build();

  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Tears down the per-kernel Hexagon graph, if one was created (graph_id_
// stays -1 when hexagon_nn_init never succeeded).
HexagonDelegateKernel::~HexagonDelegateKernel() {
  if (graph_id_ != -1) {
    hexagon_nn_->hexagon_nn_teardown(graph_id_);
  }
}
|
||||||
|
|
||||||
|
// Fetches the Hexagon NN log for this graph and prints it (with a timestamp)
// to stdout. Used when reporting errors.
void HexagonDelegateKernel::PrintLog() {
  // 3MB scratch buffer for the DSP-side log text.
  std::vector<unsigned char> buf(3000000);
  time_t my_time = time(nullptr);
  hexagon_nn_->hexagon_nn_getlog(graph_id_, buf.data(), buf.size());
  printf("----------------\n");
  printf("Timestamp: %s\n\n", ctime(&my_time));
  printf("Log\n%s\n", buf.data());
  printf("----------------\n");
  fflush(stdout);
}
|
||||||
|
|
||||||
|
void HexagonDelegateKernel::PrintPerformanceData() {
|
||||||
|
const int kMaxNodes = 2048;
|
||||||
|
const int kMaxNameLen = 100;
|
||||||
|
std::vector<hexagon_nn_perfinfo> perf_data(kMaxNodes);
|
||||||
|
std::vector<char> op_name(kMaxNameLen);
|
||||||
|
uint64_t total_cycles = 0;
|
||||||
|
uint64_t cum_cycles = 0;
|
||||||
|
uint64_t counter = 0;
|
||||||
|
unsigned int num_nodes;
|
||||||
|
printf("------- Performance Debug Data Start -------\n");
|
||||||
|
if (hexagon_nn_->hexagon_nn_get_perfinfo(graph_id_, perf_data.data(),
|
||||||
|
kMaxNodes, &num_nodes) != 0) {
|
||||||
|
printf("Failed fetching perf data.\n");
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
printf("Total %d nodes.\n", num_nodes);
|
||||||
|
std::sort(perf_data.begin(), perf_data.begin() + num_nodes, PerfInfoCmp());
|
||||||
|
for (int i = 0; i < num_nodes; i++) {
|
||||||
|
total_cycles += GetCycles(perf_data[i]);
|
||||||
|
}
|
||||||
|
printf("Total %lu cycles\n", static_cast<unsigned long>(total_cycles));
|
||||||
|
printf(
|
||||||
|
"Node ID,\tOP Name,\tExecutions,\tCycles,\t%% of total,\tCummulative "
|
||||||
|
"cycles,\tCummulative %%\n");
|
||||||
|
for (int i = 0; i < num_nodes; i++) {
|
||||||
|
counter = GetCycles(perf_data[i]);
|
||||||
|
cum_cycles += counter;
|
||||||
|
int op_type_id = builder_->GetOpTypeId(perf_data[i].node_id);
|
||||||
|
if (op_type_id >= 0 && hexagon_nn_->hexagon_nn_op_id_to_name(
|
||||||
|
op_type_id, op_name.data(), kMaxNameLen) != 0) {
|
||||||
|
printf("Failed to fetch name for %u with type %d\n", perf_data[i].node_id,
|
||||||
|
op_type_id);
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
printf("0x%x,\t%s,\t%d,\t%lu,\t%f %%,\t%lu,\t%f %%\n", perf_data[i].node_id,
|
||||||
|
(op_type_id < 0 ? "" : op_name.data()), perf_data[i].executions,
|
||||||
|
static_cast<unsigned long>(counter),
|
||||||
|
100.0 * (1.0 * counter / total_cycles),
|
||||||
|
static_cast<unsigned long>(cum_cycles),
|
||||||
|
100.0 * (1.0 * cum_cycles / total_cycles));
|
||||||
|
}
|
||||||
|
printf("------- Performance Debug Data End -------\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
// Fetches a textual dump of the constructed Hexagon graph (hexagon_nn_snpprint)
// and prints it to stdout. Verbosity depends on the configured debug_level.
void HexagonDelegateKernel::PrintDebuggingGraph() {
  const int kMaxBufLen = 100000;
  std::vector<unsigned char> buf(kMaxBufLen);
  if (hexagon_nn_->hexagon_nn_snpprint(graph_id_, buf.data(), kMaxBufLen) !=
      0) {
    printf("Error fetching graph debug details.\n");
    return;
  }
  printf("------- Graph Debugging Start -------\n");
  printf("%s\n", buf.data());
  printf("------- Graph Debugging End -------\n");
}
|
||||||
|
|
||||||
|
// Releases the global Hexagon NN environment (counterpart of InitState).
// No-op if the Hexagon library could not be loaded.
void HexagonDelegateKernel::Teardown() {
  auto* hexagon_nn = HexagonNNImplementation();
  if (hexagon_nn != nullptr) {
    hexagon_nn->hexagon_nn_global_teardown();
  }
}
|
||||||
|
|
||||||
|
// Sets up the global Hexagon NN environment (DSP attributes, rpcmem, etc.).
// No-op if the Hexagon library could not be loaded.
void HexagonDelegateKernel::InitState() {
  auto* hexagon_nn = HexagonNNImplementation();
  if (hexagon_nn != nullptr) {
    hexagon_nn->hexagon_nn_global_init();
  }
}
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,100 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_DELEGATE_KERNEL_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_DELEGATE_KERNEL_H_
|
||||||
|
|
||||||
|
#include <time.h>
|
||||||
|
|
||||||
|
#include <memory>
|
||||||
|
#include <string>
|
||||||
|
#include <utility>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "hexagon/hexagon_nn_ops.h"
|
||||||
|
#include "tensorflow/lite/builtin_ops.h"
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/builders/op_builder.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_delegate.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_implementation.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/schema/schema_generated.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
|
||||||
|
// Represents an abstraction of a Hexagon NNLib graph with functionality to
|
||||||
|
// initialize, prepare and invoke it based on the TFLite subgraph to be
|
||||||
|
// delegated.
|
||||||
|
// Represents an abstraction of a Hexagon NNLib graph with functionality to
// initialize, prepare and invoke it based on the TFLite subgraph to be
// delegated. One instance exists per delegated node subset.
class HexagonDelegateKernel {
 public:
  // Kernel health/failure states, reported (via StateToString) in error
  // messages.
  enum class HexagonKernelState {
    HEALTHY = 0,
    FAST_RPC_SETUP_FAILED = 1,
    FAILED_TO_INIT_GRAPH = 2,
    FAILED_TO_PREPARE_GRAPH = 3,
    MULTIPLE_INPUTS = 4,
    INPUT_RANK_NOT_SUPPORTED = 5,
    MULTIPLE_OUTPUTS = 6,
    FAILED_TO_EXECUTE_GRAPH = 7,
  };

  // Initialize the Hexagon graph and add required nodes.
  TfLiteStatus Init(TfLiteContext* context, const TfLiteDelegateParams* params);

  // Prepare the Hexagon graph with hexagon_nn_prepare.
  TfLiteStatus Prepare(TfLiteContext* context, TfLiteNode* node);

  // Allocate Hexagon tensordefs for graph I/O & execute it.
  TfLiteStatus Invoke(TfLiteContext* context, TfLiteNode* node);

  // Tears down the Hexagon graph created in Init, if any.
  ~HexagonDelegateKernel();

  // Sets the environment required for Hexagon execution: DSP attributes,
  // rpcmem, etc.
  static void InitState();

  // Teardown the environment initialized in InitState.
  static void Teardown();

 private:
  // Builds the Hexagon graph based on delegated TFLite subgraph.
  TfLiteStatus BuildGraph(TfLiteContext* context,
                          const TfLiteIntArray* input_tensors,
                          const TfLiteIntArray* output_tensors);

  // Dumps the Hexagon log and reports 'msg' and 'state' to TFLite's error
  // reporter.
  void ReportError(TfLiteContext* context, HexagonKernelState state,
                   const std::string& msg);

  // Prints the Hexagon NN log for this graph to stdout.
  void PrintLog();

  // Prints performance information about the graph including cycles per node.
  void PrintPerformanceData();

  // Print debugging information about the graph constructed.
  // Amount of information can be increased with debug level.
  void PrintDebuggingGraph();

  // Current health state of this kernel.
  HexagonKernelState state_ = HexagonKernelState::HEALTHY;
  const HexagonNN* hexagon_nn_ = nullptr;  // Not owned.
  // Translates TFLite nodes into Hexagon graph nodes.
  std::unique_ptr<delegates::hexagon::GraphBuilder> builder_;
  // Hexagon NN graph handle; -1 until hexagon_nn_init succeeds.
  hexagon_nn_nn_id graph_id_ = -1;
  // Indices of nodes in the delegated TfLite subgraph.
  std::vector<int> nodes_;
  // Copy of the delegate options (debug/powersave/profiling flags).
  ::TfLiteHexagonDelegateOptions params_;
};
|
||||||
|
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_DELEGATE_KERNEL_H_
|
@ -0,0 +1,89 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_implementation.h"
|
||||||
|
|
||||||
|
#include <dlfcn.h>
|
||||||
|
#include <fcntl.h>
|
||||||
|
|
||||||
|
#include <cstdio>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn_interface.h"
|
||||||
|
#include "tensorflow/lite/kernels/internal/compatibility.h"
|
||||||
|
#include "tensorflow/lite/minimal_logging.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace {
|
||||||
|
|
||||||
|
void* LoadFunction(void* dl_handle, const char* name) {
|
||||||
|
TFLITE_DCHECK(dl_handle != nullptr);
|
||||||
|
auto* func_pt = dlsym(dl_handle, name);
|
||||||
|
if (func_pt == nullptr) {
|
||||||
|
TFLITE_LOG_PROD(TFLITE_LOG_ERROR, "Function %s is NULL", name);
|
||||||
|
}
|
||||||
|
return func_pt;
|
||||||
|
}
|
||||||
|
|
||||||
|
#define LOAD_FUNCTION(dl_handle, method_name, hexagon_obj) \
|
||||||
|
hexagon_obj.method_name = reinterpret_cast<method_name##_fn*>( \
|
||||||
|
LoadFunction(dl_handle, #method_name)); \
|
||||||
|
if ((hexagon_obj.method_name) == nullptr) { \
|
||||||
|
TFLITE_LOG_PROD(TFLITE_LOG_ERROR, "%s is NULL", (#method_name)); \
|
||||||
|
return hexagon_obj; \
|
||||||
|
}
|
||||||
|
|
||||||
|
HexagonNN CreateNewHexagonInterface() {
|
||||||
|
HexagonNN hexagon_nn;
|
||||||
|
void* libhexagon_interface =
|
||||||
|
dlopen("libhexagon_interface.so", RTLD_LAZY | RTLD_LOCAL);
|
||||||
|
if (libhexagon_interface == nullptr) {
|
||||||
|
TFLITE_LOG_PROD(TFLITE_LOG_ERROR, "Failed to load libhexagon_interface.so");
|
||||||
|
return hexagon_nn;
|
||||||
|
}
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_config, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_init, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_prepare, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_set_powersave_level,
|
||||||
|
hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_set_debug_level, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_append_node, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_append_const_node, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_execute, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_execute_new, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_teardown, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_snpprint, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_getlog, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_get_perfinfo, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_reset_perfinfo, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_op_id_to_name, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_global_teardown, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_global_init, hexagon_nn);
|
||||||
|
LOAD_FUNCTION(libhexagon_interface, hexagon_nn_is_device_supported,
|
||||||
|
hexagon_nn);
|
||||||
|
hexagon_nn.interface_loaded = true;
|
||||||
|
return hexagon_nn;
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
// Returns the process-wide HexagonNN interface table, loading
// libhexagon_interface.so on first use. Returns nullptr if the library (or
// any of its symbols) could not be loaded.
const HexagonNN* HexagonNNImplementation() {
  static HexagonNN hexagon_nn = CreateNewHexagonInterface();
  return hexagon_nn.interface_loaded ? &hexagon_nn : nullptr;
}
|
||||||
|
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,137 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_IMPLEMENTATION_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_IMPLEMENTATION_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn_interface.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
// Holds the methods to use to Construct/Execute NN graph using Hexagon NNLib.
// The function pointers are resolved at runtime from libhexagon_interface.so;
// `interface_loaded` indicates whether all of them were bound successfully.
struct HexagonNN {
  // Call this function before creating a graph. It allows the environment on
  // the DSP to configure some settings.
  hexagon_nn_config_fn* hexagon_nn_config;

  // Creates a new graph and returns an identifier to refer to the new graph.
  // After a graph is
  // initialized, nodes can be added to it.
  // The returned graph is empty and cannot be executed until all nodes have
  // been added and the graph is finalized with hexagon_nn_prepare(). Multiple
  // graphs can be created and can be kept alive in the DSP environment
  // simultaneously.
  hexagon_nn_init_fn* hexagon_nn_init;

  // Provides a simple parameter between 0 and 255 to control the power saving
  // mode.
  // A level of 255 indicates that preference should be given to minimizing
  // power consumption. A level of 0 indicates that preference should be given
  // to executing as fast as possible.
  //
  // Returns 0 on success, otherwise failure.
  hexagon_nn_set_powersave_level_fn* hexagon_nn_set_powersave_level;

  // Changes the debug verbosity level for messages.
  hexagon_nn_set_debug_level_fn* hexagon_nn_set_debug_level;

  // Prepares a network for execution.
  // This function is required after all the nodes have been appended and before
  // execution.
  // This call provides a hook where memory can be allocated, data
  // can be rearranged, inputs and outputs can be linked up, and things in the
  // graph can be optimized.
  // Once a network has been prepared, it can no longer
  // be appended to, but it can be executed.
  //
  // Returns 0 on success, otherwise failure.
  hexagon_nn_prepare_fn* hexagon_nn_prepare;

  // Adds an ordinary (non-constant) node to the graph.
  // Non-constant nodes can have zero or more inputs and zero or more outputs.
  // An input is described as a source node ID as well as an output index to
  // refer to which one of several outputs a node may have.
  // An output is described with a maximum size. The true size of an output can
  // be computed dynamically, but the caller must define the maximum amount of
  // data storage required by the output during node creation.
  //
  // Returns 0 on success, otherwise failure.
  hexagon_nn_append_node_fn* hexagon_nn_append_node;

  // Adds constant nodes to a graph.
  // Constant nodes produce a single output that can be connected to one graph
  // node input. Unique node_ids are required for referencing nodes when
  // connecting the graph (for example, specifying which outputs of earlier
  // nodes will be used as inputs to particular subsequent nodes). Node_ids are
  // selected by the caller, but node_id=0 and node_id>0xF0000000 are reserved.
  // Node_ids must be unique.
  // *** NOTE: On SDM835 and older targets,
  // hexagon_nn_append_const_node() will not work properly for arrays larger
  // than 32 MB. Instead, use hexagon_nn_append_empty_const_node_large_array(),
  // which expects the same arguments.
  //
  // Returns 0 on success, otherwise failure.
  hexagon_nn_append_const_node_fn* hexagon_nn_append_const_node;

  // Executes a network, with provided input data and returning output data.
  // Execution will fail if the network has not been prepared.
  // Input is provided to the INPUT node, and output is returned from the OUTPUT
  // node.
  //
  // Returns 0 on success, otherwise failure.
  hexagon_nn_execute_fn* hexagon_nn_execute;

  // Newer version of hexagon_nn_execute that utilizes hexagon_nn_tensordefs to
  // represent inputs & outputs. Executes a network with provided input tensors
  // and returns output tensors. Execution will fail if the network has not
  // been prepared.
  //
  // Returns 0 on success, otherwise failure.
  hexagon_nn_execute_new_fn* hexagon_nn_execute_new;

  // Tears down and frees an NN graph. This can be done at any time after
  // hexagon_nn_init(). After this function has been invoked, the nn_id id is
  // invalid.
  //
  // Returns 0 on success, otherwise failure.
  hexagon_nn_teardown_fn* hexagon_nn_teardown;

  // Writes a textual representation of the graph into a caller-provided
  // buffer (debugging aid; see the NNLib headers for the exact format).
  hexagon_nn_snpprint_fn* hexagon_nn_snpprint;

  // Copies the DSP-side log into a caller-provided buffer (debugging aid).
  hexagon_nn_getlog_fn* hexagon_nn_getlog;

  // Retrieves performance counters recorded for the graph — presumably
  // per-node cycle counts; verify against the NNLib headers.
  hexagon_nn_get_perfinfo_fn* hexagon_nn_get_perfinfo;

  // Resets the performance counters read by hexagon_nn_get_perfinfo.
  hexagon_nn_reset_perfinfo_fn* hexagon_nn_reset_perfinfo;

  // Maps a Hexagon op id to its human-readable name (debugging aid).
  hexagon_nn_op_id_to_name_fn* hexagon_nn_op_id_to_name;

  // Should be called once to shutdown DSP and cleanup.
  hexagon_nn_global_teardown_fn* hexagon_nn_global_teardown;

  // Should be called once to initialize DSP.
  hexagon_nn_global_init_fn* hexagon_nn_global_init;

  // Returns true if the device SoC is supported by hexagon library. False
  // Otherwise.
  hexagon_nn_is_device_supported_fn* hexagon_nn_is_device_supported;

  // True only when every function pointer above was resolved successfully.
  bool interface_loaded = false;
};
|
||||||
|
|
||||||
|
// Returns an instance of HexagonNN.
|
||||||
|
const HexagonNN* HexagonNNImplementation();
|
||||||
|
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_IMPLEMENTATION_H_
|
@ -0,0 +1,31 @@
|
|||||||
|
# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
# ==============================================================================
|
||||||
|
|
||||||
|
package(default_visibility = [
|
||||||
|
"//visibility:public",
|
||||||
|
])
|
||||||
|
|
||||||
|
licenses(["notice"]) # Apache 2.0
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "hexagon_nn_header",
|
||||||
|
hdrs = [
|
||||||
|
"hexagon_nn.h",
|
||||||
|
"hexagon_nn_init.h",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
"@hexagon_nn//:hexagon_nn_header",
|
||||||
|
],
|
||||||
|
)
|
@ -0,0 +1,21 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_HEXAGON_NN_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_HEXAGON_NN_H_
|
||||||
|
|
||||||
|
#include "hexagon/hexagon_nn.h"
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn_init.h"
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_HEXAGON_NN_H_
|
@ -0,0 +1,27 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_HEXAGON_NN_INIT_H_
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_HEXAGON_NN_INIT_H_

#ifdef __cplusplus
extern "C" {
#else
// `bool` is not a builtin type in C (pre-C23); this header declares itself
// C-compatible via the extern "C" guards, so pull it in for the
// hexagon_nn_is_device_supported declaration below.
#include <stdbool.h>
#endif
// Should be called once to shutdown DSP and cleanup.
void hexagon_nn_global_teardown(void);
// Should be called once to initialize DSP before any other hexagon_nn call.
void hexagon_nn_global_init(void);
// Returns true if the device SoC is supported by the hexagon library.
bool hexagon_nn_is_device_supported(void);
#ifdef __cplusplus
}
#endif
#endif  // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_HEXAGON_NN_INIT_H_
|
@ -0,0 +1,25 @@
|
|||||||
|
VERS_1.0 {
|
||||||
|
global:
|
||||||
|
hexagon_nn_config;
|
||||||
|
hexagon_nn_init;
|
||||||
|
hexagon_nn_prepare;
|
||||||
|
hexagon_nn_set_powersave_level;
|
||||||
|
hexagon_nn_set_debug_level;
|
||||||
|
hexagon_nn_append_node;
|
||||||
|
hexagon_nn_append_const_node;
|
||||||
|
hexagon_nn_execute;
|
||||||
|
hexagon_nn_execute_new;
|
||||||
|
hexagon_nn_teardown;
|
||||||
|
hexagon_nn_snpprint;
|
||||||
|
hexagon_nn_getlog;
|
||||||
|
hexagon_nn_get_perfinfo;
|
||||||
|
hexagon_nn_reset_perfinfo;
|
||||||
|
hexagon_nn_op_id_to_name;
|
||||||
|
hexagon_nn_global_teardown;
|
||||||
|
hexagon_nn_global_init;
|
||||||
|
hexagon_nn_is_device_supported;
|
||||||
|
|
||||||
|
# Hide everything else.
|
||||||
|
local:
|
||||||
|
*;
|
||||||
|
};
|
@ -0,0 +1,57 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_INTERFACE_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_INTERFACE_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_nn/hexagon_nn.h"
|
||||||
|
|
||||||
|
// Function types matching each hexagon_nn C API entry point. HexagonNN
// (hexagon_implementation.h) stores pointers to these, resolved at runtime
// from libhexagon_interface.so.
using hexagon_nn_config_fn = decltype(hexagon_nn_config);
using hexagon_nn_init_fn = decltype(hexagon_nn_init);

using hexagon_nn_set_powersave_level_fn =
    decltype(hexagon_nn_set_powersave_level);

using hexagon_nn_set_debug_level_fn = decltype(hexagon_nn_set_debug_level);

using hexagon_nn_prepare_fn = decltype(hexagon_nn_prepare);

using hexagon_nn_append_node_fn = decltype(hexagon_nn_append_node);

using hexagon_nn_append_const_node_fn = decltype(hexagon_nn_append_const_node);

using hexagon_nn_execute_fn = decltype(hexagon_nn_execute);

using hexagon_nn_execute_new_fn = decltype(hexagon_nn_execute_new);

using hexagon_nn_teardown_fn = decltype(hexagon_nn_teardown);

using hexagon_nn_snpprint_fn = decltype(hexagon_nn_snpprint);

using hexagon_nn_getlog_fn = decltype(hexagon_nn_getlog);

using hexagon_nn_get_perfinfo_fn = decltype(hexagon_nn_get_perfinfo);

using hexagon_nn_reset_perfinfo_fn = decltype(hexagon_nn_reset_perfinfo);

using hexagon_nn_op_id_to_name_fn = decltype(hexagon_nn_op_id_to_name);

using hexagon_nn_global_teardown_fn = decltype(hexagon_nn_global_teardown);

using hexagon_nn_global_init_fn = decltype(hexagon_nn_global_init);

using hexagon_nn_is_device_supported_fn =
    decltype(hexagon_nn_is_device_supported);
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_HEXAGON_NN_INTERFACE_H_
|
@ -0,0 +1,11 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<manifest xmlns:android="http://schemas.android.com/apk/res/android"
|
||||||
|
package="org.tensorflow.lite">
|
||||||
|
|
||||||
|
<uses-sdk
|
||||||
|
android:targetSdkVersion="19" />
|
||||||
|
|
||||||
|
<application />
|
||||||
|
|
||||||
|
</manifest>
|
||||||
|
|
62
tensorflow/lite/experimental/delegates/hexagon/java/BUILD
Normal file
62
tensorflow/lite/experimental/delegates/hexagon/java/BUILD
Normal file
@ -0,0 +1,62 @@
|
|||||||
|
load("@build_bazel_rules_android//android:rules.bzl", "android_library")
|
||||||
|
load("//tensorflow/lite:build_def.bzl", "tflite_jni_binary")
|
||||||
|
load("//tensorflow/lite/java:aar_with_jni.bzl", "aar_with_jni")
|
||||||
|
|
||||||
|
package(
|
||||||
|
default_visibility = ["//visibility:public"],
|
||||||
|
licenses = ["notice"], # Apache 2.0
|
||||||
|
)
|
||||||
|
|
||||||
|
# EXPERIMENTAL: Native target that runs inference on the Hexagon backend.
|
||||||
|
# The Hexagon backend-related targets are intentionally not included in BUILD.bazel.
|
||||||
|
tflite_jni_binary(
|
||||||
|
name = "libtensorflowlite_hexagon_jni.so",
|
||||||
|
linkscript = "//tensorflow/lite/experimental/delegates/hexagon:version_script.lds",
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
"notap",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
"//tensorflow/lite/experimental/delegates/hexagon/java/src/main/native",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "tensorflowlite_hexagon",
|
||||||
|
srcs = [
|
||||||
|
"libtensorflowlite_hexagon_jni.so",
|
||||||
|
] + select({
|
||||||
|
"//tensorflow:android_arm64": ["@hexagon_nn//:hexagon/arm64-v8a/libhexagon_interface.so"],
|
||||||
|
"//tensorflow:android_arm": ["@hexagon_nn//:hexagon/armeabi-v7a/libhexagon_interface.so"],
|
||||||
|
"//conditions:default": [],
|
||||||
|
}),
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
"notap",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
android_library(
|
||||||
|
name = "tensorflowlite_java_hexagon",
|
||||||
|
srcs = ["//tensorflow/lite/experimental/delegates/hexagon/java/src/main/java/org/tensorflow/lite/experimental:hexagon_delegate"],
|
||||||
|
manifest = "AndroidManifest.xml",
|
||||||
|
proguard_specs = ["proguard.flags"],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
"notap",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
":tensorflowlite_hexagon",
|
||||||
|
"//tensorflow/lite/java:tensorflowlite_java",
|
||||||
|
"@org_checkerframework_qual",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
aar_with_jni(
|
||||||
|
name = "tensorflow-lite-hexagon",
|
||||||
|
android_library = ":tensorflowlite_java_hexagon",
|
||||||
|
headers = ["//tensorflow/lite/experimental/delegates/hexagon:hexagon_delegate.h"],
|
||||||
|
)
|
@ -0,0 +1,3 @@
|
|||||||
|
-keepclassmembers class org.tensorflow.lite.NativeInterpreterWrapper {
|
||||||
|
private long inferenceDurationNanoseconds;
|
||||||
|
}
|
@ -0,0 +1,7 @@
|
|||||||
|
licenses(["notice"]) # Apache 2.0
|
||||||
|
|
||||||
|
filegroup(
|
||||||
|
name = "hexagon_delegate",
|
||||||
|
srcs = ["HexagonDelegate.java"],
|
||||||
|
visibility = ["//visibility:public"],
|
||||||
|
)
|
@ -0,0 +1,69 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
package org.tensorflow.lite.experimental;
|
||||||
|
|
||||||
|
import android.content.Context;
|
||||||
|
import java.io.Closeable;
|
||||||
|
import org.tensorflow.lite.Delegate;
|
||||||
|
|
||||||
|
/** {@link Delegate} for Hexagon inference. */
public class HexagonDelegate implements Delegate, Closeable {

  // Sentinel native handle value meaning "no delegate" (also used after close()).
  private static final long INVALID_DELEGATE_HANDLE = 0;
  // Name of the JNI library that backs the native methods below.
  private static final String TFLITE_HEXAGON_LIB = "tensorflowlite_hexagon_jni";

  // Native TfLiteDelegate pointer; INVALID_DELEGATE_HANDLE once closed.
  private long delegateHandle;

  /*
   * Creates a new HexagonDelegate object given the current 'context'.
   * Also points the DSP's ADSP_LIBRARY_PATH at the app's native library dir so
   * the Hexagon skel libraries can be found.
   * Throws UnsupportedOperationException if Hexagon DSP delegation is not available
   * on this device.
   */
  public HexagonDelegate(Context context) throws UnsupportedOperationException {
    setAdspLibraryPath(context.getApplicationInfo().nativeLibraryDir);
    delegateHandle = createDelegate();
    if (delegateHandle == INVALID_DELEGATE_HANDLE) {
      throw new UnsupportedOperationException("This Device doesn't support Hexagon DSP execution.");
    }
  }

  @Override
  public long getNativeHandle() {
    return delegateHandle;
  }

  /**
   * Frees TFLite resources in C runtime.
   *
   * <p>User is expected to call this method explicitly. Safe to call more than
   * once; subsequent calls are no-ops.
   */
  @Override
  public void close() {
    if (delegateHandle != INVALID_DELEGATE_HANDLE) {
      deleteDelegate(delegateHandle);
      delegateHandle = INVALID_DELEGATE_HANDLE;
    }
  }

  // Load the JNI library once, when the class is first used.
  static {
    System.loadLibrary(TFLITE_HEXAGON_LIB);
  }

  // Creates the native delegate; returns INVALID_DELEGATE_HANDLE on failure.
  private static native long createDelegate();

  // Destroys the native delegate created by createDelegate().
  private static native void deleteDelegate(long delegateHandle);

  // Sets ADSP_LIBRARY_PATH; returns whether the environment update succeeded.
  private static native boolean setAdspLibraryPath(String libraryPath);
}
|
@ -0,0 +1,25 @@
|
|||||||
|
# Description:
|
||||||
|
# Java Native Interface (JNI) library intended for implementing the
|
||||||
|
# TensorFlow Lite Hexagon delegate Java API using the TensorFlow Lite CC library.
|
||||||
|
|
||||||
|
package(default_visibility = ["//tensorflow/lite/experimental/delegates/hexagon/java:__subpackages__"])
|
||||||
|
|
||||||
|
load("//tensorflow/lite:build_def.bzl", "tflite_copts")
|
||||||
|
|
||||||
|
licenses(["notice"]) # Apache 2.0
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "native",
|
||||||
|
srcs = ["hexagon_delegate_jni.cc"],
|
||||||
|
copts = tflite_copts(),
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
"notap",
|
||||||
|
],
|
||||||
|
deps = [
|
||||||
|
"//tensorflow/lite/experimental/delegates/hexagon:hexagon_delegate",
|
||||||
|
"//tensorflow/lite/java/jni",
|
||||||
|
],
|
||||||
|
alwayslink = 1,
|
||||||
|
)
|
@ -0,0 +1,55 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include <jni.h>
|
||||||
|
|
||||||
|
#include <sstream>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_delegate.h"
|
||||||
|
|
||||||
|
#ifdef __cplusplus
|
||||||
|
extern "C" {
|
||||||
|
#endif
|
||||||
|
|
||||||
|
// JNI entry for HexagonDelegate.createDelegate(). Initializes the Hexagon
// runtime and returns the new TfLiteDelegate pointer as a jlong (0 on
// failure, which the Java side treats as "unsupported device").
JNIEXPORT jlong JNICALL
Java_org_tensorflow_lite_experimental_HexagonDelegate_createDelegate(
    JNIEnv* env, jclass clazz) {
  // Auto-choosing the best performing config for closed release.
  TfLiteHexagonDelegateOptions options = {0};
  TfLiteHexagonInit();
  return reinterpret_cast<jlong>(TfLiteHexagonDelegateCreate(&options));
}
|
||||||
|
|
||||||
|
// JNI entry for HexagonDelegate.deleteDelegate(). Destroys the delegate
// created by createDelegate() and tears down the Hexagon runtime.
JNIEXPORT void JNICALL
Java_org_tensorflow_lite_experimental_HexagonDelegate_deleteDelegate(
    JNIEnv* env, jclass clazz, jlong delegate) {
  TfLiteHexagonDelegateDelete(reinterpret_cast<TfLiteDelegate*>(delegate));
  TfLiteHexagonTearDown();
}
|
||||||
|
|
||||||
|
// JNI entry for HexagonDelegate.setAdspLibraryPath(). Prepends the app's
// native library dir to the standard DSP search locations and exports the
// result as ADSP_LIBRARY_PATH. Returns JNI_TRUE on success.
JNIEXPORT jboolean JNICALL
Java_org_tensorflow_lite_experimental_HexagonDelegate_setAdspLibraryPath(
    JNIEnv* env, jclass clazz, jstring native_lib_path) {
  const char* lib_dir_path = env->GetStringUTFChars(native_lib_path, nullptr);
  // GetStringUTFChars can return nullptr (e.g. out of memory); fail cleanly.
  if (lib_dir_path == nullptr) {
    return JNI_FALSE;
  }
  std::stringstream path;
  path << lib_dir_path
       << ";/system/lib/rfsa/adsp;/system/vendor/lib/rfsa/adsp;/dsp";
  // Release the JNI-owned UTF buffer; the original code leaked it every call.
  env->ReleaseStringUTFChars(native_lib_path, lib_dir_path);
  return setenv("ADSP_LIBRARY_PATH", path.str().c_str(), 1 /*override*/) == 0
             ? JNI_TRUE
             : JNI_FALSE;
}
|
||||||
|
|
||||||
|
#ifdef __cplusplus
|
||||||
|
} // extern "C"
|
||||||
|
#endif // __cplusplus
|
270
tensorflow/lite/experimental/delegates/hexagon/utils.cc
Normal file
270
tensorflow/lite/experimental/delegates/hexagon/utils.cc
Normal file
@ -0,0 +1,270 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/utils.h"
|
||||||
|
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include "tensorflow/lite/builtin_ops.h"
|
||||||
|
#include "tensorflow/lite/c/builtin_op_data.h"
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
#include "tensorflow/lite/kernels/kernel_util.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace {
|
||||||
|
|
||||||
|
// Returns true for the fused activations supported by the Hexagon delegate:
// none or any of the relu family.
bool IsActivationReluOrNone(TfLiteFusedActivation activation) {
  switch (activation) {
    case kTfLiteActNone:
    case kTfLiteActRelu:
    case kTfLiteActRelu6:
    case kTfLiteActRelu1:
      return true;
    default:
      return false;
  }
}
|
||||||
|
|
||||||
|
bool TensorTypeMatch(int tensor_id, TfLiteContext* context,
|
||||||
|
TfLiteType tensor_type) {
|
||||||
|
const auto& tensor = context->tensors[tensor_id];
|
||||||
|
return tensor.type == tensor_type;
|
||||||
|
}
|
||||||
|
|
||||||
|
bool InputsWithCorrectTypes(const TfLiteNode* node, TfLiteContext* context,
|
||||||
|
const std::vector<TfLiteType>& input_types) {
|
||||||
|
if (node->inputs->size != input_types.size()) return false;
|
||||||
|
for (int i = 0; i < input_types.size(); ++i) {
|
||||||
|
if (!TensorTypeMatch(node->inputs->data[i], context, input_types[i]))
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
// Expands `dims` (rank <= 4) into an explicit batch/height/width/depth shape,
// left-padding missing leading dimensions with 1. Returns kTfLiteError when
// `dims` has more than 4 dimensions.
TfLiteStatus Get4DShape(unsigned int* batch_size, unsigned int* height_size,
                        unsigned int* width_size, unsigned int* depth_size,
                        TfLiteIntArray* dims) {
  if (dims->size > 4) return kTfLiteError;
  unsigned int* out_dims[] = {batch_size, height_size, width_size, depth_size};
  const int offset = 4 - dims->size;
  for (int i = 0; i < 4; ++i) {
    // Dimensions before `offset` are implicit leading 1s.
    *out_dims[i] = (i < offset) ? 1u : dims->data[i - offset];
  }
  return kTfLiteOk;
}
|
||||||
|
|
||||||
|
// Returns true if the Hexagon NN library can execute `node` (whose kernel is
// described by `registration`) in the given `context`. This acts as a
// per-op whitelist with op-specific constraints; anything not explicitly
// accepted falls back to the CPU.
bool IsNodeSupportedByHexagon(const TfLiteRegistration* registration,
                              const TfLiteNode* node, TfLiteContext* context) {
  // Ensure all inputs & outputs have dim <= 4.
  int tensor_id;
  for (int i = 0; i < node->inputs->size; ++i) {
    tensor_id = node->inputs->data[i];
    const auto& tensor = context->tensors[tensor_id];
    if (tensor.dims->size > 4) return false;
  }
  for (int i = 0; i < node->outputs->size; ++i) {
    tensor_id = node->outputs->data[i];
    const auto& tensor = context->tensors[tensor_id];
    if (tensor.dims->size > 4) return false;
  }

  // Most hexagon kernels are not compatible with op versions > 1.
  // We maintain a 'whitelist' here to ensure we don't accept unintended nodes.
  if (registration->version > 1) {
    if (registration->builtin_code == kTfLiteBuiltinDepthwiseConv2d &&
        registration->version == 2) {
      return true;
    }
    return false;
  }

  switch (registration->builtin_code) {
    case kTfLiteBuiltinAdd: {
      if (!InputsWithCorrectTypes(node, context, {kTfLiteUInt8, kTfLiteUInt8}))
        return false;
      const TfLiteAddParams* add_params =
          reinterpret_cast<const TfLiteAddParams*>(node->builtin_data);
      return IsActivationReluOrNone(add_params->activation);
    }
    case kTfLiteBuiltinMul: {
      if (!InputsWithCorrectTypes(node, context, {kTfLiteUInt8, kTfLiteUInt8}))
        return false;
      const TfLiteMulParams* mul_params =
          reinterpret_cast<const TfLiteMulParams*>(node->builtin_data);
      // TODO(b/129276536): Add support for activation on Mul node.
      return mul_params->activation == kTfLiteActNone;
    }
    case kTfLiteBuiltinSub: {
      if (!InputsWithCorrectTypes(node, context, {kTfLiteUInt8, kTfLiteUInt8}))
        return false;
      const TfLiteSubParams* sub_params =
          reinterpret_cast<const TfLiteSubParams*>(node->builtin_data);
      return IsActivationReluOrNone(sub_params->activation);
    }
    case kTfLiteBuiltinSum:
    case kTfLiteBuiltinMean: {
      // TODO(b/139277813): Enable these when they pass unit tests. These seem
      // to recompute the output min/max instead of taking them as inputs, which
      // causes an unexpected shift in dequantized values.
      return false;
    }
    case kTfLiteBuiltinPad: {
      // TODO(b/139277813): Currently we only support padding with the default
      // of 0. Add support for user-defined constant if required.
      return (
          node->inputs->size == 2 &&
          InputsWithCorrectTypes(node, context, {kTfLiteUInt8, kTfLiteInt32}) &&
          IsConstantTensor(&context->tensors[node->inputs->data[1]]));
    }
    case kTfLiteBuiltinFullyConnected: {
      if (!InputsWithCorrectTypes(node, context,
                                  {kTfLiteUInt8, kTfLiteUInt8, kTfLiteInt32}))
        return false;
      const TfLiteFullyConnectedParams* matmul_params =
          reinterpret_cast<const TfLiteFullyConnectedParams*>(
              node->builtin_data);
      return (IsActivationReluOrNone(matmul_params->activation) &&
              matmul_params->keep_num_dims == false &&
              matmul_params->weights_format ==
                  kTfLiteFullyConnectedWeightsFormatDefault);
    }
    case kTfLiteBuiltinConcatenation: {
      // All concatenated tensors must be Uint8 type.
      for (int i = 0; i < node->inputs->size; ++i) {
        if (!TensorTypeMatch(node->inputs->data[i], context, kTfLiteUInt8))
          return false;
      }
      // Hexagon only supports concatenation at axis 3.
      const TfLiteConcatenationParams* concat_params =
          reinterpret_cast<const TfLiteConcatenationParams*>(
              node->builtin_data);
      return (concat_params->axis == 3);
    }
    case kTfLiteBuiltinMaxPool2d: {
      if (!InputsWithCorrectTypes(node, context, {kTfLiteUInt8})) return false;
      // TODO(b/129276536): Add support for activation here.
      const TfLitePoolParams* pool_params =
          reinterpret_cast<const TfLitePoolParams*>(node->builtin_data);
      return pool_params->activation == kTfLiteActNone;
    }
    case kTfLiteBuiltinAveragePool2d: {
      if (!InputsWithCorrectTypes(node, context, {kTfLiteUInt8})) return false;
      // AvgPool works fine for filter dim <=7.
      const TfLitePoolParams* pool_params =
          reinterpret_cast<const TfLitePoolParams*>(node->builtin_data);
      return (node->inputs->size == 1 &&
              pool_params->activation == kTfLiteActNone);
    }
    case kTfLiteBuiltinTransposeConv: {
      if (!InputsWithCorrectTypes(node, context,
                                  {kTfLiteInt32, kTfLiteUInt8, kTfLiteUInt8}))
        return false;
      const TfLiteTransposeConvParams* params =
          reinterpret_cast<const TfLiteTransposeConvParams*>(
              node->builtin_data);
      // Strides above 3 are not supported by the Hexagon kernel.
      return (params->stride_height <= 3 && params->stride_width <= 3 &&
              (params->padding == kTfLitePaddingSame ||
               params->padding == kTfLitePaddingValid));
    }
    case kTfLiteBuiltinConv2d: {
      if (!InputsWithCorrectTypes(node, context,
                                  {kTfLiteUInt8, kTfLiteUInt8, kTfLiteInt32}))
        return false;
      const TfLiteConvParams* conv_params =
          reinterpret_cast<const TfLiteConvParams*>(node->builtin_data);
      // Dilated convolution is not supported; strides are capped at 3.
      return (IsActivationReluOrNone(conv_params->activation) &&
              conv_params->stride_height <= 3 &&
              conv_params->stride_width <= 3 &&
              conv_params->dilation_height_factor == 1 &&
              conv_params->dilation_width_factor == 1);
    }
    case kTfLiteBuiltinDepthwiseConv2d: {
      if (!InputsWithCorrectTypes(node, context,
                                  {kTfLiteUInt8, kTfLiteUInt8, kTfLiteInt32}))
        return false;
      // Hexagon only supports width of 3 for Depthwise Conv.
      const auto& tensor = context->tensors[node->inputs->data[1]];
      if (tensor.dims->data[2] != 3) return false;
      const TfLiteDepthwiseConvParams* conv_params =
          reinterpret_cast<const TfLiteDepthwiseConvParams*>(
              node->builtin_data);
      const bool dilation = conv_params->dilation_height_factor != 1 ||
                            conv_params->dilation_width_factor != 1;
      if (dilation) {
        // We only support dilations when stride == 1.
        if (conv_params->stride_height != 1 || conv_params->stride_width != 1)
          return false;
      }
      return (IsActivationReluOrNone(conv_params->activation) &&
              conv_params->stride_height <= 3 &&
              conv_params->stride_width <= 3 &&
              conv_params->depth_multiplier == 1);
    }
    case kTfLiteBuiltinReshape: {
      // Accept either a single input (shape in builtin params) or an
      // additional shape tensor; only the data tensor's type is checked.
      if (node->inputs->size > 2 ||
          !TensorTypeMatch(node->inputs->data[0], context, kTfLiteUInt8))
        return false;
      return true;
    }
    case kTfLiteBuiltinSoftmax:
    case kTfLiteBuiltinRelu:
    case kTfLiteBuiltinRelu6:
    case kTfLiteBuiltinTanh:
    case kTfLiteBuiltinLogistic: {
      return InputsWithCorrectTypes(node, context, {kTfLiteUInt8});
    }
    case kTfLiteBuiltinResizeNearestNeighbor: {
      return InputsWithCorrectTypes(node, context,
                                    {kTfLiteUInt8, kTfLiteInt32});
    }
    case kTfLiteBuiltinL2Normalization: {
      if (!InputsWithCorrectTypes(node, context, {kTfLiteUInt8})) return false;
      const TfLiteL2NormParams* norm_params =
          reinterpret_cast<const TfLiteL2NormParams*>(node->builtin_data);
      return (norm_params->activation == kTfLiteActNone);
    }
    case kTfLiteBuiltinArgMax:
    case kTfLiteBuiltinArgMin:
      return InputsWithCorrectTypes(node, context,
                                    {kTfLiteUInt8, kTfLiteInt32});
    case kTfLiteBuiltinSplit: {
      if (!InputsWithCorrectTypes(node, context, {kTfLiteInt32, kTfLiteUInt8}))
        return false;
      const auto& input_tensor = context->tensors[node->inputs->data[1]];
      const bool is_four_dim_or_less = input_tensor.dims->size < 5;
      // We need splitting axis to be constant, so Hexagon knows output shapes.
      return is_four_dim_or_less &&
             IsConstantTensor(&context->tensors[node->inputs->data[0]]);
    }
    case kTfLiteBuiltinResizeBilinear: {
      if (!InputsWithCorrectTypes(node, context,
                                  {kTfLiteUInt8, kTfLiteInt32}) ||
          !IsConstantTensor(&context->tensors[node->inputs->data[1]])) {
        return false;
      }
      const auto& size_tensor = context->tensors[node->inputs->data[1]];
      // TODO(b/143105433): Latency increase significantly with large size
      // value. Limiting to 65 for now.
      return NumElements(&size_tensor) == 2 && size_tensor.data.i32[0] < 66 &&
             size_tensor.data.i32[1] < 66;
    }
    case kTfLiteBuiltinNeg: {
      return InputsWithCorrectTypes(node, context, {kTfLiteUInt8});
    }
    case kTfLiteBuiltinTranspose: {
      return InputsWithCorrectTypes(node, context,
                                    {kTfLiteUInt8, kTfLiteInt32});
    }
    default:
      return false;
  }
  return false;
}
|
||||||
|
|
||||||
|
} // namespace tflite
|
38
tensorflow/lite/experimental/delegates/hexagon/utils.h
Normal file
38
tensorflow/lite/experimental/delegates/hexagon/utils.h
Normal file
@ -0,0 +1,38 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#ifndef TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_UTILS_H_
|
||||||
|
#define TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_UTILS_H_
|
||||||
|
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
|
||||||
|
// Interpretes data from 'dims' as a 4D shape {batch, height, width, depth} and
|
||||||
|
// populates the corresponding values. If dims->size < 4, the shape is prefixed
|
||||||
|
// with 1s.
|
||||||
|
// For example, dims {2, 3} is interpreted as: {1, 1, 2, 3}.
|
||||||
|
// Returns kTfLiteError if dims->size > 4, kTfLiteOk otherwise.
|
||||||
|
TfLiteStatus Get4DShape(unsigned int* batch_size, unsigned int* height_size,
|
||||||
|
unsigned int* width_size, unsigned int* depth_size,
|
||||||
|
TfLiteIntArray* dims);
|
||||||
|
|
||||||
|
// Returns true if provided node is supported by Hexagon NNLib in the current
|
||||||
|
// context.
|
||||||
|
bool IsNodeSupportedByHexagon(const TfLiteRegistration* registration,
|
||||||
|
const TfLiteNode* node, TfLiteContext* context);
|
||||||
|
|
||||||
|
} // namespace tflite
|
||||||
|
|
||||||
|
#endif // TENSORFLOW_LITE_EXPERIMENTAL_DELEGATES_HEXAGON_UTILS_H_
|
71
tensorflow/lite/experimental/delegates/hexagon/utils_test.cc
Normal file
71
tensorflow/lite/experimental/delegates/hexagon/utils_test.cc
Normal file
@ -0,0 +1,71 @@
|
|||||||
|
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
|
||||||
|
Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
you may not use this file except in compliance with the License.
|
||||||
|
You may obtain a copy of the License at
|
||||||
|
|
||||||
|
http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
|
||||||
|
Unless required by applicable law or agreed to in writing, software
|
||||||
|
distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
See the License for the specific language governing permissions and
|
||||||
|
limitations under the License.
|
||||||
|
==============================================================================*/
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/utils.h"
|
||||||
|
|
||||||
|
#include <string>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
#include <gtest/gtest.h>
|
||||||
|
#include "tensorflow/lite/c/common.h"
|
||||||
|
|
||||||
|
namespace tflite {
|
||||||
|
namespace {
|
||||||
|
|
||||||
|
// Verifies that a full 4D shape is copied through unchanged, in
// {batch, height, width, depth} order.
TEST(UtilsTest, Get4DShapeTest_4DInput) {
  unsigned int batch_dim, height_dim, width_dim, depth_dim;
  TfLiteIntArray* shape_4d = TfLiteIntArrayCreate(4);
  shape_4d->data[0] = 4;
  shape_4d->data[1] = 3;
  shape_4d->data[2] = 2;
  shape_4d->data[3] = 1;
  EXPECT_EQ(
      Get4DShape(&batch_dim, &height_dim, &width_dim, &depth_dim, shape_4d),
      kTfLiteOk);
  EXPECT_EQ(batch_dim, shape_4d->data[0]);
  EXPECT_EQ(height_dim, shape_4d->data[1]);
  EXPECT_EQ(width_dim, shape_4d->data[2]);
  EXPECT_EQ(depth_dim, shape_4d->data[3]);

  TfLiteIntArrayFree(shape_4d);
}
|
||||||
|
|
||||||
|
// Verifies that a 2D shape is left-padded with 1s: {4, 3} -> {1, 1, 4, 3}.
TEST(UtilsTest, Get4DShapeTest_2DInput) {
  unsigned int batch_dim, height_dim, width_dim, depth_dim;
  TfLiteIntArray* shape_2d = TfLiteIntArrayCreate(2);
  shape_2d->data[0] = 4;
  shape_2d->data[1] = 3;
  EXPECT_EQ(
      Get4DShape(&batch_dim, &height_dim, &width_dim, &depth_dim, shape_2d),
      kTfLiteOk);
  EXPECT_EQ(batch_dim, 1);
  EXPECT_EQ(height_dim, 1);
  EXPECT_EQ(width_dim, shape_2d->data[0]);
  EXPECT_EQ(depth_dim, shape_2d->data[1]);

  TfLiteIntArrayFree(shape_2d);
}
|
||||||
|
|
||||||
|
// Verifies that a shape with more than 4 dimensions is rejected with
// kTfLiteError.
TEST(UtilsTest, Get4DShapeTest_5DInput) {
  unsigned int batch_dim, height_dim, width_dim, depth_dim;
  TfLiteIntArray* shape_5d = TfLiteIntArrayCreate(5);
  EXPECT_EQ(
      Get4DShape(&batch_dim, &height_dim, &width_dim, &depth_dim, shape_5d),
      kTfLiteError);

  TfLiteIntArrayFree(shape_5d);
}
|
||||||
|
|
||||||
|
} // namespace
|
||||||
|
} // namespace tflite
|
@ -0,0 +1,13 @@
|
|||||||
|
VERS_1.0 {
|
||||||
|
# Export JNI symbols.
|
||||||
|
global:
|
||||||
|
Java_*;
|
||||||
|
JNI_OnLoad;
|
||||||
|
JNI_OnUnload;
|
||||||
|
# TODO(b/138605512): Remove this and build separate .so for c++ api ?
|
||||||
|
TfLiteHexagon*;
|
||||||
|
|
||||||
|
# Hide everything else.
|
||||||
|
local:
|
||||||
|
*;
|
||||||
|
};
|
265
tensorflow/lite/g3doc/performance/hexagon_delegate.md
Normal file
265
tensorflow/lite/g3doc/performance/hexagon_delegate.md
Normal file
@ -0,0 +1,265 @@
|
|||||||
|
## Tensorflow Lite Hexagon Delegate Quick Guide
|
||||||
|
|
||||||
|
[TOC]
|
||||||
|
|
||||||
|
This document explains how to use the Tensorflow Lite Hexagon Delegate in your
|
||||||
|
application using the Java and/or C API. The delegate leverages the Qualcomm
|
||||||
|
Hexagon library to execute quantized kernels on the DSP. Note that the delegate
|
||||||
|
is intended to *complement* NNAPI functionality, particularly for devices where
|
||||||
|
NNAPI DSP acceleration is unavailable (e.g., on older devices, or devices that
|
||||||
|
don’t yet have a DSP NNAPI driver). Note: This delegate is in experimental
|
||||||
|
(beta) phase.
|
||||||
|
|
||||||
|
**Supported devices:**
|
||||||
|
|
||||||
|
Currently most
|
||||||
|
[Qualcomm SoCs](https://en.wikipedia.org/wiki/List_of_Qualcomm_Snapdragon_systems-on-chip)
|
||||||
|
are supported, including:
|
||||||
|
|
||||||
|
* Snapdragon 835 (682 DSP)
|
||||||
|
* Snapdragon 660/820/821 (680 DSP)
|
||||||
|
* Snapdragon 710/845 (685 DSP)
|
||||||
|
* Snapdragon 8150/855 (690 DSP)
|
||||||
|
|
||||||
|
|
||||||
|
**Supported models:**
|
||||||
|
|
||||||
|
The Hexagon delegate currently supports quantized models generated using
|
||||||
|
[quantization-aware training](https://github.com/tensorflow/tensorflow/tree/r1.13/tensorflow/contrib/quantize),
|
||||||
|
e.g.,
|
||||||
|
[these quantized models](https://www.tensorflow.org/lite/guide/hosted_models#quantized_models)
|
||||||
|
hosted on the TensorFlow Lite repo. It does not (yet) support models with
|
||||||
|
[8-bit symmetric quantization spec](https://www.tensorflow.org/lite/performance/quantization_spec).
|
||||||
|
Sample models include
|
||||||
|
[MobileNet V1](https://storage.googleapis.com/download.tensorflow.org/models/mobilenet_v1_2018_08_02/mobilenet_v1_1.0_224_quant.tgz),
|
||||||
|
[SSD Mobilenet](https://storage.googleapis.com/download.tensorflow.org/models/tflite/coco_ssd_mobilenet_v1_1.0_quant_2018_06_29.zip).
|
||||||
|
|
||||||
|
## Hexagon Delegate Java API {#hexagon-delegate-java-api}
|
||||||
|
|
||||||
|
```
|
||||||
|
public class HexagonDelegate implements Delegate, Closeable {
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Creates a new HexagonDelegate object given the current 'context'.
|
||||||
|
* Throws UnsupportedOperationException if Hexagon DSP delegation is not
|
||||||
|
* available on this device.
|
||||||
|
*/
|
||||||
|
public HexagonDelegate(Context context) throws UnsupportedOperationException
|
||||||
|
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Frees TFLite resources in C runtime.
|
||||||
|
*
|
||||||
|
* User is expected to call this method explicitly.
|
||||||
|
*/
|
||||||
|
@Override
|
||||||
|
public void close();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
## Example Usage from Java {#example-usage-from-java}
|
||||||
|
|
||||||
|
1. Add the ‘tensorflow-lite-hexagon.aar’ to your app - this is in addition to
|
||||||
|
the standard tensorflow-lite AAR (nightly or release).
|
||||||
|
[Relevant instructions](https://stackoverflow.com/questions/16682847/how-to-manually-include-external-aar-package-using-new-gradle-android-build-syst).
|
||||||
|
1. Run “hexagon_nn_skel.run” - Note: you will need to accept the license
|
||||||
|
agreement. It should provide 3 different shared libraries
|
||||||
|
“libhexagon_nn_skel.so”, “libhexagon_nn_skel_v65.so”,
|
||||||
|
“libhexagon_nn_skel_v66.so” \
|
||||||
|
Include all 3 in your app with other shared libraries. See
|
||||||
|
[How to add shared library to your app](#how-to-add-shared-library-to-your-app)
|
||||||
|
\
|
||||||
|
The delegate will automatically pick the one with best performance depending
|
||||||
|
on the device. \
|
||||||
|
Note: If your app will be built for both 32 and 64-bit ARM devices, then you
|
||||||
|
will need to add the hexagon shared libs to both 32 and 64-bit lib folders.
|
||||||
|
|
||||||
|
1. Create a delegate, example:
|
||||||
|
|
||||||
|
```
|
||||||
|
import org.tensorflow.lite.experimental.HexagonDelegate;
|
||||||
|
|
||||||
|
// Create the Delegate instance.
|
||||||
|
try {
|
||||||
|
hexagonDelegate = new HexagonDelegate(activity);
|
||||||
|
tfliteOptions.addDelegate(hexagonDelegate);
|
||||||
|
} catch (UnsupportedOperationException e) {
|
||||||
|
// Hexagon delegate is not supported on this device.
|
||||||
|
}
|
||||||
|
|
||||||
|
tfliteInterpreter = new Interpreter(tfliteModel, tfliteOptions);
|
||||||
|
|
||||||
|
// Dispose after finished with inference.
|
||||||
|
tfliteInterpreter.close();
|
||||||
|
if (hexagonDelegate != null) {
|
||||||
|
hexagonDelegate.close();
|
||||||
|
}
|
||||||
|
```
|
||||||
|
|
||||||
|
## Hexagon Delegate C API {#hexagon-delegate-c-api}
|
||||||
|
|
||||||
|
```
|
||||||
|
struct TfLiteHexagonDelegateOptions {
|
||||||
|
// This corresponds to the debug level in the hexagon SDK. 0 (default)
|
||||||
|
// means no debug.
|
||||||
|
int debug_level;
|
||||||
|
// This corresponds to powersave_level in the hexagon SDK.
|
||||||
|
// where 0 (default) means high performance which means more power
|
||||||
|
// consumption.
|
||||||
|
int powersave_level;
|
||||||
|
// If set to true, performance information about the graph will be dumped
|
||||||
|
// to Standard output, this includes cpu cycles.
|
||||||
|
// WARNING: Experimental and subject to change anytime.
|
||||||
|
bool print_graph_profile;
|
||||||
|
// If set to true, graph structure will be dumped to Standard output.
|
||||||
|
// This is usually beneficial to see what actual nodes executed on
|
||||||
|
// the DSP. Combining with 'debug_level' more information will be printed.
|
||||||
|
// WARNING: Experimental and subject to change anytime.
|
||||||
|
bool print_graph_debug;
|
||||||
|
};
|
||||||
|
|
||||||
|
// Return a delegate that uses Hexagon SDK for ops execution.
|
||||||
|
// Must outlive the interpreter.
|
||||||
|
TfLiteDelegate*
|
||||||
|
TfLiteHexagonDelegateCreate(const TfLiteHexagonDelegateOptions* options);
|
||||||
|
|
||||||
|
// Do any needed cleanup and delete 'delegate'.
|
||||||
|
void TfLiteHexagonDelegateDelete(TfLiteDelegate* delegate);
|
||||||
|
|
||||||
|
// Initializes the DSP connection.
|
||||||
|
// This should be called before doing any usage of the delegate.
|
||||||
|
// "lib_directory_path": Path to the directory which holds the
|
||||||
|
// shared libraries for the Hexagon NN libraries on the device.
|
||||||
|
void TfLiteHexagonInitWithPath(const char* lib_directory_path);
|
||||||
|
|
||||||
|
// Same as above method but doesn't accept the path params.
|
||||||
|
// Assumes the environment setup is already done. Only initialize Hexagon.
|
||||||
|
void TfLiteHexagonInit();
|
||||||
|
|
||||||
|
// Clean up and switch off the DSP connection.
|
||||||
|
// This should be called after all processing is done and delegate is deleted.
|
||||||
|
void TfLiteHexagonTearDown();
|
||||||
|
```
|
||||||
|
|
||||||
|
## Example Usage from C {#example-usage-from-c}
|
||||||
|
|
||||||
|
1. Add the ‘tensorflow-lite-hexagon.aar’ to your app - this is in addition to
|
||||||
|
the standard tensorflow-lite AAR (nightly or release).
|
||||||
|
[Relevant instructions](https://stackoverflow.com/questions/16682847/how-to-manually-include-external-aar-package-using-new-gradle-android-build-syst).
|
||||||
|
1. Include the provided hexagon_delegate.h
|
||||||
|
1. Run “hexagon_nn_skel.run” - Note: you will need to accept the license
|
||||||
|
agreement. It should provide 3 different shared libraries \
|
||||||
|
“libhexagon_nn_skel.so”, “libhexagon_nn_skel_v65.so”,
|
||||||
|
“libhexagon_nn_skel_v66.so” \
|
||||||
|
Include all 3 in your app with other shared libraries. See How to add shared
|
||||||
|
library to your app. \
|
||||||
|
The delegate will automatically pick the one with best performance depending
|
||||||
|
on the device. \
|
||||||
|
Note: If your app will be built for both 32 and 64-bit ARM devices, then you
|
||||||
|
will need to add the hexagon shared libs to both 32 and 64-bit lib folders.
|
||||||
|
|
||||||
|
1. In your code, ensure the native Hexagon library is loaded. This can be done
|
||||||
|
by calling `System.loadLibrary("tensorflowlite_hexagon_jni");` \
|
||||||
|
in your Activity or Java entry-point.
|
||||||
|
|
||||||
|
1. Create a delegate, example:
|
||||||
|
|
||||||
|
```
|
||||||
|
#include "tensorflow/lite/experimental/delegates/hexagon/hexagon_delegate.h"
|
||||||
|
|
||||||
|
// Assuming shared libraries are under "/data/local/tmp/"
|
||||||
|
// If files are packaged with native lib in android App then it
|
||||||
|
// will typically be equivalent to the path provided by
|
||||||
|
// "getContext().getApplicationInfo().nativeLibraryDir"
|
||||||
|
const char[] library_directory_path = "/data/local/tmp/";
|
||||||
|
TfLiteHexagonInitWithPath(library_directory_path); // Needed once at startup.
|
||||||
|
::tflite::TfLiteHexagonDelegateOptions params = {0};
|
||||||
|
// 'delegate_ptr' Need to outlive the interpreter. For example,
|
||||||
|
// If use case will need to resize input or anything that can trigger
|
||||||
|
// re-applying delegates then 'delegate_ptr' need to outlive the interpreter.
|
||||||
|
auto* delegate_ptr = ::tflite::TfLiteHexagonDelegateCreate(&params);
|
||||||
|
Interpreter::TfLiteDelegatePtr delegate(delegate_ptr,
|
||||||
|
[](TfLiteDelegate* delegate) {
|
||||||
|
::tflite::TfLiteHexagonDelegateDelete(delegate);
|
||||||
|
});
|
||||||
|
interpreter->ModifyGraphWithDelegate(delegate.get());
|
||||||
|
// After usage of delegate.
|
||||||
|
TfLiteHexagonTearDown(); // Needed once at end of app/DSP usage.
|
||||||
|
```
|
||||||
|
|
||||||
|
## How to add shared library to your app {#how-to-add-shared-library-to-your-app}
|
||||||
|
|
||||||
|
Create folder “app/src/main/jniLibs”, then for each target architecture create a
|
||||||
|
directory.
|
||||||
|
|
||||||
|
For example,
|
||||||
|
|
||||||
|
Arm64 bit: “app/src/main/jniLibs/arm64-v8a”
|
||||||
|
|
||||||
|
Arm32 bit: “app/src/main/jniLibs/armeabi-v7a”
|
||||||
|
|
||||||
|
Put your .so in the directory that match the architecture.
|
||||||
|
|
||||||
|
## Feedback {#feedback}
|
||||||
|
|
||||||
|
For issues, please create a
|
||||||
|
[github](https://github.com/tensorflow/tensorflow/issues/new?template=50-other-issues.md)
|
||||||
|
issue with all the necessary repro details, including the phone model and board
|
||||||
|
used (`adb shell getprop ro.product.device` and `adb shell getprop
|
||||||
|
ro.board.platform`).
|
||||||
|
|
||||||
|
## FAQ {#faq}
|
||||||
|
|
||||||
|
* Will the delegate support models created using
|
||||||
|
[post-training quantization](https://www.tensorflow.org/lite/performance/post_training_quantization)?
|
||||||
|
* This is tentatively planned for a future release, though there is no
|
||||||
|
concrete timeline.
|
||||||
|
* Which ops are supported by the delegate?
|
||||||
|
* Initial Dogfood list of supported ops:
|
||||||
|
* Add
|
||||||
|
* ArgMax
|
||||||
|
* ArgMin
|
||||||
|
* AveragePool2D:
|
||||||
|
* Constraints:
|
||||||
|
* No Activation
|
||||||
|
* Concat
|
||||||
|
* Conv2D:
|
||||||
|
* Constraints:
|
||||||
|
* stride width/height <= 3
|
||||||
|
* DepthwiseConv2D:
|
||||||
|
* Constraints:
|
||||||
|
* Filter width == 3
|
||||||
|
* depth_multiplier == 1
|
||||||
|
* dilation only supported when stride == 1
|
||||||
|
* Otherwise, stride height/width <= 3
|
||||||
|
* FullyConnected (without any activation)
|
||||||
|
* L2Normalization (without any activation)
|
||||||
|
* Logistic (aka Sigmoid)
|
||||||
|
* MaxPool2D (without any activation)
|
||||||
|
* Mul (without any activation)
|
||||||
|
* Neg
|
||||||
|
* Pad: Only supports 0 padding
|
||||||
|
* Relu
|
||||||
|
* Relu6
|
||||||
|
* Reshape
|
||||||
|
* Resize Bilinear:
|
||||||
|
* Constraints:
|
||||||
|
* Requested size <= 65
|
||||||
|
* Resize Nearest Neighbor
|
||||||
|
* SoftMax
|
||||||
|
* Split
|
||||||
|
* Sub
|
||||||
|
* Tanh
|
||||||
|
* Transpose
|
||||||
|
* TransposeConv2D:
|
||||||
|
* Constraints:
|
||||||
|
* stride height/width <= 3
|
||||||
|
* dilation height/width == 1
|
||||||
|
* How can I tell that the model is using the DSP when I enable the delegate?
|
||||||
|
* A log message will be printed whether delegate created or not, and
|
||||||
|
another one with how many nodes are running using the delegate. \
|
||||||
|
"Created TensorFlow Lite delegate for Hexagon." \
|
||||||
|
"Hexagon delegate: X nodes delegated out of Y nodes."
|
||||||
|
* Do I need all Ops in the model to be supported to run the delegate ?
|
||||||
|
* No, the Model will be partitioned into subgraphs based on the supported
|
||||||
|
ops. Any unsupported ops will run on the CPU.
|
@ -27,6 +27,7 @@ load("//third_party/aws:workspace.bzl", aws = "repo")
|
|||||||
load("//third_party/clog:workspace.bzl", clog = "repo")
|
load("//third_party/clog:workspace.bzl", clog = "repo")
|
||||||
load("//third_party/cpuinfo:workspace.bzl", cpuinfo = "repo")
|
load("//third_party/cpuinfo:workspace.bzl", cpuinfo = "repo")
|
||||||
load("//third_party/flatbuffers:workspace.bzl", flatbuffers = "repo")
|
load("//third_party/flatbuffers:workspace.bzl", flatbuffers = "repo")
|
||||||
|
load("//third_party/hexagon:workspace.bzl", hexagon_nn = "repo")
|
||||||
load("//third_party/highwayhash:workspace.bzl", highwayhash = "repo")
|
load("//third_party/highwayhash:workspace.bzl", highwayhash = "repo")
|
||||||
load("//third_party/hwloc:workspace.bzl", hwloc = "repo")
|
load("//third_party/hwloc:workspace.bzl", hwloc = "repo")
|
||||||
load("//third_party/icu:workspace.bzl", icu = "repo")
|
load("//third_party/icu:workspace.bzl", icu = "repo")
|
||||||
@ -46,6 +47,7 @@ def initialize_third_party():
|
|||||||
clog()
|
clog()
|
||||||
cpuinfo()
|
cpuinfo()
|
||||||
flatbuffers()
|
flatbuffers()
|
||||||
|
hexagon_nn()
|
||||||
highwayhash()
|
highwayhash()
|
||||||
hwloc()
|
hwloc()
|
||||||
icu()
|
icu()
|
||||||
|
48
third_party/hexagon/BUILD
vendored
Normal file
48
third_party/hexagon/BUILD
vendored
Normal file
@ -0,0 +1,48 @@
|
|||||||
|
# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
||||||
|
#
|
||||||
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||||
|
# you may not use this file except in compliance with the License.
|
||||||
|
# You may obtain a copy of the License at
|
||||||
|
#
|
||||||
|
# http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
#
|
||||||
|
# Unless required by applicable law or agreed to in writing, software
|
||||||
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
# See the License for the specific language governing permissions and
|
||||||
|
# limitations under the License.
|
||||||
|
# ==============================================================================
|
||||||
|
|
||||||
|
package(default_visibility = [
|
||||||
|
"//visibility:public",
|
||||||
|
])
|
||||||
|
|
||||||
|
licenses([
|
||||||
|
"notice", # BSD-3-Clause-Clear
|
||||||
|
])
|
||||||
|
|
||||||
|
exports_files(glob(["hexagon/**/*.so"]))
|
||||||
|
|
||||||
|
#Just header file, needed for data types in the interface.
|
||||||
|
cc_library(
|
||||||
|
name = "hexagon_nn_header",
|
||||||
|
hdrs = [
|
||||||
|
"hexagon/hexagon_nn.h",
|
||||||
|
],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
)
|
||||||
|
|
||||||
|
cc_library(
|
||||||
|
name = "hexagon_nn_ops",
|
||||||
|
hdrs = [
|
||||||
|
"hexagon/hexagon_nn_ops.h",
|
||||||
|
"hexagon/ops.def",
|
||||||
|
],
|
||||||
|
tags = [
|
||||||
|
"manual",
|
||||||
|
"nobuilder",
|
||||||
|
],
|
||||||
|
)
|
35
third_party/hexagon/LICENSE
vendored
Normal file
35
third_party/hexagon/LICENSE
vendored
Normal file
@ -0,0 +1,35 @@
|
|||||||
|
|
||||||
|
/*
|
||||||
|
* Copyright (c) 2016-2019, The Linux Foundation. All rights reserved.
|
||||||
|
*
|
||||||
|
* Redistribution and use in source and binary forms, with or without
|
||||||
|
* modification, are permitted (subject to the limitations in the
|
||||||
|
* disclaimer below) provided that the following conditions are met:
|
||||||
|
*
|
||||||
|
* * Redistributions of source code must retain the above copyright
|
||||||
|
* notice, this list of conditions and the following disclaimer.
|
||||||
|
*
|
||||||
|
* * Redistributions in binary form must reproduce the above
|
||||||
|
* copyright notice, this list of conditions and the following
|
||||||
|
* disclaimer in the documentation and/or other materials provided
|
||||||
|
* with the distribution.
|
||||||
|
*
|
||||||
|
* * Neither the name of The Linux Foundation nor the names of its
|
||||||
|
* contributors may be used to endorse or promote products derived
|
||||||
|
* from this software without specific prior written permission.
|
||||||
|
*
|
||||||
|
* NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
|
||||||
|
* GRANTED BY THIS LICENSE. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
|
||||||
|
* HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED
|
||||||
|
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
|
||||||
|
* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
|
||||||
|
* IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
|
||||||
|
* ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
||||||
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE
|
||||||
|
* GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||||||
|
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
|
||||||
|
* IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
|
||||||
|
* OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
|
||||||
|
* IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
*
|
||||||
|
*/
|
13
third_party/hexagon/workspace.bzl
vendored
Normal file
13
third_party/hexagon/workspace.bzl
vendored
Normal file
@ -0,0 +1,13 @@
|
|||||||
|
"""Loads the Hexagon NN Header files library, used by TF Lite."""
|
||||||
|
|
||||||
|
load("//third_party:repo.bzl", "third_party_http_archive")
|
||||||
|
|
||||||
|
def repo():
|
||||||
|
third_party_http_archive(
|
||||||
|
name = "hexagon_nn",
|
||||||
|
sha256 = "e972f86eb8bcfb1ee93ff3dc7aa4518948e3941b5ea0945f5c9307b2d3334225",
|
||||||
|
urls = [
|
||||||
|
"http://mirror.tensorflow.org/storage.cloud.google.com/download.tensorflow.org/tflite/hexagon_nn_headers_v1.10.3.1.0.tgz",
|
||||||
|
],
|
||||||
|
build_file = "//third_party/hexagon:BUILD",
|
||||||
|
)
|
Loading…
Reference in New Issue
Block a user