Add utility functions for integration. This supports the calibration case in which the model is initialized multiple times.

(1) quantization_wrapper is the external interface to help calibration and quantization. The interface uses only strings and bools, so the dependencies are minimal. It has two functions: - CreateModelForCalibration copies a model to a new location and adds intermediate tensors if any of the ops need them. - CreateQuantizedModel quantizes a model in place. (2) quantization_wrapper_utils provides the helper functions for quantization_wrapper: - added a function to load a model - added a function to write a model PiperOrigin-RevId: 280510873 Change-Id: I58891d6e8d6d3b485242f321466ac91ce2fdffda
2019-11-14 14:16:04 -08:00 · 2019-11-14 14:16:04 -08:00 · fa0fb0d4f6
commit fa0fb0d4f6
parent dd6f51d33b
6 changed files with 148 additions and 12 deletions
--- a/tensorflow/lite/tools/optimize/BUILD
+++ b/tensorflow/lite/tools/optimize/BUILD
@ -13,9 +13,9 @@ exports_files(glob([
 ]))
 cc_library(
-    name = "add_intermediate_tensors",
+    name = "quantization_wrapper_utils",
-    srcs = ["add_intermediate_tensors.cc"],
+    srcs = ["quantization_wrapper_utils.cc"],
-    hdrs = ["add_intermediate_tensors.h"],
+    hdrs = ["quantization_wrapper_utils.h"],
    deps = [
        ":operator_property",
        "//tensorflow/lite:framework",
@ -26,14 +26,14 @@ cc_library(
 )
 tf_cc_test(
-    name = "add_intermediate_tensors_test",
+    name = "quantization_wrapper_utils_test",
-    srcs = ["add_intermediate_tensors_test.cc"],
+    srcs = ["quantization_wrapper_utils_test.cc"],
    tags = [
        "tflite_not_portable_android",
        "tflite_not_portable_ios",
    ],
    deps = [
-        ":add_intermediate_tensors",
+        ":quantization_wrapper_utils",
        "//tensorflow/lite:framework",
        "//tensorflow/lite/schema:schema_fbs",
        "@com_google_absl//absl/memory",
@ -42,6 +42,20 @@ tf_cc_test(
    ],
 )
 # String/bool entry points for calibration and quantization. Model loading
 # and file writing helpers come from :quantization_wrapper_utils; the
 # quantization itself comes from the quantize_model target.
 cc_library(
    name = "quantization_wrapper",
    srcs = ["quantization_wrapper.cc"],
    hdrs = ["quantization_wrapper.h"],
    deps = [
        ":quantization_wrapper_utils",
        "//tensorflow/lite:framework",
        "//tensorflow/lite/core/api",
        "//tensorflow/lite/schema:schema_fbs",
        "//tensorflow/lite/tools/optimize:quantize_model",
        "@flatbuffers",
    ],
 )
 cc_library(
    name = "quantization_utils",
    srcs = ["quantization_utils.cc"],
--- a/tensorflow/lite/tools/optimize/quantization_wrapper.cc
+++ b/tensorflow/lite/tools/optimize/quantization_wrapper.cc
@ -0,0 +1,52 @@
 /* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
 Licensed under the Apache License, Version 2.0 (the "License");
 you may not use this file except in compliance with the License.
 You may obtain a copy of the License at
    http://www.apache.org/licenses/LICENSE-2.0
 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/
 #include "tensorflow/lite/tools/optimize/quantization_wrapper.h"
 #include "tensorflow/lite/tools/optimize/quantization_wrapper_utils.h"
 #include "tensorflow/lite/tools/optimize/quantize_model.h"
 namespace tflite {
 namespace optimize {
 bool CreateModelForCalibration(const std::string& input_path,
                               const std::string& output_path) {
  ModelT model;
  if (LoadModel(input_path, &model) != kTfLiteOk) {
    return false;
  }
  flatbuffers::FlatBufferBuilder builder;
  if (AddIntemediateTensorsToFusedOp(&builder, &model) != kTfLiteOk) {
    return false;
  }
  return WriteFile(output_path, builder.GetBufferPointer(), builder.GetSize());
 }
 bool CreateQuantizedModel(const std::string& path) {
  ModelT model;
  if (LoadModel(path, &model) != kTfLiteOk) {
    return false;
  }
  flatbuffers::FlatBufferBuilder builder;
  tflite::StderrReporter error_reporter;
  if (tflite::optimize::QuantizeModel(
          &builder, &model, tflite::TensorType_FLOAT32,
          tflite::TensorType_FLOAT32, &error_reporter) != kTfLiteOk) {
    return false;
  }
  return WriteFile(path, builder.GetBufferPointer(), builder.GetSize());
 }
 }  // namespace optimize
 }  // namespace tflite
--- a/tensorflow/lite/tools/optimize/quantization_wrapper.h
+++ b/tensorflow/lite/tools/optimize/quantization_wrapper.h
@ -0,0 +1,39 @@
 /* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
 Licensed under the Apache License, Version 2.0 (the "License");
 you may not use this file except in compliance with the License.
 You may obtain a copy of the License at
    http://www.apache.org/licenses/LICENSE-2.0
 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/
 #ifndef TENSORFLOW_LITE_TOOLS_OPTIMIZE_QUANTIZATION_WRAPPER_H_
 #define TENSORFLOW_LITE_TOOLS_OPTIMIZE_QUANTIZATION_WRAPPER_H_
 #include <string>
 namespace tflite {
 namespace optimize {
 // Makes a copy of the model at input_path and writes it to output_path, adding
 // tensors to the model needed for calibration.
 // Returns true if it is successful; returns false if the model cannot be
 // loaded, the tensors cannot be added, or the output cannot be written.
 // Example: with input_path a/b/c.tflite and output_path
 // a/b/c.calibrated.tflite, the latter file receives the model with
 // intermediate tensors added according to operator properties.
 bool CreateModelForCalibration(const std::string& input_path,
                                const std::string& output_path);
 // Quantizes a model in place: the file at path is loaded, quantized, and then
 // overwritten with the result. This function is only to be called after
 // calling CreateModelForCalibration and running calibration over data.
 // Returns true if it is successful.
 bool CreateQuantizedModel(const std::string& path);
 }  // namespace optimize
 }  // namespace tflite
 #endif  // TENSORFLOW_LITE_TOOLS_OPTIMIZE_QUANTIZATION_WRAPPER_H_
--- a/tensorflow/lite/tools/optimize/quantization_wrapper_utils.cc
+++ b/tensorflow/lite/tools/optimize/quantization_wrapper_utils.cc
@ -12,10 +12,12 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/
-#include "tensorflow/lite/tools/optimize/add_intermediate_tensors.h"
+#include "tensorflow/lite/tools/optimize/quantization_wrapper_utils.h"
 #include <fstream>
 #include <memory>
 #include "tensorflow/lite/schema/schema_generated.h"
 #include "tensorflow/lite/tools/optimize/operator_property.h"
 namespace tflite {
@ -51,6 +53,19 @@ bool IntermediateTensorExists(ModelT* model) {
 }
 }  // namespace
 // Builds a FlatBufferModel from the file at path and unpacks its contents
 // into *model. Returns kTfLiteError when the file cannot be built into a
 // FlatBufferModel or when that object exposes no underlying model;
 // returns kTfLiteOk once the unpack has been performed.
 TfLiteStatus LoadModel(const string& path, ModelT* model) {
  auto flatbuffer_model = FlatBufferModel::BuildFromFile(path.c_str());
  if (!flatbuffer_model) return kTfLiteError;
  auto packed_model = flatbuffer_model->GetModel();
  if (!packed_model) return kTfLiteError;
  // packed_model points into flatbuffer_model, which stays alive until the
  // end of this function, so the unpack must happen here.
  packed_model->UnPackTo(model);
  return kTfLiteOk;
 }
 TfLiteStatus AddIntemediateTensorsToFusedOp(
    flatbuffers::FlatBufferBuilder* builder, ModelT* model) {
  // Return early if the model already has intermediate tensors.
@ -90,5 +105,14 @@ TfLiteStatus AddIntemediateTensorsToFusedOp(
  return kTfLiteOk;
 }
 // Writes num_bytes bytes starting at bytes to out_file in binary mode,
 // replacing any existing content of that file.
 //
 // out_file:  path of the file to create or overwrite.
 // bytes:     start of the data; not dereferenced when num_bytes is 0.
 // num_bytes: number of bytes to write.
 //
 // Returns true only if the file was opened and every byte was written and
 // flushed without the stream reporting an error.
 bool WriteFile(const std::string& out_file, const uint8_t* bytes,
                size_t num_bytes) {
  std::fstream stream(out_file, std::ios::binary | std::ios::out);
  if (!stream.is_open()) {
    return false;
  }
  // One bulk unformatted write instead of a formatted insertion per byte.
  if (num_bytes > 0) {
    stream.write(reinterpret_cast<const char*>(bytes),
                 static_cast<std::streamsize>(num_bytes));
  }
  // The stream is buffered: flush before inspecting its state so that errors
  // which only surface when data reaches the file are reported to the caller
  // rather than being silently dropped in the destructor.
  stream.flush();
  // fail() is true when either failbit or badbit is set.
  return !stream.fail();
 }
 }  // namespace optimize
 }  // namespace tflite
--- a/tensorflow/lite/tools/optimize/quantization_wrapper_utils.h
+++ b/tensorflow/lite/tools/optimize/quantization_wrapper_utils.h
@ -12,8 +12,8 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/
-#ifndef TENSORFLOW_LITE_TOOLS_OPTIMIZE_ADD_INTERMEDIATE_TENSORS_H_
+#ifndef TENSORFLOW_LITE_TOOLS_OPTIMIZE_QUANTIZATION_WRAPPER_UTILS_H_
-#define TENSORFLOW_LITE_TOOLS_OPTIMIZE_ADD_INTERMEDIATE_TENSORS_H_
+#define TENSORFLOW_LITE_TOOLS_OPTIMIZE_QUANTIZATION_WRAPPER_UTILS_H_
 #include "tensorflow/lite/core/api/error_reporter.h"
 #include "tensorflow/lite/model.h"
@ -22,13 +22,20 @@ limitations under the License.
 namespace tflite {
 namespace optimize {
 // Loads the tflite model file at path and unpacks it into *model.
 // Returns kTfLiteOk on success and kTfLiteError if the model cannot be read.
 TfLiteStatus LoadModel(const string& path, ModelT* model);
 // Goes through the model and adds intermediate tensors to the ops that have
 // any. Returns early if the model already has intermediate tensors. This is
 // to support cases where a model is initialized multiple times.
 TfLiteStatus AddIntemediateTensorsToFusedOp(
-    flatbuffers::FlatBufferBuilder* builder, ModelT* input_model);
+    flatbuffers::FlatBufferBuilder* builder, ModelT* model);
 // Writes num_bytes bytes starting at bytes (e.g. a serialized model) to the
 // file at out_file, opened in binary output mode.
 // Returns true if the write succeeded.
 bool WriteFile(const std::string& out_file, const uint8_t* bytes,
                size_t num_bytes);
 }  // namespace optimize
 }  // namespace tflite
-#endif  // TENSORFLOW_LITE_TOOLS_OPTIMIZE_ADD_INTERMEDIATE_TENSORS_H_
+#endif  // TENSORFLOW_LITE_TOOLS_OPTIMIZE_QUANTIZATION_WRAPPER_UTILS_H_
--- a/tensorflow/lite/tools/optimize/quantization_wrapper_utils_test.cc
+++ b/tensorflow/lite/tools/optimize/quantization_wrapper_utils_test.cc
@ -12,7 +12,7 @@ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/
-#include "tensorflow/lite/tools/optimize/add_intermediate_tensors.h"
+#include "tensorflow/lite/tools/optimize/quantization_wrapper_utils.h"
 #include <gmock/gmock.h>
 #include <gtest/gtest.h>