Export ConversionParams as an API

Pooya Davoodi 2020-01-15 15:57:38 -08:00
parent e8565092ff
commit 3a378dbfd5
3 changed files with 69 additions and 4 deletions
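
A minimal before/after sketch of the usage change this export enables, assuming a TensorFlow build with TensorRT support (`my_dir` and `my_converted_dir` are placeholder SavedModel paths); it mirrors example 1 in the converter docstring below:

```python
# Sketch of the migration this commit enables; assumes a TensorFlow
# build with TensorRT support. Paths are placeholders.
import tensorflow as tf

# Before: users copied a private module-level default.
# params = DEFAULT_TRT_CONVERSION_PARAMS._replace(precision_mode='FP16')

# After: the parameters class is constructed through the public API.
params = tf.experimental.tensorrt.ConversionParams(precision_mode='FP16')
converter = tf.experimental.tensorrt.Converter(
    input_saved_model_dir="my_dir", conversion_params=params)
converter.convert()
converter.save("my_converted_dir")
```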

View File

@@ -111,6 +111,7 @@ class TrtPrecisionMode(object):
DEFAULT_TRT_MAX_WORKSPACE_SIZE_BYTES = 1 << 30
+@tf_export("experimental.tensorrt.ConversionParams", v1=[])
class TrtConversionParams(object):
""" A class to encapsulate parameters that are used for TF-TRT conversion."""
@@ -888,7 +889,7 @@ class TrtGraphConverterV2(object):
1. FP32/FP16 precision
```python
-params = DEFAULT_TRT_CONVERSION_PARAMS._replace(
+params = tf.experimental.tensorrt.ConversionParams(
precision_mode='FP16')
converter = tf.experimental.tensorrt.Converter(
input_saved_model_dir="my_dir", conversion_params=params)
@@ -904,7 +905,7 @@ class TrtGraphConverterV2(object):
2. FP32/FP16 precision with pre-built engines
```python
-params = DEFAULT_TRT_CONVERSION_PARAMS._replace(
+params = tf.experimental.tensorrt.ConversionParams(
precision_mode='FP16',
# Set this to a large enough number so it can cache all the engines.
maximum_cached_engines=16)
@@ -936,7 +937,7 @@ class TrtGraphConverterV2(object):
3. INT8 precision and calibration with pre-built engines
```python
-params = DEFAULT_TRT_CONVERSION_PARAMS._replace(
+params = tf.experimental.tensorrt.ConversionParams(
precision_mode='INT8',
# Currently only one INT8 engine is supported in this mode.
maximum_cached_engines=1,
@@ -974,7 +975,7 @@ class TrtGraphConverterV2(object):
input_saved_model_dir=None,
input_saved_model_tags=None,
input_saved_model_signature_key=None,
-conversion_params=DEFAULT_TRT_CONVERSION_PARAMS):
+conversion_params=TrtConversionParams()):
"""Initialize the converter.
Args:

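Since `conversion_params` now defaults to a freshly constructed `TrtConversionParams()`, an INT8 flow like example 3 above can be written entirely against the public names. A hedged sketch, assuming a TF-TRT-enabled build; the input shape and calibration generator below are hypothetical stand-ins for real data:

```python
# INT8 calibration sketch based on example 3 in the docstring above.
# The input shape and calibration batches are hypothetical.
import numpy as np
import tensorflow as tf

params = tf.experimental.tensorrt.ConversionParams(
    precision_mode='INT8',
    maximum_cached_engines=1,  # only one INT8 engine is supported here
    use_calibration=True)
converter = tf.experimental.tensorrt.Converter(
    input_saved_model_dir="my_dir", conversion_params=params)

def calibration_input_fn():
    # Yield batches that match the SavedModel's input signature.
    yield (np.random.normal(size=(1, 224, 224, 3)).astype(np.float32),)

converter.convert(calibration_input_fn=calibration_input_fn)
converter.save("my_int8_dir")
```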
View File

@@ -26,6 +26,66 @@ if platform.system() != "Windows":
raise RuntimeError(
"This module is expected to be loaded only on Windows platform.")
@tf_export("experimental.tensorrt.ConversionParams", v1=[])
class TrtConversionParams(object):
""" A class to encapsulate parameters that are used for TF-TRT conversion."""
def __init__(self,
rewriter_config_template=None,
max_workspace_size_bytes=DEFAULT_TRT_MAX_WORKSPACE_SIZE_BYTES,
precision_mode=TrtPrecisionMode.FP32,
minimum_segment_size=3,
is_dynamic_op=True,
maximum_cached_engines=1,
use_calibration=True,
max_batch_size=1,
allow_build_at_runtime=True):
"""Initialize TrtConversionParams.
Args:
rewriter_config_template: a template RewriterConfig proto used to create a
TRT-enabled RewriterConfig. If None, it will use a default one.
max_workspace_size_bytes: the maximum GPU temporary memory which the TRT
engine can use at execution time. This corresponds to the
'workspaceSize' parameter of nvinfer1::IBuilder::setMaxWorkspaceSize().
precision_mode: one of TrtPrecisionMode.supported_precision_modes().
minimum_segment_size: the minimum number of nodes required for a subgraph
to be replaced by TRTEngineOp.
is_dynamic_op: whether to generate dynamic TRT ops which will build the
TRT network and engine at run time. Since TensorRT versions < 6.0 do not
support dynamic dimensions other than the batch dimension, this option
must be enabled when the TensorFlow graph has a non-batch dimension of
dynamic size. This option should be set to True in TF 2.0.
maximum_cached_engines: max number of cached TRT engines for dynamic TRT
ops. Created TRT engines for a dynamic dimension are cached. This is
the maximum number of engines that can be cached. If the number of
cached engines is already at max but none of them supports the input
shapes, the TRTEngineOp will fall back to run the original TF subgraph
that corresponds to the TRTEngineOp.
use_calibration: this argument is ignored if precision_mode is not INT8.
If set to True, a calibration graph will be created to calibrate the
missing ranges. The calibration graph must be converted to an inference
graph by running calibration with calibrate(). If set to False,
quantization nodes will be expected for every tensor in the graph
(excluding those which will be fused). If a range is missing, an error
will occur. Please note that accuracy may be negatively affected if
there is a mismatch between which tensors TRT quantizes and which
tensors were trained with fake quantization.
max_batch_size: max size for the input batch. This parameter is only
effective when is_dynamic_op=False, which is not supported in TF 2.0.
allow_build_at_runtime: whether to build TensorRT engines during runtime.
If no cached TensorRT engine can handle the given inputs at runtime, a
new TensorRT engine is built if allow_build_at_runtime=True; otherwise
native TF is used. This argument is only effective if is_dynamic_op=True.
Raises:
NotImplementedError: TRT is not supported on Windows.
"""
raise NotImplementedError(
"TensorRT integration is not available on Windows.")
@tf_export("experimental.tensorrt.Converter", v1=[])
class TrtConverterWindows(object):

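On Windows, the stub above raises as soon as the class is constructed, so platform-dependent code can probe for TF-TRT availability and fall back; a small sketch:

```python
# Sketch: the Windows stub raises NotImplementedError on construction,
# which lets callers fall back to native TF gracefully.
import tensorflow as tf

try:
    params = tf.experimental.tensorrt.ConversionParams()
except NotImplementedError:
    params = None  # TF-TRT is unavailable on this platform
```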
View File

@@ -1,5 +1,9 @@
path: "tensorflow.experimental.tensorrt"
tf_module {
+member {
+name: "ConversionParams"
+mtype: "<type \'type\'>"
+}
member {
name: "Converter"
mtype: "<type \'type\'>"
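
A quick check, not part of the commit, that both symbols recorded in the updated golden file resolve on a TF-TRT-enabled build:

```python
import tensorflow as tf

# Both names from the golden API file should now be importable.
print(tf.experimental.tensorrt.ConversionParams)
print(tf.experimental.tensorrt.Converter)
```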