From f742e74da3eaa536dddbe8ebc1cb85ee8de7f312 Mon Sep 17 00:00:00 2001
From: Dero Gharibian <dero@google.com>
Date: Tue, 27 Aug 2019 18:15:54 -0700
Subject: [PATCH] Update kernels and related libs to use tstring.

This is a part of a larger migration effort for tensorflow::tstring.
See: https://github.com/tensorflow/community/pull/91
PiperOrigin-RevId: 265811129
---
 tensorflow/core/kernels/encode_jpeg_op.cc     |   4 +-
 tensorflow/core/kernels/encode_png_op.cc      |  10 +-
 tensorflow/core/kernels/encode_proto_op.cc    |  28 +++-
 tensorflow/core/kernels/encode_wav_op.cc      |   2 +-
 .../core/kernels/example_parsing_ops.cc       |  28 ++--
 .../core/kernels/example_parsing_ops_test.cc  |   2 +-
 tensorflow/core/kernels/fingerprint_op.cc     |   4 +-
 .../core/kernels/fingerprint_op_test.cc       |  10 +-
 tensorflow/core/kernels/lookup_table_op.h     |   2 +-
 tensorflow/core/kernels/record_input_op.cc    |   2 +-
 tensorflow/core/kernels/record_yielder.cc     |   2 +-
 tensorflow/core/kernels/record_yielder.h      |   2 +-
 tensorflow/core/kernels/regex_replace_op.cc   |   8 +-
 .../core/kernels/regex_replace_op_test.cc     |   4 +-
 tensorflow/core/kernels/string_ngrams_op.cc   |  18 +--
 .../core/kernels/string_ngrams_op_test.cc     | 127 +++++++++---------
 tensorflow/core/kernels/unicode_ops.cc        |   8 +-
 .../core/kernels/whole_file_read_ops.cc       |   8 +-
 .../core/lib/io/buffered_inputstream.cc       |   8 +-
 tensorflow/core/lib/io/buffered_inputstream.h |   3 +-
 tensorflow/core/lib/jpeg/jpeg_handle.cc       |   2 +-
 tensorflow/core/lib/jpeg/jpeg_handle.h        |   4 +-
 tensorflow/core/lib/jpeg/jpeg_mem.cc          |  10 +-
 tensorflow/core/lib/jpeg/jpeg_mem.h           |   6 +-
 tensorflow/core/lib/jpeg/jpeg_mem_unittest.cc |   4 +-
 tensorflow/core/lib/png/png_io.cc             |  19 ++-
 tensorflow/core/lib/png/png_io.h              |   3 +-
 tensorflow/core/lib/strings/base64.cc         |  21 ++-
 tensorflow/core/lib/strings/base64.h          |  10 +-
 tensorflow/core/lib/strings/base64_test.cc    |   4 +-
 tensorflow/core/lib/wav/wav_io.cc             |  18 ++-
 tensorflow/core/lib/wav/wav_io.h              |   3 +-
 tensorflow/core/lib/wav/wav_io_test.cc        |   7 +-
 tensorflow/core/platform/protobuf.cc          |  39 ++++++
 tensorflow/core/platform/protobuf.h           |  23 ++++
 tensorflow/core/platform/tstring.h            |   4 +
 36 files changed, 303 insertions(+), 154 deletions(-)
diff --git a/tensorflow/core/kernels/encode_jpeg_op.cc b/tensorflow/core/kernels/encode_jpeg_op.cc
index 547b9d8da4d..923b379c2d6 100644
--- a/tensorflow/core/kernels/encode_jpeg_op.cc
+++ b/tensorflow/core/kernels/encode_jpeg_op.cc
@@ -124,7 +124,7 @@ class EncodeJpegOp : public OpKernel {
                    context->allocate_output(0, TensorShape({}), &output));
     OP_REQUIRES(context,
                 jpeg::Compress(image.flat<uint8>().data(), dim_size1, dim_size0,
-                               adjusted_flags, &output->scalar<string>()()),
+                               adjusted_flags, &output->scalar<tstring>()()),
                 errors::Internal("JPEG encoding failed"));
   }
 
@@ -190,7 +190,7 @@ class EncodeJpegVariableQualityOp : public OpKernel {
                    context->allocate_output(0, TensorShape({}), &output));
     OP_REQUIRES(context,
                 jpeg::Compress(image.flat<uint8>().data(), dim_size1, dim_size0,
-                               adjusted_flags, &output->scalar<string>()()),
+                               adjusted_flags, &output->scalar<tstring>()()),
                 errors::Internal("JPEG encoding failed"));
   }
 };
diff --git a/tensorflow/core/kernels/encode_png_op.cc b/tensorflow/core/kernels/encode_png_op.cc
index cb9a1660a7d..8dbe1d377df 100644
--- a/tensorflow/core/kernels/encode_png_op.cc
+++ b/tensorflow/core/kernels/encode_png_op.cc
@@ -78,17 +78,17 @@ class EncodePngOp : public OpKernel {
                    context->allocate_output(0, TensorShape({}), &output));
     if (desired_channel_bits_ == 8) {
       OP_REQUIRES(context,
-                  png::WriteImageToBuffer(image.flat<uint8>().data(), width,
-                                          height, width * channels, channels,
-                                          desired_channel_bits_, compression_,
-                                          &output->scalar<string>()(), nullptr),
+                  png::WriteImageToBuffer(
+                      image.flat<uint8>().data(), width, height,
+                      width * channels, channels, desired_channel_bits_,
+                      compression_, &output->scalar<tstring>()(), nullptr),
                   errors::Internal("PNG encoding failed"));
     } else {
       OP_REQUIRES(context,
                   png::WriteImageToBuffer(
                       image.flat<uint16>().data(), width, height,
                       width * channels * 2, channels, desired_channel_bits_,
-                      compression_, &output->scalar<string>()(), nullptr),
+                      compression_, &output->scalar<tstring>()(), nullptr),
                   errors::Internal("PNG encoding failed"));
     }
   }
diff --git a/tensorflow/core/kernels/encode_proto_op.cc b/tensorflow/core/kernels/encode_proto_op.cc
index 12bbd34ec71..288b74c4d24 100644
--- a/tensorflow/core/kernels/encode_proto_op.cc
+++ b/tensorflow/core/kernels/encode_proto_op.cc
@@ -298,6 +298,26 @@ Status WriteVarLenField(const FieldDescriptor& field_desc, const Tensor& input,
   return Status::OK();
 }
 
+static void WriteStringAdapter(int field_number, const tstring& value,
+                               CodedOutputStream* output) {
+  // External proto does not accept string_view; the #else path copies instead.
+#if defined(PLATFORM_GOOGLE)
+  WireFormatLite::WriteString(field_number, StringPiece(value), output);
+#else
+  WireFormatLite::WriteString(field_number, string(value), output);
+#endif
+}
+
+static void WriteBytesAdapter(int field_number, const tstring& value,
+                              CodedOutputStream* output) {
+  // External proto does not accept string_view; the #else path copies instead.
+#if defined(PLATFORM_GOOGLE)
+  WireFormatLite::WriteBytes(field_number, StringPiece(value), output);
+#else
+  WireFormatLite::WriteBytes(field_number, string(value), output);
+#endif
+}
+
 // Writes a group field. Groups are treated like submessages, but tag-delimited
 // instead of length-delimited. WireFormatLite handles this differently so we
 // code it ourselves.
@@ -388,15 +408,15 @@ Status WriteField(const FieldDescriptor& field_desc, const Tensor& input,
                         WireFormatLite::WriteBoolNoTag>(
           field_desc, input, message_index, size, output);
     case WireFormatLite::TYPE_STRING:
-      return WriteVarLenField<string, WireFormatLite::WriteString>(
+      return WriteVarLenField<tstring, WriteStringAdapter>(
           field_desc, input, message_index, size, output);
     case WireFormatLite::TYPE_GROUP:
       return WriteGroup(field_desc, input, message_index, size, output);
     case WireFormatLite::TYPE_MESSAGE:
-      return WriteVarLenField<string, WireFormatLite::WriteBytes>(
+      return WriteVarLenField<tstring, WriteBytesAdapter>(
           field_desc, input, message_index, size, output);
     case WireFormatLite::TYPE_BYTES:
-      return WriteVarLenField<string, WireFormatLite::WriteBytes>(
+      return WriteVarLenField<tstring, WriteBytesAdapter>(
           field_desc, input, message_index, size, output);
     case WireFormatLite::TYPE_UINT32:
       switch (dtype) {
@@ -592,7 +612,7 @@ class EncodeProtoOp : public OpKernel {
          message_index++) {
       // TODO(nix): possibly optimize allocation here by calling
       // `bufs(message_index).reserve(DEFAULT_BUF_SIZE)`.
-      StringOutputStream output_string(&bufs(message_index));
+      TStringOutputStream output_string(&bufs(message_index));
       CodedOutputStream out(&output_string);
       // Write fields in ascending field_number order.
       for (int i : sorted_field_index_) {
diff --git a/tensorflow/core/kernels/encode_wav_op.cc b/tensorflow/core/kernels/encode_wav_op.cc
index 082f9a74ae1..b90d90873ab 100644
--- a/tensorflow/core/kernels/encode_wav_op.cc
+++ b/tensorflow/core/kernels/encode_wav_op.cc
@@ -58,7 +58,7 @@ class EncodeWavOp : public OpKernel {
     OP_REQUIRES_OK(context,
                    wav::EncodeAudioAsS16LEWav(
                        audio.flat<float>().data(), sample_rate, channel_count,
-                       sample_count, &output->scalar<string>()()));
+                       sample_count, &output->scalar<tstring>()()));
   }
 };
 REGISTER_KERNEL_BUILDER(Name("EncodeWav").Device(DEVICE_CPU), EncodeWavOp);
diff --git a/tensorflow/core/kernels/example_parsing_ops.cc b/tensorflow/core/kernels/example_parsing_ops.cc
index 8226d14234d..b9f9ec30d52 100644
--- a/tensorflow/core/kernels/example_parsing_ops.cc
+++ b/tensorflow/core/kernels/example_parsing_ops.cc
@@ -132,10 +132,10 @@ class ParseExampleOp : public OpKernel {
       config.sparse.push_back({sparse_keys_t[d], attrs_.sparse_types[d]});
     }
 
-    auto serialized_t = serialized->flat<string>();
-    auto names_t = names->flat<string>();
-    gtl::ArraySlice<string> slice(serialized_t.data(), serialized_t.size());
-    gtl::ArraySlice<string> names_slice(names_t.data(), names_t.size());
+    auto serialized_t = serialized->flat<tstring>();
+    auto names_t = names->flat<tstring>();
+    gtl::ArraySlice<tstring> slice(serialized_t.data(), serialized_t.size());
+    gtl::ArraySlice<tstring> names_slice(names_t.data(), names_t.size());
 
     OP_REQUIRES_OK(
         ctx,
@@ -352,11 +352,11 @@ class ParseSequenceExampleOp : public OpKernel {
            attrs_.feature_list_sparse_types[d]});
     }
 
-    auto serialized_t = serialized->flat<string>();
-    auto debug_name_t = debug_name->flat<string>();
-    gtl::ArraySlice<string> slice(serialized_t.data(), serialized_t.size());
-    gtl::ArraySlice<string> names_slice(debug_name_t.data(),
-                                        debug_name_t.size());
+    auto serialized_t = serialized->flat<tstring>();
+    auto debug_name_t = debug_name->flat<tstring>();
+    gtl::ArraySlice<tstring> slice(serialized_t.data(), serialized_t.size());
+    gtl::ArraySlice<tstring> names_slice(debug_name_t.data(),
+                                         debug_name_t.size());
 
     OP_REQUIRES_OK(
         ctx,
@@ -853,10 +853,12 @@ class DecodeJSONExampleOp : public OpKernel {
                                   &binary_examples));
 
     for (int i = 0; i < json_examples->NumElements(); ++i) {
-      const string& json_example = json_examples->flat<string>()(i);
-      auto status = protobuf::util::JsonToBinaryString(
-          resolver_.get(), "type.googleapis.com/tensorflow.Example",
-          json_example, &binary_examples->flat<string>()(i));
+      const tstring& json_example = json_examples->flat<tstring>()(i);
+      protobuf::io::ArrayInputStream in(json_example.data(),
+                                        json_example.size());
+      TStringOutputStream out(&binary_examples->flat<tstring>()(i));
+      auto status = protobuf::util::JsonToBinaryStream(
+          resolver_.get(), "type.googleapis.com/tensorflow.Example", &in, &out);
       OP_REQUIRES(ctx, status.ok(),
                   errors::InvalidArgument("Error while parsing JSON: ",
                                           string(status.error_message())));
diff --git a/tensorflow/core/kernels/example_parsing_ops_test.cc b/tensorflow/core/kernels/example_parsing_ops_test.cc
index db1672e70a0..7e718ca7be7 100644
--- a/tensorflow/core/kernels/example_parsing_ops_test.cc
+++ b/tensorflow/core/kernels/example_parsing_ops_test.cc
@@ -124,7 +124,7 @@ struct ExampleStore {
         Features* features = example.mutable_features();
         (*features->mutable_feature())[k_str] = f;
       }
-      CHECK(example.SerializeToString(&string_t(b)));
+      CHECK(SerializeToTString(example, &string_t(b)));
     }
     (*examples)[std::make_tuple(batch_size, num_keys, feature_size)] =
         record_string;
diff --git a/tensorflow/core/kernels/fingerprint_op.cc b/tensorflow/core/kernels/fingerprint_op.cc
index 660f900c405..340dcf111a5 100644
--- a/tensorflow/core/kernels/fingerprint_op.cc
+++ b/tensorflow/core/kernels/fingerprint_op.cc
@@ -52,7 +52,7 @@ void FarmhashFingerprint64(TTypes<uint8, 2>::ConstTensor input,
   }
 }
 
-void FarmhashFingerprint64(TTypes<string>::ConstFlat input,
+void FarmhashFingerprint64(TTypes<tstring>::ConstFlat input,
                            TTypes<uint8, 2>::Matrix output) {
   DCHECK_EQ(output.dimension(0), input.dimension(0));
   DCHECK_EQ(output.dimension(1), sizeof(uint64));
@@ -79,7 +79,7 @@ class FingerprintOp : public OpKernel {
                 errors::InvalidArgument("`method` should be a scalar string: ",
                                         method_tensor.shape()));
     // For now, farmhash64 is the only function supported.
-    const string& method = method_tensor.scalar<string>()();
+    const tstring& method = method_tensor.scalar<tstring>()();
     OP_REQUIRES(
         context, method == "farmhash64",
         errors::InvalidArgument("Unsupported fingerprint method: ", method));
diff --git a/tensorflow/core/kernels/fingerprint_op_test.cc b/tensorflow/core/kernels/fingerprint_op_test.cc
index d9a9a97798d..79d54a5fde4 100644
--- a/tensorflow/core/kernels/fingerprint_op_test.cc
+++ b/tensorflow/core/kernels/fingerprint_op_test.cc
@@ -82,10 +82,10 @@ TEST_F(FingerprintOpTest, StringGoldenValue) {
   buffer(1).resize(7);
   buffer(2).resize(0);
   buffer(3).resize(19);
-  std::iota(buffer(0).begin(), buffer(0).end(), 0);
-  std::iota(buffer(1).begin(), buffer(1).end(), 7);
-  std::iota(buffer(2).begin(), buffer(2).end(), 71);
-  std::iota(buffer(3).begin(), buffer(3).end(), 41);
+  std::iota(&buffer(0)[0], &buffer(0)[0] + buffer(0).size(), 0);
+  std::iota(&buffer(1)[0], &buffer(1)[0] + buffer(1).size(), 7);
+  std::iota(&buffer(2)[0], &buffer(2)[0] + buffer(2).size(), 71);
+  std::iota(&buffer(3)[0], &buffer(3)[0] + buffer(3).size(), 41);
 
   TF_ASSERT_OK(MakeFingerprintOp(&data));
   TF_ASSERT_OK(RunOpKernel());
@@ -137,7 +137,7 @@ TEST_F(FingerprintOpTest, CollisionString) {
   auto& input = tensor.vec<tstring>()(0);
   input.resize(size);
 
-  TTypes<uint8>::UnalignedFlat buffer(reinterpret_cast<uint8*>(&*input.begin()),
+  TTypes<uint8>::UnalignedFlat buffer(reinterpret_cast<uint8*>(&input[0]),
                                       input.size());
   buffer.setRandom();
 
diff --git a/tensorflow/core/kernels/lookup_table_op.h b/tensorflow/core/kernels/lookup_table_op.h
index 28d63cbf797..416848db6b0 100644
--- a/tensorflow/core/kernels/lookup_table_op.h
+++ b/tensorflow/core/kernels/lookup_table_op.h
@@ -134,7 +134,7 @@ T SubtleMustCopyIfIntegral(const T& value) {
   return internal::SubtleMustCopy(value);
 }
 
-inline const string& SubtleMustCopyIfIntegral(const string& value) {
+inline const tstring& SubtleMustCopyIfIntegral(const tstring& value) {
   return value;
 }
 
diff --git a/tensorflow/core/kernels/record_input_op.cc b/tensorflow/core/kernels/record_input_op.cc
index 841f9dc4b8e..e7d5750e09d 100644
--- a/tensorflow/core/kernels/record_input_op.cc
+++ b/tensorflow/core/kernels/record_input_op.cc
@@ -55,7 +55,7 @@ class RecordInputOp : public OpKernel {
 
   void Compute(OpKernelContext* ctx) override {
     Tensor out(DT_STRING, {batch_size_});
-    auto t_out = out.flat<string>();
+    auto t_out = out.flat<tstring>();
     for (int i = 0; i < batch_size_; ++i) {
       OP_REQUIRES_OK(ctx, yielder_->YieldOne(&t_out(i)));
     }
diff --git a/tensorflow/core/kernels/record_yielder.cc b/tensorflow/core/kernels/record_yielder.cc
index 3fd9bf9defe..8ca5000cfdf 100644
--- a/tensorflow/core/kernels/record_yielder.cc
+++ b/tensorflow/core/kernels/record_yielder.cc
@@ -44,7 +44,7 @@ RecordYielder::~RecordYielder() {
   delete thread_;
 }
 
-Status RecordYielder::YieldOne(string* value) {
+Status RecordYielder::YieldOne(tstring* value) {
   mutex_lock l(mu_);
   while (!BufEnough() && status_.ok()) {
     buf_enough_.wait(l);
diff --git a/tensorflow/core/kernels/record_yielder.h b/tensorflow/core/kernels/record_yielder.h
index 159b43b4cd0..4efef6c4366 100644
--- a/tensorflow/core/kernels/record_yielder.h
+++ b/tensorflow/core/kernels/record_yielder.h
@@ -90,7 +90,7 @@ class RecordYielder {
   RecordYielder& operator=(const RecordYielder&) = delete;
 
   // Yields one 'value'.
-  Status YieldOne(string* value);
+  Status YieldOne(tstring* value);
 
   // Returns the current epoch number.
   int64 current_epoch() const { return epoch_; }
diff --git a/tensorflow/core/kernels/regex_replace_op.cc b/tensorflow/core/kernels/regex_replace_op.cc
index 187a4f92fbf..4eb83c5fe0d 100644
--- a/tensorflow/core/kernels/regex_replace_op.cc
+++ b/tensorflow/core/kernels/regex_replace_op.cc
@@ -48,11 +48,15 @@ Status InternalCompute(const RE2& match, const string& rewrite,
   }
   auto output_flat = output_tensor->flat<tstring>();
   for (size_t i = 0; i < output_flat.size(); ++i) {
+    // TODO(dero): Mitigate copy; Replace and GlobalReplace below currently only
+    // accept std::string.
+    string buf = output_flat(i);
     if (replace_global) {
-      RE2::GlobalReplace(&output_flat(i), match, rewrite);
+      RE2::GlobalReplace(&buf, match, rewrite);
     } else {
-      RE2::Replace(&output_flat(i), match, rewrite);
+      RE2::Replace(&buf, match, rewrite);
     }
+    output_flat(i) = std::move(buf);
   }
   return Status::OK();
 }
diff --git a/tensorflow/core/kernels/regex_replace_op_test.cc b/tensorflow/core/kernels/regex_replace_op_test.cc
index bfc45e8bc07..b9e960efecc 100644
--- a/tensorflow/core/kernels/regex_replace_op_test.cc
+++ b/tensorflow/core/kernels/regex_replace_op_test.cc
@@ -71,9 +71,9 @@ Graph* SetupRegexReplaceGraph(const Tensor& input, const string& input_pattern,
                               const string& input_rewrite) {
   Graph* g = new Graph(OpRegistry::Global());
   Tensor pattern(DT_STRING, TensorShape({}));
-  pattern.flat<string>().setConstant(input_pattern);
+  pattern.flat<tstring>().setConstant(input_pattern);
   Tensor rewrite(DT_STRING, TensorShape({}));
-  rewrite.flat<string>().setConstant(input_rewrite);
+  rewrite.flat<tstring>().setConstant(input_rewrite);
 
   TF_CHECK_OK(NodeBuilder("regex_replace_op", "RegexReplace")
                   .Input(test::graph::Constant(g, input))
diff --git a/tensorflow/core/kernels/string_ngrams_op.cc b/tensorflow/core/kernels/string_ngrams_op.cc
index 430d91bef88..dc757a01fcf 100644
--- a/tensorflow/core/kernels/string_ngrams_op.cc
+++ b/tensorflow/core/kernels/string_ngrams_op.cc
@@ -128,7 +128,7 @@ class StringNGramsOp : public tensorflow::OpKernel {
     }
   }
 
-  void CreateNgrams(const string* data, string* output, int num_ngrams,
+  void CreateNgrams(const tstring* data, tstring* output, int num_ngrams,
                     int ngram_width) const {
     for (int ngram_index = 0; ngram_index < num_ngrams; ++ngram_index) {
       int pad_width = get_pad_width(ngram_width);
@@ -154,20 +154,20 @@ class StringNGramsOp : public tensorflow::OpKernel {
       ngram_size += num_separators * separator_.length();
 
       // Build the ngram.
-      string* ngram = &output[ngram_index];
+      tstring* ngram = &output[ngram_index];
       ngram->reserve(ngram_size);
       for (int n = 0; n < left_padding; ++n) {
-        *ngram += left_pad_;
-        *ngram += separator_;
+        ngram->append(left_pad_);
+        ngram->append(separator_);
       }
       for (int n = 0; n < num_tokens - 1; ++n) {
-        *ngram += data[data_start_index + n];
-        *ngram += separator_;
+        ngram->append(data[data_start_index + n]);
+        ngram->append(separator_);
       }
-      *ngram += data[data_start_index + num_tokens - 1];
+      ngram->append(data[data_start_index + num_tokens - 1]);
       for (int n = 0; n < right_padding; ++n) {
-        *ngram += separator_;
-        *ngram += right_pad_;
+        ngram->append(separator_);
+        ngram->append(right_pad_);
       }
 
       // In debug mode only: validate that we've reserved enough space for the
diff --git a/tensorflow/core/kernels/string_ngrams_op_test.cc b/tensorflow/core/kernels/string_ngrams_op_test.cc
index afd1700c9ab..b89de9ad16d 100644
--- a/tensorflow/core/kernels/string_ngrams_op_test.cc
+++ b/tensorflow/core/kernels/string_ngrams_op_test.cc
@@ -51,12 +51,12 @@ class NgramKernelTest : public tensorflow::OpsTestBase {
     TF_ASSERT_OK(InitOp());
   }
 
-  void assert_string_equal(const std::vector<string> &expected,
+  void assert_string_equal(const std::vector<tstring> &expected,
                            const Tensor &value) {
     Tensor expected_tensor(allocator(), DT_STRING,
                            TensorShape({static_cast<int64>(expected.size())}));
-    test::FillValues<string>(&expected_tensor, expected);
-    test::ExpectTensorEqual<string>(expected_tensor, value);
+    test::FillValues<tstring>(&expected_tensor, expected);
+    test::ExpectTensorEqual<tstring>(expected_tensor, value);
   }
   void assert_int64_equal(const std::vector<int64> &expected,
                           const Tensor &value) {
@@ -72,11 +72,11 @@ TEST_F(NgramKernelTest, TestPaddedTrigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(                              //
+  std::vector<tstring> expected_values(                             //
       {"LP|LP|a", "LP|a|b", "a|b|c", "b|c|d", "c|d|RP", "d|RP|RP",  // 0
        "LP|LP|e", "LP|e|f", "e|f|RP", "f|RP|RP"});                  // 1
   std::vector<int64> expected_splits({0, 6, 10});
@@ -90,11 +90,11 @@ TEST_F(NgramKernelTest, TestPaddedBigramsAndTrigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(
+  std::vector<tstring> expected_values(
       {"LP|a", "a|b", "b|c", "c|d", "d|RP", "LP|LP|a", "LP|a|b", "a|b|c",
        "b|c|d", "c|d|RP", "d|RP|RP",                                       // 0
        "LP|e", "e|f", "f|RP", "LP|LP|e", "LP|e|f", "e|f|RP", "f|RP|RP"});  // 1
@@ -109,11 +109,11 @@ TEST_F(NgramKernelTest, TestPaddedBigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(       //
+  std::vector<tstring> expected_values(      //
       {"LP|a", "a|b", "b|c", "c|d", "d|RP",  // 0
        "LP|e", "e|f", "f|RP"});              // 1
   std::vector<int64> expected_splits({0, 5, 8});
@@ -127,11 +127,11 @@ TEST_F(NgramKernelTest, TestPaddingIsAtMostNGramSizeMinus1) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(       //
+  std::vector<tstring> expected_values(      //
       {"LP|a", "a|b", "b|c", "c|d", "d|RP",  // 0
        "LP|e", "e|f", "f|RP"});              // 1
   std::vector<int64> expected_splits({0, 5, 8});
@@ -145,11 +145,11 @@ TEST_F(NgramKernelTest, TestPaddedUnigramAndBigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(                           //
+  std::vector<tstring> expected_values(                          //
       {"a", "b", "c", "d", "LP|a", "a|b", "b|c", "c|d", "d|RP",  // 0
        "e", "f", "LP|e", "e|f", "f|RP"});                        // 1
   std::vector<int64> expected_splits({0, 9, 14});
@@ -166,11 +166,11 @@ TEST_F(NgramKernelTest, TestOverlappingPaddedNGrams) {
   // 0: "a"
   // 1: "b", "c", "d"
   // 2: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 1, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(                     //
+  std::vector<tstring> expected_values(                    //
       {"LP|LP|a", "LP|a|RP", "a|RP|RP",                    // ngrams for elem. 0
        "LP|LP|b", "LP|b|c", "b|c|d", "c|d|RP", "d|RP|RP",  // ngrams for elem. 1
        "LP|LP|e", "LP|e|f", "e|f|RP", "f|RP|RP"});         // ngrams for elem. 2
@@ -186,12 +186,12 @@ TEST_F(NgramKernelTest, TestOverlappingPaddedMultiCharNGrams) {
   // 0: "a"
   // 1: "b", "c", "d"
   // 2: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}),
-                            {"aa", "bb", "cc", "dd", "ee", "ff"});
+  AddInputFromArray<tstring>(TensorShape({6}),
+                             {"aa", "bb", "cc", "dd", "ee", "ff"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 1, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(                              //
+  std::vector<tstring> expected_values(                             //
       {"LP|LP|aa", "LP|aa|RP", "aa|RP|RP",                          //
        "LP|LP|bb", "LP|bb|cc", "bb|cc|dd", "cc|dd|RP", "dd|RP|RP",  //
        "LP|LP|ee", "LP|ee|ff", "ee|ff|RP", "ff|RP|RP"});            //
@@ -207,13 +207,13 @@ TEST_F(NgramKernelTest, TestMultiOverlappingPaddedNGrams) {
   MakeOp("|", {5}, "LP", "RP", -1, false);
   // Batch items are:
   // 0: "a"
-  AddInputFromArray<string>(TensorShape({1}), {"a"});
+  AddInputFromArray<tstring>(TensorShape({1}), {"a"});
   AddInputFromArray<int64>(TensorShape({2}), {0, 1});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"LP|LP|LP|LP|a", "LP|LP|LP|a|RP",
-                                       "LP|LP|a|RP|RP", "LP|a|RP|RP|RP",
-                                       "a|RP|RP|RP|RP"});
+  std::vector<tstring> expected_values({"LP|LP|LP|LP|a", "LP|LP|LP|a|RP",
+                                        "LP|LP|a|RP|RP", "LP|a|RP|RP|RP",
+                                        "a|RP|RP|RP|RP"});
   std::vector<int64> expected_splits({0, 5});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -225,11 +225,11 @@ TEST_F(NgramKernelTest, TestUnpaddedTrigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"a|b|c", "b|c|d"});
+  std::vector<tstring> expected_values({"a|b|c", "b|c|d"});
   std::vector<int64> expected_splits({0, 2, 2});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -241,11 +241,11 @@ TEST_F(NgramKernelTest, TestUnpaddedTrigramsWithEmptySequence) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 4, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"a|b|c", "b|c|d"});
+  std::vector<tstring> expected_values({"a|b|c", "b|c|d"});
   std::vector<int64> expected_splits({0, 2, 2, 2});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -257,11 +257,11 @@ TEST_F(NgramKernelTest, TestUnpaddedTrigramsWithPreserveShort) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"a|b|c", "b|c|d", "e|f"});
+  std::vector<tstring> expected_values({"a|b|c", "b|c|d", "e|f"});
   std::vector<int64> expected_splits({0, 2, 3});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -273,11 +273,11 @@ TEST_F(NgramKernelTest, TestUnpaddedTrigramsWithPreserveShortAndEmptySequence) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 4, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"a|b|c", "b|c|d", "e|f"});
+  std::vector<tstring> expected_values({"a|b|c", "b|c|d", "e|f"});
   std::vector<int64> expected_splits({0, 2, 2, 3});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -289,11 +289,11 @@ TEST_F(NgramKernelTest, TestUnpaddedTrigramsAndQuadgramsWithPreserveShort) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"a|b|c|d", "a|b|c", "b|c|d", "e|f"});
+  std::vector<tstring> expected_values({"a|b|c|d", "a|b|c", "b|c|d", "e|f"});
   std::vector<int64> expected_splits({0, 3, 4});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -305,11 +305,11 @@ TEST_F(NgramKernelTest, TestUnpaddedBigramsAndTrigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(
+  std::vector<tstring> expected_values(
       {"a|b", "b|c", "c|d", "a|b|c", "b|c|d", "e|f"});
   std::vector<int64> expected_splits({0, 5, 6});
 
@@ -322,13 +322,13 @@ TEST_F(NgramKernelTest, TestUnpaddedBigramsAndTrigramsWithPreserveShort) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
   // Note that in this case, because the bigram 'e|f' was already generated,
   // the op will not generate a special preserve_short bigram.
-  std::vector<string> expected_values(
+  std::vector<tstring> expected_values(
       {"a|b", "b|c", "c|d", "a|b|c", "b|c|d", "e|f"});
   std::vector<int64> expected_splits({0, 5, 6});
 
@@ -341,13 +341,13 @@ TEST_F(NgramKernelTest, TestUnpaddedTrigramsAndBigramsWithPreserveShort) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
   // Note that in this case, because the bigram 'e|f' was already generated,
   // the op will not generate a special preserve_short bigram.
-  std::vector<string> expected_values(
+  std::vector<tstring> expected_values(
       {"a|b|c", "b|c|d", "a|b", "b|c", "c|d", "e|f"});
   std::vector<int64> expected_splits({0, 5, 6});
 
@@ -360,11 +360,11 @@ TEST_F(NgramKernelTest, TestUnpaddedBigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"a|b", "b|c", "c|d", "e|f"});
+  std::vector<tstring> expected_values({"a|b", "b|c", "c|d", "e|f"});
   std::vector<int64> expected_splits({0, 3, 4});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -377,11 +377,11 @@ TEST_F(NgramKernelTest, TestOverlappingUnpaddedNGrams) {
   // 0: "a"
   // 1: "b", "c", "d"
   // 2: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 1, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"b|c|d"});
+  std::vector<tstring> expected_values({"b|c|d"});
   std::vector<int64> expected_splits({0, 0, 1, 1});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -394,11 +394,11 @@ TEST_F(NgramKernelTest, TestOverlappingUnpaddedNGramsNoOutput) {
   // 0: "a"
   // 1: "b", "c", "d"
   // 2: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 1, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({});
+  std::vector<tstring> expected_values({});
   std::vector<int64> expected_splits({0, 0, 0, 0});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -410,12 +410,13 @@ TEST_F(NgramKernelTest, TestSinglyPaddedTrigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"LP|a|b", "a|b|c", "b|c|d", "c|d|RP",  //
-                                       "LP|e|f", "e|f|RP"});
+  std::vector<tstring> expected_values({"LP|a|b", "a|b|c", "b|c|d",
+                                        "c|d|RP",  //
+                                        "LP|e|f", "e|f|RP"});
   std::vector<int64> expected_splits({0, 4, 6});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -427,12 +428,12 @@ TEST_F(NgramKernelTest, TestSinglyPaddedBigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"LP|a", "a|b", "b|c", "c|d", "d|RP",  //
-                                       "LP|e", "e|f", "f|RP"});
+  std::vector<tstring> expected_values({"LP|a", "a|b", "b|c", "c|d", "d|RP",  //
+                                        "LP|e", "e|f", "f|RP"});
   std::vector<int64> expected_splits({0, 5, 8});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -444,11 +445,11 @@ TEST_F(NgramKernelTest, TestSinglyPaddedBigramsAnd5grams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(                                   //
+  std::vector<tstring> expected_values(                                  //
       {"LP|a", "a|b", "b|c", "c|d", "d|RP", "LP|a|b|c|d", "a|b|c|d|RP",  //
        "LP|e", "e|f", "f|RP"});
   std::vector<int64> expected_splits({0, 7, 10});
@@ -462,12 +463,12 @@ TEST_F(NgramKernelTest, TestSinglyPadded5gramsWithPreserveShort) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(  //
-      {"LP|a|b|c|d", "a|b|c|d|RP",      //
+  std::vector<tstring> expected_values(  //
+      {"LP|a|b|c|d", "a|b|c|d|RP",       //
        "LP|e|f|RP"});
   std::vector<int64> expected_splits({0, 2, 3});
 
@@ -481,11 +482,11 @@ TEST_F(NgramKernelTest, TestOverlappingSinglyPaddedNGrams) {
   // 0: "a"
   // 1: "b", "c", "d"
   // 2: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 1, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values(
+  std::vector<tstring> expected_values(
       {"LP|a|RP",                    // ngrams for elem. 0
        "LP|b|c", "b|c|d", "c|d|RP",  // ngrams for elem. 1
        "LP|e|f", "e|f|RP"});         // ngrams for elem. 2
@@ -501,11 +502,11 @@ TEST_F(NgramKernelTest, TestOverlappingSinglyPaddedNGramsNoOutput) {
   // 0: "a"
   // 1: "b", "c", "d"
   // 2: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({4}), {0, 1, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"LP|b|c|d|RP"});
+  std::vector<tstring> expected_values({"LP|b|c|d|RP"});
   std::vector<int64> expected_splits({0, 0, 1, 1});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -517,11 +518,11 @@ TEST_F(NgramKernelTest, TestSinglyPaddedUnigrams) {
   // Batch items are:
   // 0: "a", "b", "c", "d"
   // 1: "e", "f"
-  AddInputFromArray<string>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
+  AddInputFromArray<tstring>(TensorShape({6}), {"a", "b", "c", "d", "e", "f"});
   AddInputFromArray<int64>(TensorShape({3}), {0, 4, 6});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({"a", "b", "c", "d", "e", "f"});
+  std::vector<tstring> expected_values({"a", "b", "c", "d", "e", "f"});
   std::vector<int64> expected_splits({0, 4, 6});
 
   assert_string_equal(expected_values, *GetOutput(0));
@@ -530,11 +531,11 @@ TEST_F(NgramKernelTest, TestSinglyPaddedUnigrams) {
 
 TEST_F(NgramKernelTest, TestEmptyInput) {
   MakeOp("|", {1}, "LP", "RP", 3, false);
-  AddInputFromArray<string>(TensorShape({0}), {});
+  AddInputFromArray<tstring>(TensorShape({0}), {});
   AddInputFromArray<int64>(TensorShape({0}), {});
   TF_ASSERT_OK(RunOpKernel());
 
-  std::vector<string> expected_values({});
+  std::vector<tstring> expected_values({});
   std::vector<int64> expected_splits({});
 
   assert_string_equal(expected_values, *GetOutput(0));
diff --git a/tensorflow/core/kernels/unicode_ops.cc b/tensorflow/core/kernels/unicode_ops.cc
index 0bb5f0f7ef6..331139d2fe4 100644
--- a/tensorflow/core/kernels/unicode_ops.cc
+++ b/tensorflow/core/kernels/unicode_ops.cc
@@ -52,7 +52,7 @@ namespace tensorflow {
 namespace {
 
 void Encode(const UnicodeEncoding encoding, const icu::UnicodeString& in,
-            string* out) {
+            tstring* out) {
   if (encoding == UnicodeEncoding::UTF8) {
     out->clear();
     in.toUTF8String(*out);
@@ -330,7 +330,7 @@ class UnicodeTranscodeOp : public OpKernel {
   // Transcode the string from input encoding to the output_encoding_. If
   // non-valid characters are encountered, use the subst_/elide_replacement_
   // config to handle them.
-  void Transcode(string* s, UConverter* input_encoder,
+  void Transcode(tstring* s, UConverter* input_encoder,
                  bool* found_any_format_error) {
     icu::UnicodeString source;
     IterateUnicodeString(
@@ -561,9 +561,9 @@ class UnicodeEncodeOp : public OpKernel {
         appendable_unicode_string.appendCodePoint(code_point);
       }
       // Encode our string and save in the output.
-      string result;
+      tstring result;
       Encode(encoding_, unicode_string, &result);
-      output_tensor_flat(i - 1) = result;
+      output_tensor_flat(i - 1) = std::move(result);
     }
   }
 
diff --git a/tensorflow/core/kernels/whole_file_read_ops.cc b/tensorflow/core/kernels/whole_file_read_ops.cc
index 1e3b7fd6b30..4384bdea90d 100644
--- a/tensorflow/core/kernels/whole_file_read_ops.cc
+++ b/tensorflow/core/kernels/whole_file_read_ops.cc
@@ -34,8 +34,8 @@ limitations under the License.
 
 namespace tensorflow {
 
-static Status ReadEntireFile(Env* env, const string& filename,
-                             string* contents) {
+template <typename T>
+static Status ReadEntireFile(Env* env, const string& filename, T* contents) {
   std::unique_ptr<RandomAccessFile> file;
   TF_RETURN_IF_ERROR(env->NewRandomAccessFile(filename, &file));
   io::RandomAccessInputStream input_stream(file.get());
@@ -112,8 +112,8 @@ class ReadFileOp : public OpKernel {
     OP_REQUIRES_OK(context, context->allocate_output("contents",
                                                      TensorShape({}), &output));
     OP_REQUIRES_OK(context,
-                   ReadEntireFile(context->env(), input->scalar<string>()(),
-                                  &output->scalar<string>()()));
+                   ReadEntireFile(context->env(), input->scalar<tstring>()(),
+                                  &output->scalar<tstring>()()));
   }
 };
 
diff --git a/tensorflow/core/lib/io/buffered_inputstream.cc b/tensorflow/core/lib/io/buffered_inputstream.cc
index b247e9c5756..d69476dbd19 100644
--- a/tensorflow/core/lib/io/buffered_inputstream.cc
+++ b/tensorflow/core/lib/io/buffered_inputstream.cc
@@ -167,7 +167,8 @@ Status BufferedInputStream::Seek(int64 position) {
   return SkipNBytes(position - bufpos);
 }
 
-Status BufferedInputStream::ReadAll(string* result) {
+template <typename T>
+Status BufferedInputStream::ReadAll(T* result) {
   result->clear();
   Status status;
   while (status.ok()) {
@@ -186,6 +187,11 @@ Status BufferedInputStream::ReadAll(string* result) {
   return status;
 }
 
+template Status BufferedInputStream::ReadAll<string>(string* result);
+#ifdef USE_TSTRING
+template Status BufferedInputStream::ReadAll<tstring>(tstring* result);
+#endif  // USE_TSTRING
+
 Status BufferedInputStream::Reset() {
   TF_RETURN_IF_ERROR(input_stream_->Reset());
   pos_ = 0;
diff --git a/tensorflow/core/lib/io/buffered_inputstream.h b/tensorflow/core/lib/io/buffered_inputstream.h
index 96a95b7ed95..57d7615aace 100644
--- a/tensorflow/core/lib/io/buffered_inputstream.h
+++ b/tensorflow/core/lib/io/buffered_inputstream.h
@@ -79,7 +79,8 @@ class BufferedInputStream : public InputStreamInterface {
   //
   // Note: the amount of memory used by this function call is unbounded, so only
   // use in ops that expect that behavior.
-  Status ReadAll(string* result);
+  template <typename T>
+  Status ReadAll(T* result);
 
   Status Reset() override;
 
diff --git a/tensorflow/core/lib/jpeg/jpeg_handle.cc b/tensorflow/core/lib/jpeg/jpeg_handle.cc
index 0ab9249cf59..5f1c9dfa94d 100644
--- a/tensorflow/core/lib/jpeg/jpeg_handle.cc
+++ b/tensorflow/core/lib/jpeg/jpeg_handle.cc
@@ -84,7 +84,7 @@ void SetDest(j_compress_ptr cinfo, void *buffer, int bufsize) {
 
 // -----------------------------------------------------------------------------
 void SetDest(j_compress_ptr cinfo, void *buffer, int bufsize,
-             string *destination) {
+             tstring *destination) {
   MemDestMgr *dest;
   if (cinfo->dest == nullptr) {
     cinfo->dest = reinterpret_cast<struct jpeg_destination_mgr *>(
diff --git a/tensorflow/core/lib/jpeg/jpeg_handle.h b/tensorflow/core/lib/jpeg/jpeg_handle.h
index 86fa3ac5c23..d40cbaae939 100644
--- a/tensorflow/core/lib/jpeg/jpeg_handle.h
+++ b/tensorflow/core/lib/jpeg/jpeg_handle.h
@@ -33,7 +33,7 @@ typedef struct {
   JOCTET *buffer;
   int bufsize;
   int datacount;
-  string *dest;
+  tstring *dest;
 } MemDestMgr;
 
 typedef struct {
@@ -52,7 +52,7 @@ void SetDest(j_compress_ptr cinfo, void *buffer, int bufsize);
 // Same as above, except that buffer is only used as a temporary structure and
 // is emptied into "destination" as soon as it fills up.
 void SetDest(j_compress_ptr cinfo, void *buffer, int bufsize,
-             string *destination);
+             tstring *destination);
 
 }  // namespace jpeg
 }  // namespace tensorflow
diff --git a/tensorflow/core/lib/jpeg/jpeg_mem.cc b/tensorflow/core/lib/jpeg/jpeg_mem.cc
index a21b440318e..03befabdefe 100644
--- a/tensorflow/core/lib/jpeg/jpeg_mem.cc
+++ b/tensorflow/core/lib/jpeg/jpeg_mem.cc
@@ -592,7 +592,7 @@ bool GetImageInfo(const void* srcdata, int datasize, int* width, int* height,
 
 namespace {
 bool CompressInternal(const uint8* srcdata, int width, int height,
-                      const CompressFlags& flags, string* output) {
+                      const CompressFlags& flags, tstring* output) {
   output->clear();
   const int components = (static_cast<int>(flags.format) & 0xff);
 
@@ -762,14 +762,14 @@ bool CompressInternal(const uint8* srcdata, int width, int height,
 // -----------------------------------------------------------------------------
 
 bool Compress(const void* srcdata, int width, int height,
-              const CompressFlags& flags, string* output) {
+              const CompressFlags& flags, tstring* output) {
   return CompressInternal(static_cast<const uint8*>(srcdata), width, height,
                           flags, output);
 }
 
-string Compress(const void* srcdata, int width, int height,
-                const CompressFlags& flags) {
-  string temp;
+tstring Compress(const void* srcdata, int width, int height,
+                 const CompressFlags& flags) {
+  tstring temp;
   CompressInternal(static_cast<const uint8*>(srcdata), width, height, flags,
                    &temp);
   // If CompressInternal fails, temp will be empty.
diff --git a/tensorflow/core/lib/jpeg/jpeg_mem.h b/tensorflow/core/lib/jpeg/jpeg_mem.h
index 03437a4e78a..08b379887a4 100644
--- a/tensorflow/core/lib/jpeg/jpeg_mem.h
+++ b/tensorflow/core/lib/jpeg/jpeg_mem.h
@@ -149,12 +149,12 @@ struct CompressFlags {
 // The encoded data is returned as a string.
 // If not empty, XMP metadata can be embedded in the image header
 // On error, returns the empty string (which is never a valid jpeg).
-string Compress(const void* srcdata, int width, int height,
-                const CompressFlags& flags);
+tstring Compress(const void* srcdata, int width, int height,
+                 const CompressFlags& flags);
 
 // On error, returns false and sets output to empty.
 bool Compress(const void* srcdata, int width, int height,
-              const CompressFlags& flags, string* output);
+              const CompressFlags& flags, tstring* output);
 
 }  // namespace jpeg
 }  // namespace tensorflow
diff --git a/tensorflow/core/lib/jpeg/jpeg_mem_unittest.cc b/tensorflow/core/lib/jpeg/jpeg_mem_unittest.cc
index 62dd31a65f6..bec84dbf0ae 100644
--- a/tensorflow/core/lib/jpeg/jpeg_mem_unittest.cc
+++ b/tensorflow/core/lib/jpeg/jpeg_mem_unittest.cc
@@ -326,7 +326,7 @@ TEST(JpegMemTest, Jpeg2) {
     CHECK_NE(string::npos, cpdata1.find(kXMP));
 
     // Test the other API, where a storage string is supplied
-    string cptest;
+    tstring cptest;
     flags.stride = 0;
     Compress(refdata1.get(), in_w, in_h, flags, &cptest);
     CHECK_EQ(cptest, cpdata1);
@@ -465,7 +465,7 @@ TEST(JpegMemTest, ChromaDownsampling) {
     flags.format = FORMAT_RGB;
     flags.quality = 85;
     flags.chroma_downsampling = downsample;
-    string recompressed;
+    tstring recompressed;
     Compress(uncompressed.get(), w, h, flags, &recompressed);
     CHECK(!recompressed.empty());
     CHECK_EQ(IsChromaDownsampled(recompressed), downsample);
diff --git a/tensorflow/core/lib/png/png_io.cc b/tensorflow/core/lib/png/png_io.cc
index e8dbcb97b94..3c7a42ae4a7 100644
--- a/tensorflow/core/lib/png/png_io.cc
+++ b/tensorflow/core/lib/png/png_io.cc
@@ -105,8 +105,9 @@ void StringReader(png_structp png_ptr, png_bytep data, png_size_t length) {
   }
 }
 
+template <typename T>
 void StringWriter(png_structp png_ptr, png_bytep data, png_size_t length) {
-  string* const s = absl::bit_cast<string*>(png_get_io_ptr(png_ptr));
+  T* const s = absl::bit_cast<T*>(png_get_io_ptr(png_ptr));
   s->append(absl::bit_cast<const char*>(data), length);
 }
 
@@ -340,9 +341,10 @@ bool CommonFinishDecode(png_bytep data, int row_bytes, DecodeContext* context) {
   return ok;
 }
 
+template <typename T>
 bool WriteImageToBuffer(
     const void* image, int width, int height, int row_bytes, int num_channels,
-    int channel_bits, int compression, string* png_string,
+    int channel_bits, int compression, T* png_string,
     const std::vector<std::pair<string, string> >* metadata) {
   CHECK_NOTNULL(image);
   CHECK_NOTNULL(png_string);
@@ -384,7 +386,7 @@ bool WriteImageToBuffer(
       return false;
   }
 
-  png_set_write_fn(png_ptr, png_string, StringWriter, StringWriterFlush);
+  png_set_write_fn(png_ptr, png_string, StringWriter<T>, StringWriterFlush);
   if (compression < 0) compression = Z_DEFAULT_COMPRESSION;
   png_set_compression_level(png_ptr, compression);
   png_set_compression_mem_level(png_ptr, MAX_MEM_LEVEL);
@@ -418,5 +420,16 @@ bool WriteImageToBuffer(
   return true;
 }
 
+template bool WriteImageToBuffer<string>(
+    const void* image, int width, int height, int row_bytes, int num_channels,
+    int channel_bits, int compression, string* png_string,
+    const std::vector<std::pair<string, string> >* metadata);
+#ifdef USE_TSTRING
+template bool WriteImageToBuffer<tstring>(
+    const void* image, int width, int height, int row_bytes, int num_channels,
+    int channel_bits, int compression, tstring* png_string,
+    const std::vector<std::pair<string, string> >* metadata);
+#endif  // USE_TSTRING
+
 }  // namespace png
 }  // namespace tensorflow
diff --git a/tensorflow/core/lib/png/png_io.h b/tensorflow/core/lib/png/png_io.h
index d3a44b19eed..5ecbee89fb7 100644
--- a/tensorflow/core/lib/png/png_io.h
+++ b/tensorflow/core/lib/png/png_io.h
@@ -94,9 +94,10 @@ void CommonFreeDecode(DecodeContext* context);
 // compression is in [-1,9], where 0 is fast and weak compression, 9 is slow
 // and strong, and -1 is the zlib default.
 
+template <typename T>
 bool WriteImageToBuffer(
     const void* image, int width, int height, int row_bytes, int num_channels,
-    int channel_bits, int compression, string* png_string,
+    int channel_bits, int compression, T* png_string,
     const std::vector<std::pair<string, string> >* metadata);
 
 }  // namespace png
diff --git a/tensorflow/core/lib/strings/base64.cc b/tensorflow/core/lib/strings/base64.cc
index c5a521f18ae..80eec3a9403 100644
--- a/tensorflow/core/lib/strings/base64.cc
+++ b/tensorflow/core/lib/strings/base64.cc
@@ -73,7 +73,8 @@ Status DecodeThreeChars(const char* codes, char* result) {
 }
 }  // namespace
 
-Status Base64Decode(StringPiece data, string* decoded) {
+template <typename T>
+Status Base64Decode(StringPiece data, T* decoded) {
   if (decoded == nullptr) {
     return errors::Internal("'decoded' cannot be nullptr.");
   }
@@ -135,11 +136,13 @@ Status Base64Decode(StringPiece data, string* decoded) {
   return Status::OK();
 }
 
-Status Base64Encode(StringPiece source, string* encoded) {
+template <typename T>
+Status Base64Encode(StringPiece source, T* encoded) {
   return Base64Encode(source, false, encoded);
 }
 
-Status Base64Encode(StringPiece source, bool with_padding, string* encoded) {
+template <typename T>
+Status Base64Encode(StringPiece source, bool with_padding, T* encoded) {
   const char* const base64_chars = kBase64UrlSafeChars;
   if (encoded == nullptr) {
     return errors::Internal("'encoded' cannot be nullptr.");
@@ -191,4 +194,16 @@ Status Base64Encode(StringPiece source, bool with_padding, string* encoded) {
   return Status::OK();
 }
 
+template Status Base64Decode<string>(StringPiece data, string* decoded);
+template Status Base64Encode<string>(StringPiece source, string* encoded);
+template Status Base64Encode<string>(StringPiece source, bool with_padding,
+                                     string* encoded);
+
+#ifdef USE_TSTRING
+template Status Base64Decode<tstring>(StringPiece data, tstring* decoded);
+template Status Base64Encode<tstring>(StringPiece source, tstring* encoded);
+template Status Base64Encode<tstring>(StringPiece source, bool with_padding,
+                                      tstring* encoded);
+#endif  // USE_TSTRING
+
 }  // namespace tensorflow
diff --git a/tensorflow/core/lib/strings/base64.h b/tensorflow/core/lib/strings/base64.h
index cb8f50df11f..7eecbcae437 100644
--- a/tensorflow/core/lib/strings/base64.h
+++ b/tensorflow/core/lib/strings/base64.h
@@ -24,13 +24,17 @@ namespace tensorflow {
 /// \brief Converts data into web-safe base64 encoding.
 ///
 /// See https://en.wikipedia.org/wiki/Base64
-Status Base64Encode(StringPiece data, bool with_padding, string* encoded);
-Status Base64Encode(StringPiece data, string* encoded);  // with_padding=false.
+template <typename T>
+Status Base64Encode(StringPiece source, bool with_padding, T* encoded);
+template <typename T>
+Status Base64Encode(StringPiece source,
+                    T* encoded);  // with_padding=false.
 
 /// \brief Converts data from web-safe base64 encoding.
 ///
 /// See https://en.wikipedia.org/wiki/Base64
-Status Base64Decode(StringPiece data, string* decoded);
+template <typename T>
+Status Base64Decode(StringPiece data, T* decoded);
 
 }  // namespace tensorflow
 
diff --git a/tensorflow/core/lib/strings/base64_test.cc b/tensorflow/core/lib/strings/base64_test.cc
index 3e03d595d27..df4a4bcf593 100644
--- a/tensorflow/core/lib/strings/base64_test.cc
+++ b/tensorflow/core/lib/strings/base64_test.cc
@@ -21,11 +21,11 @@ namespace tensorflow {
 
 TEST(Base64, EncodeDecode) {
   const string original = "a simple test message!";
-  string encoded;
+  tstring encoded;
   TF_EXPECT_OK(Base64Encode(original, &encoded));
   EXPECT_EQ("YSBzaW1wbGUgdGVzdCBtZXNzYWdlIQ", encoded);
 
-  string decoded;
+  tstring decoded;
   TF_EXPECT_OK(Base64Decode(encoded, &decoded));
   EXPECT_EQ(original, decoded);
 }
diff --git a/tensorflow/core/lib/wav/wav_io.cc b/tensorflow/core/lib/wav/wav_io.cc
index b4f0bfbfb96..62bd7cdf157 100644
--- a/tensorflow/core/lib/wav/wav_io.cc
+++ b/tensorflow/core/lib/wav/wav_io.cc
@@ -132,9 +132,10 @@ Status ReadString(const string& data, int expected_length, string* value,
   return Status::OK();
 }
 
+template <typename T>
 Status EncodeAudioAsS16LEWav(const float* audio, size_t sample_rate,
                              size_t num_channels, size_t num_frames,
-                             string* wav_string) {
+                             T* wav_string) {
   constexpr size_t kFormatChunkSize = 16;
   constexpr size_t kCompressionCodePcm = 1;
   constexpr size_t kBitsPerSample = 16;
@@ -173,7 +174,7 @@ Status EncodeAudioAsS16LEWav(const float* audio, size_t sample_rate,
   }
 
   wav_string->resize(file_size);
-  char* data = &wav_string->at(0);
+  char* data = &(*wav_string)[0];
   WavHeader* header = absl::bit_cast<WavHeader*>(data);
 
   // Fill RIFF chunk.
@@ -208,6 +209,19 @@ Status EncodeAudioAsS16LEWav(const float* audio, size_t sample_rate,
   return Status::OK();
 }
 
+template Status EncodeAudioAsS16LEWav<string>(const float* audio,
+                                              size_t sample_rate,
+                                              size_t num_channels,
+                                              size_t num_frames,
+                                              string* wav_string);
+#ifdef USE_TSTRING
+template Status EncodeAudioAsS16LEWav<tstring>(const float* audio,
+                                               size_t sample_rate,
+                                               size_t num_channels,
+                                               size_t num_frames,
+                                               tstring* wav_string);
+#endif  // USE_TSTRING
+
 Status DecodeLin16WaveAsFloatVector(const string& wav_string,
                                     std::vector<float>* float_values,
                                     uint32* sample_count, uint16* channel_count,
diff --git a/tensorflow/core/lib/wav/wav_io.h b/tensorflow/core/lib/wav/wav_io.h
index 9145e7c9f22..0c8c1abe38c 100644
--- a/tensorflow/core/lib/wav/wav_io.h
+++ b/tensorflow/core/lib/wav/wav_io.h
@@ -41,9 +41,10 @@ namespace wav {
 // if (EncodeAudioAsS16LEWav(audio_buffer, 8000, 2, 4, &wav_string).ok()) {
 //   // Use wav_string.
 // }
+template <typename T>
 Status EncodeAudioAsS16LEWav(const float* audio, size_t sample_rate,
                              size_t num_channels, size_t num_frames,
-                             string* wav_string);
+                             T* wav_string);
 
 // Decodes the little-endian signed 16-bit PCM WAV file data (aka LIN16
 // encoding) into a float Tensor. The channels are encoded as the lowest
diff --git a/tensorflow/core/lib/wav/wav_io_test.cc b/tensorflow/core/lib/wav/wav_io_test.cc
index 9dc42929104..66811e3669e 100644
--- a/tensorflow/core/lib/wav/wav_io_test.cc
+++ b/tensorflow/core/lib/wav/wav_io_test.cc
@@ -34,12 +34,13 @@ Status ReadString(const string& data, int expected_length, string* value,
 
 TEST(WavIO, BadArguments) {
   float audio[] = {0.0f, 0.1f, 0.2f, 0.3f, 0.4f, 0.5f};
-  string result;
+  tstring result;
 
   EXPECT_EQ(error::INVALID_ARGUMENT,
             EncodeAudioAsS16LEWav(nullptr, 44100, 2, 3, &result).code());
-  EXPECT_EQ(error::INVALID_ARGUMENT,
-            EncodeAudioAsS16LEWav(audio, 44100, 2, 3, nullptr).code());
+  EXPECT_EQ(
+      error::INVALID_ARGUMENT,
+      EncodeAudioAsS16LEWav(audio, 44100, 2, 3, (tstring*)nullptr).code());
 
   const size_t kuint32max_plus_one = static_cast<size_t>(kuint32max) + 1;
   const size_t kuint16max_plus_one = static_cast<size_t>(kuint16max) + 1;
diff --git a/tensorflow/core/platform/protobuf.cc b/tensorflow/core/platform/protobuf.cc
index c9e6f3bf5c6..17ecbf77da6 100644
--- a/tensorflow/core/platform/protobuf.cc
+++ b/tensorflow/core/platform/protobuf.cc
@@ -20,4 +20,43 @@ namespace tensorflow {
 const char* kProtobufInt64Typename = "::tensorflow::protobuf_int64";
 const char* kProtobufUint64Typename = "::tensorflow::protobuf_uint64";
 
+#ifdef USE_TSTRING
+TStringOutputStream::TStringOutputStream(tstring* target) : target_(target) {}
+
+// Extends *target_ and hands the new tail to the caller via *data / *size.
+// Always succeeds: oversized growth is capped instead of being rejected.
+bool TStringOutputStream::Next(void** data, int* size) {
+  // Keep sizes as size_t: narrowing size() to int corrupts the offsets below
+  // once the target string exceeds INT_MAX bytes.
+  const size_t old_size = target_->size();
+
+  // Grow the string.
+  size_t new_size;
+  if (old_size < target_->capacity()) {
+    // Resize the string to match its capacity, since we can get away
+    // without a memory allocation this way.
+    new_size = target_->capacity();
+  } else {
+    // Size has reached capacity: double it, but never go below kMinimumSize.
+    new_size = std::max(old_size * 2, static_cast<size_t>(kMinimumSize));
+  }
+  // Hand out at most INT_MAX new bytes so that *size cannot overflow.
+  const size_t max_chunk = std::numeric_limits<int>::max();
+  new_size = std::min(new_size, old_size + max_chunk);
+  target_->resize_uninitialized(new_size);
+
+  *data = target_->data() + old_size;
+  *size = static_cast<int>(target_->size() - old_size);
+  return true;
+}
+
+void TStringOutputStream::BackUp(int count) {
+  target_->resize(target_->size() - count);  // NOTE: count is not validated.
+}
+
+protobuf::io::ByteCountInt64 TStringOutputStream::ByteCount() const {
+  return target_->size();  // Whole string, including pre-existing bytes.
+}
+#endif  // USE_TSTRING
+
 }  // namespace tensorflow
diff --git a/tensorflow/core/platform/protobuf.h b/tensorflow/core/platform/protobuf.h
index d7c41051bae..28d34690091 100644
--- a/tensorflow/core/platform/protobuf.h
+++ b/tensorflow/core/platform/protobuf.h
@@ -90,6 +90,29 @@ inline bool SerializeToTString(const protobuf::MessageLite& proto,
 #endif  // USE_TSTRING
 }
 
+#ifdef USE_TSTRING
+// Analogue to StringOutputStream for tstring: output lands in `*target`.
+class TStringOutputStream : public protobuf::io::ZeroCopyOutputStream {
+ public:
+  explicit TStringOutputStream(tstring* target);
+  ~TStringOutputStream() override = default;  // Leaves `*target` untouched.
+
+  TStringOutputStream(const TStringOutputStream&) = delete;  // Not copyable.
+  void operator=(const TStringOutputStream&) = delete;
+
+  bool Next(void** data, int* size) override;  // Grows the string for writing.
+  void BackUp(int count) override;  // Shrinks it by `count` bytes.
+  protobuf::io::ByteCountInt64 ByteCount() const override;  // Current size.
+
+ private:
+  static const int kMinimumSize = 16;  // Floor used when Next() doubles.
+
+  tstring* target_;  // Destination string; never deleted by this class.
+};
+#else   // USE_TSTRING
+typedef protobuf::io::StringOutputStream TStringOutputStream;
+#endif  // USE_TSTRING
+
 }  // namespace tensorflow
 
 #endif  // TENSORFLOW_CORE_PLATFORM_PROTOBUF_H_
diff --git a/tensorflow/core/platform/tstring.h b/tensorflow/core/platform/tstring.h
index 0e4c97af231..f8e0a86bf95 100644
--- a/tensorflow/core/platform/tstring.h
+++ b/tensorflow/core/platform/tstring.h
@@ -157,6 +157,8 @@ class tstring {
 
   size_t size() const { return str_.size(); }
 
+  size_t capacity() const { return str_.capacity(); }
+
   const char* c_str() const { return str_.c_str(); }
 
   const char* data() const { return str_.data(); }
@@ -207,6 +209,8 @@ class tstring {
     return *this;
   }
 
+  void push_back(char ch) { str_.push_back(ch); }
+
   friend const tstring operator+(const tstring& a, const tstring& b);
   friend bool operator==(const char* a, const tstring& b);
   friend bool operator==(const std::string& a, const tstring& b);