STT-tensorflow/tensorflow/python/client/debug_events_writer_wrapper.cc
Shanqing Cai a8950d70bf [tfdbg2] Add tfdbg_run_id to metadata of data dumps
- A data dump file set generated by tfdbg2 can contain
  multiple subsets when there are multiple hosts involved
  in the instrumented TensorFlow job (e.g., TPUs and Parameter Servers).
  Currently, there is no bit in those subset of files that
  indicates they belong to the same instrumented TF job.
  - This CL addresses this problem by adding a field to the
    metadata proto used by those files (`tfdbg_run_id`)
- The DebugEventsWriter code is revised, so that this new
  field is written to the metadata file of the file set on the writer's
  construction.
- Also in this CL: remove the previous 1-arg `GetDebugEventsWriter(dump_root)`
  that creates the writer object if it doesn't exist at the specified
  dump_root. Replace it with `LookUpDebugEventsWriter(dump_root)` that only
  looks up the writer object and returns a non-OK status if such an object
  hasn't been created at `dump_root`. This makes the code less error prone by
  keeping only the fully-explicit, 3-arg `GetDebugEventsWriter()`.

PiperOrigin-RevId: 316537044
Change-Id: Id5be0b771fbf37c0fc796f1514ed858a0e6d38f0
2020-06-15 13:52:52 -07:00

124 lines
5.6 KiB
C++

/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==============================================================================*/
#include "absl/strings/string_view.h"
#include "pybind11/pybind11.h"
#include "pybind11/pytypes.h"
#include "tensorflow/core/lib/core/status.h"
#include "tensorflow/core/lib/strings/stringprintf.h"
#include "tensorflow/core/util/debug_events_writer.h"
#include "tensorflow/python/lib/core/pybind11_absl.h"
#include "tensorflow/python/lib/core/pybind11_proto.h"
#include "tensorflow/python/lib/core/pybind11_status.h"
PYBIND11_MODULE(_pywrap_debug_events_writer, m) {
namespace py = pybind11;
using namespace tensorflow; // NOLINT(build/namespaces)
using namespace tensorflow::tfdbg; // NOLINT(build/namespaces)
m.def("Init",
[](const std::string& dump_root, const std::string& tfdbg_run_id,
const int64 circular_buffer_size) {
DebugEventsWriter* writer = DebugEventsWriter::GetDebugEventsWriter(
dump_root, tfdbg_run_id, circular_buffer_size);
if (!writer->Init().ok()) {
throw py::value_error(tensorflow::strings::Printf(
"Failed to initialize debug events writer at: %s",
dump_root.c_str()));
}
});
m.def("WriteSourceFile",
[](const std::string& dump_root, const py::object obj) {
CheckProtoType(obj, "tensorflow.DebugEvent");
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(
DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->WriteSerializedNonExecutionDebugEvent(
obj.attr("SerializeToString")().cast<std::string>(),
tfdbg::DebugEventFileType::SOURCE_FILES);
});
m.def("WriteStackFrameWithId",
[](const std::string& dump_root, const py::object& obj) {
CheckProtoType(obj, "tensorflow.DebugEvent");
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(
DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->WriteSerializedNonExecutionDebugEvent(
obj.attr("SerializeToString")().cast<std::string>(),
tfdbg::DebugEventFileType::STACK_FRAMES);
});
m.def("WriteGraphOpCreation",
[](const std::string& dump_root, const py::object& obj) {
CheckProtoType(obj, "tensorflow.DebugEvent");
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(
DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->WriteSerializedNonExecutionDebugEvent(
obj.attr("SerializeToString")().cast<std::string>(),
tfdbg::DebugEventFileType::GRAPHS);
});
m.def("WriteDebuggedGraph",
[](const std::string& dump_root, const py::object& obj) {
CheckProtoType(obj, "tensorflow.DebugEvent");
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(
DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->WriteSerializedNonExecutionDebugEvent(
obj.attr("SerializeToString")().cast<std::string>(),
tfdbg::DebugEventFileType::GRAPHS);
});
m.def("WriteExecution",
[](const std::string& dump_root, const py::object& obj) {
CheckProtoType(obj, "tensorflow.DebugEvent");
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(
DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->WriteSerializedExecutionDebugEvent(
obj.attr("SerializeToString")().cast<std::string>(),
tfdbg::DebugEventFileType::EXECUTION);
});
m.def("WriteGraphExecutionTrace",
[](const std::string& dump_root, const py::object& obj) {
CheckProtoType(obj, "tensorflow.DebugEvent");
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(
DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->WriteSerializedExecutionDebugEvent(
obj.attr("SerializeToString")().cast<std::string>(),
tfdbg::DebugEventFileType::GRAPH_EXECUTION_TRACES);
});
m.def("RegisterDeviceAndGetId", [](const std::string& dump_root,
const std::string& device_name) {
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
return writer->RegisterDeviceAndGetId(device_name);
});
m.def("FlushNonExecutionFiles", [](const std::string& dump_root) {
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->FlushNonExecutionFiles();
});
m.def("FlushExecutionFiles", [](const std::string& dump_root) {
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->FlushExecutionFiles();
});
m.def("Close", [](const std::string& dump_root) {
DebugEventsWriter* writer = nullptr;
TF_CHECK_OK(DebugEventsWriter::LookUpDebugEventsWriter(dump_root, &writer));
writer->Close();
});
};