Add RunEnvironmentResult to op_stats.proto

PiperOrigin-RevId: 288806344 Change-Id: I7acb0e00fed8e42819b25479130c8114993ac7ba
2020-01-08 17:14:55 -08:00 · 2020-01-08 17:14:55 -08:00 · 9abca16f96
commit 9abca16f96
parent d79a34bfa4
1 changed files with 69 additions and 0 deletions
--- a/tensorflow/core/profiler/protobuf/op_stats.proto
+++ b/tensorflow/core/profiler/protobuf/op_stats.proto
@ -16,6 +16,75 @@ message PerfEnv {
  double ridge_point = 3;
 }

+// Result proto for host-independent job information.
+message HostIndependentJobInfoResult {
+  // The change-list number of this build.
+  int64 change_list = 1;
+  // The time of this build (nanoseconds since the Unix epoch).
+  int64 build_time = 2;
+  // The target of this build.
+  string build_target = 3;
+  // Profiling duration (in ms).
+  uint32 profile_duration_ms = 4;
+}
+
+// Result proto for host-dependent job information.
+message HostDependentJobInfoResult {
+  // This ID of the host where the job was run on.
+  string host_id = 1;
+  // The command line used to run the job.
+  string command_line = 2;
+  // The start time of this run (nanoseconds since the Unix epoch).
+  int64 start_time = 3;
+  // BNS address specified by client at time of profiling request.
+  string bns_address = 4;
+  // Profiling start walltime (in ns).
+  uint64 profile_time_ns = 5;
+}
+
+// System topology, which describes the number of chips in a pod
+// and the connectivity style.
+message SystemTopology {
+  // The X, Y, and Z dimensions of this topology. 0 means that dimension does
+  // not exist.
+  int64 x_dimension = 1;
+  int64 y_dimension = 2;
+  int64 z_dimension = 3;
+  // The number of expected bad chips in this system.
+  int64 num_expected_reduced_chips = 4;
+}
+
+// Result proto for RunEnvironment (the run environment of a profiling session).
+message RunEnvironment {
+  // Number of hosts used.
+  int32 host_count = 1;
+  // Number of tasks used.
+  int32 task_count = 2;
+  // Distinct hostnames seen.
+  map<string, bool> hostnames = 3;
+  // The type of device used.
+  string device_type = 4;
+  // The number of device cores used.
+  //   In TPU case, this corresponds to the number of TPU cores
+  //   In GPU case, this corresponds to the number of GPUs (not the number of
+  //   SMs).
+  int32 device_core_count = 5;
+  // The per-device-core batch size.
+  int32 per_core_batch_size = 6;
+  // Host-independent job information.
+  HostIndependentJobInfoResult host_independent_job_info = 7;
+  // Host-dependent job information.
+  repeated HostDependentJobInfoResult host_dependent_job_info = 8;
+  // The number of replicas, corresponds to input parallelism.
+  // If there is no model parallelism, replica_count = device_core_count
+  int32 replica_count = 9;
+  // The number of cores used for a single replica, e.g. model parallelism.
+  // If there is no model parallelism, then num_cores_per_replica = 1
+  int32 num_cores_per_replica = 10;
+  // The chip interconnection topology.
+  SystemTopology topology = 11;
+}
+
 // Operator Statistics.
 message OpStats {
  // The database for the op metrics collected from the host over the entire