Add RunEnvironmentResult to op_stats.proto
PiperOrigin-RevId: 288806344 Change-Id: I7acb0e00fed8e42819b25479130c8114993ac7ba
This commit is contained in:
parent
d79a34bfa4
commit
9abca16f96
@ -16,6 +16,75 @@ message PerfEnv {
|
|||||||
double ridge_point = 3;
|
double ridge_point = 3;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Result proto for host-independent job information.
|
||||||
|
message HostIndependentJobInfoResult {
|
||||||
|
// The change-list number of this build.
|
||||||
|
int64 change_list = 1;
|
||||||
|
// The time of this build (nanoseconds since the Unix epoch).
|
||||||
|
int64 build_time = 2;
|
||||||
|
// The target of this build.
|
||||||
|
string build_target = 3;
|
||||||
|
// Profiling duration (in ms).
|
||||||
|
uint32 profile_duration_ms = 4;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Result proto for host-dependent job information.
|
||||||
|
message HostDependentJobInfoResult {
|
||||||
|
// This ID of the host where the job was run on.
|
||||||
|
string host_id = 1;
|
||||||
|
// The command line used to run the job.
|
||||||
|
string command_line = 2;
|
||||||
|
// The start time of this run (nanoseconds since the Unix epoch).
|
||||||
|
int64 start_time = 3;
|
||||||
|
// BNS address specified by client at time of profiling request.
|
||||||
|
string bns_address = 4;
|
||||||
|
// Profiling start walltime (in ns).
|
||||||
|
uint64 profile_time_ns = 5;
|
||||||
|
}
|
||||||
|
|
||||||
|
// System topology, which describes the number of chips in a pod
|
||||||
|
// and the connectivity style.
|
||||||
|
message SystemTopology {
|
||||||
|
// The X, Y, and Z dimensions of this topology. 0 means that dimension does
|
||||||
|
// not exist.
|
||||||
|
int64 x_dimension = 1;
|
||||||
|
int64 y_dimension = 2;
|
||||||
|
int64 z_dimension = 3;
|
||||||
|
// The number of expected bad chips in this system.
|
||||||
|
int64 num_expected_reduced_chips = 4;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Result proto for RunEnvironment (the run environment of a profiling session).
|
||||||
|
message RunEnvironment {
|
||||||
|
// Number of hosts used.
|
||||||
|
int32 host_count = 1;
|
||||||
|
// Number of tasks used.
|
||||||
|
int32 task_count = 2;
|
||||||
|
// Distinct hostnames seen.
|
||||||
|
map<string, bool> hostnames = 3;
|
||||||
|
// The type of device used.
|
||||||
|
string device_type = 4;
|
||||||
|
// The number of device cores used.
|
||||||
|
// In TPU case, this corresponds to the number of TPU cores
|
||||||
|
// In GPU case, this corresponds to the number of GPUs (not the number of
|
||||||
|
// SMs).
|
||||||
|
int32 device_core_count = 5;
|
||||||
|
// The per-device-core batch size.
|
||||||
|
int32 per_core_batch_size = 6;
|
||||||
|
// Host-independent job information.
|
||||||
|
HostIndependentJobInfoResult host_independent_job_info = 7;
|
||||||
|
// Host-dependent job information.
|
||||||
|
repeated HostDependentJobInfoResult host_dependent_job_info = 8;
|
||||||
|
// The number of replicas, corresponds to input parallelism.
|
||||||
|
// If there is no model parallelism, replica_count = device_core_count
|
||||||
|
int32 replica_count = 9;
|
||||||
|
// The number of cores used for a single replica, e.g. model parallelism.
|
||||||
|
// If there is no model parallelism, then num_cores_per_replica = 1
|
||||||
|
int32 num_cores_per_replica = 10;
|
||||||
|
// The chip interconnection topology.
|
||||||
|
SystemTopology topology = 11;
|
||||||
|
}
|
||||||
|
|
||||||
// Operator Statistics.
|
// Operator Statistics.
|
||||||
message OpStats {
|
message OpStats {
|
||||||
// The database for the op metrics collected from the host over the entire
|
// The database for the op metrics collected from the host over the entire
|
||||||
|
Loading…
x
Reference in New Issue
Block a user