Update stats_calculator to allow dumping values as CSV

this way it is easier for processing by tools.

PiperOrigin-RevId: 293855718
Change-Id: I098f15977d58c93469a046f17a961c879a4213bb
This commit is contained in:
Karim Nosir 2020-02-07 11:22:56 -08:00 committed by TensorFlower Gardener
parent 851a0b6651
commit f517e2617a
2 changed files with 62 additions and 39 deletions

View File

@ -17,8 +17,7 @@ limitations under the License.
#define TENSORFLOW_CORE_UTIL_STAT_SUMMARIZER_OPTIONS_H_
namespace tensorflow {
// Used to control the output of the statistics summarizer;
class StatSummarizerOptions {
public:
struct StatSummarizerOptions {
StatSummarizerOptions()
: show_run_order(true),
run_order_limit(0),
@ -27,7 +26,8 @@ class StatSummarizerOptions {
show_memory(true),
memory_limit(10),
show_type(true),
show_summary(true) {}
show_summary(true),
format_as_csv(false) {}
bool show_run_order;
int run_order_limit;
@ -37,6 +37,7 @@ class StatSummarizerOptions {
int memory_limit;
bool show_type;
bool show_summary;
bool format_as_csv;
};
} // namespace tensorflow

View File

@ -51,7 +51,10 @@ std::string StatsCalculator::HeaderString(const std::string& title) const {
stream << "============================== " << title
<< " ==============================" << std::endl;
if (options_.format_as_csv) {
stream << "node type, start, first, avg_ms, %, cdf%, mem KB, times called, "
"name";
} else {
InitField(stream, 24) << "[node type]";
InitField(stream, 17) << "[start]";
InitField(stream, 9) << "[first]";
@ -62,6 +65,7 @@ std::string StatsCalculator::HeaderString(const std::string& title) const {
InitField(stream, 9) << "[times called]";
stream << "\t"
<< "[Name]";
}
return stream.str();
}
@ -76,6 +80,12 @@ std::string StatsCalculator::ColumnString(const Detail& detail,
const int64_t times_called = detail.times_called / num_runs();
std::stringstream stream;
if (options_.format_as_csv) {
stream << detail.type << ", " << start_ms << ", " << first_time_ms << ", "
<< avg_time_ms << ", " << percentage << "%, " << cdf_percentage
<< "%, " << detail.mem_used.newest() / 1000.0 << ", " << times_called
<< ", " << detail.name;
} else {
InitField(stream, 24) << detail.type;
InitField(stream, 17) << start_ms;
InitField(stream, 9) << first_time_ms;
@ -85,6 +95,7 @@ std::string StatsCalculator::ColumnString(const Detail& detail,
InitField(stream, 10) << detail.mem_used.newest() / 1000.0;
InitField(stream, 9) << times_called;
stream << "\t" << detail.name;
}
return stream.str();
}
@ -186,6 +197,9 @@ std::string StatsCalculator::GetStatsByNodeType() const {
std::pair<std::string, int64_t>(node_type.first, mem_used));
}
if (options_.format_as_csv) {
stream << "node type, count, avg_ms, avg %, cdf %, mem KB, times called\n";
} else {
InitField(stream, 24) << "[Node type]";
InitField(stream, 9) << "[count]";
InitField(stream, 10) << "[avg ms]";
@ -194,6 +208,7 @@ std::string StatsCalculator::GetStatsByNodeType() const {
InitField(stream, 10) << "[mem KB]";
InitField(stream, 10) << "[times called]";
stream << std::endl;
}
float cdf = 0.0f;
while (!timings.empty()) {
@ -210,6 +225,12 @@ std::string StatsCalculator::GetStatsByNodeType() const {
((entry.first / static_cast<float>(accumulated_us)) * 100.0f);
cdf += percentage;
if (options_.format_as_csv) {
stream << node_type << ", " << node_type_map_count[node_type] << ", "
<< time_per_run_ms << ", " << percentage << "%, " << cdf << "%, "
<< memory << ", " << node_type_map_times_called[node_type]
<< std::endl;
} else {
InitField(stream, 24) << node_type;
InitField(stream, 9) << node_type_map_count[node_type];
InitField(stream, 10) << time_per_run_ms;
@ -219,6 +240,7 @@ std::string StatsCalculator::GetStatsByNodeType() const {
InitField(stream, 9) << node_type_map_times_called[node_type];
stream << std::endl;
}
}
stream << std::endl;
return stream.str();
}