use xspace to serialize gpu trace.
PiperOrigin-RevId: 339102774 Change-Id: Ia329276e58ab53668de6269918f2cd5ef5fbfdf7
This commit is contained in:
		
							parent
							
								
									76a08f796c
								
							
						
					
					
						commit
						2eda043cf4
					
				| @ -32,14 +32,31 @@ namespace profiler { | |||||||
| 
 | 
 | ||||||
| namespace { | namespace { | ||||||
| 
 | 
 | ||||||
| bool IsHostEvent(const CuptiTracerEvent& event) { | bool IsHostEvent(const CuptiTracerEvent& event, int64* line_id) { | ||||||
|   // DriverCallback(i.e. kernel launching) events are host events.
 |   // DriverCallback(i.e. kernel launching) events are host events.
 | ||||||
|   if (event.source == CuptiTracerEventSource::DriverCallback) return true; |   if (event.source == CuptiTracerEventSource::DriverCallback) { | ||||||
|  |     *line_id = event.thread_id; | ||||||
|  |     return true; | ||||||
|  |   } | ||||||
|   // Non-overhead activity events are device events.
 |   // Non-overhead activity events are device events.
 | ||||||
|   if (event.type != CuptiTracerEventType::Overhead) return false; |   if (event.type != CuptiTracerEventType::Overhead) { | ||||||
|  |     *line_id = event.stream_id; | ||||||
|  |     return false; | ||||||
|  |   } | ||||||
|   // Overhead events can be associated with a thread or a stream, etc.
 |   // Overhead events can be associated with a thread or a stream, etc.
 | ||||||
|   // If a valid thread id is specified, we consider it as a host event.
 |   // If a valid thread id is specified, we consider it as a host event.
 | ||||||
|   return event.thread_id != CuptiTracerEvent::kInvalidThreadId; |   //
 | ||||||
|  |   if (event.stream_id != CuptiTracerEvent::kInvalidStreamId) { | ||||||
|  |     *line_id = event.stream_id; | ||||||
|  |     return false; | ||||||
|  |   } else if (event.thread_id != CuptiTracerEvent::kInvalidStreamId && | ||||||
|  |              event.thread_id != 0) { | ||||||
|  |     *line_id = event.thread_id; | ||||||
|  |     return true; | ||||||
|  |   } else { | ||||||
|  |     *line_id = kThreadIdOverhead; | ||||||
|  |     return false; | ||||||
|  |   } | ||||||
| } | } | ||||||
| 
 | 
 | ||||||
| void CreateXEvent(const CuptiTracerEvent& event, XPlaneBuilder* plane, | void CreateXEvent(const CuptiTracerEvent& event, XPlaneBuilder* plane, | ||||||
| @ -60,6 +77,11 @@ void CreateXEvent(const CuptiTracerEvent& event, XPlaneBuilder* plane, | |||||||
|   XEventBuilder xevent = line->AddEvent(*event_metadata); |   XEventBuilder xevent = line->AddEvent(*event_metadata); | ||||||
|   xevent.SetTimestampNs(event.start_time_ns); |   xevent.SetTimestampNs(event.start_time_ns); | ||||||
|   xevent.SetEndTimestampNs(event.end_time_ns); |   xevent.SetEndTimestampNs(event.end_time_ns); | ||||||
|  |   if (event.source == CuptiTracerEventSource::DriverCallback) { | ||||||
|  |     xevent.AddStatValue( | ||||||
|  |         *plane->GetOrCreateStatMetadata(GetStatTypeStr(StatType::kDeviceId)), | ||||||
|  |         event.device_id); | ||||||
|  |   } | ||||||
|   if (event.correlation_id != CuptiTracerEvent::kInvalidCorrelationId) { |   if (event.correlation_id != CuptiTracerEvent::kInvalidCorrelationId) { | ||||||
|     xevent.AddStatValue(*plane->GetOrCreateStatMetadata( |     xevent.AddStatValue(*plane->GetOrCreateStatMetadata( | ||||||
|                             GetStatTypeStr(StatType::kCorrelationId)), |                             GetStatTypeStr(StatType::kCorrelationId)), | ||||||
| @ -146,6 +168,8 @@ std::string GetDeviceXLineName( | |||||||
|   std::string line_name = absl::StrCat("Stream #", stream_id); |   std::string line_name = absl::StrCat("Stream #", stream_id); | ||||||
|   event_types.erase(CuptiTracerEventType::Unsupported); |   event_types.erase(CuptiTracerEventType::Unsupported); | ||||||
|   if (event_types.empty()) return line_name; |   if (event_types.empty()) return line_name; | ||||||
|  |   if (event_types.count(CuptiTracerEventType::Overhead)) | ||||||
|  |     return "CUPTI overhead"; | ||||||
|   std::vector<const char*> type_names; |   std::vector<const char*> type_names; | ||||||
|   for (const auto event_type : event_types) { |   for (const auto event_type : event_types) { | ||||||
|     type_names.emplace_back(GetTraceEventTypeName(event_type)); |     type_names.emplace_back(GetTraceEventTypeName(event_type)); | ||||||
| @ -226,23 +250,26 @@ class CuptiTraceCollectorImpl : public CuptiTraceCollector { | |||||||
|                                      step_stats); |                                      step_stats); | ||||||
|     } |     } | ||||||
|   } |   } | ||||||
|   void Export(XSpace* space, uint64 end_gpu_ns) override { |   // Returns true if some GPU events are captured.
 | ||||||
|  |   bool Export(XSpace* space, uint64 end_gpu_ns) override { | ||||||
|     LOG(INFO) << " GpuTracer has collected " << num_callback_events_ |     LOG(INFO) << " GpuTracer has collected " << num_callback_events_ | ||||||
|               << " callback api events and " << num_activity_events_ |               << " callback api events and " << num_activity_events_ | ||||||
|               << " activity events. " << ReportDroppedEvents(); |               << " activity events. " << ReportDroppedEvents(); | ||||||
|  |     size_t num_events = 0; | ||||||
|     XPlaneBuilder host_plane( |     XPlaneBuilder host_plane( | ||||||
|         FindOrAddMutablePlaneWithName(space, kCuptiDriverApiPlaneName)); |         FindOrAddMutablePlaneWithName(space, kCuptiDriverApiPlaneName)); | ||||||
|     for (int device_ordinal = 0; device_ordinal < num_gpus_; ++device_ordinal) { |     for (int device_ordinal = 0; device_ordinal < num_gpus_; ++device_ordinal) { | ||||||
|       std::string name = GpuPlaneName(device_ordinal); |       std::string name = GpuPlaneName(device_ordinal); | ||||||
|       XPlaneBuilder device_plane(FindOrAddMutablePlaneWithName(space, name)); |       XPlaneBuilder device_plane(FindOrAddMutablePlaneWithName(space, name)); | ||||||
|       device_plane.SetId(device_ordinal); |       device_plane.SetId(device_ordinal); | ||||||
|       per_device_collector_[device_ordinal].Flush(start_gpu_ns_, end_gpu_ns, |       num_events += per_device_collector_[device_ordinal].Flush( | ||||||
|                                                   &device_plane, &host_plane); |           start_gpu_ns_, end_gpu_ns, &device_plane, &host_plane); | ||||||
|       per_device_collector_[device_ordinal].GetDeviceCapabilities( |       per_device_collector_[device_ordinal].GetDeviceCapabilities( | ||||||
|           device_ordinal, &device_plane); |           device_ordinal, &device_plane); | ||||||
|       NormalizeTimeStamps(&device_plane, start_walltime_ns_); |       NormalizeTimeStamps(&device_plane, start_walltime_ns_); | ||||||
|     } |     } | ||||||
|     NormalizeTimeStamps(&host_plane, start_walltime_ns_); |     NormalizeTimeStamps(&host_plane, start_walltime_ns_); | ||||||
|  |     return num_events > 0; | ||||||
|   } |   } | ||||||
|   std::string ReportDroppedEvents() { |   std::string ReportDroppedEvents() { | ||||||
|     absl::MutexLock lock(&mutex_); |     absl::MutexLock lock(&mutex_); | ||||||
| @ -432,16 +459,15 @@ class CuptiTraceCollectorImpl : public CuptiTraceCollector { | |||||||
|       events.clear(); |       events.clear(); | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     void Flush(uint64 start_gpu_ns, uint64 end_gpu_ns, |     size_t Flush(uint64 start_gpu_ns, uint64 end_gpu_ns, | ||||||
|                  XPlaneBuilder* device_plane, XPlaneBuilder* host_plane) { |                  XPlaneBuilder* device_plane, XPlaneBuilder* host_plane) { | ||||||
|       mutex_lock l(m); |       mutex_lock l(m); | ||||||
|       // Tracking event types per line.
 |       // Tracking event types per line.
 | ||||||
|       absl::flat_hash_map<int64, absl::flat_hash_set<CuptiTracerEventType>> |       absl::flat_hash_map<int64, absl::flat_hash_set<CuptiTracerEventType>> | ||||||
|           events_types_per_line; |           events_types_per_line; | ||||||
|       for (auto& event : events) { |       for (auto& event : events) { | ||||||
|         bool is_host_event = IsHostEvent(event); |         int64 line_id = CuptiTracerEvent::kInvalidThreadId; | ||||||
|         int64 line_id = is_host_event ? static_cast<int64>(event.thread_id) |         bool is_host_event = IsHostEvent(event, &line_id); | ||||||
|                                       : event.stream_id; |  | ||||||
|         if (line_id == CuptiTracerEvent::kInvalidThreadId || |         if (line_id == CuptiTracerEvent::kInvalidThreadId || | ||||||
|             line_id == CuptiTracerEvent::kInvalidStreamId) |             line_id == CuptiTracerEvent::kInvalidStreamId) | ||||||
|           continue; |           continue; | ||||||
| @ -458,7 +484,9 @@ class CuptiTraceCollectorImpl : public CuptiTraceCollector { | |||||||
|       host_plane->ForEachLine([&](XLineBuilder line) { |       host_plane->ForEachLine([&](XLineBuilder line) { | ||||||
|         line.SetName(absl::StrCat("Host Threads/", line.Id())); |         line.SetName(absl::StrCat("Host Threads/", line.Id())); | ||||||
|       }); |       }); | ||||||
|  |       size_t num_events = events.size(); | ||||||
|       events.clear(); |       events.clear(); | ||||||
|  |       return num_events; | ||||||
|     } |     } | ||||||
| 
 | 
 | ||||||
|     void GetDeviceCapabilities(int32 device_ordinal, |     void GetDeviceCapabilities(int32 device_ordinal, | ||||||
|  | |||||||
| @ -180,7 +180,7 @@ class CuptiTraceCollector { | |||||||
| 
 | 
 | ||||||
|   // Consumer side functions (i.e. called by GPU tracer);
 |   // Consumer side functions (i.e. called by GPU tracer);
 | ||||||
|   virtual void Export(StepStats* step_stats) {} |   virtual void Export(StepStats* step_stats) {} | ||||||
|   virtual void Export(XSpace* space, uint64 end_gpu_ns) {} |   virtual bool Export(XSpace* space, uint64 end_gpu_ns) { return true; } | ||||||
|   virtual std::string ReportNumEventsIfDropped() { return ""; } |   virtual std::string ReportNumEventsIfDropped() { return ""; } | ||||||
| 
 | 
 | ||||||
|   AnnotationMap* annotation_map() { return &annotation_map_; } |   AnnotationMap* annotation_map() { return &annotation_map_; } | ||||||
|  | |||||||
| @ -264,7 +264,7 @@ void DeriveEventsFromHostTrace(const XPlane* host_trace, | |||||||
|         if (stat.Type() == StatType::kGroupId) { |         if (stat.Type() == StatType::kGroupId) { | ||||||
|           group_id = stat.IntValue(); |           group_id = stat.IntValue(); | ||||||
|         } else if (stat.Type() == StatType::kDeviceId) { |         } else if (stat.Type() == StatType::kDeviceId) { | ||||||
|           device_id = stat.IntValue(); |           device_id = stat.IntOrUintValue(); | ||||||
|         } else if (stat.Type() == StatType::kCorrelationId) { |         } else if (stat.Type() == StatType::kCorrelationId) { | ||||||
|           correlation_id = stat.IntValue(); |           correlation_id = stat.IntValue(); | ||||||
|         } |         } | ||||||
|  | |||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user