hcq simpler _gpu2cpu_time (#5605)

* hcq simpler _gpu2cpu_time

* rename
This commit is contained in:
nimlgen
2024-07-20 11:10:25 +03:00
committed by GitHub
parent 32b0c07d5a
commit 7ca2c48b64

View File

@@ -436,8 +436,7 @@ class HCQCompiled(Compiled):
"""
Translates local gpu time (timestamp) into global cpu time.
"""
if is_copy: return self.copy_cpu_start_time_us + (gpu_time - self.copy_gpu_start_time_us)
return self.cpu_start_time_us + (gpu_time - self.gpu_start_time_us)
return gpu_time + (self.gpu2cpu_copy_time_diff if is_copy else self.gpu2cpu_compute_time_diff)
def _prof_setup(self):
if not hasattr(self, 'profile_logger'): atexit.register(self._prof_finalize)
@@ -448,9 +447,8 @@ class HCQCompiled(Compiled):
self.timeline_value += 1
cpu_start_time = time.perf_counter_ns() / 1e3
self.timeline_signal.wait(self.timeline_value - 1)
return cpu_start_time, self.timeline_signal.timestamp
self.cpu_start_time_us, self.gpu_start_time_us = _sync_queue(self.hw_compute_queue_t)
self.copy_cpu_start_time_us, self.copy_gpu_start_time_us = _sync_queue(self.hw_copy_queue_t)
return cpu_start_time - self.timeline_signal.timestamp
self.gpu2cpu_compute_time_diff, self.gpu2cpu_copy_time_diff = _sync_queue(self.hw_compute_queue_t), _sync_queue(self.hw_copy_queue_t)
def _prof_process_events(self):
self.raw_prof_records += [(st.timestamp, en.timestamp, name, is_cp) for st, en, name, is_cp in self.sig_prof_records]