Fix the duration computation in triton_trtllm/client_grpc.py (#1071)

* Update client_grpc.py

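Use `actual_duration` (the length of the generated audio divided by the save sample rate) instead of `estimated_target_duration` when computing metrics such as RTF.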
This commit is contained in:
Alice Yanagi
2025-06-04 11:18:00 +08:00
committed by GitHub
parent 35f130ee85
commit 7e37bc5d9a

View File

@@ -310,8 +310,9 @@ async def send(
audio_save_path = os.path.join(audio_save_dir, f"{item['target_audio_path']}.wav")
sf.write(audio_save_path, audio, save_sample_rate, "PCM_16")
latency_data.append((end, estimated_target_duration))
total_duration += estimated_target_duration
actual_duration = len(audio) / save_sample_rate
latency_data.append((end, actual_duration))
total_duration += actual_duration
return total_duration, latency_data