feat(audio): pre-allocate decoded_audio array in the load_audio function

This should improve performance, even if only slightly.
2026-07-18 03:10:29 +08:00 · 2024-06-11 16:23:13 +07:00
parent 68a3d8caf2
commit 2574ce5ea2
1 changed files with 3 additions and 1 deletions
--- a/infer/lib/audio.py
+++ b/infer/lib/audio.py
@@ -42,7 +42,9 @@ def load_audio(file: str, sr: int) -> np.ndarray:
    try:
        container = av.open(file)
        resampler = AudioResampler(format='fltp', layout='mono', rate=sr)
-        decoded_audio = []
+
+        # AV stores duration in microseconds (av.time_base units, 1_000_000 per second)
+        decoded_audio = (((container.duration * sr / container.bit_rate) // 1_000_000) + 1)*[]

        for frame in container.decode(audio=0):
            frame.pts = None  # Clear presentation timestamp to avoid resampling issues