1
0
mirror of https://github.com/fumiama/Retrieval-based-Voice-Conversion-WebUI.git synced 2026-06-10 21:24:16 +08:00

refactor(audio): store all audio-related functions in infer.lib.audio

Refactors the previous commit so that each task has a single function, all located in `infer.lib.audio`.
This commit is contained in:
Alex Murkoff
2024-06-11 12:24:03 +07:00
parent 15cf2e067e
commit 6425f2091e
4 changed files with 74 additions and 74 deletions

View File

@@ -10,6 +10,8 @@ import torch
from tqdm import tqdm
import av
from infer.lib.audio import downsample_audio
cpu = torch.device("cpu")
@@ -219,10 +221,10 @@ class Predictor:
sf.write(path_other, opt, rate)
opt_path_vocal = path_vocal[:-4] + ".%s" % format
opt_path_other = path_other[:-4] + ".%s" % format
process_audio(path_vocal, opt_path_vocal, format)
process_audio(path_other, opt_path_other, format)
downsample_audio(path_vocal, opt_path_vocal, format)
downsample_audio(path_other, opt_path_other, format)
def process_audio(input_path: str, output_path: str, format: str) -> None:
def downsample_audio(input_path: str, output_path: str, format: str) -> None:
if not os.path.exists(input_path): return
input_container = av.open(input_path)