import json import os import time import re import numpy as np import soundfile import torch import tqdm from scipy.interpolate import interp1d from utils import utils from egs.visinger2.models import SynthesizerTrn from infer import preprocess, cross_fade, infer_ds trans = -12 speaker = "otto" ds_path = "infer/share.ds" config_json = "egs/visinger2/config.json" checkpoint_path = f"/Volumes/Extend/下载/G_110000.pth" file_name = os.path.splitext(os.path.basename(ds_path))[0] step = re.findall(r'G_(\d+)\.pth', checkpoint_path)[0] if __name__ == '__main__': ds = json.load(open(ds_path)) hps = utils.get_hparams_from_file(config_json) net_g = SynthesizerTrn(hps) _ = net_g.eval() _ = utils.load_checkpoint(checkpoint_path, net_g, None) audio = infer_ds(net_g, hps, ds, speaker, trans) soundfile.write(f"{speaker}_{file_name}_{step}step.wav", audio, 44100)