innnky committed on
Commit
e306eaf
1 Parent(s): 8f5da61
Files changed (2) hide show
  1. app.py +4 -3
  2. infer/__init__.py +1 -0
app.py CHANGED
@@ -41,12 +41,13 @@ def vc_fn(speaker, ds, vc_transform):
41
  ph_dur= [float(i) for i in ph_dur.split(" ")]
42
  f0_seq = [float(i) for i in f0_seq.split(" ")]
43
  dur+=sum(ph_dur)
44
- if sum(ph_dur) >30:
 
45
  flag = True
46
  except:
47
  return "ds工程需要冻结f0和音素参数才能使用此模型合成", None
48
  if flag:
49
- return "单个切片时长必须小于30s,否则请使用本地推理", None
50
  if dur>120:
51
  return "总时长需要小于2分钟,否则请使用本地推理", None
52
  out_audio = infer_ds(net_g, hps, ds, speaker, vc_transform)
@@ -69,7 +70,7 @@ with app:
69
 
70
  由于此模型是nomidi模型,因此导出ds工程时需要冻结音素和音高参数, 否则会报错,具体DiffSinger工程制作详细问题可以加入DiffSinger QQ交流群 907879266
71
 
72
- 在线推理限制为总时长小于2分钟,且单个切片时长小于30s,有更大需求请下载本仓库或github仓库代码运行ds_inference.py进行本地推理
73
  """)
74
  sid = gr.Dropdown(label="音色", choices=["taffy", "otto"], value="taffy")
75
  vc_input3 = gr.TextArea(label="ds工程(json格式)",value='''[
 
41
  ph_dur= [float(i) for i in ph_dur.split(" ")]
42
  f0_seq = [float(i) for i in f0_seq.split(" ")]
43
  dur+=sum(ph_dur)
44
+ print(sum(ph_dur))
45
+ if sum(ph_dur) >20:
46
  flag = True
47
  except:
48
  return "ds工程需要冻结f0和音素参数才能使用此模型合成", None
49
  if flag:
50
+ return "单个切片时长必须小于20s,否则请使用本地推理", None
51
  if dur>120:
52
  return "总时长需要小于2分钟,否则请使用本地推理", None
53
  out_audio = infer_ds(net_g, hps, ds, speaker, vc_transform)
 
70
 
71
  由于此模型是nomidi模型,因此导出ds工程时需要冻结音素和音高参数, 否则会报错,具体DiffSinger工程制作详细问题可以加入DiffSinger QQ交流群 907879266
72
 
73
+ 在线推理限制为总时长小于2分钟,且单个切片时长小于20s,有更大需求请下载本仓库或github仓库代码运行ds_inference.py进行本地推理
74
  """)
75
  sid = gr.Dropdown(label="音色", choices=["taffy", "otto"], value="taffy")
76
  vc_input3 = gr.TextArea(label="ds工程(json格式)",value='''[
infer/__init__.py CHANGED
@@ -112,6 +112,7 @@ def infer_ds(model, hps, ds, speaker, trans):
112
  result = cross_fade(result, seg_audio, current_length + silent_length)
113
  current_length = current_length + silent_length + seg_audio.shape[0]
114
  print("infer time:", time.time() - t1)
 
115
  return result
116
 
117
 
 
112
  result = cross_fade(result, seg_audio, current_length + silent_length)
113
  current_length = current_length + silent_length + seg_audio.shape[0]
114
  print("infer time:", time.time() - t1)
115
+
116
  return result
117
 
118