Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
|
@@ -52,7 +52,7 @@ vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
|
|
| 52 |
target_sample_rate = 24000
|
| 53 |
n_mel_channels = 100
|
| 54 |
hop_length = 256
|
| 55 |
-
target_rms = 0.
|
| 56 |
nfe_step = 8 # 16, 32
|
| 57 |
cfg_strength = 2.0
|
| 58 |
ode_method = "euler"
|
|
@@ -274,13 +274,7 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, cross_fa
|
|
| 274 |
|
| 275 |
if not ref_text.strip():
|
| 276 |
gr.Info("No reference text provided, transcribing reference audio...")
|
| 277 |
-
ref_text =
|
| 278 |
-
ref_audio,
|
| 279 |
-
chunk_length_s=30,
|
| 280 |
-
batch_size=128,
|
| 281 |
-
generate_kwargs={"task": "transcribe"},
|
| 282 |
-
return_timestamps=False,
|
| 283 |
-
)["text"].strip()
|
| 284 |
gr.Info("Finished transcription")
|
| 285 |
else:
|
| 286 |
gr.Info("Using custom reference text...")
|
|
|
|
| 52 |
target_sample_rate = 24000
|
| 53 |
n_mel_channels = 100
|
| 54 |
hop_length = 256
|
| 55 |
+
target_rms = 0.1
|
| 56 |
nfe_step = 8 # 16, 32
|
| 57 |
cfg_strength = 2.0
|
| 58 |
ode_method = "euler"
|
|
|
|
| 274 |
|
| 275 |
if not ref_text.strip():
|
| 276 |
gr.Info("No reference text provided, transcribing reference audio...")
|
| 277 |
+
ref_text = gen_text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 278 |
gr.Info("Finished transcription")
|
| 279 |
else:
|
| 280 |
gr.Info("Using custom reference text...")
|