File size: 499 Bytes
bf277fe |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 |
from dia.model import Dia
# Load the pretrained checkpoint, requesting float16 as the compute dtype.
model = Dia.from_pretrained(
    "nari-labs/Dia-1.6B-0626",
    compute_dtype="float16",
)

# Dialogue script fed to the model. The literal is split across lines via
# implicit concatenation; the resulting string is unchanged.
# NOTE(review): the [S1]/[S2] markers presumably tag alternating speakers and
# "(laughs)" a non-verbal cue -- confirm against the Dia documentation.
text = (
    "[S1] Dia is an open weights text to dialogue model. "
    "[S2] You get full control over scripts and voices. "
    "[S1] Wow. Amazing. (laughs) "
    "[S2] Try it now on Git hub or Hugging Face."
)

# Keyword arguments forwarded verbatim to ``model.generate``.
generation_options = {
    "use_torch_compile": False,
    "verbose": True,
    "cfg_scale": 3.0,
    "temperature": 1.8,
    "top_p": 0.90,
    "cfg_filter_top_k": 50,
}

# Run generation for the script, then hand the result to ``save_audio``
# together with the target file name.
output = model.generate(text, **generation_options)
model.save_audio("simple.mp3", output)
|