---
# Training configuration. The paths below point into a PL-BERT checkout and a
# processed Catalan dataset on a shared GPFS project directory.
#
# NOTE(review): this file was reconstructed from a copy in which every line
# carried a stray trailing "|" and all indentation had been stripped. The
# nesting under `dataset_params` and `model_params` is restored from the
# section-header keys; confirm it against the code that loads this file.

# Directory where run output is written (name suggests checkpoints and logs).
log_dir: "/gpfs/projects/bsc88/speech/TTS/repos/PL-BERT/checkpoint_cat"

# Mixed-precision mode string; presumably passed to the training launcher.
mixed_precision: "fp16"

# Location of the preprocessed dataset.
data_folder: "/gpfs/projects/bsc88/speech/TTS/repos/PL-BERT/catalan.cat.processed_fixed"

batch_size: 4

# Presumably measured in training steps, like num_steps - TODO confirm.
save_interval: 5000
log_interval: 10

# NOTE(review): presumably the number of worker processes/devices - confirm.
num_process: 1
num_steps: 1000000

dataset_params:
  tokenizer: "transfo-xl-wt103"

  # A single space character; the quotes are required to keep it a string.
  token_separator: " "
  token_mask: "M"

  # Kept as an integer. Presumably a token id in the tokenizer vocabulary -
  # TODO confirm against the dataset code.
  word_separator: 3039

  # Pickle file holding the token maps.
  token_maps: "/gpfs/projects/bsc88/speech/TTS/repos/PL-BERT/token_maps_cat_new_fix.pkl"

  max_mel_length: 512

  # Masking/replacement probabilities (values in [0, 1]).
  word_mask_prob: 0.15
  phoneme_mask_prob: 0.1
  replace_prob: 0.2

model_params:
  vocab_size: 178
  hidden_size: 768
  num_attention_heads: 12
  intermediate_size: 2048

  # NOTE(review): same value as dataset_params.max_mel_length; presumably the
  # two must stay in sync - confirm.
  max_position_embeddings: 512
  num_hidden_layers: 12
  dropout: 0.1