rjzevallos committed on
Commit
525f7a1
·
verified ·
1 Parent(s): 1096cef

Upload 2 files

Browse files
Files changed (2) hide show
  1. config.yml +30 -0
  2. token_maps.pkl +3 -0
config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ log_dir: "/gpfs/projects/bsc88/speech/TTS/repos/PL-BERT/checkpoint_es"
2
+ mixed_precision: "fp16"
3
+ data_folder: "/gpfs/projects/bsc88/speech/TTS/repos/PL-BERT/spanish.es.processed_fixed"
4
+ batch_size: 4
5
+ save_interval: 5000
6
+ log_interval: 10
7
+ num_process: 1 # number of GPUs
8
+ num_steps: 1000000
9
+
10
+ dataset_params:
11
+ tokenizer: "transfo-xl-wt103"
12
+ token_separator: " " # token used for phoneme separator (space)
13
+ token_mask: "M" # token used for phoneme mask (M)
14
+ word_separator: 3039 # token used for word separator (<formula>)
15
+ token_maps: "/gpfs/projects/bsc88/speech/TTS/repos/PL-BERT/token_maps_es_new_fix.pkl" # token map path
16
+
17
+ max_mel_length: 512 # max phoneme length
18
+
19
+ word_mask_prob: 0.15 # probability to mask the entire word
20
+ phoneme_mask_prob: 0.1 # probability to mask each phoneme
21
+ replace_prob: 0.2 # probability to replace phonemes
22
+
23
+ model_params:
24
+ vocab_size: 178
25
+ hidden_size: 768
26
+ num_attention_heads: 12
27
+ intermediate_size: 2048
28
+ max_position_embeddings: 512
29
+ num_hidden_layers: 12
30
+ dropout: 0.1
token_maps.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3286cef21241409b420d8ec66201db2ef2411fd314576cd40c6a96a3738579ff
3
+ size 37356904