CypressYang committed on
Commit
7ba8fd2
·
verified ·
1 Parent(s): f8f92e8

Upload songbloom_full_150s_dpo.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. songbloom_full_150s_dpo.yaml +76 -0
songbloom_full_150s_dpo.yaml ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ cfg_file:
2
+ precision: 'bf16-mixed' # supported options: ['16-mixed', 'bf16-mixed']
3
+ min_dur: 60
4
+ max_dur: 150
5
+ sr: 48000
6
+
7
+ pretrained_path: ${dynamic_path:???/songbloom_full_150s_dpo.pt}
8
+ continue_checkpoint:
9
+
10
+ train_dataset:
11
+ lyric_processor: phoneme
12
+ prompt_len: 10
13
+
14
+ vae:
15
+ vae_cfg: ${dynamic_path:???/stable_audio_1920_vae.json}
16
+ vae_ckpt: ${dynamic_path:???/autoencoder_music_dsp1920.ckpt}
17
+ sr: ${sr}
18
+
19
+ model:
20
+ block_size: 16
21
+ latent_dim: 64
22
+ dim: 1536
23
+ num_heads: 24
24
+ lm_layers: 36
25
+ diff_layers: 12
26
+ num_pitch: 16384
27
+ time_cond_type: prepend
28
+ timestep_features_dim: 256
29
+ diffusion_objective: rectified_flow
30
+ timestep_sampler: logit_normal
31
+ backend: llama
32
+ rotary_base_val: 20000
33
+ init_std: 0.02
34
+ h_dropout: 0.05
35
+
36
+ condition_provider_cfg:
37
+ prompt_wav:
38
+ type: audio_tokenizer_wrapper
39
+ output_dim: ${model.dim}
40
+ audio_tokenizer:
41
+ max_len: 250 # 250 = 25.0 (presumably latent frames per second; confirm) * 10 s, cf. prompt_len: 10
42
+ lyrics:
43
+ type: phoneme_tokenizer
44
+ output_dim: ${model.dim}
45
+ vocab_list: ${load_yaml:${dynamic_path:???/vocab_g2p.yaml}}
46
+ max_len: 600
47
+ max_sentence_per_structure: 50
48
+ mode: sum
49
+
50
+
51
+ cfg_dropout: 0.1
52
+ attribute_dropout:
53
+ text:
54
+ lyrics: 0.
55
+ wav:
56
+ prompt_wav: 0.1
57
+
58
+ fuser_cfg:
59
+ cross_attention_pos_emb: false
60
+ cross_attention_pos_emb_scale: 1
61
+ sum: []
62
+ prepend: [lyrics, prompt_wav]
63
+ cross: []
64
+ input_interpolate: []
65
+
66
+
67
+
68
+ inference:
69
+ cfg_coef: 1.5
70
+ temp: 0.9
71
+ diff_temp: 0.95
72
+ top_k: 100
73
+ penalty_repeat: True
74
+ penalty_window: 50
75
+ steps: 36
76
+ dit_cfg_type: h