wanghappy committed on
Commit
7a54974
·
verified ·
1 Parent(s): 544654c

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. config.yaml +62 -0
  2. model_last.pt +3 -0
config.yaml ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataset:
2
+ target_sample_rate: 24000
3
+ n_mel_channels: 100
4
+ hop_length: 256
5
+ win_length: 1024
6
+ n_fft: 1024
7
+ mel_spec_type: vocos
8
+ tokenizer: pinyin
9
+ tokenizer_path: data/HFDatasetNew_pinyin/vocab.txt
10
+ name: /apdcephfs_cq10/share_1297902/user/nenali/project/chukewang/data/Emilia-Dataset
11
+ type: HFDatasetNew
12
+ cache_dir: /apdcephfs_cq10/share_1297902/user/nenali/project/chukewang/data/Emilia-Dataset-Cache
13
+ duration_path: scripts/duration.json
14
+ valid_text_path: scripts/valid.json
15
+ training:
16
+ exp_name: F5TTS_PPG_ONLY
17
+ learning_rate: 7.5e-05
18
+ batch_size_per_gpu: 4096
19
+ batch_size_type: frame
20
+ max_samples: 64
21
+ grad_accumulation_steps: 4
22
+ max_grad_norm: 1.0
23
+ epochs: 11
24
+ num_warmup_updates: 20000
25
+ save_per_updates: 20000
26
+ last_per_steps: 5000
27
+ checkpoint_path: ckpts/ppg_only_cq
28
+ combined_cond_drop_prob:
29
+ - 1
30
+ - 0
31
+ - 0
32
+ - 0
33
+ repeat_space_token: false
34
+ mix_condition: false
35
+ model:
36
+ wandb_resume_id: None
37
+ cls: DiT
38
+ cfg:
39
+ DiT:
40
+ dim: 1024
41
+ depth: 22
42
+ heads: 16
43
+ ff_mult: 2
44
+ text_dim: 512
45
+ conv_layers: 4
46
+ UNetT:
47
+ dim: 1024
48
+ depth: 24
49
+ heads: 16
50
+ ff_mult: 4
51
+ ppg_input: true
52
+ ppg:
53
+ model_path: pretrained_models/ppg/33.pt
54
+ config: pretrained_models/ppg/train.yaml
55
+ frame_length: 20
56
+ mel_frame_shift: 10
57
+ dim: 256
58
+ output_type: map
59
+ map:
60
+ map_mix_ratio: 1.0
61
+ global_phn_center_path: pretrained_models/ppg/7layer_20ms_33pt/phn_center.npy
62
+ para_softmax_path: pretrained_models/ppg/7layer_20ms_33pt/ce_layer.pkl
model_last.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6be869e82a9d23a3130496218a37669981bb6adc1473c8f0d9b242c3f5cdc7cb
3
+ size 5399439861