File size: 1,659 Bytes
461d503
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
{
  "vocoder": {
    "vocoder": {
      "upsample_initial_channel": 1536,
      "resblock": "AMP1",
      "upsample_rates": [
        5,
        2,
        2,
        2,
        2,
        2
      ],
      "resblock_kernel_sizes": [
        3,
        7,
        11
      ],
      "upsample_kernel_sizes": [
        11,
        4,
        4,
        4,
        4,
        4
      ],
      "resblock_dilation_sizes": [
        [
          1,
          3,
          5
        ],
        [
          1,
          3,
          5
        ],
        [
          1,
          3,
          5
        ]
      ],
      "stereo": true,
      "use_tanh_at_final": false,
      "activation": "snakebeta",
      "use_bias_at_final": false
    },
    "bwe": {
      "upsample_initial_channel": 512,
      "resblock": "AMP1",
      "upsample_rates": [
        6,
        5,
        2,
        2,
        2
      ],
      "resblock_kernel_sizes": [
        3,
        7,
        11
      ],
      "upsample_kernel_sizes": [
        12,
        11,
        4,
        4,
        4
      ],
      "resblock_dilation_sizes": [
        [
          1,
          3,
          5
        ],
        [
          1,
          3,
          5
        ],
        [
          1,
          3,
          5
        ]
      ],
      "stereo": true,
      "use_tanh_at_final": false,
      "activation": "snakebeta",
      "use_bias_at_final": false,
      "apply_final_activation": false,
      "input_sampling_rate": 16000,
      "output_sampling_rate": 48000,
      "hop_length": 80,
      "n_fft": 512,
      "win_size": 512,
      "num_mels": 64
    }
  },
  "_class_name": "LTX2Vocoder"
}