model.safetensors.index.json
205.8 KB · 2240 lines · json Raw
1 {
2 "metadata": {
3 "total_size": 9236998676
4 },
5 "weight_map": {
6 "shared.weight": "model-00001-of-00002.safetensors",
7 "speech_encoder.adapter.layers.0.ffn.intermediate_dense.bias": "model-00002-of-00002.safetensors",
8 "speech_encoder.adapter.layers.0.ffn.intermediate_dense.weight": "model-00002-of-00002.safetensors",
9 "speech_encoder.adapter.layers.0.ffn.output_dense.bias": "model-00002-of-00002.safetensors",
10 "speech_encoder.adapter.layers.0.ffn.output_dense.weight": "model-00002-of-00002.safetensors",
11 "speech_encoder.adapter.layers.0.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
12 "speech_encoder.adapter.layers.0.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
13 "speech_encoder.adapter.layers.0.residual_conv.bias": "model-00002-of-00002.safetensors",
14 "speech_encoder.adapter.layers.0.residual_conv.weight": "model-00002-of-00002.safetensors",
15 "speech_encoder.adapter.layers.0.residual_layer_norm.bias": "model-00002-of-00002.safetensors",
16 "speech_encoder.adapter.layers.0.residual_layer_norm.weight": "model-00002-of-00002.safetensors",
17 "speech_encoder.adapter.layers.0.self_attn.linear_k.bias": "model-00002-of-00002.safetensors",
18 "speech_encoder.adapter.layers.0.self_attn.linear_k.weight": "model-00002-of-00002.safetensors",
19 "speech_encoder.adapter.layers.0.self_attn.linear_out.bias": "model-00002-of-00002.safetensors",
20 "speech_encoder.adapter.layers.0.self_attn.linear_out.weight": "model-00002-of-00002.safetensors",
21 "speech_encoder.adapter.layers.0.self_attn.linear_q.bias": "model-00002-of-00002.safetensors",
22 "speech_encoder.adapter.layers.0.self_attn.linear_q.weight": "model-00002-of-00002.safetensors",
23 "speech_encoder.adapter.layers.0.self_attn.linear_v.bias": "model-00002-of-00002.safetensors",
24 "speech_encoder.adapter.layers.0.self_attn.linear_v.weight": "model-00002-of-00002.safetensors",
25 "speech_encoder.adapter.layers.0.self_attn_conv.bias": "model-00002-of-00002.safetensors",
26 "speech_encoder.adapter.layers.0.self_attn_conv.weight": "model-00002-of-00002.safetensors",
27 "speech_encoder.adapter.layers.0.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
28 "speech_encoder.adapter.layers.0.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
29 "speech_encoder.encoder.layer_norm.bias": "model-00002-of-00002.safetensors",
30 "speech_encoder.encoder.layer_norm.weight": "model-00002-of-00002.safetensors",
31 "speech_encoder.encoder.layers.0.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
32 "speech_encoder.encoder.layers.0.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
33 "speech_encoder.encoder.layers.0.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
34 "speech_encoder.encoder.layers.0.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
35 "speech_encoder.encoder.layers.0.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
36 "speech_encoder.encoder.layers.0.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
37 "speech_encoder.encoder.layers.0.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
38 "speech_encoder.encoder.layers.0.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
39 "speech_encoder.encoder.layers.0.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
40 "speech_encoder.encoder.layers.0.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
41 "speech_encoder.encoder.layers.0.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
42 "speech_encoder.encoder.layers.0.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
43 "speech_encoder.encoder.layers.0.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
44 "speech_encoder.encoder.layers.0.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
45 "speech_encoder.encoder.layers.0.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
46 "speech_encoder.encoder.layers.0.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
47 "speech_encoder.encoder.layers.0.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
48 "speech_encoder.encoder.layers.0.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
49 "speech_encoder.encoder.layers.0.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
50 "speech_encoder.encoder.layers.0.final_layer_norm.bias": "model-00001-of-00002.safetensors",
51 "speech_encoder.encoder.layers.0.final_layer_norm.weight": "model-00001-of-00002.safetensors",
52 "speech_encoder.encoder.layers.0.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
53 "speech_encoder.encoder.layers.0.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
54 "speech_encoder.encoder.layers.0.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
55 "speech_encoder.encoder.layers.0.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
56 "speech_encoder.encoder.layers.0.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
57 "speech_encoder.encoder.layers.0.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
58 "speech_encoder.encoder.layers.0.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
59 "speech_encoder.encoder.layers.0.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
60 "speech_encoder.encoder.layers.0.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
61 "speech_encoder.encoder.layers.0.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
62 "speech_encoder.encoder.layers.0.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
63 "speech_encoder.encoder.layers.1.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
64 "speech_encoder.encoder.layers.1.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
65 "speech_encoder.encoder.layers.1.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
66 "speech_encoder.encoder.layers.1.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
67 "speech_encoder.encoder.layers.1.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
68 "speech_encoder.encoder.layers.1.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
69 "speech_encoder.encoder.layers.1.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
70 "speech_encoder.encoder.layers.1.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
71 "speech_encoder.encoder.layers.1.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
72 "speech_encoder.encoder.layers.1.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
73 "speech_encoder.encoder.layers.1.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
74 "speech_encoder.encoder.layers.1.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
75 "speech_encoder.encoder.layers.1.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
76 "speech_encoder.encoder.layers.1.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
77 "speech_encoder.encoder.layers.1.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
78 "speech_encoder.encoder.layers.1.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
79 "speech_encoder.encoder.layers.1.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
80 "speech_encoder.encoder.layers.1.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
81 "speech_encoder.encoder.layers.1.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
82 "speech_encoder.encoder.layers.1.final_layer_norm.bias": "model-00001-of-00002.safetensors",
83 "speech_encoder.encoder.layers.1.final_layer_norm.weight": "model-00001-of-00002.safetensors",
84 "speech_encoder.encoder.layers.1.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
85 "speech_encoder.encoder.layers.1.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
86 "speech_encoder.encoder.layers.1.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
87 "speech_encoder.encoder.layers.1.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
88 "speech_encoder.encoder.layers.1.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
89 "speech_encoder.encoder.layers.1.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
90 "speech_encoder.encoder.layers.1.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
91 "speech_encoder.encoder.layers.1.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
92 "speech_encoder.encoder.layers.1.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
93 "speech_encoder.encoder.layers.1.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
94 "speech_encoder.encoder.layers.1.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
95 "speech_encoder.encoder.layers.10.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
96 "speech_encoder.encoder.layers.10.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
97 "speech_encoder.encoder.layers.10.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
98 "speech_encoder.encoder.layers.10.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
99 "speech_encoder.encoder.layers.10.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
100 "speech_encoder.encoder.layers.10.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
101 "speech_encoder.encoder.layers.10.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
102 "speech_encoder.encoder.layers.10.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
103 "speech_encoder.encoder.layers.10.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
104 "speech_encoder.encoder.layers.10.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
105 "speech_encoder.encoder.layers.10.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
106 "speech_encoder.encoder.layers.10.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
107 "speech_encoder.encoder.layers.10.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
108 "speech_encoder.encoder.layers.10.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
109 "speech_encoder.encoder.layers.10.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
110 "speech_encoder.encoder.layers.10.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
111 "speech_encoder.encoder.layers.10.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
112 "speech_encoder.encoder.layers.10.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
113 "speech_encoder.encoder.layers.10.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
114 "speech_encoder.encoder.layers.10.final_layer_norm.bias": "model-00001-of-00002.safetensors",
115 "speech_encoder.encoder.layers.10.final_layer_norm.weight": "model-00001-of-00002.safetensors",
116 "speech_encoder.encoder.layers.10.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
117 "speech_encoder.encoder.layers.10.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
118 "speech_encoder.encoder.layers.10.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
119 "speech_encoder.encoder.layers.10.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
120 "speech_encoder.encoder.layers.10.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
121 "speech_encoder.encoder.layers.10.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
122 "speech_encoder.encoder.layers.10.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
123 "speech_encoder.encoder.layers.10.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
124 "speech_encoder.encoder.layers.10.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
125 "speech_encoder.encoder.layers.10.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
126 "speech_encoder.encoder.layers.10.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
127 "speech_encoder.encoder.layers.11.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
128 "speech_encoder.encoder.layers.11.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
129 "speech_encoder.encoder.layers.11.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
130 "speech_encoder.encoder.layers.11.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
131 "speech_encoder.encoder.layers.11.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
132 "speech_encoder.encoder.layers.11.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
133 "speech_encoder.encoder.layers.11.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
134 "speech_encoder.encoder.layers.11.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
135 "speech_encoder.encoder.layers.11.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
136 "speech_encoder.encoder.layers.11.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
137 "speech_encoder.encoder.layers.11.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
138 "speech_encoder.encoder.layers.11.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
139 "speech_encoder.encoder.layers.11.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
140 "speech_encoder.encoder.layers.11.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
141 "speech_encoder.encoder.layers.11.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
142 "speech_encoder.encoder.layers.11.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
143 "speech_encoder.encoder.layers.11.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
144 "speech_encoder.encoder.layers.11.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
145 "speech_encoder.encoder.layers.11.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
146 "speech_encoder.encoder.layers.11.final_layer_norm.bias": "model-00001-of-00002.safetensors",
147 "speech_encoder.encoder.layers.11.final_layer_norm.weight": "model-00001-of-00002.safetensors",
148 "speech_encoder.encoder.layers.11.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
149 "speech_encoder.encoder.layers.11.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
150 "speech_encoder.encoder.layers.11.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
151 "speech_encoder.encoder.layers.11.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
152 "speech_encoder.encoder.layers.11.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
153 "speech_encoder.encoder.layers.11.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
154 "speech_encoder.encoder.layers.11.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
155 "speech_encoder.encoder.layers.11.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
156 "speech_encoder.encoder.layers.11.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
157 "speech_encoder.encoder.layers.11.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
158 "speech_encoder.encoder.layers.11.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
159 "speech_encoder.encoder.layers.12.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
160 "speech_encoder.encoder.layers.12.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
161 "speech_encoder.encoder.layers.12.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
162 "speech_encoder.encoder.layers.12.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
163 "speech_encoder.encoder.layers.12.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
164 "speech_encoder.encoder.layers.12.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
165 "speech_encoder.encoder.layers.12.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
166 "speech_encoder.encoder.layers.12.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
167 "speech_encoder.encoder.layers.12.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
168 "speech_encoder.encoder.layers.12.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
169 "speech_encoder.encoder.layers.12.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
170 "speech_encoder.encoder.layers.12.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
171 "speech_encoder.encoder.layers.12.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
172 "speech_encoder.encoder.layers.12.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
173 "speech_encoder.encoder.layers.12.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
174 "speech_encoder.encoder.layers.12.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
175 "speech_encoder.encoder.layers.12.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
176 "speech_encoder.encoder.layers.12.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
177 "speech_encoder.encoder.layers.12.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
178 "speech_encoder.encoder.layers.12.final_layer_norm.bias": "model-00001-of-00002.safetensors",
179 "speech_encoder.encoder.layers.12.final_layer_norm.weight": "model-00001-of-00002.safetensors",
180 "speech_encoder.encoder.layers.12.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
181 "speech_encoder.encoder.layers.12.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
182 "speech_encoder.encoder.layers.12.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
183 "speech_encoder.encoder.layers.12.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
184 "speech_encoder.encoder.layers.12.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
185 "speech_encoder.encoder.layers.12.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
186 "speech_encoder.encoder.layers.12.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
187 "speech_encoder.encoder.layers.12.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
188 "speech_encoder.encoder.layers.12.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
189 "speech_encoder.encoder.layers.12.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
190 "speech_encoder.encoder.layers.12.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
191 "speech_encoder.encoder.layers.13.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
192 "speech_encoder.encoder.layers.13.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
193 "speech_encoder.encoder.layers.13.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
194 "speech_encoder.encoder.layers.13.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
195 "speech_encoder.encoder.layers.13.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
196 "speech_encoder.encoder.layers.13.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
197 "speech_encoder.encoder.layers.13.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
198 "speech_encoder.encoder.layers.13.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
199 "speech_encoder.encoder.layers.13.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
200 "speech_encoder.encoder.layers.13.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
201 "speech_encoder.encoder.layers.13.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
202 "speech_encoder.encoder.layers.13.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
203 "speech_encoder.encoder.layers.13.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
204 "speech_encoder.encoder.layers.13.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
205 "speech_encoder.encoder.layers.13.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
206 "speech_encoder.encoder.layers.13.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
207 "speech_encoder.encoder.layers.13.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
208 "speech_encoder.encoder.layers.13.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
209 "speech_encoder.encoder.layers.13.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
210 "speech_encoder.encoder.layers.13.final_layer_norm.bias": "model-00001-of-00002.safetensors",
211 "speech_encoder.encoder.layers.13.final_layer_norm.weight": "model-00001-of-00002.safetensors",
212 "speech_encoder.encoder.layers.13.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
213 "speech_encoder.encoder.layers.13.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
214 "speech_encoder.encoder.layers.13.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
215 "speech_encoder.encoder.layers.13.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
216 "speech_encoder.encoder.layers.13.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
217 "speech_encoder.encoder.layers.13.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
218 "speech_encoder.encoder.layers.13.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
219 "speech_encoder.encoder.layers.13.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
220 "speech_encoder.encoder.layers.13.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
221 "speech_encoder.encoder.layers.13.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
222 "speech_encoder.encoder.layers.13.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
223 "speech_encoder.encoder.layers.14.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
224 "speech_encoder.encoder.layers.14.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
225 "speech_encoder.encoder.layers.14.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
226 "speech_encoder.encoder.layers.14.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
227 "speech_encoder.encoder.layers.14.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
228 "speech_encoder.encoder.layers.14.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
229 "speech_encoder.encoder.layers.14.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
230 "speech_encoder.encoder.layers.14.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
231 "speech_encoder.encoder.layers.14.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
232 "speech_encoder.encoder.layers.14.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
233 "speech_encoder.encoder.layers.14.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
234 "speech_encoder.encoder.layers.14.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
235 "speech_encoder.encoder.layers.14.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
236 "speech_encoder.encoder.layers.14.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
237 "speech_encoder.encoder.layers.14.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
238 "speech_encoder.encoder.layers.14.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
239 "speech_encoder.encoder.layers.14.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
240 "speech_encoder.encoder.layers.14.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
241 "speech_encoder.encoder.layers.14.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
242 "speech_encoder.encoder.layers.14.final_layer_norm.bias": "model-00001-of-00002.safetensors",
243 "speech_encoder.encoder.layers.14.final_layer_norm.weight": "model-00001-of-00002.safetensors",
244 "speech_encoder.encoder.layers.14.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
245 "speech_encoder.encoder.layers.14.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
246 "speech_encoder.encoder.layers.14.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
247 "speech_encoder.encoder.layers.14.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
248 "speech_encoder.encoder.layers.14.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
249 "speech_encoder.encoder.layers.14.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
250 "speech_encoder.encoder.layers.14.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
251 "speech_encoder.encoder.layers.14.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
252 "speech_encoder.encoder.layers.14.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
253 "speech_encoder.encoder.layers.14.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
254 "speech_encoder.encoder.layers.14.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
255 "speech_encoder.encoder.layers.15.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
256 "speech_encoder.encoder.layers.15.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
257 "speech_encoder.encoder.layers.15.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
258 "speech_encoder.encoder.layers.15.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
259 "speech_encoder.encoder.layers.15.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
260 "speech_encoder.encoder.layers.15.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
261 "speech_encoder.encoder.layers.15.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
262 "speech_encoder.encoder.layers.15.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
263 "speech_encoder.encoder.layers.15.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
264 "speech_encoder.encoder.layers.15.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
265 "speech_encoder.encoder.layers.15.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
266 "speech_encoder.encoder.layers.15.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
267 "speech_encoder.encoder.layers.15.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
268 "speech_encoder.encoder.layers.15.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
269 "speech_encoder.encoder.layers.15.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
270 "speech_encoder.encoder.layers.15.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
271 "speech_encoder.encoder.layers.15.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
272 "speech_encoder.encoder.layers.15.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
273 "speech_encoder.encoder.layers.15.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
274 "speech_encoder.encoder.layers.15.final_layer_norm.bias": "model-00001-of-00002.safetensors",
275 "speech_encoder.encoder.layers.15.final_layer_norm.weight": "model-00001-of-00002.safetensors",
276 "speech_encoder.encoder.layers.15.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
277 "speech_encoder.encoder.layers.15.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
278 "speech_encoder.encoder.layers.15.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
279 "speech_encoder.encoder.layers.15.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
280 "speech_encoder.encoder.layers.15.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
281 "speech_encoder.encoder.layers.15.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
282 "speech_encoder.encoder.layers.15.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
283 "speech_encoder.encoder.layers.15.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
284 "speech_encoder.encoder.layers.15.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
285 "speech_encoder.encoder.layers.15.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
286 "speech_encoder.encoder.layers.15.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
287 "speech_encoder.encoder.layers.16.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
288 "speech_encoder.encoder.layers.16.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
289 "speech_encoder.encoder.layers.16.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
290 "speech_encoder.encoder.layers.16.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
291 "speech_encoder.encoder.layers.16.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
292 "speech_encoder.encoder.layers.16.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
293 "speech_encoder.encoder.layers.16.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
294 "speech_encoder.encoder.layers.16.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
295 "speech_encoder.encoder.layers.16.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
296 "speech_encoder.encoder.layers.16.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
297 "speech_encoder.encoder.layers.16.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
298 "speech_encoder.encoder.layers.16.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
299 "speech_encoder.encoder.layers.16.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
300 "speech_encoder.encoder.layers.16.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
301 "speech_encoder.encoder.layers.16.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
302 "speech_encoder.encoder.layers.16.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
303 "speech_encoder.encoder.layers.16.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
304 "speech_encoder.encoder.layers.16.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
305 "speech_encoder.encoder.layers.16.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
306 "speech_encoder.encoder.layers.16.final_layer_norm.bias": "model-00001-of-00002.safetensors",
307 "speech_encoder.encoder.layers.16.final_layer_norm.weight": "model-00001-of-00002.safetensors",
308 "speech_encoder.encoder.layers.16.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
309 "speech_encoder.encoder.layers.16.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
310 "speech_encoder.encoder.layers.16.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
311 "speech_encoder.encoder.layers.16.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
312 "speech_encoder.encoder.layers.16.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
313 "speech_encoder.encoder.layers.16.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
314 "speech_encoder.encoder.layers.16.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
315 "speech_encoder.encoder.layers.16.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
316 "speech_encoder.encoder.layers.16.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
317 "speech_encoder.encoder.layers.16.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
318 "speech_encoder.encoder.layers.16.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
319 "speech_encoder.encoder.layers.17.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
320 "speech_encoder.encoder.layers.17.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
321 "speech_encoder.encoder.layers.17.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
322 "speech_encoder.encoder.layers.17.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
323 "speech_encoder.encoder.layers.17.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
324 "speech_encoder.encoder.layers.17.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
325 "speech_encoder.encoder.layers.17.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
326 "speech_encoder.encoder.layers.17.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
327 "speech_encoder.encoder.layers.17.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
328 "speech_encoder.encoder.layers.17.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
329 "speech_encoder.encoder.layers.17.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
330 "speech_encoder.encoder.layers.17.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
331 "speech_encoder.encoder.layers.17.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
332 "speech_encoder.encoder.layers.17.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
333 "speech_encoder.encoder.layers.17.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
334 "speech_encoder.encoder.layers.17.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
335 "speech_encoder.encoder.layers.17.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
336 "speech_encoder.encoder.layers.17.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
337 "speech_encoder.encoder.layers.17.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
338 "speech_encoder.encoder.layers.17.final_layer_norm.bias": "model-00001-of-00002.safetensors",
339 "speech_encoder.encoder.layers.17.final_layer_norm.weight": "model-00001-of-00002.safetensors",
340 "speech_encoder.encoder.layers.17.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
341 "speech_encoder.encoder.layers.17.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
342 "speech_encoder.encoder.layers.17.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
343 "speech_encoder.encoder.layers.17.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
344 "speech_encoder.encoder.layers.17.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
345 "speech_encoder.encoder.layers.17.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
346 "speech_encoder.encoder.layers.17.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
347 "speech_encoder.encoder.layers.17.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
348 "speech_encoder.encoder.layers.17.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
349 "speech_encoder.encoder.layers.17.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
350 "speech_encoder.encoder.layers.17.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
351 "speech_encoder.encoder.layers.18.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
352 "speech_encoder.encoder.layers.18.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
353 "speech_encoder.encoder.layers.18.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
354 "speech_encoder.encoder.layers.18.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
355 "speech_encoder.encoder.layers.18.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
356 "speech_encoder.encoder.layers.18.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
357 "speech_encoder.encoder.layers.18.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
358 "speech_encoder.encoder.layers.18.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
359 "speech_encoder.encoder.layers.18.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
360 "speech_encoder.encoder.layers.18.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
361 "speech_encoder.encoder.layers.18.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
362 "speech_encoder.encoder.layers.18.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
363 "speech_encoder.encoder.layers.18.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
364 "speech_encoder.encoder.layers.18.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
365 "speech_encoder.encoder.layers.18.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
366 "speech_encoder.encoder.layers.18.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
367 "speech_encoder.encoder.layers.18.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
368 "speech_encoder.encoder.layers.18.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
369 "speech_encoder.encoder.layers.18.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
370 "speech_encoder.encoder.layers.18.final_layer_norm.bias": "model-00001-of-00002.safetensors",
371 "speech_encoder.encoder.layers.18.final_layer_norm.weight": "model-00001-of-00002.safetensors",
372 "speech_encoder.encoder.layers.18.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
373 "speech_encoder.encoder.layers.18.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
374 "speech_encoder.encoder.layers.18.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
375 "speech_encoder.encoder.layers.18.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
376 "speech_encoder.encoder.layers.18.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
377 "speech_encoder.encoder.layers.18.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
378 "speech_encoder.encoder.layers.18.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
379 "speech_encoder.encoder.layers.18.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
380 "speech_encoder.encoder.layers.18.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
381 "speech_encoder.encoder.layers.18.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
382 "speech_encoder.encoder.layers.18.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
383 "speech_encoder.encoder.layers.19.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
384 "speech_encoder.encoder.layers.19.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
385 "speech_encoder.encoder.layers.19.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
386 "speech_encoder.encoder.layers.19.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
387 "speech_encoder.encoder.layers.19.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
388 "speech_encoder.encoder.layers.19.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
389 "speech_encoder.encoder.layers.19.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
390 "speech_encoder.encoder.layers.19.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
391 "speech_encoder.encoder.layers.19.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
392 "speech_encoder.encoder.layers.19.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
393 "speech_encoder.encoder.layers.19.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
394 "speech_encoder.encoder.layers.19.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
395 "speech_encoder.encoder.layers.19.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
396 "speech_encoder.encoder.layers.19.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
397 "speech_encoder.encoder.layers.19.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
398 "speech_encoder.encoder.layers.19.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
399 "speech_encoder.encoder.layers.19.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
400 "speech_encoder.encoder.layers.19.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
401 "speech_encoder.encoder.layers.19.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
402 "speech_encoder.encoder.layers.19.final_layer_norm.bias": "model-00001-of-00002.safetensors",
403 "speech_encoder.encoder.layers.19.final_layer_norm.weight": "model-00001-of-00002.safetensors",
404 "speech_encoder.encoder.layers.19.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
405 "speech_encoder.encoder.layers.19.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
406 "speech_encoder.encoder.layers.19.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
407 "speech_encoder.encoder.layers.19.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
408 "speech_encoder.encoder.layers.19.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
409 "speech_encoder.encoder.layers.19.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
410 "speech_encoder.encoder.layers.19.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
411 "speech_encoder.encoder.layers.19.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
412 "speech_encoder.encoder.layers.19.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
413 "speech_encoder.encoder.layers.19.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
414 "speech_encoder.encoder.layers.19.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
415 "speech_encoder.encoder.layers.2.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
416 "speech_encoder.encoder.layers.2.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
417 "speech_encoder.encoder.layers.2.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
418 "speech_encoder.encoder.layers.2.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
419 "speech_encoder.encoder.layers.2.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
420 "speech_encoder.encoder.layers.2.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
421 "speech_encoder.encoder.layers.2.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
422 "speech_encoder.encoder.layers.2.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
423 "speech_encoder.encoder.layers.2.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
424 "speech_encoder.encoder.layers.2.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
425 "speech_encoder.encoder.layers.2.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
426 "speech_encoder.encoder.layers.2.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
427 "speech_encoder.encoder.layers.2.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
428 "speech_encoder.encoder.layers.2.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
429 "speech_encoder.encoder.layers.2.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
430 "speech_encoder.encoder.layers.2.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
431 "speech_encoder.encoder.layers.2.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
432 "speech_encoder.encoder.layers.2.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
433 "speech_encoder.encoder.layers.2.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
434 "speech_encoder.encoder.layers.2.final_layer_norm.bias": "model-00001-of-00002.safetensors",
435 "speech_encoder.encoder.layers.2.final_layer_norm.weight": "model-00001-of-00002.safetensors",
436 "speech_encoder.encoder.layers.2.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
437 "speech_encoder.encoder.layers.2.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
438 "speech_encoder.encoder.layers.2.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
439 "speech_encoder.encoder.layers.2.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
440 "speech_encoder.encoder.layers.2.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
441 "speech_encoder.encoder.layers.2.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
442 "speech_encoder.encoder.layers.2.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
443 "speech_encoder.encoder.layers.2.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
444 "speech_encoder.encoder.layers.2.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
445 "speech_encoder.encoder.layers.2.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
446 "speech_encoder.encoder.layers.2.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
447 "speech_encoder.encoder.layers.20.conv_module.depthwise_conv.weight": "model-00002-of-00002.safetensors",
448 "speech_encoder.encoder.layers.20.conv_module.depthwise_layer_norm.bias": "model-00002-of-00002.safetensors",
449 "speech_encoder.encoder.layers.20.conv_module.depthwise_layer_norm.weight": "model-00002-of-00002.safetensors",
450 "speech_encoder.encoder.layers.20.conv_module.layer_norm.bias": "model-00002-of-00002.safetensors",
451 "speech_encoder.encoder.layers.20.conv_module.layer_norm.weight": "model-00002-of-00002.safetensors",
452 "speech_encoder.encoder.layers.20.conv_module.pointwise_conv1.weight": "model-00002-of-00002.safetensors",
453 "speech_encoder.encoder.layers.20.conv_module.pointwise_conv2.weight": "model-00002-of-00002.safetensors",
454 "speech_encoder.encoder.layers.20.ffn1.intermediate_dense.bias": "model-00002-of-00002.safetensors",
455 "speech_encoder.encoder.layers.20.ffn1.intermediate_dense.weight": "model-00002-of-00002.safetensors",
456 "speech_encoder.encoder.layers.20.ffn1.output_dense.bias": "model-00002-of-00002.safetensors",
457 "speech_encoder.encoder.layers.20.ffn1.output_dense.weight": "model-00002-of-00002.safetensors",
458 "speech_encoder.encoder.layers.20.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
459 "speech_encoder.encoder.layers.20.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
460 "speech_encoder.encoder.layers.20.ffn2.intermediate_dense.bias": "model-00002-of-00002.safetensors",
461 "speech_encoder.encoder.layers.20.ffn2.intermediate_dense.weight": "model-00002-of-00002.safetensors",
462 "speech_encoder.encoder.layers.20.ffn2.output_dense.bias": "model-00002-of-00002.safetensors",
463 "speech_encoder.encoder.layers.20.ffn2.output_dense.weight": "model-00002-of-00002.safetensors",
464 "speech_encoder.encoder.layers.20.ffn2_layer_norm.bias": "model-00002-of-00002.safetensors",
465 "speech_encoder.encoder.layers.20.ffn2_layer_norm.weight": "model-00002-of-00002.safetensors",
466 "speech_encoder.encoder.layers.20.final_layer_norm.bias": "model-00002-of-00002.safetensors",
467 "speech_encoder.encoder.layers.20.final_layer_norm.weight": "model-00002-of-00002.safetensors",
468 "speech_encoder.encoder.layers.20.self_attn.distance_embedding.weight": "model-00002-of-00002.safetensors",
469 "speech_encoder.encoder.layers.20.self_attn.linear_k.bias": "model-00002-of-00002.safetensors",
470 "speech_encoder.encoder.layers.20.self_attn.linear_k.weight": "model-00002-of-00002.safetensors",
471 "speech_encoder.encoder.layers.20.self_attn.linear_out.bias": "model-00002-of-00002.safetensors",
472 "speech_encoder.encoder.layers.20.self_attn.linear_out.weight": "model-00002-of-00002.safetensors",
473 "speech_encoder.encoder.layers.20.self_attn.linear_q.bias": "model-00002-of-00002.safetensors",
474 "speech_encoder.encoder.layers.20.self_attn.linear_q.weight": "model-00002-of-00002.safetensors",
475 "speech_encoder.encoder.layers.20.self_attn.linear_v.bias": "model-00002-of-00002.safetensors",
476 "speech_encoder.encoder.layers.20.self_attn.linear_v.weight": "model-00002-of-00002.safetensors",
477 "speech_encoder.encoder.layers.20.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
478 "speech_encoder.encoder.layers.20.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
479 "speech_encoder.encoder.layers.21.conv_module.depthwise_conv.weight": "model-00002-of-00002.safetensors",
480 "speech_encoder.encoder.layers.21.conv_module.depthwise_layer_norm.bias": "model-00002-of-00002.safetensors",
481 "speech_encoder.encoder.layers.21.conv_module.depthwise_layer_norm.weight": "model-00002-of-00002.safetensors",
482 "speech_encoder.encoder.layers.21.conv_module.layer_norm.bias": "model-00002-of-00002.safetensors",
483 "speech_encoder.encoder.layers.21.conv_module.layer_norm.weight": "model-00002-of-00002.safetensors",
484 "speech_encoder.encoder.layers.21.conv_module.pointwise_conv1.weight": "model-00002-of-00002.safetensors",
485 "speech_encoder.encoder.layers.21.conv_module.pointwise_conv2.weight": "model-00002-of-00002.safetensors",
486 "speech_encoder.encoder.layers.21.ffn1.intermediate_dense.bias": "model-00002-of-00002.safetensors",
487 "speech_encoder.encoder.layers.21.ffn1.intermediate_dense.weight": "model-00002-of-00002.safetensors",
488 "speech_encoder.encoder.layers.21.ffn1.output_dense.bias": "model-00002-of-00002.safetensors",
489 "speech_encoder.encoder.layers.21.ffn1.output_dense.weight": "model-00002-of-00002.safetensors",
490 "speech_encoder.encoder.layers.21.ffn1_layer_norm.bias": "model-00002-of-00002.safetensors",
491 "speech_encoder.encoder.layers.21.ffn1_layer_norm.weight": "model-00002-of-00002.safetensors",
492 "speech_encoder.encoder.layers.21.ffn2.intermediate_dense.bias": "model-00002-of-00002.safetensors",
493 "speech_encoder.encoder.layers.21.ffn2.intermediate_dense.weight": "model-00002-of-00002.safetensors",
494 "speech_encoder.encoder.layers.21.ffn2.output_dense.bias": "model-00002-of-00002.safetensors",
495 "speech_encoder.encoder.layers.21.ffn2.output_dense.weight": "model-00002-of-00002.safetensors",
496 "speech_encoder.encoder.layers.21.ffn2_layer_norm.bias": "model-00002-of-00002.safetensors",
497 "speech_encoder.encoder.layers.21.ffn2_layer_norm.weight": "model-00002-of-00002.safetensors",
498 "speech_encoder.encoder.layers.21.final_layer_norm.bias": "model-00002-of-00002.safetensors",
499 "speech_encoder.encoder.layers.21.final_layer_norm.weight": "model-00002-of-00002.safetensors",
500 "speech_encoder.encoder.layers.21.self_attn.distance_embedding.weight": "model-00002-of-00002.safetensors",
501 "speech_encoder.encoder.layers.21.self_attn.linear_k.bias": "model-00002-of-00002.safetensors",
502 "speech_encoder.encoder.layers.21.self_attn.linear_k.weight": "model-00002-of-00002.safetensors",
503 "speech_encoder.encoder.layers.21.self_attn.linear_out.bias": "model-00002-of-00002.safetensors",
504 "speech_encoder.encoder.layers.21.self_attn.linear_out.weight": "model-00002-of-00002.safetensors",
505 "speech_encoder.encoder.layers.21.self_attn.linear_q.bias": "model-00002-of-00002.safetensors",
506 "speech_encoder.encoder.layers.21.self_attn.linear_q.weight": "model-00002-of-00002.safetensors",
507 "speech_encoder.encoder.layers.21.self_attn.linear_v.bias": "model-00002-of-00002.safetensors",
508 "speech_encoder.encoder.layers.21.self_attn.linear_v.weight": "model-00002-of-00002.safetensors",
509 "speech_encoder.encoder.layers.21.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
510 "speech_encoder.encoder.layers.21.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
511 "speech_encoder.encoder.layers.22.conv_module.depthwise_conv.weight": "model-00002-of-00002.safetensors",
512 "speech_encoder.encoder.layers.22.conv_module.depthwise_layer_norm.bias": "model-00002-of-00002.safetensors",
513 "speech_encoder.encoder.layers.22.conv_module.depthwise_layer_norm.weight": "model-00002-of-00002.safetensors",
514 "speech_encoder.encoder.layers.22.conv_module.layer_norm.bias": "model-00002-of-00002.safetensors",
515 "speech_encoder.encoder.layers.22.conv_module.layer_norm.weight": "model-00002-of-00002.safetensors",
516 "speech_encoder.encoder.layers.22.conv_module.pointwise_conv1.weight": "model-00002-of-00002.safetensors",
517 "speech_encoder.encoder.layers.22.conv_module.pointwise_conv2.weight": "model-00002-of-00002.safetensors",
518 "speech_encoder.encoder.layers.22.ffn1.intermediate_dense.bias": "model-00002-of-00002.safetensors",
519 "speech_encoder.encoder.layers.22.ffn1.intermediate_dense.weight": "model-00002-of-00002.safetensors",
520 "speech_encoder.encoder.layers.22.ffn1.output_dense.bias": "model-00002-of-00002.safetensors",
521 "speech_encoder.encoder.layers.22.ffn1.output_dense.weight": "model-00002-of-00002.safetensors",
522 "speech_encoder.encoder.layers.22.ffn1_layer_norm.bias": "model-00002-of-00002.safetensors",
523 "speech_encoder.encoder.layers.22.ffn1_layer_norm.weight": "model-00002-of-00002.safetensors",
524 "speech_encoder.encoder.layers.22.ffn2.intermediate_dense.bias": "model-00002-of-00002.safetensors",
525 "speech_encoder.encoder.layers.22.ffn2.intermediate_dense.weight": "model-00002-of-00002.safetensors",
526 "speech_encoder.encoder.layers.22.ffn2.output_dense.bias": "model-00002-of-00002.safetensors",
527 "speech_encoder.encoder.layers.22.ffn2.output_dense.weight": "model-00002-of-00002.safetensors",
528 "speech_encoder.encoder.layers.22.ffn2_layer_norm.bias": "model-00002-of-00002.safetensors",
529 "speech_encoder.encoder.layers.22.ffn2_layer_norm.weight": "model-00002-of-00002.safetensors",
530 "speech_encoder.encoder.layers.22.final_layer_norm.bias": "model-00002-of-00002.safetensors",
531 "speech_encoder.encoder.layers.22.final_layer_norm.weight": "model-00002-of-00002.safetensors",
532 "speech_encoder.encoder.layers.22.self_attn.distance_embedding.weight": "model-00002-of-00002.safetensors",
533 "speech_encoder.encoder.layers.22.self_attn.linear_k.bias": "model-00002-of-00002.safetensors",
534 "speech_encoder.encoder.layers.22.self_attn.linear_k.weight": "model-00002-of-00002.safetensors",
535 "speech_encoder.encoder.layers.22.self_attn.linear_out.bias": "model-00002-of-00002.safetensors",
536 "speech_encoder.encoder.layers.22.self_attn.linear_out.weight": "model-00002-of-00002.safetensors",
537 "speech_encoder.encoder.layers.22.self_attn.linear_q.bias": "model-00002-of-00002.safetensors",
538 "speech_encoder.encoder.layers.22.self_attn.linear_q.weight": "model-00002-of-00002.safetensors",
539 "speech_encoder.encoder.layers.22.self_attn.linear_v.bias": "model-00002-of-00002.safetensors",
540 "speech_encoder.encoder.layers.22.self_attn.linear_v.weight": "model-00002-of-00002.safetensors",
541 "speech_encoder.encoder.layers.22.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
542 "speech_encoder.encoder.layers.22.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
543 "speech_encoder.encoder.layers.23.conv_module.depthwise_conv.weight": "model-00002-of-00002.safetensors",
544 "speech_encoder.encoder.layers.23.conv_module.depthwise_layer_norm.bias": "model-00002-of-00002.safetensors",
545 "speech_encoder.encoder.layers.23.conv_module.depthwise_layer_norm.weight": "model-00002-of-00002.safetensors",
546 "speech_encoder.encoder.layers.23.conv_module.layer_norm.bias": "model-00002-of-00002.safetensors",
547 "speech_encoder.encoder.layers.23.conv_module.layer_norm.weight": "model-00002-of-00002.safetensors",
548 "speech_encoder.encoder.layers.23.conv_module.pointwise_conv1.weight": "model-00002-of-00002.safetensors",
549 "speech_encoder.encoder.layers.23.conv_module.pointwise_conv2.weight": "model-00002-of-00002.safetensors",
550 "speech_encoder.encoder.layers.23.ffn1.intermediate_dense.bias": "model-00002-of-00002.safetensors",
551 "speech_encoder.encoder.layers.23.ffn1.intermediate_dense.weight": "model-00002-of-00002.safetensors",
552 "speech_encoder.encoder.layers.23.ffn1.output_dense.bias": "model-00002-of-00002.safetensors",
553 "speech_encoder.encoder.layers.23.ffn1.output_dense.weight": "model-00002-of-00002.safetensors",
554 "speech_encoder.encoder.layers.23.ffn1_layer_norm.bias": "model-00002-of-00002.safetensors",
555 "speech_encoder.encoder.layers.23.ffn1_layer_norm.weight": "model-00002-of-00002.safetensors",
556 "speech_encoder.encoder.layers.23.ffn2.intermediate_dense.bias": "model-00002-of-00002.safetensors",
557 "speech_encoder.encoder.layers.23.ffn2.intermediate_dense.weight": "model-00002-of-00002.safetensors",
558 "speech_encoder.encoder.layers.23.ffn2.output_dense.bias": "model-00002-of-00002.safetensors",
559 "speech_encoder.encoder.layers.23.ffn2.output_dense.weight": "model-00002-of-00002.safetensors",
560 "speech_encoder.encoder.layers.23.ffn2_layer_norm.bias": "model-00002-of-00002.safetensors",
561 "speech_encoder.encoder.layers.23.ffn2_layer_norm.weight": "model-00002-of-00002.safetensors",
562 "speech_encoder.encoder.layers.23.final_layer_norm.bias": "model-00002-of-00002.safetensors",
563 "speech_encoder.encoder.layers.23.final_layer_norm.weight": "model-00002-of-00002.safetensors",
564 "speech_encoder.encoder.layers.23.self_attn.distance_embedding.weight": "model-00002-of-00002.safetensors",
565 "speech_encoder.encoder.layers.23.self_attn.linear_k.bias": "model-00002-of-00002.safetensors",
566 "speech_encoder.encoder.layers.23.self_attn.linear_k.weight": "model-00002-of-00002.safetensors",
567 "speech_encoder.encoder.layers.23.self_attn.linear_out.bias": "model-00002-of-00002.safetensors",
568 "speech_encoder.encoder.layers.23.self_attn.linear_out.weight": "model-00002-of-00002.safetensors",
569 "speech_encoder.encoder.layers.23.self_attn.linear_q.bias": "model-00002-of-00002.safetensors",
570 "speech_encoder.encoder.layers.23.self_attn.linear_q.weight": "model-00002-of-00002.safetensors",
571 "speech_encoder.encoder.layers.23.self_attn.linear_v.bias": "model-00002-of-00002.safetensors",
572 "speech_encoder.encoder.layers.23.self_attn.linear_v.weight": "model-00002-of-00002.safetensors",
573 "speech_encoder.encoder.layers.23.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
574 "speech_encoder.encoder.layers.23.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
575 "speech_encoder.encoder.layers.3.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
576 "speech_encoder.encoder.layers.3.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
577 "speech_encoder.encoder.layers.3.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
578 "speech_encoder.encoder.layers.3.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
579 "speech_encoder.encoder.layers.3.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
580 "speech_encoder.encoder.layers.3.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
581 "speech_encoder.encoder.layers.3.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
582 "speech_encoder.encoder.layers.3.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
583 "speech_encoder.encoder.layers.3.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
584 "speech_encoder.encoder.layers.3.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
585 "speech_encoder.encoder.layers.3.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
586 "speech_encoder.encoder.layers.3.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
587 "speech_encoder.encoder.layers.3.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
588 "speech_encoder.encoder.layers.3.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
589 "speech_encoder.encoder.layers.3.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
590 "speech_encoder.encoder.layers.3.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
591 "speech_encoder.encoder.layers.3.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
592 "speech_encoder.encoder.layers.3.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
593 "speech_encoder.encoder.layers.3.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
594 "speech_encoder.encoder.layers.3.final_layer_norm.bias": "model-00001-of-00002.safetensors",
595 "speech_encoder.encoder.layers.3.final_layer_norm.weight": "model-00001-of-00002.safetensors",
596 "speech_encoder.encoder.layers.3.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
597 "speech_encoder.encoder.layers.3.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
598 "speech_encoder.encoder.layers.3.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
599 "speech_encoder.encoder.layers.3.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
600 "speech_encoder.encoder.layers.3.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
601 "speech_encoder.encoder.layers.3.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
602 "speech_encoder.encoder.layers.3.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
603 "speech_encoder.encoder.layers.3.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
604 "speech_encoder.encoder.layers.3.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
605 "speech_encoder.encoder.layers.3.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
606 "speech_encoder.encoder.layers.3.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
607 "speech_encoder.encoder.layers.4.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
608 "speech_encoder.encoder.layers.4.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
609 "speech_encoder.encoder.layers.4.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
610 "speech_encoder.encoder.layers.4.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
611 "speech_encoder.encoder.layers.4.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
612 "speech_encoder.encoder.layers.4.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
613 "speech_encoder.encoder.layers.4.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
614 "speech_encoder.encoder.layers.4.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
615 "speech_encoder.encoder.layers.4.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
616 "speech_encoder.encoder.layers.4.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
617 "speech_encoder.encoder.layers.4.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
618 "speech_encoder.encoder.layers.4.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
619 "speech_encoder.encoder.layers.4.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
620 "speech_encoder.encoder.layers.4.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
621 "speech_encoder.encoder.layers.4.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
622 "speech_encoder.encoder.layers.4.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
623 "speech_encoder.encoder.layers.4.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
624 "speech_encoder.encoder.layers.4.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
625 "speech_encoder.encoder.layers.4.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
626 "speech_encoder.encoder.layers.4.final_layer_norm.bias": "model-00001-of-00002.safetensors",
627 "speech_encoder.encoder.layers.4.final_layer_norm.weight": "model-00001-of-00002.safetensors",
628 "speech_encoder.encoder.layers.4.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
629 "speech_encoder.encoder.layers.4.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
630 "speech_encoder.encoder.layers.4.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
631 "speech_encoder.encoder.layers.4.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
632 "speech_encoder.encoder.layers.4.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
633 "speech_encoder.encoder.layers.4.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
634 "speech_encoder.encoder.layers.4.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
635 "speech_encoder.encoder.layers.4.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
636 "speech_encoder.encoder.layers.4.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
637 "speech_encoder.encoder.layers.4.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
638 "speech_encoder.encoder.layers.4.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
639 "speech_encoder.encoder.layers.5.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
640 "speech_encoder.encoder.layers.5.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
641 "speech_encoder.encoder.layers.5.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
642 "speech_encoder.encoder.layers.5.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
643 "speech_encoder.encoder.layers.5.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
644 "speech_encoder.encoder.layers.5.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
645 "speech_encoder.encoder.layers.5.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
646 "speech_encoder.encoder.layers.5.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
647 "speech_encoder.encoder.layers.5.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
648 "speech_encoder.encoder.layers.5.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
649 "speech_encoder.encoder.layers.5.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
650 "speech_encoder.encoder.layers.5.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
651 "speech_encoder.encoder.layers.5.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
652 "speech_encoder.encoder.layers.5.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
653 "speech_encoder.encoder.layers.5.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
654 "speech_encoder.encoder.layers.5.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
655 "speech_encoder.encoder.layers.5.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
656 "speech_encoder.encoder.layers.5.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
657 "speech_encoder.encoder.layers.5.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
658 "speech_encoder.encoder.layers.5.final_layer_norm.bias": "model-00001-of-00002.safetensors",
659 "speech_encoder.encoder.layers.5.final_layer_norm.weight": "model-00001-of-00002.safetensors",
660 "speech_encoder.encoder.layers.5.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
661 "speech_encoder.encoder.layers.5.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
662 "speech_encoder.encoder.layers.5.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
663 "speech_encoder.encoder.layers.5.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
664 "speech_encoder.encoder.layers.5.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
665 "speech_encoder.encoder.layers.5.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
666 "speech_encoder.encoder.layers.5.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
667 "speech_encoder.encoder.layers.5.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
668 "speech_encoder.encoder.layers.5.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
669 "speech_encoder.encoder.layers.5.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
670 "speech_encoder.encoder.layers.5.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
671 "speech_encoder.encoder.layers.6.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
672 "speech_encoder.encoder.layers.6.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
673 "speech_encoder.encoder.layers.6.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
674 "speech_encoder.encoder.layers.6.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
675 "speech_encoder.encoder.layers.6.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
676 "speech_encoder.encoder.layers.6.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
677 "speech_encoder.encoder.layers.6.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
678 "speech_encoder.encoder.layers.6.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
679 "speech_encoder.encoder.layers.6.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
680 "speech_encoder.encoder.layers.6.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
681 "speech_encoder.encoder.layers.6.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
682 "speech_encoder.encoder.layers.6.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
683 "speech_encoder.encoder.layers.6.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
684 "speech_encoder.encoder.layers.6.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
685 "speech_encoder.encoder.layers.6.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
686 "speech_encoder.encoder.layers.6.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
687 "speech_encoder.encoder.layers.6.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
688 "speech_encoder.encoder.layers.6.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
689 "speech_encoder.encoder.layers.6.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
690 "speech_encoder.encoder.layers.6.final_layer_norm.bias": "model-00001-of-00002.safetensors",
691 "speech_encoder.encoder.layers.6.final_layer_norm.weight": "model-00001-of-00002.safetensors",
692 "speech_encoder.encoder.layers.6.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
693 "speech_encoder.encoder.layers.6.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
694 "speech_encoder.encoder.layers.6.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
695 "speech_encoder.encoder.layers.6.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
696 "speech_encoder.encoder.layers.6.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
697 "speech_encoder.encoder.layers.6.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
698 "speech_encoder.encoder.layers.6.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
699 "speech_encoder.encoder.layers.6.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
700 "speech_encoder.encoder.layers.6.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
701 "speech_encoder.encoder.layers.6.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
702 "speech_encoder.encoder.layers.6.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
703 "speech_encoder.encoder.layers.7.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
704 "speech_encoder.encoder.layers.7.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
705 "speech_encoder.encoder.layers.7.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
706 "speech_encoder.encoder.layers.7.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
707 "speech_encoder.encoder.layers.7.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
708 "speech_encoder.encoder.layers.7.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
709 "speech_encoder.encoder.layers.7.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
710 "speech_encoder.encoder.layers.7.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
711 "speech_encoder.encoder.layers.7.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
712 "speech_encoder.encoder.layers.7.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
713 "speech_encoder.encoder.layers.7.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
714 "speech_encoder.encoder.layers.7.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
715 "speech_encoder.encoder.layers.7.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
716 "speech_encoder.encoder.layers.7.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
717 "speech_encoder.encoder.layers.7.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
718 "speech_encoder.encoder.layers.7.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
719 "speech_encoder.encoder.layers.7.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
720 "speech_encoder.encoder.layers.7.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
721 "speech_encoder.encoder.layers.7.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
722 "speech_encoder.encoder.layers.7.final_layer_norm.bias": "model-00001-of-00002.safetensors",
723 "speech_encoder.encoder.layers.7.final_layer_norm.weight": "model-00001-of-00002.safetensors",
724 "speech_encoder.encoder.layers.7.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
725 "speech_encoder.encoder.layers.7.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
726 "speech_encoder.encoder.layers.7.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
727 "speech_encoder.encoder.layers.7.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
728 "speech_encoder.encoder.layers.7.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
729 "speech_encoder.encoder.layers.7.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
730 "speech_encoder.encoder.layers.7.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
731 "speech_encoder.encoder.layers.7.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
732 "speech_encoder.encoder.layers.7.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
733 "speech_encoder.encoder.layers.7.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
734 "speech_encoder.encoder.layers.7.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
735 "speech_encoder.encoder.layers.8.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
736 "speech_encoder.encoder.layers.8.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
737 "speech_encoder.encoder.layers.8.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
738 "speech_encoder.encoder.layers.8.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
739 "speech_encoder.encoder.layers.8.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
740 "speech_encoder.encoder.layers.8.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
741 "speech_encoder.encoder.layers.8.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
742 "speech_encoder.encoder.layers.8.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
743 "speech_encoder.encoder.layers.8.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
744 "speech_encoder.encoder.layers.8.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
745 "speech_encoder.encoder.layers.8.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
746 "speech_encoder.encoder.layers.8.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
747 "speech_encoder.encoder.layers.8.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
748 "speech_encoder.encoder.layers.8.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
749 "speech_encoder.encoder.layers.8.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
750 "speech_encoder.encoder.layers.8.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
751 "speech_encoder.encoder.layers.8.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
752 "speech_encoder.encoder.layers.8.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
753 "speech_encoder.encoder.layers.8.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
754 "speech_encoder.encoder.layers.8.final_layer_norm.bias": "model-00001-of-00002.safetensors",
755 "speech_encoder.encoder.layers.8.final_layer_norm.weight": "model-00001-of-00002.safetensors",
756 "speech_encoder.encoder.layers.8.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
757 "speech_encoder.encoder.layers.8.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
758 "speech_encoder.encoder.layers.8.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
759 "speech_encoder.encoder.layers.8.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
760 "speech_encoder.encoder.layers.8.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
761 "speech_encoder.encoder.layers.8.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
762 "speech_encoder.encoder.layers.8.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
763 "speech_encoder.encoder.layers.8.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
764 "speech_encoder.encoder.layers.8.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
765 "speech_encoder.encoder.layers.8.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
766 "speech_encoder.encoder.layers.8.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
767 "speech_encoder.encoder.layers.9.conv_module.depthwise_conv.weight": "model-00001-of-00002.safetensors",
768 "speech_encoder.encoder.layers.9.conv_module.depthwise_layer_norm.bias": "model-00001-of-00002.safetensors",
769 "speech_encoder.encoder.layers.9.conv_module.depthwise_layer_norm.weight": "model-00001-of-00002.safetensors",
770 "speech_encoder.encoder.layers.9.conv_module.layer_norm.bias": "model-00001-of-00002.safetensors",
771 "speech_encoder.encoder.layers.9.conv_module.layer_norm.weight": "model-00001-of-00002.safetensors",
772 "speech_encoder.encoder.layers.9.conv_module.pointwise_conv1.weight": "model-00001-of-00002.safetensors",
773 "speech_encoder.encoder.layers.9.conv_module.pointwise_conv2.weight": "model-00001-of-00002.safetensors",
774 "speech_encoder.encoder.layers.9.ffn1.intermediate_dense.bias": "model-00001-of-00002.safetensors",
775 "speech_encoder.encoder.layers.9.ffn1.intermediate_dense.weight": "model-00001-of-00002.safetensors",
776 "speech_encoder.encoder.layers.9.ffn1.output_dense.bias": "model-00001-of-00002.safetensors",
777 "speech_encoder.encoder.layers.9.ffn1.output_dense.weight": "model-00001-of-00002.safetensors",
778 "speech_encoder.encoder.layers.9.ffn1_layer_norm.bias": "model-00001-of-00002.safetensors",
779 "speech_encoder.encoder.layers.9.ffn1_layer_norm.weight": "model-00001-of-00002.safetensors",
780 "speech_encoder.encoder.layers.9.ffn2.intermediate_dense.bias": "model-00001-of-00002.safetensors",
781 "speech_encoder.encoder.layers.9.ffn2.intermediate_dense.weight": "model-00001-of-00002.safetensors",
782 "speech_encoder.encoder.layers.9.ffn2.output_dense.bias": "model-00001-of-00002.safetensors",
783 "speech_encoder.encoder.layers.9.ffn2.output_dense.weight": "model-00001-of-00002.safetensors",
784 "speech_encoder.encoder.layers.9.ffn2_layer_norm.bias": "model-00001-of-00002.safetensors",
785 "speech_encoder.encoder.layers.9.ffn2_layer_norm.weight": "model-00001-of-00002.safetensors",
786 "speech_encoder.encoder.layers.9.final_layer_norm.bias": "model-00001-of-00002.safetensors",
787 "speech_encoder.encoder.layers.9.final_layer_norm.weight": "model-00001-of-00002.safetensors",
788 "speech_encoder.encoder.layers.9.self_attn.distance_embedding.weight": "model-00001-of-00002.safetensors",
789 "speech_encoder.encoder.layers.9.self_attn.linear_k.bias": "model-00001-of-00002.safetensors",
790 "speech_encoder.encoder.layers.9.self_attn.linear_k.weight": "model-00001-of-00002.safetensors",
791 "speech_encoder.encoder.layers.9.self_attn.linear_out.bias": "model-00001-of-00002.safetensors",
792 "speech_encoder.encoder.layers.9.self_attn.linear_out.weight": "model-00001-of-00002.safetensors",
793 "speech_encoder.encoder.layers.9.self_attn.linear_q.bias": "model-00001-of-00002.safetensors",
794 "speech_encoder.encoder.layers.9.self_attn.linear_q.weight": "model-00001-of-00002.safetensors",
795 "speech_encoder.encoder.layers.9.self_attn.linear_v.bias": "model-00001-of-00002.safetensors",
796 "speech_encoder.encoder.layers.9.self_attn.linear_v.weight": "model-00001-of-00002.safetensors",
797 "speech_encoder.encoder.layers.9.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
798 "speech_encoder.encoder.layers.9.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
799 "speech_encoder.feature_projection.layer_norm.bias": "model-00001-of-00002.safetensors",
800 "speech_encoder.feature_projection.layer_norm.weight": "model-00001-of-00002.safetensors",
801 "speech_encoder.feature_projection.projection.bias": "model-00001-of-00002.safetensors",
802 "speech_encoder.feature_projection.projection.weight": "model-00001-of-00002.safetensors",
803 "speech_encoder.inner_layer_norm.bias": "model-00002-of-00002.safetensors",
804 "speech_encoder.inner_layer_norm.weight": "model-00002-of-00002.safetensors",
805 "speech_encoder.intermediate_ffn.intermediate_dense.bias": "model-00002-of-00002.safetensors",
806 "speech_encoder.intermediate_ffn.intermediate_dense.weight": "model-00002-of-00002.safetensors",
807 "speech_encoder.intermediate_ffn.output_dense.bias": "model-00002-of-00002.safetensors",
808 "speech_encoder.intermediate_ffn.output_dense.weight": "model-00002-of-00002.safetensors",
809 "t2u_model.model.decoder.duration_predictor.conv1.bias": "model-00002-of-00002.safetensors",
810 "t2u_model.model.decoder.duration_predictor.conv1.weight": "model-00002-of-00002.safetensors",
811 "t2u_model.model.decoder.duration_predictor.conv2.bias": "model-00002-of-00002.safetensors",
812 "t2u_model.model.decoder.duration_predictor.conv2.weight": "model-00002-of-00002.safetensors",
813 "t2u_model.model.decoder.duration_predictor.ln1.bias": "model-00002-of-00002.safetensors",
814 "t2u_model.model.decoder.duration_predictor.ln1.weight": "model-00002-of-00002.safetensors",
815 "t2u_model.model.decoder.duration_predictor.ln2.bias": "model-00002-of-00002.safetensors",
816 "t2u_model.model.decoder.duration_predictor.ln2.weight": "model-00002-of-00002.safetensors",
817 "t2u_model.model.decoder.duration_predictor.proj.bias": "model-00002-of-00002.safetensors",
818 "t2u_model.model.decoder.duration_predictor.proj.weight": "model-00002-of-00002.safetensors",
819 "t2u_model.model.decoder.embed_char.weight": "model-00002-of-00002.safetensors",
820 "t2u_model.model.decoder.embed_tokens.weight": "model-00002-of-00002.safetensors",
821 "t2u_model.model.decoder.layer_norm.bias": "model-00002-of-00002.safetensors",
822 "t2u_model.model.decoder.layer_norm.weight": "model-00002-of-00002.safetensors",
823 "t2u_model.model.decoder.layers.0.conv1.bias": "model-00002-of-00002.safetensors",
824 "t2u_model.model.decoder.layers.0.conv1.weight": "model-00002-of-00002.safetensors",
825 "t2u_model.model.decoder.layers.0.conv2.bias": "model-00002-of-00002.safetensors",
826 "t2u_model.model.decoder.layers.0.conv2.weight": "model-00002-of-00002.safetensors",
827 "t2u_model.model.decoder.layers.0.conv_layer_norm.bias": "model-00002-of-00002.safetensors",
828 "t2u_model.model.decoder.layers.0.conv_layer_norm.weight": "model-00002-of-00002.safetensors",
829 "t2u_model.model.decoder.layers.0.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
830 "t2u_model.model.decoder.layers.0.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
831 "t2u_model.model.decoder.layers.0.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
832 "t2u_model.model.decoder.layers.0.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
833 "t2u_model.model.decoder.layers.0.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
834 "t2u_model.model.decoder.layers.0.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
835 "t2u_model.model.decoder.layers.0.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
836 "t2u_model.model.decoder.layers.0.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
837 "t2u_model.model.decoder.layers.0.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
838 "t2u_model.model.decoder.layers.0.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
839 "t2u_model.model.decoder.layers.1.conv1.bias": "model-00002-of-00002.safetensors",
840 "t2u_model.model.decoder.layers.1.conv1.weight": "model-00002-of-00002.safetensors",
841 "t2u_model.model.decoder.layers.1.conv2.bias": "model-00002-of-00002.safetensors",
842 "t2u_model.model.decoder.layers.1.conv2.weight": "model-00002-of-00002.safetensors",
843 "t2u_model.model.decoder.layers.1.conv_layer_norm.bias": "model-00002-of-00002.safetensors",
844 "t2u_model.model.decoder.layers.1.conv_layer_norm.weight": "model-00002-of-00002.safetensors",
845 "t2u_model.model.decoder.layers.1.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
846 "t2u_model.model.decoder.layers.1.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
847 "t2u_model.model.decoder.layers.1.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
848 "t2u_model.model.decoder.layers.1.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
849 "t2u_model.model.decoder.layers.1.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
850 "t2u_model.model.decoder.layers.1.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
851 "t2u_model.model.decoder.layers.1.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
852 "t2u_model.model.decoder.layers.1.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
853 "t2u_model.model.decoder.layers.1.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
854 "t2u_model.model.decoder.layers.1.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
855 "t2u_model.model.decoder.layers.2.conv1.bias": "model-00002-of-00002.safetensors",
856 "t2u_model.model.decoder.layers.2.conv1.weight": "model-00002-of-00002.safetensors",
857 "t2u_model.model.decoder.layers.2.conv2.bias": "model-00002-of-00002.safetensors",
858 "t2u_model.model.decoder.layers.2.conv2.weight": "model-00002-of-00002.safetensors",
859 "t2u_model.model.decoder.layers.2.conv_layer_norm.bias": "model-00002-of-00002.safetensors",
860 "t2u_model.model.decoder.layers.2.conv_layer_norm.weight": "model-00002-of-00002.safetensors",
861 "t2u_model.model.decoder.layers.2.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
862 "t2u_model.model.decoder.layers.2.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
863 "t2u_model.model.decoder.layers.2.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
864 "t2u_model.model.decoder.layers.2.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
865 "t2u_model.model.decoder.layers.2.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
866 "t2u_model.model.decoder.layers.2.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
867 "t2u_model.model.decoder.layers.2.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
868 "t2u_model.model.decoder.layers.2.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
869 "t2u_model.model.decoder.layers.2.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
870 "t2u_model.model.decoder.layers.2.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
871 "t2u_model.model.decoder.layers.3.conv1.bias": "model-00002-of-00002.safetensors",
872 "t2u_model.model.decoder.layers.3.conv1.weight": "model-00002-of-00002.safetensors",
873 "t2u_model.model.decoder.layers.3.conv2.bias": "model-00002-of-00002.safetensors",
874 "t2u_model.model.decoder.layers.3.conv2.weight": "model-00002-of-00002.safetensors",
875 "t2u_model.model.decoder.layers.3.conv_layer_norm.bias": "model-00002-of-00002.safetensors",
876 "t2u_model.model.decoder.layers.3.conv_layer_norm.weight": "model-00002-of-00002.safetensors",
877 "t2u_model.model.decoder.layers.3.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
878 "t2u_model.model.decoder.layers.3.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
879 "t2u_model.model.decoder.layers.3.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
880 "t2u_model.model.decoder.layers.3.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
881 "t2u_model.model.decoder.layers.3.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
882 "t2u_model.model.decoder.layers.3.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
883 "t2u_model.model.decoder.layers.3.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
884 "t2u_model.model.decoder.layers.3.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
885 "t2u_model.model.decoder.layers.3.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
886 "t2u_model.model.decoder.layers.3.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
887 "t2u_model.model.decoder.layers.4.conv1.bias": "model-00002-of-00002.safetensors",
888 "t2u_model.model.decoder.layers.4.conv1.weight": "model-00002-of-00002.safetensors",
889 "t2u_model.model.decoder.layers.4.conv2.bias": "model-00002-of-00002.safetensors",
890 "t2u_model.model.decoder.layers.4.conv2.weight": "model-00002-of-00002.safetensors",
891 "t2u_model.model.decoder.layers.4.conv_layer_norm.bias": "model-00002-of-00002.safetensors",
892 "t2u_model.model.decoder.layers.4.conv_layer_norm.weight": "model-00002-of-00002.safetensors",
893 "t2u_model.model.decoder.layers.4.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
894 "t2u_model.model.decoder.layers.4.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
895 "t2u_model.model.decoder.layers.4.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
896 "t2u_model.model.decoder.layers.4.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
897 "t2u_model.model.decoder.layers.4.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
898 "t2u_model.model.decoder.layers.4.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
899 "t2u_model.model.decoder.layers.4.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
900 "t2u_model.model.decoder.layers.4.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
901 "t2u_model.model.decoder.layers.4.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
902 "t2u_model.model.decoder.layers.4.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
903 "t2u_model.model.decoder.layers.5.conv1.bias": "model-00002-of-00002.safetensors",
904 "t2u_model.model.decoder.layers.5.conv1.weight": "model-00002-of-00002.safetensors",
905 "t2u_model.model.decoder.layers.5.conv2.bias": "model-00002-of-00002.safetensors",
906 "t2u_model.model.decoder.layers.5.conv2.weight": "model-00002-of-00002.safetensors",
907 "t2u_model.model.decoder.layers.5.conv_layer_norm.bias": "model-00002-of-00002.safetensors",
908 "t2u_model.model.decoder.layers.5.conv_layer_norm.weight": "model-00002-of-00002.safetensors",
909 "t2u_model.model.decoder.layers.5.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
910 "t2u_model.model.decoder.layers.5.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
911 "t2u_model.model.decoder.layers.5.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
912 "t2u_model.model.decoder.layers.5.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
913 "t2u_model.model.decoder.layers.5.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
914 "t2u_model.model.decoder.layers.5.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
915 "t2u_model.model.decoder.layers.5.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
916 "t2u_model.model.decoder.layers.5.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
917 "t2u_model.model.decoder.layers.5.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
918 "t2u_model.model.decoder.layers.5.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
919 "t2u_model.model.decoder.pos_emb_alpha": "model-00002-of-00002.safetensors",
920 "t2u_model.model.decoder.pos_emb_alpha_char": "model-00002-of-00002.safetensors",
921 "t2u_model.model.encoder.layer_norm.bias": "model-00002-of-00002.safetensors",
922 "t2u_model.model.encoder.layer_norm.weight": "model-00002-of-00002.safetensors",
923 "t2u_model.model.encoder.layers.0.ffn.fc1.bias": "model-00002-of-00002.safetensors",
924 "t2u_model.model.encoder.layers.0.ffn.fc1.weight": "model-00002-of-00002.safetensors",
925 "t2u_model.model.encoder.layers.0.ffn.fc2.bias": "model-00002-of-00002.safetensors",
926 "t2u_model.model.encoder.layers.0.ffn.fc2.weight": "model-00002-of-00002.safetensors",
927 "t2u_model.model.encoder.layers.0.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
928 "t2u_model.model.encoder.layers.0.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
929 "t2u_model.model.encoder.layers.0.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
930 "t2u_model.model.encoder.layers.0.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
931 "t2u_model.model.encoder.layers.0.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
932 "t2u_model.model.encoder.layers.0.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
933 "t2u_model.model.encoder.layers.0.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
934 "t2u_model.model.encoder.layers.0.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
935 "t2u_model.model.encoder.layers.0.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
936 "t2u_model.model.encoder.layers.0.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
937 "t2u_model.model.encoder.layers.0.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
938 "t2u_model.model.encoder.layers.0.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
939 "t2u_model.model.encoder.layers.1.ffn.fc1.bias": "model-00002-of-00002.safetensors",
940 "t2u_model.model.encoder.layers.1.ffn.fc1.weight": "model-00002-of-00002.safetensors",
941 "t2u_model.model.encoder.layers.1.ffn.fc2.bias": "model-00002-of-00002.safetensors",
942 "t2u_model.model.encoder.layers.1.ffn.fc2.weight": "model-00002-of-00002.safetensors",
943 "t2u_model.model.encoder.layers.1.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
944 "t2u_model.model.encoder.layers.1.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
945 "t2u_model.model.encoder.layers.1.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
946 "t2u_model.model.encoder.layers.1.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
947 "t2u_model.model.encoder.layers.1.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
948 "t2u_model.model.encoder.layers.1.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
949 "t2u_model.model.encoder.layers.1.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
950 "t2u_model.model.encoder.layers.1.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
951 "t2u_model.model.encoder.layers.1.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
952 "t2u_model.model.encoder.layers.1.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
953 "t2u_model.model.encoder.layers.1.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
954 "t2u_model.model.encoder.layers.1.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
955 "t2u_model.model.encoder.layers.2.ffn.fc1.bias": "model-00002-of-00002.safetensors",
956 "t2u_model.model.encoder.layers.2.ffn.fc1.weight": "model-00002-of-00002.safetensors",
957 "t2u_model.model.encoder.layers.2.ffn.fc2.bias": "model-00002-of-00002.safetensors",
958 "t2u_model.model.encoder.layers.2.ffn.fc2.weight": "model-00002-of-00002.safetensors",
959 "t2u_model.model.encoder.layers.2.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
960 "t2u_model.model.encoder.layers.2.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
961 "t2u_model.model.encoder.layers.2.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
962 "t2u_model.model.encoder.layers.2.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
963 "t2u_model.model.encoder.layers.2.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
964 "t2u_model.model.encoder.layers.2.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
965 "t2u_model.model.encoder.layers.2.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
966 "t2u_model.model.encoder.layers.2.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
967 "t2u_model.model.encoder.layers.2.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
968 "t2u_model.model.encoder.layers.2.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
969 "t2u_model.model.encoder.layers.2.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
970 "t2u_model.model.encoder.layers.2.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
971 "t2u_model.model.encoder.layers.3.ffn.fc1.bias": "model-00002-of-00002.safetensors",
972 "t2u_model.model.encoder.layers.3.ffn.fc1.weight": "model-00002-of-00002.safetensors",
973 "t2u_model.model.encoder.layers.3.ffn.fc2.bias": "model-00002-of-00002.safetensors",
974 "t2u_model.model.encoder.layers.3.ffn.fc2.weight": "model-00002-of-00002.safetensors",
975 "t2u_model.model.encoder.layers.3.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
976 "t2u_model.model.encoder.layers.3.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
977 "t2u_model.model.encoder.layers.3.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
978 "t2u_model.model.encoder.layers.3.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
979 "t2u_model.model.encoder.layers.3.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
980 "t2u_model.model.encoder.layers.3.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
981 "t2u_model.model.encoder.layers.3.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
982 "t2u_model.model.encoder.layers.3.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
983 "t2u_model.model.encoder.layers.3.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
984 "t2u_model.model.encoder.layers.3.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
985 "t2u_model.model.encoder.layers.3.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
986 "t2u_model.model.encoder.layers.3.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
987 "t2u_model.model.encoder.layers.4.ffn.fc1.bias": "model-00002-of-00002.safetensors",
988 "t2u_model.model.encoder.layers.4.ffn.fc1.weight": "model-00002-of-00002.safetensors",
989 "t2u_model.model.encoder.layers.4.ffn.fc2.bias": "model-00002-of-00002.safetensors",
990 "t2u_model.model.encoder.layers.4.ffn.fc2.weight": "model-00002-of-00002.safetensors",
991 "t2u_model.model.encoder.layers.4.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
992 "t2u_model.model.encoder.layers.4.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
993 "t2u_model.model.encoder.layers.4.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
994 "t2u_model.model.encoder.layers.4.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
995 "t2u_model.model.encoder.layers.4.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
996 "t2u_model.model.encoder.layers.4.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
997 "t2u_model.model.encoder.layers.4.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
998 "t2u_model.model.encoder.layers.4.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
999 "t2u_model.model.encoder.layers.4.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1000 "t2u_model.model.encoder.layers.4.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1001 "t2u_model.model.encoder.layers.4.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1002 "t2u_model.model.encoder.layers.4.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1003 "t2u_model.model.encoder.layers.5.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1004 "t2u_model.model.encoder.layers.5.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1005 "t2u_model.model.encoder.layers.5.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1006 "t2u_model.model.encoder.layers.5.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1007 "t2u_model.model.encoder.layers.5.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1008 "t2u_model.model.encoder.layers.5.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1009 "t2u_model.model.encoder.layers.5.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1010 "t2u_model.model.encoder.layers.5.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1011 "t2u_model.model.encoder.layers.5.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1012 "t2u_model.model.encoder.layers.5.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1013 "t2u_model.model.encoder.layers.5.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1014 "t2u_model.model.encoder.layers.5.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1015 "t2u_model.model.encoder.layers.5.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1016 "t2u_model.model.encoder.layers.5.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1017 "t2u_model.model.encoder.layers.5.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1018 "t2u_model.model.encoder.layers.5.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1019 "text_decoder.layer_norm.bias": "model-00002-of-00002.safetensors",
1020 "text_decoder.layer_norm.weight": "model-00002-of-00002.safetensors",
1021 "text_decoder.layers.0.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1022 "text_decoder.layers.0.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1023 "text_decoder.layers.0.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1024 "text_decoder.layers.0.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1025 "text_decoder.layers.0.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1026 "text_decoder.layers.0.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1027 "text_decoder.layers.0.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1028 "text_decoder.layers.0.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1029 "text_decoder.layers.0.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1030 "text_decoder.layers.0.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1031 "text_decoder.layers.0.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1032 "text_decoder.layers.0.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1033 "text_decoder.layers.0.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1034 "text_decoder.layers.0.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1035 "text_decoder.layers.0.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1036 "text_decoder.layers.0.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1037 "text_decoder.layers.0.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1038 "text_decoder.layers.0.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1039 "text_decoder.layers.0.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1040 "text_decoder.layers.0.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1041 "text_decoder.layers.0.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1042 "text_decoder.layers.0.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1043 "text_decoder.layers.0.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1044 "text_decoder.layers.0.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1045 "text_decoder.layers.0.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1046 "text_decoder.layers.0.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1047 "text_decoder.layers.1.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1048 "text_decoder.layers.1.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1049 "text_decoder.layers.1.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1050 "text_decoder.layers.1.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1051 "text_decoder.layers.1.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1052 "text_decoder.layers.1.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1053 "text_decoder.layers.1.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1054 "text_decoder.layers.1.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1055 "text_decoder.layers.1.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1056 "text_decoder.layers.1.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1057 "text_decoder.layers.1.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1058 "text_decoder.layers.1.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1059 "text_decoder.layers.1.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1060 "text_decoder.layers.1.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1061 "text_decoder.layers.1.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1062 "text_decoder.layers.1.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1063 "text_decoder.layers.1.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1064 "text_decoder.layers.1.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1065 "text_decoder.layers.1.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1066 "text_decoder.layers.1.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1067 "text_decoder.layers.1.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1068 "text_decoder.layers.1.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1069 "text_decoder.layers.1.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1070 "text_decoder.layers.1.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1071 "text_decoder.layers.1.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1072 "text_decoder.layers.1.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1073 "text_decoder.layers.10.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1074 "text_decoder.layers.10.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1075 "text_decoder.layers.10.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1076 "text_decoder.layers.10.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1077 "text_decoder.layers.10.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1078 "text_decoder.layers.10.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1079 "text_decoder.layers.10.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1080 "text_decoder.layers.10.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1081 "text_decoder.layers.10.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1082 "text_decoder.layers.10.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1083 "text_decoder.layers.10.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1084 "text_decoder.layers.10.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1085 "text_decoder.layers.10.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1086 "text_decoder.layers.10.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1087 "text_decoder.layers.10.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1088 "text_decoder.layers.10.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1089 "text_decoder.layers.10.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1090 "text_decoder.layers.10.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1091 "text_decoder.layers.10.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1092 "text_decoder.layers.10.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1093 "text_decoder.layers.10.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1094 "text_decoder.layers.10.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1095 "text_decoder.layers.10.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1096 "text_decoder.layers.10.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1097 "text_decoder.layers.10.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1098 "text_decoder.layers.10.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1099 "text_decoder.layers.11.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1100 "text_decoder.layers.11.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1101 "text_decoder.layers.11.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1102 "text_decoder.layers.11.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1103 "text_decoder.layers.11.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1104 "text_decoder.layers.11.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1105 "text_decoder.layers.11.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1106 "text_decoder.layers.11.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1107 "text_decoder.layers.11.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1108 "text_decoder.layers.11.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1109 "text_decoder.layers.11.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1110 "text_decoder.layers.11.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1111 "text_decoder.layers.11.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1112 "text_decoder.layers.11.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1113 "text_decoder.layers.11.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1114 "text_decoder.layers.11.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1115 "text_decoder.layers.11.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1116 "text_decoder.layers.11.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1117 "text_decoder.layers.11.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1118 "text_decoder.layers.11.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1119 "text_decoder.layers.11.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1120 "text_decoder.layers.11.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1121 "text_decoder.layers.11.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1122 "text_decoder.layers.11.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1123 "text_decoder.layers.11.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1124 "text_decoder.layers.11.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1125 "text_decoder.layers.12.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1126 "text_decoder.layers.12.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1127 "text_decoder.layers.12.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1128 "text_decoder.layers.12.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1129 "text_decoder.layers.12.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1130 "text_decoder.layers.12.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1131 "text_decoder.layers.12.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1132 "text_decoder.layers.12.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1133 "text_decoder.layers.12.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1134 "text_decoder.layers.12.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1135 "text_decoder.layers.12.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1136 "text_decoder.layers.12.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1137 "text_decoder.layers.12.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1138 "text_decoder.layers.12.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1139 "text_decoder.layers.12.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1140 "text_decoder.layers.12.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1141 "text_decoder.layers.12.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1142 "text_decoder.layers.12.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1143 "text_decoder.layers.12.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1144 "text_decoder.layers.12.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1145 "text_decoder.layers.12.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1146 "text_decoder.layers.12.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1147 "text_decoder.layers.12.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1148 "text_decoder.layers.12.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1149 "text_decoder.layers.12.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1150 "text_decoder.layers.12.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1151 "text_decoder.layers.13.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1152 "text_decoder.layers.13.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1153 "text_decoder.layers.13.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1154 "text_decoder.layers.13.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1155 "text_decoder.layers.13.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1156 "text_decoder.layers.13.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1157 "text_decoder.layers.13.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1158 "text_decoder.layers.13.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1159 "text_decoder.layers.13.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1160 "text_decoder.layers.13.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1161 "text_decoder.layers.13.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1162 "text_decoder.layers.13.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1163 "text_decoder.layers.13.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1164 "text_decoder.layers.13.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1165 "text_decoder.layers.13.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1166 "text_decoder.layers.13.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1167 "text_decoder.layers.13.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1168 "text_decoder.layers.13.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1169 "text_decoder.layers.13.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1170 "text_decoder.layers.13.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1171 "text_decoder.layers.13.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1172 "text_decoder.layers.13.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1173 "text_decoder.layers.13.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1174 "text_decoder.layers.13.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1175 "text_decoder.layers.13.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1176 "text_decoder.layers.13.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1177 "text_decoder.layers.14.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1178 "text_decoder.layers.14.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1179 "text_decoder.layers.14.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1180 "text_decoder.layers.14.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1181 "text_decoder.layers.14.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1182 "text_decoder.layers.14.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1183 "text_decoder.layers.14.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1184 "text_decoder.layers.14.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1185 "text_decoder.layers.14.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1186 "text_decoder.layers.14.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1187 "text_decoder.layers.14.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1188 "text_decoder.layers.14.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1189 "text_decoder.layers.14.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1190 "text_decoder.layers.14.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1191 "text_decoder.layers.14.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1192 "text_decoder.layers.14.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1193 "text_decoder.layers.14.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1194 "text_decoder.layers.14.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1195 "text_decoder.layers.14.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1196 "text_decoder.layers.14.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1197 "text_decoder.layers.14.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1198 "text_decoder.layers.14.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1199 "text_decoder.layers.14.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1200 "text_decoder.layers.14.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1201 "text_decoder.layers.14.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1202 "text_decoder.layers.14.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1203 "text_decoder.layers.15.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1204 "text_decoder.layers.15.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1205 "text_decoder.layers.15.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1206 "text_decoder.layers.15.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1207 "text_decoder.layers.15.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1208 "text_decoder.layers.15.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1209 "text_decoder.layers.15.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1210 "text_decoder.layers.15.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1211 "text_decoder.layers.15.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1212 "text_decoder.layers.15.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1213 "text_decoder.layers.15.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1214 "text_decoder.layers.15.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1215 "text_decoder.layers.15.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1216 "text_decoder.layers.15.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1217 "text_decoder.layers.15.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1218 "text_decoder.layers.15.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1219 "text_decoder.layers.15.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1220 "text_decoder.layers.15.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1221 "text_decoder.layers.15.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1222 "text_decoder.layers.15.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1223 "text_decoder.layers.15.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1224 "text_decoder.layers.15.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1225 "text_decoder.layers.15.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1226 "text_decoder.layers.15.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1227 "text_decoder.layers.15.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1228 "text_decoder.layers.15.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1229 "text_decoder.layers.16.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1230 "text_decoder.layers.16.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1231 "text_decoder.layers.16.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1232 "text_decoder.layers.16.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1233 "text_decoder.layers.16.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1234 "text_decoder.layers.16.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1235 "text_decoder.layers.16.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1236 "text_decoder.layers.16.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1237 "text_decoder.layers.16.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1238 "text_decoder.layers.16.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1239 "text_decoder.layers.16.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1240 "text_decoder.layers.16.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1241 "text_decoder.layers.16.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1242 "text_decoder.layers.16.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1243 "text_decoder.layers.16.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1244 "text_decoder.layers.16.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1245 "text_decoder.layers.16.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1246 "text_decoder.layers.16.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1247 "text_decoder.layers.16.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1248 "text_decoder.layers.16.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1249 "text_decoder.layers.16.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1250 "text_decoder.layers.16.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1251 "text_decoder.layers.16.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1252 "text_decoder.layers.16.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1253 "text_decoder.layers.16.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1254 "text_decoder.layers.16.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1255 "text_decoder.layers.17.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1256 "text_decoder.layers.17.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1257 "text_decoder.layers.17.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1258 "text_decoder.layers.17.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1259 "text_decoder.layers.17.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1260 "text_decoder.layers.17.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1261 "text_decoder.layers.17.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1262 "text_decoder.layers.17.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1263 "text_decoder.layers.17.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1264 "text_decoder.layers.17.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1265 "text_decoder.layers.17.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1266 "text_decoder.layers.17.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1267 "text_decoder.layers.17.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1268 "text_decoder.layers.17.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1269 "text_decoder.layers.17.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1270 "text_decoder.layers.17.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1271 "text_decoder.layers.17.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1272 "text_decoder.layers.17.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1273 "text_decoder.layers.17.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1274 "text_decoder.layers.17.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1275 "text_decoder.layers.17.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1276 "text_decoder.layers.17.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1277 "text_decoder.layers.17.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1278 "text_decoder.layers.17.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1279 "text_decoder.layers.17.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1280 "text_decoder.layers.17.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1281 "text_decoder.layers.18.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1282 "text_decoder.layers.18.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1283 "text_decoder.layers.18.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1284 "text_decoder.layers.18.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1285 "text_decoder.layers.18.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1286 "text_decoder.layers.18.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1287 "text_decoder.layers.18.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1288 "text_decoder.layers.18.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1289 "text_decoder.layers.18.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1290 "text_decoder.layers.18.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1291 "text_decoder.layers.18.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1292 "text_decoder.layers.18.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1293 "text_decoder.layers.18.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1294 "text_decoder.layers.18.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1295 "text_decoder.layers.18.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1296 "text_decoder.layers.18.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1297 "text_decoder.layers.18.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1298 "text_decoder.layers.18.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1299 "text_decoder.layers.18.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1300 "text_decoder.layers.18.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1301 "text_decoder.layers.18.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1302 "text_decoder.layers.18.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1303 "text_decoder.layers.18.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1304 "text_decoder.layers.18.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1305 "text_decoder.layers.18.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1306 "text_decoder.layers.18.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1307 "text_decoder.layers.19.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1308 "text_decoder.layers.19.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1309 "text_decoder.layers.19.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1310 "text_decoder.layers.19.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1311 "text_decoder.layers.19.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1312 "text_decoder.layers.19.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1313 "text_decoder.layers.19.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1314 "text_decoder.layers.19.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1315 "text_decoder.layers.19.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1316 "text_decoder.layers.19.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1317 "text_decoder.layers.19.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1318 "text_decoder.layers.19.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1319 "text_decoder.layers.19.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1320 "text_decoder.layers.19.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1321 "text_decoder.layers.19.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1322 "text_decoder.layers.19.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1323 "text_decoder.layers.19.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1324 "text_decoder.layers.19.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1325 "text_decoder.layers.19.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1326 "text_decoder.layers.19.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1327 "text_decoder.layers.19.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1328 "text_decoder.layers.19.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1329 "text_decoder.layers.19.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1330 "text_decoder.layers.19.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1331 "text_decoder.layers.19.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1332 "text_decoder.layers.19.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1333 "text_decoder.layers.2.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1334 "text_decoder.layers.2.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1335 "text_decoder.layers.2.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1336 "text_decoder.layers.2.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1337 "text_decoder.layers.2.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1338 "text_decoder.layers.2.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1339 "text_decoder.layers.2.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1340 "text_decoder.layers.2.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1341 "text_decoder.layers.2.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1342 "text_decoder.layers.2.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1343 "text_decoder.layers.2.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1344 "text_decoder.layers.2.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1345 "text_decoder.layers.2.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1346 "text_decoder.layers.2.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1347 "text_decoder.layers.2.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1348 "text_decoder.layers.2.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1349 "text_decoder.layers.2.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1350 "text_decoder.layers.2.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1351 "text_decoder.layers.2.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1352 "text_decoder.layers.2.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1353 "text_decoder.layers.2.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1354 "text_decoder.layers.2.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1355 "text_decoder.layers.2.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1356 "text_decoder.layers.2.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1357 "text_decoder.layers.2.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1358 "text_decoder.layers.2.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1359 "text_decoder.layers.20.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1360 "text_decoder.layers.20.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1361 "text_decoder.layers.20.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1362 "text_decoder.layers.20.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1363 "text_decoder.layers.20.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1364 "text_decoder.layers.20.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1365 "text_decoder.layers.20.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1366 "text_decoder.layers.20.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1367 "text_decoder.layers.20.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1368 "text_decoder.layers.20.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1369 "text_decoder.layers.20.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1370 "text_decoder.layers.20.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1371 "text_decoder.layers.20.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1372 "text_decoder.layers.20.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1373 "text_decoder.layers.20.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1374 "text_decoder.layers.20.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1375 "text_decoder.layers.20.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1376 "text_decoder.layers.20.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1377 "text_decoder.layers.20.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1378 "text_decoder.layers.20.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1379 "text_decoder.layers.20.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1380 "text_decoder.layers.20.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1381 "text_decoder.layers.20.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1382 "text_decoder.layers.20.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1383 "text_decoder.layers.20.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1384 "text_decoder.layers.20.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1385 "text_decoder.layers.21.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1386 "text_decoder.layers.21.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1387 "text_decoder.layers.21.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1388 "text_decoder.layers.21.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1389 "text_decoder.layers.21.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1390 "text_decoder.layers.21.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1391 "text_decoder.layers.21.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1392 "text_decoder.layers.21.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1393 "text_decoder.layers.21.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1394 "text_decoder.layers.21.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1395 "text_decoder.layers.21.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1396 "text_decoder.layers.21.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1397 "text_decoder.layers.21.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1398 "text_decoder.layers.21.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1399 "text_decoder.layers.21.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1400 "text_decoder.layers.21.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1401 "text_decoder.layers.21.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1402 "text_decoder.layers.21.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1403 "text_decoder.layers.21.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1404 "text_decoder.layers.21.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1405 "text_decoder.layers.21.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1406 "text_decoder.layers.21.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1407 "text_decoder.layers.21.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1408 "text_decoder.layers.21.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1409 "text_decoder.layers.21.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1410 "text_decoder.layers.21.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1411 "text_decoder.layers.22.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1412 "text_decoder.layers.22.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1413 "text_decoder.layers.22.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1414 "text_decoder.layers.22.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1415 "text_decoder.layers.22.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1416 "text_decoder.layers.22.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1417 "text_decoder.layers.22.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1418 "text_decoder.layers.22.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1419 "text_decoder.layers.22.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1420 "text_decoder.layers.22.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1421 "text_decoder.layers.22.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1422 "text_decoder.layers.22.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1423 "text_decoder.layers.22.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1424 "text_decoder.layers.22.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1425 "text_decoder.layers.22.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1426 "text_decoder.layers.22.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1427 "text_decoder.layers.22.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1428 "text_decoder.layers.22.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1429 "text_decoder.layers.22.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1430 "text_decoder.layers.22.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1431 "text_decoder.layers.22.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1432 "text_decoder.layers.22.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1433 "text_decoder.layers.22.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1434 "text_decoder.layers.22.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1435 "text_decoder.layers.22.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1436 "text_decoder.layers.22.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1437 "text_decoder.layers.23.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1438 "text_decoder.layers.23.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1439 "text_decoder.layers.23.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1440 "text_decoder.layers.23.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1441 "text_decoder.layers.23.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1442 "text_decoder.layers.23.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1443 "text_decoder.layers.23.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1444 "text_decoder.layers.23.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1445 "text_decoder.layers.23.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1446 "text_decoder.layers.23.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1447 "text_decoder.layers.23.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1448 "text_decoder.layers.23.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1449 "text_decoder.layers.23.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1450 "text_decoder.layers.23.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1451 "text_decoder.layers.23.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1452 "text_decoder.layers.23.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1453 "text_decoder.layers.23.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1454 "text_decoder.layers.23.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1455 "text_decoder.layers.23.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1456 "text_decoder.layers.23.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1457 "text_decoder.layers.23.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1458 "text_decoder.layers.23.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1459 "text_decoder.layers.23.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1460 "text_decoder.layers.23.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1461 "text_decoder.layers.23.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1462 "text_decoder.layers.23.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1463 "text_decoder.layers.3.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1464 "text_decoder.layers.3.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1465 "text_decoder.layers.3.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1466 "text_decoder.layers.3.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1467 "text_decoder.layers.3.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1468 "text_decoder.layers.3.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1469 "text_decoder.layers.3.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1470 "text_decoder.layers.3.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1471 "text_decoder.layers.3.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1472 "text_decoder.layers.3.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1473 "text_decoder.layers.3.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1474 "text_decoder.layers.3.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1475 "text_decoder.layers.3.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1476 "text_decoder.layers.3.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1477 "text_decoder.layers.3.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1478 "text_decoder.layers.3.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1479 "text_decoder.layers.3.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1480 "text_decoder.layers.3.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1481 "text_decoder.layers.3.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1482 "text_decoder.layers.3.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1483 "text_decoder.layers.3.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1484 "text_decoder.layers.3.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1485 "text_decoder.layers.3.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1486 "text_decoder.layers.3.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1487 "text_decoder.layers.3.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1488 "text_decoder.layers.3.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1489 "text_decoder.layers.4.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1490 "text_decoder.layers.4.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1491 "text_decoder.layers.4.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1492 "text_decoder.layers.4.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1493 "text_decoder.layers.4.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1494 "text_decoder.layers.4.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1495 "text_decoder.layers.4.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1496 "text_decoder.layers.4.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1497 "text_decoder.layers.4.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1498 "text_decoder.layers.4.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1499 "text_decoder.layers.4.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1500 "text_decoder.layers.4.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1501 "text_decoder.layers.4.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1502 "text_decoder.layers.4.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1503 "text_decoder.layers.4.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1504 "text_decoder.layers.4.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1505 "text_decoder.layers.4.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1506 "text_decoder.layers.4.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1507 "text_decoder.layers.4.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1508 "text_decoder.layers.4.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1509 "text_decoder.layers.4.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1510 "text_decoder.layers.4.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1511 "text_decoder.layers.4.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1512 "text_decoder.layers.4.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1513 "text_decoder.layers.4.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1514 "text_decoder.layers.4.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1515 "text_decoder.layers.5.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1516 "text_decoder.layers.5.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1517 "text_decoder.layers.5.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1518 "text_decoder.layers.5.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1519 "text_decoder.layers.5.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1520 "text_decoder.layers.5.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1521 "text_decoder.layers.5.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1522 "text_decoder.layers.5.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1523 "text_decoder.layers.5.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1524 "text_decoder.layers.5.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1525 "text_decoder.layers.5.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1526 "text_decoder.layers.5.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1527 "text_decoder.layers.5.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1528 "text_decoder.layers.5.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1529 "text_decoder.layers.5.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1530 "text_decoder.layers.5.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1531 "text_decoder.layers.5.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1532 "text_decoder.layers.5.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1533 "text_decoder.layers.5.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1534 "text_decoder.layers.5.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1535 "text_decoder.layers.5.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1536 "text_decoder.layers.5.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1537 "text_decoder.layers.5.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1538 "text_decoder.layers.5.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1539 "text_decoder.layers.5.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1540 "text_decoder.layers.5.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1541 "text_decoder.layers.6.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1542 "text_decoder.layers.6.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1543 "text_decoder.layers.6.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1544 "text_decoder.layers.6.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1545 "text_decoder.layers.6.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1546 "text_decoder.layers.6.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1547 "text_decoder.layers.6.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1548 "text_decoder.layers.6.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1549 "text_decoder.layers.6.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1550 "text_decoder.layers.6.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1551 "text_decoder.layers.6.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1552 "text_decoder.layers.6.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1553 "text_decoder.layers.6.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1554 "text_decoder.layers.6.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1555 "text_decoder.layers.6.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1556 "text_decoder.layers.6.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1557 "text_decoder.layers.6.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1558 "text_decoder.layers.6.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1559 "text_decoder.layers.6.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1560 "text_decoder.layers.6.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1561 "text_decoder.layers.6.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1562 "text_decoder.layers.6.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1563 "text_decoder.layers.6.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1564 "text_decoder.layers.6.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1565 "text_decoder.layers.6.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1566 "text_decoder.layers.6.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1567 "text_decoder.layers.7.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1568 "text_decoder.layers.7.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1569 "text_decoder.layers.7.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1570 "text_decoder.layers.7.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1571 "text_decoder.layers.7.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1572 "text_decoder.layers.7.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1573 "text_decoder.layers.7.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1574 "text_decoder.layers.7.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1575 "text_decoder.layers.7.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1576 "text_decoder.layers.7.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1577 "text_decoder.layers.7.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1578 "text_decoder.layers.7.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1579 "text_decoder.layers.7.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1580 "text_decoder.layers.7.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1581 "text_decoder.layers.7.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1582 "text_decoder.layers.7.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1583 "text_decoder.layers.7.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1584 "text_decoder.layers.7.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1585 "text_decoder.layers.7.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1586 "text_decoder.layers.7.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1587 "text_decoder.layers.7.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1588 "text_decoder.layers.7.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1589 "text_decoder.layers.7.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1590 "text_decoder.layers.7.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1591 "text_decoder.layers.7.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1592 "text_decoder.layers.7.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1593 "text_decoder.layers.8.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1594 "text_decoder.layers.8.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1595 "text_decoder.layers.8.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1596 "text_decoder.layers.8.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1597 "text_decoder.layers.8.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1598 "text_decoder.layers.8.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1599 "text_decoder.layers.8.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1600 "text_decoder.layers.8.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1601 "text_decoder.layers.8.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1602 "text_decoder.layers.8.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1603 "text_decoder.layers.8.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1604 "text_decoder.layers.8.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1605 "text_decoder.layers.8.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1606 "text_decoder.layers.8.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1607 "text_decoder.layers.8.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1608 "text_decoder.layers.8.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1609 "text_decoder.layers.8.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1610 "text_decoder.layers.8.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1611 "text_decoder.layers.8.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1612 "text_decoder.layers.8.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1613 "text_decoder.layers.8.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1614 "text_decoder.layers.8.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1615 "text_decoder.layers.8.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1616 "text_decoder.layers.8.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1617 "text_decoder.layers.8.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1618 "text_decoder.layers.8.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1619 "text_decoder.layers.9.cross_attention.k_proj.bias": "model-00002-of-00002.safetensors",
1620 "text_decoder.layers.9.cross_attention.k_proj.weight": "model-00002-of-00002.safetensors",
1621 "text_decoder.layers.9.cross_attention.out_proj.bias": "model-00002-of-00002.safetensors",
1622 "text_decoder.layers.9.cross_attention.out_proj.weight": "model-00002-of-00002.safetensors",
1623 "text_decoder.layers.9.cross_attention.q_proj.bias": "model-00002-of-00002.safetensors",
1624 "text_decoder.layers.9.cross_attention.q_proj.weight": "model-00002-of-00002.safetensors",
1625 "text_decoder.layers.9.cross_attention.v_proj.bias": "model-00002-of-00002.safetensors",
1626 "text_decoder.layers.9.cross_attention.v_proj.weight": "model-00002-of-00002.safetensors",
1627 "text_decoder.layers.9.cross_attention_layer_norm.bias": "model-00002-of-00002.safetensors",
1628 "text_decoder.layers.9.cross_attention_layer_norm.weight": "model-00002-of-00002.safetensors",
1629 "text_decoder.layers.9.ffn.fc1.bias": "model-00002-of-00002.safetensors",
1630 "text_decoder.layers.9.ffn.fc1.weight": "model-00002-of-00002.safetensors",
1631 "text_decoder.layers.9.ffn.fc2.bias": "model-00002-of-00002.safetensors",
1632 "text_decoder.layers.9.ffn.fc2.weight": "model-00002-of-00002.safetensors",
1633 "text_decoder.layers.9.ffn_layer_norm.bias": "model-00002-of-00002.safetensors",
1634 "text_decoder.layers.9.ffn_layer_norm.weight": "model-00002-of-00002.safetensors",
1635 "text_decoder.layers.9.self_attn.k_proj.bias": "model-00002-of-00002.safetensors",
1636 "text_decoder.layers.9.self_attn.k_proj.weight": "model-00002-of-00002.safetensors",
1637 "text_decoder.layers.9.self_attn.out_proj.bias": "model-00002-of-00002.safetensors",
1638 "text_decoder.layers.9.self_attn.out_proj.weight": "model-00002-of-00002.safetensors",
1639 "text_decoder.layers.9.self_attn.q_proj.bias": "model-00002-of-00002.safetensors",
1640 "text_decoder.layers.9.self_attn.q_proj.weight": "model-00002-of-00002.safetensors",
1641 "text_decoder.layers.9.self_attn.v_proj.bias": "model-00002-of-00002.safetensors",
1642 "text_decoder.layers.9.self_attn.v_proj.weight": "model-00002-of-00002.safetensors",
1643 "text_decoder.layers.9.self_attn_layer_norm.bias": "model-00002-of-00002.safetensors",
1644 "text_decoder.layers.9.self_attn_layer_norm.weight": "model-00002-of-00002.safetensors",
1645 "text_encoder.layer_norm.bias": "model-00001-of-00002.safetensors",
1646 "text_encoder.layer_norm.weight": "model-00001-of-00002.safetensors",
1647 "text_encoder.layers.0.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1648 "text_encoder.layers.0.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1649 "text_encoder.layers.0.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1650 "text_encoder.layers.0.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1651 "text_encoder.layers.0.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1652 "text_encoder.layers.0.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1653 "text_encoder.layers.0.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1654 "text_encoder.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1655 "text_encoder.layers.0.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1656 "text_encoder.layers.0.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1657 "text_encoder.layers.0.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1658 "text_encoder.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1659 "text_encoder.layers.0.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1660 "text_encoder.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1661 "text_encoder.layers.0.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1662 "text_encoder.layers.0.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1663 "text_encoder.layers.1.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1664 "text_encoder.layers.1.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1665 "text_encoder.layers.1.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1666 "text_encoder.layers.1.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1667 "text_encoder.layers.1.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1668 "text_encoder.layers.1.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1669 "text_encoder.layers.1.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1670 "text_encoder.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1671 "text_encoder.layers.1.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1672 "text_encoder.layers.1.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1673 "text_encoder.layers.1.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1674 "text_encoder.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1675 "text_encoder.layers.1.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1676 "text_encoder.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1677 "text_encoder.layers.1.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1678 "text_encoder.layers.1.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1679 "text_encoder.layers.10.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1680 "text_encoder.layers.10.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1681 "text_encoder.layers.10.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1682 "text_encoder.layers.10.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1683 "text_encoder.layers.10.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1684 "text_encoder.layers.10.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1685 "text_encoder.layers.10.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1686 "text_encoder.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1687 "text_encoder.layers.10.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1688 "text_encoder.layers.10.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1689 "text_encoder.layers.10.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1690 "text_encoder.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1691 "text_encoder.layers.10.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1692 "text_encoder.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1693 "text_encoder.layers.10.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1694 "text_encoder.layers.10.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1695 "text_encoder.layers.11.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1696 "text_encoder.layers.11.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1697 "text_encoder.layers.11.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1698 "text_encoder.layers.11.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1699 "text_encoder.layers.11.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1700 "text_encoder.layers.11.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1701 "text_encoder.layers.11.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1702 "text_encoder.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1703 "text_encoder.layers.11.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1704 "text_encoder.layers.11.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1705 "text_encoder.layers.11.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1706 "text_encoder.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1707 "text_encoder.layers.11.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1708 "text_encoder.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1709 "text_encoder.layers.11.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1710 "text_encoder.layers.11.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1711 "text_encoder.layers.12.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1712 "text_encoder.layers.12.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1713 "text_encoder.layers.12.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1714 "text_encoder.layers.12.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1715 "text_encoder.layers.12.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1716 "text_encoder.layers.12.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1717 "text_encoder.layers.12.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1718 "text_encoder.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1719 "text_encoder.layers.12.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1720 "text_encoder.layers.12.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1721 "text_encoder.layers.12.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1722 "text_encoder.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1723 "text_encoder.layers.12.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1724 "text_encoder.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1725 "text_encoder.layers.12.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1726 "text_encoder.layers.12.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1727 "text_encoder.layers.13.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1728 "text_encoder.layers.13.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1729 "text_encoder.layers.13.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1730 "text_encoder.layers.13.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1731 "text_encoder.layers.13.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1732 "text_encoder.layers.13.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1733 "text_encoder.layers.13.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1734 "text_encoder.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1735 "text_encoder.layers.13.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1736 "text_encoder.layers.13.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1737 "text_encoder.layers.13.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1738 "text_encoder.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1739 "text_encoder.layers.13.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1740 "text_encoder.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1741 "text_encoder.layers.13.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1742 "text_encoder.layers.13.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1743 "text_encoder.layers.14.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1744 "text_encoder.layers.14.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1745 "text_encoder.layers.14.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1746 "text_encoder.layers.14.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1747 "text_encoder.layers.14.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1748 "text_encoder.layers.14.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1749 "text_encoder.layers.14.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1750 "text_encoder.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1751 "text_encoder.layers.14.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1752 "text_encoder.layers.14.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1753 "text_encoder.layers.14.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1754 "text_encoder.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1755 "text_encoder.layers.14.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1756 "text_encoder.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1757 "text_encoder.layers.14.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1758 "text_encoder.layers.14.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1759 "text_encoder.layers.15.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1760 "text_encoder.layers.15.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1761 "text_encoder.layers.15.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1762 "text_encoder.layers.15.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1763 "text_encoder.layers.15.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1764 "text_encoder.layers.15.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1765 "text_encoder.layers.15.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1766 "text_encoder.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1767 "text_encoder.layers.15.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1768 "text_encoder.layers.15.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1769 "text_encoder.layers.15.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1770 "text_encoder.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1771 "text_encoder.layers.15.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1772 "text_encoder.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1773 "text_encoder.layers.15.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1774 "text_encoder.layers.15.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1775 "text_encoder.layers.16.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1776 "text_encoder.layers.16.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1777 "text_encoder.layers.16.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1778 "text_encoder.layers.16.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1779 "text_encoder.layers.16.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1780 "text_encoder.layers.16.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1781 "text_encoder.layers.16.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1782 "text_encoder.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1783 "text_encoder.layers.16.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1784 "text_encoder.layers.16.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1785 "text_encoder.layers.16.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1786 "text_encoder.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1787 "text_encoder.layers.16.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1788 "text_encoder.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1789 "text_encoder.layers.16.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1790 "text_encoder.layers.16.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1791 "text_encoder.layers.17.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1792 "text_encoder.layers.17.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1793 "text_encoder.layers.17.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1794 "text_encoder.layers.17.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1795 "text_encoder.layers.17.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1796 "text_encoder.layers.17.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1797 "text_encoder.layers.17.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1798 "text_encoder.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1799 "text_encoder.layers.17.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1800 "text_encoder.layers.17.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1801 "text_encoder.layers.17.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1802 "text_encoder.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1803 "text_encoder.layers.17.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1804 "text_encoder.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1805 "text_encoder.layers.17.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1806 "text_encoder.layers.17.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1807 "text_encoder.layers.18.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1808 "text_encoder.layers.18.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1809 "text_encoder.layers.18.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1810 "text_encoder.layers.18.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1811 "text_encoder.layers.18.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1812 "text_encoder.layers.18.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1813 "text_encoder.layers.18.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1814 "text_encoder.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1815 "text_encoder.layers.18.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1816 "text_encoder.layers.18.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1817 "text_encoder.layers.18.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1818 "text_encoder.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1819 "text_encoder.layers.18.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1820 "text_encoder.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1821 "text_encoder.layers.18.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1822 "text_encoder.layers.18.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1823 "text_encoder.layers.19.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1824 "text_encoder.layers.19.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1825 "text_encoder.layers.19.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1826 "text_encoder.layers.19.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1827 "text_encoder.layers.19.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1828 "text_encoder.layers.19.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1829 "text_encoder.layers.19.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1830 "text_encoder.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1831 "text_encoder.layers.19.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1832 "text_encoder.layers.19.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1833 "text_encoder.layers.19.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1834 "text_encoder.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1835 "text_encoder.layers.19.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1836 "text_encoder.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1837 "text_encoder.layers.19.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1838 "text_encoder.layers.19.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1839 "text_encoder.layers.2.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1840 "text_encoder.layers.2.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1841 "text_encoder.layers.2.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1842 "text_encoder.layers.2.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1843 "text_encoder.layers.2.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1844 "text_encoder.layers.2.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1845 "text_encoder.layers.2.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1846 "text_encoder.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1847 "text_encoder.layers.2.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1848 "text_encoder.layers.2.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1849 "text_encoder.layers.2.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1850 "text_encoder.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1851 "text_encoder.layers.2.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1852 "text_encoder.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1853 "text_encoder.layers.2.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1854 "text_encoder.layers.2.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1855 "text_encoder.layers.20.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1856 "text_encoder.layers.20.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1857 "text_encoder.layers.20.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1858 "text_encoder.layers.20.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1859 "text_encoder.layers.20.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1860 "text_encoder.layers.20.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1861 "text_encoder.layers.20.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1862 "text_encoder.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1863 "text_encoder.layers.20.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1864 "text_encoder.layers.20.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1865 "text_encoder.layers.20.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1866 "text_encoder.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1867 "text_encoder.layers.20.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1868 "text_encoder.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1869 "text_encoder.layers.20.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1870 "text_encoder.layers.20.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1871 "text_encoder.layers.21.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1872 "text_encoder.layers.21.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1873 "text_encoder.layers.21.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1874 "text_encoder.layers.21.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1875 "text_encoder.layers.21.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1876 "text_encoder.layers.21.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1877 "text_encoder.layers.21.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1878 "text_encoder.layers.21.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1879 "text_encoder.layers.21.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1880 "text_encoder.layers.21.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1881 "text_encoder.layers.21.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1882 "text_encoder.layers.21.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1883 "text_encoder.layers.21.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1884 "text_encoder.layers.21.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1885 "text_encoder.layers.21.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1886 "text_encoder.layers.21.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1887 "text_encoder.layers.22.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1888 "text_encoder.layers.22.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1889 "text_encoder.layers.22.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1890 "text_encoder.layers.22.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1891 "text_encoder.layers.22.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1892 "text_encoder.layers.22.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1893 "text_encoder.layers.22.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1894 "text_encoder.layers.22.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1895 "text_encoder.layers.22.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1896 "text_encoder.layers.22.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1897 "text_encoder.layers.22.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1898 "text_encoder.layers.22.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1899 "text_encoder.layers.22.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1900 "text_encoder.layers.22.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1901 "text_encoder.layers.22.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1902 "text_encoder.layers.22.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1903 "text_encoder.layers.23.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1904 "text_encoder.layers.23.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1905 "text_encoder.layers.23.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1906 "text_encoder.layers.23.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1907 "text_encoder.layers.23.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1908 "text_encoder.layers.23.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1909 "text_encoder.layers.23.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1910 "text_encoder.layers.23.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1911 "text_encoder.layers.23.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1912 "text_encoder.layers.23.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1913 "text_encoder.layers.23.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1914 "text_encoder.layers.23.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1915 "text_encoder.layers.23.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1916 "text_encoder.layers.23.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1917 "text_encoder.layers.23.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1918 "text_encoder.layers.23.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1919 "text_encoder.layers.3.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1920 "text_encoder.layers.3.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1921 "text_encoder.layers.3.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1922 "text_encoder.layers.3.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1923 "text_encoder.layers.3.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1924 "text_encoder.layers.3.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1925 "text_encoder.layers.3.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1926 "text_encoder.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1927 "text_encoder.layers.3.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1928 "text_encoder.layers.3.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1929 "text_encoder.layers.3.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1930 "text_encoder.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1931 "text_encoder.layers.3.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1932 "text_encoder.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1933 "text_encoder.layers.3.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1934 "text_encoder.layers.3.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1935 "text_encoder.layers.4.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1936 "text_encoder.layers.4.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1937 "text_encoder.layers.4.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1938 "text_encoder.layers.4.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1939 "text_encoder.layers.4.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1940 "text_encoder.layers.4.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1941 "text_encoder.layers.4.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1942 "text_encoder.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1943 "text_encoder.layers.4.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1944 "text_encoder.layers.4.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1945 "text_encoder.layers.4.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1946 "text_encoder.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1947 "text_encoder.layers.4.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1948 "text_encoder.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1949 "text_encoder.layers.4.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1950 "text_encoder.layers.4.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1951 "text_encoder.layers.5.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1952 "text_encoder.layers.5.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1953 "text_encoder.layers.5.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1954 "text_encoder.layers.5.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1955 "text_encoder.layers.5.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1956 "text_encoder.layers.5.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1957 "text_encoder.layers.5.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1958 "text_encoder.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1959 "text_encoder.layers.5.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1960 "text_encoder.layers.5.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1961 "text_encoder.layers.5.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1962 "text_encoder.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1963 "text_encoder.layers.5.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1964 "text_encoder.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1965 "text_encoder.layers.5.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1966 "text_encoder.layers.5.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1967 "text_encoder.layers.6.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1968 "text_encoder.layers.6.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1969 "text_encoder.layers.6.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1970 "text_encoder.layers.6.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1971 "text_encoder.layers.6.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1972 "text_encoder.layers.6.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1973 "text_encoder.layers.6.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1974 "text_encoder.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1975 "text_encoder.layers.6.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1976 "text_encoder.layers.6.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1977 "text_encoder.layers.6.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1978 "text_encoder.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1979 "text_encoder.layers.6.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1980 "text_encoder.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1981 "text_encoder.layers.6.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1982 "text_encoder.layers.6.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1983 "text_encoder.layers.7.ffn.fc1.bias": "model-00001-of-00002.safetensors",
1984 "text_encoder.layers.7.ffn.fc1.weight": "model-00001-of-00002.safetensors",
1985 "text_encoder.layers.7.ffn.fc2.bias": "model-00001-of-00002.safetensors",
1986 "text_encoder.layers.7.ffn.fc2.weight": "model-00001-of-00002.safetensors",
1987 "text_encoder.layers.7.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
1988 "text_encoder.layers.7.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
1989 "text_encoder.layers.7.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
1990 "text_encoder.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
1991 "text_encoder.layers.7.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
1992 "text_encoder.layers.7.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
1993 "text_encoder.layers.7.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
1994 "text_encoder.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
1995 "text_encoder.layers.7.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
1996 "text_encoder.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
1997 "text_encoder.layers.7.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
1998 "text_encoder.layers.7.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
1999 "text_encoder.layers.8.ffn.fc1.bias": "model-00001-of-00002.safetensors",
2000 "text_encoder.layers.8.ffn.fc1.weight": "model-00001-of-00002.safetensors",
2001 "text_encoder.layers.8.ffn.fc2.bias": "model-00001-of-00002.safetensors",
2002 "text_encoder.layers.8.ffn.fc2.weight": "model-00001-of-00002.safetensors",
2003 "text_encoder.layers.8.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
2004 "text_encoder.layers.8.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
2005 "text_encoder.layers.8.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
2006 "text_encoder.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
2007 "text_encoder.layers.8.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
2008 "text_encoder.layers.8.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
2009 "text_encoder.layers.8.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
2010 "text_encoder.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
2011 "text_encoder.layers.8.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
2012 "text_encoder.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
2013 "text_encoder.layers.8.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
2014 "text_encoder.layers.8.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
2015 "text_encoder.layers.9.ffn.fc1.bias": "model-00001-of-00002.safetensors",
2016 "text_encoder.layers.9.ffn.fc1.weight": "model-00001-of-00002.safetensors",
2017 "text_encoder.layers.9.ffn.fc2.bias": "model-00001-of-00002.safetensors",
2018 "text_encoder.layers.9.ffn.fc2.weight": "model-00001-of-00002.safetensors",
2019 "text_encoder.layers.9.ffn_layer_norm.bias": "model-00001-of-00002.safetensors",
2020 "text_encoder.layers.9.ffn_layer_norm.weight": "model-00001-of-00002.safetensors",
2021 "text_encoder.layers.9.self_attn.k_proj.bias": "model-00001-of-00002.safetensors",
2022 "text_encoder.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors",
2023 "text_encoder.layers.9.self_attn.out_proj.bias": "model-00001-of-00002.safetensors",
2024 "text_encoder.layers.9.self_attn.out_proj.weight": "model-00001-of-00002.safetensors",
2025 "text_encoder.layers.9.self_attn.q_proj.bias": "model-00001-of-00002.safetensors",
2026 "text_encoder.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors",
2027 "text_encoder.layers.9.self_attn.v_proj.bias": "model-00001-of-00002.safetensors",
2028 "text_encoder.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors",
2029 "text_encoder.layers.9.self_attn_layer_norm.bias": "model-00001-of-00002.safetensors",
2030 "text_encoder.layers.9.self_attn_layer_norm.weight": "model-00001-of-00002.safetensors",
2031 "vocoder.dur_predictor.conv1.bias": "model-00002-of-00002.safetensors",
2032 "vocoder.dur_predictor.conv1.weight": "model-00002-of-00002.safetensors",
2033 "vocoder.dur_predictor.conv2.bias": "model-00002-of-00002.safetensors",
2034 "vocoder.dur_predictor.conv2.weight": "model-00002-of-00002.safetensors",
2035 "vocoder.dur_predictor.ln1.bias": "model-00002-of-00002.safetensors",
2036 "vocoder.dur_predictor.ln1.weight": "model-00002-of-00002.safetensors",
2037 "vocoder.dur_predictor.ln2.bias": "model-00002-of-00002.safetensors",
2038 "vocoder.dur_predictor.ln2.weight": "model-00002-of-00002.safetensors",
2039 "vocoder.dur_predictor.proj.bias": "model-00002-of-00002.safetensors",
2040 "vocoder.dur_predictor.proj.weight": "model-00002-of-00002.safetensors",
2041 "vocoder.hifi_gan.conv_post.bias": "model-00002-of-00002.safetensors",
2042 "vocoder.hifi_gan.conv_post.weight": "model-00002-of-00002.safetensors",
2043 "vocoder.hifi_gan.conv_pre.bias": "model-00002-of-00002.safetensors",
2044 "vocoder.hifi_gan.conv_pre.weight": "model-00002-of-00002.safetensors",
2045 "vocoder.hifi_gan.resblocks.0.convs1.0.bias": "model-00002-of-00002.safetensors",
2046 "vocoder.hifi_gan.resblocks.0.convs1.0.weight": "model-00002-of-00002.safetensors",
2047 "vocoder.hifi_gan.resblocks.0.convs1.1.bias": "model-00002-of-00002.safetensors",
2048 "vocoder.hifi_gan.resblocks.0.convs1.1.weight": "model-00002-of-00002.safetensors",
2049 "vocoder.hifi_gan.resblocks.0.convs1.2.bias": "model-00002-of-00002.safetensors",
2050 "vocoder.hifi_gan.resblocks.0.convs1.2.weight": "model-00002-of-00002.safetensors",
2051 "vocoder.hifi_gan.resblocks.0.convs2.0.bias": "model-00002-of-00002.safetensors",
2052 "vocoder.hifi_gan.resblocks.0.convs2.0.weight": "model-00002-of-00002.safetensors",
2053 "vocoder.hifi_gan.resblocks.0.convs2.1.bias": "model-00002-of-00002.safetensors",
2054 "vocoder.hifi_gan.resblocks.0.convs2.1.weight": "model-00002-of-00002.safetensors",
2055 "vocoder.hifi_gan.resblocks.0.convs2.2.bias": "model-00002-of-00002.safetensors",
2056 "vocoder.hifi_gan.resblocks.0.convs2.2.weight": "model-00002-of-00002.safetensors",
2057 "vocoder.hifi_gan.resblocks.1.convs1.0.bias": "model-00002-of-00002.safetensors",
2058 "vocoder.hifi_gan.resblocks.1.convs1.0.weight": "model-00002-of-00002.safetensors",
2059 "vocoder.hifi_gan.resblocks.1.convs1.1.bias": "model-00002-of-00002.safetensors",
2060 "vocoder.hifi_gan.resblocks.1.convs1.1.weight": "model-00002-of-00002.safetensors",
2061 "vocoder.hifi_gan.resblocks.1.convs1.2.bias": "model-00002-of-00002.safetensors",
2062 "vocoder.hifi_gan.resblocks.1.convs1.2.weight": "model-00002-of-00002.safetensors",
2063 "vocoder.hifi_gan.resblocks.1.convs2.0.bias": "model-00002-of-00002.safetensors",
2064 "vocoder.hifi_gan.resblocks.1.convs2.0.weight": "model-00002-of-00002.safetensors",
2065 "vocoder.hifi_gan.resblocks.1.convs2.1.bias": "model-00002-of-00002.safetensors",
2066 "vocoder.hifi_gan.resblocks.1.convs2.1.weight": "model-00002-of-00002.safetensors",
2067 "vocoder.hifi_gan.resblocks.1.convs2.2.bias": "model-00002-of-00002.safetensors",
2068 "vocoder.hifi_gan.resblocks.1.convs2.2.weight": "model-00002-of-00002.safetensors",
2069 "vocoder.hifi_gan.resblocks.10.convs1.0.bias": "model-00002-of-00002.safetensors",
2070 "vocoder.hifi_gan.resblocks.10.convs1.0.weight": "model-00002-of-00002.safetensors",
2071 "vocoder.hifi_gan.resblocks.10.convs1.1.bias": "model-00002-of-00002.safetensors",
2072 "vocoder.hifi_gan.resblocks.10.convs1.1.weight": "model-00002-of-00002.safetensors",
2073 "vocoder.hifi_gan.resblocks.10.convs1.2.bias": "model-00002-of-00002.safetensors",
2074 "vocoder.hifi_gan.resblocks.10.convs1.2.weight": "model-00002-of-00002.safetensors",
2075 "vocoder.hifi_gan.resblocks.10.convs2.0.bias": "model-00002-of-00002.safetensors",
2076 "vocoder.hifi_gan.resblocks.10.convs2.0.weight": "model-00002-of-00002.safetensors",
2077 "vocoder.hifi_gan.resblocks.10.convs2.1.bias": "model-00002-of-00002.safetensors",
2078 "vocoder.hifi_gan.resblocks.10.convs2.1.weight": "model-00002-of-00002.safetensors",
2079 "vocoder.hifi_gan.resblocks.10.convs2.2.bias": "model-00002-of-00002.safetensors",
2080 "vocoder.hifi_gan.resblocks.10.convs2.2.weight": "model-00002-of-00002.safetensors",
2081 "vocoder.hifi_gan.resblocks.11.convs1.0.bias": "model-00002-of-00002.safetensors",
2082 "vocoder.hifi_gan.resblocks.11.convs1.0.weight": "model-00002-of-00002.safetensors",
2083 "vocoder.hifi_gan.resblocks.11.convs1.1.bias": "model-00002-of-00002.safetensors",
2084 "vocoder.hifi_gan.resblocks.11.convs1.1.weight": "model-00002-of-00002.safetensors",
2085 "vocoder.hifi_gan.resblocks.11.convs1.2.bias": "model-00002-of-00002.safetensors",
2086 "vocoder.hifi_gan.resblocks.11.convs1.2.weight": "model-00002-of-00002.safetensors",
2087 "vocoder.hifi_gan.resblocks.11.convs2.0.bias": "model-00002-of-00002.safetensors",
2088 "vocoder.hifi_gan.resblocks.11.convs2.0.weight": "model-00002-of-00002.safetensors",
2089 "vocoder.hifi_gan.resblocks.11.convs2.1.bias": "model-00002-of-00002.safetensors",
2090 "vocoder.hifi_gan.resblocks.11.convs2.1.weight": "model-00002-of-00002.safetensors",
2091 "vocoder.hifi_gan.resblocks.11.convs2.2.bias": "model-00002-of-00002.safetensors",
2092 "vocoder.hifi_gan.resblocks.11.convs2.2.weight": "model-00002-of-00002.safetensors",
2093 "vocoder.hifi_gan.resblocks.12.convs1.0.bias": "model-00002-of-00002.safetensors",
2094 "vocoder.hifi_gan.resblocks.12.convs1.0.weight": "model-00002-of-00002.safetensors",
2095 "vocoder.hifi_gan.resblocks.12.convs1.1.bias": "model-00002-of-00002.safetensors",
2096 "vocoder.hifi_gan.resblocks.12.convs1.1.weight": "model-00002-of-00002.safetensors",
2097 "vocoder.hifi_gan.resblocks.12.convs1.2.bias": "model-00002-of-00002.safetensors",
2098 "vocoder.hifi_gan.resblocks.12.convs1.2.weight": "model-00002-of-00002.safetensors",
2099 "vocoder.hifi_gan.resblocks.12.convs2.0.bias": "model-00002-of-00002.safetensors",
2100 "vocoder.hifi_gan.resblocks.12.convs2.0.weight": "model-00002-of-00002.safetensors",
2101 "vocoder.hifi_gan.resblocks.12.convs2.1.bias": "model-00002-of-00002.safetensors",
2102 "vocoder.hifi_gan.resblocks.12.convs2.1.weight": "model-00002-of-00002.safetensors",
2103 "vocoder.hifi_gan.resblocks.12.convs2.2.bias": "model-00002-of-00002.safetensors",
2104 "vocoder.hifi_gan.resblocks.12.convs2.2.weight": "model-00002-of-00002.safetensors",
2105 "vocoder.hifi_gan.resblocks.13.convs1.0.bias": "model-00002-of-00002.safetensors",
2106 "vocoder.hifi_gan.resblocks.13.convs1.0.weight": "model-00002-of-00002.safetensors",
2107 "vocoder.hifi_gan.resblocks.13.convs1.1.bias": "model-00002-of-00002.safetensors",
2108 "vocoder.hifi_gan.resblocks.13.convs1.1.weight": "model-00002-of-00002.safetensors",
2109 "vocoder.hifi_gan.resblocks.13.convs1.2.bias": "model-00002-of-00002.safetensors",
2110 "vocoder.hifi_gan.resblocks.13.convs1.2.weight": "model-00002-of-00002.safetensors",
2111 "vocoder.hifi_gan.resblocks.13.convs2.0.bias": "model-00002-of-00002.safetensors",
2112 "vocoder.hifi_gan.resblocks.13.convs2.0.weight": "model-00002-of-00002.safetensors",
2113 "vocoder.hifi_gan.resblocks.13.convs2.1.bias": "model-00002-of-00002.safetensors",
2114 "vocoder.hifi_gan.resblocks.13.convs2.1.weight": "model-00002-of-00002.safetensors",
2115 "vocoder.hifi_gan.resblocks.13.convs2.2.bias": "model-00002-of-00002.safetensors",
2116 "vocoder.hifi_gan.resblocks.13.convs2.2.weight": "model-00002-of-00002.safetensors",
2117 "vocoder.hifi_gan.resblocks.14.convs1.0.bias": "model-00002-of-00002.safetensors",
2118 "vocoder.hifi_gan.resblocks.14.convs1.0.weight": "model-00002-of-00002.safetensors",
2119 "vocoder.hifi_gan.resblocks.14.convs1.1.bias": "model-00002-of-00002.safetensors",
2120 "vocoder.hifi_gan.resblocks.14.convs1.1.weight": "model-00002-of-00002.safetensors",
2121 "vocoder.hifi_gan.resblocks.14.convs1.2.bias": "model-00002-of-00002.safetensors",
2122 "vocoder.hifi_gan.resblocks.14.convs1.2.weight": "model-00002-of-00002.safetensors",
2123 "vocoder.hifi_gan.resblocks.14.convs2.0.bias": "model-00002-of-00002.safetensors",
2124 "vocoder.hifi_gan.resblocks.14.convs2.0.weight": "model-00002-of-00002.safetensors",
2125 "vocoder.hifi_gan.resblocks.14.convs2.1.bias": "model-00002-of-00002.safetensors",
2126 "vocoder.hifi_gan.resblocks.14.convs2.1.weight": "model-00002-of-00002.safetensors",
2127 "vocoder.hifi_gan.resblocks.14.convs2.2.bias": "model-00002-of-00002.safetensors",
2128 "vocoder.hifi_gan.resblocks.14.convs2.2.weight": "model-00002-of-00002.safetensors",
2129 "vocoder.hifi_gan.resblocks.2.convs1.0.bias": "model-00002-of-00002.safetensors",
2130 "vocoder.hifi_gan.resblocks.2.convs1.0.weight": "model-00002-of-00002.safetensors",
2131 "vocoder.hifi_gan.resblocks.2.convs1.1.bias": "model-00002-of-00002.safetensors",
2132 "vocoder.hifi_gan.resblocks.2.convs1.1.weight": "model-00002-of-00002.safetensors",
2133 "vocoder.hifi_gan.resblocks.2.convs1.2.bias": "model-00002-of-00002.safetensors",
2134 "vocoder.hifi_gan.resblocks.2.convs1.2.weight": "model-00002-of-00002.safetensors",
2135 "vocoder.hifi_gan.resblocks.2.convs2.0.bias": "model-00002-of-00002.safetensors",
2136 "vocoder.hifi_gan.resblocks.2.convs2.0.weight": "model-00002-of-00002.safetensors",
2137 "vocoder.hifi_gan.resblocks.2.convs2.1.bias": "model-00002-of-00002.safetensors",
2138 "vocoder.hifi_gan.resblocks.2.convs2.1.weight": "model-00002-of-00002.safetensors",
2139 "vocoder.hifi_gan.resblocks.2.convs2.2.bias": "model-00002-of-00002.safetensors",
2140 "vocoder.hifi_gan.resblocks.2.convs2.2.weight": "model-00002-of-00002.safetensors",
2141 "vocoder.hifi_gan.resblocks.3.convs1.0.bias": "model-00002-of-00002.safetensors",
2142 "vocoder.hifi_gan.resblocks.3.convs1.0.weight": "model-00002-of-00002.safetensors",
2143 "vocoder.hifi_gan.resblocks.3.convs1.1.bias": "model-00002-of-00002.safetensors",
2144 "vocoder.hifi_gan.resblocks.3.convs1.1.weight": "model-00002-of-00002.safetensors",
2145 "vocoder.hifi_gan.resblocks.3.convs1.2.bias": "model-00002-of-00002.safetensors",
2146 "vocoder.hifi_gan.resblocks.3.convs1.2.weight": "model-00002-of-00002.safetensors",
2147 "vocoder.hifi_gan.resblocks.3.convs2.0.bias": "model-00002-of-00002.safetensors",
2148 "vocoder.hifi_gan.resblocks.3.convs2.0.weight": "model-00002-of-00002.safetensors",
2149 "vocoder.hifi_gan.resblocks.3.convs2.1.bias": "model-00002-of-00002.safetensors",
2150 "vocoder.hifi_gan.resblocks.3.convs2.1.weight": "model-00002-of-00002.safetensors",
2151 "vocoder.hifi_gan.resblocks.3.convs2.2.bias": "model-00002-of-00002.safetensors",
2152 "vocoder.hifi_gan.resblocks.3.convs2.2.weight": "model-00002-of-00002.safetensors",
2153 "vocoder.hifi_gan.resblocks.4.convs1.0.bias": "model-00002-of-00002.safetensors",
2154 "vocoder.hifi_gan.resblocks.4.convs1.0.weight": "model-00002-of-00002.safetensors",
2155 "vocoder.hifi_gan.resblocks.4.convs1.1.bias": "model-00002-of-00002.safetensors",
2156 "vocoder.hifi_gan.resblocks.4.convs1.1.weight": "model-00002-of-00002.safetensors",
2157 "vocoder.hifi_gan.resblocks.4.convs1.2.bias": "model-00002-of-00002.safetensors",
2158 "vocoder.hifi_gan.resblocks.4.convs1.2.weight": "model-00002-of-00002.safetensors",
2159 "vocoder.hifi_gan.resblocks.4.convs2.0.bias": "model-00002-of-00002.safetensors",
2160 "vocoder.hifi_gan.resblocks.4.convs2.0.weight": "model-00002-of-00002.safetensors",
2161 "vocoder.hifi_gan.resblocks.4.convs2.1.bias": "model-00002-of-00002.safetensors",
2162 "vocoder.hifi_gan.resblocks.4.convs2.1.weight": "model-00002-of-00002.safetensors",
2163 "vocoder.hifi_gan.resblocks.4.convs2.2.bias": "model-00002-of-00002.safetensors",
2164 "vocoder.hifi_gan.resblocks.4.convs2.2.weight": "model-00002-of-00002.safetensors",
2165 "vocoder.hifi_gan.resblocks.5.convs1.0.bias": "model-00002-of-00002.safetensors",
2166 "vocoder.hifi_gan.resblocks.5.convs1.0.weight": "model-00002-of-00002.safetensors",
2167 "vocoder.hifi_gan.resblocks.5.convs1.1.bias": "model-00002-of-00002.safetensors",
2168 "vocoder.hifi_gan.resblocks.5.convs1.1.weight": "model-00002-of-00002.safetensors",
2169 "vocoder.hifi_gan.resblocks.5.convs1.2.bias": "model-00002-of-00002.safetensors",
2170 "vocoder.hifi_gan.resblocks.5.convs1.2.weight": "model-00002-of-00002.safetensors",
2171 "vocoder.hifi_gan.resblocks.5.convs2.0.bias": "model-00002-of-00002.safetensors",
2172 "vocoder.hifi_gan.resblocks.5.convs2.0.weight": "model-00002-of-00002.safetensors",
2173 "vocoder.hifi_gan.resblocks.5.convs2.1.bias": "model-00002-of-00002.safetensors",
2174 "vocoder.hifi_gan.resblocks.5.convs2.1.weight": "model-00002-of-00002.safetensors",
2175 "vocoder.hifi_gan.resblocks.5.convs2.2.bias": "model-00002-of-00002.safetensors",
2176 "vocoder.hifi_gan.resblocks.5.convs2.2.weight": "model-00002-of-00002.safetensors",
2177 "vocoder.hifi_gan.resblocks.6.convs1.0.bias": "model-00002-of-00002.safetensors",
2178 "vocoder.hifi_gan.resblocks.6.convs1.0.weight": "model-00002-of-00002.safetensors",
2179 "vocoder.hifi_gan.resblocks.6.convs1.1.bias": "model-00002-of-00002.safetensors",
2180 "vocoder.hifi_gan.resblocks.6.convs1.1.weight": "model-00002-of-00002.safetensors",
2181 "vocoder.hifi_gan.resblocks.6.convs1.2.bias": "model-00002-of-00002.safetensors",
2182 "vocoder.hifi_gan.resblocks.6.convs1.2.weight": "model-00002-of-00002.safetensors",
2183 "vocoder.hifi_gan.resblocks.6.convs2.0.bias": "model-00002-of-00002.safetensors",
2184 "vocoder.hifi_gan.resblocks.6.convs2.0.weight": "model-00002-of-00002.safetensors",
2185 "vocoder.hifi_gan.resblocks.6.convs2.1.bias": "model-00002-of-00002.safetensors",
2186 "vocoder.hifi_gan.resblocks.6.convs2.1.weight": "model-00002-of-00002.safetensors",
2187 "vocoder.hifi_gan.resblocks.6.convs2.2.bias": "model-00002-of-00002.safetensors",
2188 "vocoder.hifi_gan.resblocks.6.convs2.2.weight": "model-00002-of-00002.safetensors",
2189 "vocoder.hifi_gan.resblocks.7.convs1.0.bias": "model-00002-of-00002.safetensors",
2190 "vocoder.hifi_gan.resblocks.7.convs1.0.weight": "model-00002-of-00002.safetensors",
2191 "vocoder.hifi_gan.resblocks.7.convs1.1.bias": "model-00002-of-00002.safetensors",
2192 "vocoder.hifi_gan.resblocks.7.convs1.1.weight": "model-00002-of-00002.safetensors",
2193 "vocoder.hifi_gan.resblocks.7.convs1.2.bias": "model-00002-of-00002.safetensors",
2194 "vocoder.hifi_gan.resblocks.7.convs1.2.weight": "model-00002-of-00002.safetensors",
2195 "vocoder.hifi_gan.resblocks.7.convs2.0.bias": "model-00002-of-00002.safetensors",
2196 "vocoder.hifi_gan.resblocks.7.convs2.0.weight": "model-00002-of-00002.safetensors",
2197 "vocoder.hifi_gan.resblocks.7.convs2.1.bias": "model-00002-of-00002.safetensors",
2198 "vocoder.hifi_gan.resblocks.7.convs2.1.weight": "model-00002-of-00002.safetensors",
2199 "vocoder.hifi_gan.resblocks.7.convs2.2.bias": "model-00002-of-00002.safetensors",
2200 "vocoder.hifi_gan.resblocks.7.convs2.2.weight": "model-00002-of-00002.safetensors",
2201 "vocoder.hifi_gan.resblocks.8.convs1.0.bias": "model-00002-of-00002.safetensors",
2202 "vocoder.hifi_gan.resblocks.8.convs1.0.weight": "model-00002-of-00002.safetensors",
2203 "vocoder.hifi_gan.resblocks.8.convs1.1.bias": "model-00002-of-00002.safetensors",
2204 "vocoder.hifi_gan.resblocks.8.convs1.1.weight": "model-00002-of-00002.safetensors",
2205 "vocoder.hifi_gan.resblocks.8.convs1.2.bias": "model-00002-of-00002.safetensors",
2206 "vocoder.hifi_gan.resblocks.8.convs1.2.weight": "model-00002-of-00002.safetensors",
2207 "vocoder.hifi_gan.resblocks.8.convs2.0.bias": "model-00002-of-00002.safetensors",
2208 "vocoder.hifi_gan.resblocks.8.convs2.0.weight": "model-00002-of-00002.safetensors",
2209 "vocoder.hifi_gan.resblocks.8.convs2.1.bias": "model-00002-of-00002.safetensors",
2210 "vocoder.hifi_gan.resblocks.8.convs2.1.weight": "model-00002-of-00002.safetensors",
2211 "vocoder.hifi_gan.resblocks.8.convs2.2.bias": "model-00002-of-00002.safetensors",
2212 "vocoder.hifi_gan.resblocks.8.convs2.2.weight": "model-00002-of-00002.safetensors",
2213 "vocoder.hifi_gan.resblocks.9.convs1.0.bias": "model-00002-of-00002.safetensors",
2214 "vocoder.hifi_gan.resblocks.9.convs1.0.weight": "model-00002-of-00002.safetensors",
2215 "vocoder.hifi_gan.resblocks.9.convs1.1.bias": "model-00002-of-00002.safetensors",
2216 "vocoder.hifi_gan.resblocks.9.convs1.1.weight": "model-00002-of-00002.safetensors",
2217 "vocoder.hifi_gan.resblocks.9.convs1.2.bias": "model-00002-of-00002.safetensors",
2218 "vocoder.hifi_gan.resblocks.9.convs1.2.weight": "model-00002-of-00002.safetensors",
2219 "vocoder.hifi_gan.resblocks.9.convs2.0.bias": "model-00002-of-00002.safetensors",
2220 "vocoder.hifi_gan.resblocks.9.convs2.0.weight": "model-00002-of-00002.safetensors",
2221 "vocoder.hifi_gan.resblocks.9.convs2.1.bias": "model-00002-of-00002.safetensors",
2222 "vocoder.hifi_gan.resblocks.9.convs2.1.weight": "model-00002-of-00002.safetensors",
2223 "vocoder.hifi_gan.resblocks.9.convs2.2.bias": "model-00002-of-00002.safetensors",
2224 "vocoder.hifi_gan.resblocks.9.convs2.2.weight": "model-00002-of-00002.safetensors",
2225 "vocoder.hifi_gan.upsampler.0.bias": "model-00002-of-00002.safetensors",
2226 "vocoder.hifi_gan.upsampler.0.weight": "model-00002-of-00002.safetensors",
2227 "vocoder.hifi_gan.upsampler.1.bias": "model-00002-of-00002.safetensors",
2228 "vocoder.hifi_gan.upsampler.1.weight": "model-00002-of-00002.safetensors",
2229 "vocoder.hifi_gan.upsampler.2.bias": "model-00002-of-00002.safetensors",
2230 "vocoder.hifi_gan.upsampler.2.weight": "model-00002-of-00002.safetensors",
2231 "vocoder.hifi_gan.upsampler.3.bias": "model-00002-of-00002.safetensors",
2232 "vocoder.hifi_gan.upsampler.3.weight": "model-00002-of-00002.safetensors",
2233 "vocoder.hifi_gan.upsampler.4.bias": "model-00002-of-00002.safetensors",
2234 "vocoder.hifi_gan.upsampler.4.weight": "model-00002-of-00002.safetensors",
2235 "vocoder.language_embedding.weight": "model-00002-of-00002.safetensors",
2236 "vocoder.speaker_embedding.weight": "model-00002-of-00002.safetensors",
2237 "vocoder.unit_embedding.weight": "model-00002-of-00002.safetensors"
2238 }
2239 }
2240