text_encoder/model.safetensors.index.json
21.9 KB · 250 lines · json Raw
1 {
2 "metadata": {
3 "total_size": 22723641344
4 },
5 "weight_map": {
6 "encoder.block.0.layer.0.SelfAttention.k.weight": "model-00001-of-00005.safetensors",
7 "encoder.block.0.layer.0.SelfAttention.o.weight": "model-00001-of-00005.safetensors",
8 "encoder.block.0.layer.0.SelfAttention.q.weight": "model-00001-of-00005.safetensors",
9 "encoder.block.0.layer.0.SelfAttention.relative_attention_bias.weight": "model-00001-of-00005.safetensors",
10 "encoder.block.0.layer.0.SelfAttention.v.weight": "model-00001-of-00005.safetensors",
11 "encoder.block.0.layer.0.layer_norm.weight": "model-00001-of-00005.safetensors",
12 "encoder.block.0.layer.1.DenseReluDense.wi_0.weight": "model-00001-of-00005.safetensors",
13 "encoder.block.0.layer.1.DenseReluDense.wi_1.weight": "model-00001-of-00005.safetensors",
14 "encoder.block.0.layer.1.DenseReluDense.wo.weight": "model-00001-of-00005.safetensors",
15 "encoder.block.0.layer.1.layer_norm.weight": "model-00001-of-00005.safetensors",
16 "encoder.block.1.layer.0.SelfAttention.k.weight": "model-00002-of-00005.safetensors",
17 "encoder.block.1.layer.0.SelfAttention.o.weight": "model-00002-of-00005.safetensors",
18 "encoder.block.1.layer.0.SelfAttention.q.weight": "model-00002-of-00005.safetensors",
19 "encoder.block.1.layer.0.SelfAttention.relative_attention_bias.weight": "model-00002-of-00005.safetensors",
20 "encoder.block.1.layer.0.SelfAttention.v.weight": "model-00002-of-00005.safetensors",
21 "encoder.block.1.layer.0.layer_norm.weight": "model-00002-of-00005.safetensors",
22 "encoder.block.1.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00005.safetensors",
23 "encoder.block.1.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00005.safetensors",
24 "encoder.block.1.layer.1.DenseReluDense.wo.weight": "model-00002-of-00005.safetensors",
25 "encoder.block.1.layer.1.layer_norm.weight": "model-00002-of-00005.safetensors",
26 "encoder.block.10.layer.0.SelfAttention.k.weight": "model-00003-of-00005.safetensors",
27 "encoder.block.10.layer.0.SelfAttention.o.weight": "model-00003-of-00005.safetensors",
28 "encoder.block.10.layer.0.SelfAttention.q.weight": "model-00003-of-00005.safetensors",
29 "encoder.block.10.layer.0.SelfAttention.relative_attention_bias.weight": "model-00003-of-00005.safetensors",
30 "encoder.block.10.layer.0.SelfAttention.v.weight": "model-00003-of-00005.safetensors",
31 "encoder.block.10.layer.0.layer_norm.weight": "model-00003-of-00005.safetensors",
32 "encoder.block.10.layer.1.DenseReluDense.wi_0.weight": "model-00003-of-00005.safetensors",
33 "encoder.block.10.layer.1.DenseReluDense.wi_1.weight": "model-00003-of-00005.safetensors",
34 "encoder.block.10.layer.1.DenseReluDense.wo.weight": "model-00003-of-00005.safetensors",
35 "encoder.block.10.layer.1.layer_norm.weight": "model-00003-of-00005.safetensors",
36 "encoder.block.11.layer.0.SelfAttention.k.weight": "model-00003-of-00005.safetensors",
37 "encoder.block.11.layer.0.SelfAttention.o.weight": "model-00003-of-00005.safetensors",
38 "encoder.block.11.layer.0.SelfAttention.q.weight": "model-00003-of-00005.safetensors",
39 "encoder.block.11.layer.0.SelfAttention.relative_attention_bias.weight": "model-00003-of-00005.safetensors",
40 "encoder.block.11.layer.0.SelfAttention.v.weight": "model-00003-of-00005.safetensors",
41 "encoder.block.11.layer.0.layer_norm.weight": "model-00003-of-00005.safetensors",
42 "encoder.block.11.layer.1.DenseReluDense.wi_0.weight": "model-00003-of-00005.safetensors",
43 "encoder.block.11.layer.1.DenseReluDense.wi_1.weight": "model-00003-of-00005.safetensors",
44 "encoder.block.11.layer.1.DenseReluDense.wo.weight": "model-00003-of-00005.safetensors",
45 "encoder.block.11.layer.1.layer_norm.weight": "model-00003-of-00005.safetensors",
46 "encoder.block.12.layer.0.SelfAttention.k.weight": "model-00003-of-00005.safetensors",
47 "encoder.block.12.layer.0.SelfAttention.o.weight": "model-00003-of-00005.safetensors",
48 "encoder.block.12.layer.0.SelfAttention.q.weight": "model-00003-of-00005.safetensors",
49 "encoder.block.12.layer.0.SelfAttention.relative_attention_bias.weight": "model-00003-of-00005.safetensors",
50 "encoder.block.12.layer.0.SelfAttention.v.weight": "model-00003-of-00005.safetensors",
51 "encoder.block.12.layer.0.layer_norm.weight": "model-00003-of-00005.safetensors",
52 "encoder.block.12.layer.1.DenseReluDense.wi_0.weight": "model-00003-of-00005.safetensors",
53 "encoder.block.12.layer.1.DenseReluDense.wi_1.weight": "model-00003-of-00005.safetensors",
54 "encoder.block.12.layer.1.DenseReluDense.wo.weight": "model-00003-of-00005.safetensors",
55 "encoder.block.12.layer.1.layer_norm.weight": "model-00003-of-00005.safetensors",
56 "encoder.block.13.layer.0.SelfAttention.k.weight": "model-00003-of-00005.safetensors",
57 "encoder.block.13.layer.0.SelfAttention.o.weight": "model-00003-of-00005.safetensors",
58 "encoder.block.13.layer.0.SelfAttention.q.weight": "model-00003-of-00005.safetensors",
59 "encoder.block.13.layer.0.SelfAttention.relative_attention_bias.weight": "model-00003-of-00005.safetensors",
60 "encoder.block.13.layer.0.SelfAttention.v.weight": "model-00003-of-00005.safetensors",
61 "encoder.block.13.layer.0.layer_norm.weight": "model-00003-of-00005.safetensors",
62 "encoder.block.13.layer.1.DenseReluDense.wi_0.weight": "model-00003-of-00005.safetensors",
63 "encoder.block.13.layer.1.DenseReluDense.wi_1.weight": "model-00003-of-00005.safetensors",
64 "encoder.block.13.layer.1.DenseReluDense.wo.weight": "model-00004-of-00005.safetensors",
65 "encoder.block.13.layer.1.layer_norm.weight": "model-00004-of-00005.safetensors",
66 "encoder.block.14.layer.0.SelfAttention.k.weight": "model-00004-of-00005.safetensors",
67 "encoder.block.14.layer.0.SelfAttention.o.weight": "model-00004-of-00005.safetensors",
68 "encoder.block.14.layer.0.SelfAttention.q.weight": "model-00004-of-00005.safetensors",
69 "encoder.block.14.layer.0.SelfAttention.relative_attention_bias.weight": "model-00004-of-00005.safetensors",
70 "encoder.block.14.layer.0.SelfAttention.v.weight": "model-00004-of-00005.safetensors",
71 "encoder.block.14.layer.0.layer_norm.weight": "model-00004-of-00005.safetensors",
72 "encoder.block.14.layer.1.DenseReluDense.wi_0.weight": "model-00004-of-00005.safetensors",
73 "encoder.block.14.layer.1.DenseReluDense.wi_1.weight": "model-00004-of-00005.safetensors",
74 "encoder.block.14.layer.1.DenseReluDense.wo.weight": "model-00004-of-00005.safetensors",
75 "encoder.block.14.layer.1.layer_norm.weight": "model-00004-of-00005.safetensors",
76 "encoder.block.15.layer.0.SelfAttention.k.weight": "model-00004-of-00005.safetensors",
77 "encoder.block.15.layer.0.SelfAttention.o.weight": "model-00004-of-00005.safetensors",
78 "encoder.block.15.layer.0.SelfAttention.q.weight": "model-00004-of-00005.safetensors",
79 "encoder.block.15.layer.0.SelfAttention.relative_attention_bias.weight": "model-00004-of-00005.safetensors",
80 "encoder.block.15.layer.0.SelfAttention.v.weight": "model-00004-of-00005.safetensors",
81 "encoder.block.15.layer.0.layer_norm.weight": "model-00004-of-00005.safetensors",
82 "encoder.block.15.layer.1.DenseReluDense.wi_0.weight": "model-00004-of-00005.safetensors",
83 "encoder.block.15.layer.1.DenseReluDense.wi_1.weight": "model-00004-of-00005.safetensors",
84 "encoder.block.15.layer.1.DenseReluDense.wo.weight": "model-00004-of-00005.safetensors",
85 "encoder.block.15.layer.1.layer_norm.weight": "model-00004-of-00005.safetensors",
86 "encoder.block.16.layer.0.SelfAttention.k.weight": "model-00004-of-00005.safetensors",
87 "encoder.block.16.layer.0.SelfAttention.o.weight": "model-00004-of-00005.safetensors",
88 "encoder.block.16.layer.0.SelfAttention.q.weight": "model-00004-of-00005.safetensors",
89 "encoder.block.16.layer.0.SelfAttention.relative_attention_bias.weight": "model-00004-of-00005.safetensors",
90 "encoder.block.16.layer.0.SelfAttention.v.weight": "model-00004-of-00005.safetensors",
91 "encoder.block.16.layer.0.layer_norm.weight": "model-00004-of-00005.safetensors",
92 "encoder.block.16.layer.1.DenseReluDense.wi_0.weight": "model-00004-of-00005.safetensors",
93 "encoder.block.16.layer.1.DenseReluDense.wi_1.weight": "model-00004-of-00005.safetensors",
94 "encoder.block.16.layer.1.DenseReluDense.wo.weight": "model-00004-of-00005.safetensors",
95 "encoder.block.16.layer.1.layer_norm.weight": "model-00004-of-00005.safetensors",
96 "encoder.block.17.layer.0.SelfAttention.k.weight": "model-00004-of-00005.safetensors",
97 "encoder.block.17.layer.0.SelfAttention.o.weight": "model-00004-of-00005.safetensors",
98 "encoder.block.17.layer.0.SelfAttention.q.weight": "model-00004-of-00005.safetensors",
99 "encoder.block.17.layer.0.SelfAttention.relative_attention_bias.weight": "model-00004-of-00005.safetensors",
100 "encoder.block.17.layer.0.SelfAttention.v.weight": "model-00004-of-00005.safetensors",
101 "encoder.block.17.layer.0.layer_norm.weight": "model-00004-of-00005.safetensors",
102 "encoder.block.17.layer.1.DenseReluDense.wi_0.weight": "model-00004-of-00005.safetensors",
103 "encoder.block.17.layer.1.DenseReluDense.wi_1.weight": "model-00004-of-00005.safetensors",
104 "encoder.block.17.layer.1.DenseReluDense.wo.weight": "model-00004-of-00005.safetensors",
105 "encoder.block.17.layer.1.layer_norm.weight": "model-00004-of-00005.safetensors",
106 "encoder.block.18.layer.0.SelfAttention.k.weight": "model-00004-of-00005.safetensors",
107 "encoder.block.18.layer.0.SelfAttention.o.weight": "model-00004-of-00005.safetensors",
108 "encoder.block.18.layer.0.SelfAttention.q.weight": "model-00004-of-00005.safetensors",
109 "encoder.block.18.layer.0.SelfAttention.relative_attention_bias.weight": "model-00004-of-00005.safetensors",
110 "encoder.block.18.layer.0.SelfAttention.v.weight": "model-00004-of-00005.safetensors",
111 "encoder.block.18.layer.0.layer_norm.weight": "model-00004-of-00005.safetensors",
112 "encoder.block.18.layer.1.DenseReluDense.wi_0.weight": "model-00004-of-00005.safetensors",
113 "encoder.block.18.layer.1.DenseReluDense.wi_1.weight": "model-00004-of-00005.safetensors",
114 "encoder.block.18.layer.1.DenseReluDense.wo.weight": "model-00004-of-00005.safetensors",
115 "encoder.block.18.layer.1.layer_norm.weight": "model-00004-of-00005.safetensors",
116 "encoder.block.19.layer.0.SelfAttention.k.weight": "model-00004-of-00005.safetensors",
117 "encoder.block.19.layer.0.SelfAttention.o.weight": "model-00004-of-00005.safetensors",
118 "encoder.block.19.layer.0.SelfAttention.q.weight": "model-00004-of-00005.safetensors",
119 "encoder.block.19.layer.0.SelfAttention.relative_attention_bias.weight": "model-00004-of-00005.safetensors",
120 "encoder.block.19.layer.0.SelfAttention.v.weight": "model-00004-of-00005.safetensors",
121 "encoder.block.19.layer.0.layer_norm.weight": "model-00004-of-00005.safetensors",
122 "encoder.block.19.layer.1.DenseReluDense.wi_0.weight": "model-00004-of-00005.safetensors",
123 "encoder.block.19.layer.1.DenseReluDense.wi_1.weight": "model-00004-of-00005.safetensors",
124 "encoder.block.19.layer.1.DenseReluDense.wo.weight": "model-00004-of-00005.safetensors",
125 "encoder.block.19.layer.1.layer_norm.weight": "model-00004-of-00005.safetensors",
126 "encoder.block.2.layer.0.SelfAttention.k.weight": "model-00002-of-00005.safetensors",
127 "encoder.block.2.layer.0.SelfAttention.o.weight": "model-00002-of-00005.safetensors",
128 "encoder.block.2.layer.0.SelfAttention.q.weight": "model-00002-of-00005.safetensors",
129 "encoder.block.2.layer.0.SelfAttention.relative_attention_bias.weight": "model-00002-of-00005.safetensors",
130 "encoder.block.2.layer.0.SelfAttention.v.weight": "model-00002-of-00005.safetensors",
131 "encoder.block.2.layer.0.layer_norm.weight": "model-00002-of-00005.safetensors",
132 "encoder.block.2.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00005.safetensors",
133 "encoder.block.2.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00005.safetensors",
134 "encoder.block.2.layer.1.DenseReluDense.wo.weight": "model-00002-of-00005.safetensors",
135 "encoder.block.2.layer.1.layer_norm.weight": "model-00002-of-00005.safetensors",
136 "encoder.block.20.layer.0.SelfAttention.k.weight": "model-00004-of-00005.safetensors",
137 "encoder.block.20.layer.0.SelfAttention.o.weight": "model-00005-of-00005.safetensors",
138 "encoder.block.20.layer.0.SelfAttention.q.weight": "model-00004-of-00005.safetensors",
139 "encoder.block.20.layer.0.SelfAttention.relative_attention_bias.weight": "model-00005-of-00005.safetensors",
140 "encoder.block.20.layer.0.SelfAttention.v.weight": "model-00004-of-00005.safetensors",
141 "encoder.block.20.layer.0.layer_norm.weight": "model-00005-of-00005.safetensors",
142 "encoder.block.20.layer.1.DenseReluDense.wi_0.weight": "model-00005-of-00005.safetensors",
143 "encoder.block.20.layer.1.DenseReluDense.wi_1.weight": "model-00005-of-00005.safetensors",
144 "encoder.block.20.layer.1.DenseReluDense.wo.weight": "model-00005-of-00005.safetensors",
145 "encoder.block.20.layer.1.layer_norm.weight": "model-00005-of-00005.safetensors",
146 "encoder.block.21.layer.0.SelfAttention.k.weight": "model-00005-of-00005.safetensors",
147 "encoder.block.21.layer.0.SelfAttention.o.weight": "model-00005-of-00005.safetensors",
148 "encoder.block.21.layer.0.SelfAttention.q.weight": "model-00005-of-00005.safetensors",
149 "encoder.block.21.layer.0.SelfAttention.relative_attention_bias.weight": "model-00005-of-00005.safetensors",
150 "encoder.block.21.layer.0.SelfAttention.v.weight": "model-00005-of-00005.safetensors",
151 "encoder.block.21.layer.0.layer_norm.weight": "model-00005-of-00005.safetensors",
152 "encoder.block.21.layer.1.DenseReluDense.wi_0.weight": "model-00005-of-00005.safetensors",
153 "encoder.block.21.layer.1.DenseReluDense.wi_1.weight": "model-00005-of-00005.safetensors",
154 "encoder.block.21.layer.1.DenseReluDense.wo.weight": "model-00005-of-00005.safetensors",
155 "encoder.block.21.layer.1.layer_norm.weight": "model-00005-of-00005.safetensors",
156 "encoder.block.22.layer.0.SelfAttention.k.weight": "model-00005-of-00005.safetensors",
157 "encoder.block.22.layer.0.SelfAttention.o.weight": "model-00005-of-00005.safetensors",
158 "encoder.block.22.layer.0.SelfAttention.q.weight": "model-00005-of-00005.safetensors",
159 "encoder.block.22.layer.0.SelfAttention.relative_attention_bias.weight": "model-00005-of-00005.safetensors",
160 "encoder.block.22.layer.0.SelfAttention.v.weight": "model-00005-of-00005.safetensors",
161 "encoder.block.22.layer.0.layer_norm.weight": "model-00005-of-00005.safetensors",
162 "encoder.block.22.layer.1.DenseReluDense.wi_0.weight": "model-00005-of-00005.safetensors",
163 "encoder.block.22.layer.1.DenseReluDense.wi_1.weight": "model-00005-of-00005.safetensors",
164 "encoder.block.22.layer.1.DenseReluDense.wo.weight": "model-00005-of-00005.safetensors",
165 "encoder.block.22.layer.1.layer_norm.weight": "model-00005-of-00005.safetensors",
166 "encoder.block.23.layer.0.SelfAttention.k.weight": "model-00005-of-00005.safetensors",
167 "encoder.block.23.layer.0.SelfAttention.o.weight": "model-00005-of-00005.safetensors",
168 "encoder.block.23.layer.0.SelfAttention.q.weight": "model-00005-of-00005.safetensors",
169 "encoder.block.23.layer.0.SelfAttention.relative_attention_bias.weight": "model-00005-of-00005.safetensors",
170 "encoder.block.23.layer.0.SelfAttention.v.weight": "model-00005-of-00005.safetensors",
171 "encoder.block.23.layer.0.layer_norm.weight": "model-00005-of-00005.safetensors",
172 "encoder.block.23.layer.1.DenseReluDense.wi_0.weight": "model-00005-of-00005.safetensors",
173 "encoder.block.23.layer.1.DenseReluDense.wi_1.weight": "model-00005-of-00005.safetensors",
174 "encoder.block.23.layer.1.DenseReluDense.wo.weight": "model-00005-of-00005.safetensors",
175 "encoder.block.23.layer.1.layer_norm.weight": "model-00005-of-00005.safetensors",
176 "encoder.block.3.layer.0.SelfAttention.k.weight": "model-00002-of-00005.safetensors",
177 "encoder.block.3.layer.0.SelfAttention.o.weight": "model-00002-of-00005.safetensors",
178 "encoder.block.3.layer.0.SelfAttention.q.weight": "model-00002-of-00005.safetensors",
179 "encoder.block.3.layer.0.SelfAttention.relative_attention_bias.weight": "model-00002-of-00005.safetensors",
180 "encoder.block.3.layer.0.SelfAttention.v.weight": "model-00002-of-00005.safetensors",
181 "encoder.block.3.layer.0.layer_norm.weight": "model-00002-of-00005.safetensors",
182 "encoder.block.3.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00005.safetensors",
183 "encoder.block.3.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00005.safetensors",
184 "encoder.block.3.layer.1.DenseReluDense.wo.weight": "model-00002-of-00005.safetensors",
185 "encoder.block.3.layer.1.layer_norm.weight": "model-00002-of-00005.safetensors",
186 "encoder.block.4.layer.0.SelfAttention.k.weight": "model-00002-of-00005.safetensors",
187 "encoder.block.4.layer.0.SelfAttention.o.weight": "model-00002-of-00005.safetensors",
188 "encoder.block.4.layer.0.SelfAttention.q.weight": "model-00002-of-00005.safetensors",
189 "encoder.block.4.layer.0.SelfAttention.relative_attention_bias.weight": "model-00002-of-00005.safetensors",
190 "encoder.block.4.layer.0.SelfAttention.v.weight": "model-00002-of-00005.safetensors",
191 "encoder.block.4.layer.0.layer_norm.weight": "model-00002-of-00005.safetensors",
192 "encoder.block.4.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00005.safetensors",
193 "encoder.block.4.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00005.safetensors",
194 "encoder.block.4.layer.1.DenseReluDense.wo.weight": "model-00002-of-00005.safetensors",
195 "encoder.block.4.layer.1.layer_norm.weight": "model-00002-of-00005.safetensors",
196 "encoder.block.5.layer.0.SelfAttention.k.weight": "model-00002-of-00005.safetensors",
197 "encoder.block.5.layer.0.SelfAttention.o.weight": "model-00002-of-00005.safetensors",
198 "encoder.block.5.layer.0.SelfAttention.q.weight": "model-00002-of-00005.safetensors",
199 "encoder.block.5.layer.0.SelfAttention.relative_attention_bias.weight": "model-00002-of-00005.safetensors",
200 "encoder.block.5.layer.0.SelfAttention.v.weight": "model-00002-of-00005.safetensors",
201 "encoder.block.5.layer.0.layer_norm.weight": "model-00002-of-00005.safetensors",
202 "encoder.block.5.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00005.safetensors",
203 "encoder.block.5.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00005.safetensors",
204 "encoder.block.5.layer.1.DenseReluDense.wo.weight": "model-00002-of-00005.safetensors",
205 "encoder.block.5.layer.1.layer_norm.weight": "model-00002-of-00005.safetensors",
206 "encoder.block.6.layer.0.SelfAttention.k.weight": "model-00002-of-00005.safetensors",
207 "encoder.block.6.layer.0.SelfAttention.o.weight": "model-00002-of-00005.safetensors",
208 "encoder.block.6.layer.0.SelfAttention.q.weight": "model-00002-of-00005.safetensors",
209 "encoder.block.6.layer.0.SelfAttention.relative_attention_bias.weight": "model-00002-of-00005.safetensors",
210 "encoder.block.6.layer.0.SelfAttention.v.weight": "model-00002-of-00005.safetensors",
211 "encoder.block.6.layer.0.layer_norm.weight": "model-00002-of-00005.safetensors",
212 "encoder.block.6.layer.1.DenseReluDense.wi_0.weight": "model-00002-of-00005.safetensors",
213 "encoder.block.6.layer.1.DenseReluDense.wi_1.weight": "model-00002-of-00005.safetensors",
214 "encoder.block.6.layer.1.DenseReluDense.wo.weight": "model-00002-of-00005.safetensors",
215 "encoder.block.6.layer.1.layer_norm.weight": "model-00002-of-00005.safetensors",
216 "encoder.block.7.layer.0.SelfAttention.k.weight": "model-00002-of-00005.safetensors",
217 "encoder.block.7.layer.0.SelfAttention.o.weight": "model-00002-of-00005.safetensors",
218 "encoder.block.7.layer.0.SelfAttention.q.weight": "model-00002-of-00005.safetensors",
219 "encoder.block.7.layer.0.SelfAttention.relative_attention_bias.weight": "model-00002-of-00005.safetensors",
220 "encoder.block.7.layer.0.SelfAttention.v.weight": "model-00002-of-00005.safetensors",
221 "encoder.block.7.layer.0.layer_norm.weight": "model-00002-of-00005.safetensors",
222 "encoder.block.7.layer.1.DenseReluDense.wi_0.weight": "model-00003-of-00005.safetensors",
223 "encoder.block.7.layer.1.DenseReluDense.wi_1.weight": "model-00003-of-00005.safetensors",
224 "encoder.block.7.layer.1.DenseReluDense.wo.weight": "model-00003-of-00005.safetensors",
225 "encoder.block.7.layer.1.layer_norm.weight": "model-00003-of-00005.safetensors",
226 "encoder.block.8.layer.0.SelfAttention.k.weight": "model-00003-of-00005.safetensors",
227 "encoder.block.8.layer.0.SelfAttention.o.weight": "model-00003-of-00005.safetensors",
228 "encoder.block.8.layer.0.SelfAttention.q.weight": "model-00003-of-00005.safetensors",
229 "encoder.block.8.layer.0.SelfAttention.relative_attention_bias.weight": "model-00003-of-00005.safetensors",
230 "encoder.block.8.layer.0.SelfAttention.v.weight": "model-00003-of-00005.safetensors",
231 "encoder.block.8.layer.0.layer_norm.weight": "model-00003-of-00005.safetensors",
232 "encoder.block.8.layer.1.DenseReluDense.wi_0.weight": "model-00003-of-00005.safetensors",
233 "encoder.block.8.layer.1.DenseReluDense.wi_1.weight": "model-00003-of-00005.safetensors",
234 "encoder.block.8.layer.1.DenseReluDense.wo.weight": "model-00003-of-00005.safetensors",
235 "encoder.block.8.layer.1.layer_norm.weight": "model-00003-of-00005.safetensors",
236 "encoder.block.9.layer.0.SelfAttention.k.weight": "model-00003-of-00005.safetensors",
237 "encoder.block.9.layer.0.SelfAttention.o.weight": "model-00003-of-00005.safetensors",
238 "encoder.block.9.layer.0.SelfAttention.q.weight": "model-00003-of-00005.safetensors",
239 "encoder.block.9.layer.0.SelfAttention.relative_attention_bias.weight": "model-00003-of-00005.safetensors",
240 "encoder.block.9.layer.0.SelfAttention.v.weight": "model-00003-of-00005.safetensors",
241 "encoder.block.9.layer.0.layer_norm.weight": "model-00003-of-00005.safetensors",
242 "encoder.block.9.layer.1.DenseReluDense.wi_0.weight": "model-00003-of-00005.safetensors",
243 "encoder.block.9.layer.1.DenseReluDense.wi_1.weight": "model-00003-of-00005.safetensors",
244 "encoder.block.9.layer.1.DenseReluDense.wo.weight": "model-00003-of-00005.safetensors",
245 "encoder.block.9.layer.1.layer_norm.weight": "model-00003-of-00005.safetensors",
246 "encoder.final_layer_norm.weight": "model-00005-of-00005.safetensors",
247 "shared.weight": "model-00001-of-00005.safetensors"
248 }
249 }
250