transformer/diffusion_pytorch_model.safetensors.index.json
368.9 KB · 3518 lines · json Raw
1 {
2 "metadata": {
3 "total_size": 37758861824
4 },
5 "weight_map": {
6 "audio_caption_projection.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
7 "audio_caption_projection.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
8 "audio_caption_projection.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
9 "audio_caption_projection.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
10 "audio_proj_in.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
11 "audio_proj_in.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
12 "audio_proj_out.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
13 "audio_proj_out.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
14 "audio_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
15 "audio_time_embed.emb.timestep_embedder.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
16 "audio_time_embed.emb.timestep_embedder.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
17 "audio_time_embed.emb.timestep_embedder.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
18 "audio_time_embed.emb.timestep_embedder.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
19 "audio_time_embed.linear.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
20 "audio_time_embed.linear.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
21 "av_cross_attn_audio_scale_shift.emb.timestep_embedder.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
22 "av_cross_attn_audio_scale_shift.emb.timestep_embedder.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
23 "av_cross_attn_audio_scale_shift.emb.timestep_embedder.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
24 "av_cross_attn_audio_scale_shift.emb.timestep_embedder.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
25 "av_cross_attn_audio_scale_shift.linear.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
26 "av_cross_attn_audio_scale_shift.linear.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
27 "av_cross_attn_audio_v2a_gate.emb.timestep_embedder.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
28 "av_cross_attn_audio_v2a_gate.emb.timestep_embedder.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
29 "av_cross_attn_audio_v2a_gate.emb.timestep_embedder.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
30 "av_cross_attn_audio_v2a_gate.emb.timestep_embedder.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
31 "av_cross_attn_audio_v2a_gate.linear.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
32 "av_cross_attn_audio_v2a_gate.linear.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
33 "av_cross_attn_video_a2v_gate.emb.timestep_embedder.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
34 "av_cross_attn_video_a2v_gate.emb.timestep_embedder.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
35 "av_cross_attn_video_a2v_gate.emb.timestep_embedder.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
36 "av_cross_attn_video_a2v_gate.emb.timestep_embedder.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
37 "av_cross_attn_video_a2v_gate.linear.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
38 "av_cross_attn_video_a2v_gate.linear.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
39 "av_cross_attn_video_scale_shift.emb.timestep_embedder.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
40 "av_cross_attn_video_scale_shift.emb.timestep_embedder.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
41 "av_cross_attn_video_scale_shift.emb.timestep_embedder.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
42 "av_cross_attn_video_scale_shift.emb.timestep_embedder.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
43 "av_cross_attn_video_scale_shift.linear.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
44 "av_cross_attn_video_scale_shift.linear.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
45 "caption_projection.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
46 "caption_projection.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
47 "caption_projection.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
48 "caption_projection.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
49 "proj_in.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
50 "proj_in.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
51 "proj_out.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
52 "proj_out.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
53 "scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
54 "time_embed.emb.timestep_embedder.linear_1.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
55 "time_embed.emb.timestep_embedder.linear_1.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
56 "time_embed.emb.timestep_embedder.linear_2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
57 "time_embed.emb.timestep_embedder.linear_2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
58 "time_embed.linear.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
59 "time_embed.linear.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
60 "transformer_blocks.0.attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
61 "transformer_blocks.0.attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
62 "transformer_blocks.0.attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
63 "transformer_blocks.0.attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
64 "transformer_blocks.0.attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
65 "transformer_blocks.0.attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
66 "transformer_blocks.0.attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
67 "transformer_blocks.0.attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
68 "transformer_blocks.0.attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
69 "transformer_blocks.0.attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
70 "transformer_blocks.0.attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
71 "transformer_blocks.0.attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
72 "transformer_blocks.0.attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
73 "transformer_blocks.0.attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
74 "transformer_blocks.0.attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
75 "transformer_blocks.0.attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
76 "transformer_blocks.0.attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
77 "transformer_blocks.0.attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
78 "transformer_blocks.0.attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
79 "transformer_blocks.0.attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
80 "transformer_blocks.0.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
81 "transformer_blocks.0.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
82 "transformer_blocks.0.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
83 "transformer_blocks.0.audio_attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
84 "transformer_blocks.0.audio_attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
85 "transformer_blocks.0.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
86 "transformer_blocks.0.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
87 "transformer_blocks.0.audio_attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
88 "transformer_blocks.0.audio_attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
89 "transformer_blocks.0.audio_attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
90 "transformer_blocks.0.audio_attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
91 "transformer_blocks.0.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
92 "transformer_blocks.0.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
93 "transformer_blocks.0.audio_attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
94 "transformer_blocks.0.audio_attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
95 "transformer_blocks.0.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
96 "transformer_blocks.0.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
97 "transformer_blocks.0.audio_attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
98 "transformer_blocks.0.audio_attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
99 "transformer_blocks.0.audio_attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
100 "transformer_blocks.0.audio_attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
101 "transformer_blocks.0.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
102 "transformer_blocks.0.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
103 "transformer_blocks.0.audio_ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
104 "transformer_blocks.0.audio_ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
105 "transformer_blocks.0.audio_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
106 "transformer_blocks.0.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
107 "transformer_blocks.0.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
108 "transformer_blocks.0.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
109 "transformer_blocks.0.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
110 "transformer_blocks.0.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
111 "transformer_blocks.0.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
112 "transformer_blocks.0.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
113 "transformer_blocks.0.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
114 "transformer_blocks.0.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
115 "transformer_blocks.0.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
116 "transformer_blocks.0.ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
117 "transformer_blocks.0.ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
118 "transformer_blocks.0.ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
119 "transformer_blocks.0.ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
120 "transformer_blocks.0.scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
121 "transformer_blocks.0.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
122 "transformer_blocks.0.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
123 "transformer_blocks.0.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
124 "transformer_blocks.0.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
125 "transformer_blocks.0.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
126 "transformer_blocks.0.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
127 "transformer_blocks.0.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
128 "transformer_blocks.0.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
129 "transformer_blocks.0.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
130 "transformer_blocks.0.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
131 "transformer_blocks.0.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
132 "transformer_blocks.1.attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
133 "transformer_blocks.1.attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
134 "transformer_blocks.1.attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
135 "transformer_blocks.1.attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
136 "transformer_blocks.1.attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
137 "transformer_blocks.1.attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
138 "transformer_blocks.1.attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
139 "transformer_blocks.1.attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
140 "transformer_blocks.1.attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
141 "transformer_blocks.1.attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
142 "transformer_blocks.1.attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
143 "transformer_blocks.1.attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
144 "transformer_blocks.1.attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
145 "transformer_blocks.1.attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
146 "transformer_blocks.1.attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
147 "transformer_blocks.1.attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
148 "transformer_blocks.1.attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
149 "transformer_blocks.1.attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
150 "transformer_blocks.1.attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
151 "transformer_blocks.1.attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
152 "transformer_blocks.1.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
153 "transformer_blocks.1.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
154 "transformer_blocks.1.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
155 "transformer_blocks.1.audio_attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
156 "transformer_blocks.1.audio_attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
157 "transformer_blocks.1.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
158 "transformer_blocks.1.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
159 "transformer_blocks.1.audio_attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
160 "transformer_blocks.1.audio_attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
161 "transformer_blocks.1.audio_attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
162 "transformer_blocks.1.audio_attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
163 "transformer_blocks.1.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
164 "transformer_blocks.1.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
165 "transformer_blocks.1.audio_attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
166 "transformer_blocks.1.audio_attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
167 "transformer_blocks.1.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
168 "transformer_blocks.1.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
169 "transformer_blocks.1.audio_attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
170 "transformer_blocks.1.audio_attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
171 "transformer_blocks.1.audio_attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
172 "transformer_blocks.1.audio_attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
173 "transformer_blocks.1.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
174 "transformer_blocks.1.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
175 "transformer_blocks.1.audio_ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
176 "transformer_blocks.1.audio_ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
177 "transformer_blocks.1.audio_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
178 "transformer_blocks.1.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
179 "transformer_blocks.1.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
180 "transformer_blocks.1.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
181 "transformer_blocks.1.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
182 "transformer_blocks.1.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
183 "transformer_blocks.1.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
184 "transformer_blocks.1.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
185 "transformer_blocks.1.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
186 "transformer_blocks.1.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
187 "transformer_blocks.1.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
188 "transformer_blocks.1.ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
189 "transformer_blocks.1.ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
190 "transformer_blocks.1.ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
191 "transformer_blocks.1.ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
192 "transformer_blocks.1.scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
193 "transformer_blocks.1.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
194 "transformer_blocks.1.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
195 "transformer_blocks.1.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
196 "transformer_blocks.1.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
197 "transformer_blocks.1.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
198 "transformer_blocks.1.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
199 "transformer_blocks.1.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
200 "transformer_blocks.1.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
201 "transformer_blocks.1.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
202 "transformer_blocks.1.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
203 "transformer_blocks.1.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
204 "transformer_blocks.10.attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
205 "transformer_blocks.10.attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
206 "transformer_blocks.10.attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
207 "transformer_blocks.10.attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
208 "transformer_blocks.10.attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
209 "transformer_blocks.10.attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
210 "transformer_blocks.10.attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
211 "transformer_blocks.10.attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
212 "transformer_blocks.10.attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
213 "transformer_blocks.10.attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
214 "transformer_blocks.10.attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
215 "transformer_blocks.10.attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
216 "transformer_blocks.10.attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
217 "transformer_blocks.10.attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
218 "transformer_blocks.10.attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
219 "transformer_blocks.10.attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
220 "transformer_blocks.10.attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
221 "transformer_blocks.10.attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
222 "transformer_blocks.10.attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
223 "transformer_blocks.10.attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
224 "transformer_blocks.10.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
225 "transformer_blocks.10.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
226 "transformer_blocks.10.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
227 "transformer_blocks.10.audio_attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
228 "transformer_blocks.10.audio_attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
229 "transformer_blocks.10.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
230 "transformer_blocks.10.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
231 "transformer_blocks.10.audio_attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
232 "transformer_blocks.10.audio_attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
233 "transformer_blocks.10.audio_attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
234 "transformer_blocks.10.audio_attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
235 "transformer_blocks.10.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
236 "transformer_blocks.10.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
237 "transformer_blocks.10.audio_attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
238 "transformer_blocks.10.audio_attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
239 "transformer_blocks.10.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
240 "transformer_blocks.10.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
241 "transformer_blocks.10.audio_attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
242 "transformer_blocks.10.audio_attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
243 "transformer_blocks.10.audio_attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
244 "transformer_blocks.10.audio_attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
245 "transformer_blocks.10.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
246 "transformer_blocks.10.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
247 "transformer_blocks.10.audio_ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
248 "transformer_blocks.10.audio_ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
249 "transformer_blocks.10.audio_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
250 "transformer_blocks.10.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
251 "transformer_blocks.10.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
252 "transformer_blocks.10.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
253 "transformer_blocks.10.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
254 "transformer_blocks.10.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
255 "transformer_blocks.10.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
256 "transformer_blocks.10.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
257 "transformer_blocks.10.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
258 "transformer_blocks.10.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
259 "transformer_blocks.10.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
260 "transformer_blocks.10.ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
261 "transformer_blocks.10.ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
262 "transformer_blocks.10.ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
263 "transformer_blocks.10.ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
264 "transformer_blocks.10.scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
265 "transformer_blocks.10.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
266 "transformer_blocks.10.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
267 "transformer_blocks.10.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
268 "transformer_blocks.10.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
269 "transformer_blocks.10.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
270 "transformer_blocks.10.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
271 "transformer_blocks.10.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
272 "transformer_blocks.10.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
273 "transformer_blocks.10.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
274 "transformer_blocks.10.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
275 "transformer_blocks.10.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
276 "transformer_blocks.11.attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
277 "transformer_blocks.11.attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
278 "transformer_blocks.11.attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
279 "transformer_blocks.11.attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
280 "transformer_blocks.11.attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
281 "transformer_blocks.11.attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
282 "transformer_blocks.11.attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
283 "transformer_blocks.11.attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
284 "transformer_blocks.11.attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
285 "transformer_blocks.11.attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
286 "transformer_blocks.11.attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
287 "transformer_blocks.11.attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
288 "transformer_blocks.11.attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
289 "transformer_blocks.11.attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
290 "transformer_blocks.11.attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
291 "transformer_blocks.11.attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
292 "transformer_blocks.11.attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
293 "transformer_blocks.11.attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
294 "transformer_blocks.11.attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
295 "transformer_blocks.11.attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
296 "transformer_blocks.11.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
297 "transformer_blocks.11.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
298 "transformer_blocks.11.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
299 "transformer_blocks.11.audio_attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
300 "transformer_blocks.11.audio_attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
301 "transformer_blocks.11.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
302 "transformer_blocks.11.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
303 "transformer_blocks.11.audio_attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
304 "transformer_blocks.11.audio_attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
305 "transformer_blocks.11.audio_attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
306 "transformer_blocks.11.audio_attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
307 "transformer_blocks.11.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
308 "transformer_blocks.11.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
309 "transformer_blocks.11.audio_attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
310 "transformer_blocks.11.audio_attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
311 "transformer_blocks.11.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
312 "transformer_blocks.11.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
313 "transformer_blocks.11.audio_attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
314 "transformer_blocks.11.audio_attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
315 "transformer_blocks.11.audio_attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
316 "transformer_blocks.11.audio_attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
317 "transformer_blocks.11.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
318 "transformer_blocks.11.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
319 "transformer_blocks.11.audio_ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
320 "transformer_blocks.11.audio_ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
321 "transformer_blocks.11.audio_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
322 "transformer_blocks.11.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
323 "transformer_blocks.11.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
324 "transformer_blocks.11.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
325 "transformer_blocks.11.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
326 "transformer_blocks.11.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
327 "transformer_blocks.11.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
328 "transformer_blocks.11.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
329 "transformer_blocks.11.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
330 "transformer_blocks.11.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
331 "transformer_blocks.11.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
332 "transformer_blocks.11.ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
333 "transformer_blocks.11.ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
334 "transformer_blocks.11.ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
335 "transformer_blocks.11.ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
336 "transformer_blocks.11.scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
337 "transformer_blocks.11.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
338 "transformer_blocks.11.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
339 "transformer_blocks.11.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
340 "transformer_blocks.11.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
341 "transformer_blocks.11.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
342 "transformer_blocks.11.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
343 "transformer_blocks.11.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
344 "transformer_blocks.11.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
345 "transformer_blocks.11.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
346 "transformer_blocks.11.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
347 "transformer_blocks.11.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
348 "transformer_blocks.12.attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
349 "transformer_blocks.12.attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
350 "transformer_blocks.12.attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
351 "transformer_blocks.12.attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
352 "transformer_blocks.12.attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
353 "transformer_blocks.12.attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
354 "transformer_blocks.12.attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
355 "transformer_blocks.12.attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
356 "transformer_blocks.12.attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
357 "transformer_blocks.12.attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
358 "transformer_blocks.12.attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
359 "transformer_blocks.12.attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
360 "transformer_blocks.12.attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
361 "transformer_blocks.12.attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
362 "transformer_blocks.12.attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
363 "transformer_blocks.12.attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
364 "transformer_blocks.12.attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
365 "transformer_blocks.12.attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
366 "transformer_blocks.12.attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
367 "transformer_blocks.12.attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
368 "transformer_blocks.12.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
369 "transformer_blocks.12.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
370 "transformer_blocks.12.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
371 "transformer_blocks.12.audio_attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
372 "transformer_blocks.12.audio_attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
373 "transformer_blocks.12.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
374 "transformer_blocks.12.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
375 "transformer_blocks.12.audio_attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
376 "transformer_blocks.12.audio_attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
377 "transformer_blocks.12.audio_attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
378 "transformer_blocks.12.audio_attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
379 "transformer_blocks.12.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
380 "transformer_blocks.12.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
381 "transformer_blocks.12.audio_attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
382 "transformer_blocks.12.audio_attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
383 "transformer_blocks.12.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
384 "transformer_blocks.12.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
385 "transformer_blocks.12.audio_attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
386 "transformer_blocks.12.audio_attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
387 "transformer_blocks.12.audio_attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
388 "transformer_blocks.12.audio_attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
389 "transformer_blocks.12.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
390 "transformer_blocks.12.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
391 "transformer_blocks.12.audio_ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
392 "transformer_blocks.12.audio_ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
393 "transformer_blocks.12.audio_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
394 "transformer_blocks.12.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
395 "transformer_blocks.12.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
396 "transformer_blocks.12.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
397 "transformer_blocks.12.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
398 "transformer_blocks.12.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
399 "transformer_blocks.12.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
400 "transformer_blocks.12.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
401 "transformer_blocks.12.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
402 "transformer_blocks.12.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
403 "transformer_blocks.12.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
404 "transformer_blocks.12.ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
405 "transformer_blocks.12.ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
406 "transformer_blocks.12.ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
407 "transformer_blocks.12.ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
408 "transformer_blocks.12.scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
409 "transformer_blocks.12.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
410 "transformer_blocks.12.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
411 "transformer_blocks.12.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
412 "transformer_blocks.12.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
413 "transformer_blocks.12.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
414 "transformer_blocks.12.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
415 "transformer_blocks.12.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
416 "transformer_blocks.12.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
417 "transformer_blocks.12.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
418 "transformer_blocks.12.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
419 "transformer_blocks.12.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
420 "transformer_blocks.13.attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
421 "transformer_blocks.13.attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
422 "transformer_blocks.13.attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
423 "transformer_blocks.13.attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
424 "transformer_blocks.13.attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
425 "transformer_blocks.13.attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
426 "transformer_blocks.13.attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
427 "transformer_blocks.13.attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
428 "transformer_blocks.13.attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
429 "transformer_blocks.13.attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
430 "transformer_blocks.13.attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
431 "transformer_blocks.13.attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
432 "transformer_blocks.13.attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
433 "transformer_blocks.13.attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
434 "transformer_blocks.13.attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
435 "transformer_blocks.13.attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
436 "transformer_blocks.13.attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
437 "transformer_blocks.13.attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
438 "transformer_blocks.13.attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
439 "transformer_blocks.13.attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
440 "transformer_blocks.13.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
441 "transformer_blocks.13.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
442 "transformer_blocks.13.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
443 "transformer_blocks.13.audio_attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
444 "transformer_blocks.13.audio_attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
445 "transformer_blocks.13.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
446 "transformer_blocks.13.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
447 "transformer_blocks.13.audio_attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
448 "transformer_blocks.13.audio_attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
449 "transformer_blocks.13.audio_attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
450 "transformer_blocks.13.audio_attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
451 "transformer_blocks.13.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
452 "transformer_blocks.13.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
453 "transformer_blocks.13.audio_attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
454 "transformer_blocks.13.audio_attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
455 "transformer_blocks.13.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
456 "transformer_blocks.13.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
457 "transformer_blocks.13.audio_attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
458 "transformer_blocks.13.audio_attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
459 "transformer_blocks.13.audio_attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
460 "transformer_blocks.13.audio_attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
461 "transformer_blocks.13.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
462 "transformer_blocks.13.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
463 "transformer_blocks.13.audio_ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
464 "transformer_blocks.13.audio_ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
465 "transformer_blocks.13.audio_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
466 "transformer_blocks.13.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
467 "transformer_blocks.13.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
468 "transformer_blocks.13.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
469 "transformer_blocks.13.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
470 "transformer_blocks.13.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
471 "transformer_blocks.13.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
472 "transformer_blocks.13.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
473 "transformer_blocks.13.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
474 "transformer_blocks.13.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
475 "transformer_blocks.13.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
476 "transformer_blocks.13.ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
477 "transformer_blocks.13.ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
478 "transformer_blocks.13.ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
479 "transformer_blocks.13.ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
480 "transformer_blocks.13.scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
481 "transformer_blocks.13.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
482 "transformer_blocks.13.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
483 "transformer_blocks.13.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
484 "transformer_blocks.13.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
485 "transformer_blocks.13.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
486 "transformer_blocks.13.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
487 "transformer_blocks.13.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
488 "transformer_blocks.13.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
489 "transformer_blocks.13.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
490 "transformer_blocks.13.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
491 "transformer_blocks.13.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
492 "transformer_blocks.14.attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
493 "transformer_blocks.14.attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
494 "transformer_blocks.14.attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
495 "transformer_blocks.14.attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
496 "transformer_blocks.14.attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
497 "transformer_blocks.14.attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
498 "transformer_blocks.14.attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
499 "transformer_blocks.14.attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
500 "transformer_blocks.14.attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
501 "transformer_blocks.14.attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
502 "transformer_blocks.14.attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
503 "transformer_blocks.14.attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
504 "transformer_blocks.14.attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
505 "transformer_blocks.14.attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
506 "transformer_blocks.14.attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
507 "transformer_blocks.14.attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
508 "transformer_blocks.14.attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
509 "transformer_blocks.14.attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
510 "transformer_blocks.14.attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
511 "transformer_blocks.14.attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
512 "transformer_blocks.14.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
513 "transformer_blocks.14.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
514 "transformer_blocks.14.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
515 "transformer_blocks.14.audio_attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
516 "transformer_blocks.14.audio_attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
517 "transformer_blocks.14.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
518 "transformer_blocks.14.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
519 "transformer_blocks.14.audio_attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
520 "transformer_blocks.14.audio_attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
521 "transformer_blocks.14.audio_attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
522 "transformer_blocks.14.audio_attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
523 "transformer_blocks.14.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
524 "transformer_blocks.14.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
525 "transformer_blocks.14.audio_attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
526 "transformer_blocks.14.audio_attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
527 "transformer_blocks.14.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
528 "transformer_blocks.14.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
529 "transformer_blocks.14.audio_attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
530 "transformer_blocks.14.audio_attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
531 "transformer_blocks.14.audio_attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
532 "transformer_blocks.14.audio_attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
533 "transformer_blocks.14.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
534 "transformer_blocks.14.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
535 "transformer_blocks.14.audio_ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
536 "transformer_blocks.14.audio_ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
537 "transformer_blocks.14.audio_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
538 "transformer_blocks.14.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
539 "transformer_blocks.14.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
540 "transformer_blocks.14.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
541 "transformer_blocks.14.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
542 "transformer_blocks.14.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
543 "transformer_blocks.14.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
544 "transformer_blocks.14.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
545 "transformer_blocks.14.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
546 "transformer_blocks.14.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
547 "transformer_blocks.14.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
548 "transformer_blocks.14.ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
549 "transformer_blocks.14.ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
550 "transformer_blocks.14.ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
551 "transformer_blocks.14.ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
552 "transformer_blocks.14.scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
553 "transformer_blocks.14.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
554 "transformer_blocks.14.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
555 "transformer_blocks.14.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
556 "transformer_blocks.14.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
557 "transformer_blocks.14.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
558 "transformer_blocks.14.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
559 "transformer_blocks.14.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
560 "transformer_blocks.14.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
561 "transformer_blocks.14.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
562 "transformer_blocks.14.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
563 "transformer_blocks.14.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
564 "transformer_blocks.15.attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
565 "transformer_blocks.15.attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
566 "transformer_blocks.15.attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
567 "transformer_blocks.15.attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
568 "transformer_blocks.15.attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
569 "transformer_blocks.15.attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
570 "transformer_blocks.15.attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
571 "transformer_blocks.15.attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
572 "transformer_blocks.15.attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
573 "transformer_blocks.15.attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
574 "transformer_blocks.15.attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
575 "transformer_blocks.15.attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
576 "transformer_blocks.15.attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
577 "transformer_blocks.15.attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
578 "transformer_blocks.15.attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
579 "transformer_blocks.15.attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
580 "transformer_blocks.15.attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
581 "transformer_blocks.15.attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
582 "transformer_blocks.15.attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
583 "transformer_blocks.15.attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
584 "transformer_blocks.15.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
585 "transformer_blocks.15.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
586 "transformer_blocks.15.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
587 "transformer_blocks.15.audio_attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
588 "transformer_blocks.15.audio_attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
589 "transformer_blocks.15.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
590 "transformer_blocks.15.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
591 "transformer_blocks.15.audio_attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
592 "transformer_blocks.15.audio_attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
593 "transformer_blocks.15.audio_attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
594 "transformer_blocks.15.audio_attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
595 "transformer_blocks.15.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
596 "transformer_blocks.15.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
597 "transformer_blocks.15.audio_attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
598 "transformer_blocks.15.audio_attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
599 "transformer_blocks.15.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
600 "transformer_blocks.15.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
601 "transformer_blocks.15.audio_attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
602 "transformer_blocks.15.audio_attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
603 "transformer_blocks.15.audio_attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
604 "transformer_blocks.15.audio_attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
605 "transformer_blocks.15.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
606 "transformer_blocks.15.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
607 "transformer_blocks.15.audio_ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
608 "transformer_blocks.15.audio_ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
609 "transformer_blocks.15.audio_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
610 "transformer_blocks.15.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
611 "transformer_blocks.15.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
612 "transformer_blocks.15.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
613 "transformer_blocks.15.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
614 "transformer_blocks.15.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
615 "transformer_blocks.15.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
616 "transformer_blocks.15.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
617 "transformer_blocks.15.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
618 "transformer_blocks.15.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
619 "transformer_blocks.15.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
620 "transformer_blocks.15.ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
621 "transformer_blocks.15.ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
622 "transformer_blocks.15.ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
623 "transformer_blocks.15.ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
624 "transformer_blocks.15.scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
625 "transformer_blocks.15.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
626 "transformer_blocks.15.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
627 "transformer_blocks.15.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
628 "transformer_blocks.15.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
629 "transformer_blocks.15.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
630 "transformer_blocks.15.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
631 "transformer_blocks.15.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
632 "transformer_blocks.15.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
633 "transformer_blocks.15.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
634 "transformer_blocks.15.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
635 "transformer_blocks.15.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
636 "transformer_blocks.16.attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
637 "transformer_blocks.16.attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
638 "transformer_blocks.16.attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
639 "transformer_blocks.16.attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
640 "transformer_blocks.16.attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
641 "transformer_blocks.16.attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
642 "transformer_blocks.16.attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
643 "transformer_blocks.16.attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
644 "transformer_blocks.16.attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
645 "transformer_blocks.16.attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
646 "transformer_blocks.16.attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
647 "transformer_blocks.16.attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
648 "transformer_blocks.16.attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
649 "transformer_blocks.16.attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
650 "transformer_blocks.16.attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
651 "transformer_blocks.16.attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
652 "transformer_blocks.16.attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
653 "transformer_blocks.16.attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
654 "transformer_blocks.16.attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
655 "transformer_blocks.16.attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
656 "transformer_blocks.16.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
657 "transformer_blocks.16.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
658 "transformer_blocks.16.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
659 "transformer_blocks.16.audio_attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
660 "transformer_blocks.16.audio_attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
661 "transformer_blocks.16.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
662 "transformer_blocks.16.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
663 "transformer_blocks.16.audio_attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
664 "transformer_blocks.16.audio_attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
665 "transformer_blocks.16.audio_attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
666 "transformer_blocks.16.audio_attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
667 "transformer_blocks.16.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
668 "transformer_blocks.16.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
669 "transformer_blocks.16.audio_attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
670 "transformer_blocks.16.audio_attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
671 "transformer_blocks.16.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
672 "transformer_blocks.16.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
673 "transformer_blocks.16.audio_attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
674 "transformer_blocks.16.audio_attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
675 "transformer_blocks.16.audio_attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
676 "transformer_blocks.16.audio_attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
677 "transformer_blocks.16.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
678 "transformer_blocks.16.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
679 "transformer_blocks.16.audio_ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
680 "transformer_blocks.16.audio_ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
681 "transformer_blocks.16.audio_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
682 "transformer_blocks.16.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
683 "transformer_blocks.16.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
684 "transformer_blocks.16.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
685 "transformer_blocks.16.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
686 "transformer_blocks.16.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
687 "transformer_blocks.16.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
688 "transformer_blocks.16.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
689 "transformer_blocks.16.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
690 "transformer_blocks.16.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
691 "transformer_blocks.16.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
692 "transformer_blocks.16.ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
693 "transformer_blocks.16.ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
694 "transformer_blocks.16.ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
695 "transformer_blocks.16.ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
696 "transformer_blocks.16.scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
697 "transformer_blocks.16.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
698 "transformer_blocks.16.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
699 "transformer_blocks.16.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
700 "transformer_blocks.16.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
701 "transformer_blocks.16.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
702 "transformer_blocks.16.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
703 "transformer_blocks.16.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
704 "transformer_blocks.16.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
705 "transformer_blocks.16.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
706 "transformer_blocks.16.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
707 "transformer_blocks.16.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
708 "transformer_blocks.17.attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
709 "transformer_blocks.17.attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
710 "transformer_blocks.17.attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
711 "transformer_blocks.17.attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
712 "transformer_blocks.17.attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
713 "transformer_blocks.17.attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
714 "transformer_blocks.17.attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
715 "transformer_blocks.17.attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
716 "transformer_blocks.17.attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
717 "transformer_blocks.17.attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
718 "transformer_blocks.17.attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
719 "transformer_blocks.17.attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
720 "transformer_blocks.17.attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
721 "transformer_blocks.17.attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
722 "transformer_blocks.17.attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
723 "transformer_blocks.17.attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
724 "transformer_blocks.17.attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
725 "transformer_blocks.17.attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
726 "transformer_blocks.17.attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
727 "transformer_blocks.17.attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
728 "transformer_blocks.17.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
729 "transformer_blocks.17.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
730 "transformer_blocks.17.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
731 "transformer_blocks.17.audio_attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
732 "transformer_blocks.17.audio_attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
733 "transformer_blocks.17.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
734 "transformer_blocks.17.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
735 "transformer_blocks.17.audio_attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
736 "transformer_blocks.17.audio_attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
737 "transformer_blocks.17.audio_attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
738 "transformer_blocks.17.audio_attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
739 "transformer_blocks.17.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
740 "transformer_blocks.17.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
741 "transformer_blocks.17.audio_attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
742 "transformer_blocks.17.audio_attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
743 "transformer_blocks.17.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
744 "transformer_blocks.17.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
745 "transformer_blocks.17.audio_attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
746 "transformer_blocks.17.audio_attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
747 "transformer_blocks.17.audio_attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
748 "transformer_blocks.17.audio_attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
749 "transformer_blocks.17.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
750 "transformer_blocks.17.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
751 "transformer_blocks.17.audio_ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
752 "transformer_blocks.17.audio_ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
753 "transformer_blocks.17.audio_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
754 "transformer_blocks.17.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
755 "transformer_blocks.17.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
756 "transformer_blocks.17.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
757 "transformer_blocks.17.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
758 "transformer_blocks.17.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
759 "transformer_blocks.17.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
760 "transformer_blocks.17.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
761 "transformer_blocks.17.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
762 "transformer_blocks.17.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
763 "transformer_blocks.17.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
764 "transformer_blocks.17.ff.net.0.proj.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
765 "transformer_blocks.17.ff.net.0.proj.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
766 "transformer_blocks.17.ff.net.2.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
767 "transformer_blocks.17.ff.net.2.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
768 "transformer_blocks.17.scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
769 "transformer_blocks.17.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
770 "transformer_blocks.17.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
771 "transformer_blocks.17.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
772 "transformer_blocks.17.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
773 "transformer_blocks.17.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
774 "transformer_blocks.17.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
775 "transformer_blocks.17.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
776 "transformer_blocks.17.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
777 "transformer_blocks.17.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
778 "transformer_blocks.17.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
779 "transformer_blocks.17.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
780 "transformer_blocks.18.attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
781 "transformer_blocks.18.attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
782 "transformer_blocks.18.attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
783 "transformer_blocks.18.attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
784 "transformer_blocks.18.attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
785 "transformer_blocks.18.attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
786 "transformer_blocks.18.attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
787 "transformer_blocks.18.attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
788 "transformer_blocks.18.attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
789 "transformer_blocks.18.attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
790 "transformer_blocks.18.attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
791 "transformer_blocks.18.attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
792 "transformer_blocks.18.attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
793 "transformer_blocks.18.attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
794 "transformer_blocks.18.attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
795 "transformer_blocks.18.attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
796 "transformer_blocks.18.attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
797 "transformer_blocks.18.attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
798 "transformer_blocks.18.attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
799 "transformer_blocks.18.attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
800 "transformer_blocks.18.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
801 "transformer_blocks.18.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
802 "transformer_blocks.18.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
803 "transformer_blocks.18.audio_attn1.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
804 "transformer_blocks.18.audio_attn1.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
805 "transformer_blocks.18.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
806 "transformer_blocks.18.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
807 "transformer_blocks.18.audio_attn1.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
808 "transformer_blocks.18.audio_attn1.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
809 "transformer_blocks.18.audio_attn1.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
810 "transformer_blocks.18.audio_attn1.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
811 "transformer_blocks.18.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
812 "transformer_blocks.18.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
813 "transformer_blocks.18.audio_attn2.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
814 "transformer_blocks.18.audio_attn2.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
815 "transformer_blocks.18.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
816 "transformer_blocks.18.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
817 "transformer_blocks.18.audio_attn2.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
818 "transformer_blocks.18.audio_attn2.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
819 "transformer_blocks.18.audio_attn2.to_v.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
820 "transformer_blocks.18.audio_attn2.to_v.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
821 "transformer_blocks.18.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
822 "transformer_blocks.18.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
823 "transformer_blocks.18.audio_ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
824 "transformer_blocks.18.audio_ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
825 "transformer_blocks.18.audio_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
826 "transformer_blocks.18.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
827 "transformer_blocks.18.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
828 "transformer_blocks.18.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
829 "transformer_blocks.18.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
830 "transformer_blocks.18.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
831 "transformer_blocks.18.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
832 "transformer_blocks.18.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00003-of-00008.safetensors",
833 "transformer_blocks.18.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00003-of-00008.safetensors",
834 "transformer_blocks.18.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
835 "transformer_blocks.18.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
836 "transformer_blocks.18.ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
837 "transformer_blocks.18.ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
838 "transformer_blocks.18.ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
839 "transformer_blocks.18.ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
840 "transformer_blocks.18.scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
841 "transformer_blocks.18.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00003-of-00008.safetensors",
842 "transformer_blocks.18.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
843 "transformer_blocks.18.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
844 "transformer_blocks.18.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
845 "transformer_blocks.18.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
846 "transformer_blocks.18.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
847 "transformer_blocks.18.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
848 "transformer_blocks.18.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
849 "transformer_blocks.18.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
850 "transformer_blocks.18.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
851 "transformer_blocks.18.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
852 "transformer_blocks.19.attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
853 "transformer_blocks.19.attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
854 "transformer_blocks.19.attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
855 "transformer_blocks.19.attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
856 "transformer_blocks.19.attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
857 "transformer_blocks.19.attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
858 "transformer_blocks.19.attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
859 "transformer_blocks.19.attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
860 "transformer_blocks.19.attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
861 "transformer_blocks.19.attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
862 "transformer_blocks.19.attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
863 "transformer_blocks.19.attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
864 "transformer_blocks.19.attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
865 "transformer_blocks.19.attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
866 "transformer_blocks.19.attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
867 "transformer_blocks.19.attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
868 "transformer_blocks.19.attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
869 "transformer_blocks.19.attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
870 "transformer_blocks.19.attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
871 "transformer_blocks.19.attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
872 "transformer_blocks.19.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
873 "transformer_blocks.19.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
874 "transformer_blocks.19.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
875 "transformer_blocks.19.audio_attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
876 "transformer_blocks.19.audio_attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
877 "transformer_blocks.19.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
878 "transformer_blocks.19.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
879 "transformer_blocks.19.audio_attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
880 "transformer_blocks.19.audio_attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
881 "transformer_blocks.19.audio_attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
882 "transformer_blocks.19.audio_attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
883 "transformer_blocks.19.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
884 "transformer_blocks.19.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
885 "transformer_blocks.19.audio_attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
886 "transformer_blocks.19.audio_attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
887 "transformer_blocks.19.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
888 "transformer_blocks.19.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
889 "transformer_blocks.19.audio_attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
890 "transformer_blocks.19.audio_attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
891 "transformer_blocks.19.audio_attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
892 "transformer_blocks.19.audio_attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
893 "transformer_blocks.19.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
894 "transformer_blocks.19.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
895 "transformer_blocks.19.audio_ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
896 "transformer_blocks.19.audio_ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
897 "transformer_blocks.19.audio_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
898 "transformer_blocks.19.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
899 "transformer_blocks.19.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
900 "transformer_blocks.19.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
901 "transformer_blocks.19.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
902 "transformer_blocks.19.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
903 "transformer_blocks.19.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
904 "transformer_blocks.19.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
905 "transformer_blocks.19.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
906 "transformer_blocks.19.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
907 "transformer_blocks.19.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
908 "transformer_blocks.19.ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
909 "transformer_blocks.19.ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
910 "transformer_blocks.19.ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
911 "transformer_blocks.19.ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
912 "transformer_blocks.19.scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
913 "transformer_blocks.19.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
914 "transformer_blocks.19.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
915 "transformer_blocks.19.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
916 "transformer_blocks.19.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
917 "transformer_blocks.19.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
918 "transformer_blocks.19.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
919 "transformer_blocks.19.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
920 "transformer_blocks.19.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
921 "transformer_blocks.19.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
922 "transformer_blocks.19.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
923 "transformer_blocks.19.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
924 "transformer_blocks.2.attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
925 "transformer_blocks.2.attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
926 "transformer_blocks.2.attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
927 "transformer_blocks.2.attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
928 "transformer_blocks.2.attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
929 "transformer_blocks.2.attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
930 "transformer_blocks.2.attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
931 "transformer_blocks.2.attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
932 "transformer_blocks.2.attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
933 "transformer_blocks.2.attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
934 "transformer_blocks.2.attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
935 "transformer_blocks.2.attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
936 "transformer_blocks.2.attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
937 "transformer_blocks.2.attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
938 "transformer_blocks.2.attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
939 "transformer_blocks.2.attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
940 "transformer_blocks.2.attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
941 "transformer_blocks.2.attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
942 "transformer_blocks.2.attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
943 "transformer_blocks.2.attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
944 "transformer_blocks.2.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
945 "transformer_blocks.2.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
946 "transformer_blocks.2.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
947 "transformer_blocks.2.audio_attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
948 "transformer_blocks.2.audio_attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
949 "transformer_blocks.2.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
950 "transformer_blocks.2.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
951 "transformer_blocks.2.audio_attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
952 "transformer_blocks.2.audio_attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
953 "transformer_blocks.2.audio_attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
954 "transformer_blocks.2.audio_attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
955 "transformer_blocks.2.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
956 "transformer_blocks.2.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
957 "transformer_blocks.2.audio_attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
958 "transformer_blocks.2.audio_attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
959 "transformer_blocks.2.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
960 "transformer_blocks.2.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
961 "transformer_blocks.2.audio_attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
962 "transformer_blocks.2.audio_attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
963 "transformer_blocks.2.audio_attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
964 "transformer_blocks.2.audio_attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
965 "transformer_blocks.2.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
966 "transformer_blocks.2.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
967 "transformer_blocks.2.audio_ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
968 "transformer_blocks.2.audio_ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
969 "transformer_blocks.2.audio_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
970 "transformer_blocks.2.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
971 "transformer_blocks.2.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
972 "transformer_blocks.2.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
973 "transformer_blocks.2.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
974 "transformer_blocks.2.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
975 "transformer_blocks.2.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
976 "transformer_blocks.2.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
977 "transformer_blocks.2.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
978 "transformer_blocks.2.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
979 "transformer_blocks.2.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
980 "transformer_blocks.2.ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
981 "transformer_blocks.2.ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
982 "transformer_blocks.2.ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
983 "transformer_blocks.2.ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
984 "transformer_blocks.2.scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
985 "transformer_blocks.2.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
986 "transformer_blocks.2.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
987 "transformer_blocks.2.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
988 "transformer_blocks.2.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
989 "transformer_blocks.2.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
990 "transformer_blocks.2.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
991 "transformer_blocks.2.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
992 "transformer_blocks.2.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
993 "transformer_blocks.2.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
994 "transformer_blocks.2.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
995 "transformer_blocks.2.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
996 "transformer_blocks.20.attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
997 "transformer_blocks.20.attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
998 "transformer_blocks.20.attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
999 "transformer_blocks.20.attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1000 "transformer_blocks.20.attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1001 "transformer_blocks.20.attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1002 "transformer_blocks.20.attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1003 "transformer_blocks.20.attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1004 "transformer_blocks.20.attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1005 "transformer_blocks.20.attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1006 "transformer_blocks.20.attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1007 "transformer_blocks.20.attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1008 "transformer_blocks.20.attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1009 "transformer_blocks.20.attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1010 "transformer_blocks.20.attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1011 "transformer_blocks.20.attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1012 "transformer_blocks.20.attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1013 "transformer_blocks.20.attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1014 "transformer_blocks.20.attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1015 "transformer_blocks.20.attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1016 "transformer_blocks.20.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1017 "transformer_blocks.20.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1018 "transformer_blocks.20.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1019 "transformer_blocks.20.audio_attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1020 "transformer_blocks.20.audio_attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1021 "transformer_blocks.20.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1022 "transformer_blocks.20.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1023 "transformer_blocks.20.audio_attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1024 "transformer_blocks.20.audio_attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1025 "transformer_blocks.20.audio_attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1026 "transformer_blocks.20.audio_attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1027 "transformer_blocks.20.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1028 "transformer_blocks.20.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1029 "transformer_blocks.20.audio_attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1030 "transformer_blocks.20.audio_attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1031 "transformer_blocks.20.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1032 "transformer_blocks.20.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1033 "transformer_blocks.20.audio_attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1034 "transformer_blocks.20.audio_attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1035 "transformer_blocks.20.audio_attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1036 "transformer_blocks.20.audio_attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1037 "transformer_blocks.20.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1038 "transformer_blocks.20.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1039 "transformer_blocks.20.audio_ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1040 "transformer_blocks.20.audio_ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1041 "transformer_blocks.20.audio_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1042 "transformer_blocks.20.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1043 "transformer_blocks.20.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1044 "transformer_blocks.20.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1045 "transformer_blocks.20.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1046 "transformer_blocks.20.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1047 "transformer_blocks.20.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1048 "transformer_blocks.20.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1049 "transformer_blocks.20.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1050 "transformer_blocks.20.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1051 "transformer_blocks.20.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1052 "transformer_blocks.20.ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1053 "transformer_blocks.20.ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1054 "transformer_blocks.20.ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1055 "transformer_blocks.20.ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1056 "transformer_blocks.20.scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1057 "transformer_blocks.20.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1058 "transformer_blocks.20.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1059 "transformer_blocks.20.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1060 "transformer_blocks.20.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1061 "transformer_blocks.20.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1062 "transformer_blocks.20.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1063 "transformer_blocks.20.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1064 "transformer_blocks.20.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1065 "transformer_blocks.20.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1066 "transformer_blocks.20.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1067 "transformer_blocks.20.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1068 "transformer_blocks.21.attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1069 "transformer_blocks.21.attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1070 "transformer_blocks.21.attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1071 "transformer_blocks.21.attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1072 "transformer_blocks.21.attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1073 "transformer_blocks.21.attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1074 "transformer_blocks.21.attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1075 "transformer_blocks.21.attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1076 "transformer_blocks.21.attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1077 "transformer_blocks.21.attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1078 "transformer_blocks.21.attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1079 "transformer_blocks.21.attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1080 "transformer_blocks.21.attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1081 "transformer_blocks.21.attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1082 "transformer_blocks.21.attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1083 "transformer_blocks.21.attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1084 "transformer_blocks.21.attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1085 "transformer_blocks.21.attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1086 "transformer_blocks.21.attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1087 "transformer_blocks.21.attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1088 "transformer_blocks.21.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1089 "transformer_blocks.21.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1090 "transformer_blocks.21.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1091 "transformer_blocks.21.audio_attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1092 "transformer_blocks.21.audio_attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1093 "transformer_blocks.21.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1094 "transformer_blocks.21.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1095 "transformer_blocks.21.audio_attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1096 "transformer_blocks.21.audio_attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1097 "transformer_blocks.21.audio_attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1098 "transformer_blocks.21.audio_attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1099 "transformer_blocks.21.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1100 "transformer_blocks.21.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1101 "transformer_blocks.21.audio_attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1102 "transformer_blocks.21.audio_attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1103 "transformer_blocks.21.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1104 "transformer_blocks.21.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1105 "transformer_blocks.21.audio_attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1106 "transformer_blocks.21.audio_attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1107 "transformer_blocks.21.audio_attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1108 "transformer_blocks.21.audio_attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1109 "transformer_blocks.21.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1110 "transformer_blocks.21.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1111 "transformer_blocks.21.audio_ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1112 "transformer_blocks.21.audio_ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1113 "transformer_blocks.21.audio_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1114 "transformer_blocks.21.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1115 "transformer_blocks.21.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1116 "transformer_blocks.21.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1117 "transformer_blocks.21.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1118 "transformer_blocks.21.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1119 "transformer_blocks.21.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1120 "transformer_blocks.21.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1121 "transformer_blocks.21.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1122 "transformer_blocks.21.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1123 "transformer_blocks.21.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1124 "transformer_blocks.21.ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1125 "transformer_blocks.21.ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1126 "transformer_blocks.21.ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1127 "transformer_blocks.21.ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1128 "transformer_blocks.21.scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1129 "transformer_blocks.21.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1130 "transformer_blocks.21.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1131 "transformer_blocks.21.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1132 "transformer_blocks.21.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1133 "transformer_blocks.21.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1134 "transformer_blocks.21.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1135 "transformer_blocks.21.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1136 "transformer_blocks.21.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1137 "transformer_blocks.21.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1138 "transformer_blocks.21.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1139 "transformer_blocks.21.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1140 "transformer_blocks.22.attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1141 "transformer_blocks.22.attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1142 "transformer_blocks.22.attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1143 "transformer_blocks.22.attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1144 "transformer_blocks.22.attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1145 "transformer_blocks.22.attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1146 "transformer_blocks.22.attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1147 "transformer_blocks.22.attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1148 "transformer_blocks.22.attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1149 "transformer_blocks.22.attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1150 "transformer_blocks.22.attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1151 "transformer_blocks.22.attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1152 "transformer_blocks.22.attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1153 "transformer_blocks.22.attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1154 "transformer_blocks.22.attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1155 "transformer_blocks.22.attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1156 "transformer_blocks.22.attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1157 "transformer_blocks.22.attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1158 "transformer_blocks.22.attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1159 "transformer_blocks.22.attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1160 "transformer_blocks.22.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1161 "transformer_blocks.22.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1162 "transformer_blocks.22.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1163 "transformer_blocks.22.audio_attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1164 "transformer_blocks.22.audio_attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1165 "transformer_blocks.22.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1166 "transformer_blocks.22.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1167 "transformer_blocks.22.audio_attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1168 "transformer_blocks.22.audio_attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1169 "transformer_blocks.22.audio_attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1170 "transformer_blocks.22.audio_attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1171 "transformer_blocks.22.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1172 "transformer_blocks.22.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1173 "transformer_blocks.22.audio_attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1174 "transformer_blocks.22.audio_attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1175 "transformer_blocks.22.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1176 "transformer_blocks.22.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1177 "transformer_blocks.22.audio_attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1178 "transformer_blocks.22.audio_attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1179 "transformer_blocks.22.audio_attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1180 "transformer_blocks.22.audio_attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1181 "transformer_blocks.22.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1182 "transformer_blocks.22.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1183 "transformer_blocks.22.audio_ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1184 "transformer_blocks.22.audio_ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1185 "transformer_blocks.22.audio_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1186 "transformer_blocks.22.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1187 "transformer_blocks.22.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1188 "transformer_blocks.22.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1189 "transformer_blocks.22.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1190 "transformer_blocks.22.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1191 "transformer_blocks.22.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1192 "transformer_blocks.22.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1193 "transformer_blocks.22.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1194 "transformer_blocks.22.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1195 "transformer_blocks.22.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1196 "transformer_blocks.22.ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1197 "transformer_blocks.22.ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1198 "transformer_blocks.22.ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1199 "transformer_blocks.22.ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1200 "transformer_blocks.22.scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1201 "transformer_blocks.22.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1202 "transformer_blocks.22.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1203 "transformer_blocks.22.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1204 "transformer_blocks.22.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1205 "transformer_blocks.22.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1206 "transformer_blocks.22.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1207 "transformer_blocks.22.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1208 "transformer_blocks.22.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1209 "transformer_blocks.22.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1210 "transformer_blocks.22.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1211 "transformer_blocks.22.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1212 "transformer_blocks.23.attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1213 "transformer_blocks.23.attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1214 "transformer_blocks.23.attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1215 "transformer_blocks.23.attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1216 "transformer_blocks.23.attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1217 "transformer_blocks.23.attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1218 "transformer_blocks.23.attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1219 "transformer_blocks.23.attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1220 "transformer_blocks.23.attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1221 "transformer_blocks.23.attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1222 "transformer_blocks.23.attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1223 "transformer_blocks.23.attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1224 "transformer_blocks.23.attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1225 "transformer_blocks.23.attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1226 "transformer_blocks.23.attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1227 "transformer_blocks.23.attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1228 "transformer_blocks.23.attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1229 "transformer_blocks.23.attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1230 "transformer_blocks.23.attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1231 "transformer_blocks.23.attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1232 "transformer_blocks.23.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1233 "transformer_blocks.23.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1234 "transformer_blocks.23.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1235 "transformer_blocks.23.audio_attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1236 "transformer_blocks.23.audio_attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1237 "transformer_blocks.23.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1238 "transformer_blocks.23.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1239 "transformer_blocks.23.audio_attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1240 "transformer_blocks.23.audio_attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1241 "transformer_blocks.23.audio_attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1242 "transformer_blocks.23.audio_attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1243 "transformer_blocks.23.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1244 "transformer_blocks.23.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1245 "transformer_blocks.23.audio_attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1246 "transformer_blocks.23.audio_attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1247 "transformer_blocks.23.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1248 "transformer_blocks.23.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1249 "transformer_blocks.23.audio_attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1250 "transformer_blocks.23.audio_attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1251 "transformer_blocks.23.audio_attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1252 "transformer_blocks.23.audio_attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1253 "transformer_blocks.23.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1254 "transformer_blocks.23.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1255 "transformer_blocks.23.audio_ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1256 "transformer_blocks.23.audio_ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1257 "transformer_blocks.23.audio_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1258 "transformer_blocks.23.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1259 "transformer_blocks.23.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1260 "transformer_blocks.23.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1261 "transformer_blocks.23.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1262 "transformer_blocks.23.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1263 "transformer_blocks.23.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1264 "transformer_blocks.23.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1265 "transformer_blocks.23.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1266 "transformer_blocks.23.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1267 "transformer_blocks.23.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1268 "transformer_blocks.23.ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1269 "transformer_blocks.23.ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1270 "transformer_blocks.23.ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1271 "transformer_blocks.23.ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1272 "transformer_blocks.23.scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1273 "transformer_blocks.23.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1274 "transformer_blocks.23.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1275 "transformer_blocks.23.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1276 "transformer_blocks.23.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1277 "transformer_blocks.23.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1278 "transformer_blocks.23.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1279 "transformer_blocks.23.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1280 "transformer_blocks.23.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1281 "transformer_blocks.23.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1282 "transformer_blocks.23.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1283 "transformer_blocks.23.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1284 "transformer_blocks.24.attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1285 "transformer_blocks.24.attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1286 "transformer_blocks.24.attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1287 "transformer_blocks.24.attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1288 "transformer_blocks.24.attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1289 "transformer_blocks.24.attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1290 "transformer_blocks.24.attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1291 "transformer_blocks.24.attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1292 "transformer_blocks.24.attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1293 "transformer_blocks.24.attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1294 "transformer_blocks.24.attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1295 "transformer_blocks.24.attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1296 "transformer_blocks.24.attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1297 "transformer_blocks.24.attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1298 "transformer_blocks.24.attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1299 "transformer_blocks.24.attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1300 "transformer_blocks.24.attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1301 "transformer_blocks.24.attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1302 "transformer_blocks.24.attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1303 "transformer_blocks.24.attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1304 "transformer_blocks.24.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1305 "transformer_blocks.24.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1306 "transformer_blocks.24.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1307 "transformer_blocks.24.audio_attn1.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1308 "transformer_blocks.24.audio_attn1.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1309 "transformer_blocks.24.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1310 "transformer_blocks.24.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1311 "transformer_blocks.24.audio_attn1.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1312 "transformer_blocks.24.audio_attn1.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1313 "transformer_blocks.24.audio_attn1.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1314 "transformer_blocks.24.audio_attn1.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1315 "transformer_blocks.24.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1316 "transformer_blocks.24.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1317 "transformer_blocks.24.audio_attn2.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1318 "transformer_blocks.24.audio_attn2.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1319 "transformer_blocks.24.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1320 "transformer_blocks.24.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1321 "transformer_blocks.24.audio_attn2.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1322 "transformer_blocks.24.audio_attn2.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1323 "transformer_blocks.24.audio_attn2.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1324 "transformer_blocks.24.audio_attn2.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1325 "transformer_blocks.24.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1326 "transformer_blocks.24.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1327 "transformer_blocks.24.audio_ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1328 "transformer_blocks.24.audio_ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1329 "transformer_blocks.24.audio_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1330 "transformer_blocks.24.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1331 "transformer_blocks.24.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1332 "transformer_blocks.24.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1333 "transformer_blocks.24.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1334 "transformer_blocks.24.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1335 "transformer_blocks.24.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1336 "transformer_blocks.24.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1337 "transformer_blocks.24.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1338 "transformer_blocks.24.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1339 "transformer_blocks.24.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1340 "transformer_blocks.24.ff.net.0.proj.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1341 "transformer_blocks.24.ff.net.0.proj.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1342 "transformer_blocks.24.ff.net.2.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1343 "transformer_blocks.24.ff.net.2.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1344 "transformer_blocks.24.scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1345 "transformer_blocks.24.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00004-of-00008.safetensors",
1346 "transformer_blocks.24.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1347 "transformer_blocks.24.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1348 "transformer_blocks.24.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1349 "transformer_blocks.24.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1350 "transformer_blocks.24.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1351 "transformer_blocks.24.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1352 "transformer_blocks.24.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1353 "transformer_blocks.24.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1354 "transformer_blocks.24.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00004-of-00008.safetensors",
1355 "transformer_blocks.24.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00004-of-00008.safetensors",
1356 "transformer_blocks.25.attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1357 "transformer_blocks.25.attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1358 "transformer_blocks.25.attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1359 "transformer_blocks.25.attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1360 "transformer_blocks.25.attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1361 "transformer_blocks.25.attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1362 "transformer_blocks.25.attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1363 "transformer_blocks.25.attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1364 "transformer_blocks.25.attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1365 "transformer_blocks.25.attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1366 "transformer_blocks.25.attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1367 "transformer_blocks.25.attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1368 "transformer_blocks.25.attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1369 "transformer_blocks.25.attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1370 "transformer_blocks.25.attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1371 "transformer_blocks.25.attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1372 "transformer_blocks.25.attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1373 "transformer_blocks.25.attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1374 "transformer_blocks.25.attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1375 "transformer_blocks.25.attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1376 "transformer_blocks.25.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1377 "transformer_blocks.25.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1378 "transformer_blocks.25.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1379 "transformer_blocks.25.audio_attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1380 "transformer_blocks.25.audio_attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1381 "transformer_blocks.25.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1382 "transformer_blocks.25.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1383 "transformer_blocks.25.audio_attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1384 "transformer_blocks.25.audio_attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1385 "transformer_blocks.25.audio_attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1386 "transformer_blocks.25.audio_attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1387 "transformer_blocks.25.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1388 "transformer_blocks.25.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1389 "transformer_blocks.25.audio_attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1390 "transformer_blocks.25.audio_attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1391 "transformer_blocks.25.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1392 "transformer_blocks.25.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1393 "transformer_blocks.25.audio_attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1394 "transformer_blocks.25.audio_attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1395 "transformer_blocks.25.audio_attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1396 "transformer_blocks.25.audio_attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1397 "transformer_blocks.25.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1398 "transformer_blocks.25.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1399 "transformer_blocks.25.audio_ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1400 "transformer_blocks.25.audio_ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1401 "transformer_blocks.25.audio_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1402 "transformer_blocks.25.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1403 "transformer_blocks.25.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1404 "transformer_blocks.25.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1405 "transformer_blocks.25.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1406 "transformer_blocks.25.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1407 "transformer_blocks.25.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1408 "transformer_blocks.25.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1409 "transformer_blocks.25.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1410 "transformer_blocks.25.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1411 "transformer_blocks.25.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1412 "transformer_blocks.25.ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1413 "transformer_blocks.25.ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1414 "transformer_blocks.25.ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1415 "transformer_blocks.25.ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1416 "transformer_blocks.25.scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1417 "transformer_blocks.25.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1418 "transformer_blocks.25.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1419 "transformer_blocks.25.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1420 "transformer_blocks.25.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1421 "transformer_blocks.25.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1422 "transformer_blocks.25.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1423 "transformer_blocks.25.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1424 "transformer_blocks.25.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1425 "transformer_blocks.25.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1426 "transformer_blocks.25.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1427 "transformer_blocks.25.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1428 "transformer_blocks.26.attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1429 "transformer_blocks.26.attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1430 "transformer_blocks.26.attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1431 "transformer_blocks.26.attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1432 "transformer_blocks.26.attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1433 "transformer_blocks.26.attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1434 "transformer_blocks.26.attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1435 "transformer_blocks.26.attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1436 "transformer_blocks.26.attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1437 "transformer_blocks.26.attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1438 "transformer_blocks.26.attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1439 "transformer_blocks.26.attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1440 "transformer_blocks.26.attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1441 "transformer_blocks.26.attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1442 "transformer_blocks.26.attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1443 "transformer_blocks.26.attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1444 "transformer_blocks.26.attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1445 "transformer_blocks.26.attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1446 "transformer_blocks.26.attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1447 "transformer_blocks.26.attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1448 "transformer_blocks.26.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1449 "transformer_blocks.26.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1450 "transformer_blocks.26.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1451 "transformer_blocks.26.audio_attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1452 "transformer_blocks.26.audio_attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1453 "transformer_blocks.26.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1454 "transformer_blocks.26.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1455 "transformer_blocks.26.audio_attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1456 "transformer_blocks.26.audio_attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1457 "transformer_blocks.26.audio_attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1458 "transformer_blocks.26.audio_attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1459 "transformer_blocks.26.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1460 "transformer_blocks.26.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1461 "transformer_blocks.26.audio_attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1462 "transformer_blocks.26.audio_attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1463 "transformer_blocks.26.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1464 "transformer_blocks.26.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1465 "transformer_blocks.26.audio_attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1466 "transformer_blocks.26.audio_attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1467 "transformer_blocks.26.audio_attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1468 "transformer_blocks.26.audio_attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1469 "transformer_blocks.26.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1470 "transformer_blocks.26.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1471 "transformer_blocks.26.audio_ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1472 "transformer_blocks.26.audio_ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1473 "transformer_blocks.26.audio_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1474 "transformer_blocks.26.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1475 "transformer_blocks.26.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1476 "transformer_blocks.26.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1477 "transformer_blocks.26.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1478 "transformer_blocks.26.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1479 "transformer_blocks.26.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1480 "transformer_blocks.26.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1481 "transformer_blocks.26.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1482 "transformer_blocks.26.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1483 "transformer_blocks.26.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1484 "transformer_blocks.26.ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1485 "transformer_blocks.26.ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1486 "transformer_blocks.26.ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1487 "transformer_blocks.26.ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1488 "transformer_blocks.26.scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1489 "transformer_blocks.26.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1490 "transformer_blocks.26.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1491 "transformer_blocks.26.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1492 "transformer_blocks.26.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1493 "transformer_blocks.26.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1494 "transformer_blocks.26.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1495 "transformer_blocks.26.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1496 "transformer_blocks.26.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1497 "transformer_blocks.26.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1498 "transformer_blocks.26.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1499 "transformer_blocks.26.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1500 "transformer_blocks.27.attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1501 "transformer_blocks.27.attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1502 "transformer_blocks.27.attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1503 "transformer_blocks.27.attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1504 "transformer_blocks.27.attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1505 "transformer_blocks.27.attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1506 "transformer_blocks.27.attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1507 "transformer_blocks.27.attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1508 "transformer_blocks.27.attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1509 "transformer_blocks.27.attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1510 "transformer_blocks.27.attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1511 "transformer_blocks.27.attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1512 "transformer_blocks.27.attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1513 "transformer_blocks.27.attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1514 "transformer_blocks.27.attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1515 "transformer_blocks.27.attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1516 "transformer_blocks.27.attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1517 "transformer_blocks.27.attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1518 "transformer_blocks.27.attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1519 "transformer_blocks.27.attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1520 "transformer_blocks.27.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1521 "transformer_blocks.27.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1522 "transformer_blocks.27.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1523 "transformer_blocks.27.audio_attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1524 "transformer_blocks.27.audio_attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1525 "transformer_blocks.27.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1526 "transformer_blocks.27.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1527 "transformer_blocks.27.audio_attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1528 "transformer_blocks.27.audio_attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1529 "transformer_blocks.27.audio_attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1530 "transformer_blocks.27.audio_attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1531 "transformer_blocks.27.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1532 "transformer_blocks.27.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1533 "transformer_blocks.27.audio_attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1534 "transformer_blocks.27.audio_attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1535 "transformer_blocks.27.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1536 "transformer_blocks.27.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1537 "transformer_blocks.27.audio_attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1538 "transformer_blocks.27.audio_attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1539 "transformer_blocks.27.audio_attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1540 "transformer_blocks.27.audio_attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1541 "transformer_blocks.27.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1542 "transformer_blocks.27.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1543 "transformer_blocks.27.audio_ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1544 "transformer_blocks.27.audio_ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1545 "transformer_blocks.27.audio_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1546 "transformer_blocks.27.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1547 "transformer_blocks.27.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1548 "transformer_blocks.27.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1549 "transformer_blocks.27.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1550 "transformer_blocks.27.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1551 "transformer_blocks.27.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1552 "transformer_blocks.27.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1553 "transformer_blocks.27.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1554 "transformer_blocks.27.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1555 "transformer_blocks.27.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1556 "transformer_blocks.27.ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1557 "transformer_blocks.27.ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1558 "transformer_blocks.27.ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1559 "transformer_blocks.27.ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1560 "transformer_blocks.27.scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1561 "transformer_blocks.27.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1562 "transformer_blocks.27.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1563 "transformer_blocks.27.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1564 "transformer_blocks.27.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1565 "transformer_blocks.27.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1566 "transformer_blocks.27.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1567 "transformer_blocks.27.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1568 "transformer_blocks.27.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1569 "transformer_blocks.27.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1570 "transformer_blocks.27.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1571 "transformer_blocks.27.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1572 "transformer_blocks.28.attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1573 "transformer_blocks.28.attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1574 "transformer_blocks.28.attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1575 "transformer_blocks.28.attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1576 "transformer_blocks.28.attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1577 "transformer_blocks.28.attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1578 "transformer_blocks.28.attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1579 "transformer_blocks.28.attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1580 "transformer_blocks.28.attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1581 "transformer_blocks.28.attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1582 "transformer_blocks.28.attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1583 "transformer_blocks.28.attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1584 "transformer_blocks.28.attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1585 "transformer_blocks.28.attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1586 "transformer_blocks.28.attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1587 "transformer_blocks.28.attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1588 "transformer_blocks.28.attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1589 "transformer_blocks.28.attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1590 "transformer_blocks.28.attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1591 "transformer_blocks.28.attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1592 "transformer_blocks.28.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1593 "transformer_blocks.28.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1594 "transformer_blocks.28.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1595 "transformer_blocks.28.audio_attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1596 "transformer_blocks.28.audio_attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1597 "transformer_blocks.28.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1598 "transformer_blocks.28.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1599 "transformer_blocks.28.audio_attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1600 "transformer_blocks.28.audio_attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1601 "transformer_blocks.28.audio_attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1602 "transformer_blocks.28.audio_attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1603 "transformer_blocks.28.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1604 "transformer_blocks.28.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1605 "transformer_blocks.28.audio_attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1606 "transformer_blocks.28.audio_attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1607 "transformer_blocks.28.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1608 "transformer_blocks.28.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1609 "transformer_blocks.28.audio_attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1610 "transformer_blocks.28.audio_attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1611 "transformer_blocks.28.audio_attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1612 "transformer_blocks.28.audio_attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1613 "transformer_blocks.28.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1614 "transformer_blocks.28.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1615 "transformer_blocks.28.audio_ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1616 "transformer_blocks.28.audio_ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1617 "transformer_blocks.28.audio_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1618 "transformer_blocks.28.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1619 "transformer_blocks.28.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1620 "transformer_blocks.28.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1621 "transformer_blocks.28.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1622 "transformer_blocks.28.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1623 "transformer_blocks.28.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1624 "transformer_blocks.28.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1625 "transformer_blocks.28.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1626 "transformer_blocks.28.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1627 "transformer_blocks.28.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1628 "transformer_blocks.28.ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1629 "transformer_blocks.28.ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1630 "transformer_blocks.28.ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1631 "transformer_blocks.28.ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1632 "transformer_blocks.28.scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1633 "transformer_blocks.28.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1634 "transformer_blocks.28.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1635 "transformer_blocks.28.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1636 "transformer_blocks.28.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1637 "transformer_blocks.28.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1638 "transformer_blocks.28.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1639 "transformer_blocks.28.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1640 "transformer_blocks.28.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1641 "transformer_blocks.28.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1642 "transformer_blocks.28.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1643 "transformer_blocks.28.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1644 "transformer_blocks.29.attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1645 "transformer_blocks.29.attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1646 "transformer_blocks.29.attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1647 "transformer_blocks.29.attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1648 "transformer_blocks.29.attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1649 "transformer_blocks.29.attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1650 "transformer_blocks.29.attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1651 "transformer_blocks.29.attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1652 "transformer_blocks.29.attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1653 "transformer_blocks.29.attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1654 "transformer_blocks.29.attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1655 "transformer_blocks.29.attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1656 "transformer_blocks.29.attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1657 "transformer_blocks.29.attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1658 "transformer_blocks.29.attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1659 "transformer_blocks.29.attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1660 "transformer_blocks.29.attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1661 "transformer_blocks.29.attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1662 "transformer_blocks.29.attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1663 "transformer_blocks.29.attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1664 "transformer_blocks.29.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1665 "transformer_blocks.29.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1666 "transformer_blocks.29.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1667 "transformer_blocks.29.audio_attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1668 "transformer_blocks.29.audio_attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1669 "transformer_blocks.29.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1670 "transformer_blocks.29.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1671 "transformer_blocks.29.audio_attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1672 "transformer_blocks.29.audio_attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1673 "transformer_blocks.29.audio_attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1674 "transformer_blocks.29.audio_attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1675 "transformer_blocks.29.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1676 "transformer_blocks.29.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1677 "transformer_blocks.29.audio_attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1678 "transformer_blocks.29.audio_attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1679 "transformer_blocks.29.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1680 "transformer_blocks.29.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1681 "transformer_blocks.29.audio_attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1682 "transformer_blocks.29.audio_attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1683 "transformer_blocks.29.audio_attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1684 "transformer_blocks.29.audio_attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1685 "transformer_blocks.29.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1686 "transformer_blocks.29.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1687 "transformer_blocks.29.audio_ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1688 "transformer_blocks.29.audio_ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1689 "transformer_blocks.29.audio_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1690 "transformer_blocks.29.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1691 "transformer_blocks.29.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1692 "transformer_blocks.29.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1693 "transformer_blocks.29.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1694 "transformer_blocks.29.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1695 "transformer_blocks.29.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1696 "transformer_blocks.29.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1697 "transformer_blocks.29.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1698 "transformer_blocks.29.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1699 "transformer_blocks.29.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1700 "transformer_blocks.29.ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1701 "transformer_blocks.29.ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1702 "transformer_blocks.29.ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1703 "transformer_blocks.29.ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1704 "transformer_blocks.29.scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1705 "transformer_blocks.29.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1706 "transformer_blocks.29.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1707 "transformer_blocks.29.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1708 "transformer_blocks.29.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1709 "transformer_blocks.29.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1710 "transformer_blocks.29.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1711 "transformer_blocks.29.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1712 "transformer_blocks.29.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1713 "transformer_blocks.29.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1714 "transformer_blocks.29.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1715 "transformer_blocks.29.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1716 "transformer_blocks.3.attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1717 "transformer_blocks.3.attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1718 "transformer_blocks.3.attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1719 "transformer_blocks.3.attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1720 "transformer_blocks.3.attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1721 "transformer_blocks.3.attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1722 "transformer_blocks.3.attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1723 "transformer_blocks.3.attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1724 "transformer_blocks.3.attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1725 "transformer_blocks.3.attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1726 "transformer_blocks.3.attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1727 "transformer_blocks.3.attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1728 "transformer_blocks.3.attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1729 "transformer_blocks.3.attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1730 "transformer_blocks.3.attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1731 "transformer_blocks.3.attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1732 "transformer_blocks.3.attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1733 "transformer_blocks.3.attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1734 "transformer_blocks.3.attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1735 "transformer_blocks.3.attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1736 "transformer_blocks.3.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
1737 "transformer_blocks.3.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1738 "transformer_blocks.3.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1739 "transformer_blocks.3.audio_attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1740 "transformer_blocks.3.audio_attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1741 "transformer_blocks.3.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1742 "transformer_blocks.3.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1743 "transformer_blocks.3.audio_attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1744 "transformer_blocks.3.audio_attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1745 "transformer_blocks.3.audio_attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1746 "transformer_blocks.3.audio_attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1747 "transformer_blocks.3.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1748 "transformer_blocks.3.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1749 "transformer_blocks.3.audio_attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1750 "transformer_blocks.3.audio_attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1751 "transformer_blocks.3.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1752 "transformer_blocks.3.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1753 "transformer_blocks.3.audio_attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1754 "transformer_blocks.3.audio_attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1755 "transformer_blocks.3.audio_attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1756 "transformer_blocks.3.audio_attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1757 "transformer_blocks.3.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1758 "transformer_blocks.3.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1759 "transformer_blocks.3.audio_ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1760 "transformer_blocks.3.audio_ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1761 "transformer_blocks.3.audio_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
1762 "transformer_blocks.3.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1763 "transformer_blocks.3.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1764 "transformer_blocks.3.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1765 "transformer_blocks.3.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1766 "transformer_blocks.3.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1767 "transformer_blocks.3.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1768 "transformer_blocks.3.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1769 "transformer_blocks.3.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1770 "transformer_blocks.3.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1771 "transformer_blocks.3.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1772 "transformer_blocks.3.ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1773 "transformer_blocks.3.ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1774 "transformer_blocks.3.ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1775 "transformer_blocks.3.ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1776 "transformer_blocks.3.scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
1777 "transformer_blocks.3.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
1778 "transformer_blocks.3.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1779 "transformer_blocks.3.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1780 "transformer_blocks.3.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1781 "transformer_blocks.3.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1782 "transformer_blocks.3.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1783 "transformer_blocks.3.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1784 "transformer_blocks.3.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1785 "transformer_blocks.3.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1786 "transformer_blocks.3.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
1787 "transformer_blocks.3.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
1788 "transformer_blocks.30.attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1789 "transformer_blocks.30.attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1790 "transformer_blocks.30.attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1791 "transformer_blocks.30.attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1792 "transformer_blocks.30.attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1793 "transformer_blocks.30.attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1794 "transformer_blocks.30.attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1795 "transformer_blocks.30.attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1796 "transformer_blocks.30.attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1797 "transformer_blocks.30.attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1798 "transformer_blocks.30.attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1799 "transformer_blocks.30.attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1800 "transformer_blocks.30.attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1801 "transformer_blocks.30.attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1802 "transformer_blocks.30.attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1803 "transformer_blocks.30.attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1804 "transformer_blocks.30.attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1805 "transformer_blocks.30.attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1806 "transformer_blocks.30.attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1807 "transformer_blocks.30.attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1808 "transformer_blocks.30.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1809 "transformer_blocks.30.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1810 "transformer_blocks.30.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1811 "transformer_blocks.30.audio_attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1812 "transformer_blocks.30.audio_attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1813 "transformer_blocks.30.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1814 "transformer_blocks.30.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1815 "transformer_blocks.30.audio_attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1816 "transformer_blocks.30.audio_attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1817 "transformer_blocks.30.audio_attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1818 "transformer_blocks.30.audio_attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1819 "transformer_blocks.30.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1820 "transformer_blocks.30.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1821 "transformer_blocks.30.audio_attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1822 "transformer_blocks.30.audio_attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1823 "transformer_blocks.30.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1824 "transformer_blocks.30.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1825 "transformer_blocks.30.audio_attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1826 "transformer_blocks.30.audio_attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1827 "transformer_blocks.30.audio_attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1828 "transformer_blocks.30.audio_attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1829 "transformer_blocks.30.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1830 "transformer_blocks.30.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1831 "transformer_blocks.30.audio_ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1832 "transformer_blocks.30.audio_ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1833 "transformer_blocks.30.audio_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1834 "transformer_blocks.30.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1835 "transformer_blocks.30.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1836 "transformer_blocks.30.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1837 "transformer_blocks.30.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1838 "transformer_blocks.30.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1839 "transformer_blocks.30.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1840 "transformer_blocks.30.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1841 "transformer_blocks.30.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1842 "transformer_blocks.30.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1843 "transformer_blocks.30.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1844 "transformer_blocks.30.ff.net.0.proj.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1845 "transformer_blocks.30.ff.net.0.proj.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1846 "transformer_blocks.30.ff.net.2.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1847 "transformer_blocks.30.ff.net.2.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1848 "transformer_blocks.30.scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1849 "transformer_blocks.30.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1850 "transformer_blocks.30.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1851 "transformer_blocks.30.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1852 "transformer_blocks.30.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1853 "transformer_blocks.30.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1854 "transformer_blocks.30.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1855 "transformer_blocks.30.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1856 "transformer_blocks.30.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1857 "transformer_blocks.30.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1858 "transformer_blocks.30.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1859 "transformer_blocks.30.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1860 "transformer_blocks.31.attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1861 "transformer_blocks.31.attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1862 "transformer_blocks.31.attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1863 "transformer_blocks.31.attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1864 "transformer_blocks.31.attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1865 "transformer_blocks.31.attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1866 "transformer_blocks.31.attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1867 "transformer_blocks.31.attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1868 "transformer_blocks.31.attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1869 "transformer_blocks.31.attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1870 "transformer_blocks.31.attn2.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1871 "transformer_blocks.31.attn2.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1872 "transformer_blocks.31.attn2.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1873 "transformer_blocks.31.attn2.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1874 "transformer_blocks.31.attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1875 "transformer_blocks.31.attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1876 "transformer_blocks.31.attn2.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1877 "transformer_blocks.31.attn2.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1878 "transformer_blocks.31.attn2.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1879 "transformer_blocks.31.attn2.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1880 "transformer_blocks.31.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1881 "transformer_blocks.31.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1882 "transformer_blocks.31.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1883 "transformer_blocks.31.audio_attn1.to_k.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1884 "transformer_blocks.31.audio_attn1.to_k.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1885 "transformer_blocks.31.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1886 "transformer_blocks.31.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1887 "transformer_blocks.31.audio_attn1.to_q.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1888 "transformer_blocks.31.audio_attn1.to_q.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1889 "transformer_blocks.31.audio_attn1.to_v.bias": "diffusion_pytorch_model-00005-of-00008.safetensors",
1890 "transformer_blocks.31.audio_attn1.to_v.weight": "diffusion_pytorch_model-00005-of-00008.safetensors",
1891 "transformer_blocks.31.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1892 "transformer_blocks.31.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1893 "transformer_blocks.31.audio_attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1894 "transformer_blocks.31.audio_attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1895 "transformer_blocks.31.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1896 "transformer_blocks.31.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1897 "transformer_blocks.31.audio_attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1898 "transformer_blocks.31.audio_attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1899 "transformer_blocks.31.audio_attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1900 "transformer_blocks.31.audio_attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1901 "transformer_blocks.31.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1902 "transformer_blocks.31.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1903 "transformer_blocks.31.audio_ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1904 "transformer_blocks.31.audio_ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1905 "transformer_blocks.31.audio_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1906 "transformer_blocks.31.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1907 "transformer_blocks.31.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1908 "transformer_blocks.31.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1909 "transformer_blocks.31.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1910 "transformer_blocks.31.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1911 "transformer_blocks.31.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1912 "transformer_blocks.31.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1913 "transformer_blocks.31.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1914 "transformer_blocks.31.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1915 "transformer_blocks.31.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1916 "transformer_blocks.31.ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1917 "transformer_blocks.31.ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1918 "transformer_blocks.31.ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1919 "transformer_blocks.31.ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1920 "transformer_blocks.31.scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1921 "transformer_blocks.31.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00005-of-00008.safetensors",
1922 "transformer_blocks.31.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1923 "transformer_blocks.31.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1924 "transformer_blocks.31.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1925 "transformer_blocks.31.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1926 "transformer_blocks.31.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1927 "transformer_blocks.31.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1928 "transformer_blocks.31.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1929 "transformer_blocks.31.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1930 "transformer_blocks.31.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1931 "transformer_blocks.31.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1932 "transformer_blocks.32.attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1933 "transformer_blocks.32.attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1934 "transformer_blocks.32.attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1935 "transformer_blocks.32.attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1936 "transformer_blocks.32.attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1937 "transformer_blocks.32.attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1938 "transformer_blocks.32.attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1939 "transformer_blocks.32.attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1940 "transformer_blocks.32.attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1941 "transformer_blocks.32.attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1942 "transformer_blocks.32.attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1943 "transformer_blocks.32.attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1944 "transformer_blocks.32.attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1945 "transformer_blocks.32.attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1946 "transformer_blocks.32.attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1947 "transformer_blocks.32.attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1948 "transformer_blocks.32.attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1949 "transformer_blocks.32.attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1950 "transformer_blocks.32.attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1951 "transformer_blocks.32.attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1952 "transformer_blocks.32.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
1953 "transformer_blocks.32.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1954 "transformer_blocks.32.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1955 "transformer_blocks.32.audio_attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1956 "transformer_blocks.32.audio_attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1957 "transformer_blocks.32.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1958 "transformer_blocks.32.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1959 "transformer_blocks.32.audio_attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1960 "transformer_blocks.32.audio_attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1961 "transformer_blocks.32.audio_attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1962 "transformer_blocks.32.audio_attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1963 "transformer_blocks.32.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1964 "transformer_blocks.32.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1965 "transformer_blocks.32.audio_attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1966 "transformer_blocks.32.audio_attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1967 "transformer_blocks.32.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1968 "transformer_blocks.32.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1969 "transformer_blocks.32.audio_attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1970 "transformer_blocks.32.audio_attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1971 "transformer_blocks.32.audio_attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1972 "transformer_blocks.32.audio_attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1973 "transformer_blocks.32.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1974 "transformer_blocks.32.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1975 "transformer_blocks.32.audio_ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1976 "transformer_blocks.32.audio_ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1977 "transformer_blocks.32.audio_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
1978 "transformer_blocks.32.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1979 "transformer_blocks.32.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1980 "transformer_blocks.32.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1981 "transformer_blocks.32.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1982 "transformer_blocks.32.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1983 "transformer_blocks.32.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1984 "transformer_blocks.32.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1985 "transformer_blocks.32.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1986 "transformer_blocks.32.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1987 "transformer_blocks.32.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1988 "transformer_blocks.32.ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1989 "transformer_blocks.32.ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1990 "transformer_blocks.32.ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1991 "transformer_blocks.32.ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1992 "transformer_blocks.32.scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
1993 "transformer_blocks.32.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
1994 "transformer_blocks.32.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1995 "transformer_blocks.32.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1996 "transformer_blocks.32.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1997 "transformer_blocks.32.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
1998 "transformer_blocks.32.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
1999 "transformer_blocks.32.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2000 "transformer_blocks.32.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2001 "transformer_blocks.32.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2002 "transformer_blocks.32.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2003 "transformer_blocks.32.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2004 "transformer_blocks.33.attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2005 "transformer_blocks.33.attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2006 "transformer_blocks.33.attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2007 "transformer_blocks.33.attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2008 "transformer_blocks.33.attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2009 "transformer_blocks.33.attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2010 "transformer_blocks.33.attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2011 "transformer_blocks.33.attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2012 "transformer_blocks.33.attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2013 "transformer_blocks.33.attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2014 "transformer_blocks.33.attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2015 "transformer_blocks.33.attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2016 "transformer_blocks.33.attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2017 "transformer_blocks.33.attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2018 "transformer_blocks.33.attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2019 "transformer_blocks.33.attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2020 "transformer_blocks.33.attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2021 "transformer_blocks.33.attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2022 "transformer_blocks.33.attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2023 "transformer_blocks.33.attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2024 "transformer_blocks.33.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2025 "transformer_blocks.33.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2026 "transformer_blocks.33.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2027 "transformer_blocks.33.audio_attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2028 "transformer_blocks.33.audio_attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2029 "transformer_blocks.33.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2030 "transformer_blocks.33.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2031 "transformer_blocks.33.audio_attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2032 "transformer_blocks.33.audio_attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2033 "transformer_blocks.33.audio_attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2034 "transformer_blocks.33.audio_attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2035 "transformer_blocks.33.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2036 "transformer_blocks.33.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2037 "transformer_blocks.33.audio_attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2038 "transformer_blocks.33.audio_attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2039 "transformer_blocks.33.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2040 "transformer_blocks.33.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2041 "transformer_blocks.33.audio_attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2042 "transformer_blocks.33.audio_attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2043 "transformer_blocks.33.audio_attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2044 "transformer_blocks.33.audio_attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2045 "transformer_blocks.33.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2046 "transformer_blocks.33.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2047 "transformer_blocks.33.audio_ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2048 "transformer_blocks.33.audio_ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2049 "transformer_blocks.33.audio_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2050 "transformer_blocks.33.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2051 "transformer_blocks.33.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2052 "transformer_blocks.33.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2053 "transformer_blocks.33.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2054 "transformer_blocks.33.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2055 "transformer_blocks.33.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2056 "transformer_blocks.33.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2057 "transformer_blocks.33.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2058 "transformer_blocks.33.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2059 "transformer_blocks.33.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2060 "transformer_blocks.33.ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2061 "transformer_blocks.33.ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2062 "transformer_blocks.33.ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2063 "transformer_blocks.33.ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2064 "transformer_blocks.33.scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2065 "transformer_blocks.33.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2066 "transformer_blocks.33.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2067 "transformer_blocks.33.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2068 "transformer_blocks.33.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2069 "transformer_blocks.33.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2070 "transformer_blocks.33.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2071 "transformer_blocks.33.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2072 "transformer_blocks.33.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2073 "transformer_blocks.33.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2074 "transformer_blocks.33.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2075 "transformer_blocks.33.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2076 "transformer_blocks.34.attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2077 "transformer_blocks.34.attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2078 "transformer_blocks.34.attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2079 "transformer_blocks.34.attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2080 "transformer_blocks.34.attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2081 "transformer_blocks.34.attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2082 "transformer_blocks.34.attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2083 "transformer_blocks.34.attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2084 "transformer_blocks.34.attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2085 "transformer_blocks.34.attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2086 "transformer_blocks.34.attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2087 "transformer_blocks.34.attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2088 "transformer_blocks.34.attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2089 "transformer_blocks.34.attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2090 "transformer_blocks.34.attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2091 "transformer_blocks.34.attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2092 "transformer_blocks.34.attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2093 "transformer_blocks.34.attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2094 "transformer_blocks.34.attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2095 "transformer_blocks.34.attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2096 "transformer_blocks.34.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2097 "transformer_blocks.34.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2098 "transformer_blocks.34.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2099 "transformer_blocks.34.audio_attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2100 "transformer_blocks.34.audio_attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2101 "transformer_blocks.34.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2102 "transformer_blocks.34.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2103 "transformer_blocks.34.audio_attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2104 "transformer_blocks.34.audio_attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2105 "transformer_blocks.34.audio_attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2106 "transformer_blocks.34.audio_attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2107 "transformer_blocks.34.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2108 "transformer_blocks.34.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2109 "transformer_blocks.34.audio_attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2110 "transformer_blocks.34.audio_attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2111 "transformer_blocks.34.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2112 "transformer_blocks.34.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2113 "transformer_blocks.34.audio_attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2114 "transformer_blocks.34.audio_attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2115 "transformer_blocks.34.audio_attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2116 "transformer_blocks.34.audio_attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2117 "transformer_blocks.34.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2118 "transformer_blocks.34.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2119 "transformer_blocks.34.audio_ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2120 "transformer_blocks.34.audio_ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2121 "transformer_blocks.34.audio_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2122 "transformer_blocks.34.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2123 "transformer_blocks.34.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2124 "transformer_blocks.34.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2125 "transformer_blocks.34.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2126 "transformer_blocks.34.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2127 "transformer_blocks.34.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2128 "transformer_blocks.34.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2129 "transformer_blocks.34.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2130 "transformer_blocks.34.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2131 "transformer_blocks.34.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2132 "transformer_blocks.34.ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2133 "transformer_blocks.34.ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2134 "transformer_blocks.34.ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2135 "transformer_blocks.34.ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2136 "transformer_blocks.34.scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2137 "transformer_blocks.34.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2138 "transformer_blocks.34.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2139 "transformer_blocks.34.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2140 "transformer_blocks.34.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2141 "transformer_blocks.34.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2142 "transformer_blocks.34.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2143 "transformer_blocks.34.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2144 "transformer_blocks.34.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2145 "transformer_blocks.34.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2146 "transformer_blocks.34.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2147 "transformer_blocks.34.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2148 "transformer_blocks.35.attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2149 "transformer_blocks.35.attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2150 "transformer_blocks.35.attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2151 "transformer_blocks.35.attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2152 "transformer_blocks.35.attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2153 "transformer_blocks.35.attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2154 "transformer_blocks.35.attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2155 "transformer_blocks.35.attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2156 "transformer_blocks.35.attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2157 "transformer_blocks.35.attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2158 "transformer_blocks.35.attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2159 "transformer_blocks.35.attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2160 "transformer_blocks.35.attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2161 "transformer_blocks.35.attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2162 "transformer_blocks.35.attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2163 "transformer_blocks.35.attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2164 "transformer_blocks.35.attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2165 "transformer_blocks.35.attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2166 "transformer_blocks.35.attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2167 "transformer_blocks.35.attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2168 "transformer_blocks.35.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2169 "transformer_blocks.35.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2170 "transformer_blocks.35.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2171 "transformer_blocks.35.audio_attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2172 "transformer_blocks.35.audio_attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2173 "transformer_blocks.35.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2174 "transformer_blocks.35.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2175 "transformer_blocks.35.audio_attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2176 "transformer_blocks.35.audio_attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2177 "transformer_blocks.35.audio_attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2178 "transformer_blocks.35.audio_attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2179 "transformer_blocks.35.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2180 "transformer_blocks.35.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2181 "transformer_blocks.35.audio_attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2182 "transformer_blocks.35.audio_attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2183 "transformer_blocks.35.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2184 "transformer_blocks.35.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2185 "transformer_blocks.35.audio_attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2186 "transformer_blocks.35.audio_attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2187 "transformer_blocks.35.audio_attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2188 "transformer_blocks.35.audio_attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2189 "transformer_blocks.35.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2190 "transformer_blocks.35.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2191 "transformer_blocks.35.audio_ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2192 "transformer_blocks.35.audio_ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2193 "transformer_blocks.35.audio_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2194 "transformer_blocks.35.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2195 "transformer_blocks.35.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2196 "transformer_blocks.35.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2197 "transformer_blocks.35.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2198 "transformer_blocks.35.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2199 "transformer_blocks.35.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2200 "transformer_blocks.35.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2201 "transformer_blocks.35.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2202 "transformer_blocks.35.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2203 "transformer_blocks.35.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2204 "transformer_blocks.35.ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2205 "transformer_blocks.35.ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2206 "transformer_blocks.35.ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2207 "transformer_blocks.35.ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2208 "transformer_blocks.35.scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2209 "transformer_blocks.35.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2210 "transformer_blocks.35.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2211 "transformer_blocks.35.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2212 "transformer_blocks.35.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2213 "transformer_blocks.35.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2214 "transformer_blocks.35.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2215 "transformer_blocks.35.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2216 "transformer_blocks.35.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2217 "transformer_blocks.35.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2218 "transformer_blocks.35.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2219 "transformer_blocks.35.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2220 "transformer_blocks.36.attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2221 "transformer_blocks.36.attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2222 "transformer_blocks.36.attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2223 "transformer_blocks.36.attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2224 "transformer_blocks.36.attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2225 "transformer_blocks.36.attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2226 "transformer_blocks.36.attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2227 "transformer_blocks.36.attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2228 "transformer_blocks.36.attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2229 "transformer_blocks.36.attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2230 "transformer_blocks.36.attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2231 "transformer_blocks.36.attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2232 "transformer_blocks.36.attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2233 "transformer_blocks.36.attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2234 "transformer_blocks.36.attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2235 "transformer_blocks.36.attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2236 "transformer_blocks.36.attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2237 "transformer_blocks.36.attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2238 "transformer_blocks.36.attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2239 "transformer_blocks.36.attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2240 "transformer_blocks.36.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2241 "transformer_blocks.36.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2242 "transformer_blocks.36.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2243 "transformer_blocks.36.audio_attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2244 "transformer_blocks.36.audio_attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2245 "transformer_blocks.36.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2246 "transformer_blocks.36.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2247 "transformer_blocks.36.audio_attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2248 "transformer_blocks.36.audio_attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2249 "transformer_blocks.36.audio_attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2250 "transformer_blocks.36.audio_attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2251 "transformer_blocks.36.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2252 "transformer_blocks.36.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2253 "transformer_blocks.36.audio_attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2254 "transformer_blocks.36.audio_attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2255 "transformer_blocks.36.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2256 "transformer_blocks.36.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2257 "transformer_blocks.36.audio_attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2258 "transformer_blocks.36.audio_attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2259 "transformer_blocks.36.audio_attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2260 "transformer_blocks.36.audio_attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2261 "transformer_blocks.36.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2262 "transformer_blocks.36.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2263 "transformer_blocks.36.audio_ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2264 "transformer_blocks.36.audio_ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2265 "transformer_blocks.36.audio_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2266 "transformer_blocks.36.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2267 "transformer_blocks.36.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2268 "transformer_blocks.36.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2269 "transformer_blocks.36.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2270 "transformer_blocks.36.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2271 "transformer_blocks.36.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2272 "transformer_blocks.36.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2273 "transformer_blocks.36.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2274 "transformer_blocks.36.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2275 "transformer_blocks.36.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2276 "transformer_blocks.36.ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2277 "transformer_blocks.36.ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2278 "transformer_blocks.36.ff.net.2.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2279 "transformer_blocks.36.ff.net.2.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2280 "transformer_blocks.36.scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2281 "transformer_blocks.36.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2282 "transformer_blocks.36.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2283 "transformer_blocks.36.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2284 "transformer_blocks.36.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2285 "transformer_blocks.36.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2286 "transformer_blocks.36.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2287 "transformer_blocks.36.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2288 "transformer_blocks.36.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2289 "transformer_blocks.36.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2290 "transformer_blocks.36.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2291 "transformer_blocks.36.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2292 "transformer_blocks.37.attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2293 "transformer_blocks.37.attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2294 "transformer_blocks.37.attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2295 "transformer_blocks.37.attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2296 "transformer_blocks.37.attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2297 "transformer_blocks.37.attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2298 "transformer_blocks.37.attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2299 "transformer_blocks.37.attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2300 "transformer_blocks.37.attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2301 "transformer_blocks.37.attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2302 "transformer_blocks.37.attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2303 "transformer_blocks.37.attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2304 "transformer_blocks.37.attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2305 "transformer_blocks.37.attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2306 "transformer_blocks.37.attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2307 "transformer_blocks.37.attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2308 "transformer_blocks.37.attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2309 "transformer_blocks.37.attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2310 "transformer_blocks.37.attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2311 "transformer_blocks.37.attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2312 "transformer_blocks.37.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2313 "transformer_blocks.37.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2314 "transformer_blocks.37.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2315 "transformer_blocks.37.audio_attn1.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2316 "transformer_blocks.37.audio_attn1.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2317 "transformer_blocks.37.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2318 "transformer_blocks.37.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2319 "transformer_blocks.37.audio_attn1.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2320 "transformer_blocks.37.audio_attn1.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2321 "transformer_blocks.37.audio_attn1.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2322 "transformer_blocks.37.audio_attn1.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2323 "transformer_blocks.37.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2324 "transformer_blocks.37.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2325 "transformer_blocks.37.audio_attn2.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2326 "transformer_blocks.37.audio_attn2.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2327 "transformer_blocks.37.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2328 "transformer_blocks.37.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2329 "transformer_blocks.37.audio_attn2.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2330 "transformer_blocks.37.audio_attn2.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2331 "transformer_blocks.37.audio_attn2.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2332 "transformer_blocks.37.audio_attn2.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2333 "transformer_blocks.37.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2334 "transformer_blocks.37.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2335 "transformer_blocks.37.audio_ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2336 "transformer_blocks.37.audio_ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2337 "transformer_blocks.37.audio_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2338 "transformer_blocks.37.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2339 "transformer_blocks.37.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2340 "transformer_blocks.37.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2341 "transformer_blocks.37.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2342 "transformer_blocks.37.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2343 "transformer_blocks.37.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2344 "transformer_blocks.37.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2345 "transformer_blocks.37.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2346 "transformer_blocks.37.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2347 "transformer_blocks.37.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2348 "transformer_blocks.37.ff.net.0.proj.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2349 "transformer_blocks.37.ff.net.0.proj.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2350 "transformer_blocks.37.ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2351 "transformer_blocks.37.ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2352 "transformer_blocks.37.scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2353 "transformer_blocks.37.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00006-of-00008.safetensors",
2354 "transformer_blocks.37.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2355 "transformer_blocks.37.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2356 "transformer_blocks.37.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2357 "transformer_blocks.37.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2358 "transformer_blocks.37.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2359 "transformer_blocks.37.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2360 "transformer_blocks.37.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2361 "transformer_blocks.37.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2362 "transformer_blocks.37.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00006-of-00008.safetensors",
2363 "transformer_blocks.37.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00006-of-00008.safetensors",
2364 "transformer_blocks.38.attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2365 "transformer_blocks.38.attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2366 "transformer_blocks.38.attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2367 "transformer_blocks.38.attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2368 "transformer_blocks.38.attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2369 "transformer_blocks.38.attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2370 "transformer_blocks.38.attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2371 "transformer_blocks.38.attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2372 "transformer_blocks.38.attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2373 "transformer_blocks.38.attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2374 "transformer_blocks.38.attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2375 "transformer_blocks.38.attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2376 "transformer_blocks.38.attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2377 "transformer_blocks.38.attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2378 "transformer_blocks.38.attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2379 "transformer_blocks.38.attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2380 "transformer_blocks.38.attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2381 "transformer_blocks.38.attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2382 "transformer_blocks.38.attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2383 "transformer_blocks.38.attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2384 "transformer_blocks.38.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2385 "transformer_blocks.38.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2386 "transformer_blocks.38.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2387 "transformer_blocks.38.audio_attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2388 "transformer_blocks.38.audio_attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2389 "transformer_blocks.38.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2390 "transformer_blocks.38.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2391 "transformer_blocks.38.audio_attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2392 "transformer_blocks.38.audio_attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2393 "transformer_blocks.38.audio_attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2394 "transformer_blocks.38.audio_attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2395 "transformer_blocks.38.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2396 "transformer_blocks.38.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2397 "transformer_blocks.38.audio_attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2398 "transformer_blocks.38.audio_attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2399 "transformer_blocks.38.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2400 "transformer_blocks.38.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2401 "transformer_blocks.38.audio_attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2402 "transformer_blocks.38.audio_attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2403 "transformer_blocks.38.audio_attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2404 "transformer_blocks.38.audio_attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2405 "transformer_blocks.38.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2406 "transformer_blocks.38.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2407 "transformer_blocks.38.audio_ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2408 "transformer_blocks.38.audio_ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2409 "transformer_blocks.38.audio_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2410 "transformer_blocks.38.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2411 "transformer_blocks.38.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2412 "transformer_blocks.38.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2413 "transformer_blocks.38.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2414 "transformer_blocks.38.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2415 "transformer_blocks.38.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2416 "transformer_blocks.38.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2417 "transformer_blocks.38.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2418 "transformer_blocks.38.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2419 "transformer_blocks.38.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2420 "transformer_blocks.38.ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2421 "transformer_blocks.38.ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2422 "transformer_blocks.38.ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2423 "transformer_blocks.38.ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2424 "transformer_blocks.38.scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2425 "transformer_blocks.38.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2426 "transformer_blocks.38.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2427 "transformer_blocks.38.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2428 "transformer_blocks.38.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2429 "transformer_blocks.38.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2430 "transformer_blocks.38.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2431 "transformer_blocks.38.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2432 "transformer_blocks.38.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2433 "transformer_blocks.38.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2434 "transformer_blocks.38.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2435 "transformer_blocks.38.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2436 "transformer_blocks.39.attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2437 "transformer_blocks.39.attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2438 "transformer_blocks.39.attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2439 "transformer_blocks.39.attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2440 "transformer_blocks.39.attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2441 "transformer_blocks.39.attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2442 "transformer_blocks.39.attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2443 "transformer_blocks.39.attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2444 "transformer_blocks.39.attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2445 "transformer_blocks.39.attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2446 "transformer_blocks.39.attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2447 "transformer_blocks.39.attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2448 "transformer_blocks.39.attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2449 "transformer_blocks.39.attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2450 "transformer_blocks.39.attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2451 "transformer_blocks.39.attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2452 "transformer_blocks.39.attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2453 "transformer_blocks.39.attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2454 "transformer_blocks.39.attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2455 "transformer_blocks.39.attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2456 "transformer_blocks.39.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2457 "transformer_blocks.39.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2458 "transformer_blocks.39.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2459 "transformer_blocks.39.audio_attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2460 "transformer_blocks.39.audio_attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2461 "transformer_blocks.39.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2462 "transformer_blocks.39.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2463 "transformer_blocks.39.audio_attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2464 "transformer_blocks.39.audio_attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2465 "transformer_blocks.39.audio_attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2466 "transformer_blocks.39.audio_attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2467 "transformer_blocks.39.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2468 "transformer_blocks.39.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2469 "transformer_blocks.39.audio_attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2470 "transformer_blocks.39.audio_attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2471 "transformer_blocks.39.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2472 "transformer_blocks.39.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2473 "transformer_blocks.39.audio_attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2474 "transformer_blocks.39.audio_attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2475 "transformer_blocks.39.audio_attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2476 "transformer_blocks.39.audio_attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2477 "transformer_blocks.39.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2478 "transformer_blocks.39.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2479 "transformer_blocks.39.audio_ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2480 "transformer_blocks.39.audio_ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2481 "transformer_blocks.39.audio_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2482 "transformer_blocks.39.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2483 "transformer_blocks.39.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2484 "transformer_blocks.39.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2485 "transformer_blocks.39.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2486 "transformer_blocks.39.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2487 "transformer_blocks.39.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2488 "transformer_blocks.39.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2489 "transformer_blocks.39.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2490 "transformer_blocks.39.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2491 "transformer_blocks.39.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2492 "transformer_blocks.39.ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2493 "transformer_blocks.39.ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2494 "transformer_blocks.39.ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2495 "transformer_blocks.39.ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2496 "transformer_blocks.39.scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2497 "transformer_blocks.39.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2498 "transformer_blocks.39.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2499 "transformer_blocks.39.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2500 "transformer_blocks.39.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2501 "transformer_blocks.39.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2502 "transformer_blocks.39.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2503 "transformer_blocks.39.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2504 "transformer_blocks.39.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2505 "transformer_blocks.39.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2506 "transformer_blocks.39.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2507 "transformer_blocks.39.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2508 "transformer_blocks.4.attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2509 "transformer_blocks.4.attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2510 "transformer_blocks.4.attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2511 "transformer_blocks.4.attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2512 "transformer_blocks.4.attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2513 "transformer_blocks.4.attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2514 "transformer_blocks.4.attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2515 "transformer_blocks.4.attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2516 "transformer_blocks.4.attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2517 "transformer_blocks.4.attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2518 "transformer_blocks.4.attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2519 "transformer_blocks.4.attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2520 "transformer_blocks.4.attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2521 "transformer_blocks.4.attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2522 "transformer_blocks.4.attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2523 "transformer_blocks.4.attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2524 "transformer_blocks.4.attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2525 "transformer_blocks.4.attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2526 "transformer_blocks.4.attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2527 "transformer_blocks.4.attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2528 "transformer_blocks.4.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
2529 "transformer_blocks.4.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2530 "transformer_blocks.4.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2531 "transformer_blocks.4.audio_attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2532 "transformer_blocks.4.audio_attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2533 "transformer_blocks.4.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2534 "transformer_blocks.4.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2535 "transformer_blocks.4.audio_attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2536 "transformer_blocks.4.audio_attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2537 "transformer_blocks.4.audio_attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2538 "transformer_blocks.4.audio_attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2539 "transformer_blocks.4.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2540 "transformer_blocks.4.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2541 "transformer_blocks.4.audio_attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2542 "transformer_blocks.4.audio_attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2543 "transformer_blocks.4.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2544 "transformer_blocks.4.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2545 "transformer_blocks.4.audio_attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2546 "transformer_blocks.4.audio_attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2547 "transformer_blocks.4.audio_attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2548 "transformer_blocks.4.audio_attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2549 "transformer_blocks.4.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2550 "transformer_blocks.4.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2551 "transformer_blocks.4.audio_ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2552 "transformer_blocks.4.audio_ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2553 "transformer_blocks.4.audio_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
2554 "transformer_blocks.4.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2555 "transformer_blocks.4.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2556 "transformer_blocks.4.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2557 "transformer_blocks.4.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2558 "transformer_blocks.4.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2559 "transformer_blocks.4.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2560 "transformer_blocks.4.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2561 "transformer_blocks.4.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2562 "transformer_blocks.4.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2563 "transformer_blocks.4.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2564 "transformer_blocks.4.ff.net.0.proj.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2565 "transformer_blocks.4.ff.net.0.proj.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2566 "transformer_blocks.4.ff.net.2.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2567 "transformer_blocks.4.ff.net.2.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2568 "transformer_blocks.4.scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
2569 "transformer_blocks.4.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
2570 "transformer_blocks.4.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2571 "transformer_blocks.4.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2572 "transformer_blocks.4.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2573 "transformer_blocks.4.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2574 "transformer_blocks.4.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2575 "transformer_blocks.4.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2576 "transformer_blocks.4.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2577 "transformer_blocks.4.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2578 "transformer_blocks.4.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
2579 "transformer_blocks.4.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
2580 "transformer_blocks.40.attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2581 "transformer_blocks.40.attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2582 "transformer_blocks.40.attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2583 "transformer_blocks.40.attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2584 "transformer_blocks.40.attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2585 "transformer_blocks.40.attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2586 "transformer_blocks.40.attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2587 "transformer_blocks.40.attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2588 "transformer_blocks.40.attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2589 "transformer_blocks.40.attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2590 "transformer_blocks.40.attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2591 "transformer_blocks.40.attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2592 "transformer_blocks.40.attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2593 "transformer_blocks.40.attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2594 "transformer_blocks.40.attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2595 "transformer_blocks.40.attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2596 "transformer_blocks.40.attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2597 "transformer_blocks.40.attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2598 "transformer_blocks.40.attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2599 "transformer_blocks.40.attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2600 "transformer_blocks.40.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2601 "transformer_blocks.40.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2602 "transformer_blocks.40.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2603 "transformer_blocks.40.audio_attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2604 "transformer_blocks.40.audio_attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2605 "transformer_blocks.40.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2606 "transformer_blocks.40.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2607 "transformer_blocks.40.audio_attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2608 "transformer_blocks.40.audio_attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2609 "transformer_blocks.40.audio_attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2610 "transformer_blocks.40.audio_attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2611 "transformer_blocks.40.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2612 "transformer_blocks.40.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2613 "transformer_blocks.40.audio_attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2614 "transformer_blocks.40.audio_attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2615 "transformer_blocks.40.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2616 "transformer_blocks.40.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2617 "transformer_blocks.40.audio_attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2618 "transformer_blocks.40.audio_attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2619 "transformer_blocks.40.audio_attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2620 "transformer_blocks.40.audio_attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2621 "transformer_blocks.40.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2622 "transformer_blocks.40.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2623 "transformer_blocks.40.audio_ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2624 "transformer_blocks.40.audio_ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2625 "transformer_blocks.40.audio_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2626 "transformer_blocks.40.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2627 "transformer_blocks.40.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2628 "transformer_blocks.40.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2629 "transformer_blocks.40.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2630 "transformer_blocks.40.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2631 "transformer_blocks.40.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2632 "transformer_blocks.40.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2633 "transformer_blocks.40.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2634 "transformer_blocks.40.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2635 "transformer_blocks.40.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2636 "transformer_blocks.40.ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2637 "transformer_blocks.40.ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2638 "transformer_blocks.40.ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2639 "transformer_blocks.40.ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2640 "transformer_blocks.40.scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2641 "transformer_blocks.40.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2642 "transformer_blocks.40.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2643 "transformer_blocks.40.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2644 "transformer_blocks.40.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2645 "transformer_blocks.40.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2646 "transformer_blocks.40.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2647 "transformer_blocks.40.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2648 "transformer_blocks.40.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2649 "transformer_blocks.40.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2650 "transformer_blocks.40.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2651 "transformer_blocks.40.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2652 "transformer_blocks.41.attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2653 "transformer_blocks.41.attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2654 "transformer_blocks.41.attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2655 "transformer_blocks.41.attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2656 "transformer_blocks.41.attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2657 "transformer_blocks.41.attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2658 "transformer_blocks.41.attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2659 "transformer_blocks.41.attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2660 "transformer_blocks.41.attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2661 "transformer_blocks.41.attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2662 "transformer_blocks.41.attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2663 "transformer_blocks.41.attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2664 "transformer_blocks.41.attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2665 "transformer_blocks.41.attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2666 "transformer_blocks.41.attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2667 "transformer_blocks.41.attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2668 "transformer_blocks.41.attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2669 "transformer_blocks.41.attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2670 "transformer_blocks.41.attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2671 "transformer_blocks.41.attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2672 "transformer_blocks.41.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2673 "transformer_blocks.41.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2674 "transformer_blocks.41.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2675 "transformer_blocks.41.audio_attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2676 "transformer_blocks.41.audio_attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2677 "transformer_blocks.41.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2678 "transformer_blocks.41.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2679 "transformer_blocks.41.audio_attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2680 "transformer_blocks.41.audio_attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2681 "transformer_blocks.41.audio_attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2682 "transformer_blocks.41.audio_attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2683 "transformer_blocks.41.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2684 "transformer_blocks.41.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2685 "transformer_blocks.41.audio_attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2686 "transformer_blocks.41.audio_attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2687 "transformer_blocks.41.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2688 "transformer_blocks.41.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2689 "transformer_blocks.41.audio_attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2690 "transformer_blocks.41.audio_attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2691 "transformer_blocks.41.audio_attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2692 "transformer_blocks.41.audio_attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2693 "transformer_blocks.41.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2694 "transformer_blocks.41.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2695 "transformer_blocks.41.audio_ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2696 "transformer_blocks.41.audio_ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2697 "transformer_blocks.41.audio_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2698 "transformer_blocks.41.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2699 "transformer_blocks.41.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2700 "transformer_blocks.41.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2701 "transformer_blocks.41.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2702 "transformer_blocks.41.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2703 "transformer_blocks.41.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2704 "transformer_blocks.41.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2705 "transformer_blocks.41.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2706 "transformer_blocks.41.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2707 "transformer_blocks.41.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2708 "transformer_blocks.41.ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2709 "transformer_blocks.41.ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2710 "transformer_blocks.41.ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2711 "transformer_blocks.41.ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2712 "transformer_blocks.41.scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2713 "transformer_blocks.41.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2714 "transformer_blocks.41.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2715 "transformer_blocks.41.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2716 "transformer_blocks.41.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2717 "transformer_blocks.41.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2718 "transformer_blocks.41.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2719 "transformer_blocks.41.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2720 "transformer_blocks.41.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2721 "transformer_blocks.41.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2722 "transformer_blocks.41.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2723 "transformer_blocks.41.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2724 "transformer_blocks.42.attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2725 "transformer_blocks.42.attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2726 "transformer_blocks.42.attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2727 "transformer_blocks.42.attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2728 "transformer_blocks.42.attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2729 "transformer_blocks.42.attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2730 "transformer_blocks.42.attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2731 "transformer_blocks.42.attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2732 "transformer_blocks.42.attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2733 "transformer_blocks.42.attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2734 "transformer_blocks.42.attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2735 "transformer_blocks.42.attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2736 "transformer_blocks.42.attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2737 "transformer_blocks.42.attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2738 "transformer_blocks.42.attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2739 "transformer_blocks.42.attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2740 "transformer_blocks.42.attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2741 "transformer_blocks.42.attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2742 "transformer_blocks.42.attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2743 "transformer_blocks.42.attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2744 "transformer_blocks.42.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2745 "transformer_blocks.42.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2746 "transformer_blocks.42.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2747 "transformer_blocks.42.audio_attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2748 "transformer_blocks.42.audio_attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2749 "transformer_blocks.42.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2750 "transformer_blocks.42.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2751 "transformer_blocks.42.audio_attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2752 "transformer_blocks.42.audio_attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2753 "transformer_blocks.42.audio_attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2754 "transformer_blocks.42.audio_attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2755 "transformer_blocks.42.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2756 "transformer_blocks.42.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2757 "transformer_blocks.42.audio_attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2758 "transformer_blocks.42.audio_attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2759 "transformer_blocks.42.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2760 "transformer_blocks.42.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2761 "transformer_blocks.42.audio_attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2762 "transformer_blocks.42.audio_attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2763 "transformer_blocks.42.audio_attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2764 "transformer_blocks.42.audio_attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2765 "transformer_blocks.42.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2766 "transformer_blocks.42.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2767 "transformer_blocks.42.audio_ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2768 "transformer_blocks.42.audio_ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2769 "transformer_blocks.42.audio_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2770 "transformer_blocks.42.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2771 "transformer_blocks.42.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2772 "transformer_blocks.42.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2773 "transformer_blocks.42.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2774 "transformer_blocks.42.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2775 "transformer_blocks.42.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2776 "transformer_blocks.42.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2777 "transformer_blocks.42.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2778 "transformer_blocks.42.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2779 "transformer_blocks.42.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2780 "transformer_blocks.42.ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2781 "transformer_blocks.42.ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2782 "transformer_blocks.42.ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2783 "transformer_blocks.42.ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2784 "transformer_blocks.42.scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2785 "transformer_blocks.42.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2786 "transformer_blocks.42.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2787 "transformer_blocks.42.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2788 "transformer_blocks.42.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2789 "transformer_blocks.42.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2790 "transformer_blocks.42.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2791 "transformer_blocks.42.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2792 "transformer_blocks.42.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2793 "transformer_blocks.42.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2794 "transformer_blocks.42.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2795 "transformer_blocks.42.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2796 "transformer_blocks.43.attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2797 "transformer_blocks.43.attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2798 "transformer_blocks.43.attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2799 "transformer_blocks.43.attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2800 "transformer_blocks.43.attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2801 "transformer_blocks.43.attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2802 "transformer_blocks.43.attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2803 "transformer_blocks.43.attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2804 "transformer_blocks.43.attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2805 "transformer_blocks.43.attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2806 "transformer_blocks.43.attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2807 "transformer_blocks.43.attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2808 "transformer_blocks.43.attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2809 "transformer_blocks.43.attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2810 "transformer_blocks.43.attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2811 "transformer_blocks.43.attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2812 "transformer_blocks.43.attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2813 "transformer_blocks.43.attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2814 "transformer_blocks.43.attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2815 "transformer_blocks.43.attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2816 "transformer_blocks.43.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2817 "transformer_blocks.43.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2818 "transformer_blocks.43.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2819 "transformer_blocks.43.audio_attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2820 "transformer_blocks.43.audio_attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2821 "transformer_blocks.43.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2822 "transformer_blocks.43.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2823 "transformer_blocks.43.audio_attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2824 "transformer_blocks.43.audio_attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2825 "transformer_blocks.43.audio_attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2826 "transformer_blocks.43.audio_attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2827 "transformer_blocks.43.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2828 "transformer_blocks.43.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2829 "transformer_blocks.43.audio_attn2.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2830 "transformer_blocks.43.audio_attn2.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2831 "transformer_blocks.43.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2832 "transformer_blocks.43.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2833 "transformer_blocks.43.audio_attn2.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2834 "transformer_blocks.43.audio_attn2.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2835 "transformer_blocks.43.audio_attn2.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2836 "transformer_blocks.43.audio_attn2.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2837 "transformer_blocks.43.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2838 "transformer_blocks.43.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2839 "transformer_blocks.43.audio_ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2840 "transformer_blocks.43.audio_ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2841 "transformer_blocks.43.audio_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2842 "transformer_blocks.43.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2843 "transformer_blocks.43.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2844 "transformer_blocks.43.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2845 "transformer_blocks.43.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2846 "transformer_blocks.43.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2847 "transformer_blocks.43.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2848 "transformer_blocks.43.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2849 "transformer_blocks.43.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2850 "transformer_blocks.43.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2851 "transformer_blocks.43.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2852 "transformer_blocks.43.ff.net.0.proj.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2853 "transformer_blocks.43.ff.net.0.proj.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2854 "transformer_blocks.43.ff.net.2.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2855 "transformer_blocks.43.ff.net.2.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2856 "transformer_blocks.43.scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2857 "transformer_blocks.43.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2858 "transformer_blocks.43.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2859 "transformer_blocks.43.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2860 "transformer_blocks.43.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2861 "transformer_blocks.43.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2862 "transformer_blocks.43.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2863 "transformer_blocks.43.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2864 "transformer_blocks.43.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2865 "transformer_blocks.43.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2866 "transformer_blocks.43.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2867 "transformer_blocks.43.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2868 "transformer_blocks.44.attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2869 "transformer_blocks.44.attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2870 "transformer_blocks.44.attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2871 "transformer_blocks.44.attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2872 "transformer_blocks.44.attn1.to_out.0.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2873 "transformer_blocks.44.attn1.to_out.0.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2874 "transformer_blocks.44.attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2875 "transformer_blocks.44.attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2876 "transformer_blocks.44.attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2877 "transformer_blocks.44.attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2878 "transformer_blocks.44.attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2879 "transformer_blocks.44.attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2880 "transformer_blocks.44.attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2881 "transformer_blocks.44.attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2882 "transformer_blocks.44.attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2883 "transformer_blocks.44.attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2884 "transformer_blocks.44.attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2885 "transformer_blocks.44.attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2886 "transformer_blocks.44.attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2887 "transformer_blocks.44.attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2888 "transformer_blocks.44.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2889 "transformer_blocks.44.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2890 "transformer_blocks.44.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2891 "transformer_blocks.44.audio_attn1.to_k.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2892 "transformer_blocks.44.audio_attn1.to_k.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2893 "transformer_blocks.44.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2894 "transformer_blocks.44.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2895 "transformer_blocks.44.audio_attn1.to_q.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2896 "transformer_blocks.44.audio_attn1.to_q.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2897 "transformer_blocks.44.audio_attn1.to_v.bias": "diffusion_pytorch_model-00007-of-00008.safetensors",
2898 "transformer_blocks.44.audio_attn1.to_v.weight": "diffusion_pytorch_model-00007-of-00008.safetensors",
2899 "transformer_blocks.44.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2900 "transformer_blocks.44.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2901 "transformer_blocks.44.audio_attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2902 "transformer_blocks.44.audio_attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2903 "transformer_blocks.44.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2904 "transformer_blocks.44.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2905 "transformer_blocks.44.audio_attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2906 "transformer_blocks.44.audio_attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2907 "transformer_blocks.44.audio_attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2908 "transformer_blocks.44.audio_attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2909 "transformer_blocks.44.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2910 "transformer_blocks.44.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2911 "transformer_blocks.44.audio_ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2912 "transformer_blocks.44.audio_ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2913 "transformer_blocks.44.audio_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2914 "transformer_blocks.44.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2915 "transformer_blocks.44.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2916 "transformer_blocks.44.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2917 "transformer_blocks.44.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2918 "transformer_blocks.44.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2919 "transformer_blocks.44.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2920 "transformer_blocks.44.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2921 "transformer_blocks.44.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2922 "transformer_blocks.44.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2923 "transformer_blocks.44.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2924 "transformer_blocks.44.ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2925 "transformer_blocks.44.ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2926 "transformer_blocks.44.ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2927 "transformer_blocks.44.ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2928 "transformer_blocks.44.scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2929 "transformer_blocks.44.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00007-of-00008.safetensors",
2930 "transformer_blocks.44.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2931 "transformer_blocks.44.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2932 "transformer_blocks.44.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2933 "transformer_blocks.44.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2934 "transformer_blocks.44.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2935 "transformer_blocks.44.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2936 "transformer_blocks.44.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2937 "transformer_blocks.44.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2938 "transformer_blocks.44.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2939 "transformer_blocks.44.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2940 "transformer_blocks.45.attn1.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2941 "transformer_blocks.45.attn1.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2942 "transformer_blocks.45.attn1.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2943 "transformer_blocks.45.attn1.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2944 "transformer_blocks.45.attn1.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2945 "transformer_blocks.45.attn1.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2946 "transformer_blocks.45.attn1.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2947 "transformer_blocks.45.attn1.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2948 "transformer_blocks.45.attn1.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2949 "transformer_blocks.45.attn1.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2950 "transformer_blocks.45.attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2951 "transformer_blocks.45.attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2952 "transformer_blocks.45.attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2953 "transformer_blocks.45.attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2954 "transformer_blocks.45.attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2955 "transformer_blocks.45.attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2956 "transformer_blocks.45.attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2957 "transformer_blocks.45.attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2958 "transformer_blocks.45.attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2959 "transformer_blocks.45.attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2960 "transformer_blocks.45.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
2961 "transformer_blocks.45.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2962 "transformer_blocks.45.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2963 "transformer_blocks.45.audio_attn1.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2964 "transformer_blocks.45.audio_attn1.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2965 "transformer_blocks.45.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2966 "transformer_blocks.45.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2967 "transformer_blocks.45.audio_attn1.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2968 "transformer_blocks.45.audio_attn1.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2969 "transformer_blocks.45.audio_attn1.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2970 "transformer_blocks.45.audio_attn1.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2971 "transformer_blocks.45.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2972 "transformer_blocks.45.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2973 "transformer_blocks.45.audio_attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2974 "transformer_blocks.45.audio_attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2975 "transformer_blocks.45.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2976 "transformer_blocks.45.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2977 "transformer_blocks.45.audio_attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2978 "transformer_blocks.45.audio_attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2979 "transformer_blocks.45.audio_attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2980 "transformer_blocks.45.audio_attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2981 "transformer_blocks.45.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2982 "transformer_blocks.45.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2983 "transformer_blocks.45.audio_ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2984 "transformer_blocks.45.audio_ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2985 "transformer_blocks.45.audio_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
2986 "transformer_blocks.45.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2987 "transformer_blocks.45.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2988 "transformer_blocks.45.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2989 "transformer_blocks.45.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2990 "transformer_blocks.45.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2991 "transformer_blocks.45.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2992 "transformer_blocks.45.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2993 "transformer_blocks.45.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2994 "transformer_blocks.45.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2995 "transformer_blocks.45.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2996 "transformer_blocks.45.ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2997 "transformer_blocks.45.ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
2998 "transformer_blocks.45.ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
2999 "transformer_blocks.45.ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3000 "transformer_blocks.45.scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3001 "transformer_blocks.45.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3002 "transformer_blocks.45.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3003 "transformer_blocks.45.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3004 "transformer_blocks.45.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3005 "transformer_blocks.45.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3006 "transformer_blocks.45.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3007 "transformer_blocks.45.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3008 "transformer_blocks.45.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3009 "transformer_blocks.45.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3010 "transformer_blocks.45.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3011 "transformer_blocks.45.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3012 "transformer_blocks.46.attn1.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3013 "transformer_blocks.46.attn1.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3014 "transformer_blocks.46.attn1.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3015 "transformer_blocks.46.attn1.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3016 "transformer_blocks.46.attn1.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3017 "transformer_blocks.46.attn1.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3018 "transformer_blocks.46.attn1.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3019 "transformer_blocks.46.attn1.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3020 "transformer_blocks.46.attn1.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3021 "transformer_blocks.46.attn1.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3022 "transformer_blocks.46.attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3023 "transformer_blocks.46.attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3024 "transformer_blocks.46.attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3025 "transformer_blocks.46.attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3026 "transformer_blocks.46.attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3027 "transformer_blocks.46.attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3028 "transformer_blocks.46.attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3029 "transformer_blocks.46.attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3030 "transformer_blocks.46.attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3031 "transformer_blocks.46.attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3032 "transformer_blocks.46.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3033 "transformer_blocks.46.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3034 "transformer_blocks.46.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3035 "transformer_blocks.46.audio_attn1.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3036 "transformer_blocks.46.audio_attn1.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3037 "transformer_blocks.46.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3038 "transformer_blocks.46.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3039 "transformer_blocks.46.audio_attn1.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3040 "transformer_blocks.46.audio_attn1.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3041 "transformer_blocks.46.audio_attn1.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3042 "transformer_blocks.46.audio_attn1.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3043 "transformer_blocks.46.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3044 "transformer_blocks.46.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3045 "transformer_blocks.46.audio_attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3046 "transformer_blocks.46.audio_attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3047 "transformer_blocks.46.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3048 "transformer_blocks.46.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3049 "transformer_blocks.46.audio_attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3050 "transformer_blocks.46.audio_attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3051 "transformer_blocks.46.audio_attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3052 "transformer_blocks.46.audio_attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3053 "transformer_blocks.46.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3054 "transformer_blocks.46.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3055 "transformer_blocks.46.audio_ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3056 "transformer_blocks.46.audio_ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3057 "transformer_blocks.46.audio_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3058 "transformer_blocks.46.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3059 "transformer_blocks.46.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3060 "transformer_blocks.46.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3061 "transformer_blocks.46.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3062 "transformer_blocks.46.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3063 "transformer_blocks.46.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3064 "transformer_blocks.46.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3065 "transformer_blocks.46.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3066 "transformer_blocks.46.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3067 "transformer_blocks.46.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3068 "transformer_blocks.46.ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3069 "transformer_blocks.46.ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3070 "transformer_blocks.46.ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3071 "transformer_blocks.46.ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3072 "transformer_blocks.46.scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3073 "transformer_blocks.46.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3074 "transformer_blocks.46.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3075 "transformer_blocks.46.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3076 "transformer_blocks.46.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3077 "transformer_blocks.46.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3078 "transformer_blocks.46.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3079 "transformer_blocks.46.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3080 "transformer_blocks.46.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3081 "transformer_blocks.46.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3082 "transformer_blocks.46.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3083 "transformer_blocks.46.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3084 "transformer_blocks.47.attn1.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3085 "transformer_blocks.47.attn1.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3086 "transformer_blocks.47.attn1.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3087 "transformer_blocks.47.attn1.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3088 "transformer_blocks.47.attn1.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3089 "transformer_blocks.47.attn1.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3090 "transformer_blocks.47.attn1.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3091 "transformer_blocks.47.attn1.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3092 "transformer_blocks.47.attn1.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3093 "transformer_blocks.47.attn1.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3094 "transformer_blocks.47.attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3095 "transformer_blocks.47.attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3096 "transformer_blocks.47.attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3097 "transformer_blocks.47.attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3098 "transformer_blocks.47.attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3099 "transformer_blocks.47.attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3100 "transformer_blocks.47.attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3101 "transformer_blocks.47.attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3102 "transformer_blocks.47.attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3103 "transformer_blocks.47.attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3104 "transformer_blocks.47.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3105 "transformer_blocks.47.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3106 "transformer_blocks.47.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3107 "transformer_blocks.47.audio_attn1.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3108 "transformer_blocks.47.audio_attn1.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3109 "transformer_blocks.47.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3110 "transformer_blocks.47.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3111 "transformer_blocks.47.audio_attn1.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3112 "transformer_blocks.47.audio_attn1.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3113 "transformer_blocks.47.audio_attn1.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3114 "transformer_blocks.47.audio_attn1.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3115 "transformer_blocks.47.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3116 "transformer_blocks.47.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3117 "transformer_blocks.47.audio_attn2.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3118 "transformer_blocks.47.audio_attn2.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3119 "transformer_blocks.47.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3120 "transformer_blocks.47.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3121 "transformer_blocks.47.audio_attn2.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3122 "transformer_blocks.47.audio_attn2.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3123 "transformer_blocks.47.audio_attn2.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3124 "transformer_blocks.47.audio_attn2.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3125 "transformer_blocks.47.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3126 "transformer_blocks.47.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3127 "transformer_blocks.47.audio_ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3128 "transformer_blocks.47.audio_ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3129 "transformer_blocks.47.audio_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3130 "transformer_blocks.47.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3131 "transformer_blocks.47.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3132 "transformer_blocks.47.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3133 "transformer_blocks.47.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3134 "transformer_blocks.47.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3135 "transformer_blocks.47.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3136 "transformer_blocks.47.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3137 "transformer_blocks.47.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3138 "transformer_blocks.47.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3139 "transformer_blocks.47.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3140 "transformer_blocks.47.ff.net.0.proj.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3141 "transformer_blocks.47.ff.net.0.proj.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3142 "transformer_blocks.47.ff.net.2.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3143 "transformer_blocks.47.ff.net.2.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3144 "transformer_blocks.47.scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3145 "transformer_blocks.47.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00008-of-00008.safetensors",
3146 "transformer_blocks.47.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3147 "transformer_blocks.47.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3148 "transformer_blocks.47.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3149 "transformer_blocks.47.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3150 "transformer_blocks.47.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3151 "transformer_blocks.47.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3152 "transformer_blocks.47.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3153 "transformer_blocks.47.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3154 "transformer_blocks.47.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00008-of-00008.safetensors",
3155 "transformer_blocks.47.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00008-of-00008.safetensors",
3156 "transformer_blocks.5.attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3157 "transformer_blocks.5.attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3158 "transformer_blocks.5.attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3159 "transformer_blocks.5.attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3160 "transformer_blocks.5.attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3161 "transformer_blocks.5.attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3162 "transformer_blocks.5.attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3163 "transformer_blocks.5.attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3164 "transformer_blocks.5.attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3165 "transformer_blocks.5.attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3166 "transformer_blocks.5.attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3167 "transformer_blocks.5.attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3168 "transformer_blocks.5.attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3169 "transformer_blocks.5.attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3170 "transformer_blocks.5.attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3171 "transformer_blocks.5.attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3172 "transformer_blocks.5.attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3173 "transformer_blocks.5.attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3174 "transformer_blocks.5.attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3175 "transformer_blocks.5.attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3176 "transformer_blocks.5.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
3177 "transformer_blocks.5.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3178 "transformer_blocks.5.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3179 "transformer_blocks.5.audio_attn1.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3180 "transformer_blocks.5.audio_attn1.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3181 "transformer_blocks.5.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3182 "transformer_blocks.5.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3183 "transformer_blocks.5.audio_attn1.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3184 "transformer_blocks.5.audio_attn1.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3185 "transformer_blocks.5.audio_attn1.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3186 "transformer_blocks.5.audio_attn1.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3187 "transformer_blocks.5.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3188 "transformer_blocks.5.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3189 "transformer_blocks.5.audio_attn2.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3190 "transformer_blocks.5.audio_attn2.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3191 "transformer_blocks.5.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3192 "transformer_blocks.5.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3193 "transformer_blocks.5.audio_attn2.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3194 "transformer_blocks.5.audio_attn2.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3195 "transformer_blocks.5.audio_attn2.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3196 "transformer_blocks.5.audio_attn2.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3197 "transformer_blocks.5.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3198 "transformer_blocks.5.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3199 "transformer_blocks.5.audio_ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3200 "transformer_blocks.5.audio_ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3201 "transformer_blocks.5.audio_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
3202 "transformer_blocks.5.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3203 "transformer_blocks.5.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3204 "transformer_blocks.5.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3205 "transformer_blocks.5.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3206 "transformer_blocks.5.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3207 "transformer_blocks.5.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3208 "transformer_blocks.5.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3209 "transformer_blocks.5.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3210 "transformer_blocks.5.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3211 "transformer_blocks.5.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3212 "transformer_blocks.5.ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3213 "transformer_blocks.5.ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3214 "transformer_blocks.5.ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3215 "transformer_blocks.5.ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3216 "transformer_blocks.5.scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
3217 "transformer_blocks.5.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00001-of-00008.safetensors",
3218 "transformer_blocks.5.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3219 "transformer_blocks.5.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3220 "transformer_blocks.5.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3221 "transformer_blocks.5.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3222 "transformer_blocks.5.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3223 "transformer_blocks.5.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3224 "transformer_blocks.5.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3225 "transformer_blocks.5.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3226 "transformer_blocks.5.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00001-of-00008.safetensors",
3227 "transformer_blocks.5.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00001-of-00008.safetensors",
3228 "transformer_blocks.6.attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3229 "transformer_blocks.6.attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3230 "transformer_blocks.6.attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3231 "transformer_blocks.6.attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3232 "transformer_blocks.6.attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3233 "transformer_blocks.6.attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3234 "transformer_blocks.6.attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3235 "transformer_blocks.6.attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3236 "transformer_blocks.6.attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3237 "transformer_blocks.6.attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3238 "transformer_blocks.6.attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3239 "transformer_blocks.6.attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3240 "transformer_blocks.6.attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3241 "transformer_blocks.6.attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3242 "transformer_blocks.6.attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3243 "transformer_blocks.6.attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3244 "transformer_blocks.6.attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3245 "transformer_blocks.6.attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3246 "transformer_blocks.6.attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3247 "transformer_blocks.6.attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3248 "transformer_blocks.6.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3249 "transformer_blocks.6.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3250 "transformer_blocks.6.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3251 "transformer_blocks.6.audio_attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3252 "transformer_blocks.6.audio_attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3253 "transformer_blocks.6.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3254 "transformer_blocks.6.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3255 "transformer_blocks.6.audio_attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3256 "transformer_blocks.6.audio_attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3257 "transformer_blocks.6.audio_attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3258 "transformer_blocks.6.audio_attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3259 "transformer_blocks.6.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3260 "transformer_blocks.6.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3261 "transformer_blocks.6.audio_attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3262 "transformer_blocks.6.audio_attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3263 "transformer_blocks.6.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3264 "transformer_blocks.6.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3265 "transformer_blocks.6.audio_attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3266 "transformer_blocks.6.audio_attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3267 "transformer_blocks.6.audio_attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3268 "transformer_blocks.6.audio_attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3269 "transformer_blocks.6.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3270 "transformer_blocks.6.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3271 "transformer_blocks.6.audio_ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3272 "transformer_blocks.6.audio_ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3273 "transformer_blocks.6.audio_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3274 "transformer_blocks.6.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3275 "transformer_blocks.6.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3276 "transformer_blocks.6.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3277 "transformer_blocks.6.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3278 "transformer_blocks.6.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3279 "transformer_blocks.6.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3280 "transformer_blocks.6.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3281 "transformer_blocks.6.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3282 "transformer_blocks.6.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3283 "transformer_blocks.6.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3284 "transformer_blocks.6.ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3285 "transformer_blocks.6.ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3286 "transformer_blocks.6.ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3287 "transformer_blocks.6.ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3288 "transformer_blocks.6.scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3289 "transformer_blocks.6.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3290 "transformer_blocks.6.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3291 "transformer_blocks.6.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3292 "transformer_blocks.6.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3293 "transformer_blocks.6.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3294 "transformer_blocks.6.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3295 "transformer_blocks.6.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3296 "transformer_blocks.6.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3297 "transformer_blocks.6.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3298 "transformer_blocks.6.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3299 "transformer_blocks.6.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3300 "transformer_blocks.7.attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3301 "transformer_blocks.7.attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3302 "transformer_blocks.7.attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3303 "transformer_blocks.7.attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3304 "transformer_blocks.7.attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3305 "transformer_blocks.7.attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3306 "transformer_blocks.7.attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3307 "transformer_blocks.7.attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3308 "transformer_blocks.7.attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3309 "transformer_blocks.7.attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3310 "transformer_blocks.7.attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3311 "transformer_blocks.7.attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3312 "transformer_blocks.7.attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3313 "transformer_blocks.7.attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3314 "transformer_blocks.7.attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3315 "transformer_blocks.7.attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3316 "transformer_blocks.7.attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3317 "transformer_blocks.7.attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3318 "transformer_blocks.7.attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3319 "transformer_blocks.7.attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3320 "transformer_blocks.7.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3321 "transformer_blocks.7.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3322 "transformer_blocks.7.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3323 "transformer_blocks.7.audio_attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3324 "transformer_blocks.7.audio_attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3325 "transformer_blocks.7.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3326 "transformer_blocks.7.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3327 "transformer_blocks.7.audio_attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3328 "transformer_blocks.7.audio_attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3329 "transformer_blocks.7.audio_attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3330 "transformer_blocks.7.audio_attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3331 "transformer_blocks.7.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3332 "transformer_blocks.7.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3333 "transformer_blocks.7.audio_attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3334 "transformer_blocks.7.audio_attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3335 "transformer_blocks.7.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3336 "transformer_blocks.7.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3337 "transformer_blocks.7.audio_attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3338 "transformer_blocks.7.audio_attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3339 "transformer_blocks.7.audio_attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3340 "transformer_blocks.7.audio_attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3341 "transformer_blocks.7.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3342 "transformer_blocks.7.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3343 "transformer_blocks.7.audio_ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3344 "transformer_blocks.7.audio_ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3345 "transformer_blocks.7.audio_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3346 "transformer_blocks.7.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3347 "transformer_blocks.7.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3348 "transformer_blocks.7.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3349 "transformer_blocks.7.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3350 "transformer_blocks.7.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3351 "transformer_blocks.7.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3352 "transformer_blocks.7.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3353 "transformer_blocks.7.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3354 "transformer_blocks.7.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3355 "transformer_blocks.7.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3356 "transformer_blocks.7.ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3357 "transformer_blocks.7.ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3358 "transformer_blocks.7.ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3359 "transformer_blocks.7.ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3360 "transformer_blocks.7.scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3361 "transformer_blocks.7.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3362 "transformer_blocks.7.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3363 "transformer_blocks.7.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3364 "transformer_blocks.7.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3365 "transformer_blocks.7.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3366 "transformer_blocks.7.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3367 "transformer_blocks.7.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3368 "transformer_blocks.7.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3369 "transformer_blocks.7.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3370 "transformer_blocks.7.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3371 "transformer_blocks.7.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3372 "transformer_blocks.8.attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3373 "transformer_blocks.8.attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3374 "transformer_blocks.8.attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3375 "transformer_blocks.8.attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3376 "transformer_blocks.8.attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3377 "transformer_blocks.8.attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3378 "transformer_blocks.8.attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3379 "transformer_blocks.8.attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3380 "transformer_blocks.8.attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3381 "transformer_blocks.8.attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3382 "transformer_blocks.8.attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3383 "transformer_blocks.8.attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3384 "transformer_blocks.8.attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3385 "transformer_blocks.8.attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3386 "transformer_blocks.8.attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3387 "transformer_blocks.8.attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3388 "transformer_blocks.8.attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3389 "transformer_blocks.8.attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3390 "transformer_blocks.8.attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3391 "transformer_blocks.8.attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3392 "transformer_blocks.8.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3393 "transformer_blocks.8.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3394 "transformer_blocks.8.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3395 "transformer_blocks.8.audio_attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3396 "transformer_blocks.8.audio_attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3397 "transformer_blocks.8.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3398 "transformer_blocks.8.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3399 "transformer_blocks.8.audio_attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3400 "transformer_blocks.8.audio_attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3401 "transformer_blocks.8.audio_attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3402 "transformer_blocks.8.audio_attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3403 "transformer_blocks.8.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3404 "transformer_blocks.8.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3405 "transformer_blocks.8.audio_attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3406 "transformer_blocks.8.audio_attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3407 "transformer_blocks.8.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3408 "transformer_blocks.8.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3409 "transformer_blocks.8.audio_attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3410 "transformer_blocks.8.audio_attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3411 "transformer_blocks.8.audio_attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3412 "transformer_blocks.8.audio_attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3413 "transformer_blocks.8.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3414 "transformer_blocks.8.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3415 "transformer_blocks.8.audio_ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3416 "transformer_blocks.8.audio_ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3417 "transformer_blocks.8.audio_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3418 "transformer_blocks.8.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3419 "transformer_blocks.8.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3420 "transformer_blocks.8.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3421 "transformer_blocks.8.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3422 "transformer_blocks.8.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3423 "transformer_blocks.8.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3424 "transformer_blocks.8.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3425 "transformer_blocks.8.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3426 "transformer_blocks.8.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3427 "transformer_blocks.8.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3428 "transformer_blocks.8.ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3429 "transformer_blocks.8.ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3430 "transformer_blocks.8.ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3431 "transformer_blocks.8.ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3432 "transformer_blocks.8.scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3433 "transformer_blocks.8.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3434 "transformer_blocks.8.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3435 "transformer_blocks.8.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3436 "transformer_blocks.8.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3437 "transformer_blocks.8.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3438 "transformer_blocks.8.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3439 "transformer_blocks.8.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3440 "transformer_blocks.8.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3441 "transformer_blocks.8.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3442 "transformer_blocks.8.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3443 "transformer_blocks.8.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3444 "transformer_blocks.9.attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3445 "transformer_blocks.9.attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3446 "transformer_blocks.9.attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3447 "transformer_blocks.9.attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3448 "transformer_blocks.9.attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3449 "transformer_blocks.9.attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3450 "transformer_blocks.9.attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3451 "transformer_blocks.9.attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3452 "transformer_blocks.9.attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3453 "transformer_blocks.9.attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3454 "transformer_blocks.9.attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3455 "transformer_blocks.9.attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3456 "transformer_blocks.9.attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3457 "transformer_blocks.9.attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3458 "transformer_blocks.9.attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3459 "transformer_blocks.9.attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3460 "transformer_blocks.9.attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3461 "transformer_blocks.9.attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3462 "transformer_blocks.9.attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3463 "transformer_blocks.9.attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3464 "transformer_blocks.9.audio_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3465 "transformer_blocks.9.audio_attn1.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3466 "transformer_blocks.9.audio_attn1.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3467 "transformer_blocks.9.audio_attn1.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3468 "transformer_blocks.9.audio_attn1.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3469 "transformer_blocks.9.audio_attn1.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3470 "transformer_blocks.9.audio_attn1.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3471 "transformer_blocks.9.audio_attn1.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3472 "transformer_blocks.9.audio_attn1.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3473 "transformer_blocks.9.audio_attn1.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3474 "transformer_blocks.9.audio_attn1.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3475 "transformer_blocks.9.audio_attn2.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3476 "transformer_blocks.9.audio_attn2.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3477 "transformer_blocks.9.audio_attn2.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3478 "transformer_blocks.9.audio_attn2.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3479 "transformer_blocks.9.audio_attn2.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3480 "transformer_blocks.9.audio_attn2.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3481 "transformer_blocks.9.audio_attn2.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3482 "transformer_blocks.9.audio_attn2.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3483 "transformer_blocks.9.audio_attn2.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3484 "transformer_blocks.9.audio_attn2.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3485 "transformer_blocks.9.audio_ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3486 "transformer_blocks.9.audio_ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3487 "transformer_blocks.9.audio_ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3488 "transformer_blocks.9.audio_ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3489 "transformer_blocks.9.audio_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3490 "transformer_blocks.9.audio_to_video_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3491 "transformer_blocks.9.audio_to_video_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3492 "transformer_blocks.9.audio_to_video_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3493 "transformer_blocks.9.audio_to_video_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3494 "transformer_blocks.9.audio_to_video_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3495 "transformer_blocks.9.audio_to_video_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3496 "transformer_blocks.9.audio_to_video_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3497 "transformer_blocks.9.audio_to_video_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3498 "transformer_blocks.9.audio_to_video_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3499 "transformer_blocks.9.audio_to_video_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3500 "transformer_blocks.9.ff.net.0.proj.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3501 "transformer_blocks.9.ff.net.0.proj.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3502 "transformer_blocks.9.ff.net.2.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3503 "transformer_blocks.9.ff.net.2.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3504 "transformer_blocks.9.scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3505 "transformer_blocks.9.video_a2v_cross_attn_scale_shift_table": "diffusion_pytorch_model-00002-of-00008.safetensors",
3506 "transformer_blocks.9.video_to_audio_attn.norm_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3507 "transformer_blocks.9.video_to_audio_attn.norm_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3508 "transformer_blocks.9.video_to_audio_attn.to_k.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3509 "transformer_blocks.9.video_to_audio_attn.to_k.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3510 "transformer_blocks.9.video_to_audio_attn.to_out.0.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3511 "transformer_blocks.9.video_to_audio_attn.to_out.0.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3512 "transformer_blocks.9.video_to_audio_attn.to_q.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3513 "transformer_blocks.9.video_to_audio_attn.to_q.weight": "diffusion_pytorch_model-00002-of-00008.safetensors",
3514 "transformer_blocks.9.video_to_audio_attn.to_v.bias": "diffusion_pytorch_model-00002-of-00008.safetensors",
3515 "transformer_blocks.9.video_to_audio_attn.to_v.weight": "diffusion_pytorch_model-00002-of-00008.safetensors"
3516 }
3517 }
3518