unet/config.json
787 B · 33 lines · json Raw
1 {
2 "_class_name": "UNet3DConditionModel",
3 "_diffusers_version": "0.15.0.dev0",
4 "_name_or_path": "/home/patrick_huggingface_co/.cache/huggingface/hub/models--damo-vilab--text-to-video-ms-1.7b/snapshots/32aa057809b033d6f3ca31da4b0ade1fa7904654/unet",
5 "act_fn": "silu",
6 "attention_head_dim": 64,
7 "block_out_channels": [
8 320,
9 640,
10 1280,
11 1280
12 ],
13 "cross_attention_dim": 1024,
14 "down_block_types": [
15 "CrossAttnDownBlock3D",
16 "CrossAttnDownBlock3D",
17 "CrossAttnDownBlock3D",
18 "DownBlock3D"
19 ],
20 "in_channels": 4,
21 "layers_per_block": 2,
22 "norm_eps": 1e-05,
23 "norm_num_groups": 32,
24 "out_channels": 4,
25 "sample_size": 32,
26 "up_block_types": [
27 "UpBlock3D",
28 "CrossAttnUpBlock3D",
29 "CrossAttnUpBlock3D",
30 "CrossAttnUpBlock3D"
31 ]
32 }
33