config.json
1.7 KB · 111 lines · json Raw
1 {
2 "_name_or_path": "nvidia/mit-b2",
3 "architectures": [
4 "SegformerForSemanticSegmentation"
5 ],
6 "attention_probs_dropout_prob": 0.0,
7 "classifier_dropout_prob": 0.1,
8 "decoder_hidden_size": 768,
9 "depths": [
10 3,
11 4,
12 6,
13 3
14 ],
15 "downsampling_rates": [
16 1,
17 4,
18 8,
19 16
20 ],
21 "drop_path_rate": 0.1,
22 "hidden_act": "gelu",
23 "hidden_dropout_prob": 0.0,
24 "hidden_sizes": [
25 64,
26 128,
27 320,
28 512
29 ],
30 "id2label": {
31 "0": "Background",
32 "1": "Hat",
33 "2": "Hair",
34 "3": "Sunglasses",
35 "4": "Upper-clothes",
36 "5": "Skirt",
37 "6": "Pants",
38 "7": "Dress",
39 "8": "Belt",
40 "9": "Left-shoe",
41 "10": "Right-shoe",
42 "11": "Face",
43 "12": "Left-leg",
44 "13": "Right-leg",
45 "14": "Left-arm",
46 "15": "Right-arm",
47 "16": "Bag",
48 "17": "Scarf"
49 },
50 "image_size": 224,
51 "initializer_range": 0.02,
52 "label2id": {
53 "Background": 0,
54 "Bag": 16,
55 "Belt": 8,
56 "Dress": 7,
57 "Face": 11,
58 "Hair": 2,
59 "Hat": 1,
60 "Left-arm": 14,
61 "Left-leg": 12,
62 "Left-shoe": 9,
63 "Pants": 6,
64 "Right-arm": 15,
65 "Right-leg": 13,
66 "Right-shoe": 10,
67 "Scarf": 17,
68 "Skirt": 5,
69 "Sunglasses": 3,
70 "Upper-clothes": 4
71 },
72 "layer_norm_eps": 1e-06,
73 "mlp_ratios": [
74 4,
75 4,
76 4,
77 4
78 ],
79 "model_type": "segformer",
80 "num_attention_heads": [
81 1,
82 2,
83 5,
84 8
85 ],
86 "num_channels": 3,
87 "num_encoder_blocks": 4,
88 "patch_sizes": [
89 7,
90 3,
91 3,
92 3
93 ],
94 "reshape_last_stage": true,
95 "semantic_loss_ignore_index": 255,
96 "sr_ratios": [
97 8,
98 4,
99 2,
100 1
101 ],
102 "strides": [
103 4,
104 2,
105 2,
106 2
107 ],
108 "torch_dtype": "float32",
109 "transformers_version": "4.24.0"
110 }
111