config.json
629 B · 32 lines · json Raw
1 {
2 "activation": "gelu",
3 "architectures": [
4 "DistilBertForSequenceClassification"
5 ],
6 "attention_dropout": 0.1,
7 "dim": 768,
8 "dropout": 0.1,
9 "finetuning_task": "sst-2",
10 "hidden_dim": 3072,
11 "id2label": {
12 "0": "NEGATIVE",
13 "1": "POSITIVE"
14 },
15 "initializer_range": 0.02,
16 "label2id": {
17 "NEGATIVE": 0,
18 "POSITIVE": 1
19 },
20 "max_position_embeddings": 512,
21 "model_type": "distilbert",
22 "n_heads": 12,
23 "n_layers": 6,
24 "output_past": true,
25 "pad_token_id": 0,
26 "qa_dropout": 0.1,
27 "seq_classif_dropout": 0.2,
28 "sinusoidal_pos_embds": false,
29 "tie_weights_": true,
30 "vocab_size": 30522
31 }
32