config.json
998 B · 49 lines · json Raw
1 {
2 "_num_labels": 9,
3 "architectures": [
4 "BertForTokenClassification"
5 ],
6 "attention_probs_dropout_prob": 0.1,
7 "directionality": "bidi",
8 "hidden_act": "gelu",
9 "hidden_dropout_prob": 0.1,
10 "hidden_size": 1024,
11 "id2label": {
12 "0": "O",
13 "1": "B-MISC",
14 "2": "I-MISC",
15 "3": "B-PER",
16 "4": "I-PER",
17 "5": "B-ORG",
18 "6": "I-ORG",
19 "7": "B-LOC",
20 "8": "I-LOC"
21 },
22 "initializer_range": 0.02,
23 "intermediate_size": 4096,
24 "label2id": {
25 "B-LOC": 7,
26 "B-MISC": 1,
27 "B-ORG": 5,
28 "B-PER": 3,
29 "I-LOC": 8,
30 "I-MISC": 2,
31 "I-ORG": 6,
32 "I-PER": 4,
33 "O": 0
34 },
35 "layer_norm_eps": 1e-12,
36 "max_position_embeddings": 512,
37 "model_type": "bert",
38 "num_attention_heads": 16,
39 "num_hidden_layers": 24,
40 "pad_token_id": 0,
41 "pooler_fc_size": 768,
42 "pooler_num_attention_heads": 12,
43 "pooler_num_fc_layers": 3,
44 "pooler_size_per_head": 128,
45 "pooler_type": "first_token_transform",
46 "type_vocab_size": 2,
47 "vocab_size": 28996
48 }
49