File size: 3,531 Bytes
1aacd2a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
{
  "_name_or_path": "hub/ckiplab/bert-base-chinese-20210817-001848",
  "architectures": [
    "BertForTokenClassification"
  ],
  "attention_probs_dropout_prob": 0.1,
  "directionality": "bidi",
  "finetuning_task": "ner",
  "gradient_checkpointing": false,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "label2id": {
    "A": 33,
    "COLONCATEGORY": 40,
    "COMMACATEGORY": 1,
    "Caa": 21,
    "Cab": 47,
    "Cba": 57,
    "Cbb": 13,
    "D": 2,
    "DASHCATEGORY": 53,
    "DE": 3,
    "DK": 64,
    "DM": 59,
    "DOTCATEGORY": 58,
    "Da": 38,
    "De": 63,
    "Dfa": 27,
    "Dfb": 55,
    "Di": 26,
    "Dk": 49,
    "ETCCATEGORY": 51,
    "EXCLAMATIONCATEGORY": 44,
    "FW": 37,
    "I": 52,
    "N": 73,
    "ND": 68,
    "NG": 61,
    "Na": 0,
    "Nb": 15,
    "Nc": 6,
    "Ncd": 29,
    "Nd": 17,
    "Nep": 23,
    "Neqa": 25,
    "Neqb": 56,
    "Nes": 35,
    "Neu": 11,
    "Nf": 10,
    "Ng": 20,
    "Nh": 9,
    "Nv": 28,
    "P": 7,
    "PARENTHESISCATEGORY": 12,
    "PAUSECATEGORY": 22,
    "PERIODCATEGORY": 8,
    "QUESTIONCATEGORY": 41,
    "SEMICOLONCATEGORY": 46,
    "SHI": 19,
    "SPCHANGECATEGORY": 48,
    "T": 32,
    "V": 66,
    "VA": 16,
    "VAC": 54,
    "VB": 45,
    "VC": 4,
    "VCL": 34,
    "VD": 42,
    "VE": 14,
    "VF": 43,
    "VG": 30,
    "VH": 5,
    "VHC": 39,
    "VI": 50,
    "VJ": 18,
    "VK": 24,
    "VL": 36,
    "V_2": 31,
    "Vc": 65,
    "cbb": 67,
    "dI": 75,
    "na": 69,
    "nf": 72,
    "p": 71,
    "sHI": 60,
    "vA": 62,
    "vC": 70,
    "vH": 74
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "id2label": {
    "0": "Na",
    "1": "COMMACATEGORY",
    "2": "D",
    "3": "DE",
    "4": "VC",
    "5": "VH",
    "6": "Nc",
    "7": "P",
    "8": "PERIODCATEGORY",
    "9": "Nh",
    "10": "Nf",
    "11": "Neu",
    "12": "PARENTHESISCATEGORY",
    "13": "Cbb",
    "14": "VE",
    "15": "Nb",
    "16": "VA",
    "17": "Nd",
    "18": "VJ",
    "19": "SHI",
    "20": "Ng",
    "21": "Caa",
    "22": "PAUSECATEGORY",
    "23": "Nep",
    "24": "VK",
    "25": "Neqa",
    "26": "Di",
    "27": "Dfa",
    "28": "Nv",
    "29": "Ncd",
    "30": "VG",
    "31": "V_2",
    "32": "T",
    "33": "A",
    "34": "VCL",
    "35": "Nes",
    "36": "VL",
    "37": "FW",
    "38": "Da",
    "39": "VHC",
    "40": "COLONCATEGORY",
    "41": "QUESTIONCATEGORY",
    "42": "VD",
    "43": "VF",
    "44": "EXCLAMATIONCATEGORY",
    "45": "VB",
    "46": "SEMICOLONCATEGORY",
    "47": "Cab",
    "48": "SPCHANGECATEGORY",
    "49": "Dk",
    "50": "VI",
    "51": "ETCCATEGORY",
    "52": "I",
    "53": "DASHCATEGORY",
    "54": "VAC",
    "55": "Dfb",
    "56": "Neqb",
    "57": "Cba",
    "58": "DOTCATEGORY",
    "59": "DM",
    "60": "sHI",
    "61": "NG",
    "62": "vA",
    "63": "De",
    "64": "DK",
    "65": "Vc",
    "66": "V",
    "67": "cbb",
    "68": "ND",
    "69": "na",
    "70": "vC",
    "71": "p",
    "72": "nf",
    "73": "N",
    "74": "vH",
    "75": "dI"
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "pooler_fc_size": 768,
  "pooler_num_attention_heads": 12,
  "pooler_num_fc_layers": 3,
  "pooler_size_per_head": 128,
  "pooler_type": "first_token_transform",
  "position_embedding_type": "absolute",
  "tokenizer_class": "BertTokenizerFast",
  "transformers_version": "4.7.0",
  "type_vocab_size": 2,
  "use_cache": true,
  "vocab_size": 26140
}