jaggernaut007 committed on
Commit
e6c2d11
1 Parent(s): dfa22ad

Model save

Browse files
Files changed (6) hide show
  1. README.md +8 -20
  2. added_tokens.json +3 -0
  3. config.json +11 -167
  4. model.safetensors +2 -2
  5. spm.model +3 -0
  6. training_args.bin +2 -2
README.md CHANGED
@@ -3,11 +3,6 @@ license: mit
3
  base_model: Clinical-AI-Apollo/Medical-NER
4
  tags:
5
  - generated_from_trainer
6
- metrics:
7
- - precision
8
- - recall
9
- - f1
10
- - accuracy
11
  model-index:
12
  - name: Medical-NER-finetuned-ner
13
  results: []
@@ -19,12 +14,6 @@ should probably proofread and complete it, then remove this comment. -->
19
  # Medical-NER-finetuned-ner
20
 
21
  This model is a fine-tuned version of [Clinical-AI-Apollo/Medical-NER](https://huggingface.co/Clinical-AI-Apollo/Medical-NER) on an unknown dataset.
22
- It achieves the following results on the evaluation set:
23
- - Loss: 0.2030
24
- - Precision: 0.9543
25
- - Recall: 0.9462
26
- - F1: 0.9502
27
- - Accuracy: 0.9453
28
 
29
  ## Model description
30
 
@@ -44,20 +33,19 @@ More information needed
44
 
45
  The following hyperparameters were used during training:
46
  - learning_rate: 2e-05
47
- - train_batch_size: 6
48
  - eval_batch_size: 4
49
  - seed: 42
 
 
50
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
51
  - lr_scheduler_type: linear
52
- - num_epochs: 6
53
-
54
- ### Training results
55
-
56
-
57
 
58
  ### Framework versions
59
 
60
- - Transformers 4.39.2
61
- - Pytorch 1.12.1+cu102
62
- - Datasets 2.18.0
63
  - Tokenizers 0.15.2
 
3
  base_model: Clinical-AI-Apollo/Medical-NER
4
  tags:
5
  - generated_from_trainer
 
 
 
 
 
6
  model-index:
7
  - name: Medical-NER-finetuned-ner
8
  results: []
 
14
  # Medical-NER-finetuned-ner
15
 
16
  This model is a fine-tuned version of [Clinical-AI-Apollo/Medical-NER](https://huggingface.co/Clinical-AI-Apollo/Medical-NER) on an unknown dataset.
 
 
 
 
 
 
17
 
18
  ## Model description
19
 
 
33
 
34
  The following hyperparameters were used during training:
35
  - learning_rate: 2e-05
36
+ - train_batch_size: 4
37
  - eval_batch_size: 4
38
  - seed: 42
39
+ - gradient_accumulation_steps: 4
40
+ - total_train_batch_size: 16
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
+ - num_epochs: 5
44
+ - mixed_precision_training: Native AMP
 
 
 
45
 
46
  ### Framework versions
47
 
48
+ - Transformers 4.39.3
49
+ - Pytorch 2.2.2+cu121
50
+ - Datasets 2.19.0
51
  - Tokenizers 0.15.2
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[MASK]": 128000
3
+ }
config.json CHANGED
@@ -8,176 +8,20 @@
8
  "hidden_dropout_prob": 0.1,
9
  "hidden_size": 768,
10
  "id2label": {
11
- "0": "O",
12
- "1": "B-ACTIVITY",
13
- "2": "I-ACTIVITY",
14
- "3": "I-ADMINISTRATION",
15
- "4": "B-ADMINISTRATION",
16
- "5": "B-AGE",
17
- "6": "I-AGE",
18
- "7": "I-AREA",
19
- "8": "B-AREA",
20
- "9": "B-BIOLOGICAL_ATTRIBUTE",
21
- "10": "I-BIOLOGICAL_ATTRIBUTE",
22
- "11": "I-BIOLOGICAL_STRUCTURE",
23
- "12": "B-BIOLOGICAL_STRUCTURE",
24
- "13": "B-CLINICAL_EVENT",
25
- "14": "I-CLINICAL_EVENT",
26
- "15": "B-COLOR",
27
- "16": "I-COLOR",
28
- "17": "I-COREFERENCE",
29
- "18": "B-COREFERENCE",
30
- "19": "B-DATE",
31
- "20": "I-DATE",
32
- "21": "I-DETAILED_DESCRIPTION",
33
- "22": "B-DETAILED_DESCRIPTION",
34
- "23": "I-DIAGNOSTIC_PROCEDURE",
35
- "24": "B-DIAGNOSTIC_PROCEDURE",
36
- "25": "I-DISEASE_DISORDER",
37
- "26": "B-DISEASE_DISORDER",
38
- "27": "B-DISTANCE",
39
- "28": "I-DISTANCE",
40
- "29": "B-DOSAGE",
41
- "30": "I-DOSAGE",
42
- "31": "I-DURATION",
43
- "32": "B-DURATION",
44
- "33": "I-FAMILY_HISTORY",
45
- "34": "B-FAMILY_HISTORY",
46
- "35": "B-FREQUENCY",
47
- "36": "I-FREQUENCY",
48
- "37": "I-HEIGHT",
49
- "38": "B-HEIGHT",
50
- "39": "B-HISTORY",
51
- "40": "I-HISTORY",
52
- "41": "I-LAB_VALUE",
53
- "42": "B-LAB_VALUE",
54
- "43": "I-MASS",
55
- "44": "B-MASS",
56
- "45": "I-MEDICATION",
57
- "46": "B-MEDICATION",
58
- "47": "I-NONBIOLOGICAL_LOCATION",
59
- "48": "B-NONBIOLOGICAL_LOCATION",
60
- "49": "I-OCCUPATION",
61
- "50": "B-OCCUPATION",
62
- "51": "B-OTHER_ENTITY",
63
- "52": "I-OTHER_ENTITY",
64
- "53": "B-OTHER_EVENT",
65
- "54": "I-OTHER_EVENT",
66
- "55": "I-OUTCOME",
67
- "56": "B-OUTCOME",
68
- "57": "I-PERSONAL_BACKGROUND",
69
- "58": "B-PERSONAL_BACKGROUND",
70
- "59": "B-QUALITATIVE_CONCEPT",
71
- "60": "I-QUALITATIVE_CONCEPT",
72
- "61": "I-QUANTITATIVE_CONCEPT",
73
- "62": "B-QUANTITATIVE_CONCEPT",
74
- "63": "B-SEVERITY",
75
- "64": "I-SEVERITY",
76
- "65": "B-SEX",
77
- "66": "I-SEX",
78
- "67": "B-SHAPE",
79
- "68": "I-SHAPE",
80
- "69": "B-SIGN_SYMPTOM",
81
- "70": "I-SIGN_SYMPTOM",
82
- "71": "B-SUBJECT",
83
- "72": "I-SUBJECT",
84
- "73": "B-TEXTURE",
85
- "74": "I-TEXTURE",
86
- "75": "B-THERAPEUTIC_PROCEDURE",
87
- "76": "I-THERAPEUTIC_PROCEDURE",
88
- "77": "I-TIME",
89
- "78": "B-TIME",
90
- "79": "B-VOLUME",
91
- "80": "I-VOLUME",
92
- "81": "I-WEIGHT",
93
- "82": "B-WEIGHT"
94
  },
95
  "initializer_range": 0.02,
96
  "intermediate_size": 3072,
97
  "label2id": {
98
- "B-ACTIVITY": 1,
99
- "B-ADMINISTRATION": 4,
100
- "B-AGE": 5,
101
- "B-AREA": 8,
102
- "B-BIOLOGICAL_ATTRIBUTE": 9,
103
- "B-BIOLOGICAL_STRUCTURE": 12,
104
- "B-CLINICAL_EVENT": 13,
105
- "B-COLOR": 15,
106
- "B-COREFERENCE": 18,
107
- "B-DATE": 19,
108
- "B-DETAILED_DESCRIPTION": 22,
109
- "B-DIAGNOSTIC_PROCEDURE": 24,
110
- "B-DISEASE_DISORDER": 26,
111
- "B-DISTANCE": 27,
112
- "B-DOSAGE": 29,
113
- "B-DURATION": 32,
114
- "B-FAMILY_HISTORY": 34,
115
- "B-FREQUENCY": 35,
116
- "B-HEIGHT": 38,
117
- "B-HISTORY": 39,
118
- "B-LAB_VALUE": 42,
119
- "B-MASS": 44,
120
- "B-MEDICATION": 46,
121
- "B-NONBIOLOGICAL_LOCATION": 48,
122
- "B-OCCUPATION": 50,
123
- "B-OTHER_ENTITY": 51,
124
- "B-OTHER_EVENT": 53,
125
- "B-OUTCOME": 56,
126
- "B-PERSONAL_BACKGROUND": 58,
127
- "B-QUALITATIVE_CONCEPT": 59,
128
- "B-QUANTITATIVE_CONCEPT": 62,
129
- "B-SEVERITY": 63,
130
- "B-SEX": 65,
131
- "B-SHAPE": 67,
132
- "B-SIGN_SYMPTOM": 69,
133
- "B-SUBJECT": 71,
134
- "B-TEXTURE": 73,
135
- "B-THERAPEUTIC_PROCEDURE": 75,
136
- "B-TIME": 78,
137
- "B-VOLUME": 79,
138
- "B-WEIGHT": 82,
139
- "I-ACTIVITY": 2,
140
- "I-ADMINISTRATION": 3,
141
- "I-AGE": 6,
142
- "I-AREA": 7,
143
- "I-BIOLOGICAL_ATTRIBUTE": 10,
144
- "I-BIOLOGICAL_STRUCTURE": 11,
145
- "I-CLINICAL_EVENT": 14,
146
- "I-COLOR": 16,
147
- "I-COREFERENCE": 17,
148
- "I-DATE": 20,
149
- "I-DETAILED_DESCRIPTION": 21,
150
- "I-DIAGNOSTIC_PROCEDURE": 23,
151
- "I-DISEASE_DISORDER": 25,
152
- "I-DISTANCE": 28,
153
- "I-DOSAGE": 30,
154
- "I-DURATION": 31,
155
- "I-FAMILY_HISTORY": 33,
156
- "I-FREQUENCY": 36,
157
- "I-HEIGHT": 37,
158
- "I-HISTORY": 40,
159
- "I-LAB_VALUE": 41,
160
- "I-MASS": 43,
161
- "I-MEDICATION": 45,
162
- "I-NONBIOLOGICAL_LOCATION": 47,
163
- "I-OCCUPATION": 49,
164
- "I-OTHER_ENTITY": 52,
165
- "I-OTHER_EVENT": 54,
166
- "I-OUTCOME": 55,
167
- "I-PERSONAL_BACKGROUND": 57,
168
- "I-QUALITATIVE_CONCEPT": 60,
169
- "I-QUANTITATIVE_CONCEPT": 61,
170
- "I-SEVERITY": 64,
171
- "I-SEX": 66,
172
- "I-SHAPE": 68,
173
- "I-SIGN_SYMPTOM": 70,
174
- "I-SUBJECT": 72,
175
- "I-TEXTURE": 74,
176
- "I-THERAPEUTIC_PROCEDURE": 76,
177
- "I-TIME": 77,
178
- "I-VOLUME": 80,
179
- "I-WEIGHT": 81,
180
- "O": 0
181
  },
182
  "layer_norm_eps": 1e-07,
183
  "max_position_embeddings": 512,
@@ -199,7 +43,7 @@
199
  "relative_attention": true,
200
  "share_att_key": true,
201
  "torch_dtype": "float32",
202
- "transformers_version": "4.39.2",
203
  "type_vocab_size": 0,
204
  "vocab_size": 128100
205
  }
 
8
  "hidden_dropout_prob": 0.1,
9
  "hidden_size": 768,
10
  "id2label": {
11
+ "0": "LABEL_0",
12
+ "1": "LABEL_1",
13
+ "2": "LABEL_2",
14
+ "3": "LABEL_3",
15
+ "4": "LABEL_4"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  },
17
  "initializer_range": 0.02,
18
  "intermediate_size": 3072,
19
  "label2id": {
20
+ "LABEL_0": 0,
21
+ "LABEL_1": 1,
22
+ "LABEL_2": 2,
23
+ "LABEL_3": 3,
24
+ "LABEL_4": 4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  },
26
  "layer_norm_eps": 1e-07,
27
  "max_position_embeddings": 512,
 
43
  "relative_attention": true,
44
  "share_att_key": true,
45
  "torch_dtype": "float32",
46
+ "transformers_version": "4.39.3",
47
  "type_vocab_size": 0,
48
  "vocab_size": 128100
49
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0869169ee520de1aae48681b98e1042b3406f8dfd86a0a06009dfc2fb518eb3b
3
- size 735605900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d5274078a776dd953b0390ee77fc2d3335ecd6e77093c3fa28017bef2033ef5
3
+ size 735365964
spm.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c679fbf93643d19aab7ee10c0b99e460bdbc02fedf34b92b05af343b4af586fd
3
+ size 2464616
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8280c5db6559eca6ebac8e65c3555c0d423372e0769d5326e1890367e110c0e6
3
- size 4463
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:429f9a5397d21c04b6c82646ed585300c0105bd1539e5e6ae89c9bb49a39b6c5
3
+ size 4920