sjrhuschlee
committed on
Commit
•
caa89c2
1
Parent(s):
f7c9f9b
Update README.md
Browse files
README.md
CHANGED
@@ -24,6 +24,7 @@ tags:
|
|
24 |
- mrqa
|
25 |
- synQA
|
26 |
- adversarial_qa
|
|
|
27 |
model-index:
|
28 |
- name: sjrhuschlee/deberta-v3-base-squad2-ext-v1
|
29 |
results:
|
@@ -52,10 +53,10 @@ model-index:
|
|
52 |
split: validation
|
53 |
metrics:
|
54 |
- type: exact_match
|
55 |
-
value:
|
56 |
name: Exact Match
|
57 |
- type: f1
|
58 |
-
value:
|
59 |
name: F1
|
60 |
- task:
|
61 |
type: question-answering
|
@@ -67,10 +68,10 @@ model-index:
|
|
67 |
split: validation
|
68 |
metrics:
|
69 |
- type: exact_match
|
70 |
-
value:
|
71 |
name: Exact Match
|
72 |
- type: f1
|
73 |
-
value:
|
74 |
name: F1
|
75 |
- task:
|
76 |
type: question-answering
|
@@ -82,70 +83,70 @@ model-index:
|
|
82 |
split: validation
|
83 |
metrics:
|
84 |
- type: exact_match
|
85 |
-
value:
|
86 |
name: Exact Match
|
87 |
- type: f1
|
88 |
-
value:
|
89 |
name: F1
|
90 |
- task:
|
91 |
type: question-answering
|
92 |
name: Question Answering
|
93 |
dataset:
|
94 |
-
name: squadshifts
|
95 |
type: squadshifts
|
96 |
config: amazon
|
97 |
split: test
|
98 |
metrics:
|
99 |
- type: exact_match
|
100 |
-
value:
|
101 |
name: Exact Match
|
102 |
- type: f1
|
103 |
-
value:
|
104 |
name: F1
|
105 |
- task:
|
106 |
type: question-answering
|
107 |
name: Question Answering
|
108 |
dataset:
|
109 |
-
name: squadshifts
|
110 |
type: squadshifts
|
111 |
config: new_wiki
|
112 |
split: test
|
113 |
metrics:
|
114 |
- type: exact_match
|
115 |
-
value:
|
116 |
name: Exact Match
|
117 |
- type: f1
|
118 |
-
value:
|
119 |
name: F1
|
120 |
- task:
|
121 |
type: question-answering
|
122 |
name: Question Answering
|
123 |
dataset:
|
124 |
-
name: squadshifts
|
125 |
type: squadshifts
|
126 |
config: nyt
|
127 |
split: test
|
128 |
metrics:
|
129 |
- type: exact_match
|
130 |
-
value:
|
131 |
name: Exact Match
|
132 |
- type: f1
|
133 |
-
value:
|
134 |
name: F1
|
135 |
- task:
|
136 |
type: question-answering
|
137 |
name: Question Answering
|
138 |
dataset:
|
139 |
-
name: squadshifts
|
140 |
type: squadshifts
|
141 |
config: reddit
|
142 |
split: test
|
143 |
metrics:
|
144 |
- type: exact_match
|
145 |
-
value:
|
146 |
name: Exact Match
|
147 |
- type: f1
|
148 |
-
value:
|
149 |
name: F1
|
150 |
---
|
151 |
|
|
|
24 |
- mrqa
|
25 |
- synQA
|
26 |
- adversarial_qa
|
27 |
+
base_model: microsoft/deberta-v3-base
|
28 |
model-index:
|
29 |
- name: sjrhuschlee/deberta-v3-base-squad2-ext-v1
|
30 |
results:
|
|
|
53 |
split: validation
|
54 |
metrics:
|
55 |
- type: exact_match
|
56 |
+
value: 87.985
|
57 |
name: Exact Match
|
58 |
- type: f1
|
59 |
+
value: 93.651
|
60 |
name: F1
|
61 |
- task:
|
62 |
type: question-answering
|
|
|
68 |
split: validation
|
69 |
metrics:
|
70 |
- type: exact_match
|
71 |
+
value: 47.533
|
72 |
name: Exact Match
|
73 |
- type: f1
|
74 |
+
value: 59.838
|
75 |
name: F1
|
76 |
- task:
|
77 |
type: question-answering
|
|
|
83 |
split: validation
|
84 |
metrics:
|
85 |
- type: exact_match
|
86 |
+
value: 84.723
|
87 |
name: Exact Match
|
88 |
- type: f1
|
89 |
+
value: 89.780
|
90 |
name: F1
|
91 |
- task:
|
92 |
type: question-answering
|
93 |
name: Question Answering
|
94 |
dataset:
|
95 |
+
name: squadshifts amazon
|
96 |
type: squadshifts
|
97 |
config: amazon
|
98 |
split: test
|
99 |
metrics:
|
100 |
- type: exact_match
|
101 |
+
value: 74.851
|
102 |
name: Exact Match
|
103 |
- type: f1
|
104 |
+
value: 87.448
|
105 |
name: F1
|
106 |
- task:
|
107 |
type: question-answering
|
108 |
name: Question Answering
|
109 |
dataset:
|
110 |
+
name: squadshifts new_wiki
|
111 |
type: squadshifts
|
112 |
config: new_wiki
|
113 |
split: test
|
114 |
metrics:
|
115 |
- type: exact_match
|
116 |
+
value: 83.396
|
117 |
name: Exact Match
|
118 |
- type: f1
|
119 |
+
value: 91.996
|
120 |
name: F1
|
121 |
- task:
|
122 |
type: question-answering
|
123 |
name: Question Answering
|
124 |
dataset:
|
125 |
+
name: squadshifts nyt
|
126 |
type: squadshifts
|
127 |
config: nyt
|
128 |
split: test
|
129 |
metrics:
|
130 |
- type: exact_match
|
131 |
+
value: 83.934
|
132 |
name: Exact Match
|
133 |
- type: f1
|
134 |
+
value: 92.234
|
135 |
name: F1
|
136 |
- task:
|
137 |
type: question-answering
|
138 |
name: Question Answering
|
139 |
dataset:
|
140 |
+
name: squadshifts reddit
|
141 |
type: squadshifts
|
142 |
config: reddit
|
143 |
split: test
|
144 |
metrics:
|
145 |
- type: exact_match
|
146 |
+
value: 75.008
|
147 |
name: Exact Match
|
148 |
- type: f1
|
149 |
+
value: 86.120
|
150 |
name: F1
|
151 |
---
|
152 |
|