Commit
·
4f27e41
1
Parent(s):
0495bc2
style: Re-order
Browse files
app.py
CHANGED
@@ -160,13 +160,13 @@ class Dataset(BaseModel):
|
|
160 |
return hash(self.name)
|
161 |
|
162 |
|
|
|
|
|
|
|
|
|
163 |
SUMMARISATION = Task(name="summarisation", metric="bertscore")
|
164 |
KNOWLEDGE = Task(name="knowledge", metric="mcc")
|
165 |
COMMON_SENSE_REASONING = Task(name="common-sense reasoning", metric="mcc")
|
166 |
-
GRAMMAR = Task(name="grammar", metric="mcc")
|
167 |
-
READING_COMPREHENSION = Task(name="reading comprehension", metric="em")
|
168 |
-
TEXT_CLASSIFICATION = Task(name="text classification", metric="mcc")
|
169 |
-
INFORMATION_EXTRACTION = Task(name="information extraction", metric="micro_f1_no_misc")
|
170 |
ALL_TASKS = [obj for obj in globals().values() if isinstance(obj, Task)]
|
171 |
|
172 |
DANISH = Language(code="da", name="Danish")
|
@@ -184,82 +184,87 @@ ALL_LANGUAGES = {
|
|
184 |
}
|
185 |
|
186 |
DATASETS = [
|
187 |
-
Dataset(name="swerec", language=SWEDISH, task=TEXT_CLASSIFICATION),
|
188 |
Dataset(name="angry-tweets", language=DANISH, task=TEXT_CLASSIFICATION),
|
189 |
-
Dataset(name="norec", language=NORWEGIAN, task=TEXT_CLASSIFICATION),
|
190 |
-
Dataset(name="sb10k", language=GERMAN, task=TEXT_CLASSIFICATION),
|
191 |
-
Dataset(name="dutch-social", language=DUTCH, task=TEXT_CLASSIFICATION),
|
192 |
-
Dataset(name="sst5", language=ENGLISH, task=TEXT_CLASSIFICATION),
|
193 |
-
Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
|
194 |
-
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
195 |
-
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
196 |
-
Dataset(name="sentipolc16", language=ITALIAN, task=TEXT_CLASSIFICATION),
|
197 |
-
|
198 |
-
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
199 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
200 |
-
Dataset(name="
|
201 |
-
Dataset(name="
|
202 |
-
Dataset(name="
|
203 |
-
Dataset(name="
|
204 |
-
Dataset(name="
|
205 |
-
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
206 |
-
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
207 |
-
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
208 |
-
Dataset(name="multinerd-it", language=ITALIAN, task=INFORMATION_EXTRACTION),
|
209 |
|
210 |
-
Dataset(name="
|
211 |
-
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
212 |
-
Dataset(name="scala-nb", language=NORWEGIAN, task=GRAMMAR),
|
213 |
-
Dataset(name="scala-nn", language=NORWEGIAN, task=GRAMMAR),
|
214 |
-
Dataset(name="scala-is", language=ICELANDIC, task=GRAMMAR),
|
215 |
-
Dataset(name="scala-de", language=GERMAN, task=GRAMMAR),
|
216 |
Dataset(name="scala-nl", language=DUTCH, task=GRAMMAR),
|
217 |
-
Dataset(name="
|
218 |
-
Dataset(name="
|
219 |
-
Dataset(name="
|
220 |
-
Dataset(name="
|
|
|
221 |
|
222 |
-
Dataset(name="
|
223 |
-
Dataset(name="
|
224 |
-
Dataset(name="
|
225 |
-
Dataset(name="nqii", language=ICELANDIC, task=READING_COMPREHENSION),
|
226 |
-
Dataset(name="germanquad", language=GERMAN, task=READING_COMPREHENSION),
|
227 |
Dataset(name="squad", language=ENGLISH, task=READING_COMPREHENSION),
|
228 |
-
Dataset(name="
|
|
|
|
|
|
|
|
|
|
|
|
|
229 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
|
|
|
|
|
|
|
|
230 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
231 |
-
Dataset(name="
|
|
|
|
|
232 |
|
233 |
-
Dataset(name="
|
|
|
|
|
|
|
234 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
235 |
-
Dataset(name="
|
236 |
-
Dataset(name="
|
237 |
-
Dataset(name="wiki-lingua-nl", language=DUTCH, task=SUMMARISATION),
|
238 |
-
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
239 |
-
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
240 |
-
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
241 |
-
Dataset(name="ilpost-sum", language=ITALIAN, task=SUMMARISATION),
|
242 |
|
243 |
-
Dataset(
|
244 |
-
|
245 |
-
|
246 |
-
Dataset(name="
|
|
|
|
|
|
|
247 |
Dataset(name="icelandic-knowledge", language=ICELANDIC, task=KNOWLEDGE),
|
248 |
-
Dataset(name="
|
249 |
-
|
250 |
-
Dataset(name="
|
251 |
-
Dataset(name="
|
|
|
|
|
|
|
252 |
Dataset(name="mmlu-it", language=ITALIAN, task=KNOWLEDGE),
|
|
|
253 |
|
254 |
-
Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
255 |
Dataset(name="nor-common-sense-qa", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
256 |
Dataset(name="hellaswag-sv", language=SWEDISH, task=COMMON_SENSE_REASONING),
|
257 |
-
Dataset(name="winogrande-is", language=ICELANDIC, task=COMMON_SENSE_REASONING),
|
258 |
-
Dataset(name="hellaswag-de", language=GERMAN, task=COMMON_SENSE_REASONING),
|
259 |
-
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
260 |
-
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
261 |
-
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
262 |
-
Dataset(name="hellaswag-it", language=ITALIAN, task=COMMON_SENSE_REASONING),
|
263 |
]
|
264 |
|
265 |
|
|
|
160 |
return hash(self.name)
|
161 |
|
162 |
|
163 |
+
TEXT_CLASSIFICATION = Task(name="text classification", metric="mcc")
|
164 |
+
GRAMMAR = Task(name="grammar", metric="mcc")
|
165 |
+
INFORMATION_EXTRACTION = Task(name="information extraction", metric="micro_f1_no_misc")
|
166 |
+
READING_COMPREHENSION = Task(name="reading comprehension", metric="em")
|
167 |
SUMMARISATION = Task(name="summarisation", metric="bertscore")
|
168 |
KNOWLEDGE = Task(name="knowledge", metric="mcc")
|
169 |
COMMON_SENSE_REASONING = Task(name="common-sense reasoning", metric="mcc")
|
|
|
|
|
|
|
|
|
170 |
ALL_TASKS = [obj for obj in globals().values() if isinstance(obj, Task)]
|
171 |
|
172 |
DANISH = Language(code="da", name="Danish")
|
|
|
184 |
}
|
185 |
|
186 |
DATASETS = [
|
|
|
187 |
Dataset(name="angry-tweets", language=DANISH, task=TEXT_CLASSIFICATION),
|
188 |
+
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
189 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
190 |
+
Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
|
191 |
+
Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
|
192 |
+
Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
|
193 |
+
Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
|
194 |
+
Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
195 |
|
196 |
+
Dataset(name="dutch-social", language=DUTCH, task=TEXT_CLASSIFICATION),
|
|
|
|
|
|
|
|
|
|
|
197 |
Dataset(name="scala-nl", language=DUTCH, task=GRAMMAR),
|
198 |
+
Dataset(name="conll-nl", language=DUTCH, task=INFORMATION_EXTRACTION),
|
199 |
+
Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
|
200 |
+
Dataset(name="wiki-lingua-nl", language=DUTCH, task=SUMMARISATION),
|
201 |
+
Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
|
202 |
+
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
203 |
|
204 |
+
Dataset(name="sst5", language=ENGLISH, task=TEXT_CLASSIFICATION),
|
205 |
+
Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
|
206 |
+
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
|
|
|
|
207 |
Dataset(name="squad", language=ENGLISH, task=READING_COMPREHENSION),
|
208 |
+
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
209 |
+
Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
|
210 |
+
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
211 |
+
|
212 |
+
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
213 |
+
Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
|
214 |
+
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
215 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
216 |
+
|
217 |
+
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
218 |
+
Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
|
219 |
+
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
220 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
221 |
+
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
222 |
+
Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
|
223 |
+
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
224 |
|
225 |
+
Dataset(name="sb10k", language=GERMAN, task=TEXT_CLASSIFICATION),
|
226 |
+
Dataset(name="scala-de", language=GERMAN, task=GRAMMAR),
|
227 |
+
Dataset(name="germeval", language=GERMAN, task=INFORMATION_EXTRACTION),
|
228 |
+
Dataset(name="germanquad", language=GERMAN, task=READING_COMPREHENSION),
|
229 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
230 |
+
Dataset(name="mmlu-de", language=GERMAN, task=KNOWLEDGE),
|
231 |
+
Dataset(name="hellaswag-de", language=GERMAN, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
232 |
|
233 |
+
Dataset(
|
234 |
+
name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION
|
235 |
+
),
|
236 |
+
Dataset(name="scala-is", language=ICELANDIC, task=GRAMMAR),
|
237 |
+
Dataset(name="mim-gold-ner", language=ICELANDIC, task=INFORMATION_EXTRACTION),
|
238 |
+
Dataset(name="nqii", language=ICELANDIC, task=READING_COMPREHENSION),
|
239 |
+
Dataset(name="rrn", language=ICELANDIC, task=SUMMARISATION),
|
240 |
Dataset(name="icelandic-knowledge", language=ICELANDIC, task=KNOWLEDGE),
|
241 |
+
Dataset(name="winogrande-is", language=ICELANDIC, task=COMMON_SENSE_REASONING),
|
242 |
+
|
243 |
+
Dataset(name="sentipolc16", language=ITALIAN, task=TEXT_CLASSIFICATION),
|
244 |
+
Dataset(name="scala-it", language=ITALIAN, task=GRAMMAR),
|
245 |
+
Dataset(name="multinerd-it", language=ITALIAN, task=INFORMATION_EXTRACTION),
|
246 |
+
Dataset(name="squad-it", language=ITALIAN, task=READING_COMPREHENSION),
|
247 |
+
Dataset(name="ilpost-sum", language=ITALIAN, task=SUMMARISATION),
|
248 |
Dataset(name="mmlu-it", language=ITALIAN, task=KNOWLEDGE),
|
249 |
+
Dataset(name="hellaswag-it", language=ITALIAN, task=COMMON_SENSE_REASONING),
|
250 |
|
251 |
+
Dataset(name="norec", language=NORWEGIAN, task=TEXT_CLASSIFICATION),
|
252 |
+
Dataset(name="scala-nb", language=NORWEGIAN, task=GRAMMAR),
|
253 |
+
Dataset(name="scala-nn", language=NORWEGIAN, task=GRAMMAR),
|
254 |
+
Dataset(name="norne-nb", language=NORWEGIAN, task=INFORMATION_EXTRACTION),
|
255 |
+
Dataset(name="norne-nn", language=NORWEGIAN, task=INFORMATION_EXTRACTION),
|
256 |
+
Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
|
257 |
+
Dataset(name="no-sammendrag", language=NORWEGIAN, task=SUMMARISATION),
|
258 |
+
Dataset(name="nrk-quiz-qa", language=NORWEGIAN, task=KNOWLEDGE),
|
259 |
Dataset(name="nor-common-sense-qa", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
260 |
+
|
261 |
+
Dataset(name="swerec", language=SWEDISH, task=TEXT_CLASSIFICATION),
|
262 |
+
Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
|
263 |
+
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
264 |
+
Dataset(name="scandiqa-sv", language=SWEDISH, task=READING_COMPREHENSION),
|
265 |
+
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
266 |
+
Dataset(name="mmlu-sv", language=SWEDISH, task=KNOWLEDGE),
|
267 |
Dataset(name="hellaswag-sv", language=SWEDISH, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
|
|
268 |
]
|
269 |
|
270 |
|