Commit
·
cdd9094
1
Parent(s):
9fa29df
feat: Add support for Italian
Browse files
app.py
CHANGED
|
@@ -176,6 +176,7 @@ FAROESE = Language(code="fo", name="Faroese")
|
|
| 176 |
FRENCH = Language(code="fr", name="French")
|
| 177 |
GERMAN = Language(code="de", name="German")
|
| 178 |
ICELANDIC = Language(code="is", name="Icelandic")
|
|
|
|
| 179 |
NORWEGIAN = Language(code="no", name="Norwegian")
|
| 180 |
SWEDISH = Language(code="sv", name="Swedish")
|
| 181 |
ALL_LANGUAGES = {
|
|
@@ -192,6 +193,7 @@ DATASETS = [
|
|
| 192 |
Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
|
| 193 |
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
| 194 |
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
|
|
|
| 195 |
|
| 196 |
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
| 197 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
|
@@ -203,6 +205,7 @@ DATASETS = [
|
|
| 203 |
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
| 204 |
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
| 205 |
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
|
|
|
| 206 |
|
| 207 |
Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
|
| 208 |
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
|
@@ -214,6 +217,7 @@ DATASETS = [
|
|
| 214 |
Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
|
| 215 |
Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
|
| 216 |
Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
|
|
|
|
| 217 |
|
| 218 |
Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
|
| 219 |
Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
|
|
@@ -224,6 +228,7 @@ DATASETS = [
|
|
| 224 |
Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
|
| 225 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
| 226 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
|
|
|
| 227 |
|
| 228 |
Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
|
| 229 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
|
@@ -233,6 +238,7 @@ DATASETS = [
|
|
| 233 |
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
| 234 |
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
| 235 |
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
|
|
|
| 236 |
|
| 237 |
Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
|
| 238 |
Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
|
|
@@ -243,6 +249,7 @@ DATASETS = [
|
|
| 243 |
Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
|
| 244 |
Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
|
| 245 |
Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
|
|
|
|
| 246 |
|
| 247 |
Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
|
| 248 |
Dataset(name="hellaswag-no", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
|
@@ -252,6 +259,7 @@ DATASETS = [
|
|
| 252 |
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
| 253 |
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
| 254 |
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
|
|
|
| 255 |
]
|
| 256 |
|
| 257 |
|
|
|
|
| 176 |
FRENCH = Language(code="fr", name="French")
|
| 177 |
GERMAN = Language(code="de", name="German")
|
| 178 |
ICELANDIC = Language(code="is", name="Icelandic")
|
| 179 |
+
ITALIAN = Language(code="it", name="Italian")
|
| 180 |
NORWEGIAN = Language(code="no", name="Norwegian")
|
| 181 |
SWEDISH = Language(code="sv", name="Swedish")
|
| 182 |
ALL_LANGUAGES = {
|
|
|
|
| 193 |
Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
|
| 194 |
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
| 195 |
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
| 196 |
+
Dataset(name="sentipolc16", language=ITALIAN, task=TEXT_CLASSIFICATION),
|
| 197 |
|
| 198 |
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
| 199 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
|
|
|
| 205 |
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
| 206 |
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
| 207 |
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
| 208 |
+
Dataset(name="multinerd-it", language=ITALIAN, task=INFORMATION_EXTRACTION),
|
| 209 |
|
| 210 |
Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
|
| 211 |
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
|
|
|
| 217 |
Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
|
| 218 |
Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
|
| 219 |
Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
|
| 220 |
+
Dataset(name="scala-it", language=ITALIAN, task=GRAMMAR),
|
| 221 |
|
| 222 |
Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
|
| 223 |
Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
|
|
|
|
| 228 |
Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
|
| 229 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
| 230 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
| 231 |
+
Dataset(name="squad-it", language=ITALIAN, task=READING_COMPREHENSION),
|
| 232 |
|
| 233 |
Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
|
| 234 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
|
|
|
| 238 |
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
| 239 |
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
| 240 |
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
| 241 |
+
Dataset(name="ilpost-sum", language=ITALIAN, task=SUMMARISATION),
|
| 242 |
|
| 243 |
Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
|
| 244 |
Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
|
|
|
|
| 249 |
Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
|
| 250 |
Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
|
| 251 |
Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
|
| 252 |
+
Dataset(name="mmlu-it", language=ITALIAN, task=KNOWLEDGE),
|
| 253 |
|
| 254 |
Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
|
| 255 |
Dataset(name="hellaswag-no", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
|
|
|
| 259 |
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
| 260 |
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
| 261 |
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
| 262 |
+
Dataset(name="hellaswag-it", language=ITALIAN, task=COMMON_SENSE_REASONING),
|
| 263 |
]
|
| 264 |
|
| 265 |
|