saattrupdan committed on
Commit
cdd9094
·
1 Parent(s): 9fa29df

feat: Add support for Italian

Browse files
Files changed (1) hide show
  1. app.py +8 -0
app.py CHANGED
@@ -176,6 +176,7 @@ FAROESE = Language(code="fo", name="Faroese")
176
  FRENCH = Language(code="fr", name="French")
177
  GERMAN = Language(code="de", name="German")
178
  ICELANDIC = Language(code="is", name="Icelandic")
 
179
  NORWEGIAN = Language(code="no", name="Norwegian")
180
  SWEDISH = Language(code="sv", name="Swedish")
181
  ALL_LANGUAGES = {
@@ -192,6 +193,7 @@ DATASETS = [
192
  Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
193
  Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
194
  Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
 
195
 
196
  Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
197
  Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
@@ -203,6 +205,7 @@ DATASETS = [
203
  Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
204
  Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
205
  Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
 
206
 
207
  Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
208
  Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
@@ -214,6 +217,7 @@ DATASETS = [
214
  Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
215
  Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
216
  Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
 
217
 
218
  Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
219
  Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
@@ -224,6 +228,7 @@ DATASETS = [
224
  Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
225
  Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
226
  Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
 
227
 
228
  Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
229
  Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
@@ -233,6 +238,7 @@ DATASETS = [
233
  Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
234
  Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
235
  Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
 
236
 
237
  Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
238
  Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
@@ -243,6 +249,7 @@ DATASETS = [
243
  Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
244
  Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
245
  Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
 
246
 
247
  Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
248
  Dataset(name="hellaswag-no", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
@@ -252,6 +259,7 @@ DATASETS = [
252
  Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
253
  Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
254
  Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
 
255
  ]
256
 
257
 
 
176
  FRENCH = Language(code="fr", name="French")
177
  GERMAN = Language(code="de", name="German")
178
  ICELANDIC = Language(code="is", name="Icelandic")
179
+ ITALIAN = Language(code="it", name="Italian")
180
  NORWEGIAN = Language(code="no", name="Norwegian")
181
  SWEDISH = Language(code="sv", name="Swedish")
182
  ALL_LANGUAGES = {
 
193
  Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
194
  Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
195
  Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
196
+ Dataset(name="sentipolc16", language=ITALIAN, task=TEXT_CLASSIFICATION),
197
 
198
  Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
199
  Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
 
205
  Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
206
  Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
207
  Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
208
+ Dataset(name="multinerd-it", language=ITALIAN, task=INFORMATION_EXTRACTION),
209
 
210
  Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
211
  Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
 
217
  Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
218
  Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
219
  Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
220
+ Dataset(name="scala-it", language=ITALIAN, task=GRAMMAR),
221
 
222
  Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
223
  Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
 
228
  Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
229
  Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
230
  Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
231
+ Dataset(name="squad-it", language=ITALIAN, task=READING_COMPREHENSION),
232
 
233
  Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
234
  Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
 
238
  Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
239
  Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
240
  Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
241
+ Dataset(name="ilpost-sum", language=ITALIAN, task=SUMMARISATION),
242
 
243
  Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
244
  Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
 
249
  Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
250
  Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
251
  Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
252
+ Dataset(name="mmlu-it", language=ITALIAN, task=KNOWLEDGE),
253
 
254
  Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
255
  Dataset(name="hellaswag-no", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
 
259
  Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
260
  Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
261
  Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
262
+ Dataset(name="hellaswag-it", language=ITALIAN, task=COMMON_SENSE_REASONING),
263
  ]
264
 
265