Commit cdd9094 · 1 parent: 9fa29df
feat: Add support for Italian
Browse files
app.py
CHANGED
@@ -176,6 +176,7 @@ FAROESE = Language(code="fo", name="Faroese")
|
|
176 |
FRENCH = Language(code="fr", name="French")
|
177 |
GERMAN = Language(code="de", name="German")
|
178 |
ICELANDIC = Language(code="is", name="Icelandic")
|
|
|
179 |
NORWEGIAN = Language(code="no", name="Norwegian")
|
180 |
SWEDISH = Language(code="sv", name="Swedish")
|
181 |
ALL_LANGUAGES = {
|
@@ -192,6 +193,7 @@ DATASETS = [
|
|
192 |
Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
|
193 |
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
194 |
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
|
|
195 |
|
196 |
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
197 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
@@ -203,6 +205,7 @@ DATASETS = [
|
|
203 |
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
204 |
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
205 |
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
|
|
206 |
|
207 |
Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
|
208 |
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
@@ -214,6 +217,7 @@ DATASETS = [
|
|
214 |
Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
|
215 |
Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
|
216 |
Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
|
|
|
217 |
|
218 |
Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
|
219 |
Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
|
@@ -224,6 +228,7 @@ DATASETS = [
|
|
224 |
Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
|
225 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
226 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
|
|
227 |
|
228 |
Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
|
229 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
@@ -233,6 +238,7 @@ DATASETS = [
|
|
233 |
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
234 |
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
235 |
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
|
|
236 |
|
237 |
Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
|
238 |
Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
|
@@ -243,6 +249,7 @@ DATASETS = [
|
|
243 |
Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
|
244 |
Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
|
245 |
Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
|
|
|
246 |
|
247 |
Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
|
248 |
Dataset(name="hellaswag-no", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
@@ -252,6 +259,7 @@ DATASETS = [
|
|
252 |
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
253 |
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
254 |
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
|
|
255 |
]
|
256 |
|
257 |
|
|
|
176 |
FRENCH = Language(code="fr", name="French")
|
177 |
GERMAN = Language(code="de", name="German")
|
178 |
ICELANDIC = Language(code="is", name="Icelandic")
|
179 |
+
ITALIAN = Language(code="it", name="Italian")
|
180 |
NORWEGIAN = Language(code="no", name="Norwegian")
|
181 |
SWEDISH = Language(code="sv", name="Swedish")
|
182 |
ALL_LANGUAGES = {
|
|
|
193 |
Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
|
194 |
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
195 |
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
196 |
+
Dataset(name="sentipolc16", language=ITALIAN, task=TEXT_CLASSIFICATION),
|
197 |
|
198 |
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
199 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
|
|
205 |
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
206 |
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
207 |
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
208 |
+
Dataset(name="multinerd-it", language=ITALIAN, task=INFORMATION_EXTRACTION),
|
209 |
|
210 |
Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
|
211 |
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
|
|
217 |
Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
|
218 |
Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
|
219 |
Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
|
220 |
+
Dataset(name="scala-it", language=ITALIAN, task=GRAMMAR),
|
221 |
|
222 |
Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
|
223 |
Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
|
|
|
228 |
Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
|
229 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
230 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
231 |
+
Dataset(name="squad-it", language=ITALIAN, task=READING_COMPREHENSION),
|
232 |
|
233 |
Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
|
234 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
|
|
238 |
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
239 |
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
240 |
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
241 |
+
Dataset(name="ilpost-sum", language=ITALIAN, task=SUMMARISATION),
|
242 |
|
243 |
Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
|
244 |
Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
|
|
|
249 |
Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
|
250 |
Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
|
251 |
Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
|
252 |
+
Dataset(name="mmlu-it", language=ITALIAN, task=KNOWLEDGE),
|
253 |
|
254 |
Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
|
255 |
Dataset(name="hellaswag-no", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
|
|
259 |
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
260 |
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
261 |
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
262 |
+
Dataset(name="hellaswag-it", language=ITALIAN, task=COMMON_SENSE_REASONING),
|
263 |
]
|
264 |
|
265 |
|