Spaces:
Restarting
on
CPU Upgrade
Restarting
on
CPU Upgrade
add polqa tasks
Browse files- src/about.py +24 -18
src/about.py
CHANGED
@@ -32,7 +32,10 @@ class Tasks(Enum):
|
|
32 |
task17 = Task("polish_cbd_regex", "f1,score-first", "cbd_g", "generate_until")
|
33 |
task18 = Task("polish_klej_ner_multiple_choice", "acc,none", "klej_ner_mc", "multiple_choice")
|
34 |
task19 = Task("polish_klej_ner_regex", "exact_match,score-first", "klej_ner_g", "generate_until")
|
35 |
-
task20 = Task("polish_poleval2018_task3_test_10k", "word_perplexity,none", "
|
|
|
|
|
|
|
36 |
|
37 |
NUM_FEWSHOT = 0 # Change with your few shot
|
38 |
# ---------------------------------------------------
|
@@ -81,25 +84,28 @@ or join our [Discord SpeakLeash](https://discord.gg/3G9DVM39)
|
|
81 |
|
82 |
| Task | Dataset | Metric | Type |
|
83 |
|---------------------------------|---------------------------------------|-----------|-----------------|
|
84 |
-
| belebele_pol_Latn | facebook/belebele | accuracy | multiple_choice |
|
85 |
| polemo2_in | allegro/klej-polemo2-in | accuracy | generate_until |
|
86 |
-
|
|
87 |
| polemo2_out | allegro/klej-polemo2-out | accuracy | generate_until |
|
88 |
-
|
|
89 |
-
|
|
90 |
-
|
|
91 |
-
|
|
92 |
-
|
|
93 |
-
|
|
94 |
-
|
|
95 |
-
|
|
96 |
-
|
|
97 |
-
|
|
98 |
-
|
|
99 |
-
|
|
100 |
-
|
|
101 |
-
|
|
102 |
-
|
|
|
|
|
|
|
|
|
|
103 |
|
104 |
## Reproducibility
|
105 |
To reproduce our results, you need to clone the repository:
|
|
|
32 |
task17 = Task("polish_cbd_regex", "f1,score-first", "cbd_g", "generate_until")
|
33 |
task18 = Task("polish_klej_ner_multiple_choice", "acc,none", "klej_ner_mc", "multiple_choice")
|
34 |
task19 = Task("polish_klej_ner_regex", "exact_match,score-first", "klej_ner_g", "generate_until")
|
35 |
+
task20 = Task("polish_poleval2018_task3_test_10k", "word_perplexity,none", "poleval2018_task3_test_10k", "other")
|
36 |
+
task21 = Task("polish_polqa_reranking_multiple_choice", "acc,none", "polqa_reranking_mc", "other") # multiple_choice
|
37 |
+
task22 = Task("polish_polqa_open_book", "levenshtein,none", "polqa_open_book_g", "other") # generate_until
|
38 |
+
task23 = Task("polish_polqa_closed_book", "levenshtein,none", "polqa_closed_book_g", "other") # generate_until
|
39 |
|
40 |
NUM_FEWSHOT = 0 # Change with your few shot
|
41 |
# ---------------------------------------------------
|
|
|
84 |
|
85 |
| Task | Dataset | Metric | Type |
|
86 |
|---------------------------------|---------------------------------------|-----------|-----------------|
|
|
|
87 |
| polemo2_in | allegro/klej-polemo2-in | accuracy | generate_until |
|
88 |
+
| polemo2_in_mc | allegro/klej-polemo2-in | accuracy | multiple_choice |
|
89 |
| polemo2_out | allegro/klej-polemo2-out | accuracy | generate_until |
|
90 |
+
| polemo2_out_mc | allegro/klej-polemo2-out | accuracy | multiple_choice |
|
91 |
+
| 8tags_mc | sdadas/8tags | accuracy | multiple_choice |
|
92 |
+
| 8tags_g | sdadas/8tags | accuracy | generate_until |
|
93 |
+
| belebele_mc | facebook/belebele | accuracy | multiple_choice |
|
94 |
+
| belebele_g | facebook/belebele | accuracy | generate_until |
|
95 |
+
| dyk_mc | allegro/klej-dyk | binary F1 | multiple_choice |
|
96 |
+
| dyk_g | allegro/klej-dyk | binary F1 | generate_until |
|
97 |
+
| ppc_mc | sdadas/ppc | accuracy | multiple_choice |
|
98 |
+
| ppc_g | sdadas/ppc | accuracy | generate_until |
|
99 |
+
| psc_mc | allegro/klej-psc | binary F1 | multiple_choice |
|
100 |
+
| psc_g | allegro/klej-psc | binary F1 | generate_until |
|
101 |
+
| cbd_mc | ptaszynski/PolishCyberbullyingDataset | macro F1 | multiple_choice |
|
102 |
+
| cbd_g | ptaszynski/PolishCyberbullyingDataset | macro F1 | generate_until |
|
103 |
+
| klej_ner_mc | allegro/klej-nkjp-ner | accuracy | multiple_choice |
|
104 |
+
| klej_ner_g | allegro/klej-nkjp-ner | accuracy | generate_until |
|
105 |
+
| poleval2018_task3_test_10k | enelpol/poleval2018_task3_test_10k | word perplexity | other |
|
106 |
+
| polqa_reranking_mc | ipipan/polqa | accuracy | other |
|
107 |
+
| polqa_open_book_g | ipipan/polqa | levenshtein | other |
|
108 |
+
| polqa_closed_book_g | ipipan/polqa | levenshtein | other |
|
109 |
|
110 |
## Reproducibility
|
111 |
To reproduce our results, you need to clone the repository:
|