sileod commited on
Commit
95fb3b0
1 Parent(s): a8b808d

Upload DebertaV2ForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +98 -94
  2. pytorch_model.bin +1 -1
config.json CHANGED
@@ -289,11 +289,11 @@
289
  28,
290
  3,
291
  6,
292
- 4,
293
  5,
294
  6,
295
  7,
296
  3,
 
297
  2,
298
  2,
299
  20,
@@ -305,9 +305,9 @@
305
  6,
306
  4,
307
  2,
308
- 4,
309
  3,
310
  3,
 
311
  2,
312
  13,
313
  2,
@@ -387,6 +387,7 @@
387
  2,
388
  2,
389
  2,
 
390
  3,
391
  2,
392
  2,
@@ -452,6 +453,7 @@
452
  1,
453
  1,
454
  2,
 
455
  3,
456
  3,
457
  3,
@@ -569,106 +571,106 @@
569
  "model-written-evals",
570
  "truthful_qa/multiple_choice",
571
  "fig-qa",
572
- "bigbench/novel_concepts",
573
- "bigbench/winowhy",
574
- "bigbench/dark_humor_detection",
575
- "bigbench/crass_ai",
576
- "bigbench/undo_permutation",
577
- "bigbench/logical_fallacy_detection",
578
- "bigbench/analytic_entailment",
579
- "bigbench/similarities_abstraction",
580
- "bigbench/simple_ethical_questions",
581
- "bigbench/intent_recognition",
582
- "bigbench/english_proverbs",
583
  "bigbench/penguins_in_a_table",
584
- "bigbench/hyperbaton",
585
- "bigbench/phrase_relatedness",
586
- "bigbench/social_support",
587
- "bigbench/symbol_interpretation",
588
- "bigbench/play_dialog_same_or_different",
589
- "bigbench/discourse_marker_prediction",
590
- "bigbench/human_organs_senses",
591
- "bigbench/date_understanding",
592
  "bigbench/contextual_parametric_knowledge_conflicts",
593
- "bigbench/code_line_description",
594
- "bigbench/moral_permissibility",
595
- "bigbench/crash_blossom",
 
 
 
 
 
 
596
  "bigbench/nonsense_words_grammar",
597
- "bigbench/conceptual_combinations",
598
- "bigbench/identify_odd_metaphor",
599
- "bigbench/question_selection",
 
 
 
 
600
  "bigbench/mathematical_induction",
601
- "bigbench/logical_args",
 
 
602
  "bigbench/arithmetic",
603
- "bigbench/temporal_sequences",
604
- "bigbench/sports_understanding",
605
- "bigbench/timedial",
 
 
 
606
  "bigbench/hindu_knowledge",
607
- "bigbench/navigate",
608
- "bigbench/unit_interpretation",
609
- "bigbench/figure_of_speech_detection",
610
- "bigbench/authorship_verification",
611
- "bigbench/entailed_polarity",
612
- "bigbench/odd_one_out",
613
  "bigbench/physics",
 
 
 
 
 
614
  "bigbench/dyck_languages",
615
- "bigbench/riddle_sense",
616
- "bigbench/physical_intuition",
617
- "bigbench/checkmate_in_one",
618
- "bigbench/gre_reading_comprehension",
619
- "bigbench/causal_judgment",
620
- "bigbench/misconceptions",
621
  "bigbench/presuppositions_as_nli",
622
- "bigbench/anachronisms",
623
- "bigbench/vitaminc_fact_verification",
624
- "bigbench/movie_dialog_same_or_different",
625
- "bigbench/implicatures",
626
- "bigbench/bbq_lite_json",
627
- "bigbench/emoji_movie",
628
- "bigbench/geometric_shapes",
629
- "bigbench/metaphor_boolean",
630
- "bigbench/understanding_fables",
631
- "bigbench/cause_and_effect",
632
  "bigbench/elementary_math_qa",
633
- "bigbench/formal_fallacies_syllogisms_negation",
634
- "bigbench/fact_checker",
635
- "bigbench/evaluating_information_essentiality",
636
- "bigbench/salient_translation_error_detection",
637
- "bigbench/sentence_ambiguity",
638
  "bigbench/cs_algorithms",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
639
  "bigbench/hhh_alignment",
640
- "bigbench/social_iqa",
641
- "bigbench/abstract_narrative_understanding",
642
  "bigbench/implicit_relations",
643
- "bigbench/known_unknowns",
644
- "bigbench/identify_math_theorems",
645
- "bigbench/tracking_shuffled_objects",
646
  "bigbench/disambiguation_qa",
647
- "bigbench/logic_grid_puzzle",
648
- "bigbench/suicide_risk",
649
- "bigbench/snarks",
650
- "bigbench/goal_step_wikihow",
651
- "bigbench/cifar10_classification",
652
- "bigbench/analogical_similarity",
653
- "bigbench/international_phonetic_alphabet_nli",
654
- "bigbench/epistemic_reasoning",
655
- "bigbench/logical_deduction",
656
- "bigbench/mnist_ascii",
657
- "bigbench/emojis_emotion_prediction",
658
- "bigbench/movie_recommendation",
659
- "bigbench/real_or_fake_text",
660
  "bigbench/fantasy_reasoning",
661
- "bigbench/ruin_names",
662
- "bigbench/general_knowledge",
 
 
 
663
  "bigbench/reasoning_about_colored_objects",
664
- "bigbench/key_value_maps",
665
- "bigbench/logical_sequence",
666
- "bigbench/color",
667
- "bigbench/strategyqa",
668
- "bigbench/irony_identification",
669
- "bigbench/empirical_judgments",
670
- "bigbench/strange_stories",
671
- "bigbench/metaphor_understanding",
672
  "cos_e/v1.0",
673
  "cosmos_qa",
674
  "dream",
@@ -777,11 +779,11 @@
777
  "go_emotions/simplified",
778
  "scicite",
779
  "liar",
780
- "lexical_relation_classification/K&H+N",
781
  "lexical_relation_classification/CogALexV",
782
  "lexical_relation_classification/BLESS",
783
  "lexical_relation_classification/EVALution",
784
  "lexical_relation_classification/ROOT09",
 
785
  "linguisticprobing/subj_number",
786
  "linguisticprobing/bigram_shift",
787
  "linguisticprobing/top_constituents",
@@ -793,9 +795,9 @@
793
  "linguisticprobing/sentence_length",
794
  "crowdflower/sentiment_nuclear_power",
795
  "crowdflower/tweet_global_warming",
796
- "crowdflower/corporate-messaging",
797
- "crowdflower/economic-news",
798
  "crowdflower/airline-sentiment",
 
 
799
  "crowdflower/political-media-bias",
800
  "crowdflower/text_emotion",
801
  "crowdflower/political-media-audience",
@@ -871,8 +873,9 @@
871
  "scruples",
872
  "wouldyourather",
873
  "attempto-nli",
874
- "defeasible-nli/atomic",
875
  "defeasible-nli/snli",
 
 
876
  "nli-veridicality-transitivity",
877
  "natural-language-satisfiability",
878
  "lonli",
@@ -894,8 +897,8 @@
894
  "redefine-math",
895
  "puzzte",
896
  "implicatures",
897
- "race/high",
898
  "race/middle",
 
899
  "race-c",
900
  "spartqa-yn",
901
  "spartqa-mchoice",
@@ -921,12 +924,12 @@
921
  "oasst1_dense_flat/helpfulness",
922
  "PARARULE-Plus",
923
  "mindgames",
924
- "universal_dependencies/en_partut/deprel",
925
- "universal_dependencies/en_lines/deprel",
926
- "universal_dependencies/en_gumreddit/deprel",
927
  "universal_dependencies/en_esl/deprel",
928
  "universal_dependencies/en_ewt/deprel",
929
  "universal_dependencies/en_gum/deprel",
 
 
 
930
  "ambient",
931
  "path-naturalness-prediction",
932
  "civil_comments/toxicity",
@@ -939,6 +942,7 @@
939
  "cloth",
940
  "dgen",
941
  "oasst1_pairwise_rlhf_reward",
 
942
  "babi_nli",
943
  "gen_debiased_nli",
944
  "imppres/presupposition",
 
289
  28,
290
  3,
291
  6,
 
292
  5,
293
  6,
294
  7,
295
  3,
296
+ 4,
297
  2,
298
  2,
299
  20,
 
305
  6,
306
  4,
307
  2,
 
308
  3,
309
  3,
310
+ 4,
311
  2,
312
  13,
313
  2,
 
387
  2,
388
  2,
389
  2,
390
+ 2,
391
  3,
392
  2,
393
  2,
 
453
  1,
454
  1,
455
  2,
456
+ 2,
457
  3,
458
  3,
459
  3,
 
571
  "model-written-evals",
572
  "truthful_qa/multiple_choice",
573
  "fig-qa",
574
+ "bigbench/conceptual_combinations",
575
+ "bigbench/international_phonetic_alphabet_nli",
576
+ "bigbench/anachronisms",
577
+ "bigbench/mnist_ascii",
578
+ "bigbench/physical_intuition",
579
+ "bigbench/crash_blossom",
580
+ "bigbench/timedial",
581
+ "bigbench/entailed_polarity",
582
+ "bigbench/color",
583
+ "bigbench/question_selection",
 
584
  "bigbench/penguins_in_a_table",
585
+ "bigbench/key_value_maps",
586
+ "bigbench/metaphor_boolean",
587
+ "bigbench/formal_fallacies_syllogisms_negation",
588
+ "bigbench/emoji_movie",
589
+ "bigbench/strange_stories",
 
 
 
590
  "bigbench/contextual_parametric_knowledge_conflicts",
591
+ "bigbench/identify_math_theorems",
592
+ "bigbench/logical_deduction",
593
+ "bigbench/logical_args",
594
+ "bigbench/emojis_emotion_prediction",
595
+ "bigbench/movie_dialog_same_or_different",
596
+ "bigbench/general_knowledge",
597
+ "bigbench/novel_concepts",
598
+ "bigbench/understanding_fables",
599
+ "bigbench/checkmate_in_one",
600
  "bigbench/nonsense_words_grammar",
601
+ "bigbench/logical_fallacy_detection",
602
+ "bigbench/cause_and_effect",
603
+ "bigbench/authorship_verification",
604
+ "bigbench/goal_step_wikihow",
605
+ "bigbench/irony_identification",
606
+ "bigbench/known_unknowns",
607
+ "bigbench/phrase_relatedness",
608
  "bigbench/mathematical_induction",
609
+ "bigbench/metaphor_understanding",
610
+ "bigbench/date_understanding",
611
+ "bigbench/evaluating_information_essentiality",
612
  "bigbench/arithmetic",
613
+ "bigbench/movie_recommendation",
614
+ "bigbench/intent_recognition",
615
+ "bigbench/human_organs_senses",
616
+ "bigbench/misconceptions",
617
+ "bigbench/logic_grid_puzzle",
618
+ "bigbench/tracking_shuffled_objects",
619
  "bigbench/hindu_knowledge",
620
+ "bigbench/social_support",
 
 
 
 
 
621
  "bigbench/physics",
622
+ "bigbench/vitaminc_fact_verification",
623
+ "bigbench/navigate",
624
+ "bigbench/hyperbaton",
625
+ "bigbench/undo_permutation",
626
+ "bigbench/similarities_abstraction",
627
  "bigbench/dyck_languages",
 
 
 
 
 
 
628
  "bigbench/presuppositions_as_nli",
629
+ "bigbench/empirical_judgments",
630
+ "bigbench/snarks",
631
+ "bigbench/logical_sequence",
632
+ "bigbench/abstract_narrative_understanding",
633
+ "bigbench/odd_one_out",
634
+ "bigbench/suicide_risk",
 
 
 
 
635
  "bigbench/elementary_math_qa",
636
+ "bigbench/analogical_similarity",
637
+ "bigbench/social_iqa",
638
+ "bigbench/unit_interpretation",
639
+ "bigbench/temporal_sequences",
 
640
  "bigbench/cs_algorithms",
641
+ "bigbench/ruin_names",
642
+ "bigbench/moral_permissibility",
643
+ "bigbench/causal_judgment",
644
+ "bigbench/code_line_description",
645
+ "bigbench/epistemic_reasoning",
646
+ "bigbench/cifar10_classification",
647
+ "bigbench/implicatures",
648
+ "bigbench/simple_ethical_questions",
649
+ "bigbench/riddle_sense",
650
+ "bigbench/winowhy",
651
+ "bigbench/sports_understanding",
652
+ "bigbench/identify_odd_metaphor",
653
+ "bigbench/geometric_shapes",
654
+ "bigbench/gre_reading_comprehension",
655
+ "bigbench/symbol_interpretation",
656
  "bigbench/hhh_alignment",
 
 
657
  "bigbench/implicit_relations",
 
 
 
658
  "bigbench/disambiguation_qa",
659
+ "bigbench/play_dialog_same_or_different",
660
+ "bigbench/strategyqa",
661
+ "bigbench/discourse_marker_prediction",
662
+ "bigbench/analytic_entailment",
663
+ "bigbench/bbq_lite_json",
664
+ "bigbench/dark_humor_detection",
665
+ "bigbench/english_proverbs",
 
 
 
 
 
 
666
  "bigbench/fantasy_reasoning",
667
+ "bigbench/real_or_fake_text",
668
+ "bigbench/fact_checker",
669
+ "bigbench/salient_translation_error_detection",
670
+ "bigbench/crass_ai",
671
+ "bigbench/sentence_ambiguity",
672
  "bigbench/reasoning_about_colored_objects",
673
+ "bigbench/figure_of_speech_detection",
 
 
 
 
 
 
 
674
  "cos_e/v1.0",
675
  "cosmos_qa",
676
  "dream",
 
779
  "go_emotions/simplified",
780
  "scicite",
781
  "liar",
 
782
  "lexical_relation_classification/CogALexV",
783
  "lexical_relation_classification/BLESS",
784
  "lexical_relation_classification/EVALution",
785
  "lexical_relation_classification/ROOT09",
786
+ "lexical_relation_classification/K&H+N",
787
  "linguisticprobing/subj_number",
788
  "linguisticprobing/bigram_shift",
789
  "linguisticprobing/top_constituents",
 
795
  "linguisticprobing/sentence_length",
796
  "crowdflower/sentiment_nuclear_power",
797
  "crowdflower/tweet_global_warming",
 
 
798
  "crowdflower/airline-sentiment",
799
+ "crowdflower/economic-news",
800
+ "crowdflower/corporate-messaging",
801
  "crowdflower/political-media-bias",
802
  "crowdflower/text_emotion",
803
  "crowdflower/political-media-audience",
 
873
  "scruples",
874
  "wouldyourather",
875
  "attempto-nli",
 
876
  "defeasible-nli/snli",
877
+ "defeasible-nli/atomic",
878
+ "help-nli",
879
  "nli-veridicality-transitivity",
880
  "natural-language-satisfiability",
881
  "lonli",
 
897
  "redefine-math",
898
  "puzzte",
899
  "implicatures",
 
900
  "race/middle",
901
+ "race/high",
902
  "race-c",
903
  "spartqa-yn",
904
  "spartqa-mchoice",
 
924
  "oasst1_dense_flat/helpfulness",
925
  "PARARULE-Plus",
926
  "mindgames",
 
 
 
927
  "universal_dependencies/en_esl/deprel",
928
  "universal_dependencies/en_ewt/deprel",
929
  "universal_dependencies/en_gum/deprel",
930
+ "universal_dependencies/en_gumreddit/deprel",
931
+ "universal_dependencies/en_lines/deprel",
932
+ "universal_dependencies/en_partut/deprel",
933
  "ambient",
934
  "path-naturalness-prediction",
935
  "civil_comments/toxicity",
 
942
  "cloth",
943
  "dgen",
944
  "oasst1_pairwise_rlhf_reward",
945
+ "I2D2",
946
  "babi_nli",
947
  "gen_debiased_nli",
948
  "imppres/presupposition",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b613bfb3264fdb4336c063a4ca45befdd3f2c36933a878e9b8763be026773e1
3
  size 737771833
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:162ed65448424ffdffbe0505359fb62ab99bcfa2865f7e8449e3f84b19903485
3
  size 737771833