LLM_Detection_Attribution / ood_results.json
wissamantoun's picture
Upload ood_results.json
28f58b8
raw
history blame
No virus
120 kB
[{
"model_name": "mpt-30b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6557377049180327,
"f1": 0.609451219512195,
"precision": 0.7961165048543689,
"recall": 0.6557377049180328,
"auc": 0.5048374092985757
},
{
"model_name": "mpt-30b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5819672131147541,
"f1": 0.4934462264918993,
"precision": 0.7723214285714286,
"recall": 0.5819672131147541,
"auc": 0.708008599838753
},
{
"model_name": "mpt-30b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.6883902176834185
},
{
"model_name": "mpt-30b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.6490190808922334
},
{
"model_name": "mpt-30b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.707874227358237
},
{
"model_name": "openllama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5819672131147541,
"f1": 0.5226697353279632,
"precision": 0.6629273504273505,
"recall": 0.5819672131147541,
"auc": 0.6484815909701692
},
{
"model_name": "openllama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5737704918032787,
"f1": 0.5566116857701985,
"precision": 0.587281399046105,
"recall": 0.5737704918032787,
"auc": 0.570276807309863
},
{
"model_name": "openllama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6147540983606558,
"f1": 0.5709047369602633,
"precision": 0.6940909090909091,
"recall": 0.6147540983606558,
"auc": 0.6772373018005912
},
{
"model_name": "openllama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.6052136522440205
},
{
"model_name": "openllama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6311475409836066,
"f1": 0.5788262370540851,
"precision": 0.7606837606837606,
"recall": 0.6311475409836065,
"auc": 0.5925826390755173
},
{
"model_name": "vicuna-33b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.6834184359043268
},
{
"model_name": "vicuna-33b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.680327868852459,
"f1": 0.6439422285414952,
"precision": 0.8049999999999999,
"recall": 0.680327868852459,
"auc": 0.6049449072829884
},
{
"model_name": "vicuna-33b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.8071754904595538
},
{
"model_name": "vicuna-33b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.7786885245901639
},
{
"model_name": "vicuna-33b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5655737704918032,
"f1": 0.4645134575569358,
"precision": 0.7675438596491229,
"recall": 0.5655737704918032,
"auc": 0.8501746842246708
},
{
"model_name": "pythia-410m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5151033386327504,
"precision": 0.7367678193366267,
"recall": 0.5901639344262295,
"auc": 0.7304488040849234
},
{
"model_name": "pythia-410m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6229508196721312,
"f1": 0.5665739882607352,
"precision": 0.7563025210084033,
"recall": 0.6229508196721312,
"auc": 0.7973662993818866
},
{
"model_name": "pythia-410m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.7041117979037892
},
{
"model_name": "pythia-410m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5245901639344263,
"f1": 0.38576388888888885,
"precision": 0.7563025210084033,
"recall": 0.5245901639344263,
"auc": 0.6750873421123353
},
{
"model_name": "pythia-410m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5327868852459017,
"f1": 0.4136099165190994,
"precision": 0.6752873563218391,
"recall": 0.5327868852459017,
"auc": 0.6057511421660844
},
{
"model_name": "alfred-40b-0723",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.9684224670787422
},
{
"model_name": "alfred-40b-0723",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.7125772641762966
},
{
"model_name": "alfred-40b-0723",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.8250470303681807
},
{
"model_name": "alfred-40b-0723",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.903520558989519
},
{
"model_name": "alfred-40b-0723",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.7132491265788767
},
{
"model_name": "vicuna-13b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.8238376780435367
},
{
"model_name": "vicuna-13b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5983606557377049,
"f1": 0.5211087078426659,
"precision": 0.7772727272727273,
"recall": 0.5983606557377049,
"auc": 0.8001881214727223
},
{
"model_name": "vicuna-13b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6311475409836066,
"f1": 0.573061668870052,
"precision": 0.7877358490566038,
"recall": 0.6311475409836066,
"auc": 0.5052405267401237
},
{
"model_name": "vicuna-13b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.8797366299381887
},
{
"model_name": "vicuna-13b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6967213114754098,
"f1": 0.666000739918609,
"precision": 0.8112244897959184,
"recall": 0.6967213114754098,
"auc": 0.8152378392905133
},
{
"model_name": "pythia-2.8b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6065573770491803,
"f1": 0.5477293790546802,
"precision": 0.7221288515406162,
"recall": 0.6065573770491803,
"auc": 0.7187583982800322
},
{
"model_name": "pythia-2.8b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.4820155411359449,
"precision": 0.6848484848484848,
"recall": 0.5655737704918032,
"auc": 0.7571889277076055
},
{
"model_name": "pythia-2.8b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5722560975609756,
"precision": 0.7337761880429228,
"recall": 0.6229508196721312,
"auc": 0.7511421660843859
},
{
"model_name": "pythia-2.8b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6229508196721312,
"f1": 0.5722560975609756,
"precision": 0.7337761880429228,
"recall": 0.6229508196721312,
"auc": 0.6691749529696318
},
{
"model_name": "pythia-2.8b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5655737704918032,
"f1": 0.4820155411359449,
"precision": 0.6848484848484848,
"recall": 0.5655737704918032,
"auc": 0.5747110991668907
},
{
"model_name": "bloom-7.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.6815372211771029
},
{
"model_name": "bloom-7.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6147540983606558,
"f1": 0.5601074031453778,
"precision": 0.7280982905982906,
"recall": 0.6147540983606558,
"auc": 0.7308519215264714
},
{
"model_name": "bloom-7.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5737704918032787,
"f1": 0.4877260981912145,
"precision": 0.7248157248157248,
"recall": 0.5737704918032787,
"auc": 0.6871808653587745
},
{
"model_name": "bloom-7.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5901639344262295,
"f1": 0.5222431077694234,
"precision": 0.7090342679127726,
"recall": 0.5901639344262295,
"auc": 0.7199677506046762
},
{
"model_name": "bloom-7.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.680327868852459,
"f1": 0.6479467258601554,
"precision": 0.7852891156462585,
"recall": 0.680327868852459,
"auc": 0.7274926095135715
},
{
"model_name": "pythia-160m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5573770491803278,
"f1": 0.4591133004926109,
"precision": 0.7099311701081612,
"recall": 0.5573770491803278,
"auc": 0.779226014512228
},
{
"model_name": "pythia-160m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6557377049180327,
"f1": 0.6142728093947607,
"precision": 0.7732201791607731,
"recall": 0.6557377049180327,
"auc": 0.8505778016662188
},
{
"model_name": "pythia-160m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.7669981187852728
},
{
"model_name": "pythia-160m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5491803278688525,
"f1": 0.44430641821946165,
"precision": 0.700657894736842,
"recall": 0.5491803278688524,
"auc": 0.6178446654125235
},
{
"model_name": "pythia-160m-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5327868852459017,
"f1": 0.4136099165190994,
"precision": 0.6752873563218391,
"recall": 0.5327868852459017,
"auc": 0.7280300994356356
},
{
"model_name": "bloom-1.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6639344262295082,
"f1": 0.6256828556461873,
"precision": 0.7772727272727273,
"recall": 0.6639344262295082,
"auc": 0.7944101048105348
},
{
"model_name": "bloom-1.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5491803278688525,
"f1": 0.43418500716755204,
"precision": 0.7629310344827587,
"recall": 0.5491803278688525,
"auc": 0.7434829346949744
},
{
"model_name": "bloom-1.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6147540983606558,
"f1": 0.5540866319309432,
"precision": 0.7517688679245282,
"recall": 0.6147540983606558,
"auc": 0.7004837409298575
},
{
"model_name": "bloom-1.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.7375705455522709
},
{
"model_name": "bloom-1.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.6273851115291589
},
{
"model_name": "openllama-2-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5151033386327504,
"precision": 0.7367678193366267,
"recall": 0.5901639344262295,
"auc": 0.7120397742542327
},
{
"model_name": "openllama-2-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5491803278688525,
"f1": 0.45371651876577385,
"precision": 0.6633928571428571,
"recall": 0.5491803278688524,
"auc": 0.6130072561139479
},
{
"model_name": "openllama-2-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5737704918032787,
"f1": 0.5031328320802004,
"precision": 0.6710280373831776,
"recall": 0.5737704918032787,
"auc": 0.6729373824240795
},
{
"model_name": "openllama-2-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5655737704918032,
"f1": 0.49716152111361694,
"precision": 0.6438679245283019,
"recall": 0.5655737704918034,
"auc": 0.5732330018812148
},
{
"model_name": "openllama-2-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6147540983606558,
"f1": 0.5709047369602633,
"precision": 0.6940909090909091,
"recall": 0.6147540983606558,
"auc": 0.6140822359580758
},
{
"model_name": "opt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5491803278688525,
"f1": 0.43418500716755204,
"precision": 0.7629310344827587,
"recall": 0.5491803278688525,
"auc": 0.5853265251276539
},
{
"model_name": "opt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5327868852459017,
"f1": 0.4136099165190994,
"precision": 0.6752873563218391,
"recall": 0.5327868852459017,
"auc": 0.4273044880408492
},
{
"model_name": "opt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5409836065573771,
"f1": 0.429144385026738,
"precision": 0.6894409937888198,
"recall": 0.540983606557377,
"auc": 0.584251545283526
},
{
"model_name": "opt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5245901639344263,
"f1": 0.40875668449197855,
"precision": 0.613664596273292,
"recall": 0.5245901639344263,
"auc": 0.4486697124428917
},
{
"model_name": "opt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5491803278688525,
"f1": 0.46246895778258434,
"precision": 0.6386363636363637,
"recall": 0.5491803278688524,
"auc": 0.5111529158828272
},
{
"model_name": "opt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5573770491803278,
"f1": 0.4495320855614974,
"precision": 0.7652173913043478,
"recall": 0.5573770491803278,
"auc": 0.6719967750604676
},
{
"model_name": "opt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5245901639344263,
"f1": 0.3976847122914538,
"precision": 0.6564102564102564,
"recall": 0.5245901639344263,
"auc": 0.48938457403923674
},
{
"model_name": "opt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5573770491803278,
"f1": 0.46802325581395354,
"precision": 0.6748566748566749,
"recall": 0.5573770491803278,
"auc": 0.4778285407148616
},
{
"model_name": "opt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5327868852459017,
"f1": 0.42409937888198757,
"precision": 0.6337719298245614,
"recall": 0.5327868852459017,
"auc": 0.52848696586939
},
{
"model_name": "opt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5409836065573771,
"f1": 0.429144385026738,
"precision": 0.6894409937888198,
"recall": 0.540983606557377,
"auc": 0.583042192958882
},
{
"model_name": "llama-2-70b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.680327868852459,
"f1": 0.6479467258601554,
"precision": 0.7852891156462585,
"recall": 0.680327868852459,
"auc": 0.7471109916689063
},
{
"model_name": "llama-2-70b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6721311475409836,
"f1": 0.6479076479076479,
"precision": 0.7374860956618465,
"recall": 0.6721311475409837,
"auc": 0.6390755173340499
},
{
"model_name": "llama-2-70b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.639344262295082,
"f1": 0.6049455401825139,
"precision": 0.7138144329896907,
"recall": 0.639344262295082,
"auc": 0.6890620800859983
},
{
"model_name": "llama-2-70b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6557377049180327,
"f1": 0.6418786692759295,
"precision": 0.6842607313195549,
"recall": 0.6557377049180327,
"auc": 0.625369524321419
},
{
"model_name": "llama-2-70b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6311475409836066,
"f1": 0.5788262370540851,
"precision": 0.7606837606837606,
"recall": 0.6311475409836065,
"auc": 0.7374361730717549
},
{
"model_name": "llama-2-70b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6721311475409836,
"f1": 0.6408595819841036,
"precision": 0.7641237113402062,
"recall": 0.6721311475409836,
"auc": 0.6365224402042462
},
{
"model_name": "llama-2-70b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.680327868852459,
"f1": 0.6516582473094663,
"precision": 0.7688301282051282,
"recall": 0.680327868852459,
"auc": 0.5325181402848697
},
{
"model_name": "llama-2-70b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6721311475409836,
"f1": 0.6408595819841036,
"precision": 0.7641237113402062,
"recall": 0.6721311475409836,
"auc": 0.6847621607094866
},
{
"model_name": "llama-2-70b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6967213114754098,
"f1": 0.6855451062347615,
"precision": 0.7293233082706767,
"recall": 0.6967213114754098,
"auc": 0.6886589626444504
},
{
"model_name": "llama-2-70b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6967213114754098,
"f1": 0.6727799927509968,
"precision": 0.7781155015197568,
"recall": 0.6967213114754098,
"auc": 0.7678043536683689
},
{
"model_name": "llama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.7651169040580489
},
{
"model_name": "llama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6065573770491803,
"f1": 0.5690314983809244,
"precision": 0.6635051546391753,
"recall": 0.6065573770491803,
"auc": 0.5888202096210696
},
{
"model_name": "llama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5737704918032787,
"f1": 0.4791461412151067,
"precision": 0.7699115044247787,
"recall": 0.5737704918032787,
"auc": 0.7668637463047567
},
{
"model_name": "llama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6311475409836066,
"f1": 0.573061668870052,
"precision": 0.7877358490566038,
"recall": 0.6311475409836066,
"auc": 0.6726686374630476
},
{
"model_name": "llama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.7143241064230045
},
{
"model_name": "gpt2",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.5486428379467885
},
{
"model_name": "gpt2",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.7868852459016393
},
{
"model_name": "gpt2",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5655737704918032,
"f1": 0.4735813726288366,
"precision": 0.7178571428571429,
"recall": 0.5655737704918032,
"auc": 0.694974469228702
},
{
"model_name": "gpt2",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5491803278688525,
"f1": 0.44430641821946165,
"precision": 0.700657894736842,
"recall": 0.5491803278688524,
"auc": 0.5154528352593388
},
{
"model_name": "gpt2",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5819672131147541,
"f1": 0.4934462264918993,
"precision": 0.7723214285714286,
"recall": 0.5819672131147541,
"auc": 0.6834184359043267
},
{
"model_name": "gpt2-large",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5655737704918032,
"f1": 0.4645134575569358,
"precision": 0.7675438596491229,
"recall": 0.5655737704918032,
"auc": 0.5912389142703574
},
{
"model_name": "gpt2-large",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5819672131147541,
"f1": 0.509112426035503,
"precision": 0.7017195767195767,
"recall": 0.5819672131147541,
"auc": 0.7073367374361731
},
{
"model_name": "gpt2-large",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.4934462264918993,
"precision": 0.7723214285714286,
"recall": 0.5819672131147541,
"auc": 0.6655468959957002
},
{
"model_name": "gpt2-large",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5409836065573771,
"f1": 0.4390804597701149,
"precision": 0.6499508357915438,
"recall": 0.540983606557377,
"auc": 0.6768341843590432
},
{
"model_name": "gpt2-large",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6065573770491803,
"f1": 0.5536585365853659,
"precision": 0.7026060296371998,
"recall": 0.6065573770491803,
"auc": 0.7256113947863477
},
{
"model_name": "pythia-1.4b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5222431077694234,
"precision": 0.7090342679127726,
"recall": 0.5901639344262295,
"auc": 0.664606288632088
},
{
"model_name": "pythia-1.4b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.48986193293885605,
"precision": 0.6613756613756614,
"recall": 0.5655737704918032,
"auc": 0.6636656812684761
},
{
"model_name": "pythia-1.4b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.5226697353279632,
"precision": 0.6629273504273505,
"recall": 0.5819672131147541,
"auc": 0.5730986294006987
},
{
"model_name": "pythia-1.4b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5737704918032787,
"f1": 0.4957074721780603,
"precision": 0.6937191249117854,
"recall": 0.5737704918032787,
"auc": 0.7194302606826122
},
{
"model_name": "pythia-1.4b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5819672131147541,
"f1": 0.509112426035503,
"precision": 0.7017195767195767,
"recall": 0.5819672131147541,
"auc": 0.5950013437248052
},
{
"model_name": "gpt2-medium",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.7125772641762966
},
{
"model_name": "gpt2-medium",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.4820155411359449,
"precision": 0.6848484848484848,
"recall": 0.5655737704918032,
"auc": 0.6558720773985487
},
{
"model_name": "gpt2-medium",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.5226697353279632,
"precision": 0.6629273504273505,
"recall": 0.5819672131147541,
"auc": 0.5919107766729373
},
{
"model_name": "gpt2-medium",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5573770491803278,
"f1": 0.46802325581395354,
"precision": 0.6748566748566749,
"recall": 0.5573770491803278,
"auc": 0.6076323568933082
},
{
"model_name": "gpt2-medium",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5573770491803278,
"f1": 0.4495320855614974,
"precision": 0.7652173913043478,
"recall": 0.5573770491803278,
"auc": 0.6408223595807578
},
{
"model_name": "pythia-2.8b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6065573770491803,
"f1": 0.5477293790546802,
"precision": 0.7221288515406162,
"recall": 0.6065573770491803,
"auc": 0.6428379467884977
},
{
"model_name": "pythia-2.8b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5737704918032787,
"f1": 0.4957074721780603,
"precision": 0.6937191249117854,
"recall": 0.5737704918032787,
"auc": 0.6195915076592313
},
{
"model_name": "pythia-2.8b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6147540983606558,
"f1": 0.5601074031453778,
"precision": 0.7280982905982906,
"recall": 0.6147540983606558,
"auc": 0.6062886320881483
},
{
"model_name": "pythia-2.8b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.7747917226552002
},
{
"model_name": "pythia-2.8b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6147540983606558,
"f1": 0.5540866319309432,
"precision": 0.7517688679245282,
"recall": 0.6147540983606558,
"auc": 0.48589088954582105
},
{
"model_name": "opt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5409836065573771,
"f1": 0.41845420497105895,
"precision": 0.7606837606837606,
"recall": 0.5409836065573771,
"auc": 0.6909432948132223
},
{
"model_name": "opt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5409836065573771,
"f1": 0.429144385026738,
"precision": 0.6894409937888198,
"recall": 0.540983606557377,
"auc": 0.5338618650900295
},
{
"model_name": "opt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5245901639344263,
"f1": 0.38576388888888885,
"precision": 0.7563025210084033,
"recall": 0.5245901639344263,
"auc": 0.7308519215264715
},
{
"model_name": "opt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5245901639344263,
"f1": 0.3976847122914538,
"precision": 0.6564102564102564,
"recall": 0.5245901639344263,
"auc": 0.6367911851652781
},
{
"model_name": "opt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5491803278688525,
"f1": 0.43418500716755204,
"precision": 0.7629310344827587,
"recall": 0.5491803278688525,
"auc": 0.7231926901370599
},
{
"model_name": "falcon-40b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5737704918032787,
"f1": 0.5031328320802004,
"precision": 0.6710280373831776,
"recall": 0.5737704918032787,
"auc": 0.7186240257995162
},
{
"model_name": "falcon-40b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6229508196721312,
"f1": 0.5665739882607352,
"precision": 0.7563025210084033,
"recall": 0.6229508196721312,
"auc": 0.7162053211502284
},
{
"model_name": "falcon-40b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5901639344262295,
"f1": 0.5288847698486252,
"precision": 0.6879551820728291,
"recall": 0.5901639344262295,
"auc": 0.6510346680999731
},
{
"model_name": "falcon-40b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6229508196721312,
"f1": 0.5950937950937951,
"precision": 0.6696329254727476,
"recall": 0.6229508196721312,
"auc": 0.6557377049180328
},
{
"model_name": "falcon-40b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6065573770491803,
"f1": 0.5642857142857143,
"precision": 0.6741326306543698,
"recall": 0.6065573770491803,
"auc": 0.6566783122816446
},
{
"model_name": "pythia-1b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.6549314700349368
},
{
"model_name": "pythia-1b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5737704918032787,
"f1": 0.4877260981912145,
"precision": 0.7248157248157248,
"recall": 0.5737704918032787,
"auc": 0.7660575114216608
},
{
"model_name": "pythia-1b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.5226697353279632,
"precision": 0.6629273504273505,
"recall": 0.5819672131147541,
"auc": 0.5987637731792528
},
{
"model_name": "pythia-1b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.6272507390486428
},
{
"model_name": "pythia-1b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5655737704918032,
"f1": 0.4735813726288366,
"precision": 0.7178571428571429,
"recall": 0.5655737704918032,
"auc": 0.6736092448266596
},
{
"model_name": "vicuna-7b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6311475409836066,
"f1": 0.573061668870052,
"precision": 0.7877358490566038,
"recall": 0.6311475409836066,
"auc": 0.666353130878796
},
{
"model_name": "vicuna-7b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.5658425154528353
},
{
"model_name": "vicuna-7b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.7696855683955925
},
{
"model_name": "vicuna-7b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5983606557377049,
"f1": 0.5211087078426659,
"precision": 0.7772727272727273,
"recall": 0.5983606557377049,
"auc": 0.7334049986562752
},
{
"model_name": "vicuna-7b-v1.3",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.7417360924482665
},
{
"model_name": "openllama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5819672131147541,
"f1": 0.5343859911696476,
"precision": 0.6386363636363637,
"recall": 0.5819672131147541,
"auc": 0.666756248320344
},
{
"model_name": "openllama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.4820155411359449,
"precision": 0.6848484848484848,
"recall": 0.5655737704918032,
"auc": 0.6182477828540714
},
{
"model_name": "openllama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6311475409836066,
"f1": 0.5841854124062713,
"precision": 0.7392156862745098,
"recall": 0.6311475409836065,
"auc": 0.7313894114485352
},
{
"model_name": "openllama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5901639344262295,
"f1": 0.5288847698486252,
"precision": 0.6879551820728291,
"recall": 0.5901639344262295,
"auc": 0.6490190808922333
},
{
"model_name": "openllama-2-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5737704918032787,
"f1": 0.4791461412151067,
"precision": 0.7699115044247787,
"recall": 0.5737704918032787,
"auc": 0.7278957269551196
},
{
"model_name": "opt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5819672131147541,
"f1": 0.509112426035503,
"precision": 0.7017195767195767,
"recall": 0.5819672131147541,
"auc": 0.5204246170384306
},
{
"model_name": "opt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5737704918032787,
"f1": 0.5031328320802004,
"precision": 0.6710280373831776,
"recall": 0.5737704918032787,
"auc": 0.6091104541789841
},
{
"model_name": "opt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.5161365580527257,
"precision": 0.6798349056603774,
"recall": 0.5819672131147541,
"auc": 0.7471109916689063
},
{
"model_name": "opt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5409836065573771,
"f1": 0.4390804597701149,
"precision": 0.6499508357915438,
"recall": 0.540983606557377,
"auc": 0.5815640956732061
},
{
"model_name": "opt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5819672131147541,
"f1": 0.509112426035503,
"precision": 0.7017195767195767,
"recall": 0.5819672131147541,
"auc": 0.5174684224670787
},
{
"model_name": "opt-66b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5737704918032787,
"f1": 0.5164634146341464,
"precision": 0.6402657128257536,
"recall": 0.5737704918032787,
"auc": 0.5911045417898414
},
{
"model_name": "opt-66b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6147540983606558,
"f1": 0.5757306696263411,
"precision": 0.6815476190476191,
"recall": 0.6147540983606558,
"auc": 0.5382961569470572
},
{
"model_name": "opt-66b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.5161365580527257,
"precision": 0.6798349056603774,
"recall": 0.5819672131147541,
"auc": 0.6823434560601989
},
{
"model_name": "opt-66b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5573770491803278,
"f1": 0.46802325581395354,
"precision": 0.6748566748566749,
"recall": 0.5573770491803278,
"auc": 0.5163934426229508
},
{
"model_name": "opt-66b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5737704918032787,
"f1": 0.4877260981912145,
"precision": 0.7248157248157248,
"recall": 0.5737704918032787,
"auc": 0.6748185971513034
},
{
"model_name": "cerebras-gpt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6147540983606558,
"f1": 0.5540866319309432,
"precision": 0.7517688679245282,
"recall": 0.6147540983606558,
"auc": 0.7946788497715669
},
{
"model_name": "cerebras-gpt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6229508196721312,
"f1": 0.5665739882607352,
"precision": 0.7563025210084033,
"recall": 0.6229508196721312,
"auc": 0.806503628056974
},
{
"model_name": "cerebras-gpt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6147540983606558,
"f1": 0.5540866319309432,
"precision": 0.7517688679245282,
"recall": 0.6147540983606558,
"auc": 0.7625638269282451
},
{
"model_name": "cerebras-gpt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6311475409836066,
"f1": 0.5788262370540851,
"precision": 0.7606837606837606,
"recall": 0.6311475409836065,
"auc": 0.707605482397205
},
{
"model_name": "cerebras-gpt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5901639344262295,
"f1": 0.5151033386327504,
"precision": 0.7367678193366267,
"recall": 0.5901639344262295,
"auc": 0.6560064498790648
},
{
"model_name": "bloom-560m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.846277882289707
},
{
"model_name": "bloom-560m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6557377049180327,
"f1": 0.6142728093947607,
"precision": 0.7732201791607731,
"recall": 0.6557377049180327,
"auc": 0.7846009137328676
},
{
"model_name": "bloom-560m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6639344262295082,
"f1": 0.6211467090812693,
"precision": 0.7990196078431373,
"recall": 0.6639344262295082,
"auc": 0.764579414135985
},
{
"model_name": "bloom-560m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5819672131147541,
"f1": 0.4934462264918993,
"precision": 0.7723214285714286,
"recall": 0.5819672131147541,
"auc": 0.777613544746036
},
{
"model_name": "bloom-560m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.8129535071217413
},
{
"model_name": "cerebras-gpt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5737704918032787,
"f1": 0.4957074721780603,
"precision": 0.6937191249117854,
"recall": 0.5737704918032787,
"auc": 0.8089223327062617
},
{
"model_name": "cerebras-gpt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.7440204246170384
},
{
"model_name": "cerebras-gpt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5737704918032787,
"f1": 0.4957074721780603,
"precision": 0.6937191249117854,
"recall": 0.5737704918032787,
"auc": 0.6440472991131417
},
{
"model_name": "cerebras-gpt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5409836065573771,
"f1": 0.4390804597701149,
"precision": 0.6499508357915438,
"recall": 0.540983606557377,
"auc": 0.7139209889814565
},
{
"model_name": "cerebras-gpt-6.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.5662456328943832
},
{
"model_name": "pythia-1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.6879871002418705
},
{
"model_name": "pythia-1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.7390486428379467
},
{
"model_name": "pythia-1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5665739882607352,
"precision": 0.7563025210084033,
"recall": 0.6229508196721312,
"auc": 0.6499596882558452
},
{
"model_name": "pythia-1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.6961838215533459
},
{
"model_name": "pythia-1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5901639344262295,
"f1": 0.5222431077694234,
"precision": 0.7090342679127726,
"recall": 0.5901639344262295,
"auc": 0.5990325181402849
},
{
"model_name": "falcon-7b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.8481590970169308
},
{
"model_name": "falcon-7b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6311475409836066,
"f1": 0.573061668870052,
"precision": 0.7877358490566038,
"recall": 0.6311475409836066,
"auc": 0.7617575920451491
},
{
"model_name": "falcon-7b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.6005106154259607
},
{
"model_name": "falcon-7b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6475409836065574,
"f1": 0.5975450709627925,
"precision": 0.7932692307692308,
"recall": 0.6475409836065573,
"auc": 0.8382155334587477
},
{
"model_name": "falcon-7b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.7886320881483473
},
{
"model_name": "gpt2-xl",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.6983337812416016
},
{
"model_name": "gpt2-xl",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5491803278688525,
"f1": 0.44430641821946165,
"precision": 0.700657894736842,
"recall": 0.5491803278688524,
"auc": 0.583310937919914
},
{
"model_name": "gpt2-xl",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5655737704918032,
"f1": 0.49716152111361694,
"precision": 0.6438679245283019,
"recall": 0.5655737704918034,
"auc": 0.5331900026874496
},
{
"model_name": "gpt2-xl",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5573770491803278,
"f1": 0.4911955514365153,
"precision": 0.6196078431372549,
"recall": 0.5573770491803278,
"auc": 0.5395055092717012
},
{
"model_name": "gpt2-xl",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5491803278688525,
"f1": 0.45371651876577385,
"precision": 0.6633928571428571,
"recall": 0.5491803278688524,
"auc": 0.7543671056167697
},
{
"model_name": "llama-2-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5819672131147541,
"f1": 0.4934462264918993,
"precision": 0.7723214285714286,
"recall": 0.5819672131147541,
"auc": 0.8804084923407686
},
{
"model_name": "llama-2-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.5455522708949208
},
{
"model_name": "llama-2-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6311475409836066,
"f1": 0.5788262370540851,
"precision": 0.7606837606837606,
"recall": 0.6311475409836065,
"auc": 0.708680462241333
},
{
"model_name": "llama-2-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5983606557377049,
"f1": 0.5351115949918346,
"precision": 0.7158018867924528,
"recall": 0.5983606557377049,
"auc": 0.569739317387799
},
{
"model_name": "llama-2-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6147540983606558,
"f1": 0.5757306696263411,
"precision": 0.6815476190476191,
"recall": 0.6147540983606558,
"auc": 0.7049180327868851
},
{
"model_name": "pythia-12b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5151033386327504,
"precision": 0.7367678193366267,
"recall": 0.5901639344262295,
"auc": 0.6510346680999731
},
{
"model_name": "pythia-12b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.4735813726288366,
"precision": 0.7178571428571429,
"recall": 0.5655737704918032,
"auc": 0.6038699274388606
},
{
"model_name": "pythia-12b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.6659500134372481
},
{
"model_name": "pythia-12b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.624025799516259
},
{
"model_name": "pythia-12b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.6165009406073636
},
{
"model_name": "bloom-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.7049180327868853,
"f1": 0.6831168831168831,
"precision": 0.7827215424545791,
"recall": 0.7049180327868853,
"auc": 0.6734748723461434
},
{
"model_name": "bloom-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6639344262295082,
"f1": 0.6256828556461873,
"precision": 0.7772727272727273,
"recall": 0.6639344262295082,
"auc": 0.7714324106423005
},
{
"model_name": "bloom-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.7049180327868853,
"f1": 0.6859267734553776,
"precision": 0.7702942219071252,
"recall": 0.7049180327868853,
"auc": 0.7594732598763774
},
{
"model_name": "bloom-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5819672131147541,
"f1": 0.5161365580527257,
"precision": 0.6798349056603774,
"recall": 0.5819672131147541,
"auc": 0.625235151840903
},
{
"model_name": "bloom-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6721311475409836,
"f1": 0.6408595819841036,
"precision": 0.7641237113402062,
"recall": 0.6721311475409836,
"auc": 0.7198333781241602
},
{
"model_name": "llama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5983606557377049,
"f1": 0.5351115949918346,
"precision": 0.7158018867924528,
"recall": 0.5983606557377049,
"auc": 0.8235689330825046
},
{
"model_name": "llama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5983606557377049,
"f1": 0.5526453640649555,
"precision": 0.6663636363636364,
"recall": 0.5983606557377049,
"auc": 0.5597957538296157
},
{
"model_name": "llama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5642857142857143,
"precision": 0.6741326306543698,
"recall": 0.6065573770491803,
"auc": 0.6471378661650095
},
{
"model_name": "llama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5655737704918032,
"f1": 0.48986193293885605,
"precision": 0.6613756613756614,
"recall": 0.5655737704918032,
"auc": 0.6366568126847622
},
{
"model_name": "llama-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5819672131147541,
"f1": 0.5287434673937742,
"precision": 0.6495098039215687,
"recall": 0.5819672131147541,
"auc": 0.7244020424617037
},
{
"model_name": "cerebras-gpt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.7867508734211233
},
{
"model_name": "cerebras-gpt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6229508196721312,
"f1": 0.5665739882607352,
"precision": 0.7563025210084033,
"recall": 0.6229508196721312,
"auc": 0.6627250739048642
},
{
"model_name": "cerebras-gpt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5722560975609756,
"precision": 0.7337761880429228,
"recall": 0.6229508196721312,
"auc": 0.6474066111260414
},
{
"model_name": "cerebras-gpt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6311475409836066,
"f1": 0.5891641098555713,
"precision": 0.7218181818181818,
"recall": 0.6311475409836065,
"auc": 0.7819134641225477
},
{
"model_name": "cerebras-gpt-13b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5983606557377049,
"f1": 0.5211087078426659,
"precision": 0.7772727272727273,
"recall": 0.5983606557377049,
"auc": 0.6861058855146466
},
{
"model_name": "pythia-1.4b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.6159634506852997
},
{
"model_name": "pythia-1.4b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5737704918032787,
"f1": 0.4791461412151067,
"precision": 0.7699115044247787,
"recall": 0.5737704918032787,
"auc": 0.6412254770223058
},
{
"model_name": "pythia-1.4b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.6788497715667831
},
{
"model_name": "pythia-1.4b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6147540983606558,
"f1": 0.5540866319309432,
"precision": 0.7517688679245282,
"recall": 0.6147540983606558,
"auc": 0.6588282719699006
},
{
"model_name": "pythia-1.4b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6229508196721312,
"f1": 0.5665739882607352,
"precision": 0.7563025210084033,
"recall": 0.6229508196721312,
"auc": 0.6660843859177641
},
{
"model_name": "bloom-1.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6311475409836066,
"f1": 0.5788262370540851,
"precision": 0.7606837606837606,
"recall": 0.6311475409836065,
"auc": 0.8325718892770761
},
{
"model_name": "bloom-1.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6311475409836066,
"f1": 0.5841854124062713,
"precision": 0.7392156862745098,
"recall": 0.6311475409836065,
"auc": 0.6961838215533459
},
{
"model_name": "bloom-1.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.7702230583176565
},
{
"model_name": "bloom-1.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6065573770491803,
"f1": 0.5477293790546802,
"precision": 0.7221288515406162,
"recall": 0.6065573770491803,
"auc": 0.7156678312281645
},
{
"model_name": "bloom-1.1b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.639344262295082,
"f1": 0.5854185974667903,
"precision": 0.7904761904761906,
"recall": 0.639344262295082,
"auc": 0.8121472722386456
},
{
"model_name": "llama-2-13b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.778016662187584
},
{
"model_name": "llama-2-13b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6557377049180327,
"f1": 0.6187499999999999,
"precision": 0.7545015371102327,
"recall": 0.6557377049180327,
"auc": 0.7487234614350982
},
{
"model_name": "llama-2-13b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5655737704918032,
"f1": 0.4645134575569358,
"precision": 0.7675438596491229,
"recall": 0.5655737704918032,
"auc": 0.7725073904864284
},
{
"model_name": "llama-2-13b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.5154528352593388
},
{
"model_name": "llama-2-13b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6311475409836066,
"f1": 0.573061668870052,
"precision": 0.7877358490566038,
"recall": 0.6311475409836066,
"auc": 0.6652781510346681
},
{
"model_name": "llama-65b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.8497715667831229
},
{
"model_name": "llama-65b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6557377049180327,
"f1": 0.6335812356979404,
"precision": 0.705423608649415,
"recall": 0.6557377049180328,
"auc": 0.5665143778554151
},
{
"model_name": "llama-65b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6147540983606558,
"f1": 0.5757306696263411,
"precision": 0.6815476190476191,
"recall": 0.6147540983606558,
"auc": 0.7852727761354474
},
{
"model_name": "llama-65b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.639344262295082,
"f1": 0.5959048479373683,
"precision": 0.7444601603017444,
"recall": 0.639344262295082,
"auc": 0.6769685568395593
},
{
"model_name": "llama-65b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6147540983606558,
"f1": 0.584342152953969,
"precision": 0.6622340425531915,
"recall": 0.6147540983606558,
"auc": 0.6132760010749798
},
{
"model_name": "pythia-12b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6065573770491803,
"f1": 0.5477293790546802,
"precision": 0.7221288515406162,
"recall": 0.6065573770491803,
"auc": 0.680059123891427
},
{
"model_name": "pythia-12b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.4820155411359449,
"precision": 0.6848484848484848,
"recall": 0.5655737704918032,
"auc": 0.5999731255038967
},
{
"model_name": "pythia-12b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5536585365853659,
"precision": 0.7026060296371998,
"recall": 0.6065573770491803,
"auc": 0.6796560064498791
},
{
"model_name": "pythia-12b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5737704918032787,
"f1": 0.5164634146341464,
"precision": 0.6402657128257536,
"recall": 0.5737704918032787,
"auc": 0.7188927707605481
},
{
"model_name": "pythia-12b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5573770491803278,
"f1": 0.4911955514365153,
"precision": 0.6196078431372549,
"recall": 0.5573770491803278,
"auc": 0.584923407686106
},
{
"model_name": "openllama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5288847698486252,
"precision": 0.6879551820728291,
"recall": 0.5901639344262295,
"auc": 0.6036011824778286
},
{
"model_name": "openllama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.48986193293885605,
"precision": 0.6613756613756614,
"recall": 0.5655737704918032,
"auc": 0.49758129535071216
},
{
"model_name": "openllama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5409836065573771,
"f1": 0.4390804597701149,
"precision": 0.6499508357915438,
"recall": 0.540983606557377,
"auc": 0.7339424885783391
},
{
"model_name": "openllama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5327868852459017,
"f1": 0.433851664902711,
"precision": 0.6089285714285715,
"recall": 0.5327868852459016,
"auc": 0.6339693630744423
},
{
"model_name": "openllama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.6326256382692824
},
{
"model_name": "opt-125m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5655737704918032,
"f1": 0.4735813726288366,
"precision": 0.7178571428571429,
"recall": 0.5655737704918032,
"auc": 0.723327062617576
},
{
"model_name": "opt-125m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5409836065573771,
"f1": 0.429144385026738,
"precision": 0.6894409937888198,
"recall": 0.540983606557377,
"auc": 0.6902714324106423
},
{
"model_name": "opt-125m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5409836065573771,
"f1": 0.429144385026738,
"precision": 0.6894409937888198,
"recall": 0.540983606557377,
"auc": 0.6660843859177641
},
{
"model_name": "opt-125m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5655737704918032,
"f1": 0.4645134575569358,
"precision": 0.7675438596491229,
"recall": 0.5655737704918032,
"auc": 0.7484547164740661
},
{
"model_name": "opt-125m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5655737704918032,
"f1": 0.4735813726288366,
"precision": 0.7178571428571429,
"recall": 0.5655737704918032,
"auc": 0.6703843052942758
},
{
"model_name": "openllama-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5737704918032787,
"f1": 0.4791461412151067,
"precision": 0.7699115044247787,
"recall": 0.5737704918032787,
"auc": 0.7656543939801129
},
{
"model_name": "openllama-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5491803278688525,
"f1": 0.46246895778258434,
"precision": 0.6386363636363637,
"recall": 0.5491803278688524,
"auc": 0.5318462778822897
},
{
"model_name": "openllama-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5491803278688525,
"f1": 0.43418500716755204,
"precision": 0.7629310344827587,
"recall": 0.5491803278688525,
"auc": 0.832571889277076
},
{
"model_name": "openllama-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5491803278688525,
"f1": 0.45371651876577385,
"precision": 0.6633928571428571,
"recall": 0.5491803278688524,
"auc": 0.5812953507121741
},
{
"model_name": "openllama-3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5573770491803278,
"f1": 0.46802325581395354,
"precision": 0.6748566748566749,
"recall": 0.5573770491803278,
"auc": 0.5165278151034669
},
{
"model_name": "pythia-410m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5819672131147541,
"f1": 0.5015621244893054,
"precision": 0.731060606060606,
"recall": 0.5819672131147541,
"auc": 0.6229508196721312
},
{
"model_name": "pythia-410m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5409836065573771,
"f1": 0.429144385026738,
"precision": 0.6894409937888198,
"recall": 0.540983606557377,
"auc": 0.6890620800859983
},
{
"model_name": "pythia-410m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.6863746304756786
},
{
"model_name": "pythia-410m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5737704918032787,
"f1": 0.4877260981912145,
"precision": 0.7248157248157248,
"recall": 0.5737704918032787,
"auc": 0.6327600107497984
},
{
"model_name": "pythia-410m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6147540983606558,
"f1": 0.5601074031453778,
"precision": 0.7280982905982906,
"recall": 0.6147540983606558,
"auc": 0.7167428110722923
},
{
"model_name": "llama-2-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.680327868852459,
"f1": 0.6439422285414952,
"precision": 0.8049999999999999,
"recall": 0.680327868852459,
"auc": 0.7976350443429187
},
{
"model_name": "llama-2-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6475409836065574,
"f1": 0.5975450709627925,
"precision": 0.7932692307692308,
"recall": 0.6475409836065573,
"auc": 0.7179521633969362
},
{
"model_name": "llama-2-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.639344262295082,
"f1": 0.5854185974667903,
"precision": 0.7904761904761906,
"recall": 0.639344262295082,
"auc": 0.7269551195915076
},
{
"model_name": "llama-2-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5983606557377049,
"f1": 0.5211087078426659,
"precision": 0.7772727272727273,
"recall": 0.5983606557377049,
"auc": 0.8016662187583983
},
{
"model_name": "llama-2-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6311475409836066,
"f1": 0.573061668870052,
"precision": 0.7877358490566038,
"recall": 0.6311475409836066,
"auc": 0.6991400161246976
},
{
"model_name": "mpt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5655737704918032,
"f1": 0.48986193293885605,
"precision": 0.6613756613756614,
"recall": 0.5655737704918032,
"auc": 0.7256113947863478
},
{
"model_name": "mpt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5737704918032787,
"f1": 0.4957074721780603,
"precision": 0.6937191249117854,
"recall": 0.5737704918032787,
"auc": 0.6851652781510347
},
{
"model_name": "mpt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5591689250225835,
"precision": 0.6869401225836869,
"recall": 0.6065573770491803,
"auc": 0.6088417092179522
},
{
"model_name": "mpt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5409836065573771,
"f1": 0.4390804597701149,
"precision": 0.6499508357915438,
"recall": 0.540983606557377,
"auc": 0.861058855146466
},
{
"model_name": "mpt-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5737704918032787,
"f1": 0.5100401606425702,
"precision": 0.6537815126050419,
"recall": 0.5737704918032787,
"auc": 0.6517065305025531
},
{
"model_name": "cerebras-gpt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.7328675087342112
},
{
"model_name": "cerebras-gpt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5819672131147541,
"f1": 0.4934462264918993,
"precision": 0.7723214285714286,
"recall": 0.5819672131147541,
"auc": 0.708546089760817
},
{
"model_name": "cerebras-gpt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5344992050874404,
"precision": 0.7798165137614679,
"recall": 0.6065573770491803,
"auc": 0.6690405804891159
},
{
"model_name": "cerebras-gpt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.6019887127116367
},
{
"model_name": "cerebras-gpt-2.7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6311475409836066,
"f1": 0.5841854124062713,
"precision": 0.7392156862745098,
"recall": 0.6311475409836065,
"auc": 0.6170384305294276
},
{
"model_name": "pythia-6.9b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5074289405684755,
"precision": 0.7747747747747749,
"recall": 0.5901639344262295,
"auc": 0.6156947057242677
},
{
"model_name": "pythia-6.9b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5573770491803278,
"f1": 0.46802325581395354,
"precision": 0.6748566748566749,
"recall": 0.5573770491803278,
"auc": 0.568798710024187
},
{
"model_name": "pythia-6.9b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5737704918032787,
"f1": 0.4957074721780603,
"precision": 0.6937191249117854,
"recall": 0.5737704918032787,
"auc": 0.7940069873689868
},
{
"model_name": "pythia-6.9b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5983606557377049,
"f1": 0.5526453640649555,
"precision": 0.6663636363636364,
"recall": 0.5983606557377049,
"auc": 0.5176027949475948
},
{
"model_name": "pythia-6.9b-deduped",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5491803278688525,
"f1": 0.45371651876577385,
"precision": 0.6633928571428571,
"recall": 0.5491803278688524,
"auc": 0.48172534264982536
},
{
"model_name": "llama-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6639344262295082,
"f1": 0.6407383466206997,
"precision": 0.7210144927536233,
"recall": 0.6639344262295082,
"auc": 0.6748185971513034
},
{
"model_name": "llama-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6475409836065574,
"f1": 0.6074234827508793,
"precision": 0.7495454545454545,
"recall": 0.6475409836065573,
"auc": 0.6734748723461433
},
{
"model_name": "llama-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5983606557377049,
"f1": 0.5526453640649555,
"precision": 0.6663636363636364,
"recall": 0.5983606557377049,
"auc": 0.8099973125503896
},
{
"model_name": "llama-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6311475409836066,
"f1": 0.6121511833274462,
"precision": 0.6631016042780749,
"recall": 0.6311475409836065,
"auc": 0.6226820747110992
},
{
"model_name": "llama-30b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6475409836065574,
"f1": 0.629388908512893,
"precision": 0.6834893048128342,
"recall": 0.6475409836065573,
"auc": 0.7000806234883096
},
{
"model_name": "llama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.8019349637194303
},
{
"model_name": "llama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6065573770491803,
"f1": 0.5477293790546802,
"precision": 0.7221288515406162,
"recall": 0.6065573770491803,
"auc": 0.5862671324912657
},
{
"model_name": "llama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5722560975609756,
"precision": 0.7337761880429228,
"recall": 0.6229508196721312,
"auc": 0.6752217145928514
},
{
"model_name": "llama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6065573770491803,
"f1": 0.5591689250225835,
"precision": 0.6869401225836869,
"recall": 0.6065573770491803,
"auc": 0.6397473797366299
},
{
"model_name": "llama-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6147540983606558,
"f1": 0.5601074031453778,
"precision": 0.7280982905982906,
"recall": 0.6147540983606558,
"auc": 0.5939263638806772
},
{
"model_name": "falcon-40b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6475409836065574,
"f1": 0.5975450709627925,
"precision": 0.7932692307692308,
"recall": 0.6475409836065573,
"auc": 0.5874764848159097
},
{
"model_name": "falcon-40b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.7540983606557377,
"f1": 0.7441990494828068,
"precision": 0.8006359300476948,
"recall": 0.7540983606557377,
"auc": 0.6627250739048642
},
{
"model_name": "falcon-40b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.7131147540983607,
"f1": 0.6904675607104024,
"precision": 0.8012917933130699,
"recall": 0.7131147540983607,
"auc": 0.7863477559795754
},
{
"model_name": "falcon-40b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6639344262295082,
"f1": 0.6211467090812693,
"precision": 0.7990196078431373,
"recall": 0.6639344262295082,
"auc": 0.8234345606019886
},
{
"model_name": "falcon-40b-instruct",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.7131147540983607,
"f1": 0.6933132227249874,
"precision": 0.7873188405797101,
"recall": 0.7131147540983607,
"auc": 0.7320612738511153
},
{
"model_name": "mpt-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5901639344262295,
"f1": 0.5222431077694234,
"precision": 0.7090342679127726,
"recall": 0.5901639344262295,
"auc": 0.6847621607094867
},
{
"model_name": "mpt-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5409836065573771,
"f1": 0.4483204134366925,
"precision": 0.6248976248976249,
"recall": 0.540983606557377,
"auc": 0.5201558720773986
},
{
"model_name": "mpt-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5591689250225835,
"precision": 0.6869401225836869,
"recall": 0.6065573770491803,
"auc": 0.4875033593120129
},
{
"model_name": "mpt-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5983606557377049,
"f1": 0.5472241157312732,
"precision": 0.6794117647058824,
"recall": 0.5983606557377049,
"auc": 0.5837140553614619
},
{
"model_name": "mpt-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5819672131147541,
"f1": 0.509112426035503,
"precision": 0.7017195767195767,
"recall": 0.5819672131147541,
"auc": 0.6025262026337007
},
{
"model_name": "mpt-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.8902176834184359
},
{
"model_name": "mpt-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6639344262295082,
"f1": 0.6211467090812693,
"precision": 0.7990196078431373,
"recall": 0.6639344262295082,
"auc": 0.7312550389680194
},
{
"model_name": "mpt-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.6617844665412523
},
{
"model_name": "mpt-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.8586401504971782
},
{
"model_name": "mpt-7b-chat",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.6229508196721312,
"f1": 0.5604636591478697,
"precision": 0.7850467289719626,
"recall": 0.6229508196721312,
"auc": 0.7890352055898953
},
{
"model_name": "pythia-6.9b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.610857296425692
},
{
"model_name": "pythia-6.9b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6229508196721312,
"f1": 0.5775368864799759,
"precision": 0.7157001414427157,
"recall": 0.6229508196721312,
"auc": 0.6620532115022842
},
{
"model_name": "pythia-6.9b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6147540983606558,
"f1": 0.5657047640687722,
"precision": 0.709313725490196,
"recall": 0.6147540983606556,
"auc": 0.6621875839828003
},
{
"model_name": "pythia-6.9b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5983606557377049,
"f1": 0.5283629191321499,
"precision": 0.7420634920634921,
"recall": 0.5983606557377049,
"auc": 0.6556033324375168
},
{
"model_name": "pythia-6.9b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5983606557377049,
"f1": 0.5351115949918346,
"precision": 0.7158018867924528,
"recall": 0.5983606557377049,
"auc": 0.5610051061542596
},
{
"model_name": "falcon-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.5819672131147541,
"f1": 0.509112426035503,
"precision": 0.7017195767195767,
"recall": 0.5819672131147541,
"auc": 0.7235958075786079
},
{
"model_name": "falcon-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5655737704918032,
"f1": 0.5312794490757521,
"precision": 0.5927051671732523,
"recall": 0.5655737704918034,
"auc": 0.5540177371674281
},
{
"model_name": "falcon-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6229508196721312,
"f1": 0.5775368864799759,
"precision": 0.7157001414427157,
"recall": 0.6229508196721312,
"auc": 0.6457941413598496
},
{
"model_name": "falcon-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5819672131147541,
"f1": 0.5161365580527257,
"precision": 0.6798349056603774,
"recall": 0.5819672131147541,
"auc": 0.5921795216339694
},
{
"model_name": "falcon-7b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5409836065573771,
"f1": 0.4390804597701149,
"precision": 0.6499508357915438,
"recall": 0.540983606557377,
"auc": 0.7046492878258532
},
{
"model_name": "opt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6147540983606558,
"f1": 0.5476134122287968,
"precision": 0.7824074074074074,
"recall": 0.6147540983606558,
"auc": 0.7256113947863478
},
{
"model_name": "opt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.5819672131147541,
"f1": 0.5161365580527257,
"precision": 0.6798349056603774,
"recall": 0.5819672131147541,
"auc": 0.6788497715667832
},
{
"model_name": "opt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.5819672131147541,
"f1": 0.4934462264918993,
"precision": 0.7723214285714286,
"recall": 0.5819672131147541,
"auc": 0.5786079011018543
},
{
"model_name": "opt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5819672131147541,
"f1": 0.509112426035503,
"precision": 0.7017195767195767,
"recall": 0.5819672131147541,
"auc": 0.7042461703843053
},
{
"model_name": "opt-1.3b",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.5573770491803278,
"f1": 0.4495320855614974,
"precision": 0.7652173913043478,
"recall": 0.5573770491803278,
"auc": 0.6202633700618114
},
{
"model_name": "pythia-160m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1",
"accuracy": 0.6721311475409836,
"f1": 0.6445221445221445,
"precision": 0.7497076023391813,
"recall": 0.6721311475409836,
"auc": 0.8653587745229776
},
{
"model_name": "pythia-160m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "666",
"accuracy": 0.6639344262295082,
"f1": 0.6298927118017018,
"precision": 0.7593537414965986,
"recall": 0.6639344262295082,
"auc": 0.7406611126041386
},
{
"model_name": "pythia-160m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "42",
"accuracy": 0.6065573770491803,
"f1": 0.5413533834586466,
"precision": 0.7470404984423675,
"recall": 0.6065573770491803,
"auc": 0.7694168234345606
},
{
"model_name": "pythia-160m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "25",
"accuracy": 0.5983606557377049,
"f1": 0.5211087078426659,
"precision": 0.7772727272727273,
"recall": 0.5983606557377049,
"auc": 0.8133566245632894
},
{
"model_name": "pythia-160m",
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42",
"seed": "1337",
"accuracy": 0.7131147540983607,
"f1": 0.6983398092546802,
"precision": 0.7650401069518716,
"recall": 0.7131147540983607,
"auc": 0.721311475409836
}
]