|
[{ |
|
"model_name": "mpt-30b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6557377049180327, |
|
"f1": 0.609451219512195, |
|
"precision": 0.7961165048543689, |
|
"recall": 0.6557377049180328, |
|
"auc": 0.5048374092985757 |
|
}, |
|
{ |
|
"model_name": "mpt-30b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.4934462264918993, |
|
"precision": 0.7723214285714286, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.708008599838753 |
|
}, |
|
{ |
|
"model_name": "mpt-30b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6883902176834185 |
|
}, |
|
{ |
|
"model_name": "mpt-30b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.6490190808922334 |
|
}, |
|
{ |
|
"model_name": "mpt-30b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.707874227358237 |
|
}, |
|
{ |
|
"model_name": "openllama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5226697353279632, |
|
"precision": 0.6629273504273505, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6484815909701692 |
|
}, |
|
{ |
|
"model_name": "openllama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.5566116857701985, |
|
"precision": 0.587281399046105, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.570276807309863 |
|
}, |
|
{ |
|
"model_name": "openllama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5709047369602633, |
|
"precision": 0.6940909090909091, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.6772373018005912 |
|
}, |
|
{ |
|
"model_name": "openllama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6052136522440205 |
|
}, |
|
{ |
|
"model_name": "openllama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5788262370540851, |
|
"precision": 0.7606837606837606, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.5925826390755173 |
|
}, |
|
{ |
|
"model_name": "vicuna-33b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6834184359043268 |
|
}, |
|
{ |
|
"model_name": "vicuna-33b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.680327868852459, |
|
"f1": 0.6439422285414952, |
|
"precision": 0.8049999999999999, |
|
"recall": 0.680327868852459, |
|
"auc": 0.6049449072829884 |
|
}, |
|
{ |
|
"model_name": "vicuna-33b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.8071754904595538 |
|
}, |
|
{ |
|
"model_name": "vicuna-33b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.7786885245901639 |
|
}, |
|
{ |
|
"model_name": "vicuna-33b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4645134575569358, |
|
"precision": 0.7675438596491229, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.8501746842246708 |
|
}, |
|
{ |
|
"model_name": "pythia-410m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5151033386327504, |
|
"precision": 0.7367678193366267, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.7304488040849234 |
|
}, |
|
{ |
|
"model_name": "pythia-410m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5665739882607352, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.7973662993818866 |
|
}, |
|
{ |
|
"model_name": "pythia-410m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7041117979037892 |
|
}, |
|
{ |
|
"model_name": "pythia-410m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5245901639344263, |
|
"f1": 0.38576388888888885, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.5245901639344263, |
|
"auc": 0.6750873421123353 |
|
}, |
|
{ |
|
"model_name": "pythia-410m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5327868852459017, |
|
"f1": 0.4136099165190994, |
|
"precision": 0.6752873563218391, |
|
"recall": 0.5327868852459017, |
|
"auc": 0.6057511421660844 |
|
}, |
|
{ |
|
"model_name": "alfred-40b-0723", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.9684224670787422 |
|
}, |
|
{ |
|
"model_name": "alfred-40b-0723", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7125772641762966 |
|
}, |
|
{ |
|
"model_name": "alfred-40b-0723", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.8250470303681807 |
|
}, |
|
{ |
|
"model_name": "alfred-40b-0723", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.903520558989519 |
|
}, |
|
{ |
|
"model_name": "alfred-40b-0723", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.7132491265788767 |
|
}, |
|
{ |
|
"model_name": "vicuna-13b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.8238376780435367 |
|
}, |
|
{ |
|
"model_name": "vicuna-13b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5211087078426659, |
|
"precision": 0.7772727272727273, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.8001881214727223 |
|
}, |
|
{ |
|
"model_name": "vicuna-13b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.573061668870052, |
|
"precision": 0.7877358490566038, |
|
"recall": 0.6311475409836066, |
|
"auc": 0.5052405267401237 |
|
}, |
|
{ |
|
"model_name": "vicuna-13b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.8797366299381887 |
|
}, |
|
{ |
|
"model_name": "vicuna-13b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6967213114754098, |
|
"f1": 0.666000739918609, |
|
"precision": 0.8112244897959184, |
|
"recall": 0.6967213114754098, |
|
"auc": 0.8152378392905133 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5477293790546802, |
|
"precision": 0.7221288515406162, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7187583982800322 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4820155411359449, |
|
"precision": 0.6848484848484848, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.7571889277076055 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5722560975609756, |
|
"precision": 0.7337761880429228, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.7511421660843859 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5722560975609756, |
|
"precision": 0.7337761880429228, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6691749529696318 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4820155411359449, |
|
"precision": 0.6848484848484848, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.5747110991668907 |
|
}, |
|
{ |
|
"model_name": "bloom-7.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6815372211771029 |
|
}, |
|
{ |
|
"model_name": "bloom-7.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5601074031453778, |
|
"precision": 0.7280982905982906, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7308519215264714 |
|
}, |
|
{ |
|
"model_name": "bloom-7.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4877260981912145, |
|
"precision": 0.7248157248157248, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6871808653587745 |
|
}, |
|
{ |
|
"model_name": "bloom-7.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5222431077694234, |
|
"precision": 0.7090342679127726, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.7199677506046762 |
|
}, |
|
{ |
|
"model_name": "bloom-7.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.680327868852459, |
|
"f1": 0.6479467258601554, |
|
"precision": 0.7852891156462585, |
|
"recall": 0.680327868852459, |
|
"auc": 0.7274926095135715 |
|
}, |
|
{ |
|
"model_name": "pythia-160m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.4591133004926109, |
|
"precision": 0.7099311701081612, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.779226014512228 |
|
}, |
|
{ |
|
"model_name": "pythia-160m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6557377049180327, |
|
"f1": 0.6142728093947607, |
|
"precision": 0.7732201791607731, |
|
"recall": 0.6557377049180327, |
|
"auc": 0.8505778016662188 |
|
}, |
|
{ |
|
"model_name": "pythia-160m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7669981187852728 |
|
}, |
|
{ |
|
"model_name": "pythia-160m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.44430641821946165, |
|
"precision": 0.700657894736842, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.6178446654125235 |
|
}, |
|
{ |
|
"model_name": "pythia-160m-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5327868852459017, |
|
"f1": 0.4136099165190994, |
|
"precision": 0.6752873563218391, |
|
"recall": 0.5327868852459017, |
|
"auc": 0.7280300994356356 |
|
}, |
|
{ |
|
"model_name": "bloom-1.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6639344262295082, |
|
"f1": 0.6256828556461873, |
|
"precision": 0.7772727272727273, |
|
"recall": 0.6639344262295082, |
|
"auc": 0.7944101048105348 |
|
}, |
|
{ |
|
"model_name": "bloom-1.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.43418500716755204, |
|
"precision": 0.7629310344827587, |
|
"recall": 0.5491803278688525, |
|
"auc": 0.7434829346949744 |
|
}, |
|
{ |
|
"model_name": "bloom-1.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5540866319309432, |
|
"precision": 0.7517688679245282, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7004837409298575 |
|
}, |
|
{ |
|
"model_name": "bloom-1.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.7375705455522709 |
|
}, |
|
{ |
|
"model_name": "bloom-1.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6273851115291589 |
|
}, |
|
{ |
|
"model_name": "openllama-2-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5151033386327504, |
|
"precision": 0.7367678193366267, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.7120397742542327 |
|
}, |
|
{ |
|
"model_name": "openllama-2-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.45371651876577385, |
|
"precision": 0.6633928571428571, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.6130072561139479 |
|
}, |
|
{ |
|
"model_name": "openllama-2-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.5031328320802004, |
|
"precision": 0.6710280373831776, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6729373824240795 |
|
}, |
|
{ |
|
"model_name": "openllama-2-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.49716152111361694, |
|
"precision": 0.6438679245283019, |
|
"recall": 0.5655737704918034, |
|
"auc": 0.5732330018812148 |
|
}, |
|
{ |
|
"model_name": "openllama-2-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5709047369602633, |
|
"precision": 0.6940909090909091, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.6140822359580758 |
|
}, |
|
{ |
|
"model_name": "opt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.43418500716755204, |
|
"precision": 0.7629310344827587, |
|
"recall": 0.5491803278688525, |
|
"auc": 0.5853265251276539 |
|
}, |
|
{ |
|
"model_name": "opt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5327868852459017, |
|
"f1": 0.4136099165190994, |
|
"precision": 0.6752873563218391, |
|
"recall": 0.5327868852459017, |
|
"auc": 0.4273044880408492 |
|
}, |
|
{ |
|
"model_name": "opt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.429144385026738, |
|
"precision": 0.6894409937888198, |
|
"recall": 0.540983606557377, |
|
"auc": 0.584251545283526 |
|
}, |
|
{ |
|
"model_name": "opt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5245901639344263, |
|
"f1": 0.40875668449197855, |
|
"precision": 0.613664596273292, |
|
"recall": 0.5245901639344263, |
|
"auc": 0.4486697124428917 |
|
}, |
|
{ |
|
"model_name": "opt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.46246895778258434, |
|
"precision": 0.6386363636363637, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.5111529158828272 |
|
}, |
|
{ |
|
"model_name": "opt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.4495320855614974, |
|
"precision": 0.7652173913043478, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.6719967750604676 |
|
}, |
|
{ |
|
"model_name": "opt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5245901639344263, |
|
"f1": 0.3976847122914538, |
|
"precision": 0.6564102564102564, |
|
"recall": 0.5245901639344263, |
|
"auc": 0.48938457403923674 |
|
}, |
|
{ |
|
"model_name": "opt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.46802325581395354, |
|
"precision": 0.6748566748566749, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.4778285407148616 |
|
}, |
|
{ |
|
"model_name": "opt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5327868852459017, |
|
"f1": 0.42409937888198757, |
|
"precision": 0.6337719298245614, |
|
"recall": 0.5327868852459017, |
|
"auc": 0.52848696586939 |
|
}, |
|
{ |
|
"model_name": "opt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.429144385026738, |
|
"precision": 0.6894409937888198, |
|
"recall": 0.540983606557377, |
|
"auc": 0.583042192958882 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.680327868852459, |
|
"f1": 0.6479467258601554, |
|
"precision": 0.7852891156462585, |
|
"recall": 0.680327868852459, |
|
"auc": 0.7471109916689063 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6721311475409836, |
|
"f1": 0.6479076479076479, |
|
"precision": 0.7374860956618465, |
|
"recall": 0.6721311475409837, |
|
"auc": 0.6390755173340499 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.639344262295082, |
|
"f1": 0.6049455401825139, |
|
"precision": 0.7138144329896907, |
|
"recall": 0.639344262295082, |
|
"auc": 0.6890620800859983 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6557377049180327, |
|
"f1": 0.6418786692759295, |
|
"precision": 0.6842607313195549, |
|
"recall": 0.6557377049180327, |
|
"auc": 0.625369524321419 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5788262370540851, |
|
"precision": 0.7606837606837606, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.7374361730717549 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6721311475409836, |
|
"f1": 0.6408595819841036, |
|
"precision": 0.7641237113402062, |
|
"recall": 0.6721311475409836, |
|
"auc": 0.6365224402042462 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.680327868852459, |
|
"f1": 0.6516582473094663, |
|
"precision": 0.7688301282051282, |
|
"recall": 0.680327868852459, |
|
"auc": 0.5325181402848697 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6721311475409836, |
|
"f1": 0.6408595819841036, |
|
"precision": 0.7641237113402062, |
|
"recall": 0.6721311475409836, |
|
"auc": 0.6847621607094866 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6967213114754098, |
|
"f1": 0.6855451062347615, |
|
"precision": 0.7293233082706767, |
|
"recall": 0.6967213114754098, |
|
"auc": 0.6886589626444504 |
|
}, |
|
{ |
|
"model_name": "llama-2-70b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6967213114754098, |
|
"f1": 0.6727799927509968, |
|
"precision": 0.7781155015197568, |
|
"recall": 0.6967213114754098, |
|
"auc": 0.7678043536683689 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.7651169040580489 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5690314983809244, |
|
"precision": 0.6635051546391753, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.5888202096210696 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4791461412151067, |
|
"precision": 0.7699115044247787, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7668637463047567 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.573061668870052, |
|
"precision": 0.7877358490566038, |
|
"recall": 0.6311475409836066, |
|
"auc": 0.6726686374630476 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7143241064230045 |
|
}, |
|
{ |
|
"model_name": "gpt2", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.5486428379467885 |
|
}, |
|
{ |
|
"model_name": "gpt2", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.7868852459016393 |
|
}, |
|
{ |
|
"model_name": "gpt2", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4735813726288366, |
|
"precision": 0.7178571428571429, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.694974469228702 |
|
}, |
|
{ |
|
"model_name": "gpt2", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.44430641821946165, |
|
"precision": 0.700657894736842, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.5154528352593388 |
|
}, |
|
{ |
|
"model_name": "gpt2", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.4934462264918993, |
|
"precision": 0.7723214285714286, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6834184359043267 |
|
}, |
|
{ |
|
"model_name": "gpt2-large", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4645134575569358, |
|
"precision": 0.7675438596491229, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.5912389142703574 |
|
}, |
|
{ |
|
"model_name": "gpt2-large", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.509112426035503, |
|
"precision": 0.7017195767195767, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7073367374361731 |
|
}, |
|
{ |
|
"model_name": "gpt2-large", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.4934462264918993, |
|
"precision": 0.7723214285714286, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6655468959957002 |
|
}, |
|
{ |
|
"model_name": "gpt2-large", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.4390804597701149, |
|
"precision": 0.6499508357915438, |
|
"recall": 0.540983606557377, |
|
"auc": 0.6768341843590432 |
|
}, |
|
{ |
|
"model_name": "gpt2-large", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5536585365853659, |
|
"precision": 0.7026060296371998, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7256113947863477 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5222431077694234, |
|
"precision": 0.7090342679127726, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.664606288632088 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.48986193293885605, |
|
"precision": 0.6613756613756614, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.6636656812684761 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5226697353279632, |
|
"precision": 0.6629273504273505, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5730986294006987 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4957074721780603, |
|
"precision": 0.6937191249117854, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7194302606826122 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.509112426035503, |
|
"precision": 0.7017195767195767, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5950013437248052 |
|
}, |
|
{ |
|
"model_name": "gpt2-medium", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.7125772641762966 |
|
}, |
|
{ |
|
"model_name": "gpt2-medium", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4820155411359449, |
|
"precision": 0.6848484848484848, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.6558720773985487 |
|
}, |
|
{ |
|
"model_name": "gpt2-medium", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5226697353279632, |
|
"precision": 0.6629273504273505, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5919107766729373 |
|
}, |
|
{ |
|
"model_name": "gpt2-medium", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.46802325581395354, |
|
"precision": 0.6748566748566749, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.6076323568933082 |
|
}, |
|
{ |
|
"model_name": "gpt2-medium", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.4495320855614974, |
|
"precision": 0.7652173913043478, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.6408223595807578 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5477293790546802, |
|
"precision": 0.7221288515406162, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6428379467884977 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4957074721780603, |
|
"precision": 0.6937191249117854, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6195915076592313 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5601074031453778, |
|
"precision": 0.7280982905982906, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.6062886320881483 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7747917226552002 |
|
}, |
|
{ |
|
"model_name": "pythia-2.8b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5540866319309432, |
|
"precision": 0.7517688679245282, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.48589088954582105 |
|
}, |
|
{ |
|
"model_name": "opt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.41845420497105895, |
|
"precision": 0.7606837606837606, |
|
"recall": 0.5409836065573771, |
|
"auc": 0.6909432948132223 |
|
}, |
|
{ |
|
"model_name": "opt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.429144385026738, |
|
"precision": 0.6894409937888198, |
|
"recall": 0.540983606557377, |
|
"auc": 0.5338618650900295 |
|
}, |
|
{ |
|
"model_name": "opt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5245901639344263, |
|
"f1": 0.38576388888888885, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.5245901639344263, |
|
"auc": 0.7308519215264715 |
|
}, |
|
{ |
|
"model_name": "opt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5245901639344263, |
|
"f1": 0.3976847122914538, |
|
"precision": 0.6564102564102564, |
|
"recall": 0.5245901639344263, |
|
"auc": 0.6367911851652781 |
|
}, |
|
{ |
|
"model_name": "opt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.43418500716755204, |
|
"precision": 0.7629310344827587, |
|
"recall": 0.5491803278688525, |
|
"auc": 0.7231926901370599 |
|
}, |
|
{ |
|
"model_name": "falcon-40b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.5031328320802004, |
|
"precision": 0.6710280373831776, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7186240257995162 |
|
}, |
|
{ |
|
"model_name": "falcon-40b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5665739882607352, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.7162053211502284 |
|
}, |
|
{ |
|
"model_name": "falcon-40b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5288847698486252, |
|
"precision": 0.6879551820728291, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6510346680999731 |
|
}, |
|
{ |
|
"model_name": "falcon-40b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5950937950937951, |
|
"precision": 0.6696329254727476, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6557377049180328 |
|
}, |
|
{ |
|
"model_name": "falcon-40b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5642857142857143, |
|
"precision": 0.6741326306543698, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6566783122816446 |
|
}, |
|
{ |
|
"model_name": "pythia-1b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6549314700349368 |
|
}, |
|
{ |
|
"model_name": "pythia-1b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4877260981912145, |
|
"precision": 0.7248157248157248, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7660575114216608 |
|
}, |
|
{ |
|
"model_name": "pythia-1b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5226697353279632, |
|
"precision": 0.6629273504273505, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5987637731792528 |
|
}, |
|
{ |
|
"model_name": "pythia-1b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6272507390486428 |
|
}, |
|
{ |
|
"model_name": "pythia-1b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4735813726288366, |
|
"precision": 0.7178571428571429, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.6736092448266596 |
|
}, |
|
{ |
|
"model_name": "vicuna-7b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.573061668870052, |
|
"precision": 0.7877358490566038, |
|
"recall": 0.6311475409836066, |
|
"auc": 0.666353130878796 |
|
}, |
|
{ |
|
"model_name": "vicuna-7b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.5658425154528353 |
|
}, |
|
{ |
|
"model_name": "vicuna-7b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.7696855683955925 |
|
}, |
|
{ |
|
"model_name": "vicuna-7b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5211087078426659, |
|
"precision": 0.7772727272727273, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.7334049986562752 |
|
}, |
|
{ |
|
"model_name": "vicuna-7b-v1.3", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7417360924482665 |
|
}, |
|
{ |
|
"model_name": "openllama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5343859911696476, |
|
"precision": 0.6386363636363637, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.666756248320344 |
|
}, |
|
{ |
|
"model_name": "openllama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4820155411359449, |
|
"precision": 0.6848484848484848, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.6182477828540714 |
|
}, |
|
{ |
|
"model_name": "openllama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5841854124062713, |
|
"precision": 0.7392156862745098, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.7313894114485352 |
|
}, |
|
{ |
|
"model_name": "openllama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5288847698486252, |
|
"precision": 0.6879551820728291, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6490190808922333 |
|
}, |
|
{ |
|
"model_name": "openllama-2-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4791461412151067, |
|
"precision": 0.7699115044247787, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7278957269551196 |
|
}, |
|
{ |
|
"model_name": "opt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.509112426035503, |
|
"precision": 0.7017195767195767, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5204246170384306 |
|
}, |
|
{ |
|
"model_name": "opt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.5031328320802004, |
|
"precision": 0.6710280373831776, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6091104541789841 |
|
}, |
|
{ |
|
"model_name": "opt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5161365580527257, |
|
"precision": 0.6798349056603774, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7471109916689063 |
|
}, |
|
{ |
|
"model_name": "opt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.4390804597701149, |
|
"precision": 0.6499508357915438, |
|
"recall": 0.540983606557377, |
|
"auc": 0.5815640956732061 |
|
}, |
|
{ |
|
"model_name": "opt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.509112426035503, |
|
"precision": 0.7017195767195767, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5174684224670787 |
|
}, |
|
{ |
|
"model_name": "opt-66b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.5164634146341464, |
|
"precision": 0.6402657128257536, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.5911045417898414 |
|
}, |
|
{ |
|
"model_name": "opt-66b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5757306696263411, |
|
"precision": 0.6815476190476191, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.5382961569470572 |
|
}, |
|
{ |
|
"model_name": "opt-66b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5161365580527257, |
|
"precision": 0.6798349056603774, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6823434560601989 |
|
}, |
|
{ |
|
"model_name": "opt-66b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.46802325581395354, |
|
"precision": 0.6748566748566749, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.5163934426229508 |
|
}, |
|
{ |
|
"model_name": "opt-66b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4877260981912145, |
|
"precision": 0.7248157248157248, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6748185971513034 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5540866319309432, |
|
"precision": 0.7517688679245282, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7946788497715669 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5665739882607352, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.806503628056974 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5540866319309432, |
|
"precision": 0.7517688679245282, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7625638269282451 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5788262370540851, |
|
"precision": 0.7606837606837606, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.707605482397205 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5151033386327504, |
|
"precision": 0.7367678193366267, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6560064498790648 |
|
}, |
|
{ |
|
"model_name": "bloom-560m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.846277882289707 |
|
}, |
|
{ |
|
"model_name": "bloom-560m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6557377049180327, |
|
"f1": 0.6142728093947607, |
|
"precision": 0.7732201791607731, |
|
"recall": 0.6557377049180327, |
|
"auc": 0.7846009137328676 |
|
}, |
|
{ |
|
"model_name": "bloom-560m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6639344262295082, |
|
"f1": 0.6211467090812693, |
|
"precision": 0.7990196078431373, |
|
"recall": 0.6639344262295082, |
|
"auc": 0.764579414135985 |
|
}, |
|
{ |
|
"model_name": "bloom-560m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.4934462264918993, |
|
"precision": 0.7723214285714286, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.777613544746036 |
|
}, |
|
{ |
|
"model_name": "bloom-560m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.8129535071217413 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4957074721780603, |
|
"precision": 0.6937191249117854, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.8089223327062617 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.7440204246170384 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4957074721780603, |
|
"precision": 0.6937191249117854, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6440472991131417 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.4390804597701149, |
|
"precision": 0.6499508357915438, |
|
"recall": 0.540983606557377, |
|
"auc": 0.7139209889814565 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-6.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5662456328943832 |
|
}, |
|
{ |
|
"model_name": "pythia-1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6879871002418705 |
|
}, |
|
{ |
|
"model_name": "pythia-1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7390486428379467 |
|
}, |
|
{ |
|
"model_name": "pythia-1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5665739882607352, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6499596882558452 |
|
}, |
|
{ |
|
"model_name": "pythia-1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6961838215533459 |
|
}, |
|
{ |
|
"model_name": "pythia-1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5222431077694234, |
|
"precision": 0.7090342679127726, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.5990325181402849 |
|
}, |
|
{ |
|
"model_name": "falcon-7b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.8481590970169308 |
|
}, |
|
{ |
|
"model_name": "falcon-7b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.573061668870052, |
|
"precision": 0.7877358490566038, |
|
"recall": 0.6311475409836066, |
|
"auc": 0.7617575920451491 |
|
}, |
|
{ |
|
"model_name": "falcon-7b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6005106154259607 |
|
}, |
|
{ |
|
"model_name": "falcon-7b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6475409836065574, |
|
"f1": 0.5975450709627925, |
|
"precision": 0.7932692307692308, |
|
"recall": 0.6475409836065573, |
|
"auc": 0.8382155334587477 |
|
}, |
|
{ |
|
"model_name": "falcon-7b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.7886320881483473 |
|
}, |
|
{ |
|
"model_name": "gpt2-xl", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.6983337812416016 |
|
}, |
|
{ |
|
"model_name": "gpt2-xl", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.44430641821946165, |
|
"precision": 0.700657894736842, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.583310937919914 |
|
}, |
|
{ |
|
"model_name": "gpt2-xl", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.49716152111361694, |
|
"precision": 0.6438679245283019, |
|
"recall": 0.5655737704918034, |
|
"auc": 0.5331900026874496 |
|
}, |
|
{ |
|
"model_name": "gpt2-xl", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.4911955514365153, |
|
"precision": 0.6196078431372549, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.5395055092717012 |
|
}, |
|
{ |
|
"model_name": "gpt2-xl", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.45371651876577385, |
|
"precision": 0.6633928571428571, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.7543671056167697 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.4934462264918993, |
|
"precision": 0.7723214285714286, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.8804084923407686 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.5455522708949208 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5788262370540851, |
|
"precision": 0.7606837606837606, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.708680462241333 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5351115949918346, |
|
"precision": 0.7158018867924528, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.569739317387799 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5757306696263411, |
|
"precision": 0.6815476190476191, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7049180327868851 |
|
}, |
|
{ |
|
"model_name": "pythia-12b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5151033386327504, |
|
"precision": 0.7367678193366267, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6510346680999731 |
|
}, |
|
{ |
|
"model_name": "pythia-12b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4735813726288366, |
|
"precision": 0.7178571428571429, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.6038699274388606 |
|
}, |
|
{ |
|
"model_name": "pythia-12b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6659500134372481 |
|
}, |
|
{ |
|
"model_name": "pythia-12b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.624025799516259 |
|
}, |
|
{ |
|
"model_name": "pythia-12b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6165009406073636 |
|
}, |
|
{ |
|
"model_name": "bloom-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.7049180327868853, |
|
"f1": 0.6831168831168831, |
|
"precision": 0.7827215424545791, |
|
"recall": 0.7049180327868853, |
|
"auc": 0.6734748723461434 |
|
}, |
|
{ |
|
"model_name": "bloom-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6639344262295082, |
|
"f1": 0.6256828556461873, |
|
"precision": 0.7772727272727273, |
|
"recall": 0.6639344262295082, |
|
"auc": 0.7714324106423005 |
|
}, |
|
{ |
|
"model_name": "bloom-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.7049180327868853, |
|
"f1": 0.6859267734553776, |
|
"precision": 0.7702942219071252, |
|
"recall": 0.7049180327868853, |
|
"auc": 0.7594732598763774 |
|
}, |
|
{ |
|
"model_name": "bloom-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5161365580527257, |
|
"precision": 0.6798349056603774, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.625235151840903 |
|
}, |
|
{ |
|
"model_name": "bloom-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6721311475409836, |
|
"f1": 0.6408595819841036, |
|
"precision": 0.7641237113402062, |
|
"recall": 0.6721311475409836, |
|
"auc": 0.7198333781241602 |
|
}, |
|
{ |
|
"model_name": "llama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5351115949918346, |
|
"precision": 0.7158018867924528, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.8235689330825046 |
|
}, |
|
{ |
|
"model_name": "llama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5526453640649555, |
|
"precision": 0.6663636363636364, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.5597957538296157 |
|
}, |
|
{ |
|
"model_name": "llama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5642857142857143, |
|
"precision": 0.6741326306543698, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6471378661650095 |
|
}, |
|
{ |
|
"model_name": "llama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.48986193293885605, |
|
"precision": 0.6613756613756614, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.6366568126847622 |
|
}, |
|
{ |
|
"model_name": "llama-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5287434673937742, |
|
"precision": 0.6495098039215687, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7244020424617037 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7867508734211233 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5665739882607352, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6627250739048642 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5722560975609756, |
|
"precision": 0.7337761880429228, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6474066111260414 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5891641098555713, |
|
"precision": 0.7218181818181818, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.7819134641225477 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-13b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5211087078426659, |
|
"precision": 0.7772727272727273, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.6861058855146466 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.6159634506852997 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4791461412151067, |
|
"precision": 0.7699115044247787, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6412254770223058 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6788497715667831 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5540866319309432, |
|
"precision": 0.7517688679245282, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.6588282719699006 |
|
}, |
|
{ |
|
"model_name": "pythia-1.4b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5665739882607352, |
|
"precision": 0.7563025210084033, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6660843859177641 |
|
}, |
|
{ |
|
"model_name": "bloom-1.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5788262370540851, |
|
"precision": 0.7606837606837606, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.8325718892770761 |
|
}, |
|
{ |
|
"model_name": "bloom-1.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5841854124062713, |
|
"precision": 0.7392156862745098, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.6961838215533459 |
|
}, |
|
{ |
|
"model_name": "bloom-1.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7702230583176565 |
|
}, |
|
{ |
|
"model_name": "bloom-1.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5477293790546802, |
|
"precision": 0.7221288515406162, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7156678312281645 |
|
}, |
|
{ |
|
"model_name": "bloom-1.1b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.639344262295082, |
|
"f1": 0.5854185974667903, |
|
"precision": 0.7904761904761906, |
|
"recall": 0.639344262295082, |
|
"auc": 0.8121472722386456 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.778016662187584 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6557377049180327, |
|
"f1": 0.6187499999999999, |
|
"precision": 0.7545015371102327, |
|
"recall": 0.6557377049180327, |
|
"auc": 0.7487234614350982 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4645134575569358, |
|
"precision": 0.7675438596491229, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.7725073904864284 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.5154528352593388 |
|
}, |
|
{ |
|
"model_name": "llama-2-13b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.573061668870052, |
|
"precision": 0.7877358490566038, |
|
"recall": 0.6311475409836066, |
|
"auc": 0.6652781510346681 |
|
}, |
|
{ |
|
"model_name": "llama-65b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.8497715667831229 |
|
}, |
|
{ |
|
"model_name": "llama-65b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6557377049180327, |
|
"f1": 0.6335812356979404, |
|
"precision": 0.705423608649415, |
|
"recall": 0.6557377049180328, |
|
"auc": 0.5665143778554151 |
|
}, |
|
{ |
|
"model_name": "llama-65b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5757306696263411, |
|
"precision": 0.6815476190476191, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7852727761354474 |
|
}, |
|
{ |
|
"model_name": "llama-65b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.639344262295082, |
|
"f1": 0.5959048479373683, |
|
"precision": 0.7444601603017444, |
|
"recall": 0.639344262295082, |
|
"auc": 0.6769685568395593 |
|
}, |
|
{ |
|
"model_name": "llama-65b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.584342152953969, |
|
"precision": 0.6622340425531915, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.6132760010749798 |
|
}, |
|
{ |
|
"model_name": "pythia-12b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5477293790546802, |
|
"precision": 0.7221288515406162, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.680059123891427 |
|
}, |
|
{ |
|
"model_name": "pythia-12b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4820155411359449, |
|
"precision": 0.6848484848484848, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.5999731255038967 |
|
}, |
|
{ |
|
"model_name": "pythia-12b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5536585365853659, |
|
"precision": 0.7026060296371998, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6796560064498791 |
|
}, |
|
{ |
|
"model_name": "pythia-12b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.5164634146341464, |
|
"precision": 0.6402657128257536, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7188927707605481 |
|
}, |
|
{ |
|
"model_name": "pythia-12b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.4911955514365153, |
|
"precision": 0.6196078431372549, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.584923407686106 |
|
}, |
|
{ |
|
"model_name": "openllama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5288847698486252, |
|
"precision": 0.6879551820728291, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6036011824778286 |
|
}, |
|
{ |
|
"model_name": "openllama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.48986193293885605, |
|
"precision": 0.6613756613756614, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.49758129535071216 |
|
}, |
|
{ |
|
"model_name": "openllama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.4390804597701149, |
|
"precision": 0.6499508357915438, |
|
"recall": 0.540983606557377, |
|
"auc": 0.7339424885783391 |
|
}, |
|
{ |
|
"model_name": "openllama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5327868852459017, |
|
"f1": 0.433851664902711, |
|
"precision": 0.6089285714285715, |
|
"recall": 0.5327868852459016, |
|
"auc": 0.6339693630744423 |
|
}, |
|
{ |
|
"model_name": "openllama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.6326256382692824 |
|
}, |
|
{ |
|
"model_name": "opt-125m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4735813726288366, |
|
"precision": 0.7178571428571429, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.723327062617576 |
|
}, |
|
{ |
|
"model_name": "opt-125m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.429144385026738, |
|
"precision": 0.6894409937888198, |
|
"recall": 0.540983606557377, |
|
"auc": 0.6902714324106423 |
|
}, |
|
{ |
|
"model_name": "opt-125m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.429144385026738, |
|
"precision": 0.6894409937888198, |
|
"recall": 0.540983606557377, |
|
"auc": 0.6660843859177641 |
|
}, |
|
{ |
|
"model_name": "opt-125m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4645134575569358, |
|
"precision": 0.7675438596491229, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.7484547164740661 |
|
}, |
|
{ |
|
"model_name": "opt-125m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.4735813726288366, |
|
"precision": 0.7178571428571429, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.6703843052942758 |
|
}, |
|
{ |
|
"model_name": "openllama-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4791461412151067, |
|
"precision": 0.7699115044247787, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7656543939801129 |
|
}, |
|
{ |
|
"model_name": "openllama-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.46246895778258434, |
|
"precision": 0.6386363636363637, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.5318462778822897 |
|
}, |
|
{ |
|
"model_name": "openllama-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.43418500716755204, |
|
"precision": 0.7629310344827587, |
|
"recall": 0.5491803278688525, |
|
"auc": 0.832571889277076 |
|
}, |
|
{ |
|
"model_name": "openllama-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.45371651876577385, |
|
"precision": 0.6633928571428571, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.5812953507121741 |
|
}, |
|
{ |
|
"model_name": "openllama-3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.46802325581395354, |
|
"precision": 0.6748566748566749, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.5165278151034669 |
|
}, |
|
{ |
|
"model_name": "pythia-410m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5015621244893054, |
|
"precision": 0.731060606060606, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6229508196721312 |
|
}, |
|
{ |
|
"model_name": "pythia-410m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.429144385026738, |
|
"precision": 0.6894409937888198, |
|
"recall": 0.540983606557377, |
|
"auc": 0.6890620800859983 |
|
}, |
|
{ |
|
"model_name": "pythia-410m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6863746304756786 |
|
}, |
|
{ |
|
"model_name": "pythia-410m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4877260981912145, |
|
"precision": 0.7248157248157248, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6327600107497984 |
|
}, |
|
{ |
|
"model_name": "pythia-410m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5601074031453778, |
|
"precision": 0.7280982905982906, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7167428110722923 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.680327868852459, |
|
"f1": 0.6439422285414952, |
|
"precision": 0.8049999999999999, |
|
"recall": 0.680327868852459, |
|
"auc": 0.7976350443429187 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6475409836065574, |
|
"f1": 0.5975450709627925, |
|
"precision": 0.7932692307692308, |
|
"recall": 0.6475409836065573, |
|
"auc": 0.7179521633969362 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.639344262295082, |
|
"f1": 0.5854185974667903, |
|
"precision": 0.7904761904761906, |
|
"recall": 0.639344262295082, |
|
"auc": 0.7269551195915076 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5211087078426659, |
|
"precision": 0.7772727272727273, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.8016662187583983 |
|
}, |
|
{ |
|
"model_name": "llama-2-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.573061668870052, |
|
"precision": 0.7877358490566038, |
|
"recall": 0.6311475409836066, |
|
"auc": 0.6991400161246976 |
|
}, |
|
{ |
|
"model_name": "mpt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.48986193293885605, |
|
"precision": 0.6613756613756614, |
|
"recall": 0.5655737704918032, |
|
"auc": 0.7256113947863478 |
|
}, |
|
{ |
|
"model_name": "mpt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4957074721780603, |
|
"precision": 0.6937191249117854, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6851652781510347 |
|
}, |
|
{ |
|
"model_name": "mpt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5591689250225835, |
|
"precision": 0.6869401225836869, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6088417092179522 |
|
}, |
|
{ |
|
"model_name": "mpt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.4390804597701149, |
|
"precision": 0.6499508357915438, |
|
"recall": 0.540983606557377, |
|
"auc": 0.861058855146466 |
|
}, |
|
{ |
|
"model_name": "mpt-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.5100401606425702, |
|
"precision": 0.6537815126050419, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.6517065305025531 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7328675087342112 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.4934462264918993, |
|
"precision": 0.7723214285714286, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.708546089760817 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5344992050874404, |
|
"precision": 0.7798165137614679, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6690405804891159 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6019887127116367 |
|
}, |
|
{ |
|
"model_name": "cerebras-gpt-2.7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.5841854124062713, |
|
"precision": 0.7392156862745098, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.6170384305294276 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5074289405684755, |
|
"precision": 0.7747747747747749, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6156947057242677 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.46802325581395354, |
|
"precision": 0.6748566748566749, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.568798710024187 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5737704918032787, |
|
"f1": 0.4957074721780603, |
|
"precision": 0.6937191249117854, |
|
"recall": 0.5737704918032787, |
|
"auc": 0.7940069873689868 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5526453640649555, |
|
"precision": 0.6663636363636364, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.5176027949475948 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b-deduped", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5491803278688525, |
|
"f1": 0.45371651876577385, |
|
"precision": 0.6633928571428571, |
|
"recall": 0.5491803278688524, |
|
"auc": 0.48172534264982536 |
|
}, |
|
{ |
|
"model_name": "llama-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6639344262295082, |
|
"f1": 0.6407383466206997, |
|
"precision": 0.7210144927536233, |
|
"recall": 0.6639344262295082, |
|
"auc": 0.6748185971513034 |
|
}, |
|
{ |
|
"model_name": "llama-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6475409836065574, |
|
"f1": 0.6074234827508793, |
|
"precision": 0.7495454545454545, |
|
"recall": 0.6475409836065573, |
|
"auc": 0.6734748723461433 |
|
}, |
|
{ |
|
"model_name": "llama-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5526453640649555, |
|
"precision": 0.6663636363636364, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.8099973125503896 |
|
}, |
|
{ |
|
"model_name": "llama-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6311475409836066, |
|
"f1": 0.6121511833274462, |
|
"precision": 0.6631016042780749, |
|
"recall": 0.6311475409836065, |
|
"auc": 0.6226820747110992 |
|
}, |
|
{ |
|
"model_name": "llama-30b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6475409836065574, |
|
"f1": 0.629388908512893, |
|
"precision": 0.6834893048128342, |
|
"recall": 0.6475409836065573, |
|
"auc": 0.7000806234883096 |
|
}, |
|
{ |
|
"model_name": "llama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.8019349637194303 |
|
}, |
|
{ |
|
"model_name": "llama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5477293790546802, |
|
"precision": 0.7221288515406162, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.5862671324912657 |
|
}, |
|
{ |
|
"model_name": "llama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5722560975609756, |
|
"precision": 0.7337761880429228, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6752217145928514 |
|
}, |
|
{ |
|
"model_name": "llama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5591689250225835, |
|
"precision": 0.6869401225836869, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.6397473797366299 |
|
}, |
|
{ |
|
"model_name": "llama-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5601074031453778, |
|
"precision": 0.7280982905982906, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.5939263638806772 |
|
}, |
|
{ |
|
"model_name": "falcon-40b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6475409836065574, |
|
"f1": 0.5975450709627925, |
|
"precision": 0.7932692307692308, |
|
"recall": 0.6475409836065573, |
|
"auc": 0.5874764848159097 |
|
}, |
|
{ |
|
"model_name": "falcon-40b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.7540983606557377, |
|
"f1": 0.7441990494828068, |
|
"precision": 0.8006359300476948, |
|
"recall": 0.7540983606557377, |
|
"auc": 0.6627250739048642 |
|
}, |
|
{ |
|
"model_name": "falcon-40b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.7131147540983607, |
|
"f1": 0.6904675607104024, |
|
"precision": 0.8012917933130699, |
|
"recall": 0.7131147540983607, |
|
"auc": 0.7863477559795754 |
|
}, |
|
{ |
|
"model_name": "falcon-40b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6639344262295082, |
|
"f1": 0.6211467090812693, |
|
"precision": 0.7990196078431373, |
|
"recall": 0.6639344262295082, |
|
"auc": 0.8234345606019886 |
|
}, |
|
{ |
|
"model_name": "falcon-40b-instruct", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.7131147540983607, |
|
"f1": 0.6933132227249874, |
|
"precision": 0.7873188405797101, |
|
"recall": 0.7131147540983607, |
|
"auc": 0.7320612738511153 |
|
}, |
|
{ |
|
"model_name": "mpt-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5901639344262295, |
|
"f1": 0.5222431077694234, |
|
"precision": 0.7090342679127726, |
|
"recall": 0.5901639344262295, |
|
"auc": 0.6847621607094867 |
|
}, |
|
{ |
|
"model_name": "mpt-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.4483204134366925, |
|
"precision": 0.6248976248976249, |
|
"recall": 0.540983606557377, |
|
"auc": 0.5201558720773986 |
|
}, |
|
{ |
|
"model_name": "mpt-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5591689250225835, |
|
"precision": 0.6869401225836869, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.4875033593120129 |
|
}, |
|
{ |
|
"model_name": "mpt-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5472241157312732, |
|
"precision": 0.6794117647058824, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.5837140553614619 |
|
}, |
|
{ |
|
"model_name": "mpt-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.509112426035503, |
|
"precision": 0.7017195767195767, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6025262026337007 |
|
}, |
|
{ |
|
"model_name": "mpt-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.8902176834184359 |
|
}, |
|
{ |
|
"model_name": "mpt-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6639344262295082, |
|
"f1": 0.6211467090812693, |
|
"precision": 0.7990196078431373, |
|
"recall": 0.6639344262295082, |
|
"auc": 0.7312550389680194 |
|
}, |
|
{ |
|
"model_name": "mpt-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6617844665412523 |
|
}, |
|
{ |
|
"model_name": "mpt-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.8586401504971782 |
|
}, |
|
{ |
|
"model_name": "mpt-7b-chat", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5604636591478697, |
|
"precision": 0.7850467289719626, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.7890352055898953 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.610857296425692 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5775368864799759, |
|
"precision": 0.7157001414427157, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6620532115022842 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5657047640687722, |
|
"precision": 0.709313725490196, |
|
"recall": 0.6147540983606556, |
|
"auc": 0.6621875839828003 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5283629191321499, |
|
"precision": 0.7420634920634921, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.6556033324375168 |
|
}, |
|
{ |
|
"model_name": "pythia-6.9b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5351115949918346, |
|
"precision": 0.7158018867924528, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.5610051061542596 |
|
}, |
|
{ |
|
"model_name": "falcon-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.509112426035503, |
|
"precision": 0.7017195767195767, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7235958075786079 |
|
}, |
|
{ |
|
"model_name": "falcon-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5655737704918032, |
|
"f1": 0.5312794490757521, |
|
"precision": 0.5927051671732523, |
|
"recall": 0.5655737704918034, |
|
"auc": 0.5540177371674281 |
|
}, |
|
{ |
|
"model_name": "falcon-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6229508196721312, |
|
"f1": 0.5775368864799759, |
|
"precision": 0.7157001414427157, |
|
"recall": 0.6229508196721312, |
|
"auc": 0.6457941413598496 |
|
}, |
|
{ |
|
"model_name": "falcon-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5161365580527257, |
|
"precision": 0.6798349056603774, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5921795216339694 |
|
}, |
|
{ |
|
"model_name": "falcon-7b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5409836065573771, |
|
"f1": 0.4390804597701149, |
|
"precision": 0.6499508357915438, |
|
"recall": 0.540983606557377, |
|
"auc": 0.7046492878258532 |
|
}, |
|
{ |
|
"model_name": "opt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6147540983606558, |
|
"f1": 0.5476134122287968, |
|
"precision": 0.7824074074074074, |
|
"recall": 0.6147540983606558, |
|
"auc": 0.7256113947863478 |
|
}, |
|
{ |
|
"model_name": "opt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.5161365580527257, |
|
"precision": 0.6798349056603774, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.6788497715667832 |
|
}, |
|
{ |
|
"model_name": "opt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.4934462264918993, |
|
"precision": 0.7723214285714286, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.5786079011018543 |
|
}, |
|
{ |
|
"model_name": "opt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5819672131147541, |
|
"f1": 0.509112426035503, |
|
"precision": 0.7017195767195767, |
|
"recall": 0.5819672131147541, |
|
"auc": 0.7042461703843053 |
|
}, |
|
{ |
|
"model_name": "opt-1.3b", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.5573770491803278, |
|
"f1": 0.4495320855614974, |
|
"precision": 0.7652173913043478, |
|
"recall": 0.5573770491803278, |
|
"auc": 0.6202633700618114 |
|
}, |
|
{ |
|
"model_name": "pythia-160m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1", |
|
"accuracy": 0.6721311475409836, |
|
"f1": 0.6445221445221445, |
|
"precision": 0.7497076023391813, |
|
"recall": 0.6721311475409836, |
|
"auc": 0.8653587745229776 |
|
}, |
|
{ |
|
"model_name": "pythia-160m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "666", |
|
"accuracy": 0.6639344262295082, |
|
"f1": 0.6298927118017018, |
|
"precision": 0.7593537414965986, |
|
"recall": 0.6639344262295082, |
|
"auc": 0.7406611126041386 |
|
}, |
|
{ |
|
"model_name": "pythia-160m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "42", |
|
"accuracy": 0.6065573770491803, |
|
"f1": 0.5413533834586466, |
|
"precision": 0.7470404984423675, |
|
"recall": 0.6065573770491803, |
|
"auc": 0.7694168234345606 |
|
}, |
|
{ |
|
"model_name": "pythia-160m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "25", |
|
"accuracy": 0.5983606557377049, |
|
"f1": 0.5211087078426659, |
|
"precision": 0.7772727272727273, |
|
"recall": 0.5983606557377049, |
|
"auc": 0.8133566245632894 |
|
}, |
|
{ |
|
"model_name": "pythia-160m", |
|
"exp_name": "deberta__openwebtext-10k____float16__NO_SAMPLING__beams-5__max-new-tokens-256__repetition-penalty-1.0__seed-42", |
|
"seed": "1337", |
|
"accuracy": 0.7131147540983607, |
|
"f1": 0.6983398092546802, |
|
"precision": 0.7650401069518716, |
|
"recall": 0.7131147540983607, |
|
"auc": 0.721311475409836 |
|
} |
|
] |