taf-agent / data /exp_d4 /area_law_results.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
15 kB
{
"N_context": 2000,
"n_models": 56,
"results": [
{
"model": "meta-llama/Llama-2-7b-hf",
"corpus": "mongo",
"gamma": 0.2870574377368437,
"S_gamma": 7.540761817121435,
"area_law_pred": 5.419006875018258,
"ratio_S_area": 1.3915394445953768,
"phase": "A",
"r2": 0.814928
},
{
"model": "meta-llama/Llama-2-7b-hf",
"corpus": "mongo",
"gamma": 0.2870574377368437,
"S_gamma": 7.540761817121435,
"area_law_pred": 5.419006875018258,
"ratio_S_area": 1.3915394445953768,
"phase": "A",
"r2": 0.814928
},
{
"model": "EleutherAI/pythia-160m",
"corpus": "mongo",
"gamma": 0.510891565491545,
"S_gamma": 7.330756084048007,
"area_law_pred": 3.7176655028380927,
"ratio_S_area": 1.971870809369927,
"phase": "A",
"r2": 0.916873
},
{
"model": "allenai/OLMo-7B",
"corpus": "mongo",
"gamma": 0.5243966907611701,
"S_gamma": 7.310088552158613,
"area_law_pred": 3.6150143629597755,
"ratio_S_area": 2.0221464752835763,
"phase": "A",
"r2": 0.976863
},
{
"model": "allenai/OLMo-7B",
"corpus": "random",
"gamma": 0.5411598042384096,
"S_gamma": 7.282815329848365,
"area_law_pred": 3.487599572501043,
"ratio_S_area": 2.0882028393602767,
"phase": "A",
"r2": 0.96368
},
{
"model": "allenai/OLMo-7B-hf",
"corpus": "random",
"gamma": 0.550891782676269,
"S_gamma": 7.266127883242827,
"area_law_pred": 3.4136277536565065,
"ratio_S_area": 2.1285648019060415,
"phase": "A",
"r2": 0.957841
},
{
"model": "HuggingFaceTB/SmolLM2-135M",
"corpus": "random",
"gamma": 0.62665506839462,
"S_gamma": 7.112817971850239,
"area_law_pred": 2.837758408896903,
"ratio_S_area": 2.506491725846085,
"phase": "A",
"r2": 0.828515
},
{
"model": "google/gemma-2-9b-it",
"corpus": "mongo",
"gamma": 0.6276459084140061,
"S_gamma": 7.110519287154698,
"area_law_pred": 2.8302271305565383,
"ratio_S_area": 2.5123493483565325,
"phase": "A",
"r2": 0.977314
},
{
"model": "microsoft/phi-3-mini-4k-instruct",
"corpus": "mongo",
"gamma": 0.6295631683122206,
"S_gamma": 7.106048616532607,
"area_law_pred": 2.815654225080619,
"ratio_S_area": 2.5237646559137223,
"phase": "A",
"r2": 0.985314
},
{
"model": "EleutherAI/pythia-2.8b",
"corpus": "mongo",
"gamma": 0.6741618914822415,
"S_gamma": 6.993335911568815,
"area_law_pred": 2.4766636804451707,
"ratio_S_area": 2.8236921980104257,
"phase": "A",
"r2": 0.999287
},
{
"model": "EleutherAI/pythia-14m",
"corpus": "mongo",
"gamma": 0.6852875452461592,
"S_gamma": 6.9625275628284164,
"area_law_pred": 2.3920986713869947,
"ratio_S_area": 2.9106356046723527,
"phase": "A",
"r2": 0.904735
},
{
"model": "EleutherAI/pythia-1.4b",
"corpus": "random",
"gamma": 0.6875846707476845,
"S_gamma": 6.956028732948211,
"area_law_pred": 2.3746384445125743,
"ratio_S_area": 2.9293001421005913,
"phase": "A",
"r2": 0.948837
},
{
"model": "EleutherAI/pythia-1.4b",
"corpus": "mongo",
"gamma": 0.7050725013322717,
"S_gamma": 6.904986546637838,
"area_law_pred": 2.2417151500101298,
"ratio_S_area": 3.080224776375641,
"phase": "A",
"r2": 0.841258
},
{
"model": "EleutherAI/pythia-1b",
"corpus": "random",
"gamma": 0.7127537531683527,
"S_gamma": 6.881681916795565,
"area_law_pred": 2.1833307040369005,
"ratio_S_area": 3.151919177462022,
"phase": "A",
"r2": 0.956201
},
{
"model": "gpt2-large",
"corpus": "random",
"gamma": 0.7274410953080044,
"S_gamma": 6.835595893390991,
"area_law_pred": 2.0716936490434854,
"ratio_S_area": 3.2995206103696995,
"phase": "A",
"r2": 0.977312
},
{
"model": "gpt2-medium",
"corpus": "random",
"gamma": 0.7409610966104535,
"S_gamma": 6.791383942293905,
"area_law_pred": 1.9689294378906879,
"ratio_S_area": 3.4492774660170187,
"phase": "A",
"r2": 0.9987
},
{
"model": "EleutherAI/pythia-70m",
"corpus": "mongo",
"gamma": 0.7476017873166874,
"S_gamma": 6.769034916681587,
"area_law_pred": 1.9184541955686165,
"ratio_S_area": 3.528379740479179,
"phase": "A",
"r2": 0.984269
},
{
"model": "HuggingFaceTB/SmolLM2-135M",
"corpus": "mongo",
"gamma": 0.7479961324735662,
"S_gamma": 6.76769458718171,
"area_law_pred": 1.9154568164957875,
"ratio_S_area": 3.533201338134471,
"phase": "A",
"r2": 0.988937
},
{
"model": "gpt2-large",
"corpus": "mongo",
"gamma": 0.7526597997629645,
"S_gamma": 6.751731138994513,
"area_law_pred": 1.8800087363253144,
"ratio_S_area": 3.5913296616863177,
"phase": "A",
"r2": 0.963281
},
{
"model": "meta-llama/Meta-Llama-3-8B",
"corpus": "random",
"gamma": 0.7589145044527899,
"S_gamma": 6.7299962332100405,
"area_law_pred": 1.8324673360647112,
"ratio_S_area": 3.672641853285607,
"phase": "A",
"r2": 0.984284
},
{
"model": "Qwen/Qwen2.5-3B",
"corpus": "mongo",
"gamma": 0.7720333740995954,
"S_gamma": 6.683194212515172,
"area_law_pred": 1.7327520874998952,
"ratio_S_area": 3.8569823465964093,
"phase": "A",
"r2": 0.995841
},
{
"model": "gpt2-medium",
"corpus": "mongo",
"gamma": 0.7842197184521328,
"S_gamma": 6.6382427776423985,
"area_law_pred": 1.6401248727378668,
"ratio_S_area": 4.047400833914039,
"phase": "A",
"r2": 0.996208
},
{
"model": "meta-llama/Llama-2-7b-hf",
"corpus": "random",
"gamma": 0.8266242679750889,
"S_gamma": 6.470778115399689,
"area_law_pred": 1.3178120279730556,
"ratio_S_area": 4.9102436296263585,
"phase": "A",
"r2": 0.993628
},
{
"model": "Qwen/Qwen2.5-7B",
"corpus": "random",
"gamma": 0.8270155146179213,
"S_gamma": 6.469153732984772,
"area_law_pred": 1.314838200403263,
"ratio_S_area": 4.9201139204813735,
"phase": "A",
"r2": 0.984663
},
{
"model": "allenai/OLMo-7B-hf",
"corpus": "mongo",
"gamma": 0.8291935914574181,
"S_gamma": 6.460084559322255,
"area_law_pred": 1.2982828507968605,
"ratio_S_area": 4.975868359777827,
"phase": "A",
"r2": 0.99587
},
{
"model": "mistralai/Mistral-7B-v0.1",
"corpus": "random",
"gamma": 0.8296009929924347,
"S_gamma": 6.4583832741852625,
"area_law_pred": 1.2951862314673315,
"ratio_S_area": 4.986451459469643,
"phase": "A",
"r2": 0.996923
},
{
"model": "EleutherAI/gpt-j-6B",
"corpus": "random",
"gamma": 0.8347553760849855,
"S_gamma": 6.436725078705287,
"area_law_pred": 1.25600826834174,
"ratio_S_area": 5.124747377024397,
"phase": "A",
"r2": 0.980141
},
{
"model": "microsoft/phi-2",
"corpus": "random",
"gamma": 0.8707349253167322,
"S_gamma": 6.278751523867516,
"area_law_pred": 0.9825312240929408,
"ratio_S_area": 6.3903837047662,
"phase": "A",
"r2": 0.947956
},
{
"model": "bigscience/bloom-7b1",
"corpus": "random",
"gamma": 0.882390442263598,
"S_gamma": 6.225096260313582,
"area_law_pred": 0.8939387766642747,
"ratio_S_area": 6.963671811555685,
"phase": "A",
"r2": 0.994632
},
{
"model": "EleutherAI/gpt-j-6B",
"corpus": "mongo",
"gamma": 0.8967966648253523,
"S_gamma": 6.157167619017644,
"area_law_pred": 0.784438484161926,
"ratio_S_area": 7.849140172662238,
"phase": "A",
"r2": 0.98687
},
{
"model": "deepseek-ai/deepseek-llm-7b-base",
"corpus": "random",
"gamma": 0.9103448618583042,
"S_gamma": 6.09171169898598,
"area_law_pred": 0.6814599600118006,
"ratio_S_area": 8.939207079577342,
"phase": "A",
"r2": 0.992208
},
{
"model": "Qwen/Qwen2.5-0.5B",
"corpus": "random",
"gamma": 0.9194920254637005,
"S_gamma": 6.046685882415325,
"area_law_pred": 0.6119332616657105,
"ratio_S_area": 9.881283239868296,
"phase": "A",
"r2": 0.995818
},
{
"model": "HuggingFaceTB/SmolLM2-360M",
"corpus": "random",
"gamma": 0.9197098362636822,
"S_gamma": 6.0456057444940505,
"area_law_pred": 0.6102777030204145,
"ratio_S_area": 9.90631922905402,
"phase": "A",
"r2": 0.992716
},
{
"model": "EleutherAI/pythia-1b",
"corpus": "mongo",
"gamma": 0.9311078627189842,
"S_gamma": 5.988575565494448,
"area_law_pred": 0.5236424157023841,
"ratio_S_area": 11.436383657847337,
"phase": "A",
"r2": 0.983104
},
{
"model": "EleutherAI/pythia-410m",
"corpus": "random",
"gamma": 0.9362347719713631,
"S_gamma": 5.962605278027159,
"area_law_pred": 0.4846732785561282,
"ratio_S_area": 12.302318988556848,
"phase": "A",
"r2": 0.987529
},
{
"model": "deepseek-ai/deepseek-llm-7b-base",
"corpus": "mongo",
"gamma": 0.9469730981988765,
"S_gamma": 5.907593587772118,
"area_law_pred": 0.4030523083220558,
"ratio_S_area": 14.657138703326074,
"phase": "A",
"r2": 0.995256
},
{
"model": "Qwen/Qwen2.5-3B",
"corpus": "random",
"gamma": 0.9643628833140916,
"S_gamma": 5.816818113694677,
"area_law_pred": 0.2708742478689094,
"ratio_S_area": 21.47423817309406,
"phase": "A",
"r2": 0.97891
},
{
"model": "HuggingFaceTB/SmolLM2-360M",
"corpus": "mongo",
"gamma": 0.9691725803316233,
"S_gamma": 5.791361269838827,
"area_law_pred": 0.23431620997870006,
"ratio_S_area": 24.716007784375126,
"phase": "A",
"r2": 0.998139
},
{
"model": "Qwen/Qwen2.5-7B",
"corpus": "mongo",
"gamma": 0.9966953735480816,
"S_gamma": 5.643021626136776,
"area_law_pred": 0.025118143326254574,
"ratio_S_area": 224.6591857065504,
"phase": "A",
"r2": 0.993942
},
{
"model": "EleutherAI/pythia-14m",
"corpus": "random",
"gamma": 1.003714187534367,
"S_gamma": 9.113816929580823,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.977698
},
{
"model": "gpt2-xl",
"corpus": "mongo",
"gamma": 1.0097027213131609,
"S_gamma": 8.144856340401692,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.980958
},
{
"model": "EleutherAI/pythia-160m",
"corpus": "random",
"gamma": 1.0171452847779678,
"S_gamma": 7.564188500805029,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.981723
},
{
"model": "EleutherAI/pythia-410m",
"corpus": "mongo",
"gamma": 1.0218530106365162,
"S_gamma": 7.314101726492739,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.981594
},
{
"model": "gpt2",
"corpus": "mongo",
"gamma": 1.0231174997210821,
"S_gamma": 7.255805984306381,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.955115
},
{
"model": "gpt2-xl",
"corpus": "random",
"gamma": 1.024099984346949,
"S_gamma": 7.2125851754934445,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.988966
},
{
"model": "Qwen/Qwen2.5-0.5B",
"corpus": "mongo",
"gamma": 1.0283740139174087,
"S_gamma": 7.042254100757362,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.996775
},
{
"model": "microsoft/phi-3-mini-4k-instruct",
"corpus": "random",
"gamma": 1.0366024777115062,
"S_gamma": 6.7735078789401655,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.977923
},
{
"model": "microsoft/phi-2",
"corpus": "mongo",
"gamma": 1.0446992618601783,
"S_gamma": 6.55917099187236,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.979964
},
{
"model": "meta-llama/Meta-Llama-3-8B",
"corpus": "mongo",
"gamma": 1.0454762537473639,
"S_gamma": 6.540515247430771,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.997461
},
{
"model": "gpt2",
"corpus": "random",
"gamma": 1.0514830126336872,
"S_gamma": 6.405275999206491,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.907872
},
{
"model": "mistralai/Mistral-7B-v0.1",
"corpus": "mongo",
"gamma": 1.060750419523944,
"S_gamma": 6.2218961952351,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.99869
},
{
"model": "google/gemma-2-9b-it",
"corpus": "random",
"gamma": 1.1347958464287666,
"S_gamma": 5.259629681982037,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.976472
},
{
"model": "EleutherAI/pythia-70m",
"corpus": "random",
"gamma": 1.1705141984482668,
"S_gamma": 4.933980978257978,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.994076
},
{
"model": "bigscience/bloom-7b1",
"corpus": "mongo",
"gamma": 1.2178239236386044,
"S_gamma": 4.562721586731967,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.99733
},
{
"model": "EleutherAI/pythia-31m",
"corpus": "mongo",
"gamma": 1.2350013988825523,
"S_gamma": 4.439867464810442,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.973742
},
{
"model": "EleutherAI/pythia-31m",
"corpus": "random",
"gamma": 1.5398244746231446,
"S_gamma": 2.8462032124350634,
"area_law_pred": null,
"ratio_S_area": null,
"phase": "B",
"r2": 0.964259
}
],
"phase_a_ratio_mean": 11.448812263895999,
"phase_a_ratio_std": 34.96120529181214
}