taf-agent / data /e1_h3 /EleutherAI--pythia-2.8b_seed42.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
4.57 kB
{
"tau_90": 0.9,
"tau_99": 0.99,
"N_prompts": 50,
"dist_short": 10,
"dist_long": 1000,
"vocab_low": 1000,
"vocab_high": 49000,
"n_prefix": 20,
"ref_logp_d10": {
"mean": -14.8755,
"std": 2.7859
},
"baseline_logp_d1000": {
"mean": -14.8256,
"std": 2.527
},
"logp_gap": -0.05,
"layer_sweep": {
"0": {
"recovery_pct": -0.0,
"logp_transplant_mean": -14.8256,
"logp_transplant_std": 2.527
},
"1": {
"recovery_pct": 78.61,
"logp_transplant_mean": -14.8649,
"logp_transplant_std": 2.5669
},
"2": {
"recovery_pct": -373.24,
"logp_transplant_mean": -14.639,
"logp_transplant_std": 2.5252
},
"3": {
"recovery_pct": -304.78,
"logp_transplant_mean": -14.6733,
"logp_transplant_std": 2.4592
},
"4": {
"recovery_pct": 113.78,
"logp_transplant_mean": -14.8824,
"logp_transplant_std": 2.4183
},
"5": {
"recovery_pct": -269.64,
"logp_transplant_mean": -14.6908,
"logp_transplant_std": 2.3048
},
"6": {
"recovery_pct": -160.57,
"logp_transplant_mean": -14.7453,
"logp_transplant_std": 2.3683
},
"7": {
"recovery_pct": -470.9,
"logp_transplant_mean": -14.5902,
"logp_transplant_std": 2.2346
},
"8": {
"recovery_pct": -194.26,
"logp_transplant_mean": -14.7285,
"logp_transplant_std": 2.3823
},
"9": {
"recovery_pct": -379.04,
"logp_transplant_mean": -14.6361,
"logp_transplant_std": 2.1932
},
"10": {
"recovery_pct": -818.12,
"logp_transplant_mean": -14.4167,
"logp_transplant_std": 2.3253
},
"11": {
"recovery_pct": -785.01,
"logp_transplant_mean": -14.4333,
"logp_transplant_std": 1.9795
},
"12": {
"recovery_pct": -798.05,
"logp_transplant_mean": -14.4267,
"logp_transplant_std": 2.305
},
"13": {
"recovery_pct": -104.81,
"logp_transplant_mean": -14.7732,
"logp_transplant_std": 2.357
},
"14": {
"recovery_pct": 407.95,
"logp_transplant_mean": -15.0295,
"logp_transplant_std": 2.8019
},
"15": {
"recovery_pct": 71.89,
"logp_transplant_mean": -14.8615,
"logp_transplant_std": 2.6564
},
"16": {
"recovery_pct": -672.74,
"logp_transplant_mean": -14.4894,
"logp_transplant_std": 2.3578
},
"17": {
"recovery_pct": 112.29,
"logp_transplant_mean": -14.8817,
"logp_transplant_std": 2.3406
},
"18": {
"recovery_pct": -447.09,
"logp_transplant_mean": -14.6021,
"logp_transplant_std": 2.205
},
"19": {
"recovery_pct": -569.58,
"logp_transplant_mean": -14.5409,
"logp_transplant_std": 2.259
},
"20": {
"recovery_pct": -474.43,
"logp_transplant_mean": -14.5885,
"logp_transplant_std": 2.3099
},
"21": {
"recovery_pct": -739.27,
"logp_transplant_mean": -14.4561,
"logp_transplant_std": 2.477
},
"22": {
"recovery_pct": -1065.09,
"logp_transplant_mean": -14.2933,
"logp_transplant_std": 2.6142
},
"23": {
"recovery_pct": -600.65,
"logp_transplant_mean": -14.5254,
"logp_transplant_std": 2.5483
},
"24": {
"recovery_pct": -901.16,
"logp_transplant_mean": -14.3752,
"logp_transplant_std": 2.5421
},
"25": {
"recovery_pct": -536.13,
"logp_transplant_mean": -14.5576,
"logp_transplant_std": 2.4489
},
"26": {
"recovery_pct": -382.06,
"logp_transplant_mean": -14.6346,
"logp_transplant_std": 2.755
},
"27": {
"recovery_pct": -557.72,
"logp_transplant_mean": -14.5468,
"logp_transplant_std": 2.7981
},
"28": {
"recovery_pct": -625.42,
"logp_transplant_mean": -14.513,
"logp_transplant_std": 2.659
},
"29": {
"recovery_pct": -736.55,
"logp_transplant_mean": -14.4575,
"logp_transplant_std": 2.7427
},
"30": {
"recovery_pct": -567.96,
"logp_transplant_mean": -14.5417,
"logp_transplant_std": 2.7488
},
"31": {
"recovery_pct": -136.75,
"logp_transplant_mean": -14.7572,
"logp_transplant_std": 2.7043
}
},
"L_crit_90": null,
"L_crit_99": null,
"alpha_90": null,
"alpha_99": null,
"recovery_at_Lcrit": null,
"n_layers": 32,
"d_model": 2560,
"model": "EleutherAI/pythia-2.8b",
"seed": 42,
"runtime_seconds": 1043.0
}