taf-agent / data /e4_gamma /EleutherAI--pythia-2.8b_random.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
3.08 kB
{
"model": "EleutherAI/pythia-2.8b",
"theta": 10000,
"gamma_pred": 0.99999561666838,
"C_theory": 9.2103,
"distances": [
10,
20,
30,
50,
100,
200,
500,
1000,
2000
],
"distances_fit": [
30,
50,
100,
200,
500,
1000,
2000
],
"d_min_fit": 30,
"n_prompts_per_distance": 150,
"seeds": [
42,
123,
7
],
"attn_by_distance": {
"10": {
"mean_across_seeds": 0.007388996658846736,
"std_across_seeds": 0.00018226253624295958,
"per_seed_means": [
0.007328578910479943,
0.007202199265981714,
0.007636211800078551
]
},
"20": {
"mean_across_seeds": 0.0065620680425005655,
"std_across_seeds": 0.0013119660642064493,
"per_seed_means": [
0.008389089189780255,
0.005368597246706486,
0.005928517691014956
]
},
"30": {
"mean_across_seeds": 0.004171221432948693,
"std_across_seeds": 5.492056749426419e-05,
"per_seed_means": [
0.004100738317550471,
0.004178205231825511,
0.0042347207494700945
]
},
"50": {
"mean_across_seeds": 0.0028834379232850755,
"std_across_seeds": 0.00011670489556831891,
"per_seed_means": [
0.002764531443050752,
0.0030420172734496494,
0.0028437650533548247
]
},
"100": {
"mean_across_seeds": 0.0016150823904253128,
"std_across_seeds": 1.6027428565874314e-05,
"per_seed_means": [
0.0015924673308230315,
0.001627707876614295,
0.001625071963838612
]
},
"200": {
"mean_across_seeds": 0.0012179727724287658,
"std_across_seeds": 1.7310186855210638e-05,
"per_seed_means": [
0.001211881641841804,
0.0012004845253735159,
0.0012415521500709777
]
},
"500": {
"mean_across_seeds": 0.0003523622222484037,
"std_across_seeds": 3.2832611113364645e-05,
"per_seed_means": [
0.00039570461075830583,
0.00031626713990893525,
0.0003451149160779702
]
},
"1000": {
"mean_across_seeds": 0.00021088249445407807,
"std_across_seeds": 8.525966582865826e-06,
"per_seed_means": [
0.0002150495473082022,
0.00019900024810340255,
0.00021859768795062944
]
},
"2000": {
"mean_across_seeds": 0.0009888755242556928,
"std_across_seeds": 0.0010801453503042908,
"per_seed_means": [
0.00020996567844122182,
0.0002403297636192292,
0.0025163311307066275
]
}
},
"fit_power_law": {
"gamma": 0.5511942093739615,
"log_A": -3.841280530850879,
"R2": 0.644437,
"n_points": 7
},
"fit_exponential": {
"lambda": 0.0007053287474078895,
"log_A": -6.437797432208634,
"R2": 0.227415,
"n_points": 7
},
"delta_R2_power_minus_exp": 0.417,
"gamma_CI_95": {
"lo": 0.23611731057176769,
"hi": 0.9185010077352719
},
"decision": "UNCLEAR: \u03b3=0.551 outside all expected ranges"
}