taf-agent / data /e4_gamma /google--gemma-2-9b-it_random.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
3.05 kB
{
"model": "google/gemma-2-9b-it",
"theta": 10000,
"gamma_pred": 0.99999561666838,
"C_theory": 9.2103,
"distances": [
10,
20,
30,
50,
100,
200,
500,
1000,
2000
],
"distances_fit": [
30,
50,
100,
200,
500,
1000,
2000
],
"d_min_fit": 30,
"n_prompts_per_distance": 150,
"seeds": [
42,
123,
7
],
"attn_by_distance": {
"10": {
"mean_across_seeds": 0.01131202671935575,
"std_across_seeds": 0.0004384004663510598,
"per_seed_means": [
0.01191513662226498,
0.011134915679382781,
0.010886027856419483
]
},
"20": {
"mean_across_seeds": 0.007342287618666887,
"std_across_seeds": 0.000120221270640251,
"per_seed_means": [
0.0071971141314134,
0.007338237394578755,
0.007491511330008507
]
},
"30": {
"mean_across_seeds": 0.005608218560616176,
"std_across_seeds": 0.00012586673790719274,
"per_seed_means": [
0.005452117463573813,
0.00576035007291163,
0.005612188145363082
]
},
"50": {
"mean_across_seeds": 0.004600468463678327,
"std_across_seeds": 0.00029442297838144305,
"per_seed_means": [
0.004994370874483138,
0.004286649797577411,
0.004520384718974432
]
},
"100": {
"mean_across_seeds": 0.0025041243884091576,
"std_across_seeds": 0.00013270791219153536,
"per_seed_means": [
0.0026802454908223202,
0.0024722163340387244,
0.0023599113403664283
]
},
"200": {
"mean_across_seeds": 0.0011723479800275526,
"std_across_seeds": 0.00010549223246344652,
"per_seed_means": [
0.00103700214473065,
0.0012943720275264544,
0.0011856697678255539
]
},
"500": {
"mean_across_seeds": 0.00037003465085743104,
"std_across_seeds": 6.662525937622196e-05,
"per_seed_means": [
0.00031459913613313497,
0.0004637339629213481,
0.00033177085351780987
]
},
"1000": {
"mean_across_seeds": 0.0001858278461845152,
"std_across_seeds": 5.3211896888022095e-06,
"per_seed_means": [
0.00019292063060371827,
0.00018445904356970762,
0.00018010386438011968
]
},
"2000": {
"mean_across_seeds": 4.510536613654242e-05,
"std_across_seeds": 1.884703048218177e-06,
"per_seed_means": [
4.538706549889563e-05,
4.266916409202774e-05,
4.725986881870389e-05
]
}
},
"fit_power_law": {
"gamma": 1.1347958464287666,
"log_A": -0.9640958037685541,
"R2": 0.976472,
"n_points": 7
},
"fit_exponential": {
"lambda": 0.002322719608941013,
"log_A": -5.827234742708562,
"R2": 0.881621,
"n_points": 7
},
"delta_R2_power_minus_exp": 0.0949,
"gamma_CI_95": {
"lo": 0.9244744962120605,
"hi": 1.331560490527999
},
"decision": "ANOMALY: long-context training effect"
}