taf-agent / data /e4_gamma /Qwen--Qwen2.5-7B_random.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
3.07 kB
{
"model": "Qwen/Qwen2.5-7B",
"theta": 1000000,
"gamma_pred": 0.6666637444455867,
"C_theory": 9.2103,
"distances": [
10,
20,
30,
50,
100,
200,
500,
1000,
2000
],
"distances_fit": [
30,
50,
100,
200,
500,
1000,
2000
],
"d_min_fit": 30,
"n_prompts_per_distance": 150,
"seeds": [
42,
123,
7
],
"attn_by_distance": {
"10": {
"mean_across_seeds": 0.009949791732554635,
"std_across_seeds": 0.00017400484474847187,
"per_seed_means": [
0.00970459462919583,
0.010054353810846805,
0.010090426757621269
]
},
"20": {
"mean_across_seeds": 0.00652512194097249,
"std_across_seeds": 0.00027764715284577684,
"per_seed_means": [
0.006915346873768916,
0.006367762469065686,
0.00629225648008287
]
},
"30": {
"mean_across_seeds": 0.004573273731706043,
"std_across_seeds": 0.0002440010861132137,
"per_seed_means": [
0.004245316321806361,
0.00483019192237407,
0.004644312950937699
]
},
"50": {
"mean_across_seeds": 0.0037503224599640815,
"std_across_seeds": 0.00014970965595137803,
"per_seed_means": [
0.0036074511027739693,
0.003686442569984744,
0.003957073707133532
]
},
"100": {
"mean_across_seeds": 0.0017626451529536603,
"std_across_seeds": 6.538491081934697e-05,
"per_seed_means": [
0.0016974271783449998,
0.0017384849436348304,
0.0018520233368811507
]
},
"200": {
"mean_across_seeds": 0.0009006613932110162,
"std_across_seeds": 1.4542795753788803e-05,
"per_seed_means": [
0.0008808788963748763,
0.0009056814018792162,
0.0009154238813789561
]
},
"500": {
"mean_across_seeds": 0.0004466055328116959,
"std_across_seeds": 2.9333787485462512e-05,
"per_seed_means": [
0.0004095632961252704,
0.00044895225291838867,
0.0004813010493914286
]
},
"1000": {
"mean_across_seeds": 0.00036055122376031553,
"std_across_seeds": 3.763717614004054e-05,
"per_seed_means": [
0.00032056129857664927,
0.00035012514175226294,
0.0004109672309520344
]
},
"2000": {
"mean_across_seeds": 0.00013122257518666125,
"std_across_seeds": 2.1018759696526725e-06,
"per_seed_means": [
0.0001299849769566208,
0.00013418190562030456,
0.00012950084298305833
]
}
},
"fit_power_law": {
"gamma": 0.8270155146179213,
"log_A": -2.5043057610030255,
"R2": 0.984663,
"n_points": 7
},
"fit_exponential": {
"lambda": 0.00159574430485393,
"log_A": -6.102228480230107,
"R2": 0.790044,
"n_points": 7
},
"delta_R2_power_minus_exp": 0.1946,
"gamma_CI_95": {
"lo": 0.718555951342085,
"hi": 0.9106818877708862
},
"decision": "UNCLEAR: \u03b3=0.827 outside all expected ranges"
}