taf-agent / data /e4_gamma /EleutherAI--pythia-1.4b_random.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
3.07 kB
{
"model": "EleutherAI/pythia-1.4b",
"theta": 10000,
"gamma_pred": 0.99999561666838,
"C_theory": 9.2103,
"distances": [
10,
20,
30,
50,
100,
200,
500,
1000,
2000
],
"distances_fit": [
30,
50,
100,
200,
500,
1000,
2000
],
"d_min_fit": 30,
"n_prompts_per_distance": 150,
"seeds": [
42,
123,
7
],
"attn_by_distance": {
"10": {
"mean_across_seeds": 0.00868701820054816,
"std_across_seeds": 0.000225376018293542,
"per_seed_means": [
0.00849575198100259,
0.008561847213034829,
0.009003455407607058
]
},
"20": {
"mean_across_seeds": 0.007241151898374988,
"std_across_seeds": 0.000907916062609691,
"per_seed_means": [
0.008468000154631833,
0.006299703560459117,
0.006955751980034014
]
},
"30": {
"mean_across_seeds": 0.004176199407730666,
"std_across_seeds": 0.0003113188967399462,
"per_seed_means": [
0.003928308213750522,
0.0039850392285734415,
0.004615250780868034
]
},
"50": {
"mean_across_seeds": 0.0029845095390919596,
"std_across_seeds": 0.00023642395319887298,
"per_seed_means": [
0.0027204082436704385,
0.0029389867997573066,
0.0032941335738481334
]
},
"100": {
"mean_across_seeds": 0.0028477065866657843,
"std_across_seeds": 0.0010192211252852063,
"per_seed_means": [
0.004288771225837991,
0.002153952665782223,
0.002100395868377139
]
},
"200": {
"mean_across_seeds": 0.0014213456220588544,
"std_across_seeds": 0.00018510584610857393,
"per_seed_means": [
0.0012832466786494479,
0.0012978002527961508,
0.0016829899347309645
]
},
"500": {
"mean_across_seeds": 0.0004443507219710025,
"std_across_seeds": 2.1944710361610797e-05,
"per_seed_means": [
0.0004357509139420775,
0.0004228264523165611,
0.00047447479965436894
]
},
"1000": {
"mean_across_seeds": 0.00037049855294753794,
"std_across_seeds": 7.606907661861908e-06,
"per_seed_means": [
0.0003622182499869571,
0.0003686910155132258,
0.00038058639334243103
]
},
"2000": {
"mean_across_seeds": 0.0003167598478871191,
"std_across_seeds": 8.808747176569926e-06,
"per_seed_means": [
0.00031430382912124816,
0.0003074111366489281,
0.0003285645778911809
]
}
},
"fit_power_law": {
"gamma": 0.6875846707476845,
"log_A": -3.0428636808858562,
"R2": 0.948837,
"n_points": 7
},
"fit_exponential": {
"lambda": 0.0012564601985353926,
"log_A": -6.073132081889184,
"R2": 0.682811,
"n_points": 7
},
"delta_R2_power_minus_exp": 0.266,
"gamma_CI_95": {
"lo": 0.5680458803652685,
"hi": 0.8957392897879572
},
"decision": "UNCLEAR: \u03b3=0.688 outside all expected ranges"
}