Spaces:
Running
Running
| { | |
| "model": "google/gemma-2-9b-it", | |
| "theta": 10000, | |
| "gamma_pred": 0.99999561666838, | |
| "C_theory": 9.2103, | |
| "distances": [ | |
| 10, | |
| 20, | |
| 30, | |
| 50, | |
| 100, | |
| 200, | |
| 500, | |
| 1000, | |
| 2000 | |
| ], | |
| "distances_fit": [ | |
| 30, | |
| 50, | |
| 100, | |
| 200, | |
| 500, | |
| 1000, | |
| 2000 | |
| ], | |
| "d_min_fit": 30, | |
| "n_prompts_per_distance": 150, | |
| "seeds": [ | |
| 42, | |
| 123, | |
| 7 | |
| ], | |
| "attn_by_distance": { | |
| "10": { | |
| "mean_across_seeds": 0.01131202671935575, | |
| "std_across_seeds": 0.0004384004663510598, | |
| "per_seed_means": [ | |
| 0.01191513662226498, | |
| 0.011134915679382781, | |
| 0.010886027856419483 | |
| ] | |
| }, | |
| "20": { | |
| "mean_across_seeds": 0.007342287618666887, | |
| "std_across_seeds": 0.000120221270640251, | |
| "per_seed_means": [ | |
| 0.0071971141314134, | |
| 0.007338237394578755, | |
| 0.007491511330008507 | |
| ] | |
| }, | |
| "30": { | |
| "mean_across_seeds": 0.005608218560616176, | |
| "std_across_seeds": 0.00012586673790719274, | |
| "per_seed_means": [ | |
| 0.005452117463573813, | |
| 0.00576035007291163, | |
| 0.005612188145363082 | |
| ] | |
| }, | |
| "50": { | |
| "mean_across_seeds": 0.004600468463678327, | |
| "std_across_seeds": 0.00029442297838144305, | |
| "per_seed_means": [ | |
| 0.004994370874483138, | |
| 0.004286649797577411, | |
| 0.004520384718974432 | |
| ] | |
| }, | |
| "100": { | |
| "mean_across_seeds": 0.0025041243884091576, | |
| "std_across_seeds": 0.00013270791219153536, | |
| "per_seed_means": [ | |
| 0.0026802454908223202, | |
| 0.0024722163340387244, | |
| 0.0023599113403664283 | |
| ] | |
| }, | |
| "200": { | |
| "mean_across_seeds": 0.0011723479800275526, | |
| "std_across_seeds": 0.00010549223246344652, | |
| "per_seed_means": [ | |
| 0.00103700214473065, | |
| 0.0012943720275264544, | |
| 0.0011856697678255539 | |
| ] | |
| }, | |
| "500": { | |
| "mean_across_seeds": 0.00037003465085743104, | |
| "std_across_seeds": 6.662525937622196e-05, | |
| "per_seed_means": [ | |
| 0.00031459913613313497, | |
| 0.0004637339629213481, | |
| 0.00033177085351780987 | |
| ] | |
| }, | |
| "1000": { | |
| "mean_across_seeds": 0.0001858278461845152, | |
| "std_across_seeds": 5.3211896888022095e-06, | |
| "per_seed_means": [ | |
| 0.00019292063060371827, | |
| 0.00018445904356970762, | |
| 0.00018010386438011968 | |
| ] | |
| }, | |
| "2000": { | |
| "mean_across_seeds": 4.510536613654242e-05, | |
| "std_across_seeds": 1.884703048218177e-06, | |
| "per_seed_means": [ | |
| 4.538706549889563e-05, | |
| 4.266916409202774e-05, | |
| 4.725986881870389e-05 | |
| ] | |
| } | |
| }, | |
| "fit_power_law": { | |
| "gamma": 1.1347958464287666, | |
| "log_A": -0.9640958037685541, | |
| "R2": 0.976472, | |
| "n_points": 7 | |
| }, | |
| "fit_exponential": { | |
| "lambda": 0.002322719608941013, | |
| "log_A": -5.827234742708562, | |
| "R2": 0.881621, | |
| "n_points": 7 | |
| }, | |
| "delta_R2_power_minus_exp": 0.0949, | |
| "gamma_CI_95": { | |
| "lo": 0.9244744962120605, | |
| "hi": 1.331560490527999 | |
| }, | |
| "decision": "ANOMALY: long-context training effect" | |
| } |