{ "model": "cerebras/Cerebras-GPT-2.7B", "theta": null, "status": "partial", "distances_done": [ 10, 20, 30, 50, 100, 200, 500, 1000 ], "attn_by_distance": { "10": { "mean_across_seeds": 0.011066294480632578, "std_across_seeds": 0.0003957905898929582, "per_seed_means": [ 0.010601912275888026, 0.01102786192825685, 0.011569109237752855 ] }, "20": { "mean_across_seeds": 0.007225409053110828, "std_across_seeds": 0.0005509117999463269, "per_seed_means": [ 0.006504136952571571, 0.007330936039021859, 0.007841154167739053 ] }, "30": { "mean_across_seeds": 0.005252867244934249, "std_across_seeds": 0.0002543120148813196, "per_seed_means": [ 0.005113226118652771, 0.005035656157803411, 0.0056097194583465656 ] }, "50": { "mean_across_seeds": 0.003439449271989159, "std_across_seeds": 8.001153093620939e-05, "per_seed_means": [ 0.0033557674067560585, 0.0034153297869488597, 0.0035472506222625575 ] }, "100": { "mean_across_seeds": 0.0020080710809108697, "std_across_seeds": 0.0002751025739235102, "per_seed_means": [ 0.0019321673724334687, 0.0017155670234933495, 0.002376478846805791 ] }, "200": { "mean_across_seeds": 0.0008928673497090736, "std_across_seeds": 9.575487302045444e-05, "per_seed_means": [ 0.0008424188293671857, 0.0008092582342214882, 0.0010269249855385473 ] }, "500": { "mean_across_seeds": 0.00032154169373421206, "std_across_seeds": 3.624580892715188e-05, "per_seed_means": [ 0.0002953432806922744, 0.00029648503094601136, 0.00037279676956435045 ] }, "1000": { "mean_across_seeds": 0.00014317721089658638, "std_across_seeds": 1.7442142724204942e-05, "per_seed_means": [ 0.00013669004430994392, 0.00012581060213657716, 0.00016703098624323804 ] } }, "runtime_so_far": 433.1 }