taf-agent / data /e4_gamma /cerebras--Cerebras-GPT-2.7B_mongo.partial.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
2.18 kB
{
"model": "cerebras/Cerebras-GPT-2.7B",
"theta": null,
"status": "partial",
"distances_done": [
10,
20,
30,
50,
100,
200,
500,
1000
],
"attn_by_distance": {
"10": {
"mean_across_seeds": 0.011066294480632578,
"std_across_seeds": 0.0003957905898929582,
"per_seed_means": [
0.010601912275888026,
0.01102786192825685,
0.011569109237752855
]
},
"20": {
"mean_across_seeds": 0.007225409053110828,
"std_across_seeds": 0.0005509117999463269,
"per_seed_means": [
0.006504136952571571,
0.007330936039021859,
0.007841154167739053
]
},
"30": {
"mean_across_seeds": 0.005252867244934249,
"std_across_seeds": 0.0002543120148813196,
"per_seed_means": [
0.005113226118652771,
0.005035656157803411,
0.0056097194583465656
]
},
"50": {
"mean_across_seeds": 0.003439449271989159,
"std_across_seeds": 8.001153093620939e-05,
"per_seed_means": [
0.0033557674067560585,
0.0034153297869488597,
0.0035472506222625575
]
},
"100": {
"mean_across_seeds": 0.0020080710809108697,
"std_across_seeds": 0.0002751025739235102,
"per_seed_means": [
0.0019321673724334687,
0.0017155670234933495,
0.002376478846805791
]
},
"200": {
"mean_across_seeds": 0.0008928673497090736,
"std_across_seeds": 9.575487302045444e-05,
"per_seed_means": [
0.0008424188293671857,
0.0008092582342214882,
0.0010269249855385473
]
},
"500": {
"mean_across_seeds": 0.00032154169373421206,
"std_across_seeds": 3.624580892715188e-05,
"per_seed_means": [
0.0002953432806922744,
0.00029648503094601136,
0.00037279676956435045
]
},
"1000": {
"mean_across_seeds": 0.00014317721089658638,
"std_across_seeds": 1.7442142724204942e-05,
"per_seed_means": [
0.00013669004430994392,
0.00012581060213657716,
0.00016703098624323804
]
}
},
"runtime_so_far": 433.1
}