taf-agent / data /exp_yarn /pythia-70m_yarn_scan.json
karlexmarin's picture
feat: ship paper artefacts + CLI diagnostic alongside browser tool
535348a
raw
history blame
1.53 kB
{
"model": "pythia-70m",
"d_head": 64,
"theta_opt": 25330,
"n_prompts": 30,
"results": {
"orig": {
"theta": 10000,
"f_active": 0.4688,
"R_curve": [
-0.6016,
-0.2562,
-1.0246,
1.2354,
0.9883,
1.0
],
"L_crit": 3,
"max_R": 1.2354,
"mu_baseline": -14.133,
"mu_d10": -13.5259
},
"2x": {
"theta": 20000,
"f_active": 0.5,
"R_curve": [
-1.2888,
-0.6825,
-0.4616,
0.8958,
1.0183,
1.0
],
"L_crit": 4,
"max_R": 1.0183,
"mu_baseline": -14.7723,
"mu_d10": -14.1086
},
"5x": {
"theta": 50000,
"f_active": 0.5625,
"R_curve": [
3.1073,
3.6146,
2.2174,
0.9883,
0.9279,
1.0
],
"L_crit": 0,
"max_R": 3.6146,
"mu_baseline": -14.2183,
"mu_d10": -14.6064
},
"10x": {
"theta": 100000,
"f_active": 0.5625,
"R_curve": [
14.4179,
14.652,
7.5319,
0.4504,
2.0614,
1.0
],
"L_crit": 0,
"max_R": 14.652,
"mu_baseline": -14.4646,
"mu_d10": -14.5444
},
"opt": {
"theta": 25330,
"f_active": 0.5,
"R_curve": [
-0.9232,
-0.0786,
-0.7304,
0.9235,
0.8343,
1.0
],
"L_crit": 3,
"max_R": 1.0,
"mu_baseline": -14.8087,
"mu_d10": -14.261
}
}
}