Spaces:
Running
Running
File size: 1,532 Bytes
535348a | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 | {
"model": "pythia-70m",
"d_head": 64,
"theta_opt": 25330,
"n_prompts": 30,
"results": {
"orig": {
"theta": 10000,
"f_active": 0.4688,
"R_curve": [
-0.6016,
-0.2562,
-1.0246,
1.2354,
0.9883,
1.0
],
"L_crit": 3,
"max_R": 1.2354,
"mu_baseline": -14.133,
"mu_d10": -13.5259
},
"2x": {
"theta": 20000,
"f_active": 0.5,
"R_curve": [
-1.2888,
-0.6825,
-0.4616,
0.8958,
1.0183,
1.0
],
"L_crit": 4,
"max_R": 1.0183,
"mu_baseline": -14.7723,
"mu_d10": -14.1086
},
"5x": {
"theta": 50000,
"f_active": 0.5625,
"R_curve": [
3.1073,
3.6146,
2.2174,
0.9883,
0.9279,
1.0
],
"L_crit": 0,
"max_R": 3.6146,
"mu_baseline": -14.2183,
"mu_d10": -14.6064
},
"10x": {
"theta": 100000,
"f_active": 0.5625,
"R_curve": [
14.4179,
14.652,
7.5319,
0.4504,
2.0614,
1.0
],
"L_crit": 0,
"max_R": 14.652,
"mu_baseline": -14.4646,
"mu_d10": -14.5444
},
"opt": {
"theta": 25330,
"f_active": 0.5,
"R_curve": [
-0.9232,
-0.0786,
-0.7304,
0.9235,
0.8343,
1.0
],
"L_crit": 3,
"max_R": 1.0,
"mu_baseline": -14.8087,
"mu_d10": -14.261
}
}
} |