Spaces:
Running
Running
File size: 2,207 Bytes
{
"model": "pythia-70m",
"k_dead": 23,
"distances": [
10,
20,
50,
100,
200,
500,
1000,
2000
],
"results": {
"1.0": {
"alpha": 1.0,
"k_dead": 23,
"means": [
0.009425997069726388,
0.007616706314341475,
0.003960159035632387,
0.0018816962791849314,
0.0014853083784206924,
0.0006055987625450143,
0.0003808813685085018,
0.00015858603301590317
],
"gamma_real": 0.7692273954314717,
"r2": 0.9860517153515315,
"gamma_sage_meanfield": 0.33,
"err_vs_meanfield_pct": 133.0992107368096,
"ppl_wikitext": NaN
},
"2.0": {
"alpha": 2.0,
"k_dead": 23,
"means": [
0.00890763213156788,
0.006072100852854874,
0.0031495152239991364,
0.0017093524947366728,
0.001437205056663894,
0.0005462497385639863,
0.00045400904272921617,
0.00015552891511949496
],
"gamma_real": 0.7273015822544925,
"r2": 0.9815381835461346,
"gamma_sage_meanfield": 0.48,
"err_vs_meanfield_pct": 51.52116296968594,
"ppl_wikitext": NaN
},
"3.0": {
"alpha": 3.0,
"k_dead": 23,
"means": [
0.009233167045204407,
0.004930038112424881,
0.0035480961872745333,
0.002592464875204937,
0.001741171412087207,
0.000496885728552936,
0.00040662634407486413,
0.0002976683259442052
],
"gamma_real": 0.6676490038337431,
"r2": 0.9715798143918007,
"gamma_sage_meanfield": 0.69,
"err_vs_meanfield_pct": 3.2392748067038837,
"ppl_wikitext": NaN
},
"5.0": {
"alpha": 5.0,
"k_dead": 23,
"means": [
0.010232932424529889,
0.005207723380084042,
0.004237773541388871,
0.004040550790293906,
0.0009580180254268576,
0.0012850861333382796,
0.0005448017653475767,
0.00015817918144421132
],
"gamma_real": 0.7022015830608412,
"r2": 0.9060310930476675,
"gamma_sage_meanfield": 1.03,
"err_vs_meanfield_pct": 31.8250890232193,
"ppl_wikitext": NaN
}
}
}