File size: 2,207 Bytes
535348a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
{
  "model": "pythia-70m",
  "k_dead": 23,
  "distances": [
    10,
    20,
    50,
    100,
    200,
    500,
    1000,
    2000
  ],
  "results": {
    "1.0": {
      "alpha": 1.0,
      "k_dead": 23,
      "means": [
        0.009425997069726388,
        0.007616706314341475,
        0.003960159035632387,
        0.0018816962791849314,
        0.0014853083784206924,
        0.0006055987625450143,
        0.0003808813685085018,
        0.00015858603301590317
      ],
      "gamma_real": 0.7692273954314717,
      "r2": 0.9860517153515315,
      "gamma_sage_meanfield": 0.33,
      "err_vs_meanfield_pct": 133.0992107368096,
      "ppl_wikitext": null
    },
    "2.0": {
      "alpha": 2.0,
      "k_dead": 23,
      "means": [
        0.00890763213156788,
        0.006072100852854874,
        0.0031495152239991364,
        0.0017093524947366728,
        0.001437205056663894,
        0.0005462497385639863,
        0.00045400904272921617,
        0.00015552891511949496
      ],
      "gamma_real": 0.7273015822544925,
      "r2": 0.9815381835461346,
      "gamma_sage_meanfield": 0.48,
      "err_vs_meanfield_pct": 51.52116296968594,
      "ppl_wikitext": null
    },
    "3.0": {
      "alpha": 3.0,
      "k_dead": 23,
      "means": [
        0.009233167045204407,
        0.004930038112424881,
        0.0035480961872745333,
        0.002592464875204937,
        0.001741171412087207,
        0.000496885728552936,
        0.00040662634407486413,
        0.0002976683259442052
      ],
      "gamma_real": 0.6676490038337431,
      "r2": 0.9715798143918007,
      "gamma_sage_meanfield": 0.69,
      "err_vs_meanfield_pct": 3.2392748067038837,
      "ppl_wikitext": null
    },
    "5.0": {
      "alpha": 5.0,
      "k_dead": 23,
      "means": [
        0.010232932424529889,
        0.005207723380084042,
        0.004237773541388871,
        0.004040550790293906,
        0.0009580180254268576,
        0.0012850861333382796,
        0.0005448017653475767,
        0.00015817918144421132
      ],
      "gamma_real": 0.7022015830608412,
      "r2": 0.9060310930476675,
      "gamma_sage_meanfield": 1.03,
      "err_vs_meanfield_pct": 31.8250890232193,
      "ppl_wikitext": null
    }
  }
}