File size: 4,569 Bytes
535348a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
{
  "tau_90": 0.9,
  "tau_99": 0.99,
  "N_prompts": 50,
  "dist_short": 10,
  "dist_long": 1000,
  "vocab_low": 1000,
  "vocab_high": 49000,
  "n_prefix": 20,
  "ref_logp_d10": {
    "mean": -14.8755,
    "std": 2.7859
  },
  "baseline_logp_d1000": {
    "mean": -14.8256,
    "std": 2.527
  },
  "logp_gap": -0.05,
  "layer_sweep": {
    "0": {
      "recovery_pct": -0.0,
      "logp_transplant_mean": -14.8256,
      "logp_transplant_std": 2.527
    },
    "1": {
      "recovery_pct": 78.61,
      "logp_transplant_mean": -14.8649,
      "logp_transplant_std": 2.5669
    },
    "2": {
      "recovery_pct": -373.24,
      "logp_transplant_mean": -14.639,
      "logp_transplant_std": 2.5252
    },
    "3": {
      "recovery_pct": -304.78,
      "logp_transplant_mean": -14.6733,
      "logp_transplant_std": 2.4592
    },
    "4": {
      "recovery_pct": 113.78,
      "logp_transplant_mean": -14.8824,
      "logp_transplant_std": 2.4183
    },
    "5": {
      "recovery_pct": -269.64,
      "logp_transplant_mean": -14.6908,
      "logp_transplant_std": 2.3048
    },
    "6": {
      "recovery_pct": -160.57,
      "logp_transplant_mean": -14.7453,
      "logp_transplant_std": 2.3683
    },
    "7": {
      "recovery_pct": -470.9,
      "logp_transplant_mean": -14.5902,
      "logp_transplant_std": 2.2346
    },
    "8": {
      "recovery_pct": -194.26,
      "logp_transplant_mean": -14.7285,
      "logp_transplant_std": 2.3823
    },
    "9": {
      "recovery_pct": -379.04,
      "logp_transplant_mean": -14.6361,
      "logp_transplant_std": 2.1932
    },
    "10": {
      "recovery_pct": -818.12,
      "logp_transplant_mean": -14.4167,
      "logp_transplant_std": 2.3253
    },
    "11": {
      "recovery_pct": -785.01,
      "logp_transplant_mean": -14.4333,
      "logp_transplant_std": 1.9795
    },
    "12": {
      "recovery_pct": -798.05,
      "logp_transplant_mean": -14.4267,
      "logp_transplant_std": 2.305
    },
    "13": {
      "recovery_pct": -104.81,
      "logp_transplant_mean": -14.7732,
      "logp_transplant_std": 2.357
    },
    "14": {
      "recovery_pct": 407.95,
      "logp_transplant_mean": -15.0295,
      "logp_transplant_std": 2.8019
    },
    "15": {
      "recovery_pct": 71.89,
      "logp_transplant_mean": -14.8615,
      "logp_transplant_std": 2.6564
    },
    "16": {
      "recovery_pct": -672.74,
      "logp_transplant_mean": -14.4894,
      "logp_transplant_std": 2.3578
    },
    "17": {
      "recovery_pct": 112.29,
      "logp_transplant_mean": -14.8817,
      "logp_transplant_std": 2.3406
    },
    "18": {
      "recovery_pct": -447.09,
      "logp_transplant_mean": -14.6021,
      "logp_transplant_std": 2.205
    },
    "19": {
      "recovery_pct": -569.58,
      "logp_transplant_mean": -14.5409,
      "logp_transplant_std": 2.259
    },
    "20": {
      "recovery_pct": -474.43,
      "logp_transplant_mean": -14.5885,
      "logp_transplant_std": 2.3099
    },
    "21": {
      "recovery_pct": -739.27,
      "logp_transplant_mean": -14.4561,
      "logp_transplant_std": 2.477
    },
    "22": {
      "recovery_pct": -1065.09,
      "logp_transplant_mean": -14.2933,
      "logp_transplant_std": 2.6142
    },
    "23": {
      "recovery_pct": -600.65,
      "logp_transplant_mean": -14.5254,
      "logp_transplant_std": 2.5483
    },
    "24": {
      "recovery_pct": -901.16,
      "logp_transplant_mean": -14.3752,
      "logp_transplant_std": 2.5421
    },
    "25": {
      "recovery_pct": -536.13,
      "logp_transplant_mean": -14.5576,
      "logp_transplant_std": 2.4489
    },
    "26": {
      "recovery_pct": -382.06,
      "logp_transplant_mean": -14.6346,
      "logp_transplant_std": 2.755
    },
    "27": {
      "recovery_pct": -557.72,
      "logp_transplant_mean": -14.5468,
      "logp_transplant_std": 2.7981
    },
    "28": {
      "recovery_pct": -625.42,
      "logp_transplant_mean": -14.513,
      "logp_transplant_std": 2.659
    },
    "29": {
      "recovery_pct": -736.55,
      "logp_transplant_mean": -14.4575,
      "logp_transplant_std": 2.7427
    },
    "30": {
      "recovery_pct": -567.96,
      "logp_transplant_mean": -14.5417,
      "logp_transplant_std": 2.7488
    },
    "31": {
      "recovery_pct": -136.75,
      "logp_transplant_mean": -14.7572,
      "logp_transplant_std": 2.7043
    }
  },
  "L_crit_90": null,
  "L_crit_99": null,
  "alpha_90": null,
  "alpha_99": null,
  "recovery_at_Lcrit": null,
  "n_layers": 32,
  "d_model": 2560,
  "model": "EleutherAI/pythia-2.8b",
  "seed": 42,
  "runtime_seconds": 1043.0
}