Spaces:
Running
Running
File size: 4,569 Bytes
535348a | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 | {
"tau_90": 0.9,
"tau_99": 0.99,
"N_prompts": 50,
"dist_short": 10,
"dist_long": 1000,
"vocab_low": 1000,
"vocab_high": 49000,
"n_prefix": 20,
"ref_logp_d10": {
"mean": -14.8755,
"std": 2.7859
},
"baseline_logp_d1000": {
"mean": -14.8256,
"std": 2.527
},
"logp_gap": -0.05,
"layer_sweep": {
"0": {
"recovery_pct": -0.0,
"logp_transplant_mean": -14.8256,
"logp_transplant_std": 2.527
},
"1": {
"recovery_pct": 78.61,
"logp_transplant_mean": -14.8649,
"logp_transplant_std": 2.5669
},
"2": {
"recovery_pct": -373.24,
"logp_transplant_mean": -14.639,
"logp_transplant_std": 2.5252
},
"3": {
"recovery_pct": -304.78,
"logp_transplant_mean": -14.6733,
"logp_transplant_std": 2.4592
},
"4": {
"recovery_pct": 113.78,
"logp_transplant_mean": -14.8824,
"logp_transplant_std": 2.4183
},
"5": {
"recovery_pct": -269.64,
"logp_transplant_mean": -14.6908,
"logp_transplant_std": 2.3048
},
"6": {
"recovery_pct": -160.57,
"logp_transplant_mean": -14.7453,
"logp_transplant_std": 2.3683
},
"7": {
"recovery_pct": -470.9,
"logp_transplant_mean": -14.5902,
"logp_transplant_std": 2.2346
},
"8": {
"recovery_pct": -194.26,
"logp_transplant_mean": -14.7285,
"logp_transplant_std": 2.3823
},
"9": {
"recovery_pct": -379.04,
"logp_transplant_mean": -14.6361,
"logp_transplant_std": 2.1932
},
"10": {
"recovery_pct": -818.12,
"logp_transplant_mean": -14.4167,
"logp_transplant_std": 2.3253
},
"11": {
"recovery_pct": -785.01,
"logp_transplant_mean": -14.4333,
"logp_transplant_std": 1.9795
},
"12": {
"recovery_pct": -798.05,
"logp_transplant_mean": -14.4267,
"logp_transplant_std": 2.305
},
"13": {
"recovery_pct": -104.81,
"logp_transplant_mean": -14.7732,
"logp_transplant_std": 2.357
},
"14": {
"recovery_pct": 407.95,
"logp_transplant_mean": -15.0295,
"logp_transplant_std": 2.8019
},
"15": {
"recovery_pct": 71.89,
"logp_transplant_mean": -14.8615,
"logp_transplant_std": 2.6564
},
"16": {
"recovery_pct": -672.74,
"logp_transplant_mean": -14.4894,
"logp_transplant_std": 2.3578
},
"17": {
"recovery_pct": 112.29,
"logp_transplant_mean": -14.8817,
"logp_transplant_std": 2.3406
},
"18": {
"recovery_pct": -447.09,
"logp_transplant_mean": -14.6021,
"logp_transplant_std": 2.205
},
"19": {
"recovery_pct": -569.58,
"logp_transplant_mean": -14.5409,
"logp_transplant_std": 2.259
},
"20": {
"recovery_pct": -474.43,
"logp_transplant_mean": -14.5885,
"logp_transplant_std": 2.3099
},
"21": {
"recovery_pct": -739.27,
"logp_transplant_mean": -14.4561,
"logp_transplant_std": 2.477
},
"22": {
"recovery_pct": -1065.09,
"logp_transplant_mean": -14.2933,
"logp_transplant_std": 2.6142
},
"23": {
"recovery_pct": -600.65,
"logp_transplant_mean": -14.5254,
"logp_transplant_std": 2.5483
},
"24": {
"recovery_pct": -901.16,
"logp_transplant_mean": -14.3752,
"logp_transplant_std": 2.5421
},
"25": {
"recovery_pct": -536.13,
"logp_transplant_mean": -14.5576,
"logp_transplant_std": 2.4489
},
"26": {
"recovery_pct": -382.06,
"logp_transplant_mean": -14.6346,
"logp_transplant_std": 2.755
},
"27": {
"recovery_pct": -557.72,
"logp_transplant_mean": -14.5468,
"logp_transplant_std": 2.7981
},
"28": {
"recovery_pct": -625.42,
"logp_transplant_mean": -14.513,
"logp_transplant_std": 2.659
},
"29": {
"recovery_pct": -736.55,
"logp_transplant_mean": -14.4575,
"logp_transplant_std": 2.7427
},
"30": {
"recovery_pct": -567.96,
"logp_transplant_mean": -14.5417,
"logp_transplant_std": 2.7488
},
"31": {
"recovery_pct": -136.75,
"logp_transplant_mean": -14.7572,
"logp_transplant_std": 2.7043
}
},
"L_crit_90": null,
"L_crit_99": null,
"alpha_90": null,
"alpha_99": null,
"recovery_at_Lcrit": null,
"n_layers": 32,
"d_model": 2560,
"model": "EleutherAI/pythia-2.8b",
"seed": 42,
"runtime_seconds": 1043.0
} |