{
"model": "EleutherAI/pythia-70m",
"theta": 10000,
"d_head": 64,
"n_layers": 6,
"L_crit_known": 4,
"z": 0.282842712474619,
"gamma_pos_pred": 0.7522013138014093,
"gamma_pade": 0.7522013138014093,
"beta_gamma": 0.2,
"distances": [
10,
20,
30,
50,
100,
200,
500,
1000,
2000
],
"distances_fit": [
30,
50,
100,
200,
500,
1000,
2000
],
"n_prompts": 150,
"seeds": [
42,
123,
7
],
"layer_gamma": {
"0": {
"gamma": 1.3468013543313044,
"R2": 0.981851,
"n_points": 7,
"type": "pos"
},
"1": {
"gamma": 1.410356134563726,
"R2": 0.886404,
"n_points": 7,
"type": "pos"
},
"2": {
"gamma": 1.1152541530423556,
"R2": 0.949761,
"n_points": 7,
"type": "pos"
},
"3": {
"gamma": 1.1030121418119894,
"R2": 0.992778,
"n_points": 7,
"type": "pos"
},
"4": {
"gamma": null,
"R2": 0.0,
"n_points": 0,
"type": "sem"
},
"5": {
"gamma": null,
"R2": 0.0,
"n_points": 0,
"type": "sem"
}
},
"per_layer_agg": {
"0": {
"10": 0.015644904689656364,
"20": 0.013133970548709234,
"30": 0.005567839278115167,
"50": 0.003556306262811025,
"100": 0.0019510852628284031,
"200": 0.0007665379345417021,
"500": 0.0002498780190944672,
"1000": 5.03444837199317e-05,
"2000": 2.262747950024075e-05
},
"1": {
"10": 0.008926776730351978,
"20": 0.01036835898955663,
"30": 0.0026452516516049704,
"50": 0.0025659463637404973,
"100": 0.0008467986186345418,
"200": 0.0005270672672324711,
"500": 0.00018555617994732326,
"1000": 8.427821927600437e-05,
"2000": 3.328240580028958e-06
},
"2": {
"10": 0.016187396844228107,
"20": 0.010158376197020213,
"30": 0.0047512871026992795,
"50": 0.0032849965658452774,
"100": 0.0013126978443728553,
"200": 0.0007603488696946038,
"500": 0.00015906307432386608,
"1000": 5.299210548400879e-05,
"2000": 8.578023976749844e-05
},
"3": {
"10": 0.01852987120057353,
"20": 0.014939713157816894,
"30": 0.007211493629470674,
"50": 0.005900978506348717,
"100": 0.0021263419639500273,
"200": 0.001293775682166193,
"500": 0.00036153811212797233,
"1000": 0.00019700892104083324,
"2000": 7.671554883321127e-05
},
"4": {
"10": null,
"20": null,
"30": null,
"50": null,
"100": null,
"200": null,
"500": null,
"1000": null,
"2000": null
},
"5": {
"10": null,
"20": null,
"30": null,
"50": null,
"100": null,
"200": null,
"500": null,
"1000": null,
"2000": null
}
}
}