Spaces:
Running
Running
File size: 3,082 Bytes
535348a | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 | {
"model": "EleutherAI/pythia-1b",
"theta": 10000,
"gamma_pred": 0.99999561666838,
"C_theory": 9.2103,
"distances": [
10,
20,
30,
50,
100,
200,
500,
1000,
2000
],
"distances_fit": [
30,
50,
100,
200,
500,
1000,
2000
],
"d_min_fit": 30,
"n_prompts_per_distance": 150,
"seeds": [
42,
123,
7
],
"attn_by_distance": {
"10": {
"mean_across_seeds": 0.010958388174573582,
"std_across_seeds": 0.0004834559168031873,
"per_seed_means": [
0.011297275526449085,
0.010274686822667719,
0.011303202174603939
]
},
"20": {
"mean_across_seeds": 0.006365462491909664,
"std_across_seeds": 4.797004634512219e-05,
"per_seed_means": [
0.006431558985883991,
0.006319180646290382,
0.006345647843554616
]
},
"30": {
"mean_across_seeds": 0.003956688532812728,
"std_across_seeds": 0.00041444934898881186,
"per_seed_means": [
0.003707738428687056,
0.003621630910784006,
0.0045406962589671215
]
},
"50": {
"mean_across_seeds": 0.0027740057195640272,
"std_across_seeds": 0.00017409472550222068,
"per_seed_means": [
0.0028004927871127924,
0.0025487780198454857,
0.0029727463517338036
]
},
"100": {
"mean_across_seeds": 0.0014326052833348512,
"std_across_seeds": 4.960638948465883e-05,
"per_seed_means": [
0.0014700610004365444,
0.001362506297106544,
0.0014652485524614652
]
},
"200": {
"mean_across_seeds": 0.0006671193842258718,
"std_across_seeds": 0.00014972843939483376,
"per_seed_means": [
0.00054337820969522,
0.0005801813707997401,
0.0008777985721826554
]
},
"500": {
"mean_across_seeds": 0.00020134633510477014,
"std_across_seeds": 1.977215748224994e-05,
"per_seed_means": [
0.00018427866821487746,
0.00019069870933890342,
0.0002290616277605295
]
},
"1000": {
"mean_across_seeds": 0.00015050364037354788,
"std_across_seeds": 1.545945974564147e-05,
"per_seed_means": [
0.00014964959894617398,
0.00016985010355710984,
0.0001320112186173598
]
},
"2000": {
"mean_across_seeds": 0.00010232122304538885,
"std_across_seeds": 6.657508586021642e-06,
"per_seed_means": [
0.00010441893401245276,
0.00010922116227447987,
9.332357284923395e-05
]
}
},
"fit_power_law": {
"gamma": 0.9311078627189842,
"log_A": -2.350543685121484,
"R2": 0.983104,
"n_points": 7
},
"fit_exponential": {
"lambda": 0.001683695888726774,
"log_A": -6.4638962346156505,
"R2": 0.692773,
"n_points": 7
},
"delta_R2_power_minus_exp": 0.2903,
"gamma_CI_95": {
"lo": 0.8649963102497168,
"hi": 1.0919504310156105
},
"decision": "CONFIRMED: \u03b3 law holds (\u03b3\u00d7ln(\u03b8) = C)"
} |