Spaces:
Running
Running
File size: 1,620 Bytes
535348a | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 | {
"analysis": "T-ContentDecay: short vs long range gamma split",
"d_short_max": 100,
"d_long_min": 200,
"models": [
{
"model": "EleutherAI/pythia-70m",
"theta": 10000,
"gamma_full": 0.6811,
"r2_full": 0.9825,
"gamma_short": 0.6611,
"r2_short": 0.9632,
"gamma_long": 0.8564,
"r2_long": 0.9815,
"delta_long_minus_short": 0.1953,
"n_short": 5,
"n_long": 4,
"short_range": "d<=100",
"long_range": "d>=200"
},
{
"model": "meta-llama/Meta-Llama-3-8B",
"theta": 500000,
"gamma_full": 0.8313,
"r2_full": 0.9936,
"gamma_short": 0.8125,
"r2_short": 0.9899,
"gamma_long": 1.0413,
"r2_long": 0.988,
"delta_long_minus_short": 0.2289,
"n_short": 5,
"n_long": 4,
"short_range": "d<=100",
"long_range": "d>=200"
},
{
"model": "mistralai/Mistral-7B-v0.1",
"theta": 10000,
"gamma_full": null,
"r2_full": null,
"gamma_short": null,
"r2_short": null,
"gamma_long": null,
"r2_long": null,
"delta_long_minus_short": null,
"n_short": 2,
"n_long": 0,
"short_range": "d<=100",
"long_range": "d>=200"
},
{
"model": "Qwen/Qwen2.5-7B",
"theta": 1000000,
"gamma_full": 0.9145,
"r2_full": 0.9993,
"gamma_short": 0.9041,
"r2_short": 0.9996,
"gamma_long": 0.8542,
"r2_long": 0.9936,
"delta_long_minus_short": -0.0499,
"n_short": 5,
"n_long": 4,
"short_range": "d<=100",
"long_range": "d>=200"
}
]
} |