Spaces:
Running
Running
| { | |
| "model_type": "rwkv_rnn", | |
| "tau_90": 0.9, | |
| "tau_99": 0.99, | |
| "N_prompts": 2, | |
| "dist_short": 10, | |
| "dist_long": 1000, | |
| "logp_gap": 5.3643, | |
| "ref_logp_d10": { | |
| "mean": -8.0806, | |
| "std": 2.5551 | |
| }, | |
| "baseline_logp_d1000": { | |
| "mean": -13.4449, | |
| "std": 0.5371 | |
| }, | |
| "layer_sweep": { | |
| "0": { | |
| "recovery_pct": 0.0, | |
| "logp_transplant_mean": -13.4449, | |
| "logp_transplant_std": 0.5371 | |
| }, | |
| "1": { | |
| "recovery_pct": 9.32, | |
| "logp_transplant_mean": -12.9449, | |
| "logp_transplant_std": 0.6751 | |
| }, | |
| "2": { | |
| "recovery_pct": 6.6, | |
| "logp_transplant_mean": -13.0907, | |
| "logp_transplant_std": 0.7562 | |
| }, | |
| "3": { | |
| "recovery_pct": 2.42, | |
| "logp_transplant_mean": -13.3152, | |
| "logp_transplant_std": 0.7399 | |
| }, | |
| "4": { | |
| "recovery_pct": -3.9, | |
| "logp_transplant_mean": -13.654, | |
| "logp_transplant_std": 0.5254 | |
| }, | |
| "5": { | |
| "recovery_pct": -5.81, | |
| "logp_transplant_mean": -13.7564, | |
| "logp_transplant_std": 0.3247 | |
| }, | |
| "6": { | |
| "recovery_pct": -11.03, | |
| "logp_transplant_mean": -14.0365, | |
| "logp_transplant_std": 0.535 | |
| }, | |
| "7": { | |
| "recovery_pct": -12.82, | |
| "logp_transplant_mean": -14.1328, | |
| "logp_transplant_std": 0.8057 | |
| }, | |
| "8": { | |
| "recovery_pct": -10.49, | |
| "logp_transplant_mean": -14.0078, | |
| "logp_transplant_std": 0.716 | |
| }, | |
| "9": { | |
| "recovery_pct": -9.73, | |
| "logp_transplant_mean": -13.9669, | |
| "logp_transplant_std": 0.7431 | |
| }, | |
| "10": { | |
| "recovery_pct": -8.57, | |
| "logp_transplant_mean": -13.9048, | |
| "logp_transplant_std": 0.731 | |
| }, | |
| "11": { | |
| "recovery_pct": -9.3, | |
| "logp_transplant_mean": -13.944, | |
| "logp_transplant_std": 0.7777 | |
| }, | |
| "12": { | |
| "recovery_pct": -6.77, | |
| "logp_transplant_mean": -13.8083, | |
| "logp_transplant_std": 0.7119 | |
| }, | |
| "13": { | |
| "recovery_pct": -7.08, | |
| "logp_transplant_mean": -13.8246, | |
| "logp_transplant_std": 0.782 | |
| }, | |
| "14": { | |
| "recovery_pct": -10.01, | |
| "logp_transplant_mean": -13.9817, | |
| "logp_transplant_std": 0.7615 | |
| }, | |
| "15": { | |
| "recovery_pct": -3.46, | |
| "logp_transplant_mean": -13.6305, | |
| "logp_transplant_std": 0.5568 | |
| }, | |
| "16": { | |
| "recovery_pct": -2.56, | |
| "logp_transplant_mean": -13.5825, | |
| "logp_transplant_std": 0.3059 | |
| }, | |
| "17": { | |
| "recovery_pct": 7.37, | |
| "logp_transplant_mean": -13.0499, | |
| "logp_transplant_std": 0.231 | |
| }, | |
| "18": { | |
| "recovery_pct": 13.75, | |
| "logp_transplant_mean": -12.7073, | |
| "logp_transplant_std": 0.2173 | |
| }, | |
| "19": { | |
| "recovery_pct": 18.04, | |
| "logp_transplant_mean": -12.4773, | |
| "logp_transplant_std": 0.6731 | |
| }, | |
| "20": { | |
| "recovery_pct": 24.66, | |
| "logp_transplant_mean": -12.1223, | |
| "logp_transplant_std": 0.4863 | |
| }, | |
| "21": { | |
| "recovery_pct": 23.65, | |
| "logp_transplant_mean": -12.1762, | |
| "logp_transplant_std": 0.5121 | |
| }, | |
| "22": { | |
| "recovery_pct": 36.9, | |
| "logp_transplant_mean": -11.4657, | |
| "logp_transplant_std": 0.1153 | |
| }, | |
| "23": { | |
| "recovery_pct": 34.61, | |
| "logp_transplant_mean": -11.5886, | |
| "logp_transplant_std": 0.0028 | |
| }, | |
| "24": { | |
| "recovery_pct": 43.64, | |
| "logp_transplant_mean": -11.104, | |
| "logp_transplant_std": 0.4192 | |
| }, | |
| "25": { | |
| "recovery_pct": 60.76, | |
| "logp_transplant_mean": -10.1854, | |
| "logp_transplant_std": 0.2813 | |
| }, | |
| "26": { | |
| "recovery_pct": 65.54, | |
| "logp_transplant_mean": -9.9294, | |
| "logp_transplant_std": 0.8151 | |
| }, | |
| "27": { | |
| "recovery_pct": 70.47, | |
| "logp_transplant_mean": -9.6648, | |
| "logp_transplant_std": 1.0024 | |
| }, | |
| "28": { | |
| "recovery_pct": 73.63, | |
| "logp_transplant_mean": -9.4952, | |
| "logp_transplant_std": 1.2598 | |
| }, | |
| "29": { | |
| "recovery_pct": 75.04, | |
| "logp_transplant_mean": -9.4197, | |
| "logp_transplant_std": 1.3715 | |
| }, | |
| "30": { | |
| "recovery_pct": 80.81, | |
| "logp_transplant_mean": -9.1098, | |
| "logp_transplant_std": 1.5623 | |
| }, | |
| "31": { | |
| "recovery_pct": 99.03, | |
| "logp_transplant_mean": -8.1328, | |
| "logp_transplant_std": 2.5247 | |
| } | |
| }, | |
| "L_crit_90": 31, | |
| "L_crit_99": 31, | |
| "alpha_90": 0.9688, | |
| "alpha_99": 0.9688, | |
| "n_layers": 32, | |
| "d_model": 2560, | |
| "seed": 42, | |
| "model": "BlinkDL/rwkv-4-world-3b", | |
| "runtime_seconds": 3226.7 | |
| } |