{ "phase_AB_rc": [ { "label": "Mistral-7B (4bit)", "hf_id": "mistralai/Mistral-7B-v0.1", "phase": "A", "n_kv": 8, "d_head": 128, "n_params_M": 7240, "theta": 10000, "T_train": 32768, "R_c": 0.9574147216280355, "error": "load: Illegal header value b'Bearer '" }, { "label": "Qwen2.5-7B (4bit)", "hf_id": "Qwen/Qwen2.5-7B", "phase": "A", "n_kv": 4, "d_head": 128, "n_params_M": 7610, "theta": 1000000, "T_train": 131072, "R_c": 1.1765191580975, "error": "load: Illegal header value b'Bearer '" }, { "label": "OLMo-7B (4bit)", "hf_id": "allenai/OLMo-7B-hf", "phase": "B", "n_kv": 32, "d_head": 128, "n_params_M": 6890, "theta": 10000, "T_train": 2048, "R_c": 0.48704080868743954, "error": "load: Illegal header value b'Bearer '" }, { "label": "Falcon-7B (4bit)", "hf_id": "tiiuae/falcon-7b", "phase": "B", "n_kv": 1, "d_head": 64, "n_params_M": 6920, "theta": 10000, "T_train": 2048, "R_c": 1.4588955689285732, "error": "load: Illegal header value b'Bearer '" }, { "label": "pythia-6.9b (4bit)", "hf_id": "EleutherAI/pythia-6.9b", "phase": "B", "n_kv": 32, "d_head": 128, "n_params_M": 6900, "theta": 10000, "T_train": 2048, "R_c": 0.4867927697741792, "error": "load: Illegal header value b'Bearer '" } ], "phase_C_multifractal": [ { "label": "Llama-3-8B (4bit, Nous mirror)", "hf_id": "NousResearch/Meta-Llama-3-8B", "phase": "C", "error": "load: Illegal header value b'Bearer '" }, { "label": "Mistral-7B (4bit)", "hf_id": "mistralai/Mistral-7B-v0.1", "phase": "C", "error": "load: Illegal header value b'Bearer '" } ], "elapsed_min": 0.029302664597829185, "n_completed_rc": 0, "n_completed_mf": 0 }