cross-model-lora-prediction-3b / train_results_round3.json
CK0607's picture
Round 3 3B domain expansion results
4838960 verified
raw
history blame
7.19 kB
[
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mawps",
"ok": true,
"gpu": 7
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "math_counting_easy",
"ok": true,
"gpu": 7
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mbpp_sanitized",
"ok": true,
"gpu": 7
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "arc_easy",
"ok": true,
"gpu": 7
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mmlu_high_school_biology",
"ok": true,
"gpu": 7
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "math_algebra_medium",
"ok": true,
"gpu": 7
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mmlu_college_chemistry",
"ok": true,
"gpu": 7
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "gsm8k",
"ok": true,
"gpu": 1
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "multiarith",
"ok": true,
"gpu": 1
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mbpp",
"ok": true,
"gpu": 1
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "conala_curated",
"ok": true,
"gpu": 1
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "openbookqa",
"ok": true,
"gpu": 1
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mmlu_high_school_physics",
"ok": true,
"gpu": 1
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "humaneval_plus",
"ok": true,
"gpu": 1
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mawps",
"ok": true,
"gpu": 6
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "math_counting_easy",
"ok": true,
"gpu": 6
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mbpp_sanitized",
"ok": true,
"gpu": 6
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "arc_easy",
"ok": true,
"gpu": 6
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mmlu_high_school_biology",
"ok": true,
"gpu": 6
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "math_algebra_medium",
"ok": true,
"gpu": 6
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mmlu_college_chemistry",
"ok": true,
"gpu": 6
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "gsm8k",
"ok": true,
"gpu": 0
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "multiarith",
"ok": true,
"gpu": 0
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mbpp",
"ok": true,
"gpu": 0
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "conala_curated",
"ok": true,
"gpu": 0
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "openbookqa",
"ok": true,
"gpu": 0
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mmlu_high_school_physics",
"ok": true,
"gpu": 0
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "humaneval_plus",
"ok": true,
"gpu": 0
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "asdiv",
"ok": true,
"gpu": 5
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "math_algebra_easy",
"ok": true,
"gpu": 5
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "codealpaca_mini",
"ok": true,
"gpu": 5
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "sciq",
"ok": true,
"gpu": 5
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mmlu_elementary_math",
"ok": true,
"gpu": 5
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "gsm_hard",
"ok": true,
"gpu": 5
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "arc_challenge",
"ok": true,
"gpu": 5
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "asdiv",
"ok": true,
"gpu": 4
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "math_algebra_easy",
"ok": true,
"gpu": 4
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "codealpaca_mini",
"ok": true,
"gpu": 4
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "sciq",
"ok": true,
"gpu": 4
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mmlu_elementary_math",
"ok": true,
"gpu": 4
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "gsm_hard",
"ok": true,
"gpu": 4
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "arc_challenge",
"ok": true,
"gpu": 4
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "svamp",
"ok": true,
"gpu": 3
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "aqua_rat",
"ok": true,
"gpu": 3
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "humaneval",
"ok": true,
"gpu": 3
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "livecodebench_easy",
"ok": true,
"gpu": 3
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "medmcqa_easy",
"ok": true,
"gpu": 3
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "pubmedqa_pqal",
"ok": true,
"gpu": 3
},
{
"side": "Y",
"model": "meta-llama/Llama-3.2-3B-Instruct",
"task": "mbpp_plus",
"ok": true,
"gpu": 3
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "svamp",
"ok": true,
"gpu": 2
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "aqua_rat",
"ok": true,
"gpu": 2
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "humaneval",
"ok": true,
"gpu": 2
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "livecodebench_easy",
"ok": true,
"gpu": 2
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "medmcqa_easy",
"ok": true,
"gpu": 2
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "pubmedqa_pqal",
"ok": true,
"gpu": 2
},
{
"side": "X",
"model": "Qwen/Qwen2.5-3B-Instruct",
"task": "mbpp_plus",
"ok": true,
"gpu": 2
}
]