cross-model-lora-prediction-3b / train_results_round3.json

Round 3 3B domain expansion results

4838960 verified about 1 month ago

7.19 kB

	[
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mawps",
	"ok": true,
	"gpu": 7
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "math_counting_easy",
	"ok": true,
	"gpu": 7
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mbpp_sanitized",
	"ok": true,
	"gpu": 7
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "arc_easy",
	"ok": true,
	"gpu": 7
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mmlu_high_school_biology",
	"ok": true,
	"gpu": 7
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "math_algebra_medium",
	"ok": true,
	"gpu": 7
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mmlu_college_chemistry",
	"ok": true,
	"gpu": 7
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "gsm8k",
	"ok": true,
	"gpu": 1
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "multiarith",
	"ok": true,
	"gpu": 1
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mbpp",
	"ok": true,
	"gpu": 1
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "conala_curated",
	"ok": true,
	"gpu": 1
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "openbookqa",
	"ok": true,
	"gpu": 1
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mmlu_high_school_physics",
	"ok": true,
	"gpu": 1
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "humaneval_plus",
	"ok": true,
	"gpu": 1
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mawps",
	"ok": true,
	"gpu": 6
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "math_counting_easy",
	"ok": true,
	"gpu": 6
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mbpp_sanitized",
	"ok": true,
	"gpu": 6
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "arc_easy",
	"ok": true,
	"gpu": 6
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mmlu_high_school_biology",
	"ok": true,
	"gpu": 6
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "math_algebra_medium",
	"ok": true,
	"gpu": 6
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mmlu_college_chemistry",
	"ok": true,
	"gpu": 6
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "gsm8k",
	"ok": true,
	"gpu": 0
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "multiarith",
	"ok": true,
	"gpu": 0
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mbpp",
	"ok": true,
	"gpu": 0
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "conala_curated",
	"ok": true,
	"gpu": 0
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "openbookqa",
	"ok": true,
	"gpu": 0
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mmlu_high_school_physics",
	"ok": true,
	"gpu": 0
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "humaneval_plus",
	"ok": true,
	"gpu": 0
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "asdiv",
	"ok": true,
	"gpu": 5
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "math_algebra_easy",
	"ok": true,
	"gpu": 5
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "codealpaca_mini",
	"ok": true,
	"gpu": 5
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "sciq",
	"ok": true,
	"gpu": 5
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mmlu_elementary_math",
	"ok": true,
	"gpu": 5
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "gsm_hard",
	"ok": true,
	"gpu": 5
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "arc_challenge",
	"ok": true,
	"gpu": 5
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "asdiv",
	"ok": true,
	"gpu": 4
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "math_algebra_easy",
	"ok": true,
	"gpu": 4
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "codealpaca_mini",
	"ok": true,
	"gpu": 4
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "sciq",
	"ok": true,
	"gpu": 4
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mmlu_elementary_math",
	"ok": true,
	"gpu": 4
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "gsm_hard",
	"ok": true,
	"gpu": 4
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "arc_challenge",
	"ok": true,
	"gpu": 4
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "svamp",
	"ok": true,
	"gpu": 3
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "aqua_rat",
	"ok": true,
	"gpu": 3
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "humaneval",
	"ok": true,
	"gpu": 3
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "livecodebench_easy",
	"ok": true,
	"gpu": 3
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "medmcqa_easy",
	"ok": true,
	"gpu": 3
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "pubmedqa_pqal",
	"ok": true,
	"gpu": 3
	},
	{
	"side": "Y",
	"model": "meta-llama/Llama-3.2-3B-Instruct",
	"task": "mbpp_plus",
	"ok": true,
	"gpu": 3
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "svamp",
	"ok": true,
	"gpu": 2
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "aqua_rat",
	"ok": true,
	"gpu": 2
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "humaneval",
	"ok": true,
	"gpu": 2
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "livecodebench_easy",
	"ok": true,
	"gpu": 2
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "medmcqa_easy",
	"ok": true,
	"gpu": 2
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "pubmedqa_pqal",
	"ok": true,
	"gpu": 2
	},
	{
	"side": "X",
	"model": "Qwen/Qwen2.5-3B-Instruct",
	"task": "mbpp_plus",
	"ok": true,
	"gpu": 2
	}
	]