s20-attention-kernel / benchmark_model_results.json
callensxavier's picture
Upload benchmark_model_results.json with huggingface_hub
73360ee verified
Raw
History Blame Contribute Delete
1.52 kB
{
"kernel_benchmark": [
{
"model_id": "openai-community/gpt2",
"model_name": "GPT-2 (124M)",
"n_params_M": 124.4,
"seq_len": 56,
"device": "cpu",
"baseline_ms": 39.176,
"s20_injected_ms": 41.556,
"s20_overhead": 1.061,
"avg_perplexity": 175.7,
"perplexity_per_prompt": [
89.63,
202.44,
235.02
]
},
{
"model_id": "distilbert/distilgpt2",
"model_name": "DistilGPT-2 (82M)",
"n_params_M": 81.9,
"seq_len": 56,
"device": "cpu",
"baseline_ms": 21.623,
"s20_injected_ms": 21.331,
"s20_overhead": 0.987,
"avg_perplexity": 302.02,
"perplexity_per_prompt": [
223.34,
339.5,
343.22
]
},
{
"model_id": "facebook/opt-125m",
"model_name": "OPT-125M",
"n_params_M": 125.2,
"seq_len": 57,
"device": "cpu",
"baseline_ms": 29.008,
"s20_injected_ms": 29.36,
"s20_overhead": 1.012,
"avg_perplexity": 199.73,
"perplexity_per_prompt": [
148.67,
265.95,
184.57
]
},
{
"model_id": "bigscience/bloom-560m",
"model_name": "BLOOM-560M",
"n_params_M": 559.2,
"seq_len": 48,
"device": "cpu",
"baseline_ms": 122.361,
"s20_injected_ms": 117.968,
"s20_overhead": 0.964,
"avg_perplexity": 138.99,
"perplexity_per_prompt": [
177.74,
209.88,
29.35
]
}
]
}