{ "arch_id": "gemma4-assistant-mtp", "artifacts": { "assistant_dtype": null, "assistant_format": "q6-g64-affine", "assistant_model": "/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-assistant-google-q6-g64-mlx", "assistant_quantization": { "bits": 6, "group_size": 64, "mode": "affine" }, "disk_ok": true, "min_free_gib": 220.0, "observed_free_gib": 704.1539611816406, "target_model": "/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-google-flat4-g64-mlx", "target_quantization": { "bits": 4, "format": "mlx-flat4-g64", "group_size": 64, "mode": "affine" } }, "backend": "gemma4_assistant", "benchmark": { "draft_block_sizes": [ 6 ], "draft_sampler": { "exactness_note": "Assistant q may differ from target p; MTPLX remains exact because acceptance uses p/q and rejection samples the residual distribution.", "inherits_target_sampler": true, "temperature": null, "top_k": null, "top_p": null }, "max_mode": true, "max_tokens": 1000, "profile": "sustained", "prompt_suite": "mtplx/benchmarks/prompts/flappy.jsonl", "reasoning": "off", "sampler_source": { "do_sample": true, "local_reference": "/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-google-flat4-g64-mlx/generation_config.json", "name": "official Gemma 4 generation_config.json", "temperature": 1.0, "top_k": 64, "top_p": 0.95 }, "seed": 0, "temperature": 1.0, "top_k": 64, "top_p": 0.95 }, "blockers": [ "best speedup 1.923x is below 2.000x", "median confirmation speedup 1.923x is below 2.000x" ], "can_run_now": true, "gates": { "generated_tokens": 1000, "longer_lengths_blocked_until_160_passes": true, "median_of_3_min_speedup_vs_ar": 2.0, "min_speedup_vs_ar": 2.0, "mtp_peak_memory_lte_ar_multiplier": 1.18, "mtp_peak_memory_lte_ar_plus_gib": 6 }, "official_sources": { "assistant": "google/gemma-4-31B-it-assistant", "assistant_revision": "cffbbd2cea41ea56a0fa5b0487e0d445121fd204", "target": "google/gemma-4-31B-it", "target_revision": "145dc2508c480a64b47242f160d286cff94a2343" }, "pair": { "assistant_exists": true, "assistant_inspection": { "architecture": "Gemma4AssistantForCausalLM", "architecture_recognized": true, "backbone_hidden_size": 5376, "compatibility": { "arch_id": "gemma4-assistant-mtp", "can_run": false, "exit_code": 3, "message": "Official-style Gemma 4 31B assistant artifact recognized. This is an assistant-backed MTP pair, not a standalone target; MTPLX scaffold is present but QA and the 160-token speed/memory gate are still pending.", "mtp_supported": "recognized", "recognized": true, "recommended_backend": "gemma4_assistant", "recommended_profile": "performance-cold", "runtime_compatibility": "assistant-pair-qa-pending", "runtime_contract": null, "runtime_contract_error": null, "runtime_contract_path": null, "support_level": "architecture-scaffolded-qa-pending", "support_notes": "Assistant-backed scaffold for the official dense Gemma 4 31B pair. It remains QA-pending and is not a public runnable backend until 160-token exactness, speed, and memory gates pass.", "supported": false, "tier": "architecture-compatible-but-unverified", "unsafe_force_required": false, "unverified_model": true }, "config_exists": true, "hidden_size": 1024, "layer_types": [ "sliding_attention", "sliding_attention", "sliding_attention", "full_attention" ], "model_dir": "/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-assistant-google-q6-g64-mlx", "model_files": [ "model.safetensors" ], "model_type": "gemma4_assistant", "mtp": { "exists": false, "expected_tensor_count": 15, "extra_keys": [], "metadata_only": true, "missing_expected_keys": [], "mtp_file": "model.safetensors.index.json::embedded", "passes_tensor_gate": false, "sidecar_format": "bf16", "tensor_count": 0, "tensors": [] }, "mtp_arch": "gemma4-assistant-mtp", "mtp_num_hidden_layers": 0, "mtp_pattern": null, "mtp_supported": "recognized", "num_hidden_layers": 4, "num_kv_shared_layers": 4, "passes_primary_gate": false, "quantization": { "bits": 6, "group_size": 64, "mode": "affine" }, "recommended_backend": "gemma4_assistant", "recommended_profile": "performance-cold", "runtime_compatibility": "assistant-pair-qa-pending", "runtime_contract_path": null, "sidecars": { "preprocessor_config.json": false, "processor_config.json": false, "video_preprocessor_config.json": false }, "source": "local", "support_level": "architecture-scaffolded-qa-pending", "support_notes": "Assistant-backed scaffold for the official dense Gemma 4 31B pair. It remains QA-pending and is not a public runnable backend until 160-token exactness, speed, and memory gates pass.", "unverified_model": true, "use_ordered_embeddings": false, "vocab_size": 262144 }, "assistant_model": "/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-assistant-google-q6-g64-mlx", "pair_error": null, "pair_valid": true, "target_exists": true, "target_inspection": { "architecture": "Gemma4ForConditionalGeneration", "architecture_recognized": false, "backbone_hidden_size": null, "compatibility": { "arch_id": null, "can_run": false, "exit_code": 2, "message": "Model has no MTP head. MTPLX requires an MTP-equipped model.", "mtp_supported": "no", "recognized": false, "recommended_backend": null, "recommended_profile": null, "runtime_compatibility": "unsupported", "runtime_contract": null, "runtime_contract_error": null, "runtime_contract_path": null, "support_level": "unsupported", "support_notes": null, "supported": false, "tier": "no-MTP", "unsafe_force_required": false, "unverified_model": false }, "config_exists": true, "hidden_size": 5376, "layer_types": [ "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "sliding_attention", "full_attention" ], "model_dir": "/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-google-flat4-g64-mlx", "model_files": [ "model-00001-of-00004.safetensors", "model-00002-of-00004.safetensors", "model-00003-of-00004.safetensors", "model-00004-of-00004.safetensors" ], "model_type": "gemma4_text", "mtp": { "exists": false, "expected_tensor_count": 15, "extra_keys": [], "metadata_only": true, "missing_expected_keys": [], "mtp_file": "model.safetensors.index.json::embedded", "passes_tensor_gate": false, "sidecar_format": "bf16", "tensor_count": 0, "tensors": [] }, "mtp_arch": null, "mtp_num_hidden_layers": 0, "mtp_pattern": null, "mtp_supported": "no", "num_hidden_layers": 60, "num_kv_shared_layers": 0, "passes_primary_gate": false, "quantization": { "bits": 4, "group_size": 64, "mode": "affine" }, "recommended_backend": null, "recommended_profile": null, "runtime_compatibility": "unsupported", "runtime_contract_path": null, "sidecars": { "preprocessor_config.json": false, "processor_config.json": false, "video_preprocessor_config.json": false }, "source": "local", "support_level": "unsupported", "support_notes": null, "unverified_model": false, "use_ordered_embeddings": null, "vocab_size": 262144 }, "target_model": "/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-google-flat4-g64-mlx" }, "planned_commands": { "assistant_bf16_snapshot": "uv run python -c \"from huggingface_hub import snapshot_download; snapshot_download(repo_id='google/gemma-4-31B-it-assistant', revision='cffbbd2cea41ea56a0fa5b0487e0d445121fd204', repo_type='model', local_dir='/Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-assistant-google-q6-g64-mlx')\"", "gate": "mtplx bench gemma-mtp --target-model /Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-google-flat4-g64-mlx --assistant-model /Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-assistant-google-q6-g64-mlx --profile sustained --max --prompt-suite mtplx/benchmarks/prompts/flappy.jsonl --max-tokens 1000 --temperature 1.0 --top-p 0.95 --top-k 64 --seed 0 --reasoning off --draft-block-sizes 6 --json --output outputs/gemma4/flappy1000-q6assistant-pure-confirm2-block6.json", "target_flat4_g64": "uv run python -m mlx_lm.convert --hf-path /Users/youssof/Documents/MTPLX/models/.sources/gemma-4-31B-it-145dc2508c48 --mlx-path /Users/youssof/Documents/MTPLX/models/gemma-4-31B-it-google-flat4-g64-mlx --quantize --q-bits 4 --q-group-size 64 --q-mode affine", "target_revision_download": "uv run python -c \"from huggingface_hub import snapshot_download; snapshot_download(repo_id='google/gemma-4-31B-it', revision='145dc2508c480a64b47242f160d286cff94a2343', repo_type='model', local_dir='/Users/youssof/Documents/MTPLX/models/.sources/gemma-4-31B-it-145dc2508c48')\"" }, "qa_pending": true, "results": { "ar": { "active_memory_gib": 16.96542397607118, "cache_memory_gib": 1.9759961115196347, "decode_s": 43.638336165997316, "generated_tokens": 1000, "mode": "ar", "peak_memory_gib": 17.040895924903452, "prefill_s": 0.7599931250006193, "tok_s": 22.915630792981354, "token_preview": [ 9996, 625, 24731, 236761, 9996, 625, 24731, 236761, 9996, 625, 24731, 236761, 9996, 625, 24731, 236761 ] }, "ar_confirmation": [ { "active_memory_gib": 16.96542397607118, "cache_memory_gib": 1.9759961115196347, "decode_s": 43.638336165997316, "generated_tokens": 1000, "mode": "ar", "peak_memory_gib": 17.040895924903452, "prefill_s": 0.7599931250006193, "tok_s": 22.915630792981354, "token_preview": [ 9996, 625, 24731, 236761, 9996, 625, 24731, 236761, 9996, 625, 24731, 236761, 9996, 625, 24731, 236761 ] } ], "best_block_confirmation": [ { "acceptance": 0.9810874704491725, "accepted_drafts": 830, "active_memory_gib": 17.410899550653994, "block_size": 6, "cache_memory_gib": 67.3336522737518, "decode_s": 22.690279750007903, "draft_sampler": { "temperature": 1.0, "top_k": 64, "top_p": 0.95 }, "drafted_tokens": 846, "generated_tokens": 1000, "mode": "mtp", "peak_memory_gib": 17.566339950077236, "prefill_s": 0.25343483399774414, "row_distribution_evals": 0, "speedup_vs_ar": 1.9232171946219445, "target_distribution_modes": { "batched_logits": 170 }, "target_sampler": { "temperature": 1.0, "top_k": 64, "top_p": 0.95 }, "telemetry": { "ar_dense_fallback_calls": 0, "decode_dense_fallback_calls": 0, "dense_fallback_calls_by_phase": { "ar_decode": 0, "decode_verify": 0, "postcommit": 0, "prefill": 0, "unknown": 0 }, "events": [], "paged_active_array_calls_by_phase": { "ar_decode": 0, "decode_verify": 0, "postcommit": 0, "prefill": 0, "unknown": 0 }, "paged_attention_bailouts_by_phase_reason": { "ar_decode": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "decode_verify": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "postcommit": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "prefill": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "unknown": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 } }, "paged_attention_large_q_path": { "dense_forbidden": 0, "large_q_split_sdpa_fallback": 0, "partitioned_paged": 0, "tail_paged": 0, "unknown": 0 }, "postcommit_dense_fallback_calls": 0, "prefill_dense_fallback_calls": 0, "trace_events": false }, "timing_s": { "accept": 0.014734539974597283, "draft": 1.5304279569390928, "rollback": 0.00014716008445248008, "target_distribution": 20.938332714038552, "target_hidden": 0.0, "verify": 0.19443316804245114 }, "tok_s": 44.071735166669846, "token_preview": [ 9996, 625, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759 ], "verify_calls": 170 } ], "best_block_size": 6, "best_speedup": 1.9232171946219445, "blockers": [ "best speedup 1.923x is below 2.000x", "median confirmation speedup 1.923x is below 2.000x" ], "draft_sampler": { "exactness_note": "Assistant q may differ from target p; MTPLX remains exact because acceptance uses p/q and rejection samples the residual distribution.", "inherits_target_sampler": true, "temperature": null, "top_k": null, "top_p": null }, "fan_restore": { "after": { "actual_max_rpm": 6341, "actual_min_rpm": 5980, "capacity_max_rpm": 7826, "capacity_min_rpm": 7826, "fans": [ { "actual_rpm": 5980, "max_capacity_rpm": 7826, "mode": "auto", "raw": { "actual_rpm": 5980, "index": 0, "max_rpm": 7826, "min_rpm": 2317, "mode": "auto", "target_rpm": 5490 }, "rpm": 5980, "target_rpm": 5490 }, { "actual_rpm": 6341, "max_capacity_rpm": 7826, "mode": "auto", "raw": { "actual_rpm": 6341, "index": 1, "max_rpm": 7826, "min_rpm": 2317, "mode": "auto", "target_rpm": 5929 }, "rpm": 6341, "target_rpm": 5929 } ], "max_rpm": 6341, "min_rpm": 5980, "ok": true, "raw": { "attempts": [ { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "status" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "{\n \"fans\" : [\n {\n \"actual_rpm\" : 5980,\n \"index\" : 0,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 5490\n },\n {\n \"actual_rpm\" : 6341,\n \"index\" : 1,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 5929\n }\n ],\n \"temperatures\" : {\n \"TAOL\" : 34.2,\n \"TB0T\" : 32.6,\n \"TCDX\" : 77.2,\n \"TCHP\" : 64.2,\n \"TCMb\" : 92.3,\n \"TG0B\" : 32.5,\n \"TG0H\" : 32,\n \"TG0V\" : 32.5,\n \"TH0x\" : 41.2,\n \"TMVR\" : 69.4,\n \"TPDX\" : 70.4,\n \"TRDX\" : 83.8,\n \"TS0P\" : 76.1,\n \"Tg0j\" : 80.6,\n \"Tm08\" : 76.7,\n \"Tp04\" : 77.7,\n \"Tp08\" : 77.3,\n \"Tp0C\" : 78.1,\n \"Tp0G\" : 78.5,\n \"Tp0X\" : 78.3\n }\n}" } ], "detection": { "available": true, "clock_anchor_enabled": false, "clock_anchor_policy": "explicit experimental only; never used for product claims", "instructions": "Install ThermalForge and ensure the thermalforge CLI is on PATH.", "selected": { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } }, "tools": [ { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } } ] }, "ok": true, "status": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "status" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "{\n \"fans\" : [\n {\n \"actual_rpm\" : 5980,\n \"index\" : 0,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 5490\n },\n {\n \"actual_rpm\" : 6341,\n \"index\" : 1,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 5929\n }\n ],\n \"temperatures\" : {\n \"TAOL\" : 34.2,\n \"TB0T\" : 32.6,\n \"TCDX\" : 77.2,\n \"TCHP\" : 64.2,\n \"TCMb\" : 92.3,\n \"TG0B\" : 32.5,\n \"TG0H\" : 32,\n \"TG0V\" : 32.5,\n \"TH0x\" : 41.2,\n \"TMVR\" : 69.4,\n \"TPDX\" : 70.4,\n \"TRDX\" : 83.8,\n \"TS0P\" : 76.1,\n \"Tg0j\" : 80.6,\n \"Tm08\" : 76.7,\n \"Tp04\" : 77.7,\n \"Tp08\" : 77.3,\n \"Tp0C\" : 78.1,\n \"Tp0G\" : 78.5,\n \"Tp0X\" : 78.3\n }\n}" } }, "target_max_rpm": 5929, "target_min_rpm": 5490 }, "message": "fan profile restored", "ok": true, "profile": "silent", "set_result": { "attempts": [ { "command": [ "sudo", "-n", "/Users/youssof/.mtplx/bin/thermalforge", "auto" ], "ok": true, "returncode": 0, "stderr": "No matching processes were found", "stdout": "Fans reset to Apple defaults" } ], "command": [ "sudo", "-n", "/Users/youssof/.mtplx/bin/thermalforge", "auto" ], "detection": { "available": true, "clock_anchor_enabled": false, "clock_anchor_policy": "explicit experimental only; never used for product claims", "instructions": "Install ThermalForge and ensure the thermalforge CLI is on PATH.", "selected": { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } }, "tools": [ { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } } ] }, "dry_run": false, "ok": true, "profile": "silent" } }, "fanmax": { "after": { "actual_max_rpm": 7385, "actual_min_rpm": 7332, "capacity_max_rpm": 7826, "capacity_min_rpm": 7826, "fans": [ { "actual_rpm": 7332, "max_capacity_rpm": 7826, "mode": "manual", "raw": { "actual_rpm": 7332, "index": 0, "max_rpm": 7826, "min_rpm": 2317, "mode": "manual", "target_rpm": 7826 }, "rpm": 7332, "target_rpm": 7826 }, { "actual_rpm": 7385, "max_capacity_rpm": 7826, "mode": "manual", "raw": { "actual_rpm": 7385, "index": 1, "max_rpm": 7826, "min_rpm": 2317, "mode": "manual", "target_rpm": 7826 }, "rpm": 7385, "target_rpm": 7826 } ], "max_rpm": 7385, "min_rpm": 7332, "ok": true, "raw": { "attempts": [ { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "status" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "{\n \"fans\" : [\n {\n \"actual_rpm\" : 7332,\n \"index\" : 0,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"manual\",\n \"target_rpm\" : 7826\n },\n {\n \"actual_rpm\" : 7385,\n \"index\" : 1,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"manual\",\n \"target_rpm\" : 7826\n }\n ],\n \"temperatures\" : {\n \"TAOL\" : 34.1,\n \"TB0T\" : 32.6,\n \"TCDX\" : 82.5,\n \"TCHP\" : 60.5,\n \"TCMb\" : 86.9,\n \"TG0B\" : 32.6,\n \"TG0H\" : 32,\n \"TG0V\" : 32.6,\n \"TH0x\" : 40,\n \"TMVR\" : 59.5,\n \"TPDX\" : 65.2,\n \"TRDX\" : 67.7,\n \"TS0P\" : 66.7,\n \"Tg0j\" : 67.2,\n \"Tm08\" : 67.9,\n \"Tp04\" : 75.1,\n \"Tp08\" : 74.2,\n \"Tp0C\" : 77.5,\n \"Tp0G\" : 76.2,\n \"Tp0X\" : 75.2\n }\n}" } ], "detection": { "available": true, "clock_anchor_enabled": false, "clock_anchor_policy": "explicit experimental only; never used for product claims", "instructions": "Install ThermalForge and ensure the thermalforge CLI is on PATH.", "selected": { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } }, "tools": [ { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } } ] }, "ok": true, "status": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "status" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "{\n \"fans\" : [\n {\n \"actual_rpm\" : 7332,\n \"index\" : 0,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"manual\",\n \"target_rpm\" : 7826\n },\n {\n \"actual_rpm\" : 7385,\n \"index\" : 1,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"manual\",\n \"target_rpm\" : 7826\n }\n ],\n \"temperatures\" : {\n \"TAOL\" : 34.1,\n \"TB0T\" : 32.6,\n \"TCDX\" : 82.5,\n \"TCHP\" : 60.5,\n \"TCMb\" : 86.9,\n \"TG0B\" : 32.6,\n \"TG0H\" : 32,\n \"TG0V\" : 32.6,\n \"TH0x\" : 40,\n \"TMVR\" : 59.5,\n \"TPDX\" : 65.2,\n \"TRDX\" : 67.7,\n \"TS0P\" : 66.7,\n \"Tg0j\" : 67.2,\n \"Tm08\" : 67.9,\n \"Tp04\" : 75.1,\n \"Tp08\" : 74.2,\n \"Tp0C\" : 77.5,\n \"Tp0G\" : 76.2,\n \"Tp0X\" : 75.2\n }\n}" } }, "target_max_rpm": 7826, "target_min_rpm": 7826 }, "baseline": { "actual_max_rpm": 5367, "actual_min_rpm": 4968, "capacity_max_rpm": 7826, "capacity_min_rpm": 7826, "fans": [ { "actual_rpm": 4968, "max_capacity_rpm": 7826, "mode": "auto", "raw": { "actual_rpm": 4968, "index": 0, "max_rpm": 7826, "min_rpm": 2317, "mode": "auto", "target_rpm": 4976 }, "rpm": 4968, "target_rpm": 4976 }, { "actual_rpm": 5367, "max_capacity_rpm": 7826, "mode": "auto", "raw": { "actual_rpm": 5367, "index": 1, "max_rpm": 7826, "min_rpm": 2317, "mode": "auto", "target_rpm": 5374 }, "rpm": 5367, "target_rpm": 5374 } ], "max_rpm": 5367, "min_rpm": 4968, "ok": true, "raw": { "attempts": [ { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "status" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "{\n \"fans\" : [\n {\n \"actual_rpm\" : 4968,\n \"index\" : 0,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 4976\n },\n {\n \"actual_rpm\" : 5367,\n \"index\" : 1,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 5374\n }\n ],\n \"temperatures\" : {\n \"TAOL\" : 34.1,\n \"TB0T\" : 32.6,\n \"TCDX\" : 68.2,\n \"TCHP\" : 60.5,\n \"TCMb\" : 75.8,\n \"TG0B\" : 32.6,\n \"TG0H\" : 32,\n \"TG0V\" : 32.6,\n \"TH0x\" : 39.6,\n \"TMVR\" : 59.7,\n \"TPDX\" : 65.7,\n \"TRDX\" : 67.6,\n \"TS0P\" : 67.4,\n \"Tg0j\" : 67.2,\n \"Tm08\" : 68.6,\n \"Tp04\" : 76.5,\n \"Tp08\" : 75.4,\n \"Tp0C\" : 79.5,\n \"Tp0G\" : 77.4,\n \"Tp0X\" : 76.6\n }\n}" } ], "detection": { "available": true, "clock_anchor_enabled": false, "clock_anchor_policy": "explicit experimental only; never used for product claims", "instructions": "Install ThermalForge and ensure the thermalforge CLI is on PATH.", "selected": { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } }, "tools": [ { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } } ] }, "ok": true, "status": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "status" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "{\n \"fans\" : [\n {\n \"actual_rpm\" : 4968,\n \"index\" : 0,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 4976\n },\n {\n \"actual_rpm\" : 5367,\n \"index\" : 1,\n \"max_rpm\" : 7826,\n \"min_rpm\" : 2317,\n \"mode\" : \"auto\",\n \"target_rpm\" : 5374\n }\n ],\n \"temperatures\" : {\n \"TAOL\" : 34.1,\n \"TB0T\" : 32.6,\n \"TCDX\" : 68.2,\n \"TCHP\" : 60.5,\n \"TCMb\" : 75.8,\n \"TG0B\" : 32.6,\n \"TG0H\" : 32,\n \"TG0V\" : 32.6,\n \"TH0x\" : 39.6,\n \"TMVR\" : 59.7,\n \"TPDX\" : 65.7,\n \"TRDX\" : 67.6,\n \"TS0P\" : 67.4,\n \"Tg0j\" : 67.2,\n \"Tm08\" : 68.6,\n \"Tp04\" : 76.5,\n \"Tp08\" : 75.4,\n \"Tp0C\" : 79.5,\n \"Tp0G\" : 77.4,\n \"Tp0X\" : 76.6\n }\n}" } }, "target_max_rpm": 5374, "target_min_rpm": 4976 }, "message": "fans ramped to max (actual 7332-7385 RPM; target 7826 RPM)", "ok": true, "profile": "max", "set_result": { "attempts": [ { "command": [ "sudo", "-n", "/Users/youssof/.mtplx/bin/thermalforge", "max" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "Fan 0: 4968 RPM \u2192 max (7826 RPM)\nFan 1: 5367 RPM \u2192 max (7826 RPM)" } ], "command": [ "sudo", "-n", "/Users/youssof/.mtplx/bin/thermalforge", "max" ], "detection": { "available": true, "clock_anchor_enabled": false, "clock_anchor_policy": "explicit experimental only; never used for product claims", "instructions": "Install ThermalForge and ensure the thermalforge CLI is on PATH.", "selected": { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } }, "tools": [ { "kind": "thermalforge", "path": "/Users/youssof/.mtplx/bin/thermalforge", "version": { "command": [ "/Users/youssof/.mtplx/bin/thermalforge", "--version" ], "ok": true, "returncode": 0, "stderr": "", "stdout": "0.1.0" } } ] }, "dry_run": false, "ok": true, "profile": "max" } }, "max_tokens": 1000, "median_confirmation_speedup": 1.9232171946219445, "memory_gate": { "ar_peak_memory_gib": 17.040895924903452, "lte_ar_plus_6_gib": true, "lte_ar_times_1_18": true, "mtp_peak_memory_gib": 17.566339950077236 }, "mtp_by_block_size": { "6": { "acceptance": 0.9810874704491725, "accepted_drafts": 830, "active_memory_gib": 17.410899550653994, "block_size": 6, "cache_memory_gib": 67.3336522737518, "decode_s": 22.690279750007903, "draft_sampler": { "temperature": 1.0, "top_k": 64, "top_p": 0.95 }, "drafted_tokens": 846, "generated_tokens": 1000, "mode": "mtp", "peak_memory_gib": 17.566339950077236, "prefill_s": 0.25343483399774414, "row_distribution_evals": 0, "speedup_vs_ar": 1.9232171946219445, "target_distribution_modes": { "batched_logits": 170 }, "target_sampler": { "temperature": 1.0, "top_k": 64, "top_p": 0.95 }, "telemetry": { "ar_dense_fallback_calls": 0, "decode_dense_fallback_calls": 0, "dense_fallback_calls_by_phase": { "ar_decode": 0, "decode_verify": 0, "postcommit": 0, "prefill": 0, "unknown": 0 }, "events": [], "paged_active_array_calls_by_phase": { "ar_decode": 0, "decode_verify": 0, "postcommit": 0, "prefill": 0, "unknown": 0 }, "paged_attention_bailouts_by_phase_reason": { "ar_decode": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "decode_verify": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "postcommit": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "prefill": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 }, "unknown": { "batch_not_1": 0, "block_size_mismatch": 0, "blocks_invalid": 0, "dtype_unsupported": 0, "empty_cache": 0, "head_dim_unsupported": 0, "kernel_unavailable": 0, "offset_invalid": 0, "partitioned_invalid_output": 0, "partitioned_unavailable": 0, "q_len_gt_max": 0, "q_len_invalid": 0, "turboquant_unsupported": 0, "unknown": 0, "unsupported_mask": 0 } }, "paged_attention_large_q_path": { "dense_forbidden": 0, "large_q_split_sdpa_fallback": 0, "partitioned_paged": 0, "tail_paged": 0, "unknown": 0 }, "postcommit_dense_fallback_calls": 0, "prefill_dense_fallback_calls": 0, "trace_events": false }, "timing_s": { "accept": 0.014734539974597283, "draft": 1.5304279569390928, "rollback": 0.00014716008445248008, "target_distribution": 20.938332714038552, "target_hidden": 0.0, "verify": 0.19443316804245114 }, "tok_s": 44.071735166669846, "token_preview": [ 9996, 625, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759, 759 ], "verify_calls": 170 } }, "passed": false, "prompt_id": "flappy_html5_canvas_game", "prompt_tokens": 119, "sampler": { "seed": 0, "temperature": 1.0, "top_k": 64, "top_p": 0.95 } }, "status": "failed" }