{ "activation": "gelu", "adam_betas": "0.9,0.95", "arch": "perceiver", "args_from": "configs/base.json", "aug_drop": 0.0, "aug_flip": true, "aug_jitter": 0.0, "aug_rotate": true, "batch_size": 64, "behind_emb_dim": 8, "cache_dir": "hf://usm3d/s23dr-2026-sampled_4096_v2:train", "conf_clamp_min": null, "conf_head_wd": 0.1, "conf_mode": "sinkhorn", "conf_weight": 0.1, "cooldown_start": 0, "cooldown_steps": 0, "cosine_decay": false, "cpu": false, "cross_attn_interval": 4, "decoder_input_xattn": false, "decoder_layers": 3, "deterministic": false, "dropout": 0.1, "ema_decay": 0.0, "encoder_layers": 4, "endpoint_warmup": 0, "endpoint_weight": 0.0, "ff": 1024, "git_dirty": true, "git_sha": "465f2c6eb6ce4be5c2e52e8384961930f5f9f20a", "hidden": 256, "kv_heads_cross": 2, "kv_heads_self": 2, "latent_layers": 7, "latent_tokens": 256, "learnable_fourier": false, "length_floor": 0.0, "lr": 3e-05, "num_heads": 4, "out_dir": "/workspace/s23dr_2026_example/repro_e2e_run4", "pre_encoder_layers": 0, "qk_norm": true, "qk_norm_type": "l2", "resume": "/workspace/s23dr_2026_example/repro_e2e_run4/20260329_213417_ef91_6503/checkpoints/step125000.pt", "rms_norm": true, "seed": 353, "segment_conf": true, "segment_param": "midpoint_dir_len", "segments": 64, "seq_len": 4096, "sinkhorn_dustbin": 0.3, "sinkhorn_eps": 0.1, "sinkhorn_eps_schedule": "none", "sinkhorn_eps_start": null, "sinkhorn_iters": 20, "sinkhorn_weight": 1.0, "steps": 135000, "val_cache_dir": "", "varifold_cross_only": false, "varifold_weight": 0.0, "vote_features": true, "warmup": 10000, "weight_decay": 0.01 }