{ "base_model_name_or_path": null, "quantizer_ckpt_path": null, "llm_hidden_size": 2560, "mixture_mode": "mot", "embedding_dim": 256, "image_size": 448, "num_image_tokens": 256, "max_num_patches": 12, "image_token": "", "model": { "internvl_path": null, "llm_hidden_size": 2560, "mixture_mode": "mot", "embedding_dim": 256, "quantizer": { "ckpt_path": null, "vq_type": "multi_vq", "type": "MLP", "input_feature_dim": 4096, "embedding_dim": 256, "llm_hidden_size": 2560, "num_embeddings": 2048, "num_codebooks": 8 }, "head": { "num_codebooks": 8, "num_layers": 3, "hidden_size": 2560, "num_embeddings": 2048, "num_heads": 32, "mlp_ratio": 4.0 } }, "quantizer": { "ckpt_path": null, "vq_type": "multi_vq", "type": "MLP", "input_feature_dim": 4096, "embedding_dim": 256, "llm_hidden_size": 2560, "num_embeddings": 2048, "num_codebooks": 8 }, "head": { "num_codebooks": 8, "num_layers": 3, "hidden_size": 2560, "num_embeddings": 2048, "num_heads": 32, "mlp_ratio": 4.0 }, "legacy_checkpoint_path": null, "legacy_state_key": "module" }