{
  "architecture_type": "vit",
  "num_labels": 19294,
  "num_channels": 3,
  "image_size": 448,
  "patch_size": 16,
  "hidden_size": 1024,
  "num_hidden_layers": 18,
  "num_attention_heads": 16,
  "intermediate_size": 4096,
  "hidden_dropout_prob": 0.1,
  "pos_dropout": 0.0,
  "attention_dropout": 0.05,
  "drop_path_rate": 0.2,
  "initializer_range": 0.02,
  "layer_norm_eps": 1e-06,
  "use_fp32_layernorm": false,
  "attention_bias": true,
  "num_groups": 20,
  "tags_per_group": 10000,
  "training_epoch": 7,
  "training_step": 85517,
  "vocab_format_version": 1,
  "vocab_sha256": "ad3c33d3b760bd0d15bd4631f441d47fcb136c7a6e53473b5588d760907b0316",
  "state_dict_keys_format": "plain (no _orig_mod./module. prefixes)",
  "state_dict_dtype": "bfloat16",
  "checkpoint_source": "experiments/run1_vit/checkpoints/last.pt (epoch 7, step 85517)"
}