{ "architectures": [ "HTRConvTextModel" ], "blank_token_id": 0, "conv_kernel_size": 7, "depth": 8, "down_after": 3, "drop_path": 0.1, "dropout": 0.1, "ds_kernel": 3, "dtype": "float32", "embed_dim": 512, "image_height": 64, "image_max_width": 3072, "max_seq_len": 128, "mlp_ratio": 4.0, "model_type": "htr-convtext", "num_heads": 8, "patch_size": [ 4, 64 ], "transformers_version": "5.3.0", "up_after": 7, "upsample_mode": "nearest", "use_masking_default": false, "vocab_size": 151, "width_stride": 32, "auto_map": { "AutoConfig": "configuration_htr.HTRConfig", "AutoModel": "modeling_htr.HTRConvTextModel", "AutoProcessor": "processing_htr.HTRProcessor" } }