{ "architectures": [ "GPTBERTForCausalLM" ], "auto_map": { "AutoConfig": "configuration_gpt_bert.ModelConfig", "AutoModel": "modeling_gpt_bert.GPTBERT", "AutoModelForCausalLM": "modeling_gpt_bert.GPTBERTForCausalLM", "AutoModelForMaskedLM": "modeling_gpt_bert.GPTBERTForMaskedLM" }, "attention_probs_dropout_prob": 0.1, "hidden_dropout_prob": 0.1, "hidden_size": 768, "intermediate_size": 2560, "max_position_embeddings": 512, "position_bucket_size": 32, "num_attention_heads": 12, "num_hidden_layers": 12, "vocab_size": 16384, "layer_norm_eps": 1e-05, "return_dict": true, "num_layers": 12 }