{ "architectures": [ "GPTBERTForCausalLM" ], "auto_map": { "AutoConfig": "configuration_gpt_bert.ModelConfig", "AutoModel": "modeling_gpt_bert.GPTBERT", "AutoModelForCausalLM": "modeling_gpt_bert.GPTBERTForCausalLM", "AutoModelForMaskedLM": "modeling_gpt_bert.GPTBERTForMaskedLM" }, "attention_probs_dropout_prob": 0.1, "hidden_dropout_prob": 0.1, "hidden_size": 768, "intermediate_size": 2560, "max_position_embeddings": 512, "position_bucket_size": 32, "num_attention_heads": 12, "num_hidden_layers": 12, "vocab_size": 16384, "layer_norm_eps": 1.0e-7 }