{
  "architectures": [
    "LlamaForCausalLM"
  ],
  "bos_token_id": 128000,
  "eos_token_id": 128001,
  "head_dim": 128,
  "hidden_size": 3072,
  "initializer_range": 0.02,
  "intermediate_size": 8192,
  "max_position_embeddings": 131072,
  "model_type": "llama",
  "num_attention_heads": 24,
  "num_hidden_layers": 28,
  "num_key_value_heads": 8,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_theta": 500000.0,
  "tie_word_embeddings": true,
  "torch_dtype": "bfloat16",
  "transformers_version": "4.45.0.dev0",
  "vocab_size": 128256,
  "tokenizer": "pretrained_fast"
}
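A minimal sketch of how these fields map onto the model's attention geometry, assuming a transformers version at or above the 4.45 series recorded in the config (which accepts an explicit head_dim). It builds the config in memory rather than reading config.json from disk; the field values are copied from the file above, and the assertions only restate arithmetic implied by those values.

from transformers import LlamaConfig

# Instantiate the architecture description from the fields shown above
# (assumed sketch, not the upstream loading path).
cfg = LlamaConfig(
    hidden_size=3072,
    intermediate_size=8192,
    num_hidden_layers=28,
    num_attention_heads=24,
    num_key_value_heads=8,
    head_dim=128,
    max_position_embeddings=131072,
    rope_theta=500000.0,
    rms_norm_eps=1e-05,
    vocab_size=128256,
    bos_token_id=128000,
    eos_token_id=128001,
    tie_word_embeddings=True,
)

# Per-head width: 3072 hidden units / 24 query heads = 128, matching "head_dim".
assert cfg.hidden_size // cfg.num_attention_heads == cfg.head_dim

# Grouped-query attention: 24 query heads share 8 key/value heads,
# i.e. 3 query heads per KV head.
assert cfg.num_attention_heads // cfg.num_key_value_heads == 3

print(cfg.model_type, cfg.num_hidden_layers, cfg.max_position_embeddings)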