mistral_instruct_7b_en / config.json
Divyasreepat's picture
Upload folder using huggingface_hub
0046286 verified
raw
history blame contribute delete
645 Bytes
{
"module": "keras_nlp.models.mistral.mistral_backbone",
"class_name": "MistralBackbone",
"config": {
"name": "mistral_backbone_1",
"trainable": true,
"vocabulary_size": 32000,
"num_layers": 32,
"num_query_heads": 32,
"hidden_dim": 4096,
"intermediate_dim": 14336,
"rope_max_wavelength": 10000.0,
"rope_scaling_factor": 1.0,
"num_key_value_heads": 8,
"sliding_window": 4096,
"layer_norm_epsilon": 1e-05,
"dropout": 0
},
"registered_name": "keras_nlp>MistralBackbone",
"assets": [],
"weights": "model.weights.h5"
}