{
    "module": "keras_nlp.src.models.phi3.phi3_backbone",
    "class_name": "Phi3Backbone",
    "config": {
        "name": "phi3_backbone_1",
        "trainable": true,
        "vocabulary_size": 32064,
        "num_layers": 32,
        "num_query_heads": 32,
        "hidden_dim": 3072,
        "intermediate_dim": 8192,
        "num_key_value_heads": 32,
        "layer_norm_epsilon": 1e-05,
        "dropout": 0.0,
        "max_sequence_length": 4096,
        "pretraining_sequence_length": 4096,
        "rope_max_wavelength": 10000.0,
        "rope_scaling_type": null,
        "rope_scaling_short_factor": null,
        "rope_scaling_long_factor": null
    },
    "registered_name": "keras_nlp>Phi3Backbone"
}