blackWizard committed on
Commit
ae7a022
1 Parent(s): c469edb

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: keras-nlp
3
+ pipeline_tag: text-generation
4
+ ---
5
+ This is a [`Phi3` model](https://keras.io/api/keras_nlp/models/phi3) that was uploaded using the KerasNLP library. It can be used with the JAX, TensorFlow, and PyTorch backends.
6
+ This model is related to a `CausalLM` task.
7
+
8
+ Model config:
9
+ * **name:** phi3_backbone_1
10
+ * **trainable:** True
11
+ * **vocabulary_size:** 32064
12
+ * **num_layers:** 32
13
+ * **num_query_heads:** 32
14
+ * **hidden_dim:** 3072
15
+ * **intermediate_dim:** 8192
16
+ * **num_key_value_heads:** 32
17
+ * **layer_norm_epsilon:** 1e-05
18
+ * **dropout:** 0.0
19
+ * **max_sequence_length:** 4096
20
+ * **pretraining_sequence_length:** 4096
21
+ * **rope_max_wavelength:** 10000.0
22
+ * **rope_scaling_type:** None
23
+ * **rope_scaling_short_factor:** None
24
+ * **rope_scaling_long_factor:** None
25
+
26
+ This model card has been generated automatically and should be completed by the model author. See [Model Cards documentation](https://huggingface.co/docs/hub/model-cards) for more information.
assets/tokenizer/vocabulary.spm ADDED
Binary file (500 kB). View file
 
config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.phi3.phi3_backbone",
3
+ "class_name": "Phi3Backbone",
4
+ "config": {
5
+ "name": "phi3_backbone_1",
6
+ "trainable": true,
7
+ "vocabulary_size": 32064,
8
+ "num_layers": 32,
9
+ "num_query_heads": 32,
10
+ "hidden_dim": 3072,
11
+ "intermediate_dim": 8192,
12
+ "num_key_value_heads": 32,
13
+ "layer_norm_epsilon": 1e-05,
14
+ "dropout": 0.0,
15
+ "max_sequence_length": 4096,
16
+ "pretraining_sequence_length": 4096,
17
+ "rope_max_wavelength": 10000.0,
18
+ "rope_scaling_type": null,
19
+ "rope_scaling_short_factor": null,
20
+ "rope_scaling_long_factor": null
21
+ },
22
+ "registered_name": "keras_nlp>Phi3Backbone"
23
+ }
metadata.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "keras_version": "3.4.1",
3
+ "keras_nlp_version": "0.14.0",
4
+ "parameter_count": 3821079552,
5
+ "date_saved": "2024-07-26@02:34:09"
6
+ }
model.weights.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2bf084f5e43a263be8bf03751088b2532ebb306bb81ffc36908a598ff00ec7b
3
+ size 15285416504
preprocessor.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.phi3.phi3_causal_lm_preprocessor",
3
+ "class_name": "Phi3CausalLMPreprocessor",
4
+ "config": {
5
+ "name": "phi3_causal_lm_preprocessor",
6
+ "trainable": true,
7
+ "dtype": {
8
+ "module": "keras",
9
+ "class_name": "DTypePolicy",
10
+ "config": {
11
+ "name": "mixed_bfloat16"
12
+ },
13
+ "registered_name": null
14
+ },
15
+ "tokenizer": {
16
+ "module": "keras_nlp.src.models.phi3.phi3_tokenizer",
17
+ "class_name": "Phi3Tokenizer",
18
+ "config": {
19
+ "name": "phi3_tokenizer",
20
+ "trainable": true,
21
+ "dtype": {
22
+ "module": "keras",
23
+ "class_name": "DTypePolicy",
24
+ "config": {
25
+ "name": "int32"
26
+ },
27
+ "registered_name": null
28
+ },
29
+ "proto": null,
30
+ "sequence_length": null
31
+ },
32
+ "registered_name": "keras_nlp>Phi3Tokenizer"
33
+ },
34
+ "sequence_length": 1024,
35
+ "add_start_token": true,
36
+ "add_end_token": false
37
+ },
38
+ "registered_name": "keras_nlp>Phi3CausalLMPreprocessor"
39
+ }
task.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.phi3.phi3_causal_lm",
3
+ "class_name": "Phi3CausalLM",
4
+ "config": {
5
+ "backbone": {
6
+ "module": "keras_nlp.src.models.phi3.phi3_backbone",
7
+ "class_name": "Phi3Backbone",
8
+ "config": {
9
+ "name": "phi3_backbone_1",
10
+ "trainable": true,
11
+ "vocabulary_size": 32064,
12
+ "num_layers": 32,
13
+ "num_query_heads": 32,
14
+ "hidden_dim": 3072,
15
+ "intermediate_dim": 8192,
16
+ "num_key_value_heads": 32,
17
+ "layer_norm_epsilon": 1e-05,
18
+ "dropout": 0.0,
19
+ "max_sequence_length": 4096,
20
+ "pretraining_sequence_length": 4096,
21
+ "rope_max_wavelength": 10000.0,
22
+ "rope_scaling_type": null,
23
+ "rope_scaling_short_factor": null,
24
+ "rope_scaling_long_factor": null
25
+ },
26
+ "registered_name": "keras_nlp>Phi3Backbone"
27
+ },
28
+ "preprocessor": {
29
+ "module": "keras_nlp.src.models.phi3.phi3_causal_lm_preprocessor",
30
+ "class_name": "Phi3CausalLMPreprocessor",
31
+ "config": {
32
+ "name": "phi3_causal_lm_preprocessor",
33
+ "trainable": true,
34
+ "dtype": {
35
+ "module": "keras",
36
+ "class_name": "DTypePolicy",
37
+ "config": {
38
+ "name": "mixed_bfloat16"
39
+ },
40
+ "registered_name": null
41
+ },
42
+ "tokenizer": {
43
+ "module": "keras_nlp.src.models.phi3.phi3_tokenizer",
44
+ "class_name": "Phi3Tokenizer",
45
+ "config": {
46
+ "name": "phi3_tokenizer",
47
+ "trainable": true,
48
+ "dtype": {
49
+ "module": "keras",
50
+ "class_name": "DTypePolicy",
51
+ "config": {
52
+ "name": "int32"
53
+ },
54
+ "registered_name": null
55
+ },
56
+ "proto": null,
57
+ "sequence_length": null
58
+ },
59
+ "registered_name": "keras_nlp>Phi3Tokenizer"
60
+ },
61
+ "sequence_length": 1024,
62
+ "add_start_token": true,
63
+ "add_end_token": false
64
+ },
65
+ "registered_name": "keras_nlp>Phi3CausalLMPreprocessor"
66
+ },
67
+ "name": "phi3_causal_lm"
68
+ },
69
+ "registered_name": "keras_nlp>Phi3CausalLM"
70
+ }
tokenizer.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "module": "keras_nlp.src.models.phi3.phi3_tokenizer",
3
+ "class_name": "Phi3Tokenizer",
4
+ "config": {
5
+ "name": "phi3_tokenizer",
6
+ "trainable": true,
7
+ "dtype": {
8
+ "module": "keras",
9
+ "class_name": "DTypePolicy",
10
+ "config": {
11
+ "name": "int32"
12
+ },
13
+ "registered_name": null
14
+ },
15
+ "proto": null,
16
+ "sequence_length": null
17
+ },
18
+ "registered_name": "keras_nlp>Phi3Tokenizer"
19
+ }