fozziethebeat committed on
Commit
ba73a6a
1 Parent(s): 8364ffb

Upload LlavaMistralForCausalLM

Browse files
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.2",
3
  "architectures": [
4
- "LlavaLlamaForCausalLM"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
@@ -10,7 +10,6 @@
10
  "freeze_mm_vision_resampler": false,
11
  "hidden_act": "silu",
12
  "hidden_size": 4096,
13
- "ignore_index": -100,
14
  "image_aspect_ratio": "anyres",
15
  "image_crop_resolution": 224,
16
  "image_grid_pinpoints": [
@@ -36,7 +35,6 @@
36
  ]
37
  ],
38
  "image_split_resolution": 224,
39
- "image_token_index": 32000,
40
  "initializer_range": 0.02,
41
  "intermediate_size": 14336,
42
  "max_position_embeddings": 32768,
@@ -51,18 +49,13 @@
51
  "mm_vision_select_layer": -2,
52
  "mm_vision_tower": "openai/clip-vit-large-patch14-336",
53
  "mm_vision_tower_lr": 2e-06,
54
- "model_type": "llava",
55
  "num_attention_heads": 32,
56
  "num_hidden_layers": 32,
57
  "num_key_value_heads": 8,
58
- "pad_token_id": 32001,
59
- "projector_hidden_act": "gelu",
60
  "rms_norm_eps": 1e-05,
61
  "rope_theta": 1000000.0,
62
  "sliding_window": null,
63
- "text_config": {
64
- "model_type": "llama"
65
- },
66
  "tie_word_embeddings": false,
67
  "tokenizer_model_max_length": 4096,
68
  "tokenizer_padding_side": "left",
@@ -73,18 +66,5 @@
73
  "unfreeze_mm_vision_tower": true,
74
  "use_cache": true,
75
  "use_mm_proj": true,
76
- "vision_config": {
77
- "hidden_size": 1024,
78
- "image_size": 336,
79
- "intermediate_size": 4096,
80
- "model_type": "clip_vision_model",
81
- "num_attention_heads": 16,
82
- "num_hidden_layers": 24,
83
- "patch_size": 14,
84
- "projection_dim": 768,
85
- "vocab_size": 32000
86
- },
87
- "vision_feature_layer": -2,
88
- "vision_feature_select_strategy": "default",
89
  "vocab_size": 32000
90
  }
 
1
  {
2
  "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.2",
3
  "architectures": [
4
+ "LlavaMistralForCausalLM"
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
 
10
  "freeze_mm_vision_resampler": false,
11
  "hidden_act": "silu",
12
  "hidden_size": 4096,
 
13
  "image_aspect_ratio": "anyres",
14
  "image_crop_resolution": 224,
15
  "image_grid_pinpoints": [
 
35
  ]
36
  ],
37
  "image_split_resolution": 224,
 
38
  "initializer_range": 0.02,
39
  "intermediate_size": 14336,
40
  "max_position_embeddings": 32768,
 
49
  "mm_vision_select_layer": -2,
50
  "mm_vision_tower": "openai/clip-vit-large-patch14-336",
51
  "mm_vision_tower_lr": 2e-06,
52
+ "model_type": "llava_mistral",
53
  "num_attention_heads": 32,
54
  "num_hidden_layers": 32,
55
  "num_key_value_heads": 8,
 
 
56
  "rms_norm_eps": 1e-05,
57
  "rope_theta": 1000000.0,
58
  "sliding_window": null,
 
 
 
59
  "tie_word_embeddings": false,
60
  "tokenizer_model_max_length": 4096,
61
  "tokenizer_padding_side": "left",
 
66
  "unfreeze_mm_vision_tower": true,
67
  "use_cache": true,
68
  "use_mm_proj": true,
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  "vocab_size": 32000
70
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed847689535b583f0cce5ec866118b2028c25b06990c2baa611a30717d119bb2
3
- size 4943170528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95f62213d2f1b6e87b897bb48b23b1cd51292e74c54ceda150fe8bddb9c3a692
3
+ size 4943170624
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7476e5d88ef0847407f7c21e4b36f00b6f7a82a19d7b4a60b8e4c0c959336dea
3
- size 4999819232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a163a5b72360c131b4e24eafb53f708fee98a7be42440eb4e89056812f4c08dc
3
+ size 4999819336
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a80b40f7465dd414c8fab2f1c869423a9dde5ba0d4807fd279d38e69652992a
3
- size 4927407880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91b09c2332ca2e829fe56b912e01736e872d62f58e66e44a65c4f848618b14e1
3
+ size 4927408360
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db8e7284360293748cb7fa3bdcec0cbd418e8721041723a5abaa4b7f5c1a14af
3
  size 262144128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb257ed562525979a1bf69cae89828d4580bcdb525e1c426fc7b96117a9e0dbe
3
  size 262144128