jburtoft committed on Jan 13

Commit

67b593a

•

1 Parent(s): d2c6bb6

9baf68f25225e25f0cf14788e00887629a2702ae956b76bdb4f615262d70399f

Browse files

Files changed (21) hide show

checkpoint/config.json +27 -0
checkpoint/generation_config.json +7 -0
checkpoint/pytorch_model.bin/key_to_filename.json +3 -0
checkpoint/pytorch_model.bin/p0.model.embed_tokens.weight +3 -0
checkpoint/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight +3 -0
checkpoint/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight +3 -0
checkpoint/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight +3 -0
checkpoint/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight +3 -0
checkpoint/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight +3 -0
checkpoint/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight +3 -0
checkpoint/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight +3 -0
checkpoint/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight +3 -0
checkpoint/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight +3 -0
checkpoint/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight +3 -0

checkpoint/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "SOLAR-10.7B-v1.0",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 4096,
+  "initializer_range": 0.02,
+  "intermediate_size": 14336,
+  "max_position_embeddings": 4096,
+  "model_type": "llama",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 48,
+  "num_key_value_heads": 8,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 10000.0,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.35.0",
+  "use_cache": false,
+  "vocab_size": 32000
+}

checkpoint/generation_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "transformers_version": "4.35.0",
+  "use_cache": false
+}

checkpoint/pytorch_model.bin/key_to_filename.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:408ad396d329c82ca699a62e277b1af43cd60413c7f5ef275b5fcd12f8913934
+size 39661

checkpoint/pytorch_model.bin/p0.model.embed_tokens.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f826aaa8ff17bf50940f6f7a2563404df0c00287ec3af0414cb98ea4df4b7065
+size 524288789

checkpoint/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:782d1fe3043d72ce1916338d2f8ec2c094a5a1a55962b39ca18e3022c025299d
+size 67109756

checkpoint/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd0bfe727386bc395cb9ade3183f514f8c77ab834363df65cd24f12c6609b88d
+size 67109759

checkpoint/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:baf82cc47336698e73130a5080a993e27c5b568d0fe839dda20563bae4b8ff77
+size 67109765

checkpoint/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e9ed9e561549e1db150ec6c9bbc0a852efc6d2f2a26fb334e1cc627b864d123a
+size 16778117

checkpoint/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5b4413adb71900f5a872de63ae00823310f0843546d441e543616c4671717355
+size 16778117

checkpoint/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d5e810de6a404938eee84aa5dc05982f06a4c8092d65017fa75691521614090
+size 67109765

checkpoint/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6cd3ed09ec561001104b63c8ca015dfeb40e64bea27e8f27f90d045a5a1994cb
+size 234881916

checkpoint/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0ed4095919abdde1eeedc771bcdca92911e9e6076f156e0831537dd2cf14454
+size 234881910

checkpoint/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fa639d44565cb737af256b0b533e7535b83a2f3a78e7c255abe94fe03194d84
+size 234881916

checkpoint/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d4c729ce40007d4e71f6cdd8102b575fab26947be415da578ca2a76cfe8b31f9
+size 17282

checkpoint/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b2120204b8442d4e7e5c1a7ab65dd78ae0530241090c9db8129a6fc2059b599a
+size 17309

checkpoint/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3877ba90aa3ccaefe419946b93d40c6df6404d08d7ed4e18eee4796426c84105
+size 67109765

checkpoint/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:761379bb269a38ecba268ee6e91087d6f0bf0443e049b57dd2a5be7337dcedc3
+size 16778111

checkpoint/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c0106a5423ea9775312b727b50427185d827086c05c8c08a386367065c1dac3
+size 16778117

checkpoint/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f4c584d3b7fe9ba9d25f4a954d5175308f34b3a4b85fe2bc2cd94d372e8060ea
+size 16778117

checkpoint/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b89d9d6818807fd1e346eefc97f29926b3734b28fcf3b4d0b2d2b4373ede360e
+size 67109765

checkpoint/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9c4090f834560e92c7232dc8870d1aecdcb45bd2ec20a903708c54e0b4e77917
+size 234881916