junzhang74
committed on
Commit
•
0b4e111
1
Parent(s):
56e91ab
commit from
Browse files. This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +50 -0
- generation_config.json +9 -0
- model-00001-of-00086.safetensors +3 -0
- model-00002-of-00086.safetensors +3 -0
- model-00003-of-00086.safetensors +3 -0
- model-00004-of-00086.safetensors +3 -0
- model-00005-of-00086.safetensors +3 -0
- model-00006-of-00086.safetensors +3 -0
- model-00007-of-00086.safetensors +3 -0
- model-00008-of-00086.safetensors +3 -0
- model-00009-of-00086.safetensors +3 -0
- model-00010-of-00086.safetensors +3 -0
- model-00011-of-00086.safetensors +3 -0
- model-00012-of-00086.safetensors +3 -0
- model-00013-of-00086.safetensors +3 -0
- model-00014-of-00086.safetensors +3 -0
- model-00015-of-00086.safetensors +3 -0
- model-00016-of-00086.safetensors +3 -0
- model-00017-of-00086.safetensors +3 -0
- model-00018-of-00086.safetensors +3 -0
- model-00019-of-00086.safetensors +3 -0
- model-00020-of-00086.safetensors +3 -0
- model-00021-of-00086.safetensors +3 -0
- model-00022-of-00086.safetensors +3 -0
- model-00023-of-00086.safetensors +3 -0
- model-00024-of-00086.safetensors +3 -0
- model-00025-of-00086.safetensors +3 -0
- model-00026-of-00086.safetensors +3 -0
- model-00027-of-00086.safetensors +3 -0
- model-00028-of-00086.safetensors +3 -0
- model-00029-of-00086.safetensors +3 -0
- model-00030-of-00086.safetensors +3 -0
- model-00031-of-00086.safetensors +3 -0
- model-00032-of-00086.safetensors +3 -0
- model-00033-of-00086.safetensors +3 -0
- model-00034-of-00086.safetensors +3 -0
- model-00035-of-00086.safetensors +3 -0
- model-00036-of-00086.safetensors +3 -0
- model-00037-of-00086.safetensors +3 -0
- model-00038-of-00086.safetensors +3 -0
- model-00039-of-00086.safetensors +3 -0
- model-00040-of-00086.safetensors +3 -0
- model-00041-of-00086.safetensors +3 -0
- model-00042-of-00086.safetensors +3 -0
- model-00043-of-00086.safetensors +3 -0
- model-00044-of-00086.safetensors +3 -0
- model-00045-of-00086.safetensors +3 -0
- model-00046-of-00086.safetensors +3 -0
- model-00047-of-00086.safetensors +3 -0
- model-00048-of-00086.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": 128001,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 16384,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 53248,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"mlp_bias": false,
|
16 |
+
"model_type": "llama",
|
17 |
+
"num_attention_heads": 128,
|
18 |
+
"num_hidden_layers": 126,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"quantization_config": {
|
22 |
+
"_load_in_4bit": false,
|
23 |
+
"_load_in_8bit": true,
|
24 |
+
"bnb_4bit_compute_dtype": "float32",
|
25 |
+
"bnb_4bit_quant_storage": "uint8",
|
26 |
+
"bnb_4bit_quant_type": "fp4",
|
27 |
+
"bnb_4bit_use_double_quant": false,
|
28 |
+
"llm_int8_enable_fp32_cpu_offload": false,
|
29 |
+
"llm_int8_has_fp16_weight": false,
|
30 |
+
"llm_int8_skip_modules": null,
|
31 |
+
"llm_int8_threshold": 6.0,
|
32 |
+
"load_in_4bit": false,
|
33 |
+
"load_in_8bit": true,
|
34 |
+
"quant_method": "bitsandbytes"
|
35 |
+
},
|
36 |
+
"rms_norm_eps": 1e-05,
|
37 |
+
"rope_scaling": {
|
38 |
+
"factor": 8.0,
|
39 |
+
"high_freq_factor": 4.0,
|
40 |
+
"low_freq_factor": 1.0,
|
41 |
+
"original_max_position_embeddings": 8192,
|
42 |
+
"rope_type": "llama3"
|
43 |
+
},
|
44 |
+
"rope_theta": 500000.0,
|
45 |
+
"tie_word_embeddings": false,
|
46 |
+
"torch_dtype": "float16",
|
47 |
+
"transformers_version": "4.44.2",
|
48 |
+
"use_cache": true,
|
49 |
+
"vocab_size": 128256
|
50 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"do_sample": true,
|
5 |
+
"eos_token_id": 128001,
|
6 |
+
"temperature": 0.6,
|
7 |
+
"top_p": 0.9,
|
8 |
+
"transformers_version": "4.44.2"
|
9 |
+
}
|
model-00001-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b92a64c79de5198c8cd70b9a1a1b631665712cd0e65040f514d56b055c385f71
|
3 |
+
size 4773258676
|
model-00002-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90671fc56d26137a6239a809b68c5071cdf07e679c4ee94d0d95a070a2b6bc77
|
3 |
+
size 4933626985
|
model-00003-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa5102057d66000e251032bd26f5839769d294d4e98ea78ca20402e44ddf2fc2
|
3 |
+
size 4631482668
|
model-00004-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:919044b8a3366d44e5672ff6802d1da0a3c138a2e1e4e2ae89ab9f83331c2491
|
3 |
+
size 4933626985
|
model-00005-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75ee7824f04afa01b11b65fbb7425c96a54ff418f808989005935cfc0ca8b4bc
|
3 |
+
size 4631482668
|
model-00006-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fa5ddc572cb928a837c5144d3ddddf85ca8ce9929441267ac978cfb5a3ffd7a
|
3 |
+
size 4933626985
|
model-00007-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1969ce0689a1a742feaefd29350bf08b3e3bd1d625ec80f15643f2c410ff16e4
|
3 |
+
size 4631482668
|
model-00008-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d86c4729435efdd6cf523f513ff8a7f82aa12585a260a6785d290bbb7e2f49
|
3 |
+
size 4933627009
|
model-00009-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5b9d793c6ff74c92193155665db6a30cc2199c12a038f057992fb8abf448e85
|
3 |
+
size 4631482708
|
model-00010-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aebceaec7bdb0fd110706fce7041cdf6fbbdc5c6f16dc84c2c7130c7afed49e2
|
3 |
+
size 4933627017
|
model-00011-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54159588787a6d307e55de4de0a7e00cec9ae8ef66adc36d16dadcbcc8b3eddb
|
3 |
+
size 4631482708
|
model-00012-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00d03a49d11895e45a566ad5d582d3183a5ec0c863eba30ac1c816f4492d60fb
|
3 |
+
size 4933627017
|
model-00013-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02e0730263eeb16b60f1c59b8bd92be1fd356e64d4c6d66acd3c576d854fea06
|
3 |
+
size 4631482708
|
model-00014-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6373b62a430f6541920af31cc36900532a1507ffb1cd4b047fb5df1031f4e01e
|
3 |
+
size 4933627017
|
model-00015-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc694925249a65e040e4ca7e04d601647594b8afc8adb9422cecbd034a43f8ab
|
3 |
+
size 4631482708
|
model-00016-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ac7e51f817b9b9021ac30b5743f7cfb8adf2545527ca9aa9dcc0754aab02c45
|
3 |
+
size 4933627017
|
model-00017-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d81aa8994681501dae7648f1bc36278fa7a17c0f776b269bca52672901fb09c
|
3 |
+
size 4631482708
|
model-00018-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef7102056decbb8801613640dbe749711dcafac023d41b4cebab5a3670ef231f
|
3 |
+
size 4933627017
|
model-00019-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a92ba41d40b96675249c6c1caf37896bb354127204fc20692256a1921f8fb436
|
3 |
+
size 4631482708
|
model-00020-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78d323880add2b6b0834c21548d4e3293a874419dc5e9bedeeed8aa4beba2dd9
|
3 |
+
size 4933627017
|
model-00021-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53801c7b41eceb8deb4e169d715eaccaf5d4dabb8d7fa01ebec3bf5fde1acfdb
|
3 |
+
size 4631482708
|
model-00022-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1246bf5f5dd56b6c0d00e8c37434e4ac6296ff8fb0cebfa3e5adb167fc2e1ea
|
3 |
+
size 4933627017
|
model-00023-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ae27e3e7aaf3248d86ceacbce5f7bcfbf2f54b2b6b9edab11450a3b91827dcb
|
3 |
+
size 4631482708
|
model-00024-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65ab9aa16b89dce57cf900fa9699d46900e383534608b3a8a7a88bc85ca801af
|
3 |
+
size 4933627017
|
model-00025-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee501376ed91dad856438cce58ef5465281d9f990328a1af6bb76d908d841053
|
3 |
+
size 4631482708
|
model-00026-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:126ebe74ce5c0b0c10a440c06482a070787b8fb60187722d0271866a36f6497f
|
3 |
+
size 4933627017
|
model-00027-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d0b8be15f36ab278896248c95e01db86f9a11dc336af940d6b2ce2ee083e97e
|
3 |
+
size 4631482708
|
model-00028-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12befd0992fcac106a846211b1f5955899e0c3df2965541c7dab2a24cf450115
|
3 |
+
size 4933627017
|
model-00029-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:885b3dca03fa6c7732df21a7ee404f19c47b9c8994c2acdf4417edbab64e6f28
|
3 |
+
size 4631482708
|
model-00030-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb8319583e729b31d2b48de9eab43ccbc3d1cb2c182dedda62a1ca6c15260b49
|
3 |
+
size 4933627017
|
model-00031-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d43f3b1798b5015cbab3f9d421554394ead888e760cd2c96bfac5028ac6e857e
|
3 |
+
size 4631482708
|
model-00032-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:873e5fd2d46a9b61f287dc384bb1e5fd6f4eec51c25b39271f235148796f1abf
|
3 |
+
size 4933627017
|
model-00033-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc667d37e93ba202375587c84e959b54f4b425666e88d84b305486c308fbe50b
|
3 |
+
size 4631482708
|
model-00034-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b753dfd2ed46c132846e2365cb5c40faa933f671330276a2cec12facf6a43e24
|
3 |
+
size 4933627017
|
model-00035-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9711b034d8eb2d02857f3a9c96fcd64a7c8d66cfd1d0c6e21b9baad975506a75
|
3 |
+
size 4631482708
|
model-00036-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ac51a525dc1151e5cf3aab421fb4eec283dea61bcd5469d2993babf8c870e85
|
3 |
+
size 4933627017
|
model-00037-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd3ccafabd7730e24ca7db358dda92c5d3a5722006f625bc719fc050b48df863
|
3 |
+
size 4631482708
|
model-00038-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea9161c27893fd19092e670e05d15d0d69fac500242faf5504d1dcd2b93bc543
|
3 |
+
size 4933627017
|
model-00039-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:baea9714a4638627551743ad8124f63cdf272ca9c3524d99b5b8909a4d5522ef
|
3 |
+
size 4631482708
|
model-00040-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d394c1ea6107c1c8f068951a7d3cf16e2eecc24d98f0f59b5190b35f08af96b
|
3 |
+
size 4933627017
|
model-00041-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:300d5e66b5c7f31fb578ac8fe942929f51bb5ae090cc36446eedc8e79811115f
|
3 |
+
size 4631482708
|
model-00042-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6afe7b2f601793a2a9c517e5fb5db47a49a9f10b41b1ada36c8a9c72f3035c9f
|
3 |
+
size 4933627017
|
model-00043-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:588cb9bb1d9ea03ea03e6109cdfb9346fbb57d6cb8c07d5d523e496c05eda6e7
|
3 |
+
size 4631482708
|
model-00044-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46da69474a89df60629357f0037d0e46b543c4df5f8d8d765e06d81c2954ec56
|
3 |
+
size 4933627017
|
model-00045-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f008d7d6c1f3c56ed3fc49fc3c46002c8c9c42a66be5a4c930492b3f6808fa4
|
3 |
+
size 4631482708
|
model-00046-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d9afeb374c0314579150bcedf688cf12f7244b727b9da57ff57e7080410beeb
|
3 |
+
size 4933627017
|
model-00047-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5324dcb2c173a63cc3437f04b4624dc52407b0060de5c1cbf2e368f8a0d18be4
|
3 |
+
size 4631482708
|
model-00048-of-00086.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:611962796b6a74b507043c914a54ee9147b0fe48c995c0a9f335db90d7be592d
|
3 |
+
size 4933627017
|