junzhang74 committed on
Commit
0b4e111
1 Parent(s): 56e91ab

commit from

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +50 -0
  2. generation_config.json +9 -0
  3. model-00001-of-00086.safetensors +3 -0
  4. model-00002-of-00086.safetensors +3 -0
  5. model-00003-of-00086.safetensors +3 -0
  6. model-00004-of-00086.safetensors +3 -0
  7. model-00005-of-00086.safetensors +3 -0
  8. model-00006-of-00086.safetensors +3 -0
  9. model-00007-of-00086.safetensors +3 -0
  10. model-00008-of-00086.safetensors +3 -0
  11. model-00009-of-00086.safetensors +3 -0
  12. model-00010-of-00086.safetensors +3 -0
  13. model-00011-of-00086.safetensors +3 -0
  14. model-00012-of-00086.safetensors +3 -0
  15. model-00013-of-00086.safetensors +3 -0
  16. model-00014-of-00086.safetensors +3 -0
  17. model-00015-of-00086.safetensors +3 -0
  18. model-00016-of-00086.safetensors +3 -0
  19. model-00017-of-00086.safetensors +3 -0
  20. model-00018-of-00086.safetensors +3 -0
  21. model-00019-of-00086.safetensors +3 -0
  22. model-00020-of-00086.safetensors +3 -0
  23. model-00021-of-00086.safetensors +3 -0
  24. model-00022-of-00086.safetensors +3 -0
  25. model-00023-of-00086.safetensors +3 -0
  26. model-00024-of-00086.safetensors +3 -0
  27. model-00025-of-00086.safetensors +3 -0
  28. model-00026-of-00086.safetensors +3 -0
  29. model-00027-of-00086.safetensors +3 -0
  30. model-00028-of-00086.safetensors +3 -0
  31. model-00029-of-00086.safetensors +3 -0
  32. model-00030-of-00086.safetensors +3 -0
  33. model-00031-of-00086.safetensors +3 -0
  34. model-00032-of-00086.safetensors +3 -0
  35. model-00033-of-00086.safetensors +3 -0
  36. model-00034-of-00086.safetensors +3 -0
  37. model-00035-of-00086.safetensors +3 -0
  38. model-00036-of-00086.safetensors +3 -0
  39. model-00037-of-00086.safetensors +3 -0
  40. model-00038-of-00086.safetensors +3 -0
  41. model-00039-of-00086.safetensors +3 -0
  42. model-00040-of-00086.safetensors +3 -0
  43. model-00041-of-00086.safetensors +3 -0
  44. model-00042-of-00086.safetensors +3 -0
  45. model-00043-of-00086.safetensors +3 -0
  46. model-00044-of-00086.safetensors +3 -0
  47. model-00045-of-00086.safetensors +3 -0
  48. model-00046-of-00086.safetensors +3 -0
  49. model-00047-of-00086.safetensors +3 -0
  50. model-00048-of-00086.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": 128001,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 16384,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 53248,
14
+ "max_position_embeddings": 131072,
15
+ "mlp_bias": false,
16
+ "model_type": "llama",
17
+ "num_attention_heads": 128,
18
+ "num_hidden_layers": 126,
19
+ "num_key_value_heads": 8,
20
+ "pretraining_tp": 1,
21
+ "quantization_config": {
22
+ "_load_in_4bit": false,
23
+ "_load_in_8bit": true,
24
+ "bnb_4bit_compute_dtype": "float32",
25
+ "bnb_4bit_quant_storage": "uint8",
26
+ "bnb_4bit_quant_type": "fp4",
27
+ "bnb_4bit_use_double_quant": false,
28
+ "llm_int8_enable_fp32_cpu_offload": false,
29
+ "llm_int8_has_fp16_weight": false,
30
+ "llm_int8_skip_modules": null,
31
+ "llm_int8_threshold": 6.0,
32
+ "load_in_4bit": false,
33
+ "load_in_8bit": true,
34
+ "quant_method": "bitsandbytes"
35
+ },
36
+ "rms_norm_eps": 1e-05,
37
+ "rope_scaling": {
38
+ "factor": 8.0,
39
+ "high_freq_factor": 4.0,
40
+ "low_freq_factor": 1.0,
41
+ "original_max_position_embeddings": 8192,
42
+ "rope_type": "llama3"
43
+ },
44
+ "rope_theta": 500000.0,
45
+ "tie_word_embeddings": false,
46
+ "torch_dtype": "float16",
47
+ "transformers_version": "4.44.2",
48
+ "use_cache": true,
49
+ "vocab_size": 128256
50
+ }
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 128000,
4
+ "do_sample": true,
5
+ "eos_token_id": 128001,
6
+ "temperature": 0.6,
7
+ "top_p": 0.9,
8
+ "transformers_version": "4.44.2"
9
+ }
model-00001-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b92a64c79de5198c8cd70b9a1a1b631665712cd0e65040f514d56b055c385f71
3
+ size 4773258676
model-00002-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90671fc56d26137a6239a809b68c5071cdf07e679c4ee94d0d95a070a2b6bc77
3
+ size 4933626985
model-00003-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa5102057d66000e251032bd26f5839769d294d4e98ea78ca20402e44ddf2fc2
3
+ size 4631482668
model-00004-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:919044b8a3366d44e5672ff6802d1da0a3c138a2e1e4e2ae89ab9f83331c2491
3
+ size 4933626985
model-00005-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75ee7824f04afa01b11b65fbb7425c96a54ff418f808989005935cfc0ca8b4bc
3
+ size 4631482668
model-00006-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa5ddc572cb928a837c5144d3ddddf85ca8ce9929441267ac978cfb5a3ffd7a
3
+ size 4933626985
model-00007-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1969ce0689a1a742feaefd29350bf08b3e3bd1d625ec80f15643f2c410ff16e4
3
+ size 4631482668
model-00008-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37d86c4729435efdd6cf523f513ff8a7f82aa12585a260a6785d290bbb7e2f49
3
+ size 4933627009
model-00009-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5b9d793c6ff74c92193155665db6a30cc2199c12a038f057992fb8abf448e85
3
+ size 4631482708
model-00010-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aebceaec7bdb0fd110706fce7041cdf6fbbdc5c6f16dc84c2c7130c7afed49e2
3
+ size 4933627017
model-00011-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54159588787a6d307e55de4de0a7e00cec9ae8ef66adc36d16dadcbcc8b3eddb
3
+ size 4631482708
model-00012-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00d03a49d11895e45a566ad5d582d3183a5ec0c863eba30ac1c816f4492d60fb
3
+ size 4933627017
model-00013-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02e0730263eeb16b60f1c59b8bd92be1fd356e64d4c6d66acd3c576d854fea06
3
+ size 4631482708
model-00014-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6373b62a430f6541920af31cc36900532a1507ffb1cd4b047fb5df1031f4e01e
3
+ size 4933627017
model-00015-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc694925249a65e040e4ca7e04d601647594b8afc8adb9422cecbd034a43f8ab
3
+ size 4631482708
model-00016-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ac7e51f817b9b9021ac30b5743f7cfb8adf2545527ca9aa9dcc0754aab02c45
3
+ size 4933627017
model-00017-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d81aa8994681501dae7648f1bc36278fa7a17c0f776b269bca52672901fb09c
3
+ size 4631482708
model-00018-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef7102056decbb8801613640dbe749711dcafac023d41b4cebab5a3670ef231f
3
+ size 4933627017
model-00019-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a92ba41d40b96675249c6c1caf37896bb354127204fc20692256a1921f8fb436
3
+ size 4631482708
model-00020-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d323880add2b6b0834c21548d4e3293a874419dc5e9bedeeed8aa4beba2dd9
3
+ size 4933627017
model-00021-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53801c7b41eceb8deb4e169d715eaccaf5d4dabb8d7fa01ebec3bf5fde1acfdb
3
+ size 4631482708
model-00022-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1246bf5f5dd56b6c0d00e8c37434e4ac6296ff8fb0cebfa3e5adb167fc2e1ea
3
+ size 4933627017
model-00023-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ae27e3e7aaf3248d86ceacbce5f7bcfbf2f54b2b6b9edab11450a3b91827dcb
3
+ size 4631482708
model-00024-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65ab9aa16b89dce57cf900fa9699d46900e383534608b3a8a7a88bc85ca801af
3
+ size 4933627017
model-00025-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee501376ed91dad856438cce58ef5465281d9f990328a1af6bb76d908d841053
3
+ size 4631482708
model-00026-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:126ebe74ce5c0b0c10a440c06482a070787b8fb60187722d0271866a36f6497f
3
+ size 4933627017
model-00027-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d0b8be15f36ab278896248c95e01db86f9a11dc336af940d6b2ce2ee083e97e
3
+ size 4631482708
model-00028-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12befd0992fcac106a846211b1f5955899e0c3df2965541c7dab2a24cf450115
3
+ size 4933627017
model-00029-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:885b3dca03fa6c7732df21a7ee404f19c47b9c8994c2acdf4417edbab64e6f28
3
+ size 4631482708
model-00030-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb8319583e729b31d2b48de9eab43ccbc3d1cb2c182dedda62a1ca6c15260b49
3
+ size 4933627017
model-00031-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d43f3b1798b5015cbab3f9d421554394ead888e760cd2c96bfac5028ac6e857e
3
+ size 4631482708
model-00032-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:873e5fd2d46a9b61f287dc384bb1e5fd6f4eec51c25b39271f235148796f1abf
3
+ size 4933627017
model-00033-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc667d37e93ba202375587c84e959b54f4b425666e88d84b305486c308fbe50b
3
+ size 4631482708
model-00034-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b753dfd2ed46c132846e2365cb5c40faa933f671330276a2cec12facf6a43e24
3
+ size 4933627017
model-00035-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9711b034d8eb2d02857f3a9c96fcd64a7c8d66cfd1d0c6e21b9baad975506a75
3
+ size 4631482708
model-00036-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ac51a525dc1151e5cf3aab421fb4eec283dea61bcd5469d2993babf8c870e85
3
+ size 4933627017
model-00037-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd3ccafabd7730e24ca7db358dda92c5d3a5722006f625bc719fc050b48df863
3
+ size 4631482708
model-00038-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea9161c27893fd19092e670e05d15d0d69fac500242faf5504d1dcd2b93bc543
3
+ size 4933627017
model-00039-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baea9714a4638627551743ad8124f63cdf272ca9c3524d99b5b8909a4d5522ef
3
+ size 4631482708
model-00040-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d394c1ea6107c1c8f068951a7d3cf16e2eecc24d98f0f59b5190b35f08af96b
3
+ size 4933627017
model-00041-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:300d5e66b5c7f31fb578ac8fe942929f51bb5ae090cc36446eedc8e79811115f
3
+ size 4631482708
model-00042-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6afe7b2f601793a2a9c517e5fb5db47a49a9f10b41b1ada36c8a9c72f3035c9f
3
+ size 4933627017
model-00043-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:588cb9bb1d9ea03ea03e6109cdfb9346fbb57d6cb8c07d5d523e496c05eda6e7
3
+ size 4631482708
model-00044-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46da69474a89df60629357f0037d0e46b543c4df5f8d8d765e06d81c2954ec56
3
+ size 4933627017
model-00045-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f008d7d6c1f3c56ed3fc49fc3c46002c8c9c42a66be5a4c930492b3f6808fa4
3
+ size 4631482708
model-00046-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d9afeb374c0314579150bcedf688cf12f7244b727b9da57ff57e7080410beeb
3
+ size 4933627017
model-00047-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5324dcb2c173a63cc3437f04b4624dc52407b0060de5c1cbf2e368f8a0d18be4
3
+ size 4631482708
model-00048-of-00086.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:611962796b6a74b507043c914a54ee9147b0fe48c995c0a9f335db90d7be592d
3
+ size 4933627017