lixin4sky commited on
Commit
db1be90
1 Parent(s): 71baa83

datasets commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .DS_Store +0 -0
  2. README.md +1 -1
  3. datasets/.DS_Store +0 -0
  4. datasets/code_data/dataset_dict.json +1 -0
  5. datasets/code_data/test/cache-2c70f7a7d5e2fb42.arrow +3 -0
  6. datasets/code_data/test/cache-39e7b9181004d4a5.arrow +3 -0
  7. datasets/code_data/test/cache-444e15f3134aed35_00000_of_00004.arrow +3 -0
  8. datasets/code_data/test/cache-444e15f3134aed35_00001_of_00004.arrow +3 -0
  9. datasets/code_data/test/cache-444e15f3134aed35_00002_of_00004.arrow +3 -0
  10. datasets/code_data/test/cache-444e15f3134aed35_00003_of_00004.arrow +3 -0
  11. datasets/code_data/test/cache-4650cd749e3e19b3.arrow +3 -0
  12. datasets/code_data/test/cache-557e89bf3e0d06f1.arrow +3 -0
  13. datasets/code_data/test/cache-57df2e74a89a0bb7.arrow +3 -0
  14. datasets/code_data/test/cache-5d4ed3ae78960812.arrow +3 -0
  15. datasets/code_data/test/cache-62d32ecd714989d5.arrow +3 -0
  16. datasets/code_data/test/cache-f575994e5c23f284_00000_of_00004.arrow +3 -0
  17. datasets/code_data/test/cache-f575994e5c23f284_00001_of_00004.arrow +3 -0
  18. datasets/code_data/test/cache-f575994e5c23f284_00002_of_00004.arrow +3 -0
  19. datasets/code_data/test/cache-f575994e5c23f284_00003_of_00004.arrow +3 -0
  20. datasets/code_data/test/data-00000-of-00001.arrow +3 -0
  21. datasets/code_data/test/dataset_info.json +24 -0
  22. datasets/code_data/test/state.json +13 -0
  23. datasets/code_data/train/cache-22c2044f2379d425.arrow +3 -0
  24. datasets/code_data/train/cache-49f9224594160d92.arrow +3 -0
  25. datasets/code_data/train/cache-6573b445e8476215.arrow +3 -0
  26. datasets/code_data/train/cache-69650c9c107d83f9.arrow +3 -0
  27. datasets/code_data/train/cache-7bd58c3bb50b7ac7.arrow +3 -0
  28. datasets/code_data/train/cache-d4aef90b7bf61304_00000_of_00004.arrow +3 -0
  29. datasets/code_data/train/cache-d4aef90b7bf61304_00001_of_00004.arrow +3 -0
  30. datasets/code_data/train/cache-d4aef90b7bf61304_00002_of_00004.arrow +3 -0
  31. datasets/code_data/train/cache-d4aef90b7bf61304_00003_of_00004.arrow +3 -0
  32. datasets/code_data/train/cache-ea0920a856ca6c6b_00000_of_00004.arrow +3 -0
  33. datasets/code_data/train/cache-ea0920a856ca6c6b_00001_of_00004.arrow +3 -0
  34. datasets/code_data/train/cache-ea0920a856ca6c6b_00002_of_00004.arrow +3 -0
  35. datasets/code_data/train/cache-ea0920a856ca6c6b_00003_of_00004.arrow +3 -0
  36. datasets/code_data/train/data-00000-of-00001.arrow +3 -0
  37. datasets/code_data/train/dataset_info.json +24 -0
  38. datasets/code_data/train/state.json +13 -0
  39. datasets/doc_and_code/dataset_dict.json +1 -0
  40. datasets/doc_and_code/test/cache-3be0d55acefd340c.arrow +3 -0
  41. datasets/doc_and_code/test/cache-56b65669ef6ab26f.arrow +3 -0
  42. datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00000_of_00004.arrow +3 -0
  43. datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00001_of_00004.arrow +3 -0
  44. datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00002_of_00004.arrow +3 -0
  45. datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00003_of_00004.arrow +3 -0
  46. datasets/doc_and_code/test/cache-d6e80d3035fcdcd4.arrow +3 -0
  47. datasets/doc_and_code/test/cache-e48b563586733a70.arrow +3 -0
  48. datasets/doc_and_code/test/cache-ed29fdd6a41aa6ba.arrow +3 -0
  49. datasets/doc_and_code/test/cache-f3711d2297e0fd99.arrow +3 -0
  50. datasets/doc_and_code/test/cache-f8ea63f132267268_00000_of_00004.arrow +3 -0
.DS_Store CHANGED
Binary files a/.DS_Store and b/.DS_Store differ
 
README.md CHANGED
@@ -67,7 +67,7 @@ from peft import PeftModel
67
 
68
  device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
69
 
70
- model_name_or_path = 'deepseek-ai/deepseek-coder-7b-instruct-v1.5'
71
  # You can use Llama-3-8B by 'meta-llama/Meta-Llama-3-8B-Instruct'.
72
  # You can also use your local path.
73
  peft_model_path = 'https://huggingface.co/lixin4sky/ProGraph/tree/main/deepseek-code-only'
 
67
 
68
  device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
69
 
70
+ model_name_or_path = '../models/deepseek-ai/deepseek-coder-7b-instruct-v1.5'
71
  # You can use Llama-3-8B by 'meta-llama/Meta-Llama-3-8B-Instruct'.
72
  # You can also use your local path.
73
  peft_model_path = 'https://huggingface.co/lixin4sky/ProGraph/tree/main/deepseek-code-only'
datasets/.DS_Store ADDED
Binary file (6.15 kB). View file
 
datasets/code_data/dataset_dict.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"splits": ["train", "test"]}
datasets/code_data/test/cache-2c70f7a7d5e2fb42.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06bef7f6d991273dbee48ae14bfdccf7629943f6fda4cf04ab59b38b04752f59
3
+ size 38655360
datasets/code_data/test/cache-39e7b9181004d4a5.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07de1df690d66506e919d3e55fa8076c05583e8a9d22e4b8b91446ef77b195cc
3
+ size 34532328
datasets/code_data/test/cache-444e15f3134aed35_00000_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0996566e20205801956ed172bbeefb5077cfb8c08f15cec0285e6f8009647c09
3
+ size 7499872
datasets/code_data/test/cache-444e15f3134aed35_00001_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de875c7faccd4859492e00f27be249c69b7356fbb183af1a72048d944cbe7893
3
+ size 7582392
datasets/code_data/test/cache-444e15f3134aed35_00002_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea3982c4843c0b5d638abd947f9857aeb442302d6838fab9d03cd117ed50692f
3
+ size 7439960
datasets/code_data/test/cache-444e15f3134aed35_00003_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:340f0760ede2b86184aefe46685dcff887319d957c9b9ba74e89533271b0f8a7
3
+ size 7483176
datasets/code_data/test/cache-4650cd749e3e19b3.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e8449b57f97be24413c786a5d99b4b1c6fc9b0df28c7b0a023b4edb478a129b
3
+ size 38655360
datasets/code_data/test/cache-557e89bf3e0d06f1.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7dcd5f3bb9a90a341486203f324e99851e4cf61d42ada43fb2dafb38e08f179
3
+ size 244432
datasets/code_data/test/cache-57df2e74a89a0bb7.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59af5993efbaf5d9d19944b27bc394b5f33dbce39a6cb02e4ef02eb3ff18d2b0
3
+ size 244432
datasets/code_data/test/cache-5d4ed3ae78960812.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df408a3298dd25c51c77fd4c263fd283d6c62fa28a4a17dc5e2f8ff35d3c33c3
3
+ size 244432
datasets/code_data/test/cache-62d32ecd714989d5.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f639781007729d58fbed66182c235d14fc4fb6847cf2fa54dd0de0a2e718789
3
+ size 34532328
datasets/code_data/test/cache-f575994e5c23f284_00000_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62e202729d0c82b868b2941fa98dbcacb703acd25f30ef4fd9338cb4e2a59819
3
+ size 7919536
datasets/code_data/test/cache-f575994e5c23f284_00001_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9875e5760c7c44da42872dba2c8af144cdd1b61649e942bb334bc3a6ceec59e
3
+ size 8002056
datasets/code_data/test/cache-f575994e5c23f284_00002_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ef62827b890a8927b907be0fd2f507e301bbffc601129208b9fa2de8d284b10
3
+ size 7859624
datasets/code_data/test/cache-f575994e5c23f284_00003_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:508f7b4e3d148fa50ebc795643bc690c30189b8f06b697d399aa13c91c64445a
3
+ size 7902840
datasets/code_data/test/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49da1c2f40b17b6b22e59ebe437b03508d12441c3e3b1ca964a71d78705d7998
3
+ size 29594528
datasets/code_data/test/dataset_info.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "citation": "",
3
+ "description": "",
4
+ "features": {
5
+ "api": {
6
+ "dtype": "string",
7
+ "_type": "Value"
8
+ },
9
+ "messages": [
10
+ {
11
+ "content": {
12
+ "dtype": "string",
13
+ "_type": "Value"
14
+ },
15
+ "role": {
16
+ "dtype": "string",
17
+ "_type": "Value"
18
+ }
19
+ }
20
+ ]
21
+ },
22
+ "homepage": "",
23
+ "license": ""
24
+ }
datasets/code_data/test/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "99495646072e17ba",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
datasets/code_data/train/cache-22c2044f2379d425.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9088b4c432f0055ff6d9c3387e233b5db0c739d174dd77dd0fbbf981c01dea8b
3
+ size 34532328
datasets/code_data/train/cache-49f9224594160d92.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d1794517749dc684314aef13286366cdea5ca033f585cf1eaf6ddd853a0b63b
3
+ size 244432
datasets/code_data/train/cache-6573b445e8476215.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88bb957b3dadfad9b3704ec16463092ce184a202d6e612a31ad67fbecb4c259b
3
+ size 38655360
datasets/code_data/train/cache-69650c9c107d83f9.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d7f6504df958012c3a67e486041cf4240c4c54abf9d48e9dd6f6cf00d4cee43
3
+ size 244432
datasets/code_data/train/cache-7bd58c3bb50b7ac7.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:187657e13f1837546df60e2e6e65dd4690debaee1ab5e7eceebd52147bea9f6d
3
+ size 244432
datasets/code_data/train/cache-d4aef90b7bf61304_00000_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af757c931ba8b0923d723b03fe01e4ad4820d4b1e0bcde01fc4e74401f817aaf
3
+ size 7919536
datasets/code_data/train/cache-d4aef90b7bf61304_00001_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:079d2e4966c87fc3910a9080ab43472a7c441eb9a01efdcec587f3329af64082
3
+ size 8002056
datasets/code_data/train/cache-d4aef90b7bf61304_00002_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:228df6ecbc9ec2cb6d191679d1d9fe4843ea5c413d841ea97efc2a37be0c38a3
3
+ size 7859624
datasets/code_data/train/cache-d4aef90b7bf61304_00003_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00c4277310541969caed004ad201289804ee6dc9c17d621cf8cbe3d503735ed0
3
+ size 7902840
datasets/code_data/train/cache-ea0920a856ca6c6b_00000_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba566c47ae9eff475c83d70b45208ff99f38f192999013a2277ad2ff975d5d25
3
+ size 7499872
datasets/code_data/train/cache-ea0920a856ca6c6b_00001_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b1279b8e4f609b7cf84750053c02b17cbd4acd23e9026623800eb232526d403
3
+ size 7582392
datasets/code_data/train/cache-ea0920a856ca6c6b_00002_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ed4dfa9fc376e6e87e5c06205fb95654509fd44bfe38f97e94846299d08ea06
3
+ size 7439960
datasets/code_data/train/cache-ea0920a856ca6c6b_00003_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec27186f3da9545bc2aa5fd86faa8261ee634295ec19590233994c718e6cb910
3
+ size 7483176
datasets/code_data/train/data-00000-of-00001.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49da1c2f40b17b6b22e59ebe437b03508d12441c3e3b1ca964a71d78705d7998
3
+ size 29594528
datasets/code_data/train/dataset_info.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "citation": "",
3
+ "description": "",
4
+ "features": {
5
+ "api": {
6
+ "dtype": "string",
7
+ "_type": "Value"
8
+ },
9
+ "messages": [
10
+ {
11
+ "content": {
12
+ "dtype": "string",
13
+ "_type": "Value"
14
+ },
15
+ "role": {
16
+ "dtype": "string",
17
+ "_type": "Value"
18
+ }
19
+ }
20
+ ]
21
+ },
22
+ "homepage": "",
23
+ "license": ""
24
+ }
datasets/code_data/train/state.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_data_files": [
3
+ {
4
+ "filename": "data-00000-of-00001.arrow"
5
+ }
6
+ ],
7
+ "_fingerprint": "99495646072e17ba",
8
+ "_format_columns": null,
9
+ "_format_kwargs": {},
10
+ "_format_type": null,
11
+ "_output_all_columns": false,
12
+ "_split": null
13
+ }
datasets/doc_and_code/dataset_dict.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"splits": ["train", "test"]}
datasets/doc_and_code/test/cache-3be0d55acefd340c.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f91945a79de83989af8b42b854d3ea5b5945ef6f270aac563959450923887313
3
+ size 72849472
datasets/doc_and_code/test/cache-56b65669ef6ab26f.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6423b1c43ed61b7cf7b8348bde7ccfc208342b0aac3c011b8adedc3e5d54391f
3
+ size 72849472
datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00000_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:957ee7b987cd6523d4f8364f761171f76810768120f8549b4584439d7a774e21
3
+ size 16482360
datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00001_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1be68808c3b8bf0677581a59e26f082335e986eddb92169de9c9b811f3ea485d
3
+ size 16360472
datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00002_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae0de04cfd2e69b4b46eaaf14d156b9578844ed6eafb31c9cbc1c86f9c5f0206
3
+ size 16348456
datasets/doc_and_code/test/cache-b8182fb692f5fc4f_00003_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6e6146be000ee4213f6f93ae960981e5ec8dc6c6cf41e6b88dce566f0b8fe67
3
+ size 16265080
datasets/doc_and_code/test/cache-d6e80d3035fcdcd4.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:502919b73aa7e8ad6b6ccd472ed7ab4e46ba56f89b52b1c35f6a5cdad832ae04
3
+ size 244432
datasets/doc_and_code/test/cache-e48b563586733a70.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa74da25b1aa83cbf8b0b6f1e7a97bcb353eac09b713b592a7ba1cb57197c75
3
+ size 244432
datasets/doc_and_code/test/cache-ed29fdd6a41aa6ba.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea8c9cac65fd730cfd1dc9b997280186ee7d900c9440b29069898ca347aadfc1
3
+ size 81242584
datasets/doc_and_code/test/cache-f3711d2297e0fd99.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eacc6b257e1338613b6ef362f16a1b91ccba583f81a9a3fe3582668bba9ca18
3
+ size 81242584
datasets/doc_and_code/test/cache-f8ea63f132267268_00000_of_00004.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cea366d8abcb0dcd57c4108d591ab80168fc057ea574da28f819ead9e9f35e3c
3
+ size 16902024