Training in progress, step 10
Browse files- .gitattributes +1 -0
- adapter_config.json +32 -0
- adapter_model.safetensors +3 -0
- added_tokens.json +5 -0
- merges.txt +0 -0
- runs/Jan30_16-45-36_add665d75a5a/events.out.tfevents.1738255553.add665d75a5a.2008.0 +3 -0
- runs/Jan30_16-46-35_add665d75a5a/events.out.tfevents.1738255599.add665d75a5a.2008.1 +3 -0
- runs/Jan30_16-46-35_add665d75a5a/events.out.tfevents.1738255647.add665d75a5a.2008.2 +3 -0
- runs/Jan30_16-46-35_add665d75a5a/events.out.tfevents.1738255658.add665d75a5a.2008.3 +3 -0
- runs/Jan30_16-48-51_add665d75a5a/events.out.tfevents.1738255733.add665d75a5a.10136.0 +3 -0
- runs/Jan30_16-51-05_add665d75a5a/events.out.tfevents.1738255871.add665d75a5a.10136.1 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255882.add665d75a5a.10136.2 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255910.add665d75a5a.10136.3 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255934.add665d75a5a.10136.4 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255955.add665d75a5a.10136.5 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256044.add665d75a5a.10136.6 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256101.add665d75a5a.10136.7 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256119.add665d75a5a.10136.8 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256140.add665d75a5a.10136.9 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256194.add665d75a5a.10136.10 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256276.add665d75a5a.10136.11 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256300.add665d75a5a.10136.12 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256394.add665d75a5a.10136.13 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256417.add665d75a5a.10136.14 +3 -0
- runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256567.add665d75a5a.10136.15 +3 -0
- special_tokens_map.json +20 -0
- tokenizer.json +3 -0
- tokenizer_config.json +45 -0
- training_args.bin +3 -0
- vocab.json +0 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
adapter_config.json
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"alpha_pattern": {},
|
3 |
+
"auto_mapping": null,
|
4 |
+
"base_model_name_or_path": "Qwen/Qwen2-0.5B-Instruct",
|
5 |
+
"bias": "none",
|
6 |
+
"eva_config": null,
|
7 |
+
"exclude_modules": null,
|
8 |
+
"fan_in_fan_out": false,
|
9 |
+
"inference_mode": true,
|
10 |
+
"init_lora_weights": true,
|
11 |
+
"layer_replication": null,
|
12 |
+
"layers_pattern": null,
|
13 |
+
"layers_to_transform": null,
|
14 |
+
"loftq_config": {},
|
15 |
+
"lora_alpha": 32,
|
16 |
+
"lora_bias": false,
|
17 |
+
"lora_dropout": 0.1,
|
18 |
+
"megatron_config": null,
|
19 |
+
"megatron_core": "megatron.core",
|
20 |
+
"modules_to_save": null,
|
21 |
+
"peft_type": "LORA",
|
22 |
+
"r": 8,
|
23 |
+
"rank_pattern": {},
|
24 |
+
"revision": null,
|
25 |
+
"target_modules": [
|
26 |
+
"q_proj",
|
27 |
+
"v_proj"
|
28 |
+
],
|
29 |
+
"task_type": "CAUSAL_LM",
|
30 |
+
"use_dora": false,
|
31 |
+
"use_rslora": false
|
32 |
+
}
|
adapter_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11b30593f48f463bb0f9339b781e22b531de0f572ae5700775ae2e43e1594bff
|
3 |
+
size 2175168
|
added_tokens.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|endoftext|>": 151643,
|
3 |
+
"<|im_end|>": 151645,
|
4 |
+
"<|im_start|>": 151644
|
5 |
+
}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
runs/Jan30_16-45-36_add665d75a5a/events.out.tfevents.1738255553.add665d75a5a.2008.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0641be9ec4d3744d6a61d81d9a23c99f5c97bed2d89ae1a9ded8fed671c7b1d8
|
3 |
+
size 5377
|
runs/Jan30_16-46-35_add665d75a5a/events.out.tfevents.1738255599.add665d75a5a.2008.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46ba1b7d3f1b01105ba6b062146d34a0b0784b7ab543622a3eb1cd2931f26beb
|
3 |
+
size 4184
|
runs/Jan30_16-46-35_add665d75a5a/events.out.tfevents.1738255647.add665d75a5a.2008.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47863a7c80e52e93a0ded25eb40c475205718ecbf3ff1ecdc3da55027461abdb
|
3 |
+
size 4184
|
runs/Jan30_16-46-35_add665d75a5a/events.out.tfevents.1738255658.add665d75a5a.2008.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2318a3c0e10bee57b7a6e182ad2fa04991a3e8becad96f3d3e4b5b3458856eec
|
3 |
+
size 4184
|
runs/Jan30_16-48-51_add665d75a5a/events.out.tfevents.1738255733.add665d75a5a.10136.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e72161a2992b784545834a7345d403d803d1cadabecaebb2f6670b7bff95e97
|
3 |
+
size 5378
|
runs/Jan30_16-51-05_add665d75a5a/events.out.tfevents.1738255871.add665d75a5a.10136.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8dbc9eb8304f8222de8a1e8cc189a3ddb6ec22d91f6e1381249bf9100efacb39
|
3 |
+
size 5377
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255882.add665d75a5a.10136.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c0228a3c53be4e7651ff562244dc837e16300c1e5227de1eeb75649b213acff
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255910.add665d75a5a.10136.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bcf10625d93167f1dd74a3322bcc64179ae385e93f0c73ac32a1a8f2a9a823e
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255934.add665d75a5a.10136.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29bfe04d74947d0dc8670b06525f2d50c8ae9245cb2327a4ad01909acebb020d
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738255955.add665d75a5a.10136.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9ee817596629f2d8d9f117b849857a181d59389de8413ac4cce9e96e271c1a7
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256044.add665d75a5a.10136.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95ca01c431cb0d9da0b3facd18c739f377884e460cf6619c44d83707e4309a3d
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256101.add665d75a5a.10136.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f41669496c6fc07d697b9dd3af8e2b5832fcc1dbb90deadbf23e4bf501686a9
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256119.add665d75a5a.10136.8
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:886e76759c7792284f7ea7633dd325207135d0f39b0380c28d41adc4e759da65
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256140.add665d75a5a.10136.9
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:524f573d21671b60f2e0c0aa641b18c03d0fbe71baaabe4ce0c3246f3a428600
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256194.add665d75a5a.10136.10
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bff51ee77adeb4bf90ee2d321288d23c1de94c09f408104b03ddaa3c694fe310
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256276.add665d75a5a.10136.11
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eea4ac695cfa875b4ca5937070776107f6c9795517bf4cdb22528bc6f5806fda
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256300.add665d75a5a.10136.12
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fa07ddb55edf315fe526c61fb77afd7a89815e92d8ed12897ea86cb86677618
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256394.add665d75a5a.10136.13
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a34e5d33f32835b71c4e3b3ac6fbf8e4dbcee6bef58c5adb0917c2959afcf5b
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256417.add665d75a5a.10136.14
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77f9e251e47b4b93f3d27592d71d04cd8d8e886cd76a25a51ed01a9e0881c9f7
|
3 |
+
size 5378
|
runs/Jan30_16-51-18_add665d75a5a/events.out.tfevents.1738256567.add665d75a5a.10136.15
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96716cf7800cb1d98573f328f73cb3762b67592c2448d2f93c228d0b39e12952
|
3 |
+
size 5993
|
special_tokens_map.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"additional_special_tokens": [
|
3 |
+
"<|im_start|>",
|
4 |
+
"<|im_end|>"
|
5 |
+
],
|
6 |
+
"eos_token": {
|
7 |
+
"content": "<|im_end|>",
|
8 |
+
"lstrip": false,
|
9 |
+
"normalized": false,
|
10 |
+
"rstrip": false,
|
11 |
+
"single_word": false
|
12 |
+
},
|
13 |
+
"pad_token": {
|
14 |
+
"content": "<|endoftext|>",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": false,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false
|
19 |
+
}
|
20 |
+
}
|
tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7c852534ad33d333aa478034d64cd37cb14da033a24674c4b2518300f488efa
|
3 |
+
size 11418433
|
tokenizer_config.json
ADDED
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"added_tokens_decoder": {
|
4 |
+
"151643": {
|
5 |
+
"content": "<|endoftext|>",
|
6 |
+
"lstrip": false,
|
7 |
+
"normalized": false,
|
8 |
+
"rstrip": false,
|
9 |
+
"single_word": false,
|
10 |
+
"special": true
|
11 |
+
},
|
12 |
+
"151644": {
|
13 |
+
"content": "<|im_start|>",
|
14 |
+
"lstrip": false,
|
15 |
+
"normalized": false,
|
16 |
+
"rstrip": false,
|
17 |
+
"single_word": false,
|
18 |
+
"special": true
|
19 |
+
},
|
20 |
+
"151645": {
|
21 |
+
"content": "<|im_end|>",
|
22 |
+
"lstrip": false,
|
23 |
+
"normalized": false,
|
24 |
+
"rstrip": false,
|
25 |
+
"single_word": false,
|
26 |
+
"special": true
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"additional_special_tokens": [
|
30 |
+
"<|im_start|>",
|
31 |
+
"<|im_end|>"
|
32 |
+
],
|
33 |
+
"bos_token": null,
|
34 |
+
"chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
|
35 |
+
"clean_up_tokenization_spaces": false,
|
36 |
+
"eos_token": "<|im_end|>",
|
37 |
+
"errors": "replace",
|
38 |
+
"extra_special_tokens": {},
|
39 |
+
"model_max_length": 32768,
|
40 |
+
"pad_token": "<|endoftext|>",
|
41 |
+
"padding_side": "left",
|
42 |
+
"split_special_tokens": false,
|
43 |
+
"tokenizer_class": "Qwen2Tokenizer",
|
44 |
+
"unk_token": null
|
45 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d10c5b20cbd66152bffa7dca593c19fca5fa1f6380a6ca69373b1d1b76f6eb4
|
3 |
+
size 5560
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|