Femboyuwu2000
commited on
Commit
•
c8aef10
1
Parent(s):
0c3458c
Training in progress, step 40
Browse files- adapter_model.safetensors +1 -1
- runs/Apr13_02-50-02_4be9d1bc899e/events.out.tfevents.1712977457.4be9d1bc899e.109.0 +2 -2
- wandb/debug-internal.log +22 -0
- wandb/run-20240413_030720-hqqism3w/files/config.yaml +16 -0
- wandb/run-20240413_030720-hqqism3w/files/output.log +2 -0
- wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json +1 -1
- wandb/run-20240413_030720-hqqism3w/logs/debug-internal.log +22 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 12803224
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7598e4d11a7e88a2cd048c7d81b03a00065ebccc133982b8a62f1502da78a828
|
3 |
size 12803224
|
runs/Apr13_02-50-02_4be9d1bc899e/events.out.tfevents.1712977457.4be9d1bc899e.109.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce87010a8fba3aeaebae80900ef8dc44dbc7334adfc638b206adfd2654ee5d75
|
3 |
+
size 5696
|
wandb/debug-internal.log
CHANGED
@@ -86,3 +86,25 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
|
|
86 |
2024-04-13 03:08:10,148 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: summary_record
|
87 |
2024-04-13 03:08:10,150 INFO SenderThread:162 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
|
88 |
2024-04-13 03:08:10,396 INFO Thread-12 :162 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
86 |
2024-04-13 03:08:10,148 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: summary_record
|
87 |
2024-04-13 03:08:10,150 INFO SenderThread:162 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
|
88 |
2024-04-13 03:08:10,396 INFO Thread-12 :162 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json
|
89 |
+
2024-04-13 03:08:12,938 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
90 |
+
2024-04-13 03:08:13,397 INFO Thread-12 :162 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/output.log
|
91 |
+
2024-04-13 03:08:17,938 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
92 |
+
2024-04-13 03:08:21,491 DEBUG SystemMonitor:162 [system_monitor.py:_start():172] Starting system metrics aggregation loop
|
93 |
+
2024-04-13 03:08:21,492 DEBUG SenderThread:162 [sender.py:send():379] send: stats
|
94 |
+
2024-04-13 03:08:22,561 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: stop_status
|
95 |
+
2024-04-13 03:08:22,562 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: stop_status
|
96 |
+
2024-04-13 03:08:22,566 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: internal_messages
|
97 |
+
2024-04-13 03:08:23,629 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
98 |
+
2024-04-13 03:08:24,401 INFO Thread-12 :162 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/config.yaml
|
99 |
+
2024-04-13 03:08:28,735 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
100 |
+
2024-04-13 03:08:33,736 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
101 |
+
2024-04-13 03:08:37,561 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: stop_status
|
102 |
+
2024-04-13 03:08:37,562 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: stop_status
|
103 |
+
2024-04-13 03:08:37,602 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: internal_messages
|
104 |
+
2024-04-13 03:08:39,617 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
105 |
+
2024-04-13 03:08:44,618 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
106 |
+
2024-04-13 03:08:45,115 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: partial_history
|
107 |
+
2024-04-13 03:08:45,116 DEBUG SenderThread:162 [sender.py:send():379] send: history
|
108 |
+
2024-04-13 03:08:45,116 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: summary_record
|
109 |
+
2024-04-13 03:08:45,118 INFO SenderThread:162 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
|
110 |
+
2024-04-13 03:08:45,409 INFO Thread-12 :162 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json
|
wandb/run-20240413_030720-hqqism3w/files/config.yaml
CHANGED
@@ -58,6 +58,22 @@ _wandb:
|
|
58 |
- 1: train/global_step
|
59 |
6:
|
60 |
- 3
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
61 |
vocab_size:
|
62 |
desc: null
|
63 |
value: 250880
|
|
|
58 |
- 1: train/global_step
|
59 |
6:
|
60 |
- 3
|
61 |
+
- 1: train/loss
|
62 |
+
5: 1
|
63 |
+
6:
|
64 |
+
- 1
|
65 |
+
- 1: train/grad_norm
|
66 |
+
5: 1
|
67 |
+
6:
|
68 |
+
- 1
|
69 |
+
- 1: train/learning_rate
|
70 |
+
5: 1
|
71 |
+
6:
|
72 |
+
- 1
|
73 |
+
- 1: train/epoch
|
74 |
+
5: 1
|
75 |
+
6:
|
76 |
+
- 1
|
77 |
vocab_size:
|
78 |
desc: null
|
79 |
value: 250880
|
wandb/run-20240413_030720-hqqism3w/files/output.log
CHANGED
@@ -1 +1,3 @@
|
|
|
|
|
|
1 |
/opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
|
|
|
1 |
+
/opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
|
2 |
+
warnings.warn(
|
3 |
/opt/conda/lib/python3.10/site-packages/torch/utils/checkpoint.py:429: UserWarning: torch.utils.checkpoint: please pass in use_reentrant=True or use_reentrant=False explicitly. The default value of use_reentrant will be updated to be False in the future. To maintain current behavior, pass use_reentrant=True. It is recommended that you use use_reentrant=False. Refer to docs for more details on the differences between the two variants.
|
wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"train/loss": 3.
|
|
|
1 |
+
{"train/loss": 3.7271, "train/grad_norm": 90.37364196777344, "train/learning_rate": 3.3333333333333333e-06, "train/epoch": 0.0, "train/global_step": 40, "_timestamp": 1712977725.1147408, "_runtime": 84.30216884613037, "_step": 1}
|
wandb/run-20240413_030720-hqqism3w/logs/debug-internal.log
CHANGED
@@ -86,3 +86,25 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
|
|
86 |
2024-04-13 03:08:10,148 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: summary_record
|
87 |
2024-04-13 03:08:10,150 INFO SenderThread:162 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
|
88 |
2024-04-13 03:08:10,396 INFO Thread-12 :162 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
86 |
2024-04-13 03:08:10,148 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: summary_record
|
87 |
2024-04-13 03:08:10,150 INFO SenderThread:162 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
|
88 |
2024-04-13 03:08:10,396 INFO Thread-12 :162 [dir_watcher.py:_on_file_created():271] file/dir created: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json
|
89 |
+
2024-04-13 03:08:12,938 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
90 |
+
2024-04-13 03:08:13,397 INFO Thread-12 :162 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/output.log
|
91 |
+
2024-04-13 03:08:17,938 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
92 |
+
2024-04-13 03:08:21,491 DEBUG SystemMonitor:162 [system_monitor.py:_start():172] Starting system metrics aggregation loop
|
93 |
+
2024-04-13 03:08:21,492 DEBUG SenderThread:162 [sender.py:send():379] send: stats
|
94 |
+
2024-04-13 03:08:22,561 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: stop_status
|
95 |
+
2024-04-13 03:08:22,562 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: stop_status
|
96 |
+
2024-04-13 03:08:22,566 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: internal_messages
|
97 |
+
2024-04-13 03:08:23,629 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
98 |
+
2024-04-13 03:08:24,401 INFO Thread-12 :162 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/config.yaml
|
99 |
+
2024-04-13 03:08:28,735 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
100 |
+
2024-04-13 03:08:33,736 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
101 |
+
2024-04-13 03:08:37,561 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: stop_status
|
102 |
+
2024-04-13 03:08:37,562 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: stop_status
|
103 |
+
2024-04-13 03:08:37,602 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: internal_messages
|
104 |
+
2024-04-13 03:08:39,617 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
105 |
+
2024-04-13 03:08:44,618 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: status_report
|
106 |
+
2024-04-13 03:08:45,115 DEBUG HandlerThread:162 [handler.py:handle_request():146] handle_request: partial_history
|
107 |
+
2024-04-13 03:08:45,116 DEBUG SenderThread:162 [sender.py:send():379] send: history
|
108 |
+
2024-04-13 03:08:45,116 DEBUG SenderThread:162 [sender.py:send_request():406] send_request: summary_record
|
109 |
+
2024-04-13 03:08:45,118 INFO SenderThread:162 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
|
110 |
+
2024-04-13 03:08:45,409 INFO Thread-12 :162 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240413_030720-hqqism3w/files/wandb-summary.json
|