ben81828 commited on
Commit
847c72c
·
verified ·
1 Parent(s): d5799e2

Training in progress, step 3400, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b41c1be8b974e693981390b4f8ea3183b990f4c6cbeb85e09c310968df2c797
3
  size 29034840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d712f05560ef9d87500810ebe4e96f57f0c9005ed8838b0dd018fe564e447831
3
  size 29034840
last-checkpoint/global_step3400/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90042a29ea832b455e0b0febb703a80c27669d31f9276f94b31408d71131b4eb
3
+ size 43429616
last-checkpoint/global_step3400/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb05ce0de6c9cc9511842de2c347ed48abb1f8974e7d760fcd5aa31191bad35
3
+ size 43429616
last-checkpoint/global_step3400/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bba280d3f32e7dc1f7458fecad62f8a761d5d50be21d68ad1b200a64ca75a15e
3
+ size 43429616
last-checkpoint/global_step3400/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bee7623add4bb2ee37b178a4b5c0be5536d5ad2b1dc326c8ce3238e32b4cca1b
3
+ size 43429616
last-checkpoint/global_step3400/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f0a5054eba9f5f2ca369e0534352b8e94fdf765e97f88e64f72db4ba475921
3
+ size 637299
last-checkpoint/global_step3400/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f4d45ab2afd18d672717de6056f7b8589be6a43ccd2a95722949876973300f7
3
+ size 637171
last-checkpoint/global_step3400/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea3071cbf7dfa8e2d404c25c04d958ee3c7a04c22c8522cafd06b4dff7601dd9
3
+ size 637171
last-checkpoint/global_step3400/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4167c44ffe9ec068048477eaf74c83fdb2ca9cf033c480fee6e89e70506c8e98
3
+ size 637171
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step3350
 
1
+ global_step3400
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26d08ced4d0f6490515a22c9e9401cc7f71de8b6e2c1525e9c8dac221d4b80ab
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abe9163f042a56ab41ea5c2436dff084d8a4a6358e7f4cb1f18e04cb69810300
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:182d3e4bee7983edebdece2816547628c5ac3e14f5b53eac54c08ad9cbfbfac7
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c621ead8d06a0f1d00c5217cc2cfdc90c8c62fa1cb0da0986461ec51fd1766b
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:674c98433de6d8eccea8d9f711e54aa6a237220bb981e22133b7735c14dc835f
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eff8dbefa4ff395a5376144d756cbe824baaab98a892f200d30b7916c24d27cf
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e6ca2e2b0a88474561faf5e462ebee1de20672630f977a22533f633eb059d6d
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd67eb847a256b4f0de5857c5e8a43697485d1a0f6032004d0bc19149d77879c
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df3be552cf2524f9ece2b6a286f0ce246d18d14d42f9b8c771a555e051bcee33
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5fc2897164e26dbf189cf39613143884cb612b3f808a6a18c481ece64d73bc7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.4145541489124298,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_stenosis_detect_scale4/lora/sft/checkpoint-2350",
4
- "epoch": 0.8627349987123358,
5
  "eval_steps": 50,
6
- "global_step": 3350,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5970,11 +5970,100 @@
5970
  "eval_steps_per_second": 0.798,
5971
  "num_input_tokens_seen": 35179104,
5972
  "step": 3350
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5973
  }
5974
  ],
5975
  "logging_steps": 5,
5976
  "max_steps": 3400,
5977
- "num_input_tokens_seen": 35179104,
5978
  "num_train_epochs": 1,
5979
  "save_steps": 50,
5980
  "stateful_callbacks": {
@@ -5984,12 +6073,12 @@
5984
  "should_evaluate": false,
5985
  "should_log": false,
5986
  "should_save": true,
5987
- "should_training_stop": false
5988
  },
5989
  "attributes": {}
5990
  }
5991
  },
5992
- "total_flos": 2321016547704832.0,
5993
  "train_batch_size": 1,
5994
  "trial_name": null,
5995
  "trial_params": null
 
1
  {
2
  "best_metric": 0.4145541489124298,
3
  "best_model_checkpoint": "saves/CADICA_qwenvl_stenosis_detect_scale4/lora/sft/checkpoint-2350",
4
+ "epoch": 0.8756116404841617,
5
  "eval_steps": 50,
6
+ "global_step": 3400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5970
  "eval_steps_per_second": 0.798,
5971
  "num_input_tokens_seen": 35179104,
5972
  "step": 3350
5973
+ },
5974
+ {
5975
+ "epoch": 0.8640226628895185,
5976
+ "grad_norm": 5.553235621230406,
5977
+ "learning_rate": 4.788399817602929e-08,
5978
+ "loss": 0.3179,
5979
+ "num_input_tokens_seen": 35231608,
5980
+ "step": 3355
5981
+ },
5982
+ {
5983
+ "epoch": 0.865310327066701,
5984
+ "grad_norm": 4.202242288396885,
5985
+ "learning_rate": 3.7835537837338506e-08,
5986
+ "loss": 0.2829,
5987
+ "num_input_tokens_seen": 35284448,
5988
+ "step": 3360
5989
+ },
5990
+ {
5991
+ "epoch": 0.8665979912438836,
5992
+ "grad_norm": 3.6414795103608255,
5993
+ "learning_rate": 2.8968690057051828e-08,
5994
+ "loss": 0.2579,
5995
+ "num_input_tokens_seen": 35336520,
5996
+ "step": 3365
5997
+ },
5998
+ {
5999
+ "epoch": 0.8678856554210662,
6000
+ "grad_norm": 4.481511308866539,
6001
+ "learning_rate": 2.128366453743591e-08,
6002
+ "loss": 0.2862,
6003
+ "num_input_tokens_seen": 35388728,
6004
+ "step": 3370
6005
+ },
6006
+ {
6007
+ "epoch": 0.8691733195982487,
6008
+ "grad_norm": 4.3032070874799,
6009
+ "learning_rate": 1.4780643030476438e-08,
6010
+ "loss": 0.2812,
6011
+ "num_input_tokens_seen": 35441824,
6012
+ "step": 3375
6013
+ },
6014
+ {
6015
+ "epoch": 0.8704609837754314,
6016
+ "grad_norm": 5.8821140210764336,
6017
+ "learning_rate": 9.459779333587104e-09,
6018
+ "loss": 0.3174,
6019
+ "num_input_tokens_seen": 35495128,
6020
+ "step": 3380
6021
+ },
6022
+ {
6023
+ "epoch": 0.871748647952614,
6024
+ "grad_norm": 7.380544386822247,
6025
+ "learning_rate": 5.3211992859791835e-09,
6026
+ "loss": 0.3049,
6027
+ "num_input_tokens_seen": 35548144,
6028
+ "step": 3385
6029
+ },
6030
+ {
6031
+ "epoch": 0.8730363121297966,
6032
+ "grad_norm": 1.5375610441333851,
6033
+ "learning_rate": 2.3650007656805806e-09,
6034
+ "loss": 0.2882,
6035
+ "num_input_tokens_seen": 35600936,
6036
+ "step": 3390
6037
+ },
6038
+ {
6039
+ "epoch": 0.8743239763069791,
6040
+ "grad_norm": 6.170480848656164,
6041
+ "learning_rate": 5.912536872321184e-10,
6042
+ "loss": 0.2789,
6043
+ "num_input_tokens_seen": 35653896,
6044
+ "step": 3395
6045
+ },
6046
+ {
6047
+ "epoch": 0.8756116404841617,
6048
+ "grad_norm": 5.211578123351505,
6049
+ "learning_rate": 0.0,
6050
+ "loss": 0.3187,
6051
+ "num_input_tokens_seen": 35706848,
6052
+ "step": 3400
6053
+ },
6054
+ {
6055
+ "epoch": 0.8756116404841617,
6056
+ "eval_loss": 0.4701705873012543,
6057
+ "eval_runtime": 37.5324,
6058
+ "eval_samples_per_second": 3.197,
6059
+ "eval_steps_per_second": 0.799,
6060
+ "num_input_tokens_seen": 35706848,
6061
+ "step": 3400
6062
  }
6063
  ],
6064
  "logging_steps": 5,
6065
  "max_steps": 3400,
6066
+ "num_input_tokens_seen": 35706848,
6067
  "num_train_epochs": 1,
6068
  "save_steps": 50,
6069
  "stateful_callbacks": {
 
6073
  "should_evaluate": false,
6074
  "should_log": false,
6075
  "should_save": true,
6076
+ "should_training_stop": true
6077
  },
6078
  "attributes": {}
6079
  }
6080
  },
6081
+ "total_flos": 2355853440057344.0,
6082
  "train_batch_size": 1,
6083
  "trial_name": null,
6084
  "trial_params": null