ivangrapher committed on
Commit
fe84df4
·
verified ·
1 Parent(s): 6edd05f

Training in progress, step 30, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
 
23
  "o_proj",
24
- "v_proj",
25
  "down_proj",
26
  "gate_proj",
27
- "up_proj",
28
- "q_proj",
29
- "k_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "k_proj",
24
+ "up_proj",
25
+ "q_proj",
26
  "o_proj",
 
27
  "down_proj",
28
  "gate_proj",
29
+ "v_proj"
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
last-checkpoint/trainer_state.json CHANGED
@@ -11,9 +11,9 @@
11
  {
12
  "epoch": 0.0030075187969924814,
13
  "eval_loss": NaN,
14
- "eval_runtime": 26.6856,
15
- "eval_samples_per_second": 5.246,
16
- "eval_steps_per_second": 2.623,
17
  "step": 1
18
  },
19
  {
@@ -26,9 +26,9 @@
26
  {
27
  "epoch": 0.015037593984962405,
28
  "eval_loss": NaN,
29
- "eval_runtime": 27.5034,
30
- "eval_samples_per_second": 5.09,
31
- "eval_steps_per_second": 2.545,
32
  "step": 5
33
  },
34
  {
@@ -48,9 +48,9 @@
48
  {
49
  "epoch": 0.03007518796992481,
50
  "eval_loss": NaN,
51
- "eval_runtime": 27.5491,
52
- "eval_samples_per_second": 5.082,
53
- "eval_steps_per_second": 2.541,
54
  "step": 10
55
  },
56
  {
@@ -70,9 +70,9 @@
70
  {
71
  "epoch": 0.045112781954887216,
72
  "eval_loss": NaN,
73
- "eval_runtime": 27.6227,
74
- "eval_samples_per_second": 5.068,
75
- "eval_steps_per_second": 2.534,
76
  "step": 15
77
  },
78
  {
@@ -85,9 +85,9 @@
85
  {
86
  "epoch": 0.06015037593984962,
87
  "eval_loss": NaN,
88
- "eval_runtime": 27.5039,
89
- "eval_samples_per_second": 5.09,
90
- "eval_steps_per_second": 2.545,
91
  "step": 20
92
  },
93
  {
@@ -107,9 +107,9 @@
107
  {
108
  "epoch": 0.07518796992481203,
109
  "eval_loss": NaN,
110
- "eval_runtime": 27.5947,
111
- "eval_samples_per_second": 5.073,
112
- "eval_steps_per_second": 2.537,
113
  "step": 25
114
  },
115
  {
@@ -129,9 +129,9 @@
129
  {
130
  "epoch": 0.09022556390977443,
131
  "eval_loss": NaN,
132
- "eval_runtime": 27.6176,
133
- "eval_samples_per_second": 5.069,
134
- "eval_steps_per_second": 2.535,
135
  "step": 30
136
  }
137
  ],
 
11
  {
12
  "epoch": 0.0030075187969924814,
13
  "eval_loss": NaN,
14
+ "eval_runtime": 27.481,
15
+ "eval_samples_per_second": 5.094,
16
+ "eval_steps_per_second": 2.547,
17
  "step": 1
18
  },
19
  {
 
26
  {
27
  "epoch": 0.015037593984962405,
28
  "eval_loss": NaN,
29
+ "eval_runtime": 27.5842,
30
+ "eval_samples_per_second": 5.075,
31
+ "eval_steps_per_second": 2.538,
32
  "step": 5
33
  },
34
  {
 
48
  {
49
  "epoch": 0.03007518796992481,
50
  "eval_loss": NaN,
51
+ "eval_runtime": 27.6578,
52
+ "eval_samples_per_second": 5.062,
53
+ "eval_steps_per_second": 2.531,
54
  "step": 10
55
  },
56
  {
 
70
  {
71
  "epoch": 0.045112781954887216,
72
  "eval_loss": NaN,
73
+ "eval_runtime": 26.6388,
74
+ "eval_samples_per_second": 5.255,
75
+ "eval_steps_per_second": 2.628,
76
  "step": 15
77
  },
78
  {
 
85
  {
86
  "epoch": 0.06015037593984962,
87
  "eval_loss": NaN,
88
+ "eval_runtime": 27.7237,
89
+ "eval_samples_per_second": 5.05,
90
+ "eval_steps_per_second": 2.525,
91
  "step": 20
92
  },
93
  {
 
107
  {
108
  "epoch": 0.07518796992481203,
109
  "eval_loss": NaN,
110
+ "eval_runtime": 27.6693,
111
+ "eval_samples_per_second": 5.06,
112
+ "eval_steps_per_second": 2.53,
113
  "step": 25
114
  },
115
  {
 
129
  {
130
  "epoch": 0.09022556390977443,
131
  "eval_loss": NaN,
132
+ "eval_runtime": 24.5914,
133
+ "eval_samples_per_second": 5.693,
134
+ "eval_steps_per_second": 2.847,
135
  "step": 30
136
  }
137
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aadbb2cc0e6d20d3373ebcf4dbeb7b0874555a2254d75c2babdcd1a27f59d922
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20186f755d00f92880a9ff8e59a22ed00993d2306608766329a7eb9705257573
3
  size 6776