nthungdev committed on
Commit
2db3e83
·
verified ·
1 Parent(s): 4b35f1e

Training complete

Browse files
README.md CHANGED
@@ -40,7 +40,7 @@ The following hyperparameters were used during training:
40
  - train_batch_size: 32
41
  - eval_batch_size: 64
42
  - seed: 42
43
- - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
44
  - lr_scheduler_type: linear
45
  - num_epochs: 3
46
  - mixed_precision_training: Native AMP
@@ -51,7 +51,7 @@ The following hyperparameters were used during training:
51
 
52
  ### Framework versions
53
 
54
- - Transformers 4.46.2
55
  - Pytorch 2.5.1+cu121
56
  - Datasets 3.1.0
57
  - Tokenizers 0.20.3
 
40
  - train_batch_size: 32
41
  - eval_batch_size: 64
42
  - seed: 42
43
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: linear
45
  - num_epochs: 3
46
  - mixed_precision_training: Native AMP
 
51
 
52
  ### Framework versions
53
 
54
+ - Transformers 4.45.2
55
  - Pytorch 2.5.1+cu121
56
  - Datasets 3.1.0
57
  - Tokenizers 0.20.3
generation_config.json CHANGED
@@ -12,5 +12,5 @@
12
  "num_beams": 4,
13
  "pad_token_id": 46275,
14
  "renormalize_logits": true,
15
- "transformers_version": "4.46.2"
16
  }
 
12
  "num_beams": 4,
13
  "pad_token_id": 46275,
14
  "renormalize_logits": true,
15
+ "transformers_version": "4.45.2"
16
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23e0d8894883d106c7fefd931b5ee647e5856c191dfe1cb918e4cc3df8822aa6
3
  size 271541392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e6e144efcc29fc46b9d4925b8115d7290ce27f093655549c50d3aef771442a8
3
  size 271541392
runs/Dec02_08-31-51_4bb14ee925ea/events.out.tfevents.1733128992.4bb14ee925ea.1931.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07753b81c7eb437492b39f8e07289bffbd9f06bd2aeb0c8dbb54218533ae91cb
3
- size 9134
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2c66ae84da2c81c77cbdf797b877c934c3e11ef5c61e480ce2baa3f833fe3b0
3
+ size 11176