AjayP13 committed on
Commit
d930e1b
·
verified ·
1 Parent(s): ecc1555

Pushed by DataDreamer

Browse files

Update training_args.json

Files changed (1) hide show
  1. training_args.json +11 -11
training_args.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
- "output_dir": "/project_data/data/train_matcher/train-matching-embedding/_checkpoints",
3
  "overwrite_output_dir": false,
4
  "do_train": false,
5
  "do_eval": true,
6
  "do_predict": false,
7
- "eval_strategy": "epoch",
8
  "prediction_loss_only": false,
9
- "per_device_train_batch_size": 8,
10
- "per_device_eval_batch_size": 8,
11
  "per_gpu_train_batch_size": null,
12
  "per_gpu_eval_batch_size": null,
13
- "gradient_accumulation_steps": 1,
14
  "eval_accumulation_steps": 1,
15
  "eval_delay": 0,
16
  "torch_empty_cache_steps": null,
@@ -20,7 +20,7 @@
20
  "adam_beta2": 0.999,
21
  "adam_epsilon": 1e-08,
22
  "max_grad_norm": 1.0,
23
- "num_train_epochs": 5,
24
  "max_steps": -1,
25
  "lr_scheduler_type": "linear",
26
  "lr_scheduler_kwargs": {},
@@ -29,14 +29,14 @@
29
  "log_level": "passive",
30
  "log_level_replica": "warning",
31
  "log_on_each_node": true,
32
- "logging_dir": "/project_data/data/train_matcher/train-matching-embedding/_checkpoints/runs/Mar03_18-28-25_0b651df549d8",
33
  "logging_strategy": "steps",
34
  "logging_first_step": false,
35
  "logging_steps": 1,
36
  "logging_nan_inf_filter": true,
37
- "save_strategy": "epoch",
38
- "save_steps": 500,
39
- "save_total_limit": 1,
40
  "save_safetensors": false,
41
  "save_on_each_node": false,
42
  "save_only_model": false,
@@ -61,7 +61,7 @@
61
  "tpu_metrics_debug": false,
62
  "debug": [],
63
  "dataloader_drop_last": false,
64
- "eval_steps": null,
65
  "dataloader_num_workers": 0,
66
  "dataloader_prefetch_factor": null,
67
  "past_index": -1,
 
1
  {
2
+ "output_dir": "/mnt/nlpgpu-io1/data/ajayp/output/fineinstructions/dated/2025-03-05-13:09:26/data/train_matcher/train-matching-embedding/_checkpoints",
3
  "overwrite_output_dir": false,
4
  "do_train": false,
5
  "do_eval": true,
6
  "do_predict": false,
7
+ "eval_strategy": "steps",
8
  "prediction_loss_only": false,
9
+ "per_device_train_batch_size": 1,
10
+ "per_device_eval_batch_size": 1,
11
  "per_gpu_train_batch_size": null,
12
  "per_gpu_eval_batch_size": null,
13
+ "gradient_accumulation_steps": 8,
14
  "eval_accumulation_steps": 1,
15
  "eval_delay": 0,
16
  "torch_empty_cache_steps": null,
 
20
  "adam_beta2": 0.999,
21
  "adam_epsilon": 1e-08,
22
  "max_grad_norm": 1.0,
23
+ "num_train_epochs": 3,
24
  "max_steps": -1,
25
  "lr_scheduler_type": "linear",
26
  "lr_scheduler_kwargs": {},
 
29
  "log_level": "passive",
30
  "log_level_replica": "warning",
31
  "log_on_each_node": true,
32
+ "logging_dir": "/mnt/nlpgpu-io1/data/ajayp/output/fineinstructions/dated/2025-03-05-13:09:26/data/train_matcher/train-matching-embedding/_checkpoints/runs/Mar06_20-29-59_nlpgpu04.seas.upenn.edu",
33
  "logging_strategy": "steps",
34
  "logging_first_step": false,
35
  "logging_steps": 1,
36
  "logging_nan_inf_filter": true,
37
+ "save_strategy": "steps",
38
+ "save_steps": 600,
39
+ "save_total_limit": null,
40
  "save_safetensors": false,
41
  "save_on_each_node": false,
42
  "save_only_model": false,
 
61
  "tpu_metrics_debug": false,
62
  "debug": [],
63
  "dataloader_drop_last": false,
64
+ "eval_steps": 600,
65
  "dataloader_num_workers": 0,
66
  "dataloader_prefetch_factor": null,
67
  "past_index": -1,