gushcloudcashteo committed on
Commit
210a2c3
1 Parent(s): f341bab

falcon-7b-instruct-ft-instagram-adapters-trainer-2

Browse files
README.md CHANGED
@@ -34,7 +34,7 @@ More information needed
34
  ### Training hyperparameters
35
 
36
  The following hyperparameters were used during training:
37
- - learning_rate: 0.0002
38
  - train_batch_size: 4
39
  - eval_batch_size: 8
40
  - seed: 42
@@ -43,7 +43,7 @@ The following hyperparameters were used during training:
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: constant
45
  - lr_scheduler_warmup_ratio: 0.03
46
- - training_steps: 500
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
 
34
  ### Training hyperparameters
35
 
36
  The following hyperparameters were used during training:
37
+ - learning_rate: 0.02
38
  - train_batch_size: 4
39
  - eval_batch_size: 8
40
  - seed: 42
 
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: constant
45
  - lr_scheduler_warmup_ratio: 0.03
46
+ - training_steps: 20
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
adapter_config.json CHANGED
@@ -19,10 +19,10 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
22
  "query_key_value",
23
- "dense_h_to_4h",
24
  "dense",
25
- "dense_4h_to_h"
26
  ],
27
  "task_type": "CAUSAL_LM",
28
  "use_rslora": false
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
+ "dense_4h_to_h",
23
  "query_key_value",
 
24
  "dense",
25
+ "dense_h_to_4h"
26
  ],
27
  "task_type": "CAUSAL_LM",
28
  "use_rslora": false
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4699f11ee549e908e5de2f10521979aa21f6175d1deacfba28c89e8a49c4e225
3
  size 522227376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:effcd3c9f4daf872ebb52d9d050d58f127c2d742267eaeab77f5726ef0046825
3
  size 522227376
runs/Jan18_10-17-25_4e5acb56f0db/events.out.tfevents.1705573053.4e5acb56f0db.4020.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe7b31b4390f14f0f2743f6d1c1576bcab114bbd573e7d56d637df8c40bdc34a
3
+ size 5522
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1f6f70619b34e35719bed8cbe1ba864b41e2510a83f204a94c745e8a6d5b64f
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:928ae454a3915a9895db74def7092addf02f2e7e75b2351a522b166c23d0d42b
3
  size 4664