inflaton committed on
Commit
bc0d2ff
·
1 Parent(s): 0d2096e

attempted gemma2

Browse files
llama-factory/config/{gemma2_9b_lora_sft-p1.yaml → gemma2-9b_lora_sft_bf16-p1.yaml} RENAMED
@@ -13,7 +13,7 @@ upcast_layernorm: true
13
 
14
  ### dataset
15
  dataset: alpaca_mgtv_p1
16
- template: gemma2
17
  cutoff_len: 4096
18
  max_samples: 25000
19
  overwrite_cache: true
@@ -44,4 +44,4 @@ eval_strategy: steps
44
  eval_steps: 2109
45
 
46
  report_to: wandb
47
- run_name: qwen2_72b_4bit_p1_full # optional
 
13
 
14
  ### dataset
15
  dataset: alpaca_mgtv_p1
16
+ template: gemma
17
  cutoff_len: 4096
18
  max_samples: 25000
19
  overwrite_cache: true
 
44
  eval_steps: 2109
45
 
46
  report_to: wandb
47
+ run_name: gemma2_9b_p1_full # optional
scripts/tune-mgtv-gemma2_9b.sh CHANGED
@@ -14,7 +14,9 @@ lscpu
14
  grep MemTotal /proc/meminfo
15
 
16
  #pip install -r requirements.txt
17
- #cd ../LLaMA-Factory && pip install -e .[torch,bitsandbytes]
 
 
18
 
19
  export LOGICAL_REASONING_DATA_PATH=datasets/mgtv
20
 
 
14
  grep MemTotal /proc/meminfo
15
 
16
  #pip install -r requirements.txt
17
+ cd ../LLaMA-Factory && pip install -e .[torch,bitsandbytes] && cd $BASEDIR
18
+ #pip install -U transformers
19
+ #pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
20
 
21
  export LOGICAL_REASONING_DATA_PATH=datasets/mgtv
22
 
scripts/tune-mgtv.sh CHANGED
@@ -1 +1 @@
1
- tune-mgtv-qwen2_72b.sh
 
1
+ tune-mgtv-gemma2_9b.sh