logical-reasoning / scripts /tune-mgtv-llama3_8b.sh
inflaton's picture
llama3 8b base model results
ad9400c
raw
history blame
923 Bytes
#!/bin/sh
# Driver script: runs scripts/tune-lf.sh for two config files and then
# scripts/eval-mgtv-llama3_8b.sh, all relative to the parent directory of
# the directory this script lives in.

# Directory containing this script, as given on the command line.
BASEDIR=$(dirname "$0")

# Move to that directory's parent so the relative paths used later (config/,
# datasets/, scripts/) resolve from there. Abort if the move fails: carrying
# on would record the wrong BASEDIR and run everything from the wrong place.
cd "$BASEDIR/.." || {
  echo "cannot change directory to $BASEDIR/.." >&2
  exit 1
}
echo Current Directory:
pwd

# From here on BASEDIR is the absolute path of the working directory.
BASEDIR=$(pwd)
# Print a snapshot of the host the job runs on: nvidia-smi output, kernel
# identification, OS release file, CPU description and the MemTotal line
# from /proc/meminfo. Nothing is captured; everything goes to the log.
report_host_info() {
  nvidia-smi
  uname -a
  cat /etc/os-release
  lscpu
  grep MemTotal /proc/meminfo
}
report_host_info
# Dependency installation commands, currently disabled. Uncomment the ones
# needed to (re)install packages before tuning.
#pip install -r requirements.txt
#cd ../LLaMA-Factory && pip install -e .[torch,bitsandbytes] && cd $BASEDIR
#pip install transformers==4.41.2
#pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
# Dataset path and model selection, exported so they are present in the
# environment of the child scripts started below.
export LOGICAL_REASONING_DATA_PATH=datasets/mgtv
#export MODEL_NAME=FlagAlpha/Llama3-Chinese-8B-Instruct
export MODEL_NAME=shenzhi-wang/Llama3-8B-Chinese-Chat
export MODEL_PREFIX=llama3-8b_lora_sft_bf16

# Run the tuning script once per config variant, p1 first and then p2.
# CONFIG_FILE is re-exported on every pass, so it still holds the p2 path
# when the evaluation script starts. All expansions are quoted so that a
# checkout path containing spaces or glob characters is passed as one word.
# A failing pass does not stop the remaining steps (same as before).
for variant in p1 p2; do
  export CONFIG_FILE="config/${MODEL_PREFIX}-${variant}.yaml"
  echo "Tuning $MODEL_NAME with $CONFIG_FILE"
  "$BASEDIR/scripts/tune-lf.sh" "$CONFIG_FILE"
done

# Evaluate after both tuning passes have been attempted.
"$BASEDIR/scripts/eval-mgtv-llama3_8b.sh"