Commit 82cb25c1 authored by Yen-Ting Lin
Browse files

Update SLURM script and add new models

parent ce343750
......@@ -3,7 +3,7 @@
# this is a multi-node SLURM script using `accelerate` launcher
#SBATCH --job-name=eval-harness
-#SBATCH --partition=defq
+#SBATCH --partition=no_multi,defq
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1 # crucial - only 1 task per node
#SBATCH --gres=gpu:8 # EDIT this if it's not 8-gpus per node
......
......@@ -3,7 +3,21 @@
# Define the models to run
declare -a models=(
"yentinglin/Llama-3-Taiwan-70B-Instruct"
"yentinglin/Llama-3-Taiwan-70B-Instruct-DPO"
"yentinglin/Llama-3-Taiwan-8B-Instruct-rc1"
"yentinglin/Taiwan-LLM-34B-Instruct"
"yentinglin/Taiwan-LLM-MoE-pilot"
"yentinglin/Taiwan-LLM-8x7B-DPO"
"yentinglin/Taiwan-LLM-7B-v2.0-base"
"yentinglin/Taiwan-LLM-7B-v2.0-chat"
"yentinglin/Taiwan-LLM-7B-v2.0.1-chat"
"yentinglin/Taiwan-LLM-7B-v2.1-chat"
"yentinglin/Taiwan-LLM-13B-v2.0-base"
"yentinglin/Taiwan-LLM-13B-v2.0-chat"
"yentinglin/Taiwan-LLaMa-v1.0"
"yentinglin/Taiwan-LLaMa-v1.0-base"
"yentinglin/Taiwan-LLaMa-v0.9"
"yentinglin/Taiwan-LLaMa-v0.0"
"meta-llama/Meta-Llama-3-70B-Instruct"
"meta-llama/Meta-Llama-3-70B"
"meta-llama/Meta-Llama-3-8B-Instruct"
......@@ -57,6 +71,15 @@ declare -a models=(
"taide/TAIDE-LX-7B-Chat"
"taide/TAIDE-LX-7B"
"microsoft/Phi-3-mini-4k-instruct"
"microsoft/Phi-3-mini-128k-instruct"
"microsoft/Phi-3-small-8k-instruct"
"microsoft/Phi-3-small-128k-instruct"
"microsoft/Phi-3-medium-4k-instruct"
"microsoft/Phi-3-medium-128k-instruct"
"google/gemma-1.1-2b-it"
"google/gemma-1.1-7b-it"
"google/gemma-7b"
"google/gemma-2b"
"apple/OpenELM-3B-Instruct"
)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment