Update SLURM script and add new models

82cb25c1 · Yen-Ting Lin · ce343750 · 82cb25c1 · 82cb25c1
Commit 82cb25c1 authored Jun 13, 2024 by Yen-Ting Lin
Hide whitespace changes
Inline Side-by-side

Showing with 24 additions and 1 deletion

harness_eval.slurm +1 -1

run_all.sh +23 -0
--- a/harness_eval.slurm
+++ b/harness_eval.slurm
@@ -3,7 +3,7 @@
 # this is a multi-node SLURM script using `accelerate` launcher
 #SBATCH --job-name=eval-harness
-#SBATCH --partition=defq
+#SBATCH --partition=no_multi,defq
 #SBATCH --nodes=1
 #SBATCH --ntasks-per-node=1          # crucial - only 1 task per node
 #SBATCH --gres=gpu:8                 # EDIT this if it's not 8-gpus per node

--- a/run_all.sh
+++ b/run_all.sh
@@ -3,7 +3,21 @@
 # Define the models to run
 declare -a models=(
 "yentinglin/Llama-3-Taiwan-70B-Instruct"
+"yentinglin/Llama-3-Taiwan-70B-Instruct-DPO"
 "yentinglin/Llama-3-Taiwan-8B-Instruct-rc1"
+"yentinglin/Taiwan-LLM-34B-Instruct"
+"yentinglin/Taiwan-LLM-MoE-pilot"
+"yentinglin/Taiwan-LLM-8x7B-DPO"
+"yentinglin/Taiwan-LLM-7B-v2.0-base"
+"yentinglin/Taiwan-LLM-7B-v2.0-chat"
+"yentinglin/Taiwan-LLM-7B-v2.0.1-chat"
+"yentinglin/Taiwan-LLM-7B-v2.1-chat"
+"yentinglin/Taiwan-LLM-13B-v2.0-base"
+"yentinglin/Taiwan-LLM-13B-v2.0-chat"
+"yentinglin/Taiwan-LLaMa-v1.0"
+"yentinglin/Taiwan-LLaMa-v1.0-base"
+"yentinglin/Taiwan-LLaMa-v0.9"
+"yentinglin/Taiwan-LLaMa-v0.0"
 "meta-llama/Meta-Llama-3-70B-Instruct"
 "meta-llama/Meta-Llama-3-70B"
 "meta-llama/Meta-Llama-3-8B-Instruct"
@@ -57,6 +71,15 @@ declare -a models=(
 "taide/TAIDE-LX-7B-Chat"
 "taide/TAIDE-LX-7B"
 "microsoft/Phi-3-mini-4k-instruct"
+"microsoft/Phi-3-mini-128k-instruct"
+"microsoft/Phi-3-small-8k-instruct"
+"microsoft/Phi-3-small-128k-instruct"
+"microsoft/Phi-3-medium-4k-instruct"
+"microsoft/Phi-3-medium-128k-instruct"
+"google/gemma-1.1-2b-it"
+"google/gemma-1.1-7b-it"
+"google/gemma-7b"
+"google/gemma-2b"
 "apple/OpenELM-3B-Instruct"
 )