diff --git a/run_model_cot.sh b/run_model_cot.sh
new file mode 100755
index 0000000..24ac222
--- /dev/null
+++ b/run_model_cot.sh
@@ -0,0 +1,49 @@
+#!/bin/zsh
+
+model_dir="${HOME}/models"
+# parse in model_names from args to script
+model_names=("$@")
+# if model_names is empty, print and exit
+if [ -z "$model_names" ]; then
+  echo "No model names provided"
+  exit 1
+fi
+PORT=8084 # avoid 8081 as it's used by nginx
+export CUDA_VISIBLE_DEVICES=0 # set gpu you want to use (just 1 will do)
+
+# Loop over model names
+for model_name in "${model_names[@]}"; do
+
+  echo "Running model ${model_name}"
+  # first, get the API up
+  python3 utils/api_server.py --model "${model_dir}/${model_name}" --tensor-parallel-size 1 --dtype float16 --max-model-len 8192 --gpu-memory-utilization 0.90 --block-size 16 --disable-log-requests --port "${PORT}" &
+
+  # run a loop to check if the http://localhost:8080/health endpoint returns a valid 200 result
+  while true; do
+    http_status=$(curl -s -o /dev/null -w "%{http_code}" "http://localhost:${PORT}/health")
+    if [ "$http_status" -eq 200 ]; then
+      echo "API server is up and running"
+      break
+    else
+      echo "Waiting for API server to be up..."
+      sleep 1
+    fi
+  done
+
+  # then run sql-eval
+  python3 main.py -db postgres \
+    -f prompts/prompt_cot.md \
+    -q "data/questions_gen_postgres.csv" "data/instruct_basic_postgres.csv" "data/instruct_advanced_postgres.csv" "data/idk.csv" \
+    -o "results/${model_name}/api_v1_cot.csv" "results/${model_name}/api_basic_cot.csv" "results/${model_name}/api_advanced_cot.csv" "results/${model_name}/api_idk_cot.csv" \
+    -g api \
+    -b 1 \
+    -c 0 \
+    --api_url "http://localhost:${PORT}/generate" \
+    --api_type "vllm" \
+    -p 10 \
+    --cot_table_alias "prealias" \
+    --logprobs
+  # finally, kill the api server
+  pkill -9 -f "python3 utils/api_server.py.*--port ${PORT}"
+
+done