Skip to content

Commit 690a56a

Browse files
silviase and claude committed
feat: Update model list and HPC configurations for nvlink
- Sync MODEL_LIST in make_leaderboard.py with eval.sh
- Add new models: Qwen2-VL variants, Llama-3.2-90B, gemma-3 pt variants, Heron-NVILA-Lite models
- Comment out deprecated models to match eval.sh configuration
- Update eval.sh time limit to 24 hours and use /data directory for caching
- Fix ring.sh to use correct project paths

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <[email protected]>
1 parent 5d1fc4e commit 690a56a

File tree

3 files changed

+31
-19
lines changed

3 files changed

+31
-19
lines changed

scripts/make_leaderboard.py

Lines changed: 22 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -52,31 +52,42 @@
5252
}
5353

5454
MODEL_LIST = [
55-
"stabilityai/japanese-instructblip-alpha",
55+
# "stabilityai/japanese-instructblip-alpha",
5656
"stabilityai/japanese-stable-vlm",
57-
"SakanaAI/Llama-3-EvoVLM-JP-v2",
5857
"cyberagent/llava-calm2-siglip",
59-
"llm-jp/llm-jp-3-vila-14b",
60-
"sbintuitions/sarashina2-vision-8b",
61-
"sbintuitions/sarashina2-vision-14b",
62-
"MIL-UT/Asagi-14B",
6358
"llava-hf/llava-1.5-7b-hf",
6459
"llava-hf/llava-v1.6-mistral-7b-hf",
6560
"neulab/Pangea-7B-hf",
66-
"mistralai/Pixtral-12B-2409",
6761
"meta-llama/Llama-3.2-11B-Vision-Instruct",
68-
"Efficient-Large-Model/VILA1.5-13b",
69-
"OpenGVLab/InternVL2-8B",
70-
"OpenGVLab/InternVL2-26B",
62+
"meta-llama/Llama-3.2-90B-Vision-Instruct",
63+
# "OpenGVLab/InternVL2-8B",
64+
# "OpenGVLab/InternVL2-26B",
65+
"Qwen/Qwen2-VL-7B-Instruct",
66+
"Qwen/Qwen2-VL-72B-Instruct",
67+
"Qwen/Qwen2.5-VL-3B-Instruct",
7168
"Qwen/Qwen2.5-VL-7B-Instruct",
7269
"Qwen/Qwen2.5-VL-32B-Instruct",
7370
"Qwen/Qwen2.5-VL-72B-Instruct",
71+
"gpt-4o-2024-11-20",
72+
# "mistralai/Pixtral-12B-2409",
73+
"llm-jp/llm-jp-3-vila-14b",
74+
# "Efficient-Large-Model/VILA1.5-13b",
75+
"SakanaAI/Llama-3-EvoVLM-JP-v2",
7476
"google/gemma-3-4b-it",
7577
"google/gemma-3-12b-it",
7678
"google/gemma-3-27b-it",
79+
"google/gemma-3-4b-pt",
80+
"google/gemma-3-12b-pt",
81+
"google/gemma-3-27b-pt",
82+
# "tokyotech-llm/gemma3_4b_exp8-checkpoint-50000",
83+
"sbintuitions/sarashina2-vision-8b",
84+
"sbintuitions/sarashina2-vision-14b",
7785
"microsoft/Phi-4-multimodal-instruct",
78-
"gpt-4o-2024-11-20",
86+
"MIL-UT/Asagi-14B",
87+
"turing-motors/Heron-NVILA-Lite-1B",
88+
"turing-motors/Heron-NVILA-Lite-2B",
7989
"turing-motors/Heron-NVILA-Lite-15B",
90+
"turing-motors/Heron-NVILA-Lite-33B",
8091
]
8192

8293

scripts/nvlink/eval.sh

Lines changed: 6 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
#!/bin/bash
22
#SBATCH --job-name=llm-jp-eval-mm
3-
#SBATCH --time=2:00:00
3+
#SBATCH --time=24:00:00
44
#SBATCH --gres=gpu:NUM_GPUS
55
#SBATCH --ntasks=1
66
#SBATCH --cpus-per-task=8
@@ -20,10 +20,11 @@ num_gpus=${4:-1} # Default to 1 GPU if not specified
2020
# PATH config
2121
export PATH="$HOME/.local/bin:$PATH"
2222
export ROOT_DIR="/home/silviase/"
23-
export HF_HOME="$ROOT_DIR/.hf_cache"
24-
export HF_DATASETS_CACHE=$HF_HOME/datasets
25-
export HF_HUB_CACHE=$HF_HOME/models
26-
export APPTAINER_CACHEDIR="$ROOT_DIR/apptainer_cache"
23+
export DATA_DIR="/data/silviase/"
24+
export HF_HOME="$DATA_DIR/.hf_cache"
25+
export HF_DATASETS_CACHE=$DATA_DIR/datasets
26+
export HF_HUB_CACHE=$DATA_DIR/models
27+
export APPTAINER_CACHEDIR="$DATA_DIR/apptainer_cache"
2728

2829
# Environment Variables
2930
export TORCH_COMPILE_DISABLE=1

scripts/nvlink/ring.sh

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -7,8 +7,8 @@ EXIT_CODE=${1:-0}
77
JOB_NAME=${2:-"Unknown Job"}
88

99
# Load environment variables from .env file
10-
if [ -f "/home/silviase/augeo/.env" ]; then
11-
export $(grep -v '^#' /home/silviase/augeo/.env | xargs)
10+
if [ -f "/home/silviase/llm-jp-eval-mm/.env" ]; then
11+
export $(grep -v '^#' /home/silviase/llm-jp-eval-mm/.env | xargs)
1212
fi
1313

1414
# Check if webhook URL is set
@@ -45,7 +45,7 @@ curl -X POST "$SLACK_WEBHOOK_URL" \
4545
{"title": "Node", "value": "$NODE", "short": true},
4646
{"title": "Completed", "value": "$CURRENT_TIME", "short": true}
4747
],
48-
"footer": "Augeo Project",
48+
"footer": "LLM-jp EvalMM Project",
4949
"ts": $(date +%s)
5050
}]
5151
}

0 commit comments

Comments
 (0)