|
| 1 | +#!/bin/bash |
| 2 | + |
| 3 | +# Qwen3-VL Evaluation Script with SGLang Backend |
| 4 | +# This script demonstrates how to evaluate Qwen3-VL models using SGLang for accelerated inference |
| 5 | +# |
| 6 | +# Requirements: |
| 7 | +# - sglang>=0.4.6 |
| 8 | +# - qwen-vl-utils |
| 9 | +# - CUDA-enabled GPU(s) |
| 10 | +# |
| 11 | +# Installation: |
| 12 | +# uv add "sglang[all]" qwen-vl-utils |
| 13 | +# OR |
| 14 | +# pip install "sglang[all]>=0.4.6" qwen-vl-utils |
| 15 | + |
| 16 | +# ============================================================================ |
| 17 | +# Configuration |
| 18 | +# ============================================================================ |
| 19 | + |
| 20 | +# Model Configuration |
| 21 | +# Available Qwen3-VL models: |
| 22 | +# - Qwen/Qwen3-VL-30B-A3B-Instruct |
| 23 | +# - Qwen/Qwen3-VL-30B-A3B-Thinking |
| 24 | +# - Qwen/Qwen3-VL-235B-A22B-Instruct |
| 25 | +# - Qwen/Qwen3-VL-235B-A22B-Thinking |
| 26 | +MODEL="Qwen/Qwen3-VL-30B-A3B-Instruct" |
| 27 | + |
| 28 | +# Parallelization Settings |
| 29 | +# Adjust based on your GPU configuration |
| 30 | +TENSOR_PARALLEL_SIZE=4 # Number of GPUs for tensor parallelism (tp_size in SGLang) |
| 31 | + |
| 32 | +# Memory and Performance Settings |
| 33 | +GPU_MEMORY_UTILIZATION=0.85 # mem_fraction_static in SGLang (0.0 - 1.0) |
| 34 | +BATCH_SIZE=64 # Batch size for evaluation |
| 35 | + |
| 36 | +# SGLang Specific Settings |
| 37 | +MAX_PIXELS=1605632 # Maximum pixels for image processing |
| 38 | +MIN_PIXELS=784 # Minimum pixels (28x28) |
| 39 | +MAX_FRAME_NUM=32 # Maximum number of video frames |
| 40 | +THREADS=16 # Number of threads for decoding visuals |
| 41 | + |
| 42 | +# Task Configuration |
| 43 | +# Common tasks: mmmu_val, mme, mathvista, ai2d, etc. |
| 44 | +TASKS="mmmu_val,mme" |
| 45 | + |
| 46 | +# Output Configuration |
| 47 | +OUTPUT_PATH="./logs/qwen3vl_sglang" |
| 48 | +LOG_SAMPLES=true |
| 49 | +LOG_SUFFIX="qwen3vl_sglang" |
| 50 | + |
| 51 | +# Evaluation Limits (optional) |
| 52 | +# LIMIT=100 # Uncomment to limit number of samples (for testing) |
| 53 | + |
| 54 | +# ============================================================================ |
| 55 | +# Environment Configuration |
| 56 | +# ============================================================================ |
| 57 | +export HF_HOME="${HF_HOME:-$HOME/.cache/huggingface}" |
| 58 | + |
| 59 | +# ============================================================================ |
| 60 | +# Run Evaluation |
| 61 | +# ============================================================================ |
| 62 | + |
| 63 | +echo "==========================================" |
| 64 | +echo "Qwen3-VL Evaluation with SGLang" |
| 65 | +echo "==========================================" |
| 66 | +echo "Model: $MODEL" |
| 67 | +echo "Tensor Parallel Size: $TENSOR_PARALLEL_SIZE" |
| 68 | +echo "Tasks: $TASKS" |
| 69 | +echo "Batch Size: $BATCH_SIZE" |
| 70 | +echo "Max Pixels: $MAX_PIXELS" |
| 71 | +echo "Output Path: $OUTPUT_PATH" |
| 72 | +echo "==========================================" |
| 73 | + |
| 74 | +# Build the command |
| 75 | +CMD="uv run python -m lmms_eval \ |
| 76 | + --model sglang_runtime \ |
| 77 | + --model_args model=${MODEL},tensor_parallel_size=${TENSOR_PARALLEL_SIZE},gpu_memory_utilization=${GPU_MEMORY_UTILIZATION},max_pixels=${MAX_PIXELS},min_pixels=${MIN_PIXELS},max_frame_num=${MAX_FRAME_NUM},threads=${THREADS} \ |
| 78 | + --tasks ${TASKS} \ |
| 79 | + --batch_size ${BATCH_SIZE} \ |
| 80 | + --output_path ${OUTPUT_PATH}" |
| 81 | + |
| 82 | +# Add optional arguments |
| 83 | +if [ "$LOG_SAMPLES" = true ]; then |
| 84 | + CMD="$CMD --log_samples --log_samples_suffix ${LOG_SUFFIX}" |
| 85 | +fi |
| 86 | + |
| 87 | +if [ ! -z "$LIMIT" ]; then |
| 88 | + CMD="$CMD --limit ${LIMIT}" |
| 89 | +fi |
| 90 | + |
| 91 | +# Execute |
| 92 | +echo "Running command:" |
| 93 | +echo "$CMD" |
| 94 | +echo "" |
| 95 | + |
| 96 | +eval $CMD |
| 97 | + |
| 98 | +echo "" |
| 99 | +echo "==========================================" |
| 100 | +echo "Evaluation Complete!" |
| 101 | +echo "Results saved to: $OUTPUT_PATH" |
| 102 | +echo "==========================================" |
0 commit comments