CognitiveKernel-Pro/example_run_vlm.sh at main · open-compass/CognitiveKernel-Pro · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
#!/usr/bin/env bash
#
# VLM example (multimodal enabled): runs ck_pro.ck_main.main on the bundled
# simple test set, mirrors all output into a log file, then opens that log.
#
# Run from the directory that contains the ck_pro package: PYTHONPATH is set
# to the current directory and the input/output paths below are relative.
#
# Exit status: that of the python/tee pipeline (non-zero if the run failed).
set -euo pipefail

# Assignment and export are kept separate so a failing $(pwd) is not masked
# by the always-successful `export` builtin.
PYTHONPATH="$(pwd)"
export PYTHONPATH

# Value handed to the web agent as web_env_kwargs.web_ip.
WEB_IP=localhost:3001

# Use gpt: mode with your vLLM OpenAI-compatible endpoint
export LLM_URL="gpt:qwen3-235b-thinking"   # text LLM
export VLM_URL="${LLM_URL}"                # reuse same model for multimodal
export OPENAI_ENDPOINT="https://sd1lpbei9optek6oou0s0.apigateway-cn-beijing.volceapi.com/v1"
export OPENAI_API_KEY="EMPTY"              # replace if your vLLM enables auth

# Single definition of the log path used by both tee and less.
readonly LOG_FILE=_log_simple_test_vlm

mkdir -p test_output

# Configuration overrides passed to --updates: multimodal is switched on for
# the web agent, and every agent's text / multimodal model points at
# LLM_URL / VLM_URL respectively.
MAIN_ARGS="{'web_agent': {'use_multimodal': 'yes', 'model': {'call_target': '${LLM_URL}'}, 'model_multimodal': {'call_target': '${VLM_URL}'}, 'web_env_kwargs': {'web_ip': '${WEB_IP}'}}, 'file_agent': {'model': {'call_target': '${LLM_URL}'}, 'model_multimodal': {'call_target': '${VLM_URL}'}}, 'model': {'call_target': '${LLM_URL}'}}"

# You can remove -mpdb to run without debugger; remove --input to type from stdin.
# `2>&1 |` is used instead of `|&` so the script also parses on bash < 4.
# The pipeline status is captured instead of letting `set -e` abort here, so
# the log can still be inspected after a failed run.
run_status=0
NO_NULL_STDIN=1 python3 -u -mpdb -m ck_pro.ck_main.main \
  --updates "${MAIN_ARGS}" \
  --input ck_pro/ck_main/_test/simple_test.jsonl \
  --output test_output/simple_test.vlm.output.jsonl 2>&1 \
  | tee "${LOG_FILE}" || run_status=$?

# Only page when attached to a terminal; otherwise less would just copy the
# log to stdout a second time.
if [[ -t 1 ]]; then
  less -R "${LOG_FILE}"  # colored output
fi

exit "${run_status}"