Skip to content
6 changes: 6 additions & 0 deletions .github/workflows/galaxy-quick-impl.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -131,6 +131,8 @@ jobs:
LD_LIBRARY_PATH: /work/build/lib
LOGURU_LEVEL: INFO
LLAMA_DIR: /mnt/MLPerf/tt_dnn-models/llama/Llama3.3-70B-Instruct/
DEEPSEEK_V3_HF_MODEL: /mnt/MLPerf/tt_dnn-models/deepseek-ai/DeepSeek-R1-0528
DEEPSEEK_V3_CACHE: /mnt/MLPerf/tt_dnn-models/deepseek-ai/DeepSeek-R1-0528-Cache/CI
TT_METAL_ENABLE_ERISC_IRAM: 1
GTEST_OUTPUT: xml:/work/generated/test_reports/
volumes:
Expand Down Expand Up @@ -167,6 +169,10 @@ jobs:
# pytest models/demos/llama3_70b_galaxy/tests/unit_tests/test_llama_model_prefill.py;
# CCL smoke tests - exactly one representative test from each op category

uv pip install -r models/demos/deepseek_v3/reference/deepseek/requirements.txt
# DeepSeek V3 decoder block test: run only the decode and prefill (seq 128) cases, with HF weights
MESH_DEVICE=TG pytest models/demos/deepseek_v3/tests/test_decoder_block.py -k "model.layers and (mode_decode or mode_prefill_seq_128)" --timeout 600 --durations=0;

pytest "tests/nightly/tg/ccl/test_all_to_all_combine_6U.py::test_all_to_all_combine_8x4[wormhole_b0-dram_in_l1_out_axis0-bfloat16-None-num_links_4-2-dense-s2-7000-8-256-32-8x4_grid-False-fabric_2d]" --timeout=300;

pytest "tests/nightly/tg/ccl/test_minimal_all_gather_async.py::test_all_gather_async[wormhole_b0-mesh_device0-normal-2-2-20-fabric_linear-DRAM_memconfig-sd35_prompt_check-3links]" --timeout=300;
Expand Down
Loading