File tree (Expand file tree / Collapse file tree): 1 file changed, +2 -3 lines changed
Expand file tree / Collapse file tree: 1 file changed, +2 -3 lines changed
Original file line number | Diff line number | Diff line change
7 7 # This prevents errors when trying to create CUDA streams on TPU hardware
8 8 # The issue was introduced by vllm-project/vllm#26440
99os .environ ["VLLM_DISABLE_SHARED_EXPERTS_STREAM" ] = "1"
10- os .environ [
11- "LIBTPU_INIT_ARGS" ] = "--xla_tpu_use_tc_device_shape_on_sc=true --xla_tpu_scheduler_percent_shared_memory_limit=1000"
10+ os .environ ["LIBTPU_INIT_ARGS" ] = "--xla_tpu_use_tc_device_shape_on_sc=true"
12 11
13 12 # Monkeypatch vLLM to avoid ImportError: cannot import name 'SamplingParams' from 'vllm'
14 13 # in vllm/v1/... submodules due to circular imports or lazy loading failures.
2322 from vllm .sampling_params import RequestOutputKind
2423 vllm .RequestOutputKind = RequestOutputKind
2524except ImportError :
26- pass
25+ pass
You can’t perform that action at this time.
0 commit comments