Skip to content

Commit 38dd0ec

Browse files
committed
Revert changes to env_override.py
1 parent 576bf2f commit 38dd0ec

File tree

1 file changed

+2
-3
lines changed

1 file changed

+2
-3
lines changed

tpu_inference/env_override.py

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -7,8 +7,7 @@
7 7
# This prevents errors when trying to create CUDA streams on TPU hardware
8 8
# The issue was introduced by vllm-project/vllm#26440
9 9
os.environ["VLLM_DISABLE_SHARED_EXPERTS_STREAM"] = "1"
10-
os.environ[
11-
"LIBTPU_INIT_ARGS"] = "--xla_tpu_use_tc_device_shape_on_sc=true --xla_tpu_scheduler_percent_shared_memory_limit=1000"
10+
os.environ["LIBTPU_INIT_ARGS"] = "--xla_tpu_use_tc_device_shape_on_sc=true"
12 11

13 12
# Monkeypatch vLLM to avoid ImportError: cannot import name 'SamplingParams' from 'vllm'
14 13
# in vllm/v1/... submodules due to circular imports or lazy loading failures.
@@ -23,4 +22,4 @@
23 22
from vllm.sampling_params import RequestOutputKind
24 23
vllm.RequestOutputKind = RequestOutputKind
25 24
except ImportError:
26-
pass
25+
pass

0 commit comments

Comments
 (0)