Skip to content

Commit 5bc4f5c

Browse files
authored
fix: raise MemoryError when available_dram becomes negative (#80)
1 parent 575a316 commit 5bc4f5c

1 file changed

Lines changed: 6 additions & 0 deletions

File tree

vllm_rbln/worker/utils.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -78,6 +78,10 @@ def align_2MB(x: int) -> int:
7878
available_dram = tensor_parallel_size * (ATOM_DRAM_NBYTES -
7979
ATOM_SYS_DRAM_NBYTES)
8080

81+
def check_oom(available_dram: int) -> None:
    """Fail fast when the remaining DRAM budget is exhausted.

    Args:
        available_dram: Remaining DRAM budget, in bytes, at the point of
            the check.

    Raises:
        MemoryError: If ``available_dram`` is zero or negative, i.e. no
            memory is left for the block calculation to proceed.
    """
    # A budget of exactly zero is rejected as well: nothing would be left
    # to allocate, so it is treated the same as an overdrawn budget.
    if available_dram <= 0:
        raise MemoryError("Insufficient DRAM during block calculation.")
84+
8185
if kernel_size is None:
8286
if n_model_params is None:
8387
raise ValueError("`n_model_params` should be specified \
@@ -106,6 +110,8 @@ def align_2MB(x: int) -> int:
106110
buffer = buffer_per_core * tensor_parallel_size
107111
available_dram -= buffer
108112

113+
check_oom(available_dram)
114+
109115
b = kvcache_block_size * align(head_dim, 64) * math.ceil(
110116
num_key_value_heads / tensor_parallel_size) * 2
111117
c = num_layers * 2 * tensor_parallel_size

0 commit comments

Comments
 (0)