Skip to content

Commit 8be6d90

Browse files
authored
Merge pull request #136 from Project-HAMi/fix_vllm
Fix vllm issues: Project-HAMi/HAMi#1381, Project-HAMi/HAMi#1461
2 parents 950c62f + f716b5d commit 8be6d90

File tree

4 files changed: +5 -6 lines changed

4 files changed: +5 -6 lines changed

src/cuda/hook.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -134,7 +134,7 @@ cuda_entry_t cuda_library_entry[] = {
134134
{.name = "cuMemCreate"},
135135
{.name = "cuMemRelease"},
136136
{.name = "cuMemMap"},
137-
{.name = "cucuMemImportFromShareableHandle"},
137+
{.name = "cuMemImportFromShareableHandle"},
138138
{.name = "cuMemAllocAsync"},
139139
{.name = "cuMemFreeAsync"},
140140
/* cuda11.7 new api memory part */

src/cuda/memory.c

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -493,8 +493,8 @@ CUresult cuMemGetInfo_v2(size_t* free, size_t* total) {
493493
LOG_DEBUG("cuMemGetInfo_v2");
494494
ENSURE_INITIALIZED();
495495
CHECK_DRV_API(cuCtxGetDevice(&dev));
496-
size_t usage = get_current_device_memory_usage(dev);
497-
size_t limit = get_current_device_memory_limit(dev);
496+
size_t usage = get_current_device_memory_usage(cuda_to_nvml_map(dev));
497+
size_t limit = get_current_device_memory_limit(cuda_to_nvml_map(dev));
498498
if (limit == 0) {
499499
CUDA_OVERRIDE_CALL(cuda_library_entry,cuMemGetInfo_v2, free, total);
500500
LOG_INFO("orig free=%ld total=%ld", *free, *total);

src/libvgpu.c

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -848,7 +848,7 @@ void preInit(){
848848

849849
void postInit(){
850850
allocator_init();
851-
851+
map_cuda_visible_devices();
852852
try_lock_unified_lock();
853853
nvmlReturn_t res = set_task_pid();
854854
try_unlock_unified_lock();
@@ -860,7 +860,6 @@ void postInit(){
860860
pidfound=1;
861861
}
862862

863-
map_cuda_visible_devices();
864863
//add_gpu_device_memory_usage(getpid(),0,context_size,0);
865864
env_utilization_switch = set_env_utilization_switch();
866865
init_utilization_watcher();

src/utils.c

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -193,7 +193,7 @@ int parse_cuda_visible_env() {
193193
for (int i = 0; i < CUDA_DEVICE_MAX_COUNT; i++) {
194194
LOG_INFO("device %d -> %d",i,cuda_to_nvml_map(i));
195195
}
196-
LOG_DEBUG("get default cuda from %s",getenv("CUDA_VISIBLE_DEVICES"));
196+
LOG_INFO("get default cuda from %s", getenv("CUDA_VISIBLE_DEVICES"));
197197
return count;
198198
}
199199

0 commit comments

Comments
 (0)