File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 2424 has_torch_rbln = False
2525
2626from vllm_rbln .logger import init_logger
27+ from vllm_rbln .torch_compile_backend import logged_rbln_backend
2728from vllm .v1 .sample .metadata import SamplingMetadata
2829from vllm .v1 .sample .sampler import Sampler as VLLMSampler
2930import rebel
@@ -175,7 +176,7 @@ def __init__(
175176 rbln_top_k_top_p_sample ,
176177 dynamic = False ,
177178 fullgraph = True ,
178- backend = "rbln" ,
179+ backend = logged_rbln_backend ,
179180 options = options ,
180181 )
181182 self .forward = self .forward_rbln
Original file line number Diff line number Diff line change 3030import vllm_rbln .rbln_envs as envs
3131import vllm_rbln .utils as rbln_utils
3232from vllm_rbln .logger import init_logger
33+ from vllm_rbln .torch_compile_backend import logged_rbln_backend
3334from vllm_rbln .v1 .attention .kv_cache_bindings import (
3435 attach_kv_cache_bindings ,
3536 build_kv_cache_forward_context_kwargs ,
@@ -515,7 +516,7 @@ def _compile_model(self, model):
515516
516517 return torch .compile (
517518 model ,
518- backend = "rbln" ,
519+ backend = logged_rbln_backend ,
519520 options = copy (options ),
520521 dynamic = False ,
521522 )
Original file line number Diff line number Diff line change 2323from vllm .v1 .spec_decode .medusa import MedusaProposer
2424
2525import vllm_rbln .rbln_envs as envs
26+ from vllm_rbln .torch_compile_backend import logged_rbln_backend
2627
2728
2829class RBLNMedusaProposer (MedusaProposer ):
@@ -74,7 +75,7 @@ def _compile_model(self, model: nn.Module):
7475
7576 return torch .compile (
7677 model ,
77- backend = "rbln" ,
78+ backend = logged_rbln_backend ,
7879 options = copy (options ),
7980 dynamic = False ,
8081 )
You can’t perform that action at this time.
0 commit comments