-
Notifications
You must be signed in to change notification settings - Fork 28
Description
My environment:
Xinference==1.8.1
Vllm==0.8.5
Torch==2.6.0
Torchaudio==2.6.0
Transformers==4.52.4
xoscar==0.7.13
When I use xinference to deploy Qwen3, I get the following error:
Traceback (most recent call last):
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/communication/socket.py", line 388, in handle_connection
return await server.on_connected(
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/communication/socket.py", line 184, in on_connected
await self.channel_handler(channel)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/pool.py", line 577, in on_new_channel
message = await channel.recv()
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/communication/socket.py", line 104, in recv
return deserialize(header, buffers)
File "xoscar/serialization/core.pyx", line 943, in xoscar.serialization.core.deserialize
File "xoscar/backends/message.pyx", line 636, in xoscar.backends.message.MessageSerializer.on_deserial_error
xoscar.backends.message.DeserializeMessageFailed: Deserialize b'<=\xef\xd0n\x87\xf9\xe5\x03\t\\x82b\xb0\n\x92\xe4\x05\xa8gQN\xeb,^\xb5\x1b\\x955c\x0b' failed
2025-08-04 02:18:57,372 xinference.core.worker 142 ERROR Failed to load model qwen2.5-105-0
Traceback (most recent call last):
File "/usr/local/lib/python3.10/dist-packages/xinference/core/worker.py", line 1088, in launch_builtin_model
model_ref = await xo.create_actor(
File "/usr/local/lib/python3.10/dist-packages/xoscar/api.py", line 79, in create_actor
return await ctx.create_actor(actor_cls, *args, uid=uid, address=address, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 151, in create_actor
result = await self._wait(future, address, create_actor_message) # type: ignore
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 124, in _wait
return await future
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/core.py", line 104, in _listen
raise ServerClosed(
xoscar.errors.ServerClosed: Remote server unixsocket:///74448896 closed: 0 bytes read on a total of 11 expected bytes
2025-08-04 02:18:57,426 xinference.core.worker 142 ERROR [request 09779770-7114-11f0-98ab-0242c0a8c803] Leave launch_builtin_model, error: Remote server unixsocket:///74448896 closed: 0 bytes read on a total of 11 expected bytes, elapsed time: 5 s
Traceback (most recent call last):
File "/usr/local/lib/python3.10/dist-packages/xinference/core/utils.py", line 93, in wrapped
ret = await func(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/xinference/core/worker.py", line 1088, in launch_builtin_model
model_ref = await xo.create_actor(
File "/usr/local/lib/python3.10/dist-packages/xoscar/api.py", line 79, in create_actor
return await ctx.create_actor(actor_cls, *args, uid=uid, address=address, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 151, in create_actor
result = await self._wait(future, address, create_actor_message) # type: ignore
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 124, in _wait
return await future
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/core.py", line 104, in _listen
raise ServerClosed(
xoscar.errors.ServerClosed: Remote server unixsocket:///74448896 closed: 0 bytes read on a total of 11 expected bytes
2025-08-04 02:18:57,429 xinference.api.restful_api 1 ERROR [address=0.0.0.0:22388, pid=142] Remote server unixsocket:///74448896 closed: 0 bytes read on a total of 11 expected bytes
Traceback (most recent call last):
File "/usr/local/lib/python3.10/dist-packages/xinference/api/restful_api.py", line 1083, in launch_model
model_uid = await (await self._get_supervisor_ref()).launch_builtin_model(
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 262, in send
return self._process_result_message(result)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 111, in _process_result_message
raise message.as_instanceof_cause()
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/pool.py", line 689, in send
result = await self._run_coro(message.message_id, coro)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/pool.py", line 389, in _run_coro
return await coro
File "/usr/local/lib/python3.10/dist-packages/xoscar/api.py", line 418, in __on_receive__
return await super().__on_receive__(message) # type: ignore
File "xoscar/core.pyx", line 564, in __on_receive__
raise ex
File "xoscar/core.pyx", line 526, in xoscar.core._BaseActor.__on_receive__
async with self._lock:
File "xoscar/core.pyx", line 527, in xoscar.core._BaseActor.__on_receive__
with debug_async_timeout('actor_lock_timeout',
File "xoscar/core.pyx", line 532, in xoscar.core._BaseActor.__on_receive__
result = await result
File "/usr/local/lib/python3.10/dist-packages/xinference/core/supervisor.py", line 1253, in launch_builtin_model
await _launch_model()
File "/usr/local/lib/python3.10/dist-packages/xinference/core/supervisor.py", line 1188, in _launch_model
subpool_address = await _launch_one_model(
File "/usr/local/lib/python3.10/dist-packages/xinference/core/supervisor.py", line 1139, in _launch_one_model
subpool_address = await worker_ref.launch_builtin_model(
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 262, in send
return self._process_result_message(result)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 111, in _process_result_message
raise message.as_instanceof_cause()
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/pool.py", line 689, in send
result = await self._run_coro(message.message_id, coro)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/pool.py", line 389, in _run_coro
return await coro
File "/usr/local/lib/python3.10/dist-packages/xoscar/api.py", line 418, in __on_receive__
return await super().__on_receive__(message) # type: ignore
File "xoscar/core.pyx", line 564, in __on_receive__
raise ex
File "xoscar/core.pyx", line 526, in xoscar.core._BaseActor.__on_receive__
async with self._lock:
File "xoscar/core.pyx", line 527, in xoscar.core._BaseActor.__on_receive__
with debug_async_timeout('actor_lock_timeout',
File "xoscar/core.pyx", line 532, in xoscar.core._BaseActor.__on_receive__
result = await result
File "/usr/local/lib/python3.10/dist-packages/xinference/core/utils.py", line 93, in wrapped
ret = await func(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/xinference/core/worker.py", line 1088, in launch_builtin_model
model_ref = await xo.create_actor(
File "/usr/local/lib/python3.10/dist-packages/xoscar/api.py", line 79, in create_actor
return await ctx.create_actor(actor_cls, *args, uid=uid, address=address, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 151, in create_actor
result = await self._wait(future, address, create_actor_message) # type: ignore
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/context.py", line 124, in _wait
return await future
File "/usr/local/lib/python3.10/dist-packages/xoscar/backends/core.py", line 104, in _listen
raise ServerClosed(
xoscar.errors.ServerClosed: [address=0.0.0.0:22388, pid=142] Remote server unixsocket:///74448896 closed: 0 bytes read on a total of 11 expected bytes