Error executing method 'initialize_from_config'. This might cause deadlock in distributed execution.
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] Traceback (most recent call last):
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/v1/worker/worker_base.py", line 334, in execute_method
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] return run_method(self, method, args, kwargs)
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/v1/serial_utils.py", line 461, in run_method
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] return func(*args, **kwargs)
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/ray/util/tracing/tracing_helper.py", line 461, in _resume_span
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] return method(self, *_args, **_kwargs)
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/v1/worker/worker_base.py", line 320, in initialize_from_config
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] self.worker.initialize_from_config(kv_cache_config) # type: ignore
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/v1/worker/gpu_worker.py", line 412, in initialize_from_config
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] self.model_runner.initialize_kv_cache(kv_cache_config)
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/v1/worker/gpu_model_runner.py", line 5862, in initialize_kv_cache
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] self.initialize_attn_backend(kv_cache_config)
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/v1/worker/gpu_model_runner.py", line 5203, in initialize_attn_backend
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] attn_backends = get_attn_backends_for_group(kv_cache_group_spec)
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/v1/worker/gpu_model_runner.py", line 5151, in get_attn_backends_for_group
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] layers = get_layers_from_vllm_config(
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/config/vllm.py", line 1501, in get_layers_from_vllm_config
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] return {
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] File "/home/deploy/.conda/envs/zm_glm/lib/python3.10/site-packages/vllm/config/vllm.py", line 1504, in <dictcomp>
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] if isinstance(forward_context[layer_name], layer_type)
e[0;36m(EngineCore_DP0 pid=194587)e[0;0m e[36m(RayWorkerWrapper pid=150609)e[0m ERROR 02-03 16:20:26 [worker_base.py:344] KeyError: 'model.layers.31.self_attn.attn'