We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 03e6bc2, commit 052788e. Copy full SHA for 052788e.
vllm/worker/cpu_embedding_model_runner.py
@@ -66,6 +66,10 @@ def execute_model(
66
67
hidden_states = model_executable(**execute_model_kwargs)
68
69
+ # Only perform pooling in the driver worker.
70
+ if not self.is_driver_worker:
71
+ return []
72
+
73
return [
74
self.model.pooler(hidden_states=hidden_states,
75
pooling_metadata=model_input.pooling_metadata)
0 commit comments