Fix: mention TPU in the async output processing platform warning

vllm-project · WoosukKwon · Aug 30, 2024 · Aug 28, 2024 · Aug 29, 2024 · Aug 29, 2024
commit c11eccfaad175196840764a49166c1620f256f78
diff --git a/vllm/config.py b/vllm/config.py
@@ -347,10 +347,10 @@ def verify_async_output_proc(self, parallel_config, speculative_config,
             self.use_async_output_proc = False
             return
 
-        if device_config.device_type not in {"cuda", "tpu"}:
+        if device_config.device_type not in ("cuda", "tpu"):
             logger.warning(
-                "Async output processing is only supported for CUDA."
-                " Disabling it for other platforms.")
+                "Async output processing is only supported for CUDA or TPU. "
+                "Disabling it for other platforms.")
             self.use_async_output_proc = False
             return