Skip to content

Commit

Permalink
Fix
Browse files — browse the repository at this point in the history
  • Loading branch information
DarkLight1337 committed Oct 18, 2024
1 parent 72f1e72 commit beae068
Show file tree
Hide file tree
Showing 2 changed files with 12 additions and 12 deletions.
20 changes: 10 additions & 10 deletions vllm/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -261,33 +261,33 @@ def _resolve_task(
architectures = getattr(hf_config, "architectures", [])

task_support: Dict[Task, bool] = {
# NOTE: They are listed from highest to lowest priority, in case
# the model supports multiple of them
# NOTE: Listed from highest to lowest priority,
# in case the model supports multiple of them
"generate": ModelRegistry.is_text_generation_model(architectures),
"embedding": ModelRegistry.is_embedding_model(architectures),
}
supported_tasks: Set[Task] = {
task
for task, is_supported in task_support.items() if is_supported
}
supported_tasks_lst: List[Task] = [
task for task, is_supported in task_support.items() if is_supported
]
supported_tasks = set(supported_tasks_lst)

if task_option == "auto":
task = next(iter(supported_tasks))
selected_task = next(iter(supported_tasks_lst))

if len(supported_tasks) > 1:
logger.info(
"This model supports multiple tasks: %s. "
"Defaulting to '%s'.", supported_tasks, task)
"Defaulting to '%s'.", supported_tasks, selected_task)
else:
if task_option not in supported_tasks:
msg = (
f"This model does not support the '{task_option}' task. "
f"Supported tasks: {supported_tasks}")
raise ValueError(msg)

task = task_option
selected_task = task_option

return supported_tasks, task
return supported_tasks, selected_task

def _parse_quant_hf_config(self):
quant_cfg = getattr(self.hf_config, "quantization_config", None)
Expand Down
4 changes: 2 additions & 2 deletions vllm/entrypoints/llm.py
Original file line number Diff line number Diff line change
Expand Up @@ -341,7 +341,7 @@ def generate(

supported_tasks = self.llm_engine.model_config.supported_tasks
if "generate" in supported_tasks:
messages += (
messages.append(
"Your model supports the 'generate' task, but is "
f"currently initialized for the '{task}' task. Please "
"initialize the model using `--task generate`.")
Expand Down Expand Up @@ -724,7 +724,7 @@ def encode(

supported_tasks = self.llm_engine.model_config.supported_tasks
if "embedding" in supported_tasks:
messages += (
messages.append(
"Your model supports the 'embedding' task, but is "
f"currently initialized for the '{task}' task. Please "
"initialize the model using `--task embedding`.")
Expand Down

0 comments on commit beae068

Please sign in to comment.