From 3676621d4a4901a8cb2bdac6d8521b9aa9eaf11e Mon Sep 17 00:00:00 2001
From: Eliza Wszola
Date: Thu, 29 Aug 2024 08:00:54 +0000
Subject: [PATCH] update todo

---
 vllm/model_executor/models/mixtral.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/vllm/model_executor/models/mixtral.py b/vllm/model_executor/models/mixtral.py
index d3471959a1766..1cdf1c5f18ca5 100644
--- a/vllm/model_executor/models/mixtral.py
+++ b/vllm/model_executor/models/mixtral.py
@@ -450,8 +450,8 @@ def __init__(
         lora_config: Optional[LoRAConfig] = None,
     ) -> None:
         super().__init__()
-        # TODO keep the fused mixtral_quant codepath around as long as we don't
-        # support all quant_types
+        # TODO keep the unfused mixtral_quant-like codepath around as long as
+        # we don't support all quant_types
         self.is_compressed = isinstance(quant_config, CompressedTensorsConfig)
         self.use_fused_moe = (
             self.is_compressed
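
Note: below is a minimal, self-contained sketch (not the actual vLLM implementation) of the dispatch the updated TODO describes: the fused MoE path is taken only when the quantization config is a compressed-tensors config, and every other quant_type falls back to the unfused, mixtral_quant-like path. The CompressedTensorsConfig stand-in, the MoEDispatchSketch class, and the experts_path helper are assumptions for illustration; only the isinstance check and the two flags come from the visible context lines.

    from typing import Any, Optional


    class CompressedTensorsConfig:
        """Stand-in for vLLM's compressed-tensors quantization config (assumption)."""


    class MoEDispatchSketch:
        """Sketch of the fused/unfused MoE selection the TODO refers to."""

        def __init__(self, quant_config: Optional[Any] = None) -> None:
            # Fused MoE is only used for compressed-tensors quantization;
            # all other quant_types keep the unfused, mixtral_quant-like path.
            self.is_compressed = isinstance(quant_config, CompressedTensorsConfig)
            self.use_fused_moe = self.is_compressed

        def experts_path(self) -> str:
            # Hypothetical helper: report which codepath would run.
            return "fused_moe" if self.use_fused_moe else "unfused (mixtral_quant-like)"


    print(MoEDispatchSketch(CompressedTensorsConfig()).experts_path())  # fused_moe
    print(MoEDispatchSketch(None).experts_path())  # unfused (mixtral_quant-like)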