diff --git a/fastdeploy/config.py b/fastdeploy/config.py index 1563e2030a8..428509938f2 100644 --- a/fastdeploy/config.py +++ b/fastdeploy/config.py @@ -1760,8 +1760,6 @@ def postprocess(self): f"set to max_num_batched_tokens." ) self.cache_config.max_encoder_cache = self.scheduler_config.max_num_batched_tokens - # TODO: mm encoder_cache close for now - self.cache_config.max_encoder_cache = 0 else: self.cache_config.max_encoder_cache = 0