Disable prefix caching when routing replay is enabled

gongshaotian · gongshaotian · commit 00d303ebcb06 · 2025-12-10T21:29:14.000+08:00
diff --git a/fastdeploy/config.py b/fastdeploy/config.py
@@ -1691,7 +1691,9 @@ def postprocess(self):
         self.cache_config.postprocess(self.scheduler_config.max_num_batched_tokens, self.scheduler_config.max_num_seqs)
         if self.model_config is not None and self.model_config.enable_mm and not envs.ENABLE_V1_KVCACHE_SCHEDULER:
             self.cache_config.enable_prefix_caching = False
-
+        if self.routing_replay_config.enable_routing_replay:
+            # TODO(gongshaotian): R3 support prefix caching
+            self.cache_config.enable_prefix_caching = False
         if (
             self.structured_outputs_config is not None
             and self.structured_outputs_config.guided_decoding_backend != "off"