From b58e882eaa5d1dd52edf9bf44f3c007ba58c2620 Mon Sep 17 00:00:00 2001
From: Yongteng Lei
Date: Wed, 3 Sep 2025 13:31:43 +0800
Subject: [PATCH] Feat: add exponential back-off for Chat LiteLLM (#9880)

### What problem does this PR solve?

Add exponential back-off for Chat LiteLLM. #9858.

### Type of change

- [x] New Feature (non-breaking change which adds functionality)
---
 rag/llm/chat_model.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/rag/llm/chat_model.py b/rag/llm/chat_model.py
index 17a6ccea9..98d71141c 100644
--- a/rag/llm/chat_model.py
+++ b/rag/llm/chat_model.py
@@ -1534,6 +1534,7 @@ class LiteLLMBase(ABC):
             "model": self.model_name,
             "messages": history,
             "api_key": self.api_key,
+            "num_retries": self.max_retries,
             **kwargs,
         }
         if stream: