From 38c279a07d4bf5521e8e88497138af5207349a53 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Cl=C3=A9mence=20Lesn=C3=A9?= <clemence@lesne.pro>
Date: Mon, 12 Feb 2024 16:21:44 +0100
Subject: [PATCH] refacto: Manage LLM retries by OpenAI SDK not Tenacity

---
 helpers/llm.py | 22 +++++-----------------
 1 file changed, 5 insertions(+), 17 deletions(-)

diff --git a/helpers/llm.py b/helpers/llm.py
index 1cf58de6..697bcdf2 100644
--- a/helpers/llm.py
+++ b/helpers/llm.py
@@ -53,15 +53,6 @@ def __str__(self) -> str:
         return self.message
 
 
-@retry(
-    reraise=True,
-    retry=(
-        retry_if_exception_type(APIResponseValidationError)
-        | retry_if_exception_type(APIStatusError)
-    ),
-    stop=stop_after_attempt(3),
-    wait=wait_random_exponential(multiplier=0.5, max=30),
-)
 async def completion_stream(
     messages: List[ChatCompletionMessageParam],
     max_tokens: int,
@@ -69,8 +60,6 @@ async def completion_stream(
 ) -> AsyncGenerator[ChoiceDelta, None]:
     """
     Returns a stream of completion results.
-
-    Catch errors for a maximum of 3 times. Won't retry on connection errors (like timeouts) as the stream will be already partially consumed.
     """
     extra = {}
 
@@ -93,12 +82,7 @@ async def completion_stream(
 
 @retry(
     reraise=True,
-    retry=(
-        retry_if_exception_type(APIConnectionError)
-        | retry_if_exception_type(APIResponseValidationError)
-        | retry_if_exception_type(APIStatusError)
-        | retry_if_exception_type(SafetyCheckError)
-    ),
+    retry=retry_if_exception_type(SafetyCheckError),
     stop=stop_after_attempt(3),
     wait=wait_random_exponential(multiplier=0.5, max=30),
 )
@@ -252,6 +236,10 @@ def _contentsafety_category_test(
 @asynccontextmanager
 async def _use_oai() -> AsyncGenerator[AsyncAzureOpenAI, None]:
     client = AsyncAzureOpenAI(
+        # Reliability
+        max_retries=3,
+        timeout=60,
+        # Azure deployment
         api_version="2023-12-01-preview",
         azure_deployment=CONFIG.openai.gpt_deployment,
         azure_endpoint=CONFIG.openai.endpoint,