Fix retry with backoff
shaltielshmid committed Aug 25, 2024
1 parent 7415803 commit 80b2677
Showing 3 changed files with 6 additions and 6 deletions.
6 changes: 3 additions & 3 deletions src/lighteval/models/endpoint_model.py
@@ -156,16 +156,16 @@ def _async_process_request(
     ) -> Coroutine[None, list[TextGenerationOutput], str]:
         # Todo: add an option to launch with conversational instead for chat prompts
         # https://huggingface.co/docs/huggingface_hub/v0.20.3/en/package_reference/inference_client#huggingface_hub.AsyncInferenceClient.conversational
-        generated_text = self.async_client.text_generation(
+        generated_text = retry_with_backoff(lambda: self.async_client.text_generation(
             prompt=context,
             details=True,
             decoder_input_details=True,
             max_new_tokens=max_tokens,
             stop_sequences=stop_tokens,
             # truncate=,
-        )
+        ))

-        return retry_with_backoff(generated_text)
+        return generated_text

     def _process_request(self, context: str, stop_tokens: list[str], max_tokens: int) -> TextGenerationOutput:
         # Todo: add an option to launch with conversational instead for chat prompts
2 changes: 1 addition & 1 deletion src/lighteval/models/oai_model.py
@@ -46,7 +46,7 @@ async def _async_process_request(
         self, context: str, stop_tokens: list[str], max_tokens: int
     ) -> Coroutine[None, TextGenerationOutput, str]:
         # Todo: add an option to launch with conversational instead for chat prompts
-        output = await retry_with_backoff(self.client.completions.create(
+        output = await retry_with_backoff(lambda: self.client.completions.create(
             model="/repository",
             prompt=context,
             max_tokens=max_tokens,
4 changes: 2 additions & 2 deletions src/lighteval/models/utils.py
@@ -103,10 +103,10 @@ def batched(iterable, n):
 import random
 MAX_RETRIES = 5
 INITIAL_BACKOFF = 1
-async def retry_with_backoff(coro):
+async def retry_with_backoff(coro_fn):
     for attempt in range(MAX_RETRIES):
         try:
-            return await coro
+            return await coro_fn()
         except Exception as e:
             if attempt < MAX_RETRIES - 1:
                 backoff_time = INITIAL_BACKOFF * (2 ** attempt) + random.uniform(0, 1)
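Why the fix works: a Python coroutine object can be awaited only once, so passing an already-created coroutine such as self.async_client.text_generation(...) into retry_with_backoff meant any retry after a failure would re-await the same spent object and raise RuntimeError ("cannot reuse already awaited coroutine"). Wrapping the call in a lambda hands the helper a factory instead, so each attempt builds a fresh coroutine. Below is a minimal runnable sketch of the pattern under that assumption; flaky_request and the attempts counter are hypothetical stand-ins for an endpoint call, not code from this repository, and the except/raise tail of retry_with_backoff is filled in since the diff cuts it off.

import asyncio
import itertools
import random

MAX_RETRIES = 5
INITIAL_BACKOFF = 1

async def retry_with_backoff(coro_fn):
    # coro_fn is a zero-argument callable (e.g. a lambda) that returns a
    # fresh coroutine on every call; a coroutine object can't be re-awaited.
    for attempt in range(MAX_RETRIES):
        try:
            return await coro_fn()
        except Exception:
            if attempt < MAX_RETRIES - 1:
                # Exponential backoff with jitter: ~1s, ~2s, ~4s, ...
                backoff_time = INITIAL_BACKOFF * (2 ** attempt) + random.uniform(0, 1)
                await asyncio.sleep(backoff_time)
            else:
                raise

attempts = itertools.count(1)  # hypothetical failure counter for the demo

async def flaky_request():
    # Hypothetical stand-in for an inference-endpoint call:
    # fails on the first two attempts, then succeeds.
    if next(attempts) < 3:
        raise ConnectionError("transient failure")
    return "ok"

# Correct (this commit): pass a factory, so every retry gets a new coroutine.
print(asyncio.run(retry_with_backoff(lambda: flaky_request())))  # prints "ok"

# Broken (before this commit): retry_with_backoff received flaky_request()
# itself; the first retry would re-await that spent coroutine and fail.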
