Skip to content

Commit

Permalink
Unit Test: Add error handling for rate limit exceeded in model list (#…
Browse files Browse the repository at this point in the history
…5715)

This PR fixes the random failure in our unit test due to HTTP 429

---------

Co-authored-by: Logan Adams <114770087+loadams@users.noreply.github.com>
  • Loading branch information
HeyangQin and loadams authored Jul 11, 2024
1 parent 74f3dca commit 83aa184
Showing 1 changed file with 16 additions and 3 deletions.
19 changes: 16 additions & 3 deletions tests/unit/inference/test_inference.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
import pickle
import os
import time
import requests

from dataclasses import dataclass
from typing import List
Expand Down Expand Up @@ -101,9 +102,21 @@ def _hf_model_list() -> List[ModelInfo]:
if ((model_data["cache_time"] + cache_expiration_seconds) < current_time) or os.getenv("FORCE_UPDATE_HF_CACHE",
default=False):
api = HfApi()
model_data["model_list"] = [
ModelInfo(modelId=m.modelId, pipeline_tag=m.pipeline_tag, tags=m.tags) for m in api.list_models()
]
while True:
try:
model_list = []
for model in _test_models:
model_list.extend(api.list_models(model_name=model))
model_data["model_list"] = [
ModelInfo(modelId=m.modelId, pipeline_tag=m.pipeline_tag, tags=m.tags) for m in model_list
]
break # Exit the loop if the operation is successful
except requests.exceptions.HTTPError as e:
if e.response.status_code == 429:
print("Rate limit exceeded. Retrying in 60 seconds...")
time.sleep(60)
else:
raise # Re-raise the exception if it's not a 429 error
model_data["cache_time"] = current_time

# Save the updated cache
Expand Down

0 comments on commit 83aa184

Please # to comment.