Spaces:

TeddyYao
/

grok4-gpqa-eval

Sleeping

App Files Files Community

grok4-gpqa-eval / apis /base_api.py

TeddyYao

Upload 38 files

8474f02 verified 5 months ago

raw

history blame

2.34 kB

	from abc import ABC, abstractmethod
	import time
	import asyncio
	from typing import List, Dict, Any, Optional

	class BaseAPI(ABC):
	"""Base class for all API implementations"""

	def __init__(self, api_key: str, model_name: str, **kwargs):
	self.api_key = api_key
	self.model_name = model_name
	self.rate_limit_delay = kwargs.get('rate_limit_delay', 1.0)
	self.max_retries = kwargs.get('max_retries', 3)
	self.timeout = kwargs.get('timeout', 30)

	@abstractmethod
	async def generate_response(self, prompt: str, **kwargs) -> str:
	"""Generate a response from the model"""
	pass

	async def generate_with_retry(self, prompt: str, **kwargs) -> str:
	"""Generate response with retry logic"""
	for attempt in range(self.max_retries):
	try:
	response = await self.generate_response(prompt, **kwargs)
	return response
	except Exception as e:
	error_str = str(e).lower()

	# Check if it's a timeout error
	if 'timeout' in error_str or 'timed out' in error_str:
	# For timeout errors, use longer backoff
	max_retries = min(self.max_retries + 2, 5) # Allow more retries for timeouts
	if attempt < max_retries - 1:
	backoff = min(60, 5 * (2 ** attempt)) # Max 60 seconds wait
	print(f"Timeout error, retrying in {backoff}s... (attempt {attempt + 1}/{max_retries})")
	await asyncio.sleep(backoff)
	continue

	# For other errors, use standard backoff
	if attempt == self.max_retries - 1:
	raise e

	backoff = min(30, 2 ** attempt) # Max 30 seconds for other errors
	await asyncio.sleep(backoff)

	async def batch_generate(self, prompts: List[str], **kwargs) -> List[str]:
	"""Generate responses for multiple prompts"""
	responses = []
	for prompt in prompts:
	response = await self.generate_with_retry(prompt, **kwargs)
	responses.append(response)
	await asyncio.sleep(self.rate_limit_delay)
	return responses