# gpu-services/hub-api/middleware/rate_limit.py

from fastapi import HTTPException

from services.registry import registry


def check_backend_rate_limit(backend_id: str):
    """Enforce the rate limit for the backend identified by ``backend_id``.

    Delegates the decision to ``registry.check_rate_limit``. When that call
    returns a truthy value the function returns ``None`` and the caller may
    proceed.

    Raises:
        HTTPException: status 429 with a nested ``{"error": {...}}`` detail
            payload (message, type, code) when the registry check returns a
            falsy value.
    """
    # Guard clause: nothing to do while the registry allows the request.
    if registry.check_rate_limit(backend_id):
        return

    error_body = {
        "message": f"Rate limit exceeded for backend '{backend_id}'",
        "type": "rate_limit_error",
        "code": "rate_limit_exceeded",
    }
    raise HTTPException(status_code=429, detail={"error": error_body})