Spaces:

akhaliq
/

anycoder

Running

App Files Files Community

akhaliq HF Staff committed on 4 days ago

Commit

3c247ba

1 Parent(s): e6104d9

update

Browse files

Files changed (3) hide show

backend_api.py +56 -3
frontend/src/app/page.tsx +33 -15
frontend/src/lib/api.ts +6 -0

backend_api.py CHANGED Viewed

@@ -90,7 +90,7 @@ def get_cached_client(model_id: str, provider: str = "auto"):
 # Define models and languages here to avoid importing Gradio UI
 AVAILABLE_MODELS = [
     {"name": "Gemini 3.0 Pro", "id": "gemini-3.0-pro", "description": "Google Gemini 3.0 Pro via Poe with advanced reasoning"},
-    {"name": "Grok 4.1 Fast", "id": "x-ai/grok-4.1-fast", "description": "Grok 4.1 Fast model via OpenRouter"},
     {"name": "MiniMax M2", "id": "MiniMaxAI/MiniMax-M2", "description": "MiniMax M2 model via HuggingFace InferenceClient with Novita provider"},
     {"name": "DeepSeek V3.2-Exp", "id": "deepseek-ai/DeepSeek-V3.2-Exp", "description": "DeepSeek V3.2 Experimental via HuggingFace"},
     {"name": "DeepSeek R1", "id": "deepseek-ai/DeepSeek-R1-0528", "description": "DeepSeek R1 model for code generation"},
@@ -490,16 +490,69 @@ async def generate_code(
                 yield f"data: {completion_data}\n\n"
             except Exception as e:
                 error_data = json.dumps({
                     "type": "error",
-                    "message": str(e)
                 })
                 yield f"data: {error_data}\n\n"
         except Exception as e:
             error_data = json.dumps({
                 "type": "error",
-                "message": f"Generation error: {str(e)}"
             })
             yield f"data: {error_data}\n\n"

 # Define models and languages here to avoid importing Gradio UI
 AVAILABLE_MODELS = [
     {"name": "Gemini 3.0 Pro", "id": "gemini-3.0-pro", "description": "Google Gemini 3.0 Pro via Poe with advanced reasoning"},
+    {"name": "Grok 4.1 Fast", "id": "x-ai/grok-4.1-fast", "description": "Grok 4.1 Fast model via OpenRouter (20 req/min on free tier)"},
     {"name": "MiniMax M2", "id": "MiniMaxAI/MiniMax-M2", "description": "MiniMax M2 model via HuggingFace InferenceClient with Novita provider"},
     {"name": "DeepSeek V3.2-Exp", "id": "deepseek-ai/DeepSeek-V3.2-Exp", "description": "DeepSeek V3.2 Experimental via HuggingFace"},
     {"name": "DeepSeek R1", "id": "deepseek-ai/DeepSeek-R1-0528", "description": "DeepSeek R1 model for code generation"},
                 yield f"data: {completion_data}\n\n"
             except Exception as e:
+                # Handle rate limiting and other API errors
+                error_message = str(e)
+                is_rate_limit = False
+                error_type = type(e).__name__
+                # Check for OpenAI SDK rate limit errors
+                if error_type == "RateLimitError" or "rate_limit" in error_type.lower():
+                    is_rate_limit = True
+                # Check if this is a rate limit error (429 status code)
+                elif hasattr(e, 'status_code') and e.status_code == 429:
+                    is_rate_limit = True
+                # Check error message for rate limit indicators
+                elif "429" in error_message or "rate limit" in error_message.lower() or "too many requests" in error_message.lower():
+                    is_rate_limit = True
+                if is_rate_limit:
+                    # Try to extract retry-after header or message
+                    retry_after = None
+                    if hasattr(e, 'response') and e.response:
+                        retry_after = e.response.headers.get('Retry-After') or e.response.headers.get('retry-after')
+                    # Also check if the error object has retry_after
+                    elif hasattr(e, 'retry_after'):
+                        retry_after = str(e.retry_after)
+                    if selected_model_id == "x-ai/grok-4.1-fast" or selected_model_id.startswith("openrouter/"):
+                        error_message = "⏱️ Rate limit exceeded for OpenRouter model"
+                        if retry_after:
+                            error_message += f". Please wait {retry_after} seconds before trying again."
+                        else:
+                            error_message += ". Free tier allows up to 20 requests per minute. Please wait a moment and try again."
+                    else:
+                        error_message = f"⏱️ Rate limit exceeded. Please wait before trying again."
+                        if retry_after:
+                            error_message += f" Retry after {retry_after} seconds."
+                # Check for other common API errors
+                elif hasattr(e, 'status_code'):
+                    if e.status_code == 401:
+                        error_message = "❌ Authentication failed. Please check your API key."
+                    elif e.status_code == 403:
+                        error_message = "❌ Access forbidden. Please check your API key permissions."
+                    elif e.status_code == 500 or e.status_code == 502 or e.status_code == 503:
+                        error_message = "❌ Service temporarily unavailable. Please try again later."
                 error_data = json.dumps({
                     "type": "error",
+                    "message": error_message
                 })
                 yield f"data: {error_data}\n\n"
         except Exception as e:
+            # Fallback error handling
+            error_message = str(e)
+            # Check if it's a rate limit error in the exception message
+            if "429" in error_message or "rate limit" in error_message.lower() or "too many requests" in error_message.lower():
+                if selected_model_id == "x-ai/grok-4.1-fast" or selected_model_id.startswith("openrouter/"):
+                    error_message = "⏱️ Rate limit exceeded for OpenRouter model. Free tier allows up to 20 requests per minute. Please wait a moment and try again."
+                else:
+                    error_message = "⏱️ Rate limit exceeded. Please wait before trying again."
             error_data = json.dumps({
                 "type": "error",
+                "message": f"Generation error: {error_message}"
             })
             yield f"data: {error_data}\n\n"

frontend/src/app/page.tsx CHANGED Viewed

@@ -59,6 +59,8 @@ export default function Home() {
   // Track if we've attempted to fetch username to avoid repeated failures
   const usernameFetchAttemptedRef = useRef(false);
   // Check auth on mount and handle OAuth callback
   useEffect(() => {
@@ -68,8 +70,9 @@ export default function Home() {
     // initializeOAuth already handles this, but we call checkAuth to sync state
     const urlParams = new URLSearchParams(window.location.search);
     if (urlParams.get('session')) {
-      // OAuth callback - reset username fetch attempt and check auth after a brief delay
       usernameFetchAttemptedRef.current = false;
       setTimeout(() => checkAuth(), 200);
     }
   }, []); // Only run once on mount
@@ -79,8 +82,11 @@ export default function Home() {
   useEffect(() => {
     const handleStorageChange = (e: StorageEvent) => {
       if (e.key === 'hf_oauth_token' || e.key === 'hf_user_info') {
-        // Reset username fetch attempt when storage changes
-        usernameFetchAttemptedRef.current = false;
         checkAuth();
       }
     };
@@ -90,10 +96,16 @@ export default function Home() {
   }, []);
   // Listen for window focus (user returns to tab after OAuth redirect)
   useEffect(() => {
     const handleFocus = () => {
-      // Reset username fetch attempt on focus (user might have logged in elsewhere)
-      usernameFetchAttemptedRef.current = false;
       checkAuth();
     };
@@ -111,18 +123,18 @@ export default function Home() {
       if (token) {
         apiClient.setToken(token);
-        // Get username from auth status (only if we don't have it yet and haven't failed)
-        // This is a one-time fetch per session, not polling
-        if (!username && !usernameFetchAttemptedRef.current) {
           usernameFetchAttemptedRef.current = true;
           try {
             const authStatus = await apiClient.getAuthStatus();
             if (authStatus.username) {
               setUsername(authStatus.username);
             }
           } catch (error: any) {
-            // Silently handle connection errors - don't spam console
-            // Connection errors mean backend isn't available, which is OK for client-side auth
             const isConnectionError =
               error.code === 'ECONNABORTED' ||
               error.code === 'ECONNRESET' ||
@@ -133,12 +145,16 @@ export default function Home() {
               error.response?.status === 503 ||
               error.response?.status === 502;
-            if (!isConnectionError) {
-              // Only log non-connection errors
               console.error('Failed to get username:', error);
             }
-            // Reset attempt flag so we can try again later (e.g., when backend comes up)
-            usernameFetchAttemptedRef.current = false;
           }
         }
       } else {
@@ -148,14 +164,16 @@ export default function Home() {
           setUsername(null);
         }
         usernameFetchAttemptedRef.current = false;
       }
     } else {
-      // Not authenticated - clear username and reset fetch attempt
       apiClient.setToken(null);
       if (username) {
         setUsername(null);
       }
       usernameFetchAttemptedRef.current = false;
     }
   };

   // Track if we've attempted to fetch username to avoid repeated failures
   const usernameFetchAttemptedRef = useRef(false);
+  // Track if backend appears to be unavailable (to avoid repeated failed requests)
+  const backendUnavailableRef = useRef(false);
   // Check auth on mount and handle OAuth callback
   useEffect(() => {
     // initializeOAuth already handles this, but we call checkAuth to sync state
     const urlParams = new URLSearchParams(window.location.search);
     if (urlParams.get('session')) {
+      // OAuth callback - reset both flags and check auth after a brief delay
       usernameFetchAttemptedRef.current = false;
+      backendUnavailableRef.current = false; // Reset backend status on OAuth callback
       setTimeout(() => checkAuth(), 200);
     }
   }, []); // Only run once on mount
   useEffect(() => {
     const handleStorageChange = (e: StorageEvent) => {
       if (e.key === 'hf_oauth_token' || e.key === 'hf_user_info') {
+        // Only reset username fetch if we have a token (might be logging in)
+        if (e.newValue) {
+          usernameFetchAttemptedRef.current = false;
+          backendUnavailableRef.current = false; // Reset backend status on login
+        }
         checkAuth();
       }
     };
   }, []);
   // Listen for window focus (user returns to tab after OAuth redirect)
+  // The retry flags are only reset when we're authenticated; checkAuth() itself always runs on focus
   useEffect(() => {
     const handleFocus = () => {
+      // Only reset and check if we're authenticated (might have logged in elsewhere)
+      // Don't reset if backend is known to be unavailable and we're not authenticated
+      const authenticated = checkIsAuthenticated();
+      if (authenticated) {
+        usernameFetchAttemptedRef.current = false;
+        backendUnavailableRef.current = false; // Reset backend status - might be back up
+      }
       checkAuth();
     };
       if (token) {
         apiClient.setToken(token);
+        // Get username from auth status (only if we don't have it yet and backend is available)
+        // Skip if backend is known to be unavailable to avoid repeated failed requests
+        if (!username && !usernameFetchAttemptedRef.current && !backendUnavailableRef.current) {
           usernameFetchAttemptedRef.current = true;
           try {
             const authStatus = await apiClient.getAuthStatus();
             if (authStatus.username) {
               setUsername(authStatus.username);
+              backendUnavailableRef.current = false; // Backend is working
             }
           } catch (error: any) {
+            // Check if this is a connection error
             const isConnectionError =
               error.code === 'ECONNABORTED' ||
               error.code === 'ECONNRESET' ||
               error.response?.status === 503 ||
               error.response?.status === 502;
+            if (isConnectionError) {
+              // Mark backend as unavailable to avoid repeated requests
+              backendUnavailableRef.current = true;
+              // Don't reset attempt flag - keep it true so we don't retry until explicitly reset
+              // This prevents repeated failed requests when backend is down
+            } else {
+              // Non-connection error - log it and reset attempt flag
               console.error('Failed to get username:', error);
+              usernameFetchAttemptedRef.current = false;
             }
           }
         }
       } else {
           setUsername(null);
         }
         usernameFetchAttemptedRef.current = false;
+        backendUnavailableRef.current = false;
       }
     } else {
+      // Not authenticated - clear username and reset flags
       apiClient.setToken(null);
       if (username) {
         setUsername(null);
       }
       usernameFetchAttemptedRef.current = false;
+      // Keep backendUnavailableRef as is - it's useful information even when not authenticated
     }
   };

frontend/src/lib/api.ts CHANGED Viewed

@@ -177,6 +177,12 @@ class ApiClient {
       signal: abortController.signal,
     })
       .then(async (response) => {
         if (!response.ok) {
           throw new Error(`HTTP error! status: ${response.status}`);
         }

       signal: abortController.signal,
     })
       .then(async (response) => {
+        // Handle rate limit errors before parsing response
+        if (response.status === 429) {
+          onError('⏱️ Rate limit exceeded. Free tier allows up to 20 requests per minute. Please wait a moment and try again.');
+          return;
+        }
         if (!response.ok) {
           throw new Error(`HTTP error! status: ${response.status}`);
         }