anycoder

Runtime error

App Files Files Community

akhaliq HF Staff committed on Dec 24, 2025

Commit

2f53e3f

1 Parent(s): afb81bf

show reasoning

Browse files

Files changed (3) hide show

backend_api.py +47 -3
frontend/src/app/page.tsx +7 -3
frontend/src/lib/api.ts +45 -45

backend_api.py CHANGED Viewed

@@ -733,12 +733,49 @@ def cleanup_generated_code(code: str, language: str) -> str:
         return code
 @app.post("/api/generate")
 async def generate_code(
     request: CodeGenerationRequest,
     authorization: Optional[str] = Header(None)
 ):
     """Generate code based on user query - returns streaming response"""
     # Dev mode: No authentication required - just use server's HF_TOKEN
     # In production, you would check real OAuth tokens here
@@ -872,14 +909,21 @@ async def generate_code(
                             })
                             yield f"data: {event_data}\n\n"
                 # Clean up generated code (remove LLM explanatory text and markdown)
                 generated_code = cleanup_generated_code(generated_code, language)
-                # Send completion event (optimized - no timestamp in hot path)
-                completion_data = json.dumps({
                     "type": "complete",
                     "code": generated_code
-                })
                 yield f"data: {completion_data}\n\n"
                 # Auto-deploy after code generation (if authenticated and not skipped)

         return code
+def extract_reasoning(code: str, language: str) -> str:
+    """Extract LLM reasoning/explanatory text that's outside the main code block.
+
+    Two strategies are tried in order:
+      1. If the text contains a <think>...</think> pair (matched
+         case-insensitively), the stripped content of the first pair is
+         returned and nothing else is examined.
+      2. Otherwise the text before, between and after markdown fenced code
+         blocks is collected. Fragments of 10 characters or fewer (after
+         stripping) are dropped; the rest are joined with blank lines.
+
+    Args:
+        code: Text to scan; may mix prose, <think> tags and fenced code.
+        language: Not referenced anywhere in this function's body.
+
+    Returns:
+        The extracted text, or "" when `code` is empty, when neither a
+        <think> pair nor a fenced code block is found, or when an exception
+        is raised while extracting (the error is printed, not propagated).
+    """
+    try:
+        if not code:
+            return ""
+        # 1. Check for <think> tags (e.g. from DeepSeek-R1 or newer GLM-4).
+        #    re.search stops at the first pair; the lazy group keeps the match
+        #    from running on to a later closing tag.
+        think_match = re.search(r'<think>([\s\S]*?)</think>', code, re.IGNORECASE)
+        if think_match:
+            return think_match.group(1).strip()
+        # 2. Extract everything outside of markdown code blocks.
+        #    A block is an opening fence with an optional language tag, then a
+        #    newline, then lazily everything up to a closing fence on its own
+        #    line or, for an unterminated fence, the end of the text.
+        blocks = list(re.finditer(r'```(?:[\w]*)\s*\n([\s\S]*?)(?:\n```|$)', code, re.IGNORECASE))
+        if not blocks:
+            # No fenced block at all: nothing is treated as reasoning.
+            return ""
+        text_parts = []
+        last_end = 0  # index just past the previously matched block
+        for match in blocks:
+            # Text between the previous block (or the start) and this block.
+            pre_text = code[last_end:match.start()].strip()
+            if pre_text and len(pre_text) > 10:
+                text_parts.append(pre_text)
+            last_end = match.end()
+        # Text that trails the final block.
+        post_text = code[last_end:].strip()
+        if post_text and len(post_text) > 10:
+            text_parts.append(post_text)
+        return "\n\n".join(text_parts).strip()
+    except Exception as e:
+        # Best effort: log the failure and fall back to "no reasoning".
+        print(f"[Reasoning Extraction] Error: {e}")
+        return ""
 @app.post("/api/generate")
 async def generate_code(
     request: CodeGenerationRequest,
     authorization: Optional[str] = Header(None)
 ):
     """Generate code based on user query - returns streaming response"""
     # Dev mode: No authentication required - just use server's HF_TOKEN
     # In production, you would check real OAuth tokens here
                             })
                             yield f"data: {event_data}\n\n"
+                # Extract reasoning before cleaning up
+                reasoning = extract_reasoning(generated_code, language)
                 # Clean up generated code (remove LLM explanatory text and markdown)
                 generated_code = cleanup_generated_code(generated_code, language)
+                # Send completion event (include reasoning for GLM-4.7)
+                completion_dict = {
                     "type": "complete",
                     "code": generated_code
+                }
+                if selected_model_id == "zai-org/GLM-4.7" and reasoning:
+                    completion_dict["reasoning"] = reasoning
+                completion_data = json.dumps(completion_dict)
                 yield f"data: {completion_data}\n\n"
                 # Auto-deploy after code generation (if authenticated and not skipped)

frontend/src/app/page.tsx CHANGED Viewed

@@ -367,16 +367,20 @@ export default function Home() {
           });
         },
         // onComplete
-        (code: string) => {
           setGeneratedCode(code);
           setIsGenerating(false);
-          // Update final message - just show success, not the code
           setMessages((prev) => {
             const newMessages = [...prev];
             newMessages[newMessages.length - 1] = {
               ...assistantMessage,
-              content: '✅ Code generated successfully! Check the editor →',
             };
             return newMessages;
           });

           });
         },
         // onComplete
+        (code: string, reasoning?: string) => {
           setGeneratedCode(code);
           setIsGenerating(false);
+          // Update final message - include reasoning if available
           setMessages((prev) => {
             const newMessages = [...prev];
+            const content = reasoning
+              ? `✅ Code generated successfully!\n\n**Reasoning:**\n${reasoning}\n\nCheck the editor →`
+              : '✅ Code generated successfully! Check the editor →';
             newMessages[newMessages.length - 1] = {
               ...assistantMessage,
+              content: content,
             };
             return newMessages;
           });

frontend/src/lib/api.ts CHANGED Viewed

@@ -18,20 +18,20 @@ const getApiUrl = () => {
     console.log('[API Client] Using explicit API URL:', process.env.NEXT_PUBLIC_API_URL);
     return process.env.NEXT_PUBLIC_API_URL;
   }
   // For server-side rendering, always use relative URLs
   if (typeof window === 'undefined') {
     console.log('[API Client] SSR mode: using relative URLs');
     return '';
   }
   // On localhost (dev mode), use direct backend URL
   const hostname = window.location.hostname;
   if (hostname === 'localhost' || hostname === '127.0.0.1') {
     console.log('[API Client] Localhost dev mode: using http://localhost:8000');
     return 'http://localhost:8000';
   }
   // In production (HF Space), use relative URLs (Next.js proxies to backend)
   console.log('[API Client] Production mode: using relative URLs (proxied by Next.js)');
   return '';
@@ -70,23 +70,23 @@ class ApiClient {
         if (error.response && error.response.status === 401) {
           const errorData = error.response.data;
           const errorMessage = errorData?.detail || errorData?.message || '';
           // Only log out if it's an authentication/session issue
           // Don't log out for permission errors on specific resources
-          const shouldLogout =
             errorMessage.includes('Authentication required') ||
             errorMessage.includes('Invalid token') ||
             errorMessage.includes('Token expired') ||
             errorMessage.includes('Session expired') ||
             error.config?.url?.includes('/auth/');
           if (shouldLogout && typeof window !== 'undefined') {
             // Clear ALL authentication data including session token
             localStorage.removeItem('hf_oauth_token');
             localStorage.removeItem('hf_session_token');
             localStorage.removeItem('hf_user_info');
             this.token = null;
             // Dispatch custom event to notify UI components
             window.dispatchEvent(new CustomEvent('auth-expired', {
               detail: { message: 'Your session has expired. Please sign in again.' }
@@ -116,19 +116,19 @@ class ApiClient {
   // Cache helpers
   private getCachedData<T>(key: string, maxAgeMs: number): T | null {
     if (typeof window === 'undefined') return null;
     try {
       const cached = localStorage.getItem(key);
       if (!cached) return null;
       const { data, timestamp } = JSON.parse(cached);
       const age = Date.now() - timestamp;
       if (age > maxAgeMs) {
         localStorage.removeItem(key);
         return null;
       }
       return data;
     } catch (error) {
       console.error(`Failed to get cached data for ${key}:`, error);
@@ -138,7 +138,7 @@ class ApiClient {
   private setCachedData<T>(key: string, data: T): void {
     if (typeof window === 'undefined') return;
     try {
       localStorage.setItem(key, JSON.stringify({
         data,
@@ -161,26 +161,26 @@ class ApiClient {
       console.log('Fetching models from API...');
       const response = await this.client.get<Model[]>('/api/models');
       const models = response.data;
       // Cache the successful response
       if (models && models.length > 0) {
         this.setCachedData('anycoder_models', models);
         console.log('Cached', models.length, 'models (valid for 24 hours)');
       }
       return models;
     } catch (error: any) {
       // Handle connection errors gracefully
-      const isConnectionError =
-        error.code === 'ECONNABORTED' ||
-        error.code === 'ECONNRESET' ||
         error.code === 'ECONNREFUSED' ||
         error.message?.includes('socket hang up') ||
         error.message?.includes('timeout') ||
         error.message?.includes('Network Error') ||
         error.response?.status === 503 ||
         error.response?.status === 502;
       if (isConnectionError) {
         // Try to return stale cache if available
         const staleCache = this.getCachedData<Model[]>('anycoder_models', Infinity);
@@ -188,7 +188,7 @@ class ApiClient {
           console.warn('Backend not available, using stale cached models');
           return staleCache;
         }
         console.warn('Backend not available, cannot load models');
         return [];
       }
@@ -209,26 +209,26 @@ class ApiClient {
       console.log('Fetching languages from API...');
       const response = await this.client.get<{ languages: Language[] }>('/api/languages');
       const languages = response.data.languages;
       // Cache the successful response
       if (languages && languages.length > 0) {
         this.setCachedData('anycoder_languages', languages);
         console.log('Cached', languages.length, 'languages (valid for 24 hours)');
       }
       return response.data;
     } catch (error: any) {
       // Handle connection errors gracefully
-      const isConnectionError =
-        error.code === 'ECONNABORTED' ||
-        error.code === 'ECONNRESET' ||
         error.code === 'ECONNREFUSED' ||
         error.message?.includes('socket hang up') ||
         error.message?.includes('timeout') ||
         error.message?.includes('Network Error') ||
         error.response?.status === 503 ||
         error.response?.status === 502;
       if (isConnectionError) {
         // Try to return stale cache if available
         const staleCache = this.getCachedData<Language[]>('anycoder_languages', Infinity);
@@ -236,7 +236,7 @@ class ApiClient {
           console.warn('Backend not available, using stale cached languages');
           return { languages: staleCache };
         }
         // Fall back to default languages
         console.warn('Backend not available, using default languages');
         return { languages: ['html', 'gradio', 'transformers.js', 'streamlit', 'comfyui', 'react'] };
@@ -273,7 +273,7 @@ class ApiClient {
   generateCodeStream(
     request: CodeGenerationRequest,
     onChunk: (content: string) => void,
-    onComplete: (code: string) => void,
     onError: (error: string) => void,
     onDeploying?: (message: string) => void,
     onDeployed?: (message: string, spaceUrl: string) => void,
@@ -282,11 +282,11 @@ class ApiClient {
     // Build the URL correctly whether we have a base URL or not
     const baseUrl = API_URL || window.location.origin;
     const url = new URL('/api/generate', baseUrl);
     let abortController = new AbortController();
     let accumulatedCode = '';
     let buffer = ''; // Buffer for incomplete SSE lines
     // Use fetch with POST to support large payloads
     fetch(url.toString(), {
       method: 'POST',
@@ -303,21 +303,21 @@ class ApiClient {
           onError('⏱️ Rate limit exceeded. Free tier allows up to 20 requests per minute. Please wait a moment and try again.');
           return;
         }
         if (!response.ok) {
           throw new Error(`HTTP error! status: ${response.status}`);
         }
         if (!response.body) {
           throw new Error('Response body is null');
         }
         const reader = response.body.getReader();
         const decoder = new TextDecoder();
         while (true) {
           const { done, value } = await reader.read();
           if (done) {
             console.log('[Stream] Stream ended, total code length:', accumulatedCode.length);
             if (accumulatedCode) {
@@ -325,20 +325,20 @@ class ApiClient {
             }
             break;
           }
           // Decode chunk and add to buffer
           buffer += decoder.decode(value, { stream: true });
           // Process complete SSE messages (ending with \n\n)
           const messages = buffer.split('\n\n');
           // Keep the last incomplete message in the buffer
           buffer = messages.pop() || '';
           // Process each complete message
           for (const message of messages) {
             if (!message.trim()) continue;
             // Parse SSE format: "data: {...}"
             const lines = message.split('\n');
             for (const line of lines) {
@@ -347,7 +347,7 @@ class ApiClient {
                   const jsonStr = line.substring(6);
                   const data = JSON.parse(jsonStr);
                   console.log('[Stream] Received event:', data.type, data.content?.substring(0, 50));
                   if (data.type === 'chunk' && data.content) {
                     accumulatedCode += data.content;
                     onChunk(data.content);
@@ -355,7 +355,7 @@ class ApiClient {
                     console.log('[Stream] Generation complete, total code length:', data.code?.length || accumulatedCode.length);
                     // Use the complete code from the message if available, otherwise use accumulated
                     const finalCode = data.code || accumulatedCode;
-                    onComplete(finalCode);
                     // Don't return yet - might have deployment events coming
                   } else if (data.type === 'deploying') {
                     console.log('[Stream] Deployment started:', data.message);
@@ -419,7 +419,7 @@ class ApiClient {
     ws.onmessage = (event) => {
       try {
         const data = JSON.parse(event.data);
         if (data.type === 'chunk' && data.content) {
           onChunk(data.content);
         } else if (data.type === 'complete' && data.code) {
@@ -453,7 +453,7 @@ class ApiClient {
       space_name: request.space_name,
       existing_repo_id: request.existing_repo_id,
     });
     try {
       const response = await this.client.post<DeploymentResponse>('/api/deploy', request);
       console.log('[API Client] Deploy response:', response.status, response.data);
@@ -521,13 +521,13 @@ class ApiClient {
       const response = await axios.get('https://huggingface.co/api/spaces', {
         timeout: 5000,
       });
       // Filter for apps with 'anycoder' tag and sort by trendingScore
       const anycoderApps = response.data
         .filter((space: any) => space.tags && space.tags.includes('anycoder'))
         .sort((a: any, b: any) => (b.trendingScore || 0) - (a.trendingScore || 0))
         .slice(0, 6);
       return anycoderApps;
     } catch (error) {
       console.error('Failed to fetch trending anycoder apps:', error);

     console.log('[API Client] Using explicit API URL:', process.env.NEXT_PUBLIC_API_URL);
     return process.env.NEXT_PUBLIC_API_URL;
   }
   // For server-side rendering, always use relative URLs
   if (typeof window === 'undefined') {
     console.log('[API Client] SSR mode: using relative URLs');
     return '';
   }
   // On localhost (dev mode), use direct backend URL
   const hostname = window.location.hostname;
   if (hostname === 'localhost' || hostname === '127.0.0.1') {
     console.log('[API Client] Localhost dev mode: using http://localhost:8000');
     return 'http://localhost:8000';
   }
   // In production (HF Space), use relative URLs (Next.js proxies to backend)
   console.log('[API Client] Production mode: using relative URLs (proxied by Next.js)');
   return '';
         if (error.response && error.response.status === 401) {
           const errorData = error.response.data;
           const errorMessage = errorData?.detail || errorData?.message || '';
           // Only log out if it's an authentication/session issue
           // Don't log out for permission errors on specific resources
+          const shouldLogout =
             errorMessage.includes('Authentication required') ||
             errorMessage.includes('Invalid token') ||
             errorMessage.includes('Token expired') ||
             errorMessage.includes('Session expired') ||
             error.config?.url?.includes('/auth/');
           if (shouldLogout && typeof window !== 'undefined') {
             // Clear ALL authentication data including session token
             localStorage.removeItem('hf_oauth_token');
             localStorage.removeItem('hf_session_token');
             localStorage.removeItem('hf_user_info');
             this.token = null;
             // Dispatch custom event to notify UI components
             window.dispatchEvent(new CustomEvent('auth-expired', {
               detail: { message: 'Your session has expired. Please sign in again.' }
   // Cache helpers
   private getCachedData<T>(key: string, maxAgeMs: number): T | null {
     if (typeof window === 'undefined') return null;
     try {
       const cached = localStorage.getItem(key);
       if (!cached) return null;
       const { data, timestamp } = JSON.parse(cached);
       const age = Date.now() - timestamp;
       if (age > maxAgeMs) {
         localStorage.removeItem(key);
         return null;
       }
       return data;
     } catch (error) {
       console.error(`Failed to get cached data for ${key}:`, error);
   private setCachedData<T>(key: string, data: T): void {
     if (typeof window === 'undefined') return;
     try {
       localStorage.setItem(key, JSON.stringify({
         data,
       console.log('Fetching models from API...');
       const response = await this.client.get<Model[]>('/api/models');
       const models = response.data;
       // Cache the successful response
       if (models && models.length > 0) {
         this.setCachedData('anycoder_models', models);
         console.log('Cached', models.length, 'models (valid for 24 hours)');
       }
       return models;
     } catch (error: any) {
       // Handle connection errors gracefully
+      const isConnectionError =
+        error.code === 'ECONNABORTED' ||
+        error.code === 'ECONNRESET' ||
         error.code === 'ECONNREFUSED' ||
         error.message?.includes('socket hang up') ||
         error.message?.includes('timeout') ||
         error.message?.includes('Network Error') ||
         error.response?.status === 503 ||
         error.response?.status === 502;
       if (isConnectionError) {
         // Try to return stale cache if available
         const staleCache = this.getCachedData<Model[]>('anycoder_models', Infinity);
           console.warn('Backend not available, using stale cached models');
           return staleCache;
         }
         console.warn('Backend not available, cannot load models');
         return [];
       }
       console.log('Fetching languages from API...');
       const response = await this.client.get<{ languages: Language[] }>('/api/languages');
       const languages = response.data.languages;
       // Cache the successful response
       if (languages && languages.length > 0) {
         this.setCachedData('anycoder_languages', languages);
         console.log('Cached', languages.length, 'languages (valid for 24 hours)');
       }
       return response.data;
     } catch (error: any) {
       // Handle connection errors gracefully
+      const isConnectionError =
+        error.code === 'ECONNABORTED' ||
+        error.code === 'ECONNRESET' ||
         error.code === 'ECONNREFUSED' ||
         error.message?.includes('socket hang up') ||
         error.message?.includes('timeout') ||
         error.message?.includes('Network Error') ||
         error.response?.status === 503 ||
         error.response?.status === 502;
       if (isConnectionError) {
         // Try to return stale cache if available
         const staleCache = this.getCachedData<Language[]>('anycoder_languages', Infinity);
           console.warn('Backend not available, using stale cached languages');
           return { languages: staleCache };
         }
         // Fall back to default languages
         console.warn('Backend not available, using default languages');
         return { languages: ['html', 'gradio', 'transformers.js', 'streamlit', 'comfyui', 'react'] };
   generateCodeStream(
     request: CodeGenerationRequest,
     onChunk: (content: string) => void,
+    onComplete: (code: string, reasoning?: string) => void,
     onError: (error: string) => void,
     onDeploying?: (message: string) => void,
     onDeployed?: (message: string, spaceUrl: string) => void,
     // Build the URL correctly whether we have a base URL or not
     const baseUrl = API_URL || window.location.origin;
     const url = new URL('/api/generate', baseUrl);
     let abortController = new AbortController();
     let accumulatedCode = '';
     let buffer = ''; // Buffer for incomplete SSE lines
     // Use fetch with POST to support large payloads
     fetch(url.toString(), {
       method: 'POST',
           onError('⏱️ Rate limit exceeded. Free tier allows up to 20 requests per minute. Please wait a moment and try again.');
           return;
         }
         if (!response.ok) {
           throw new Error(`HTTP error! status: ${response.status}`);
         }
         if (!response.body) {
           throw new Error('Response body is null');
         }
         const reader = response.body.getReader();
         const decoder = new TextDecoder();
         while (true) {
           const { done, value } = await reader.read();
           if (done) {
             console.log('[Stream] Stream ended, total code length:', accumulatedCode.length);
             if (accumulatedCode) {
             }
             break;
           }
           // Decode chunk and add to buffer
           buffer += decoder.decode(value, { stream: true });
           // Process complete SSE messages (ending with \n\n)
           const messages = buffer.split('\n\n');
           // Keep the last incomplete message in the buffer
           buffer = messages.pop() || '';
           // Process each complete message
           for (const message of messages) {
             if (!message.trim()) continue;
             // Parse SSE format: "data: {...}"
             const lines = message.split('\n');
             for (const line of lines) {
                   const jsonStr = line.substring(6);
                   const data = JSON.parse(jsonStr);
                   console.log('[Stream] Received event:', data.type, data.content?.substring(0, 50));
                   if (data.type === 'chunk' && data.content) {
                     accumulatedCode += data.content;
                     onChunk(data.content);
                     console.log('[Stream] Generation complete, total code length:', data.code?.length || accumulatedCode.length);
                     // Use the complete code from the message if available, otherwise use accumulated
                     const finalCode = data.code || accumulatedCode;
+                    onComplete(finalCode, data.reasoning);
                     // Don't return yet - might have deployment events coming
                   } else if (data.type === 'deploying') {
                     console.log('[Stream] Deployment started:', data.message);
     ws.onmessage = (event) => {
       try {
         const data = JSON.parse(event.data);
         if (data.type === 'chunk' && data.content) {
           onChunk(data.content);
         } else if (data.type === 'complete' && data.code) {
       space_name: request.space_name,
       existing_repo_id: request.existing_repo_id,
     });
     try {
       const response = await this.client.post<DeploymentResponse>('/api/deploy', request);
       console.log('[API Client] Deploy response:', response.status, response.data);
       const response = await axios.get('https://huggingface.co/api/spaces', {
         timeout: 5000,
       });
       // Filter for apps with 'anycoder' tag and sort by trendingScore
       const anycoderApps = response.data
         .filter((space: any) => space.tags && space.tags.includes('anycoder'))
         .sort((a: any, b: any) => (b.trendingScore || 0) - (a.trendingScore || 0))
         .slice(0, 6);
       return anycoderApps;
     } catch (error) {
       console.error('Failed to fetch trending anycoder apps:', error);