Spaces:

GlobalStudio
/

starflow

Running on Zero

leoeric committed 12 days ago

Commit

0a33f4f

1 Parent(s): b9eaf60

Fix log visibility: Display logs directly in UI instead of relying on file access

- Remove dependency on outputs/ folder for logs (not accessible in HF Spaces)
- Display all logs directly in the status output
- Show full STDERR, STDOUT, and log content in error messages
- No need to access Files tab - everything shown in UI
- Better for debugging GPU abort issues

Files changed (1) hide show

app.py +35 -61

app.py CHANGED Viewed

@@ -199,7 +199,8 @@ def _generate_image_impl(prompt, aspect_ratio, cfg, seed, checkpoint_file, confi
     status_msg += "   - Subsequent runs: Only generation time (~1-3 min)\n"
     try:
-        # Create output directory
         output_dir = Path("outputs")
         output_dir.mkdir(exist_ok=True)
@@ -218,18 +219,16 @@ def _generate_image_impl(prompt, aspect_ratio, cfg, seed, checkpoint_file, confi
             "--jacobi", "1",
             "--jacobi_th", "0.001",
             "--jacobi_block_size", "16",
-            "--logdir", str(output_dir)  # Set logdir to outputs directory
         ]
         status_msg += "🚀 Running generation...\n"
         status_msg += "📊 Current step: Model inference (checkpoint should already be downloaded)\n"
-        # Create log file for debugging
-        log_file = output_dir / "generation.log"
-        status_msg += f"\n📋 LOG FILE LOCATION:\n"
-        status_msg += f"   File: {log_file}\n"
-        status_msg += f"   View in Space: Files tab → outputs → generation.log\n"
-        status_msg += f"   (Logs are written in real-time during generation)\n\n"
         # Ensure GPU environment variables are passed to subprocess
         env = os.environ.copy()
@@ -266,39 +265,24 @@ def _generate_image_impl(prompt, aspect_ratio, cfg, seed, checkpoint_file, confi
             timeout=2700
         )
-        # Write comprehensive log file
-        with open(log_file, 'w') as log:
-            log.write("=== GENERATION LOG ===\n\n")
-            log.write(f"Command: {' '.join(cmd)}\n\n")
-            log.write(f"Environment Variables:\n")
-            log.write(f"  CUDA_VISIBLE_DEVICES={env.get('CUDA_VISIBLE_DEVICES', 'not set')}\n")
-            log.write(f"  CUDA_AVAILABLE={torch.cuda.is_available()}\n")
-            if torch.cuda.is_available():
-                log.write(f"  GPU_NAME={torch.cuda.get_device_name(0)}\n")
-                log.write(f"  GPU_MEMORY_TOTAL={torch.cuda.get_device_properties(0).total_memory / 1024**3:.2f} GB\n")
-            log.write(f"\n")
-            log.write("=== STDOUT ===\n")
-            log.write(result.stdout if result.stdout else "(empty)\n")
-            log.write("\n\n=== STDERR ===\n")
-            log.write(result.stderr if result.stderr else "(empty)\n")
-            log.write(f"\n\n=== RETURN CODE: {result.returncode} ===\n")
-            # Add note about GPU abort
-            if result.returncode != 0:
-                log.write(f"\n⚠️  PROCESS FAILED WITH RETURN CODE {result.returncode}\n")
-                log.write("This could indicate:\n")
-                log.write("- GPU abort/timeout\n")
-                log.write("- CUDA out of memory\n")
-                log.write("- Process killed by system\n")
-                log.write("- Model loading error\n")
-                log.write("\nCheck the STDERR section above for detailed error messages.\n")
-        # Read log file for detailed output
-        log_content = ""
-        if log_file.exists():
-            with open(log_file, 'r') as f:
-                log_content = f.read()
-            status_msg += f"\n📋 Full logs available at: {log_file}\n"
         if result.returncode != 0:
             error_msg = f"❌ Error during generation (return code: {result.returncode})\n\n"
@@ -343,28 +327,18 @@ def _generate_image_impl(prompt, aspect_ratio, cfg, seed, checkpoint_file, confi
                 stdout_preview = result.stdout[-5000:] if len(result.stdout) > 5000 else result.stdout
                 error_msg += f"{stdout_preview}\n\n"
-            # Show log file content if available
-            if log_content:
-                error_msg += f"=== LOG FILE CONTENT ({log_file}) ===\n"
-                # Show last 5000 chars of log
-                log_preview = log_content[-5000:] if len(log_content) > 5000 else log_content
-                error_msg += f"{log_preview}\n\n"
-            else:
-                error_msg += f"⚠️  Log file not found at: {log_file}\n\n"
-            # Instructions on where to find logs
             error_msg += f"{'='*80}\n"
-            error_msg += f"📁 HOW TO VIEW FULL LOGS:\n"
             error_msg += f"{'='*80}\n"
-            error_msg += f"OPTION 1 - Space Files Tab (Recommended):\n"
-            error_msg += f"  1. Click 'Files' tab in your Space\n"
-            error_msg += f"  2. Navigate to: outputs/generation.log\n"
-            error_msg += f"  3. Click to view/download the full log\n\n"
-            error_msg += f"OPTION 2 - Space Logs Tab:\n"
-            error_msg += f"  1. Click 'Logs' tab in your Space\n"
-            error_msg += f"  2. Look for messages starting with '[sample.py]'\n"
-            error_msg += f"  3. Check for GPU abort or CUDA errors\n\n"
-            error_msg += f"Full log path: {log_file}\n"
             error_msg += f"{'='*80}\n"
             return None, error_msg
@@ -413,9 +387,9 @@ def _generate_image_impl(prompt, aspect_ratio, cfg, seed, checkpoint_file, confi
             error_msg += f"Searched in: {output_dir} and {model_output_dir}\n"
             error_msg += debug_info
             if log_content:
-                error_msg += f"\n\n📋 Check log file for details: {log_file}\nLast 2000 chars:\n{log_content[-2000:]}"
             else:
-                error_msg += f"\n\nCheck stdout:\n{result.stdout[-1000:]}"
             return None, error_msg
     except Exception as e:

     status_msg += "   - Subsequent runs: Only generation time (~1-3 min)\n"
     try:
+        # Create the output directory for generated images (passed to --logdir below).
+        # Logs are not written here: outputs/ may not be visible in the HF Spaces Files tab, so they are shown in the UI instead.
         output_dir = Path("outputs")
         output_dir.mkdir(exist_ok=True)
             "--jacobi", "1",
             "--jacobi_th", "0.001",
             "--jacobi_block_size", "16",
+            "--logdir", str(output_dir)  # Set logdir to outputs directory for images
         ]
         status_msg += "🚀 Running generation...\n"
         status_msg += "📊 Current step: Model inference (checkpoint should already be downloaded)\n"
+        # Tell the user that logs are shown in the status output
+        status_msg += f"\n📋 LOGS:\n"
+        status_msg += f"   All logs will be shown in the status output below\n"
+        status_msg += f"   (Logs are captured in real-time)\n\n"
         # Ensure GPU environment variables are passed to subprocess
         env = os.environ.copy()
             timeout=2700
         )
+        # Build comprehensive log content for display (not relying on file access)
+        log_content_parts = []
+        log_content_parts.append("=== GENERATION LOG ===\n\n")
+        log_content_parts.append(f"Command: {' '.join(cmd)}\n\n")
+        log_content_parts.append(f"Environment Variables:\n")
+        log_content_parts.append(f"  CUDA_VISIBLE_DEVICES={env.get('CUDA_VISIBLE_DEVICES', 'not set')}\n")
+        log_content_parts.append(f"  CUDA_AVAILABLE={torch.cuda.is_available()}\n")
+        if torch.cuda.is_available():
+            log_content_parts.append(f"  GPU_NAME={torch.cuda.get_device_name(0)}\n")
+            log_content_parts.append(f"  GPU_MEMORY_TOTAL={torch.cuda.get_device_properties(0).total_memory / 1024**3:.2f} GB\n")
+        log_content_parts.append(f"\n")
+        log_content_parts.append("=== STDOUT ===\n")
+        log_content_parts.append(result.stdout if result.stdout else "(empty)\n")
+        log_content_parts.append("\n\n=== STDERR ===\n")
+        log_content_parts.append(result.stderr if result.stderr else "(empty)\n")
+        log_content_parts.append(f"\n\n=== RETURN CODE: {result.returncode} ===\n")
+        log_content = ''.join(log_content_parts)
         if result.returncode != 0:
             error_msg = f"❌ Error during generation (return code: {result.returncode})\n\n"
                 stdout_preview = result.stdout[-5000:] if len(result.stdout) > 5000 else result.stdout
                 error_msg += f"{stdout_preview}\n\n"
+            # Show full log content directly in error message (no file access needed)
+            error_msg += f"=== FULL GENERATION LOG ===\n"
+            error_msg += f"{log_content}\n\n"
+            # Instructions on where to find more info
             error_msg += f"{'='*80}\n"
+            error_msg += f"📁 ADDITIONAL DEBUGGING:\n"
             error_msg += f"{'='*80}\n"
+            error_msg += f"1. Check the Space 'Logs' tab for container logs\n"
+            error_msg += f"2. Look for messages from sample.py\n"
+            error_msg += f"3. Check for GPU abort or CUDA errors\n"
+            error_msg += f"4. All logs are shown above in this error message\n"
             error_msg += f"{'='*80}\n"
             return None, error_msg
             error_msg += f"Searched in: {output_dir} and {model_output_dir}\n"
             error_msg += debug_info
             if log_content:
+                error_msg += f"\n\n📋 Full log details:\n{log_content[-2000:]}"
             else:
+                error_msg += f"\n\nCheck stdout:\n{result.stdout[-1000:] if result.stdout else '(no output)'}"
             return None, error_msg
     except Exception as e: