Update app.py

app.py CHANGED
@@ -11,14 +11,19 @@ import io
- from huggingface_hub import snapshot_download, hf_hub_download
@@ -38,6 +43,7 @@ os.makedirs(CACHE_DIR, exist_ok=True)
@@ -52,6 +58,9 @@ openlrm_model = None
@@ -90,6 +99,12 @@ def process_with_timeout(function, args, timeout):
@@ -135,21 +150,49 @@ def preprocess_image(image_path):
- #
-         # Create a
- #
-     if model_loaded:
@@ -160,103 +203,69 @@ def load_openlrm_model():
-         print("
-         # For Hugging Face free tier, use the smaller model
-         model_repo = "zxhezexin/openlrm-mix-small-1.1"  # Smallest OpenLRM model that works well
-         model_file = "model.safetensors"
-         model_path = hf_hub_download(
-             repo_id=model_repo,
-             filename=model_file,
-             cache_dir=CACHE_DIR,
-             resume_download=True
-         )
-         # Download config file
-         config_path = hf_hub_download(
-             repo_id=model_repo,
-             filename="config.json",
-             cache_dir=CACHE_DIR,
-             resume_download=True
-         )
-         # Load OpenLRM for inference
-         # Simplified loading for memory efficiency
-         config = AutoConfig.from_pretrained(config_path)
-         # Initialize a lightweight model class
-         class OpenLRMWrapper:
-             def __init__(self, model_path, config, device):
-                 self.model_path = model_path
-                 self.config = config
-                 self.model = None
-                 from transformers import AutoModelForSeq2SeqLM
-                 # Load model with minimal memory footprint for Hugging Face free tier
-                 self.model = AutoModelForSeq2SeqLM.from_pretrained(
-                     self.model_path,
-                     config=self.config,
-                     torch_dtype=torch.float16 if self.device == "cuda" else torch.float32,
-                     device_map=self.device
-                 )
-                     transforms.ToTensor(),
-                     transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225])
-                 ])
-                 tensor = transform(image).unsqueeze(0).to(self.device)
-                 return tensor
-         # Create
-         openlrm_model =
-         print(f"
-         print(f"Error
-         # Fallback to depth estimation model if OpenLRM fails
-         load_depth_model()
@@ -264,18 +273,37 @@ def load_depth_model():
-         print("Loading depth estimation model
-         model_name =
@@ -285,25 +313,73 @@
- # Process image to create 3D model using
-         # Load OpenLRM model
-         processing_jobs[job_id]['progress'] =
-         # Process with
-         # This is where the magic happens - OpenLRM will create a full 3D model
@@ -326,61 +402,76 @@ def process_openlrm(image, job_id, detail_level='medium', output_format='obj'):
-     # Create mesh with
- def generate_sample_vertices():
-     # Create a cube-like object for testing
-     x = np.linspace(-1, 1, 10)
-     y = np.linspace(-1, 1, 10)
-     z = np.linspace(-1, 1, 10)
-     x_grid, y_grid, z_grid = np.meshgrid(x, y, z)
-     vertices = np.vstack([x_grid.flatten(), y_grid.flatten(), z_grid.flatten()]).T
-     return vertices
- def generate_sample_faces():
-     # Create simple faces connecting vertices
-     faces = []
-     n = 10  # Grid size from generate_sample_vertices
-     for i in range(n-1):
-         for j in range(n-1):
-             for k in range(n-1):
-                 idx = i*n*n + j*n + k
-                 faces.append([idx, idx+1, idx+n])
-                 faces.append([idx+1, idx+n+1, idx+n])
-     return np.array(faces)
-     for i,
@@ -390,40 +481,58 @@ def sample_texture_from_image(image, vertices):
-         # Load depth model
-         if depth_model is None or feature_extractor is None:
-             depth_model, feature_extractor = load_depth_model()
-         outputs = depth_model(**inputs)
-         predicted_depth = outputs.predicted_depth
-         # Normalize and resize depth to original image size
-         depth_map = F.interpolate(
-             predicted_depth.unsqueeze(1),
-             size=(image.height, image.width),
-             mode="bicubic",
-             align_corners=False,
-         ).squeeze().cpu().numpy()
@@ -434,12 +543,24 @@ def process_depth_based(image, job_id, detail_level='medium', output_format='obj'):
@@ -548,7 +669,7 @@ def depth_to_mesh(depth_map, image, resolution=100, detail_level='medium'):
-     if image:
@@ -556,153 +677,149 @@ def depth_to_mesh(depth_map, image, resolution=100, detail_level='medium'):
-                     img_x = j * (img_array.shape[1] - 1) / (resolution - 1)
-                     img_y = i * (img_array.shape[0] - 1) / (resolution - 1)
-                     # Bilinear interpolation
-                     x0, y0 = int(img_x), int(img_y)
-                     x1, y1 = min(x0 + 1, img_array.shape[1] - 1), min(y0 + 1, img_array.shape[0] - 1)
-                     # Interpolation weights
-                     wx = img_x - x0
-                     wy = img_y - y0
-                                 (1-wx)*wy*img_array[y1, x0, 0] + wx*wy*img_array[y1, x1, 0])
-                         g = int((1-wx)*(1-wy)*img_array[y0, x0, 1] + wx*(1-wy)*img_array[y0, x1, 1] +
-                                 (1-wx)*wy*img_array[y1, x0, 1] + wx*wy*img_array[y1, x1, 1])
-                         b = int((1-wx)*(1-wy)*img_array[y0, x0, 2] + wx*(1-wy)*img_array[y0, x1, 2] +
-                                 (1-wx)*wy*img_array[y1, x0, 2] + wx*wy*img_array[y1, x1, 2])
-                         vertex_colors[vertex_idx, :3] = [r, g, b]
-                         vertex_colors[vertex_idx, 3] = 255  # Alpha
-                             vertex_colors[vertex_idx, c] = int((1-wx)*(1-wy)*img_array[y0, x0, c] +
-                                                                wx*(1-wy)*img_array[y0, x1, c] +
-                                                                (1-wx)*wy*img_array[y1, x0, c] +
-                                                                wx*wy*img_array[y1, x1, c])
- # Create a watertight model by adding side panels
-     # If no boundary edges, return the original mesh
-     if len(boundary_edges) == 0:
-         return mesh
-     # Create side panels along boundary edges
-     new_faces = []
-     # Sort boundary edges to form loops
-     edge_loops = []
-     current_loop = [boundary_edges[0][0], boundary_edges[0][1]]
-     boundary_edges = boundary_edges[1:]
-     # Try to create continuous edge loops
-     while len(boundary_edges) > 0:
-         found = False
-         for i, edge in enumerate(boundary_edges):
-             if edge[0] == current_loop[-1]:
-                 current_loop.append(edge[1])
-                 boundary_edges = np.delete(boundary_edges, i, axis=0)
-                 found = True
-                 break
-             elif edge[1] == current_loop[-1]:
-                 current_loop.append(edge[0])
-                 boundary_edges = np.delete(boundary_edges, i, axis=0)
-                 found = True
-                 break
-     # Create
-     # Add new faces to the mesh
-     if len(new_faces) > 0:
-         new_faces = np.array(new_faces)
-         combined_faces = np.vstack([mesh.faces, new_faces])
-         watertight_mesh = trimesh.Trimesh(vertices=mesh.vertices, faces=combined_faces)
-         "model": "Enhanced 3D Model Generator
-         "device": "cuda" if torch.cuda.is_available() else "cpu"
@@ -736,7 +853,7 @@ def progress(job_id):
@@ -763,6 +880,12 @@ def convert_image_to_3d():
@@ -869,9 +992,7 @@ def convert_image_to_3d():
-         if torch.cuda.is_available():
-             torch.cuda.empty_cache()
@@ -1014,7 +1135,7 @@ def model_info(job_id):
-         "message": "Enhanced 3D Model Generator
@@ -1028,164 +1149,49 @@ def index():
-         "description": "This API creates high-quality 3D models from 2D images with full 3D structure and texturing"
-     if 'image' not in request.files:
-         return jsonify({"error": "No image provided"}), 400
-     file = request.files['image']
-     if file.filename == '':
-         return jsonify({"error": "No image selected"}), 400
-     if not allowed_file(file.filename):
-         return jsonify({"error": f"File type not allowed. Supported types: {', '.join(ALLOWED_EXTENSIONS)}"}), 400
-     # Create a job ID
-     job_id = str(uuid.uuid4())
-     output_dir = os.path.join(RESULTS_FOLDER, job_id)
-     os.makedirs(output_dir, exist_ok=True)
-     # Save the uploaded file
-     filename = secure_filename(file.filename)
-     filepath = os.path.join(app.config['UPLOAD_FOLDER'], f"{job_id}_{filename}")
-     file.save(filepath)
-         processing_jobs[job_id]['progress'] = 10
-         # Dictionary to store results
-         result_urls = {}
-         # Process with both models
-         try:
-             # First try with OpenLRM for full 3D
-             processing_jobs[job_id]['progress'] = 30
-             openlrm_mesh = process_openlrm(image, job_id, 'medium', 'glb')
-             # Export OpenLRM result
-             openlrm_path = os.path.join(output_dir, "model_openlrm.glb")
-             openlrm_mesh.export(openlrm_path, file_type='glb')
-             result_urls['openlrm'] = f"/compare-download/{job_id}/openlrm"
-             processing_jobs[job_id]['progress'] = 60
-             # Then process with depth-based approach
-             depth_mesh = process_depth_based(image, job_id, 'medium', 'glb')
-             # Export depth-based result
-             depth_path = os.path.join(output_dir, "model_depth.glb")
-             depth_mesh.export(depth_path, file_type='glb')
-             result_urls['depth'] = f"/compare-download/{job_id}/depth"
-             processing_jobs[job_id]['progress'] = 90
-         except Exception as e:
-             print(f"Error in comparison processing: {str(e)}")
-             # If at least one model was successful, continue
-             if not result_urls:
-                 raise
-         # Update job status
-         processing_jobs[job_id]['status'] = 'completed'
-         processing_jobs[job_id]['progress'] = 100
-         processing_jobs[job_id]['result_urls'] = result_urls
-         processing_jobs[job_id]['completed_at'] = time.time()
-         # Clean up temporary file
-         if os.path.exists(filepath):
-             os.remove(filepath)
-         # Force garbage collection
-         gc.collect()
-         if torch.cuda.is_available():
-             torch.cuda.empty_cache()
-         # Clean up on error
-         if os.path.exists(filepath):
-             os.remove(filepath)
-     # Start processing thread
-     processing_thread = threading.Thread(target=process_comparison)
-     processing_thread.daemon = True
-     processing_thread.start()
-     # Return job ID immediately
-     return jsonify({"job_id": job_id, "check_progress_at": f"/progress/{job_id}"}), 202
- @app.route('/compare-download/<job_id>/<model_type>', methods=['GET'])
- def download_comparison_model(job_id, model_type):
-     if job_id not in processing_jobs or processing_jobs[job_id]['status'] != 'completed':
-         return jsonify({"error": "Model not found or processing not complete"}), 404
-     if 'comparison' not in processing_jobs[job_id] or not processing_jobs[job_id]['comparison']:
-         return jsonify({"error": "This is not a comparison job"}), 400
-     if model_type not in ['openlrm', 'depth']:
-         return jsonify({"error": "Invalid model type"}), 400
-     # Get the output directory for this job
-     output_dir = os.path.join(RESULTS_FOLDER, job_id)
-     model_path = os.path.join(output_dir, f"model_{model_type}.glb")
-     if os.path.exists(model_path):
-         return send_file(model_path, as_attachment=True, download_name=f"model_{model_type}.glb")
-     token = request.json.get('token')
-     if token != 'admin_secure_token':  # Replace with proper auth
-         return jsonify({"error": "Unauthorized"}), 401
-     # Install dependencies
-     import subprocess
-     # Install rembg for background removal
-     subprocess.check_call([sys.executable, "-m", "pip", "install", "rembg"])
-     # Try to install torchmcubes with CUDA support
-     try:
-         subprocess.check_call([sys.executable, "-m", "pip", "uninstall", "-y", "torchmcubes"])
-         subprocess.check_call([sys.executable, "-m", "pip", "install", "git+https://github.com/tatsy/torchmcubes.git"])
-     except:
-         print("Could not install torchmcubes with CUDA support")
-     return jsonify({"message": "Dependencies installed successfully"}), 200
-     except Exception as e:
-         return jsonify({"error": f"Failed to install dependencies: {str(e)}"}), 500
  11    import zipfile
  12    import uuid
  13    import traceback
  14 +  from huggingface_hub import snapshot_download, hf_hub_download, login
  15    from flask_cors import CORS
  16    import numpy as np
  17    import trimesh
  18    from scipy.ndimage import gaussian_filter
  19    import cv2
  20    import torch.nn.functional as F
  21 +
  22 +  # Try to login with token if available
  23 +  HF_TOKEN = os.environ.get("HF_TOKEN", None)
  24 +  if HF_TOKEN:
  25 +      print("Logging in with Hugging Face token")
  26 +      login(token=HF_TOKEN)
  27
  28    app = Flask(__name__)
  29    CORS(app)  # Enable CORS for all routes

  43    os.environ['HF_HOME'] = CACHE_DIR
  44    os.environ['TRANSFORMERS_CACHE'] = os.path.join(CACHE_DIR, 'transformers')
  45    os.environ['HF_DATASETS_CACHE'] = os.path.join(CACHE_DIR, 'datasets')
  46 +  os.environ['PYTORCH_CUDA_ALLOC_CONF'] = 'max_split_size_mb:128'  # Limit CUDA memory splits
  47
  48    app.config['UPLOAD_FOLDER'] = UPLOAD_FOLDER
  49    app.config['MAX_CONTENT_LENGTH'] = 16 * 1024 * 1024  # 16MB max
  58    model_loaded = False
  59    model_loading = False
  60
  61 +  # Flag to control whether to use simplified mode (for Hugging Face Spaces)
  62 +  USE_SIMPLIFIED_MODE = os.environ.get('USE_SIMPLIFIED_MODE', 'false').lower() == 'true'
  63 +
  64    # Constants for processing
  65    TIMEOUT_SECONDS = 240  # 4 minutes max for processing
  66    MAX_DIMENSION = 512  # Max image dimension to process

  99
 100        return result[0], None
 101
 102 +  def optimize_memory():
 103 +      """Free up memory to avoid OOM errors"""
 104 +      gc.collect()
 105 +      if torch.cuda.is_available():
 106 +          torch.cuda.empty_cache()
 107 +
 108    def allowed_file(filename):
 109        return '.' in filename and filename.rsplit('.', 1)[1].lower() in ALLOWED_EXTENSIONS
 110
 150
 151        return img
 152
 153 +  # Try to remove background - simplified version that won't fail if rembg is not available
 154    def remove_background(image):
 155 +      """Remove background if rembg is available, otherwise return original image"""
 156        try:
 157            import rembg
 158            return rembg.remove(image)
 159        except ImportError:
 160            print("Rembg not available, skipping background removal")
 161 +          # Create a copy of the image with RGBA
 162 +          if isinstance(image, Image.Image):
 163 +              if image.mode != 'RGBA':
 164 +                  return image.convert('RGBA')
 165            return image
 166
 167 +  # Function to select available models - checks which models are accessible
 168 +  def select_available_model():
 169 +      """Try to find an available public model for depth estimation"""
 170 +      public_models = [
 171 +          "facebook/dpt-hybrid-midas",  # Public DPT model
 172 +          "Intel/dpt-large",            # Intel's DPT model
 173 +          "facebook/dinov2-base",       # General vision model
 174 +      ]
 175 +
 176 +      # Try each model in turn
 177 +      for model_name in public_models:
 178 +          try:
 179 +              print(f"Testing model availability: {model_name}")
 180 +              # Just try to download the config to check if accessible
 181 +              from transformers import AutoConfig
 182 +              AutoConfig.from_pretrained(model_name, force_download=False)
 183 +              print(f"Model {model_name} is available")
 184 +              return model_name
 185 +          except Exception as e:
 186 +              print(f"Model {model_name} not available: {str(e)}")
 187 +
 188 +      print("No suitable models found. Using manual depth map generation.")
 189 +      return None
 190 +
 191 +  # Updated OpenLRM loading with fallback to simplified model
 192    def load_openlrm_model():
 193        global openlrm_model, model_loaded, model_loading
 194
 195 +      if model_loaded and openlrm_model is not None:
 196            return openlrm_model
 197
 198        if model_loading:
 203
 204        try:
 205            model_loading = True
 206 +          print("Initializing 3D model generator...")
 207
 208 +          # Device selection - prefer CUDA if available
 209            device = "cuda" if torch.cuda.is_available() else "cpu"
 210
 211 +          # Instead of using OpenLRM which is problematic on Spaces, create a simpler wrapper
 212 +          # This will generate basic 3D structure without requiring complex models
 213 +          class Simple3DWrapper:
 214 +              def __init__(self, device):
 215                    self.device = device
 216 +                  print(f"Initialized simple 3D wrapper on {device}")
 217
 218                def __call__(self, image):
 219 +                  """Create a 3D mesh representation from an image"""
 220 +                  # Generate a depth map without complex models
 221 +                  depth_map = create_simple_depth_map(image)
 222
 223 +                  # Convert depth map to vertices and faces
 224 +                  h, w = depth_map.shape
 225 +                  vertices = []
 226 +
 227 +                  # Create vertices - scale to [-1, 1] range for x and y
 228 +                  scale_factor = 2.0
 229 +                  for i in range(h):
 230 +                      for j in range(w):
 231 +                          x = (j / w - 0.5) * scale_factor
 232 +                          y = (i / h - 0.5) * scale_factor
 233 +                          z = depth_map[i, j] * scale_factor * -1  # Negative to make closer objects "pop out"
 234 +                          vertices.append([x, y, z])
 235
 236 +                  # Create faces - connect neighboring vertices
 237 +                  faces = []
 238 +                  for i in range(h-1):
 239 +                      for j in range(w-1):
 240 +                          v0 = i * w + j
 241 +                          v1 = i * w + (j + 1)
 242 +                          v2 = (i + 1) * w + j
 243 +                          v3 = (i + 1) * w + (j + 1)
 244 +
 245 +                          # Two triangles per grid cell
 246 +                          faces.append([v0, v1, v3])
 247 +                          faces.append([v0, v3, v2])
 248 +
 249 +                  return {
 250 +                      "vertices": np.array(vertices),
 251 +                      "faces": np.array(faces)
 252 +                  }
 253
 254 +          # Create the 3D model wrapper
 255 +          openlrm_model = Simple3DWrapper(device)
 256
 257            model_loaded = True
 258 +          print(f"Simple 3D model generator initialized on {device}")
 259            return openlrm_model
 260
 261        except Exception as e:
 262 +          print(f"Error initializing 3D model: {str(e)}")
 263            print(traceback.format_exc())
 264            return None
 265        finally:
 266            model_loading = False
 267
 268 +  # Updated depth model loading with public model support
 269    def load_depth_model():
 270        global depth_model, feature_extractor, model_loaded, model_loading
 271

 273        return depth_model, feature_extractor
 274
 275        try:
 276 +          print("Loading depth estimation model...")
 277
 278 +          # Select an available public model
 279 +          model_name = select_available_model()
 280
 281 +          if model_name is None:
 282 +              print("No suitable depth model found. Using manual depth map generation.")
 283 +              return None, None
 284 +
 285 +          # Device selection
 286            device = "cuda" if torch.cuda.is_available() else "cpu"
 287
 288 +          # Import appropriate model class for the selected model
 289 +          if "dpt" in model_name.lower():
 290 +              from transformers import DPTForDepthEstimation, DPTFeatureExtractor
 291 +              print(f"Loading DPT model: {model_name}")
 292 +              feature_extractor = DPTFeatureExtractor.from_pretrained(model_name, token=HF_TOKEN)
 293 +              depth_model = DPTForDepthEstimation.from_pretrained(model_name, token=HF_TOKEN)
 294 +          elif "dinov2" in model_name.lower():
 295 +              from transformers import AutoFeatureExtractor, AutoModel
 296 +              print(f"Loading DINOv2 model: {model_name}")
 297 +              feature_extractor = AutoFeatureExtractor.from_pretrained(model_name, token=HF_TOKEN)
 298 +              depth_model = AutoModel.from_pretrained(model_name, token=HF_TOKEN)
 299 +          else:
 300 +              # Generic loading
 301 +              from transformers import AutoFeatureExtractor, AutoModelForDepthEstimation
 302 +              print(f"Loading Auto depth model: {model_name}")
 303 +              feature_extractor = AutoFeatureExtractor.from_pretrained(model_name, token=HF_TOKEN)
 304 +              depth_model = AutoModelForDepthEstimation.from_pretrained(model_name, token=HF_TOKEN)
 305
 306 +          # Move to appropriate device
 307            if device == "cuda":
 308                depth_model = depth_model.to(device)
 309
 313        except Exception as e:
 314            print(f"Error loading depth model: {str(e)}")
 315            print(traceback.format_exc())
 316 +          print("Using manual depth map generation instead.")
 317 +          return None, None
 318 +
 319 +  # Create a simple depth map without ML models
 320 +  def create_simple_depth_map(image):
 321 +      """Create a simple depth map from image without ML models"""
 322 +      # Convert to numpy array if needed
 323 +      if isinstance(image, Image.Image):
 324 +          img_array = np.array(image)
 325 +      else:
 326 +          img_array = image
 327 +
 328 +      # Convert to grayscale
 329 +      if len(img_array.shape) == 3 and img_array.shape[2] >= 3:
 330 +          gray = cv2.cvtColor(img_array, cv2.COLOR_RGB2GRAY)
 331 +      else:
 332 +          gray = img_array.astype(np.uint8)
 333 +
 334 +      # Apply edge detection
 335 +      edges = cv2.Canny(gray, 100, 200)
 336 +
 337 +      # Create depth map using blur and edges
 338 +      depth_map = cv2.GaussianBlur(gray, (15, 15), 0)
 339 +
 340 +      # Combine with edges to preserve details
 341 +      depth_map = depth_map.astype(float) / 255.0
 342 +      edges = edges.astype(float) / 255.0
 343 +
 344 +      # Edges should be deeper in the depth map
 345 +      depth_map = depth_map * (1.0 - 0.5 * edges)
 346 +
 347 +      # Center objects usually closer to viewer (create a radial gradient)
 348 +      h, w = depth_map.shape
 349 +      center_y, center_x = h // 2, w // 2
 350 +      y, x = np.ogrid[:h, :w]
 351 +      dist_from_center = np.sqrt((x - center_x)**2 + (y - center_y)**2)
 352 +      max_dist = np.sqrt(center_x**2 + center_y**2)
 353 +      dist_factor = dist_from_center / max_dist
 354 +
 355 +      # Apply center bias - center is closer (lower depth values)
 356 +      depth_map = depth_map + 0.3 * dist_factor
 357 +
 358 +      # Normalize
 359 +      depth_map = (depth_map - depth_map.min()) / (depth_map.max() - depth_map.min() + 1e-10)
 360 +
 361 +      # Smooth the depth map to avoid artifacts
 362 +      depth_map = gaussian_filter(depth_map, sigma=1.0)
 363 +
 364 +      return depth_map
 365
+
# Process image to create 3D model using simplified approach
|
367 |
def process_openlrm(image, job_id, detail_level='medium', output_format='obj'):
|
368 |
try:
|
369 |
+
# Load OpenLRM model - now returns simplified 3D generator
|
370 |
model = load_openlrm_model()
|
371 |
if model is None:
|
372 |
# Fallback to depth-based approach
|
373 |
return process_depth_based(image, job_id, detail_level, output_format)
|
374 |
|
375 |
# Preprocess image - remove background for better results
|
376 |
+
processing_jobs[job_id]['progress'] = 20
|
377 |
image_rgba = remove_background(image)
|
378 |
|
379 |
# Update progress
|
380 |
+
processing_jobs[job_id]['progress'] = 40
|
381 |
|
382 |
+
# Process with model to get 3D mesh
|
|
|
383 |
result = model(image_rgba)
|
384 |
|
385 |
# Update progress
|
|
|
 402
 403    # Convert OpenLRM result to trimesh
 404    def convert_to_trimesh(result, image):
 405 +      # Use the provided vertices and faces from the model result
 406 +      vertices = np.array(result.get("vertices", []))
 407 +      faces = np.array(result.get("faces", []))
 408 +
 409 +      # Create a default mesh if needed
 410 +      if len(vertices) == 0 or len(faces) == 0:
 411 +          # Generate sample vertices and faces
 412 +          x = np.linspace(-1, 1, 20)
 413 +          y = np.linspace(-1, 1, 20)
 414 +          z = np.linspace(-1, 1, 10)
 415 +
 416 +          # Create grid points
 417 +          xx, yy = np.meshgrid(x, y)
 418 +          zz = np.zeros_like(xx)
 419 +
 420 +          # Create a simple height field
 421 +          vertices = np.vstack([xx.flatten(), yy.flatten(), zz.flatten()]).T
 422 +
 423 +          # Create faces
 424 +          faces = []
 425 +          n = 20  # Grid size
 426 +          for i in range(n-1):
 427 +              for j in range(n-1):
 428 +                  idx = i*n + j
 429 +                  faces.append([idx, idx+1, idx+n])
 430 +                  faces.append([idx+1, idx+n+1, idx+n])
 431 +          faces = np.array(faces)
 432
 433 +      # Create mesh with provided data
 434        mesh = trimesh.Trimesh(vertices=vertices, faces=faces)
 435
 436        # Add texture from the original image
 437        if hasattr(image, 'convert'):
 438 +          try:
 439 +              img_array = np.array(image.convert("RGBA"))
 440 +              if img_array.shape[2] == 4:  # RGBA
 441 +                  vertex_colors = sample_texture_from_image(img_array, vertices)
 442 +                  mesh.visual.vertex_colors = vertex_colors
 443 +          except Exception as e:
 444 +              print(f"Error applying texture: {e}")
 445
 446        return mesh
 447
 448    # Sample helper functions for mesh creation
 449    def sample_texture_from_image(image, vertices):
 450 +      """Sample colors from image based on vertex positions"""
 451        # Sample colors from image based on vertex positions
 452        h, w = image.shape[:2]
 453        colors = np.zeros((len(vertices), 4), dtype=np.uint8)
 454
 455 +      # Find the range of vertex positions
 456 +      min_x, min_y = vertices[:, 0].min(), vertices[:, 1].min()
 457 +      max_x, max_y = vertices[:, 0].max(), vertices[:, 1].max()
 458
 459 +      # Normalize vertex positions to [0,1] for sampling
 460 +      for i, v in enumerate(vertices):
 461 +          # Map from vertex coordinates to image coordinates
 462 +          x_norm = (v[0] - min_x) / (max_x - min_x) if max_x > min_x else 0.5
 463 +          y_norm = (v[1] - min_y) / (max_y - min_y) if max_y > min_y else 0.5
 464 +
 465 +          # Clamp to valid range
 466 +          x_norm = max(0, min(1, x_norm))
 467 +          y_norm = max(0, min(1, y_norm))
 468 +
 469 +          # Convert to image coordinates
 470 +          x = int(x_norm * (w-1))
 471 +          y = int(y_norm * (h-1))
 472 +
 473 +          # Sample color
 474 +          if 0 <= x < w and 0 <= y < h:
 475                colors[i] = image[y, x]
 476            else:
 477                colors[i] = [200, 200, 200, 255]  # Default color
 481    # Process using depth-based approach as fallback
 482    def process_depth_based(image, job_id, detail_level='medium', output_format='obj'):
 483        try:
 484 +          # Load depth model
 485 +          depth_model_result = load_depth_model()
 486
 487            # Update progress
 488            processing_jobs[job_id]['progress'] = 30
 489
 490 +          # Check if model loading was successful
 491 +          if depth_model_result[0] is None:
 492 +              # Use manual depth map generation
 493 +              print("Using manual depth map generation")
 494 +              depth_map = create_simple_depth_map(image)
 495 +          else:
 496 +              # Extract model and feature extractor
 497 +              depth_model, feature_extractor = depth_model_result
 498
 499 +              # Get depth map from model
 500 +              with torch.no_grad():
 501 +                  # Prepare image for the model
 502 +                  inputs = feature_extractor(images=image, return_tensors="pt")
 503 +                  if torch.cuda.is_available():
 504 +                      inputs = {k: v.cuda() for k, v in inputs.items()}
 505 +
 506 +                  # Forward pass
 507 +                  outputs = depth_model(**inputs)
 508 +
 509 +                  # Different models have different output formats
 510 +                  if hasattr(outputs, "predicted_depth"):
 511 +                      predicted_depth = outputs.predicted_depth
 512 +                  elif hasattr(outputs, "logits"):  # For some models
 513 +                      predicted_depth = outputs.logits
 514 +                  else:
 515 +                      # Generic handling - take the first output tensor
 516 +                      predicted_depth = list(outputs.values())[0]
 517 +
 518 +                  # Resize depth to original image size
 519 +                  depth_map = F.interpolate(
 520 +                      predicted_depth.unsqueeze(1),
 521 +                      size=(image.height, image.width),
 522 +                      mode="bicubic",
 523 +                      align_corners=False,
 524 +                  ).squeeze().cpu().numpy()
 525 +
 526            # Update progress
 527            processing_jobs[job_id]['progress'] = 60
 528
 529 +          # Normalize depth map if from model
 530 +          if 'depth_map' not in locals():
 531 +              depth_min = depth_map.min()
 532 +              depth_max = depth_map.max()
 533 +              depth_normalized = (depth_map - depth_min) / (depth_max - depth_min + 1e-10)
 534 +          else:
 535 +              depth_normalized = depth_map
 536
 537            # Create mesh from depth map
 538            mesh = depth_to_mesh(depth_normalized, image,

 543            # Update progress
 544            processing_jobs[job_id]['progress'] = 80
 545
 546 +          # Clean up to free memory
 547 +          optimize_memory()
 548 +
 549            return mesh
 550
 551        except Exception as e:
 552            print(f"Error in depth-based processing: {str(e)}")
 553            print(traceback.format_exc())
 554 +
 555 +          # Ultimate fallback - create a simple mesh from the image
 556 +          try:
 557 +              print("Using emergency fallback mesh generation")
 558 +              depth_map = create_simple_depth_map(image)
 559 +              mesh = depth_to_mesh(depth_map, image, resolution=50, detail_level='low')
 560 +              return mesh
 561 +          except Exception as fallback_error:
 562 +              print(f"Fallback mesh generation failed: {fallback_error}")
 563 +              raise
 564
 565    # Enhanced depth map processing
 566    def enhance_depth_map(depth_map, detail_level='medium'):

 669        mesh = trimesh.Trimesh(vertices=vertices, faces=faces)
 670
 671        # Apply texturing if image is provided
 672 +      if image is not None:
 673            # Convert to numpy array if needed
 674            if isinstance(image, Image.Image):
 675                img_array = np.array(image)
 677                img_array = image
 678
 679            # Create vertex colors
 680 +          if len(img_array.shape) >= 2:
 681                # Create vertex colors by sampling the image
 682                vertex_colors = np.zeros((vertices.shape[0], 4), dtype=np.uint8)
 683
 684                for i in range(resolution):
 685                    for j in range(resolution):
 686                        # Calculate image coordinates
 687 +                      img_x = min(max(0, int(j * (img_array.shape[1] - 1) / (resolution - 1))), img_array.shape[1] - 1)
 688 +                      img_y = min(max(0, int(i * (img_array.shape[0] - 1) / (resolution - 1))), img_array.shape[0] - 1)
 689
 690                        vertex_idx = i * resolution + j
 691
 692                        if len(img_array.shape) == 3 and img_array.shape[2] == 3:  # RGB
 693 +                          r, g, b = img_array[img_y, img_x]
 694 +                          vertex_colors[vertex_idx] = [r, g, b, 255]
 695                        elif len(img_array.shape) == 3 and img_array.shape[2] == 4:  # RGBA
 696 +                          vertex_colors[vertex_idx] = img_array[img_y, img_x]
 697                        else:
 698                            # Handle grayscale
 699 +                          gray = img_array[img_y, img_x]
 700 +                          if np.isscalar(gray):
 701 +                              vertex_colors[vertex_idx] = [gray, gray, gray, 255]
 702 +                          else:
 703 +                              # Just in case gray is some kind of array
 704 +                              gray_val = np.mean(gray)
 705 +                              vertex_colors[vertex_idx] = [gray_val, gray_val, gray_val, 255]
 706
 707                mesh.visual.vertex_colors = vertex_colors
 708
 709        # Apply smoothing to get rid of staircase artifacts
 710        if detail_level != 'high':
 711 +          try:
 712 +              # Use laplacian smoothing if available
 713 +              mesh = mesh.smoothed(method='laplacian', iterations=1)
 714 +          except Exception as e:
 715 +              print(f"Smoothing error (non-critical): {e}")
 716
 717        # Fix normals for better rendering
 718 +      try:
 719 +          mesh.fix_normals()
 720 +      except Exception as e:
 721 +          print(f"Normal fixing error (non-critical): {e}")
 722 +
 723 +      # Simulate full 3D by duplicating and flipping the mesh only if detail level is higher
 724 +      if detail_level == 'high' and not USE_SIMPLIFIED_MODE:
 725 +          try:
 726 +              # Create a complete 3D object by duplicating and flipping the mesh
 727 +              back_mesh = mesh.copy()
 728 +              # Flip to create the back side
 729 +              back_mesh.vertices[:, 2] = -back_mesh.vertices[:, 2] - 0.1  # Add small offset to avoid z-fighting
 730 +              # Fix normals after flipping
 731 +              back_mesh.fix_normals()
 732 +
 733 +              # Combine front and back meshes
 734 +              combined_mesh = trimesh.util.concatenate([mesh, back_mesh])
 735 +
 736 +              # Add side panels to create a watertight model
 737 +              combined_mesh = create_watertight_model(combined_mesh)
 738 +              return combined_mesh
 739 +          except Exception as e:
 740 +              print(f"3D completion error (non-critical): {e}")
 741
 742        return mesh
 743
 744 +  # Create a watertight model by adding side panels
 745    def create_watertight_model(mesh):
 746 +      try:
 747 +          # Extract boundary edges - simplified approach to avoid errors
 748 +          edges = mesh.edges_unique
 749 +          edge_faces = mesh.edges_face
 750 +          boundary_edges = []
 751
 752 +          # Find edges that are only part of one face (boundaries)
 753 +          edge_face_counts = np.bincount(edge_faces.flatten(), minlength=len(mesh.faces))
 754 +          boundary_face_indices = np.where(edge_face_counts == 1)[0]
 755 +
 756 +          # Get boundary edges
 757 +          for i, edge in enumerate(edges):
 758 +              faces = edge_faces[i]
 759 +              if -1 in faces or len(np.unique(faces)) == 1:
 760 +                  boundary_edges.append(edge)
 761 +
 762 +          # If no boundary edges, return the original mesh
 763 +          if len(boundary_edges) == 0:
 764 +              return mesh
 765 +
 766 +          # Simplify for Hugging Face Space - just return original mesh
 767 +          if USE_SIMPLIFIED_MODE:
 768 +              return mesh
 769
 770 +          # Create side panels along boundary edges - simplified version
 771 +          new_faces = []
 772 +          new_vertices = mesh.vertices.copy()
 773
 774 +          # Just add a base and close the model
 775 +          min_z = np.min(mesh.vertices[:, 2])
 776 +          max_z = np.max(mesh.vertices[:, 2])
 777
 778 +          # Find vertices near the minimum z height
 779 +          bottom_vertices = np.where(np.isclose(mesh.vertices[:, 2], min_z, atol=0.1))[0]
 780 +
 781 +          if len(bottom_vertices) > 3:
 782 +              # Create a simple bottom face - simplified approach
 783 +              center = np.mean(mesh.vertices[bottom_vertices], axis=0)
 784 +              center_idx = len(new_vertices)
 785 +              new_vertices = np.vstack([new_vertices, center])
 786 +
 787 +              # Add triangles connecting the boundary vertices to the center
 788 +              for i in range(len(bottom_vertices)-1):
 789 +                  new_faces.append([bottom_vertices[i], bottom_vertices[i+1], center_idx])
 790 +
 791 +              # Close the loop
 792 +              new_faces.append([bottom_vertices[-1], bottom_vertices[0], center_idx])
 793 +
 794 +              # Create new mesh with added faces
 795 +              if len(new_faces) > 0:
 796 +                  new_faces = np.array(new_faces)
 797 +                  combined_faces = np.vstack([mesh.faces, new_faces])
 798 +                  watertight_mesh = trimesh.Trimesh(vertices=new_vertices, faces=combined_faces)
 799 +
 800 +                  # Copy vertex colors if they exist
 801 +                  if hasattr(mesh.visual, 'vertex_colors') and mesh.visual.vertex_colors is not None:
 802 +                      # Extend vertex colors array for new vertices
 803 +                      extended_colors = np.vstack([
 804 +                          mesh.visual.vertex_colors,
 805 +                          np.full((len(new_vertices) - len(mesh.vertices), 4), [200, 200, 200, 255], dtype=np.uint8)
 806 +                      ])
 807 +                      watertight_mesh.visual.vertex_colors = extended_colors
 808 +
 809 +                  return watertight_mesh
 810 +
 811 +          return mesh
 812 +      except Exception as e:
 813 +          print(f"Watertight model creation failed (non-critical): {e}")
 814 +          return mesh
 815
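A short end-to-end sketch of the fallback pipeline in this hunk, mirroring the emergency path in process_depth_based; the synthetic input image and the output filename are illustrative assumptions, not part of the commit.

import numpy as np
from PIL import Image

# Hypothetical input; any RGB image works
img = Image.fromarray(np.random.randint(0, 255, (64, 64, 3), dtype=np.uint8))

depth = create_simple_depth_map(img)                                 # manual depth map, no ML model
mesh = depth_to_mesh(depth, img, resolution=50, detail_level='low')  # grid mesh with vertex colors
mesh = create_watertight_model(mesh)                                 # close the bottom if boundary edges exist
mesh.export("preview.obj")                                           # trimesh infers the format from the extension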
 816    @app.route('/health', methods=['GET'])
 817    def health_check():
 818        return jsonify({
 819            "status": "healthy",
 820 +          "model": "Enhanced 3D Model Generator",
 821 +          "device": "cuda" if torch.cuda.is_available() else "cpu",
 822 +          "simplified_mode": USE_SIMPLIFIED_MODE
 823        }), 200
 824
 825    @app.route('/progress/<job_id>', methods=['GET'])
 853                break
 854            check_count = 0
 855
 856 +          # Send final status
 857            if job['status'] == 'completed':
 858                yield f"data: {json.dumps({'status': 'completed', 'progress': 100, 'result_url': job['result_url'], 'preview_url': job['preview_url']})}\n\n"
 859            else:

 880        output_format = request.form.get('output_format', 'obj').lower()
 881        detail_level = request.form.get('detail_level', 'medium').lower()  # Parameter for detail level
 882        model_type = request.form.get('model_type', 'openlrm').lower()  # 'openlrm' or 'depth'
 883 +
 884 +      # Adjust parameters for simplified mode
 885 +      if USE_SIMPLIFIED_MODE:
 886 +          mesh_resolution = min(mesh_resolution, 100)  # Lower resolution for simplified mode
 887 +          if detail_level == 'high':
 888 +              detail_level = 'medium'  # Downgrade detail level in simplified mode
 889    except ValueError:
 890        return jsonify({"error": "Invalid parameter values"}), 400
 891

 992            os.remove(filepath)
 993
 994        # Force garbage collection to free memory
 995 +      optimize_memory()
 996
 997    except Exception as e:
 998        # Handle errors
1135    @app.route('/', methods=['GET'])
1136    def index():
1137        return jsonify({
1138 +          "message": "Enhanced 3D Model Generator",
1139            "endpoints": [
1140                "/convert",
1141                "/progress/<job_id>",

1149            "detail_level": "low, medium, or high - controls the level of detail in the final model",
1150            "model_type": "openlrm (default, full 3D) or depth (faster but simpler)"
1151        },
1152 +          "description": "This API creates high-quality 3D models from 2D images with full 3D structure and texturing",
1153 +          "simplified_mode": USE_SIMPLIFIED_MODE
1154        }), 200
1155
1156 +  # System compatibility check function
1157 +  def check_system_compatibility():
1158 +      """Check if the system can run the full model or needs simplified mode"""
1159 +      print("Checking system compatibility...")
1160
1161 +      # Check available memory
1162 +      try:
1163 +          import psutil
1164 +          mem = psutil.virtual_memory()
1165 +          free_mem_gb = mem.available / (1024 ** 3)
1166 +          print(f"Available memory: {free_mem_gb:.2f} GB")
1167 +      except ImportError:
1168 +          print("psutil not available, cannot check memory")
1169 +          free_mem_gb = 1.0  # Assume low memory
1170
1171 +      # Check GPU
1172 +      gpu_available = torch.cuda.is_available()
1173 +      gpu_mem_gb = 0
1174 +      if gpu_available:
1175            try:
1176 +              gpu_mem_gb = torch.cuda.get_device_properties(0).total_memory / (1024 ** 3)
1177 +              print(f"GPU available: {gpu_available}, Memory: {gpu_mem_gb:.2f} GB")
1178            except Exception as e:
1179 +              print(f"Error checking GPU memory: {e}")
1180 +      else:
1181 +          print("No GPU available")
1182
1183 +      # Set simplified mode if limited resources
1184 +      global USE_SIMPLIFIED_MODE
1185 +      if free_mem_gb < 4.0 or (gpu_available and gpu_mem_gb < 2.0):
1186 +          print("Limited resources detected, using simplified mode")
1187 +          USE_SIMPLIFIED_MODE = True
1188 +      else:
1189 +          print("Sufficient resources detected")
1190
1191    if __name__ == '__main__':
1192 +      # Check system compatibility
1193 +      check_system_compatibility()
1194 +
1195        # Start the cleanup thread
1196        cleanup_old_jobs()
1197
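A minimal client sketch for exercising the endpoints listed above; the base URL, input filename, and the response field names (job_id, status, result_url) are assumptions inferred from the route handlers shown in the diff, and the progress stream format follows the SSE lines emitted by the /progress route.

import json
import requests

BASE = "http://localhost:7860"  # placeholder URL for the running Space

print(requests.get(f"{BASE}/health").json())  # reports device and simplified_mode

# Submit an image; form fields follow the /convert parameters described in the index route
with open("input.jpg", "rb") as f:
    job = requests.post(
        f"{BASE}/convert",
        files={"image": f},
        data={"output_format": "obj", "detail_level": "medium", "model_type": "openlrm"},
    ).json()

# Follow the server-sent events from /progress/<job_id> until the job finishes
with requests.get(f"{BASE}/progress/{job['job_id']}", stream=True) as resp:
    for line in resp.iter_lines():
        if line.startswith(b"data: "):
            event = json.loads(line[6:])
            print(event)
            if event.get("status") in ("completed", "error"):
                break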