Spaces:

mac9087
/

rightnight

Sleeping

App Files Files Community

mac9087 commited on Apr 23

Commit

e4c93be

verified ·

1 Parent(s): 5a23d7c

Update app.py

Browse files

Files changed (1) hide show

app.py +118 -43

app.py CHANGED Viewed

@@ -11,11 +11,11 @@ import io
 import zipfile
 import uuid
 import traceback
-from diffusers import ShapEImg2ImgPipeline
-from diffusers.utils import export_to_obj
 from huggingface_hub import snapshot_download
 from flask_cors import CORS
-import functools
 app = Flask(__name__)
 CORS(app)  # Enable CORS for all routes
@@ -42,15 +42,15 @@ app.config['MAX_CONTENT_LENGTH'] = 16 * 1024 * 1024  # 16MB max
 # Job tracking dictionary
 processing_jobs = {}
-# Global model variable
-pipe = None
 model_loaded = False
 model_loading = False
 # Configuration for processing
-TIMEOUT_SECONDS = 300  # 5 minutes max for processing
 MAX_DIMENSION = 512    # Max image dimension to process
-MAX_INFERENCE_STEPS = 64  # Maximum allowed inference steps to prevent the index error
 # TimeoutError for handling timeouts
 class TimeoutError(Exception):
@@ -89,7 +89,7 @@ def process_with_timeout(function, args, timeout):
 def allowed_file(filename):
     return '.' in filename and filename.rsplit('.', 1)[1].lower() in ALLOWED_EXTENSIONS
-# Function to preprocess image - resize if needed
 def preprocess_image(image_path):
     with Image.open(image_path) as img:
         img = img.convert("RGB")
@@ -104,26 +104,26 @@ def preprocess_image(image_path):
                 new_width = int(img.width * (MAX_DIMENSION / img.height))
             img = img.resize((new_width, new_height), Image.LANCZOS)
-        # Convert to RGB and return
         return img
 def load_model():
-    global pipe, model_loaded, model_loading
     if model_loaded:
-        return pipe
     if model_loading:
         # Wait for model to load if it's already in progress
         while model_loading and not model_loaded:
             time.sleep(0.5)
-        return pipe
     try:
         model_loading = True
         print("Starting model loading...")
-        model_name = "openai/shap-e-img2img"
         # Download model with retry mechanism
         max_retries = 3
@@ -145,24 +145,26 @@ def load_model():
                 else:
                     raise
-        # Initialize pipeline with lower precision to save memory
         device = "cuda" if torch.cuda.is_available() else "cpu"
         dtype = torch.float16 if device == "cuda" else torch.float32
-        pipe = ShapEImg2ImgPipeline.from_pretrained(
             model_name,
             torch_dtype=dtype,
             cache_dir=CACHE_DIR,
         )
-        pipe = pipe.to(device)
         # Optimize for inference
         if device == "cuda":
-            pipe.enable_model_cpu_offload()
         model_loaded = True
         print(f"Model loaded successfully on {device}")
-        return pipe
     except Exception as e:
         print(f"Error loading model: {str(e)}")
@@ -171,11 +173,89 @@ def load_model():
     finally:
         model_loading = False
 @app.route('/health', methods=['GET'])
 def health_check():
     return jsonify({
         "status": "healthy",
-        "model": "Shap-E Image to 3D",
         "device": "cuda" if torch.cuda.is_available() else "cpu"
     }), 200
@@ -234,7 +314,6 @@ def convert_image_to_3d():
     # Get optional parameters with defaults
     try:
         guidance_scale = float(request.form.get('guidance_scale', 3.0))
-        num_inference_steps = min(int(request.form.get('num_inference_steps', 64)), MAX_INFERENCE_STEPS)
         output_format = request.form.get('output_format', 'obj').lower()
     except ValueError:
         return jsonify({"error": "Invalid parameter values"}), 400
@@ -243,9 +322,6 @@ def convert_image_to_3d():
     if guidance_scale < 1.0 or guidance_scale > 5.0:
         return jsonify({"error": "Guidance scale must be between 1.0 and 5.0"}), 400
-    if num_inference_steps < 32 or num_inference_steps > MAX_INFERENCE_STEPS:
-        num_inference_steps = min(num_inference_steps, MAX_INFERENCE_STEPS)
     # Validate output format
     if output_format not in ['obj', 'glb']:
         return jsonify({"error": "Unsupported output format. Use 'obj' or 'glb'"}), 400
@@ -277,14 +353,14 @@ def convert_image_to_3d():
         processing_jobs[job_id]['thread_alive'] = lambda: thread.is_alive()
         try:
-            # Preprocess image (resize if needed)
             processing_jobs[job_id]['progress'] = 5
             image = preprocess_image(filepath)
             processing_jobs[job_id]['progress'] = 10
             # Load model
             try:
-                pipe = load_model()
                 processing_jobs[job_id]['progress'] = 30
             except Exception as e:
                 processing_jobs[job_id]['status'] = 'error'
@@ -293,15 +369,18 @@ def convert_image_to_3d():
             # Process image with thread-safe timeout
             try:
-                def generate_mesh():
-                    return pipe(
-                        image,
-                        guidance_scale=guidance_scale,
-                        num_inference_steps=num_inference_steps,
-                        output_type="mesh",
-                    ).images
-                images, error = process_with_timeout(generate_mesh, [], TIMEOUT_SECONDS)
                 if error:
                     if isinstance(error, TimeoutError):
@@ -312,6 +391,10 @@ def convert_image_to_3d():
                         raise error
                 processing_jobs[job_id]['progress'] = 80
             except Exception as e:
                 error_details = traceback.format_exc()
                 processing_jobs[job_id]['status'] = 'error'
@@ -324,7 +407,7 @@ def convert_image_to_3d():
             try:
                 if output_format == 'obj':
                     obj_path = os.path.join(output_dir, "model.obj")
-                    export_to_obj(images[0], obj_path)
                     # Create a zip file with OBJ and MTL
                     zip_path = os.path.join(output_dir, "model.zip")
@@ -338,17 +421,9 @@ def convert_image_to_3d():
                     processing_jobs[job_id]['preview_url'] = f"/preview/{job_id}"
                 elif output_format == 'glb':
-                    from trimesh import Trimesh
-                    mesh = images[0]
-                    vertices = mesh.verts
-                    faces = mesh.faces
-                    # Create a trimesh object
-                    trimesh_obj = Trimesh(vertices=vertices, faces=faces)
                     # Export as GLB
                     glb_path = os.path.join(output_dir, "model.glb")
-                    trimesh_obj.export(glb_path)
                     processing_jobs[job_id]['result_url'] = f"/download/{job_id}"
                     processing_jobs[job_id]['preview_url'] = f"/preview/{job_id}"

 import zipfile
 import uuid
 import traceback
+from transformers import AutoImageProcessor, AutoModel
 from huggingface_hub import snapshot_download
 from flask_cors import CORS
+import numpy as np
+import trimesh
 app = Flask(__name__)
 CORS(app)  # Enable CORS for all routes
 # Job tracking dictionary
 processing_jobs = {}
+# Global model variables
+image_processor = None
+model = None
 model_loaded = False
 model_loading = False
 # Configuration for processing
+TIMEOUT_SECONDS = 180  # 3 minutes max for processing
 MAX_DIMENSION = 512    # Max image dimension to process
 # TimeoutError for handling timeouts
 class TimeoutError(Exception):
 def allowed_file(filename):
     return '.' in filename and filename.rsplit('.', 1)[1].lower() in ALLOWED_EXTENSIONS
+# Function to preprocess image
 def preprocess_image(image_path):
     with Image.open(image_path) as img:
         img = img.convert("RGB")
                 new_width = int(img.width * (MAX_DIMENSION / img.height))
             img = img.resize((new_width, new_height), Image.LANCZOS)
         return img
 def load_model():
+    global image_processor, model, model_loaded, model_loading
     if model_loaded:
+        return image_processor, model
     if model_loading:
         # Wait for model to load if it's already in progress
         while model_loading and not model_loaded:
             time.sleep(0.5)
+        return image_processor, model
     try:
         model_loading = True
         print("Starting model loading...")
+        # Using a lightweight model: Pictorial 3D Scene Representation
+        model_name = "damo-vilab/text-to-3d-texture-base" # Smaller model than ShapE-img2img
         # Download model with retry mechanism
         max_retries = 3
                 else:
                     raise
+        # Initialize model with lower precision to save memory
         device = "cuda" if torch.cuda.is_available() else "cpu"
         dtype = torch.float16 if device == "cuda" else torch.float32
+        image_processor = AutoImageProcessor.from_pretrained(model_name, cache_dir=CACHE_DIR)
+        model = AutoModel.from_pretrained(
             model_name,
             torch_dtype=dtype,
             cache_dir=CACHE_DIR,
+            low_cpu_mem_usage=True,
         )
+        model = model.to(device)
         # Optimize for inference
         if device == "cuda":
+            model = model.half()  # Use half precision on GPU
         model_loaded = True
         print(f"Model loaded successfully on {device}")
+        return image_processor, model
     except Exception as e:
         print(f"Error loading model: {str(e)}")
     finally:
         model_loading = False
+# Convert model output to 3D mesh
+def create_mesh_from_output(output, resolution=64):
+    """Create a mesh from model output"""
+    # Extract features from model output and create mesh
+    # This is a simplified implementation - adapt based on your specific model
+    features = output.last_hidden_state.detach().cpu().numpy()[0]
+    # Create a simple cube mesh as placeholder - replace with actual mesh generation
+    vertices, faces = create_primitive_mesh(features, resolution)
+    mesh = trimesh.Trimesh(vertices=vertices, faces=faces)
+    return mesh
+def create_primitive_mesh(features, resolution=64):
+    """Create a simple primitive mesh based on features"""
+    # Create a mesh using features as modifiers
+    # This is a simplified implementation - adapt based on your specific model's output
+    # Create a cube/sphere mesh as a placeholder
+    use_sphere = True  # Change to False for cube
+    if use_sphere:
+        # Create a sphere
+        u = np.linspace(0, 2 * np.pi, resolution)
+        v = np.linspace(0, np.pi, resolution)
+        # Base radius and modifiers
+        base_radius = 1.0
+        # Use some features to modify the radius (just as an example)
+        feature_sum = np.sum(features[:10])  # Use first 10 features
+        radius_mod = 0.5 + (feature_sum % 1.0)  # Simple modifier between 0.5 and 1.5
+        # Create vertices
+        x = base_radius * radius_mod * np.outer(np.cos(u), np.sin(v))
+        y = base_radius * radius_mod * np.outer(np.sin(u), np.sin(v))
+        z = base_radius * radius_mod * np.outer(np.ones_like(u), np.cos(v))
+        # Reshape to get list of vertices
+        vertices = np.vstack([x.flatten(), y.flatten(), z.flatten()]).T
+        # Create faces (triangles)
+        faces = []
+        for i in range(resolution-1):
+            for j in range(resolution-1):
+                p1 = i * resolution + j
+                p2 = i * resolution + (j + 1)
+                p3 = (i + 1) * resolution + j
+                p4 = (i + 1) * resolution + (j + 1)
+                faces.append([p1, p2, p4])
+                faces.append([p1, p4, p3])
+        faces = np.array(faces)
+    else:
+        # Create a cube
+        vertices = np.array([
+            [-1, -1, -1], [1, -1, -1], [1, 1, -1], [-1, 1, -1],
+            [-1, -1, 1], [1, -1, 1], [1, 1, 1], [-1, 1, 1]
+        ])
+        # Apply some feature-based modifications
+        feature_sum = np.sum(features[:10])  # Use first 10 features
+        scale_factor = 0.5 + (feature_sum % 1.0)  # Simple modifier between 0.5 and 1.5
+        vertices *= scale_factor
+        # Faces (triangles)
+        faces = np.array([
+            [0, 1, 2], [0, 2, 3],  # Bottom face
+            [4, 5, 6], [4, 6, 7],  # Top face
+            [0, 1, 5], [0, 5, 4],  # Front face
+            [2, 3, 7], [2, 7, 6],  # Back face
+            [0, 3, 7], [0, 7, 4],  # Left face
+            [1, 2, 6], [1, 6, 5]   # Right face
+        ])
+    return vertices, faces
 @app.route('/health', methods=['GET'])
 def health_check():
     return jsonify({
         "status": "healthy",
+        "model": "Lightweight 3D Model Generator",
         "device": "cuda" if torch.cuda.is_available() else "cpu"
     }), 200
     # Get optional parameters with defaults
     try:
         guidance_scale = float(request.form.get('guidance_scale', 3.0))
         output_format = request.form.get('output_format', 'obj').lower()
     except ValueError:
         return jsonify({"error": "Invalid parameter values"}), 400
     if guidance_scale < 1.0 or guidance_scale > 5.0:
         return jsonify({"error": "Guidance scale must be between 1.0 and 5.0"}), 400
     # Validate output format
     if output_format not in ['obj', 'glb']:
         return jsonify({"error": "Unsupported output format. Use 'obj' or 'glb'"}), 400
         processing_jobs[job_id]['thread_alive'] = lambda: thread.is_alive()
         try:
+            # Preprocess image
             processing_jobs[job_id]['progress'] = 5
             image = preprocess_image(filepath)
             processing_jobs[job_id]['progress'] = 10
             # Load model
             try:
+                processor, model_instance = load_model()
                 processing_jobs[job_id]['progress'] = 30
             except Exception as e:
                 processing_jobs[job_id]['status'] = 'error'
             # Process image with thread-safe timeout
             try:
+                def generate_3d():
+                    # Process the image
+                    device = model_instance.device
+                    inputs = processor(images=image, return_tensors="pt").to(device)
+                    # Forward pass through model
+                    with torch.no_grad():
+                        outputs = model_instance(**inputs)
+                    return outputs
+                outputs, error = process_with_timeout(generate_3d, [], TIMEOUT_SECONDS)
                 if error:
                     if isinstance(error, TimeoutError):
                         raise error
                 processing_jobs[job_id]['progress'] = 80
+                # Create mesh from outputs
+                mesh = create_mesh_from_output(outputs)
             except Exception as e:
                 error_details = traceback.format_exc()
                 processing_jobs[job_id]['status'] = 'error'
             try:
                 if output_format == 'obj':
                     obj_path = os.path.join(output_dir, "model.obj")
+                    mesh.export(obj_path, file_type='obj')
                     # Create a zip file with OBJ and MTL
                     zip_path = os.path.join(output_dir, "model.zip")
                     processing_jobs[job_id]['preview_url'] = f"/preview/{job_id}"
                 elif output_format == 'glb':
                     # Export as GLB
                     glb_path = os.path.join(output_dir, "model.glb")
+                    mesh.export(glb_path, file_type='glb')
                     processing_jobs[job_id]['result_url'] = f"/download/{job_id}"
                     processing_jobs[job_id]['preview_url'] = f"/preview/{job_id}"