Spaces:

ju4nppp
/

dcgan-mouse-generator

Sleeping

App Files Files Community

ju4nppp commited on Apr 27

Commit

e352aba

verified ·

1 Parent(s): 4fa9660

Uploaded 3 files

Browse files

Uploaded readme, app, and requirements

Files changed (3) hide show

README.md +47 -0
app.py +126 -0
requirements.txt +8 -0

README.md ADDED Viewed

	@@ -0,0 +1,47 @@

+---
+title: Computer Mouse GAN Generator
+emoji: 🖱️
+colorFrom: blue
+colorTo: purple
+sdk: gradio
+sdk_version: 3.50.0
+app_file: app.py
+pinned: false
+---
+# Computer Mouse GAN Generator
+This project uses a Deep Convolutional Generative Adversarial Network (DCGAN) to generate realistic images of computer mice. The model was trained on a dataset of computer mouse images with data augmentation to expand the training set.
+## Model Architecture
+The model is based on the DCGAN architecture from the paper [Unsupervised Representation Learning with Deep Convolutional Generative Adversarial Networks](https://arxiv.org/abs/1511.06434).
+- Generator: 5 transpose convolutional layers with batch normalization
+- RGB color output (3 channels)
+- Trained with Weights & Biases monitoring
+- Training included data augmentation (flips, rotations, brightness/contrast adjustments)
+## Demo App
+The Gradio interface allows you to:
+- Generate multiple computer mouse images at once
+- Set the number of images to generate (1-64)
+- Use a specific random seed for reproducible results
+- Toggle random seed generation for variety
+## Training Process
+The model was trained on:
+- ~300 original computer mouse images
+- Expanded to ~2,500 training samples through augmentation
+- Trained for 150+ epochs
+- Used CUDA acceleration on an RTX 3070
+## Examples
+Generated images show a variety of computer mouse designs with different colors and shapes. Each image is completely new and generated from random noise - these mice don't exist in the real world!
+## Usage
+Simply adjust the sliders and click "Generate Mice" to create new computer mouse designs.

app.py ADDED Viewed

	@@ -0,0 +1,126 @@

+import torch
+import torch.nn as nn
+import torchvision.utils as vutils
+import gradio as gr
+import numpy as np
+import matplotlib.pyplot as plt
+# Define Generator architecture - must match what you used during training
+class Generator(nn.Module):
+    def __init__(self, ngpu=1, nz=100, ngf=64, nc=3):
+        super(Generator, self).__init__()
+        self.ngpu = ngpu
+        self.main = nn.Sequential(
+            # input is Z, going into a convolution
+            nn.ConvTranspose2d(nz, ngf * 8, 4, 1, 0, bias=False),
+            nn.BatchNorm2d(ngf * 8),
+            nn.ReLU(True),
+            # state size. (ngf*8) x 4 x 4
+            nn.ConvTranspose2d(ngf * 8, ngf * 4, 4, 2, 1, bias=False),
+            nn.BatchNorm2d(ngf * 4),
+            nn.ReLU(True),
+            # state size. (ngf*4) x 8 x 8
+            nn.ConvTranspose2d(ngf * 4, ngf * 2, 4, 2, 1, bias=False),
+            nn.BatchNorm2d(ngf * 2),
+            nn.ReLU(True),
+            # state size. (ngf*2) x 16 x 16
+            nn.ConvTranspose2d(ngf * 2, ngf, 4, 2, 1, bias=False),
+            nn.BatchNorm2d(ngf),
+            nn.ReLU(True),
+            # state size. (ngf) x 32 x 32
+            nn.ConvTranspose2d(ngf, nc, 4, 2, 1, bias=False),
+            nn.Tanh()
+            # state size. (nc) x 64 x 64
+        )
+    def forward(self, input):
+        return self.main(input)
+# Load the generator
+def load_model(model_path="model/netG_best.pth"):
+    # Create the generator and load the saved weights
+    device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+    netG = Generator(ngpu=1, nz=100, ngf=64, nc=3).to(device)
+    try:
+        netG.load_state_dict(torch.load(model_path, map_location=device))
+        netG.eval()  # Set to evaluation mode
+        print(f"Model loaded successfully from {model_path}")
+        return netG, device
+    except Exception as e:
+        print(f"Error loading model: {e}")
+        return None, device
+# Generate images using the model
+def generate_images(num_images=16, seed=None, randomize=True):
+    # Load the model (do this once when needed)
+    global model, device
+    if 'model' not in globals():
+        model, device = load_model()
+        if model is None:
+            return np.zeros((299, 299, 3))
+    # Set random seed for reproducibility if provided
+    if seed is not None and not randomize:
+        torch.manual_seed(seed)
+        np.random.seed(seed)
+    # Generate latent vectors
+    nz = 100  # Size of the latent vector
+    noise = torch.randn(num_images, nz, 1, 1, device=device)
+    # Generate fake images
+    with torch.no_grad():
+        fake_images = model(noise).detach().cpu()
+    # Convert to grid for display
+    grid = vutils.make_grid(fake_images, padding=2, normalize=True, nrow=int(np.sqrt(num_images)))
+    # Convert from tensor to numpy array for Gradio
+    grid_np = grid.numpy().transpose((1, 2, 0))
+    # Make sure values are in 0-1 range
+    grid_np = np.clip(grid_np, 0, 1)
+    return grid_np
+# Create Gradio interface
+def create_gradio_app():
+    with gr.Blocks(title="Computer Mouse Generator") as app:
+        gr.Markdown("# Computer Mouse GAN Generator")
+        gr.Markdown("Generate computer mice using a Deep Convolutional GAN trained on ~2,500 augmented images")
+        with gr.Row():
+            with gr.Column():
+                num_images = gr.Slider(minimum=1, maximum=64, value=16, step=1, label="Number of Images")
+                seed = gr.Number(label="Random Seed", value=42, precision=0)
+                randomize = gr.Checkbox(label="Use Random Seeds (ignore seed value)", value=True)
+                generate_button = gr.Button("Generate Mice")
+            with gr.Column():
+                output_image = gr.Image(label="Generated Computer Mice")
+        generate_button.click(fn=generate_images, inputs=[num_images, seed, randomize], outputs=output_image)
+        gr.Markdown("## About")
+        gr.Markdown("""This model was trained using a PyTorch DCGAN implementation on a dataset of computer mouse images.
+The training process used data augmentation to expand a small dataset of 300+ original images into 2,500+ training samples through techniques like flipping, rotation, and brightness/contrast adjustments.
+The generator creates brand new, never-before-seen computer mice from random noise!""")
+    return app
+# Initialize global variables
+model = None
+device = None
+# Launch the app if the script is run directly
+if __name__ == "__main__":
+    app = create_gradio_app()
+    app.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,8 @@

+torch>=2.0.0
+torchvision>=0.15.0
+matplotlib>=3.5.0
+numpy>=1.22.0
+Pillow>=9.0.0
+gradio>=3.50.0
+tqdm>=4.64.0
+ipython>=8.0.0