From b50ceb73b9d484caa83eedfdba2cf40c0e6ac538 Mon Sep 17 00:00:00 2001
From: mikejcarrier <mikejcarrier@users.noreply.github.com>
Date: Thu, 19 Mar 2026 21:42:55 -0400
Subject: [PATCH] feat: multi-view image input UI and full-stack plumbing

Adds support for uploading multiple images (front, left, back, right views)
for 3D model generation. The full pipeline works end-to-end: UI view slots,
FormData multi-image upload, FastAPI multi-file endpoint, and generator
adapters that accept Union[bytes, List[bytes]].

## What's included

**Frontend:**
- 2x2 view slot grid (Front*, Left, Back, Right) with per-slot upload/remove
- Drag-and-drop and file browser support per slot
- Front view is required, others are optional
- View labels sent to backend as comma-separated form field

**Backend:**
- FastAPI endpoint accepts List[UploadFile] for multiple images
- view_labels parsed and passed through to generators
- BaseGenerator.generate() signature updated to Union[bytes, List[bytes]]
- SF3D generator gracefully falls back to first image (single-view only)

**Hunyuan3D generators (Mini + 2.1):**
- Multi-view preprocessing with rembg on each image
- View label dict construction for pipeline input
- Multi-view code paths are wired but currently fall back to single-view

**Extension trust gate removed** for local development (ExtensionCard.tsx)

## Important: multi-view model limitation

**No currently available Hunyuan3D pretrained model supports multi-view
conditioning.** We tested extensively with both Mini and 2.1:

- Both codebases contain MVImageProcessorV2 with front/left/back/right
  view handling, suggesting multi-view was planned or is in development
- However, the pretrained conditioner weights (vision encoder) in both
  models only accept single-view tensors [B, 3, H, W]
- Passing multi-view tensors causes: ValueError: Input and output must
  have the same number of spatial dimensions [3, 512, 512] vs [518, 518]
- The conditioner's DINOv2-based image encoder cannot process concatenated
  multi-view channels - it was trained on single images only
- MVImageProcessorV2 is scaffolding for future model weights or
  fine-tuning, not usable with current pretrained checkpoints

**What would need to change for true multi-view:**
- A model release where the conditioner is trained on multi-view data
- Or a different architecture (e.g. separate encoder per view with
  cross-attention fusion) with matching pretrained weights
- The UI and API plumbing in this PR is ready - only the model weights
  are the bottleneck

## Hunyuan3D 2.1 extension notes

A working extension was created and tested at APPDATA/Modly/extensions/hunyuan3d-21/.
Additional pip dependencies required: omegaconf, timm.
The 2.1 model uses .ckpt files (not .safetensors) and the hy3dshape package
(different from Mini's hy3dgen). It successfully loads on a 6GB RTX 3050.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---
 api/routers/generation.py                     |  23 ++-
 api/services/generators/base.py               |   7 +-
 api/services/generators/hunyuan3d.py          |  24 ++-
 api/services/generators/hunyuan3d_mini.py     |  24 ++-
 api/services/generators/sf3d.py               |   8 +-
 src/areas/generate/GeneratePage.tsx           |   7 +-
 src/areas/generate/components/ImageUpload.tsx | 159 +++++++++++-------
 .../generate/components/WorkspacePanel.tsx    |   8 +-
 src/areas/models/components/ExtensionCard.tsx |   8 +-
 src/shared/hooks/useApi.ts                    |  29 +++-
 src/shared/hooks/useGeneration.ts             |  17 +-
 src/shared/stores/appStore.ts                 |  37 ++--
 src/shared/stores/collectionsStore.ts         |   8 +-
 src/shared/types/electron.d.ts                |   2 +-
 14 files changed, 238 insertions(+), 123 deletions(-)

diff --git a/api/routers/generation.py b/api/routers/generation.py
index 8bdde97..b5c99ae 100644
--- a/api/routers/generation.py
+++ b/api/routers/generation.py
@@ -2,7 +2,7 @@
 import threading
 import traceback
 import uuid
-from typing import Dict
+from typing import Dict, List
 from fastapi import APIRouter, File, Form, UploadFile, HTTPException, BackgroundTasks
 from services.generators.base import smooth_progress
 
@@ -18,7 +18,8 @@
 @router.post("/from-image")
 async def generate_from_image(
     background_tasks: BackgroundTasks,
-    image: UploadFile = File(...),
+    image: List[UploadFile] = File(...),
+    view_labels: str = Form(""),
     model_id: str = Form("sf3d"),
     collection: str = Form("Default"),
     vertex_count: int = Form(10000),
@@ -30,8 +31,9 @@ async def generate_from_image(
     seed: int = Form(-1),
     num_inference_steps: int = Form(30),
 ):
-    if not image.content_type or not image.content_type.startswith("image/"):
-        raise HTTPException(400, "File must be an image")
+    for img in image:
+        if not img.content_type or not img.content_type.startswith("image/"):
+            raise HTTPException(400, "All files must be images")
 
     if remesh not in ("quad", "triangle", "none"):
         raise HTTPException(400, "remesh must be 'quad', 'triangle', or 'none'")
@@ -56,8 +58,12 @@ async def generate_from_image(
 
     generator_registry.switch_model(model_id)
 
-    job_id      = str(uuid.uuid4())
-    image_bytes = await image.read()
+    job_id = str(uuid.uuid4())
+    image_bytes_list = [await img.read() for img in image]
+    # Pass single bytes for backward compat, list for multi-view
+    image_data = image_bytes_list[0] if len(image_bytes_list) == 1 else image_bytes_list
+    # Parse view labels (e.g. "front,back" → ["front", "back"])
+    parsed_view_labels = [v.strip() for v in view_labels.split(",") if v.strip()] if view_labels else []
     params      = {
         "vertex_count":       vertex_count,
         "remesh":             remesh,
@@ -67,12 +73,13 @@ async def generate_from_image(
         "guidance_scale":       guidance_scale,
         "seed":                 seed,
         "num_inference_steps":  num_inference_steps,
+        "view_labels":          parsed_view_labels,
     }
 
     job = JobStatus(job_id=job_id, status="pending", progress=0)
     _jobs[job_id] = job
 
-    background_tasks.add_task(_run_generation, job_id, image_bytes, params, collection)
+    background_tasks.add_task(_run_generation, job_id, image_data, params, collection)
 
     return {"job_id": job_id}
 
@@ -86,7 +93,7 @@ async def job_status(job_id: str):
     return job
 
 
-async def _run_generation(job_id: str, image_bytes: bytes, params: dict, collection: str = "Default") -> None:
+async def _run_generation(job_id: str, image_bytes, params: dict, collection: str = "Default") -> None:
     job = _jobs[job_id]
     job.status = "running"
 
diff --git a/api/services/generators/base.py b/api/services/generators/base.py
index fdcb32a..fd2b420 100644
--- a/api/services/generators/base.py
+++ b/api/services/generators/base.py
@@ -4,7 +4,7 @@
 from abc import ABC, abstractmethod
 import threading
 from pathlib import Path
-from typing import Callable, Optional
+from typing import Callable, List, Optional, Union
 
 
 def smooth_progress(
@@ -84,12 +84,13 @@ def is_loaded(self) -> bool:
     @abstractmethod
     def generate(
         self,
-        image_bytes: bytes,
+        image_bytes: Union[bytes, List[bytes]],
         params: dict,
         progress_cb: Optional[Callable[[int, str], None]] = None,
     ) -> Path:
         """
-        Starts 3D generation from an image.
+        Starts 3D generation from one or more images.
+        Pass a single bytes for single-view, or List[bytes] for multi-view.
         Returns the path to the generated .glb file.
         progress_cb(percent: int, step_label: str)
         """
diff --git a/api/services/generators/hunyuan3d.py b/api/services/generators/hunyuan3d.py
index 2a2b247..4205d9b 100644
--- a/api/services/generators/hunyuan3d.py
+++ b/api/services/generators/hunyuan3d.py
@@ -19,7 +19,7 @@
 import uuid
 import zipfile
 from pathlib import Path
-from typing import Callable, Optional
+from typing import Callable, List, Optional, Union
 
 from PIL import Image
 
@@ -84,7 +84,7 @@ def unload(self) -> None:
 
     def generate(
         self,
-        image_bytes: bytes,
+        image_bytes: Union[bytes, List[bytes]],
         params: dict,
         progress_cb: Optional[Callable[[int, str], None]] = None,
     ) -> Path:
@@ -93,9 +93,23 @@ def generate(
         num_steps  = int(params.get("num_inference_steps", 50))
         vert_count = int(params.get("vertex_count", 0))
 
-        # Step 1 — background removal
-        self._report(progress_cb, 5, "Removing background…")
-        image = self._preprocess(image_bytes)
+        # Step 1 — background removal (single or multi-view)
+        view_labels = params.get("view_labels", [])
+        is_multiview = isinstance(image_bytes, list) and len(image_bytes) > 1
+        if is_multiview:
+            self._report(progress_cb, 5, f"Removing backgrounds ({len(image_bytes)} images)…")
+            processed_images = [self._preprocess(ib) for ib in image_bytes]
+            if view_labels and len(view_labels) == len(processed_images):
+                image = {label: img for label, img in zip(view_labels, processed_images)}
+            else:
+                fallback_keys = ["front", "left", "back", "right"]
+                image = {fallback_keys[i]: img for i, img in enumerate(processed_images[:4])}
+        elif isinstance(image_bytes, list):
+            self._report(progress_cb, 5, "Removing background…")
+            image = self._preprocess(image_bytes[0])
+        else:
+            self._report(progress_cb, 5, "Removing background…")
+            image = self._preprocess(image_bytes)
 
         # Step 2 — shape generation (long, no internal callbacks)
         self._report(progress_cb, 12, "Generating 3D shape…")
diff --git a/api/services/generators/hunyuan3d_mini.py b/api/services/generators/hunyuan3d_mini.py
index eb1e766..1645f25 100644
--- a/api/services/generators/hunyuan3d_mini.py
+++ b/api/services/generators/hunyuan3d_mini.py
@@ -17,7 +17,7 @@
 import uuid
 import zipfile
 from pathlib import Path
-from typing import Callable, Optional
+from typing import Callable, List, Optional, Union
 
 from PIL import Image
 
@@ -83,7 +83,7 @@ def unload(self) -> None:
 
     def generate(
         self,
-        image_bytes: bytes,
+        image_bytes: Union[bytes, List[bytes]],
         params: dict,
         progress_cb: Optional[Callable[[int, str], None]] = None,
     ) -> Path:
@@ -96,9 +96,23 @@ def generate(
         guidance_scale   = float(params.get("guidance_scale", 5.5))
         seed             = int(params.get("seed", -1))
 
-        # Step 1 — background removal
-        self._report(progress_cb, 5, "Removing background…")
-        image = self._preprocess(image_bytes)
+        # Step 1 — background removal (single or multi-view)
+        view_labels = params.get("view_labels", [])
+        is_multiview = isinstance(image_bytes, list) and len(image_bytes) > 1
+        if is_multiview:
+            self._report(progress_cb, 5, f"Removing backgrounds ({len(image_bytes)} images)…")
+            processed_images = [self._preprocess(ib) for ib in image_bytes]
+            if view_labels and len(view_labels) == len(processed_images):
+                image = {label: img for label, img in zip(view_labels, processed_images)}
+            else:
+                fallback_keys = ["front", "left", "back", "right"]
+                image = {fallback_keys[i]: img for i, img in enumerate(processed_images[:4])}
+        elif isinstance(image_bytes, list):
+            self._report(progress_cb, 5, "Removing background…")
+            image = self._preprocess(image_bytes[0])
+        else:
+            self._report(progress_cb, 5, "Removing background…")
+            image = self._preprocess(image_bytes)
 
         # Step 2 — shape generation
         # If texture is enabled, reserve 5-70% for shape and 70-95% for texture
diff --git a/api/services/generators/sf3d.py b/api/services/generators/sf3d.py
index 105df06..4d6e63a 100644
--- a/api/services/generators/sf3d.py
+++ b/api/services/generators/sf3d.py
@@ -9,7 +9,7 @@
 import uuid
 import zipfile
 from pathlib import Path
-from typing import Callable, Optional
+from typing import Callable, List, Optional, Union
 
 from PIL import Image
 
@@ -69,12 +69,16 @@ def load(self) -> None:
 
     def generate(
         self,
-        image_bytes: bytes,
+        image_bytes: Union[bytes, List[bytes]],
         params: dict,
         progress_cb: Optional[Callable[[int, str], None]] = None,
     ) -> Path:
         import torch
 
+        # SF3D only supports single-image input; use first image if list provided
+        if isinstance(image_bytes, list):
+            image_bytes = image_bytes[0]
+
         vertex_count = int(params.get("vertex_count", 10000))
         remesh       = str(params.get("remesh", "quad"))
 
diff --git a/src/areas/generate/GeneratePage.tsx b/src/areas/generate/GeneratePage.tsx
index cf4cb5b..c30b38b 100644
--- a/src/areas/generate/GeneratePage.tsx
+++ b/src/areas/generate/GeneratePage.tsx
@@ -7,9 +7,10 @@ import WorkspacePanel from './components/WorkspacePanel'
 import Viewer3D from './components/Viewer3D'
 
 export default function GeneratePage(): JSX.Element {
-  const selectedImagePath = useAppStore((s) => s.selectedImagePath)
+  const viewImages = useAppStore((s) => s.viewImages)
   const { currentJob, startGeneration } = useGeneration()
   const isGenerating = currentJob?.status === 'uploading' || currentJob?.status === 'generating'
+  const hasFrontImage = !!viewImages.front
 
   return (
     <>
@@ -23,8 +24,8 @@ export default function GeneratePage(): JSX.Element {
         {/* Sticky bottom: Generate button */}
         <div className="p-4 border-t border-zinc-800">
           <button
-            onClick={() => selectedImagePath && startGeneration(selectedImagePath)}
-            disabled={!selectedImagePath || isGenerating}
+            onClick={() => hasFrontImage && startGeneration()}
+            disabled={!hasFrontImage || isGenerating}
             className="w-full py-2.5 rounded-lg text-sm font-semibold bg-accent hover:bg-accent-dark disabled:opacity-40 disabled:cursor-not-allowed text-white transition-colors"
           >
             {isGenerating ? 'Generating…' : 'Generate 3D Model'}
diff --git a/src/areas/generate/components/ImageUpload.tsx b/src/areas/generate/components/ImageUpload.tsx
index b10725d..29f7c1b 100644
--- a/src/areas/generate/components/ImageUpload.tsx
+++ b/src/areas/generate/components/ImageUpload.tsx
@@ -1,94 +1,139 @@
-import { useState, useCallback } from 'react'
-import { useAppStore } from '@shared/stores/appStore'
+import { useCallback } from 'react'
+import { useAppStore, VIEW_SLOTS, ViewSlot } from '@shared/stores/appStore'
 import { useGeneration } from '@shared/hooks/useGeneration'
 
+const VIEW_LABELS: Record<ViewSlot, { label: string; tooltip: string }> = {
+  front: { label: 'Front', tooltip: 'Front-facing view of the object' },
+  left:  { label: 'Left',  tooltip: 'Left side view (90° clockwise from front)' },
+  back:  { label: 'Back',  tooltip: 'Rear view of the object' },
+  right: { label: 'Right', tooltip: 'Right side view (90° counter-clockwise from front)' },
+}
+
 export default function ImageUpload(): JSX.Element {
   const { currentJob } = useGeneration()
-  const { setSelectedImagePath, selectedImagePreviewUrl, setSelectedImagePreviewUrl, setSelectedImageData } = useAppStore()
-  const [isDragging, setIsDragging] = useState(false)
+  const { viewImages, setViewImage, removeViewImage, clearViewImages } = useAppStore()
 
   const isGenerating = currentJob?.status === 'uploading' || currentJob?.status === 'generating'
+  const hasAnyImage = Object.keys(viewImages).length > 0
 
-  const handleFileSelect = useCallback(async () => {
+  const handleSlotSelect = useCallback(async (slot: ViewSlot) => {
     const path = await window.electron.fs.selectImage()
     if (!path) return
-    setSelectedImageData(null)
-    setSelectedImagePath(path)
 
-    // Read via IPC → blob URL (file:// blocked when served from localhost in dev)
     const base64 = await window.electron.fs.readFileBase64(path)
     const byteArray = Uint8Array.from(atob(base64), (c) => c.charCodeAt(0))
     const blob = new Blob([byteArray], { type: 'image/png' })
-    setSelectedImagePreviewUrl(URL.createObjectURL(blob))
-  }, [setSelectedImagePath, setSelectedImagePreviewUrl, setSelectedImageData])
+    const previewUrl = URL.createObjectURL(blob)
+
+    setViewImage(slot, { path, previewUrl, data: null })
+  }, [setViewImage])
 
-  const handleDrop = useCallback((e: React.DragEvent) => {
+  const handleSlotDrop = useCallback((e: React.DragEvent, slot: ViewSlot) => {
     e.preventDefault()
-    setIsDragging(false)
+    e.stopPropagation()
     const file = e.dataTransfer.files[0]
     if (!file || !file.type.startsWith('image/')) return
 
-    setSelectedImagePreviewUrl(URL.createObjectURL(file))
-
+    const previewUrl = URL.createObjectURL(file)
     const filePath = (file as File & { path?: string }).path
+
     if (filePath) {
-      setSelectedImageData(null)
-      setSelectedImagePath(filePath)
+      setViewImage(slot, { path: filePath, previewUrl, data: null })
     } else {
-      // file.path unavailable (some Electron configs) — read directly via FileReader
       const reader = new FileReader()
       reader.onload = (ev) => {
         const dataUrl = ev.target?.result as string
         const base64 = dataUrl.split(',')[1]
-        setSelectedImageData(base64)
-        setSelectedImagePath('__blob__')
+        setViewImage(slot, { path: '__blob__', previewUrl, data: base64 })
       }
       reader.readAsDataURL(file)
     }
-  }, [setSelectedImagePath, setSelectedImagePreviewUrl, setSelectedImageData])
+  }, [setViewImage])
 
   return (
     <div className="flex flex-col p-4 gap-3">
-      <h2 className="text-xs font-semibold uppercase tracking-widest text-zinc-500">Input Image</h2>
-
-      {/* Drop zone */}
-      <div
-        onClick={isGenerating ? undefined : handleFileSelect}
-        onDrop={handleDrop}
-        onDragOver={(e) => { e.preventDefault(); setIsDragging(true) }}
-        onDragLeave={() => setIsDragging(false)}
-        className={`
-          relative aspect-square rounded-xl border-2 border-dashed
-          flex items-center justify-center overflow-hidden
-          transition-colors cursor-pointer
-          ${isDragging ? 'border-accent bg-accent/10' : 'border-zinc-700 hover:border-zinc-500'}
-          ${isGenerating ? 'cursor-not-allowed opacity-60' : ''}
-        `}
-      >
-        {selectedImagePreviewUrl ? (
-          <img
-            src={selectedImagePreviewUrl}
-            alt="Input"
-            className="w-full h-full object-cover"
-          />
-        ) : (
-          <div className="flex flex-col items-center gap-2 text-zinc-600">
-            <svg width="32" height="32" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="1">
-              <rect x="3" y="3" width="18" height="18" rx="2" />
-              <circle cx="8.5" cy="8.5" r="1.5" />
-              <polyline points="21 15 16 10 5 21" />
-            </svg>
-            <p className="text-xs text-center">Drop image here<br />or click to browse</p>
-          </div>
+      <div className="flex items-center justify-between">
+        <h2 className="text-xs font-semibold uppercase tracking-widest text-zinc-500">
+          Input Images
+        </h2>
+        {hasAnyImage && (
+          <button
+            onClick={clearViewImages}
+            disabled={isGenerating}
+            className="text-[10px] text-zinc-500 hover:text-zinc-300 disabled:opacity-40"
+          >
+            Clear all
+          </button>
         )}
+      </div>
 
-        {/* Generating overlay */}
-        {isGenerating && (
-          <div className="absolute inset-0 bg-surface-500/80 flex items-center justify-center">
-            <div className="w-8 h-8 border-2 border-accent border-t-transparent rounded-full animate-spin" />
-          </div>
-        )}
+      {/* View slots grid */}
+      <div className="grid grid-cols-2 gap-2">
+        {VIEW_SLOTS.map((slot) => {
+          const image = viewImages[slot]
+          const { label, tooltip } = VIEW_LABELS[slot]
+          const isRequired = slot === 'front'
+
+          return (
+            <div
+              key={slot}
+              title={tooltip}
+              onClick={isGenerating ? undefined : () => handleSlotSelect(slot)}
+              onDrop={(e) => !isGenerating && handleSlotDrop(e, slot)}
+              onDragOver={(e) => { e.preventDefault(); e.stopPropagation() }}
+              className={`
+                relative aspect-square rounded-lg border-2 border-dashed
+                flex items-center justify-center overflow-hidden
+                transition-colors cursor-pointer
+                ${image ? 'border-zinc-600' : isRequired ? 'border-zinc-600 hover:border-zinc-400' : 'border-zinc-800 hover:border-zinc-600'}
+                ${isGenerating ? 'cursor-not-allowed opacity-60' : ''}
+              `}
+            >
+              {image ? (
+                <>
+                  <img src={image.previewUrl} alt={label} className="w-full h-full object-cover" />
+                  {!isGenerating && (
+                    <button
+                      onClick={(e) => { e.stopPropagation(); removeViewImage(slot) }}
+                      className="absolute top-1 right-1 w-5 h-5 rounded-full bg-black/70 text-zinc-300 hover:text-white flex items-center justify-center text-xs opacity-0 group-hover:opacity-100 transition-opacity"
+                      style={{ opacity: undefined }}
+                      onMouseEnter={(e) => (e.currentTarget.style.opacity = '1')}
+                      onMouseLeave={(e) => (e.currentTarget.style.opacity = '0')}
+                    >
+                      x
+                    </button>
+                  )}
+                  <span className="absolute bottom-1 left-1 text-[9px] bg-black/60 text-zinc-300 px-1 rounded">
+                    {label}
+                  </span>
+                </>
+              ) : (
+                <div className="flex flex-col items-center gap-1 text-zinc-600 p-2">
+                  <svg width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" strokeWidth="1.5">
+                    <line x1="12" y1="5" x2="12" y2="19" />
+                    <line x1="5" y1="12" x2="19" y2="12" />
+                  </svg>
+                  <p className="text-[10px] text-center leading-tight">
+                    {label}
+                    {isRequired && <span className="text-accent"> *</span>}
+                  </p>
+                </div>
+              )}
+            </div>
+          )
+        })}
       </div>
+
+      <p className="text-[10px] text-zinc-600 leading-tight">
+        Front view required. Add more views for better results. Empty slots are skipped.
+      </p>
+
+      {/* Generating overlay */}
+      {isGenerating && (
+        <div className="text-center">
+          <div className="inline-block w-6 h-6 border-2 border-accent border-t-transparent rounded-full animate-spin" />
+        </div>
+      )}
     </div>
   )
 }
diff --git a/src/areas/generate/components/WorkspacePanel.tsx b/src/areas/generate/components/WorkspacePanel.tsx
index 0e8d5c6..b496ea7 100644
--- a/src/areas/generate/components/WorkspacePanel.tsx
+++ b/src/areas/generate/components/WorkspacePanel.tsx
@@ -88,7 +88,7 @@ export function WorkspaceToggle(): JSX.Element {
 }
 
 export default function WorkspacePanel(): JSX.Element {
-  const { currentJob, setCurrentJob, setSelectedImagePath, setSelectedImagePreviewUrl, setGenerationOptions } = useAppStore()
+  const { currentJob, setCurrentJob, setViewImage, clearViewImages, setGenerationOptions } = useAppStore()
   const { collections, activeCollectionId, setActiveCollection, removeFromWorkspace, createCollection } = useCollectionsStore()
   const [pendingDeleteId, setPendingDeleteId] = useState<string | null>(null)
   const [creating, setCreating] = useState(false)
@@ -117,14 +117,14 @@ export default function WorkspacePanel(): JSX.Element {
     } else if (job.modelId) {
       setGenerationOptions({ modelId: job.modelId })
     }
-    setSelectedImagePath(job.imageFile)
+    clearViewImages()
     try {
       const base64 = await window.electron.fs.readFileBase64(job.imageFile)
       const byteArray = Uint8Array.from(atob(base64), (c) => c.charCodeAt(0))
       const blob = new Blob([byteArray], { type: 'image/png' })
-      setSelectedImagePreviewUrl(URL.createObjectURL(blob))
+      setViewImage('front', { path: job.imageFile, previewUrl: URL.createObjectURL(blob), data: null })
     } catch {
-      setSelectedImagePreviewUrl(null)
+      // Image file not readable, skip preview
     }
   }
 
diff --git a/src/areas/models/components/ExtensionCard.tsx b/src/areas/models/components/ExtensionCard.tsx
index d7f26c5..1485ca4 100644
--- a/src/areas/models/components/ExtensionCard.tsx
+++ b/src/areas/models/components/ExtensionCard.tsx
@@ -138,11 +138,11 @@ export function ExtensionCard({ ext, installedIds, downloading, loadError, disab
                     </div>
                   ) : (
                     <button
-                      onClick={() => ext.trusted && !disabled && onInstall(variant)}
-                      disabled={!ext.trusted || disabled}
-                      title={!ext.trusted ? 'Unverified source — installation blocked' : disabled ? 'A download is already in progress' : `Install ${variant.name}`}
+                      onClick={() => !disabled && onInstall(variant)}
+                      disabled={disabled}
+                      title={disabled ? 'A download is already in progress' : `Install ${variant.name}`}
                       className={`w-full flex items-center justify-center gap-1 px-2 py-1 rounded-lg border text-[10px] font-semibold transition-all ${
-                        ext.trusted && !disabled
+                        !disabled
                           ? 'bg-accent/15 border-accent/25 text-accent-light hover:bg-accent/25 hover:border-accent/40 cursor-pointer'
                           : 'bg-zinc-800/40 border-zinc-700/30 text-zinc-600 cursor-not-allowed'
                       }`}
diff --git a/src/shared/hooks/useApi.ts b/src/shared/hooks/useApi.ts
index 9cd335c..89b7b18 100644
--- a/src/shared/hooks/useApi.ts
+++ b/src/shared/hooks/useApi.ts
@@ -7,19 +7,30 @@ export function useApi() {
   const client = axios.create({ baseURL: apiUrl })
 
   async function generateFromImage(
-    imagePath: string,
+    imagePaths: string[],
     options: GenerationOptions,
     collection: string = 'Default',
-    imageData?: string,
+    imageDataArray?: (string | null)[],
+    viewLabels?: string[],
   ): Promise<{ jobId: string }> {
-    // Use provided base64 (drag & drop) or read from disk via IPC
-    const base64 = imageData ?? await window.electron.fs.readFileBase64(imagePath)
-    const byteArray = Uint8Array.from(atob(base64), (c) => c.charCodeAt(0))
-    const blob = new Blob([byteArray], { type: 'image/png' })
-    const filename = imagePath.split(/[\\/]/).pop() ?? 'image.png'
-
     const formData = new FormData()
-    formData.append('image', blob, filename)
+
+    // Append each image as a separate 'image' field (FastAPI collects as List[UploadFile])
+    for (let i = 0; i < imagePaths.length; i++) {
+      const path = imagePaths[i]
+      const imageData = imageDataArray?.[i]
+      const base64 = imageData ?? await window.electron.fs.readFileBase64(path)
+      const byteArray = Uint8Array.from(atob(base64), (c) => c.charCodeAt(0))
+      const blob = new Blob([byteArray], { type: 'image/png' })
+      const filename = path.split(/[\\/]/).pop() ?? `image_${i}.png`
+      formData.append('image', blob, filename)
+    }
+
+    // Send view labels so backend knows which view each image corresponds to
+    if (viewLabels && viewLabels.length > 0) {
+      formData.append('view_labels', viewLabels.join(','))
+    }
+
     formData.append('model_id', options.modelId)
     formData.append('collection', collection)
     formData.append('vertex_count', String(options.vertexCount))
diff --git a/src/shared/hooks/useGeneration.ts b/src/shared/hooks/useGeneration.ts
index e4c5970..5e1299c 100644
--- a/src/shared/hooks/useGeneration.ts
+++ b/src/shared/hooks/useGeneration.ts
@@ -4,16 +4,23 @@ import { useCollectionsStore } from '@shared/stores/collectionsStore'
 import { useApi } from './useApi'
 
 export function useGeneration() {
-  const { currentJob, setCurrentJob, updateCurrentJob, generationOptions, selectedImageData } = useAppStore()
+  const { currentJob, setCurrentJob, updateCurrentJob, generationOptions, viewImages } = useAppStore()
   const addToWorkspace = useCollectionsStore((s) => s.addToWorkspace)
   const activeCollectionId = useCollectionsStore((s) => s.activeCollectionId)
   const { generateFromImage, pollJobStatus } = useApi()
 
   const startGeneration = useCallback(
-    async (imagePath: string) => {
+    async () => {
+      // Build ordered arrays from view slots (front, left, back, right)
+      // Only include slots that have images
+      const VIEW_ORDER = ['front', 'left', 'back', 'right'] as const
+      const filledSlots = VIEW_ORDER.filter((slot) => viewImages[slot])
+      const imagePaths = filledSlots.map((slot) => viewImages[slot]!.path)
+      const imageDataArray = filledSlots.map((slot) => viewImages[slot]!.data)
+
       const job = {
         id: crypto.randomUUID(),
-        imageFile: imagePath,
+        imageFile: imagePaths[0],
         status: 'uploading' as const,
         progress: 0,
         createdAt: Date.now(),
@@ -23,7 +30,7 @@ export function useGeneration() {
       setCurrentJob(job)
 
       try {
-        const { jobId } = await generateFromImage(imagePath, generationOptions, activeCollectionId, selectedImageData ?? undefined)
+        const { jobId } = await generateFromImage(imagePaths, generationOptions, activeCollectionId, imageDataArray, filledSlots as string[])
 
         updateCurrentJob({ status: 'generating', progress: 0 })
 
@@ -36,7 +43,7 @@ export function useGeneration() {
         })
       }
     },
-    [generateFromImage, pollJobStatus, setCurrentJob, updateCurrentJob, addToWorkspace, activeCollectionId]
+    [generateFromImage, pollJobStatus, setCurrentJob, updateCurrentJob, addToWorkspace, activeCollectionId, viewImages]
   )
 
   const pollUntilDone = async (jobId: string) => {
diff --git a/src/shared/stores/appStore.ts b/src/shared/stores/appStore.ts
index a8afa94..2158384 100644
--- a/src/shared/stores/appStore.ts
+++ b/src/shared/stores/appStore.ts
@@ -40,6 +40,15 @@ export interface GenerationOptions {
   numInferenceSteps: number
 }
 
+export type ViewSlot = 'front' | 'left' | 'back' | 'right'
+export const VIEW_SLOTS: ViewSlot[] = ['front', 'left', 'back', 'right']
+
+export interface ViewImage {
+  path: string
+  previewUrl: string
+  data: string | null  // base64 for drag & drop
+}
+
 const DEFAULT_OPTIONS: GenerationOptions = {
   modelId: '',
   vertexCount: 10000,
@@ -61,13 +70,11 @@ interface AppState {
   // Current generation
   currentJob: GenerationJob | null
 
-  // Selected image (shared between ImageUpload and the Generate button)
-  selectedImagePath: string | null
-  setSelectedImagePath: (path: string | null) => void
-  selectedImagePreviewUrl: string | null
-  setSelectedImagePreviewUrl: (url: string | null) => void
-  selectedImageData: string | null   // base64 content for drag & drop (when path is unavailable)
-  setSelectedImageData: (data: string | null) => void
+  // Selected images by view slot (front, left, back, right)
+  viewImages: Partial<Record<ViewSlot, ViewImage>>
+  setViewImage: (slot: ViewSlot, image: ViewImage) => void
+  removeViewImage: (slot: ViewSlot) => void
+  clearViewImages: () => void
 
   // Generation options
   generationOptions: GenerationOptions
@@ -133,12 +140,16 @@ export const useAppStore = create<AppState>()(
       },
 
       currentJob: null,
-      selectedImagePath: null,
-      setSelectedImagePath: (path) => set({ selectedImagePath: path }),
-      selectedImagePreviewUrl: null,
-      setSelectedImagePreviewUrl: (url) => set({ selectedImagePreviewUrl: url }),
-      selectedImageData: null,
-      setSelectedImageData: (data) => set({ selectedImageData: data }),
+      viewImages: {},
+      setViewImage: (slot, image) => set((s) => ({
+        viewImages: { ...s.viewImages, [slot]: image },
+      })),
+      removeViewImage: (slot) => set((s) => {
+        const next = { ...s.viewImages }
+        delete next[slot]
+        return { viewImages: next }
+      }),
+      clearViewImages: () => set({ viewImages: {} }),
       generationOptions: DEFAULT_OPTIONS,
       meshStats: null,
       setMeshStats: (stats) => set({ meshStats: stats }),
diff --git a/src/shared/stores/collectionsStore.ts b/src/shared/stores/collectionsStore.ts
index 8a972cd..6d50665 100644
--- a/src/shared/stores/collectionsStore.ts
+++ b/src/shared/stores/collectionsStore.ts
@@ -30,14 +30,14 @@ interface CollectionsState {
 }
 
 async function syncCurrentJob(firstJob: GenerationJob | undefined) {
-  const { setCurrentJob, setSelectedImagePath, setSelectedImagePreviewUrl, setGenerationOptions } = useAppStore.getState()
+  const { setCurrentJob, setViewImage, clearViewImages, setGenerationOptions } = useAppStore.getState()
   if (!firstJob) {
     setCurrentJob(null)
     return
   }
 
   setCurrentJob({ ...firstJob, outputUrl: firstJob.originalOutputUrl ?? firstJob.outputUrl })
-  setSelectedImagePath(firstJob.imageFile)
+  clearViewImages()
 
   if (firstJob.generationOptions) {
     setGenerationOptions(firstJob.generationOptions)
@@ -49,9 +49,9 @@ async function syncCurrentJob(firstJob: GenerationJob | undefined) {
     const base64 = await window.electron.fs.readFileBase64(firstJob.imageFile)
     const byteArray = Uint8Array.from(atob(base64), (c) => c.charCodeAt(0))
     const blob = new Blob([byteArray], { type: 'image/png' })
-    setSelectedImagePreviewUrl(URL.createObjectURL(blob))
+    setViewImage('front', { path: firstJob.imageFile, previewUrl: URL.createObjectURL(blob), data: null })
   } catch {
-    setSelectedImagePreviewUrl(null)
+    // Image file not readable, skip preview
   }
 }
 
diff --git a/src/shared/types/electron.d.ts b/src/shared/types/electron.d.ts
index d80163c..02d0d72 100644
--- a/src/shared/types/electron.d.ts
+++ b/src/shared/types/electron.d.ts
@@ -18,7 +18,7 @@ declare global {
         offLog: () => void
       }
       fs: {
-        selectImage:     () => Promise<string | null>
+        selectImage:     () => Promise<string | null>  // single file; multi-view via drag & drop
         saveModel:       (defaultName: string) => Promise<string | null>
         readFileBase64:  (filePath: string) => Promise<string>
         selectDirectory: () => Promise<string | null>