From d7b70fceb320c7d1097cbdd5aa5fd58b30882353 Mon Sep 17 00:00:00 2001 From: John Walsh Date: Mon, 22 Sep 2025 15:16:10 -0400 Subject: [PATCH 01/13] initial ui changes --- morphocluster/api.py | 266 ++++++++ morphocluster/frontend/.gitignore | 2 + .../frontend/src/components/FeatureModal.vue | 596 ++++++++++++++++++ .../frontend/src/components/FormatModal.vue | 399 ++++++++++++ .../frontend/src/components/JobStatus.vue | 512 +++++++++++++++ .../frontend/src/components/UploadZone.vue | 484 ++++++++++++++ morphocluster/frontend/src/helpers/api.js | 61 ++ morphocluster/frontend/src/router.js | 5 + morphocluster/frontend/src/views/Home.vue | 5 + morphocluster/frontend/src/views/Upload.vue | 562 +++++++++++++++++ 10 files changed, 2892 insertions(+) create mode 100644 morphocluster/frontend/src/components/FeatureModal.vue create mode 100644 morphocluster/frontend/src/components/FormatModal.vue create mode 100644 morphocluster/frontend/src/components/JobStatus.vue create mode 100644 morphocluster/frontend/src/components/UploadZone.vue create mode 100644 morphocluster/frontend/src/views/Upload.vue diff --git a/morphocluster/api.py b/morphocluster/api.py index 74cbe4c..2f453c4 100644 --- a/morphocluster/api.py +++ b/morphocluster/api.py @@ -325,6 +325,272 @@ def upload_files(path=""): raise werkzeug.exceptions.BadRequest() +# =============================================================================== +# /upload - Data Pipeline Upload Interface +# =============================================================================== + +@api.route("/upload", methods=["POST"]) +def upload_archives(): + """ + Mock endpoint for uploading data archives. + Returns mock response for frontend testing. + """ + uploaded_files = request.files.getlist("files") + + if not uploaded_files: + raise werkzeug.exceptions.BadRequest("No files provided") + + # Mock response + result = { + "message": "Files uploaded successfully", + "files": [ + { + "name": file.filename, + "size": file.content_length or 1024000, # Mock size if not available + "id": str(uuid.uuid4()), + "status": "uploaded" + } + for file in uploaded_files + ] + } + + return jsonify(result), 200 + + +@api.route("/files//validate", methods=["GET"]) +def validate_archive(file_id): + """ + Mock endpoint for archive validation. + Returns mock validation data for frontend testing. + """ + # Mock validation response + result = { + "is_valid": True, + "format": "ecotaxa" if "ecotaxa" in file_id.lower() else "standard", + "needs_conversion": "ecotaxa" in file_id.lower(), + "file_count": 1250, + "image_count": 1200, + "detected_encoding": "utf-8", + "detected_delimiter": "\t" if "ecotaxa" in file_id.lower() else ",", + "validation_warnings": [] + } + + return jsonify(result), 200 + + +@api.route("/files//preview", methods=["GET"]) +def preview_archive(file_id): + """ + Mock endpoint for archive preview. + Returns mock preview data for frontend testing. 
+ """ + # Mock preview response + result = { + "files": [ + "index.csv", + "images/img001.jpg", + "images/img002.jpg", + "images/img003.jpg", + "images/img004.jpg", + "images/img005.jpg" + ], + "total_rows": 1200, + "detected_encoding": "utf-8", + "detected_delimiter": "," if "standard" in file_id.lower() else "\t", + "columns": [ + {"key": "object_id", "label": "Object ID"}, + {"key": "img_file_name", "label": "Image File"}, + {"key": "object_lat", "label": "Latitude"}, + {"key": "object_lon", "label": "Longitude"}, + {"key": "object_depth", "label": "Depth"} + ], + "sample_rows": [ + { + "object_id": "obj_001", + "img_file_name": "images/img001.jpg", + "object_lat": "45.123", + "object_lon": "-125.456", + "object_depth": "10.5" + }, + { + "object_id": "obj_002", + "img_file_name": "images/img002.jpg", + "object_lat": "45.124", + "object_lon": "-125.457", + "object_depth": "12.1" + }, + { + "object_id": "obj_003", + "img_file_name": "images/img003.jpg", + "object_lat": "45.125", + "object_lon": "-125.458", + "object_depth": "8.9" + } + ] + } + + return jsonify(result), 200 + + +@api.route("/files//convert", methods=["POST"]) +def convert_ecotaxa_format(file_id): + """ + Mock endpoint for EcoTaxa format conversion. + Creates a mock background job for frontend testing. + """ + data = request.get_json() or {} + + # Mock job creation + job_id = str(uuid.uuid4()) + + result = { + "job_id": job_id, + "status": "started", + "message": "EcoTaxa conversion job started", + "parameters": data + } + + return jsonify(result), 202 + + +@api.route("/files//extract", methods=["POST"]) +def extract_features(file_id): + """ + Mock endpoint for feature extraction. + Creates a mock background job for frontend testing. + """ + data = request.get_json() or {} + + # Mock job creation + job_id = str(uuid.uuid4()) + + result = { + "job_id": job_id, + "status": "started", + "message": "Feature extraction job started", + "parameters": data + } + + return jsonify(result), 202 + + +@api.route("/jobs/user", methods=["GET"]) +def get_user_jobs(): + """ + Mock endpoint for getting user jobs. + Returns mock job data for frontend testing. + """ + # Mock jobs with different statuses + jobs = [ + { + "id": "job_001", + "job_type": "format_conversion", + "status": "completed", + "progress": 100, + "created_at": "2024-01-15T10:30:00Z", + "completed_at": "2024-01-15T10:32:15Z", + "parameters": { + "archive_name": "sample_ecotaxa.zip", + "encoding": "utf-8", + "delimiter": "\t" + }, + "result_url": "/files/converted_sample" + }, + { + "id": "job_002", + "job_type": "feature_extraction", + "status": "running", + "progress": 45, + "created_at": "2024-01-15T11:00:00Z", + "current_step": "Processing batch 450/1000", + "eta": 300, + "parameters": { + "archive_name": "marine_plankton.zip", + "model": "resnet50", + "batch_size": 512 + }, + "logs": [ + { + "timestamp": "2024-01-15T11:00:00Z", + "level": "info", + "message": "Starting feature extraction..." + }, + { + "timestamp": "2024-01-15T11:05:30Z", + "level": "info", + "message": "Processed 200 images" + }, + { + "timestamp": "2024-01-15T11:10:15Z", + "level": "info", + "message": "Processed 450 images" + } + ] + }, + { + "id": "job_003", + "job_type": "initial_clustering", + "status": "failed", + "progress": 25, + "created_at": "2024-01-15T09:15:00Z", + "failed_at": "2024-01-15T09:45:30Z", + "error_message": "Insufficient memory for clustering. 
Try reducing batch size.", + "parameters": { + "min_cluster_size": 128, + "method": "EOM" + } + } + ] + + return jsonify(jobs), 200 + + +@api.route("/jobs//status", methods=["GET"]) +def get_job_status(job_id): + """ + Mock endpoint for getting individual job status. + Returns mock job status for frontend testing. + """ + # Mock job status based on job_id + if job_id == "job_001": + job = { + "id": job_id, + "status": "completed", + "progress": 100, + "result_url": "/files/converted_sample" + } + elif job_id == "job_002": + job = { + "id": job_id, + "status": "running", + "progress": 65, + "current_step": "Processing batch 650/1000", + "eta": 180 + } + else: + job = { + "id": job_id, + "status": "pending", + "progress": 0 + } + + return jsonify(job), 200 + + +@api.route("/jobs/", methods=["DELETE"]) +def cancel_job(job_id): + """ + Mock endpoint for cancelling a job. + Returns mock cancellation response for frontend testing. + """ + result = { + "message": f"Job {job_id} cancellation requested", + "status": "cancelling" + } + + return jsonify(result), 200 + + # =============================================================================== # /projects # =============================================================================== diff --git a/morphocluster/frontend/.gitignore b/morphocluster/frontend/.gitignore index c6e316b..e5fa33f 100644 --- a/morphocluster/frontend/.gitignore +++ b/morphocluster/frontend/.gitignore @@ -1,5 +1,6 @@ .DS_Store node_modules +/dist # local env files .env.local @@ -9,6 +10,7 @@ node_modules npm-debug.log* yarn-debug.log* yarn-error.log* +pnpm-debug.log* # Editor directories and files .idea diff --git a/morphocluster/frontend/src/components/FeatureModal.vue b/morphocluster/frontend/src/components/FeatureModal.vue new file mode 100644 index 0000000..1cd0cce --- /dev/null +++ b/morphocluster/frontend/src/components/FeatureModal.vue @@ -0,0 +1,596 @@ + + + + + \ No newline at end of file diff --git a/morphocluster/frontend/src/components/FormatModal.vue b/morphocluster/frontend/src/components/FormatModal.vue new file mode 100644 index 0000000..5adc17e --- /dev/null +++ b/morphocluster/frontend/src/components/FormatModal.vue @@ -0,0 +1,399 @@ + + + + + \ No newline at end of file diff --git a/morphocluster/frontend/src/components/JobStatus.vue b/morphocluster/frontend/src/components/JobStatus.vue new file mode 100644 index 0000000..fbd8150 --- /dev/null +++ b/morphocluster/frontend/src/components/JobStatus.vue @@ -0,0 +1,512 @@ + + + + + \ No newline at end of file diff --git a/morphocluster/frontend/src/components/UploadZone.vue b/morphocluster/frontend/src/components/UploadZone.vue new file mode 100644 index 0000000..bb61135 --- /dev/null +++ b/morphocluster/frontend/src/components/UploadZone.vue @@ -0,0 +1,484 @@ + + + + + \ No newline at end of file diff --git a/morphocluster/frontend/src/helpers/api.js b/morphocluster/frontend/src/helpers/api.js index 7f9929d..d0bfe3c 100644 --- a/morphocluster/frontend/src/helpers/api.js +++ b/morphocluster/frontend/src/helpers/api.js @@ -142,4 +142,65 @@ export function getUnfilledNodes(project_id) { export function log(action, node_id = null, reverse_action = null, data = null) { return axios.post(`/api/log`, { action, node_id, reverse_action, data }); +} + +// Upload and Processing Pipeline + +export function uploadArchives(files) { + const formData = new FormData(); + files.forEach(file => { + formData.append('files', file); + }); + return axios.post('/api/upload', formData, { + headers: { + 'Content-Type': 
'multipart/form-data', + }, + }).then(response => response.data); +} + +export function validateArchive(fileName) { + return axios.get(`/api/files/${fileName}/validate`) + .then(response => response.data); +} + +export function previewArchive(fileName) { + return axios.get(`/api/files/${fileName}/preview`) + .then(response => response.data); +} + +export function convertEcoTaxaFormat(fileName, parameters) { + return axios.post(`/api/files/${fileName}/convert`, parameters) + .then(response => response.data); +} + +export function extractFeatures(fileName, parameters) { + return axios.post(`/api/files/${fileName}/extract`, parameters) + .then(response => response.data); +} + +export function createProjectFromFeatures(featuresId, parameters) { + return axios.post(`/api/features/${featuresId}/cluster`, parameters) + .then(response => response.data); +} + +export function reclusterProject(projectId, parameters) { + return axios.post(`/api/projects/${projectId}/recluster`, parameters) + .then(response => response.data); +} + +// Job Management + +export function getUserJobs() { + return axios.get('/api/jobs/user') + .then(response => response.data); +} + +export function getJobStatus(jobId) { + return axios.get(`/api/jobs/${jobId}/status`) + .then(response => response.data); +} + +export function cancelJob(jobId) { + return axios.delete(`/api/jobs/${jobId}`) + .then(response => response.data); } \ No newline at end of file diff --git a/morphocluster/frontend/src/router.js b/morphocluster/frontend/src/router.js index d2dafd4..3ecd376 100644 --- a/morphocluster/frontend/src/router.js +++ b/morphocluster/frontend/src/router.js @@ -29,6 +29,11 @@ const routes = [ path: '/p', component: () => import(/* webpackChunkName: "projects" */ './views/Projects.vue'), }, + { + name: 'upload', + path: '/upload', + component: () => import(/* webpackChunkName: "upload" */ './views/Upload.vue'), + }, { name: 'files', path: '/files/:file_path?', diff --git a/morphocluster/frontend/src/views/Home.vue b/morphocluster/frontend/src/views/Home.vue index 2d87fb8..30e1654 100644 --- a/morphocluster/frontend/src/views/Home.vue +++ b/morphocluster/frontend/src/views/Home.vue @@ -12,6 +12,11 @@ }"> Files + + Upload Data + diff --git a/morphocluster/frontend/src/views/Upload.vue b/morphocluster/frontend/src/views/Upload.vue new file mode 100644 index 0000000..1d13e8c --- /dev/null +++ b/morphocluster/frontend/src/views/Upload.vue @@ -0,0 +1,562 @@ + + + + + \ No newline at end of file From e79e7ed88be90fb47dbfe5d1417727e8c146e939 Mon Sep 17 00:00:00 2001 From: John Walsh Date: Mon, 22 Sep 2025 15:27:54 -0400 Subject: [PATCH 02/13] simplify upload buttons --- morphocluster/frontend/src/components/UploadZone.vue | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/morphocluster/frontend/src/components/UploadZone.vue b/morphocluster/frontend/src/components/UploadZone.vue index bb61135..0cc327f 100644 --- a/morphocluster/frontend/src/components/UploadZone.vue +++ b/morphocluster/frontend/src/components/UploadZone.vue @@ -57,11 +57,9 @@
-
-            Process Files
-
-
-            Upload More
+
+            Upload More Files
From e0afef4ec7d036d2d86cd249d1cf774138d0fc68 Mon Sep 17 00:00:00 2001 From: John Walsh Date: Wed, 24 Sep 2025 17:18:02 -0400 Subject: [PATCH 03/13] complete upload -> ecotaxa conversion -> feature extraction -> cluster functionality --- docker/morphocluster/Dockerfile | 1 + morphocluster/api.py | 644 +++++++++++++----- morphocluster/background.py | 513 +++++++++++++- .../frontend/src/components/ClusterModal.vue | 360 ++++++++++ .../frontend/src/components/FeatureModal.vue | 14 +- .../frontend/src/components/JobStatus.vue | 74 +- .../frontend/src/components/UploadZone.vue | 14 +- morphocluster/frontend/src/main.js | 4 + morphocluster/frontend/src/views/Approve.vue | 14 + morphocluster/frontend/src/views/Project.vue | 57 +- morphocluster/frontend/src/views/Upload.vue | 311 +++++++-- 11 files changed, 1727 insertions(+), 279 deletions(-) create mode 100644 morphocluster/frontend/src/components/ClusterModal.vue diff --git a/docker/morphocluster/Dockerfile b/docker/morphocluster/Dockerfile index 77afe45..05cacca 100644 --- a/docker/morphocluster/Dockerfile +++ b/docker/morphocluster/Dockerfile @@ -39,6 +39,7 @@ COPY pyproject.toml uv.lock versioneer.py setup.cfg MANIFEST.in README.rst ./ COPY tests ./tests COPY morphocluster ./morphocluster COPY migrations ./migrations +COPY data ./data # Install the application with dependencies from lockfile RUN uv sync --frozen diff --git a/morphocluster/api.py b/morphocluster/api.py index 2f453c4..c5689b5 100644 --- a/morphocluster/api.py +++ b/morphocluster/api.py @@ -332,217 +332,541 @@ def upload_files(path=""): @api.route("/upload", methods=["POST"]) def upload_archives(): """ - Mock endpoint for uploading data archives. - Returns mock response for frontend testing. + Upload data archives for processing pipeline. + Saves files to FILES_DIR and returns file information. """ uploaded_files = request.files.getlist("files") if not uploaded_files: raise werkzeug.exceptions.BadRequest("No files provided") - # Mock response result = { "message": "Files uploaded successfully", - "files": [ - { - "name": file.filename, - "size": file.content_length or 1024000, # Mock size if not available - "id": str(uuid.uuid4()), - "status": "uploaded" - } - for file in uploaded_files - ] + "files": [] } + for upload_file in uploaded_files: + if upload_file.filename: + # Use the same security function as the existing upload + filename = secure_path_and_name(upload_file.filename) + + # Save to FILES_DIR (same location validation expects) + server_path = os.path.join(app.config["FILES_DIR"], filename) + + # Ensure directory exists + os.makedirs(os.path.dirname(server_path), exist_ok=True) + + # Save the file + upload_file.save(server_path) + + # Get actual file size + file_size = os.path.getsize(server_path) + + result["files"].append({ + "name": filename, + "size": file_size, + "id": filename, # Use filename as ID for validation + "status": "uploaded" + }) + return jsonify(result), 200 @api.route("/files//validate", methods=["GET"]) def validate_archive(file_id): """ - Mock endpoint for archive validation. - Returns mock validation data for frontend testing. + Validate an uploaded archive file. + Checks ZIP structure, required files, and detects format. 
""" - # Mock validation response - result = { - "is_valid": True, - "format": "ecotaxa" if "ecotaxa" in file_id.lower() else "standard", - "needs_conversion": "ecotaxa" in file_id.lower(), - "file_count": 1250, - "image_count": 1200, - "detected_encoding": "utf-8", - "detected_delimiter": "\t" if "ecotaxa" in file_id.lower() else ",", - "validation_warnings": [] - } + import zipfile + import csv + import chardet + from pathlib import Path - return jsonify(result), 200 + try: + # Decode URL-encoded filename + from urllib.parse import unquote + filename = unquote(file_id) + + # Find the uploaded file + upload_path = Path(app.config["FILES_DIR"]) / filename + + if not upload_path.exists(): + return jsonify({ + "is_valid": False, + "error": f"File {filename} not found", + "validation_warnings": [] + }), 404 + + result = { + "is_valid": False, + "format": "unknown", + "needs_conversion": False, + "file_count": 0, + "image_count": 0, + "detected_encoding": None, + "detected_delimiter": None, + "validation_warnings": [] + } + + # Check if it's a ZIP file + if not zipfile.is_zipfile(upload_path): + result["error"] = "File is not a valid ZIP archive" + return jsonify(result), 200 + + # Examine ZIP contents + with zipfile.ZipFile(upload_path, 'r') as zip_file: + file_list = zip_file.namelist() + result["file_count"] = len(file_list) + + # Count image files + image_extensions = ('.jpg', '.jpeg', '.png', '.tiff', '.tif') + image_files = [f for f in file_list if f.lower().endswith(image_extensions)] + result["image_count"] = len(image_files) + + # Look for metadata files + csv_files = [f for f in file_list if f.endswith('.csv')] + tsv_files = [f for f in file_list if f.endswith('.tsv')] + + # Detect format based on files present + if 'index.csv' in file_list: + result["format"] = "standard" + result["needs_conversion"] = False + metadata_file = 'index.csv' + elif tsv_files or any('ecotaxa' in f.lower() for f in csv_files): + result["format"] = "ecotaxa" + result["needs_conversion"] = True + metadata_file = tsv_files[0] if tsv_files else csv_files[0] + elif csv_files: + result["format"] = "csv" + result["needs_conversion"] = True + metadata_file = csv_files[0] + else: + result["validation_warnings"].append("No metadata file (CSV/TSV) found") + metadata_file = None + + # Analyze metadata file if found + if metadata_file: + try: + with zip_file.open(metadata_file) as csv_data: + # Detect encoding + raw_data = csv_data.read(10000) # Read first 10KB + encoding_result = chardet.detect(raw_data) + result["detected_encoding"] = encoding_result.get('encoding', 'utf-8') + + # Detect delimiter + sample_text = raw_data.decode(result["detected_encoding"], errors='ignore') + sample_lines = sample_text.split('\n')[:5] + + if sample_lines: + # Count delimiters in first few lines + delimiters = [',', '\t', ';', '|'] + delimiter_counts = {} + + for line in sample_lines: + for delim in delimiters: + delimiter_counts[delim] = delimiter_counts.get(delim, 0) + line.count(delim) + + # Choose most common delimiter + if delimiter_counts: + result["detected_delimiter"] = max(delimiter_counts, key=delimiter_counts.get) + + except Exception as e: + result["validation_warnings"].append(f"Could not analyze metadata file: {str(e)}") + + # Validation checks + if result["image_count"] == 0: + result["validation_warnings"].append("No image files found") + + if metadata_file is None: + result["validation_warnings"].append("No metadata file found") + + # Archive is valid if it has images and metadata + result["is_valid"] = 
(result["image_count"] > 0 and metadata_file is not None) + + return jsonify(result), 200 + + except Exception as e: + return jsonify({ + "is_valid": False, + "error": f"Validation failed: {str(e)}", + "validation_warnings": [] + }), 500 @api.route("/files//preview", methods=["GET"]) def preview_archive(file_id): """ - Mock endpoint for archive preview. - Returns mock preview data for frontend testing. + Preview archive contents and extract sample data from CSV/TSV files. """ - # Mock preview response - result = { - "files": [ - "index.csv", - "images/img001.jpg", - "images/img002.jpg", - "images/img003.jpg", - "images/img004.jpg", - "images/img005.jpg" - ], - "total_rows": 1200, - "detected_encoding": "utf-8", - "detected_delimiter": "," if "standard" in file_id.lower() else "\t", - "columns": [ - {"key": "object_id", "label": "Object ID"}, - {"key": "img_file_name", "label": "Image File"}, - {"key": "object_lat", "label": "Latitude"}, - {"key": "object_lon", "label": "Longitude"}, - {"key": "object_depth", "label": "Depth"} - ], - "sample_rows": [ - { - "object_id": "obj_001", - "img_file_name": "images/img001.jpg", - "object_lat": "45.123", - "object_lon": "-125.456", - "object_depth": "10.5" - }, - { - "object_id": "obj_002", - "img_file_name": "images/img002.jpg", - "object_lat": "45.124", - "object_lon": "-125.457", - "object_depth": "12.1" - }, - { - "object_id": "obj_003", - "img_file_name": "images/img003.jpg", - "object_lat": "45.125", - "object_lon": "-125.458", - "object_depth": "8.9" - } - ] - } + import zipfile + import csv + import chardet + from pathlib import Path + from urllib.parse import unquote - return jsonify(result), 200 + try: + filename = unquote(file_id) + upload_path = Path(app.config["FILES_DIR"]) / filename + + if not upload_path.exists(): + return jsonify({"error": f"File {filename} not found"}), 404 + + if not zipfile.is_zipfile(upload_path): + return jsonify({"error": "File is not a valid ZIP archive"}), 400 + + result = { + "files": [], + "total_rows": 0, + "detected_encoding": None, + "detected_delimiter": None, + "columns": [], + "sample_rows": [] + } + + with zipfile.ZipFile(upload_path, 'r') as zip_file: + # Get all files in archive + file_list = zip_file.namelist() + result["files"] = sorted(file_list) + + # Find metadata file (CSV/TSV) + csv_files = [f for f in file_list if f.endswith('.csv')] + tsv_files = [f for f in file_list if f.endswith('.tsv')] + + metadata_file = None + if 'index.csv' in file_list: + metadata_file = 'index.csv' + elif tsv_files: + metadata_file = tsv_files[0] + elif csv_files: + metadata_file = csv_files[0] + + if metadata_file: + try: + with zip_file.open(metadata_file) as csv_data: + # Detect encoding + raw_data = csv_data.read(50000) # Read first 50KB for better detection + encoding_result = chardet.detect(raw_data) + detected_encoding = encoding_result.get('encoding', 'utf-8') + + # Handle common encoding issues + if detected_encoding.lower() in ['ascii', 'windows-1252', 'iso-8859-1']: + detected_encoding = 'utf-8' + + result["detected_encoding"] = detected_encoding + + # Decode text and detect delimiter + try: + text = raw_data.decode(detected_encoding, errors='replace') + except UnicodeDecodeError: + text = raw_data.decode('utf-8', errors='replace') + + # Detect delimiter by analyzing first few lines + lines = text.split('\n')[:10] + non_empty_lines = [line.strip() for line in lines if line.strip()] + + if non_empty_lines: + # Count delimiters in header and first few data rows + delimiters = [',', '\t', ';', '|'] + 
delimiter_scores = {} + + for delim in delimiters: + scores = [] + for line in non_empty_lines[:5]: # Check first 5 lines + count = line.count(delim) + scores.append(count) + + # Prefer delimiters that appear consistently + if scores and max(scores) > 0: + consistency = len(set(scores)) == 1 # All lines have same count + delimiter_scores[delim] = (max(scores), consistency) + + if delimiter_scores: + # Choose delimiter with highest count and consistency + best_delim = max(delimiter_scores, + key=lambda x: (delimiter_scores[x][1], delimiter_scores[x][0])) + result["detected_delimiter"] = best_delim + + # Parse CSV and extract sample data + if result["detected_delimiter"]: + # Re-read file from beginning for CSV parsing + zip_file.seek(0) # Reset zip file position + with zip_file.open(metadata_file) as csv_data: + text_data = csv_data.read().decode(detected_encoding, errors='replace') + lines = text_data.split('\n') + + # Parse with detected delimiter + csv_reader = csv.DictReader( + lines, + delimiter=result["detected_delimiter"] + ) + + # Get column names + if csv_reader.fieldnames: + result["columns"] = [ + {"key": col.strip(), "label": col.strip()} + for col in csv_reader.fieldnames if col + ] + + # Get sample rows (first 5) + sample_rows = [] + row_count = 0 + + for row in csv_reader: + row_count += 1 + if len(sample_rows) < 5: + # Clean up row data + clean_row = {} + for key, value in row.items(): + if key: # Skip empty keys + clean_row[key.strip()] = str(value).strip() if value else "" + if clean_row: # Only add non-empty rows + sample_rows.append(clean_row) + + result["sample_rows"] = sample_rows + result["total_rows"] = row_count + + except Exception as e: + result["error"] = f"Could not parse metadata file: {str(e)}" + + return jsonify(result), 200 + + except Exception as e: + return jsonify({ + "error": f"Preview failed: {str(e)}" + }), 500 @api.route("/files//convert", methods=["POST"]) def convert_ecotaxa_format(file_id): """ - Mock endpoint for EcoTaxa format conversion. - Creates a mock background job for frontend testing. + Start EcoTaxa format conversion background job for uploaded archive. """ - data = request.get_json() or {} + from urllib.parse import unquote + from morphocluster.background import convert_ecotaxa_job - # Mock job creation - job_id = str(uuid.uuid4()) + filename = unquote(file_id) + parameters = request.get_json() or {} - result = { - "job_id": job_id, - "status": "started", - "message": "EcoTaxa conversion job started", - "parameters": data - } + try: + # Queue the background job + job = convert_ecotaxa_job.queue(filename, parameters) + + # Initialize job metadata + job.meta['status'] = 'queued' + job.meta['progress'] = 0 + job.meta['current_step'] = 'Waiting in queue...' + job.meta['created_at'] = datetime.now().isoformat() + job.meta['job_type'] = 'format_conversion' + job.meta['archive_name'] = filename + job.meta['parameters'] = parameters + job.save_meta() + + result = { + "job_id": job.id, + "status": "queued", + "message": "EcoTaxa conversion job queued", + "parameters": parameters + } - return jsonify(result), 202 + return jsonify(result), 202 + + except Exception as e: + return jsonify({ + "error": f"Failed to queue EcoTaxa conversion job: {str(e)}" + }), 500 @api.route("/files//extract", methods=["POST"]) def extract_features(file_id): """ - Mock endpoint for feature extraction. - Creates a mock background job for frontend testing. + Start feature extraction background job for uploaded archive. 
""" - data = request.get_json() or {} + from urllib.parse import unquote + from morphocluster.background import extract_features_job - # Mock job creation - job_id = str(uuid.uuid4()) + filename = unquote(file_id) + parameters = request.get_json() or {} - result = { - "job_id": job_id, - "status": "started", - "message": "Feature extraction job started", - "parameters": data - } + try: + # Queue the background job + job = extract_features_job.queue(filename, parameters) + + # Initialize job metadata + job.meta['status'] = 'queued' + job.meta['progress'] = 0 + job.meta['current_step'] = 'Waiting in queue...' + job.meta['created_at'] = datetime.now().isoformat() + job.meta['job_type'] = 'feature_extraction' + job.meta['archive_name'] = filename + job.meta['parameters'] = parameters + job.save_meta() + + result = { + "job_id": job.id, + "status": "queued", + "message": "Feature extraction job queued", + "parameters": parameters + } + + return jsonify(result), 202 + + except Exception as e: + return jsonify({ + "error": f"Failed to queue feature extraction job: {str(e)}" + }), 500 + + +@api.route("/files//cluster", methods=["POST"]) +def create_clustering_project(file_id): + """ + Start initial clustering background job to create a new MorphoCluster project. + """ + from urllib.parse import unquote + from morphocluster.background import initial_clustering_job + + filename = unquote(file_id) + parameters = request.get_json() or {} + + # Extract feature file from parameters or construct default name + feature_file = parameters.get('feature_file') + if not feature_file: + # Construct feature file name based on archive name + archive_stem = pathlib.Path(filename).stem + feature_file = f"{archive_stem}_features.h5" + + try: + # Queue the background job + job = initial_clustering_job.queue(filename, feature_file, parameters) + + # Initialize job metadata + job.meta['status'] = 'queued' + job.meta['progress'] = 0 + job.meta['current_step'] = 'Waiting in queue...' + job.meta['created_at'] = datetime.now().isoformat() + job.meta['job_type'] = 'initial_clustering' + job.meta['archive_name'] = filename + job.meta['feature_file'] = feature_file + job.meta['parameters'] = parameters + job.save_meta() + + result = { + "job_id": job.id, + "status": "queued", + "message": "Initial clustering job queued", + "parameters": parameters, + "feature_file": feature_file + } + + return jsonify(result), 202 - return jsonify(result), 202 + except Exception as e: + return jsonify({ + "error": f"Failed to queue initial clustering job: {str(e)}" + }), 500 @api.route("/jobs/user", methods=["GET"]) def get_user_jobs(): """ - Mock endpoint for getting user jobs. - Returns mock job data for frontend testing. + Get all jobs from the RQ queue. + Returns jobs with status, progress, and metadata. 
""" - # Mock jobs with different statuses - jobs = [ - { - "id": "job_001", - "job_type": "format_conversion", - "status": "completed", - "progress": 100, - "created_at": "2024-01-15T10:30:00Z", - "completed_at": "2024-01-15T10:32:15Z", - "parameters": { - "archive_name": "sample_ecotaxa.zip", - "encoding": "utf-8", - "delimiter": "\t" - }, - "result_url": "/files/converted_sample" - }, - { - "id": "job_002", - "job_type": "feature_extraction", - "status": "running", - "progress": 45, - "created_at": "2024-01-15T11:00:00Z", - "current_step": "Processing batch 450/1000", - "eta": 300, - "parameters": { - "archive_name": "marine_plankton.zip", - "model": "resnet50", - "batch_size": 512 - }, - "logs": [ - { - "timestamp": "2024-01-15T11:00:00Z", - "level": "info", - "message": "Starting feature extraction..." - }, - { - "timestamp": "2024-01-15T11:05:30Z", - "level": "info", - "message": "Processed 200 images" - }, - { - "timestamp": "2024-01-15T11:10:15Z", - "level": "info", - "message": "Processed 450 images" - } - ] - }, - { - "id": "job_003", - "job_type": "initial_clustering", - "status": "failed", - "progress": 25, - "created_at": "2024-01-15T09:15:00Z", - "failed_at": "2024-01-15T09:45:30Z", - "error_message": "Insufficient memory for clustering. Try reducing batch size.", - "parameters": { - "min_cluster_size": 128, - "method": "EOM" - } + try: + from rq import Queue + from morphocluster.extensions import rq + + queue = rq.get_queue() + all_jobs = [] + + # Get jobs from different registries + try: + # Active/queued jobs + for job in queue.jobs: + job_data = _format_job_data(job) + if job_data: + all_jobs.append(job_data) + + # Recently finished jobs + finished_registry = queue.finished_job_registry + for job_id in finished_registry.get_job_ids(0, 20): + job = queue.fetch_job(job_id) + if job: + job_data = _format_job_data(job) + if job_data: + all_jobs.append(job_data) + + # Failed jobs + failed_registry = queue.failed_job_registry + for job_id in failed_registry.get_job_ids(0, 20): + job = queue.fetch_job(job_id) + if job: + job_data = _format_job_data(job) + if job_data: + all_jobs.append(job_data) + + except Exception as e: + print(f"Error fetching jobs: {e}") + + # Sort by creation time (newest first) + all_jobs.sort(key=lambda x: x.get('created_at', ''), reverse=True) + + return jsonify(all_jobs), 200 + + except Exception as e: + print(f"Error in get_user_jobs: {e}") + return jsonify([]), 200 + + +def _format_job_data(job): + """Format RQ job data for frontend consumption.""" + try: + if not job: + return None + + # Determine job status + if job.is_queued: + status = 'queued' + elif job.is_started: + status = job.meta.get('status', 'running') + elif job.is_finished: + status = job.meta.get('status', 'completed') + elif job.is_failed: + status = 'failed' + else: + status = 'unknown' + + job_data = { + "id": job.id, + "job_type": job.meta.get('job_type', 'unknown'), + "status": status, + "progress": job.meta.get('progress', 0), + "created_at": job.meta.get('created_at'), + "current_step": job.meta.get('current_step'), + "parameters": job.meta.get('parameters', {}), + "archive_name": job.meta.get('archive_name') } - ] - return jsonify(jobs), 200 + # Add completion/failure details + if job.meta.get('completed_at'): + job_data['completed_at'] = job.meta['completed_at'] + job_data['result'] = job.meta.get('result') + + if job.meta.get('failed_at'): + job_data['failed_at'] = job.meta['failed_at'] + job_data['error_message'] = job.meta.get('error_message') + + # Add timing info + if 
job.started_at: + job_data['started_at'] = job.started_at.isoformat() + if job.ended_at: + job_data['ended_at'] = job.ended_at.isoformat() + + return job_data + + except Exception as e: + print(f"Error formatting job {job.id if job else 'None'}: {e}") + return None @api.route("/jobs//status", methods=["GET"]) diff --git a/morphocluster/background.py b/morphocluster/background.py index a212510..675f354 100644 --- a/morphocluster/background.py +++ b/morphocluster/background.py @@ -1,12 +1,17 @@ import datetime as dt import os +import zipfile +import csv +import time +from pathlib import Path import flask_rq2 from flask import current_app as app from morphocluster.extensions import database, rq from morphocluster.processing.recluster import Recluster -from morphocluster.processing.tree import Tree +from morphocluster.processing.tree import Tree as ProcessingTree +from morphocluster.tree import Tree def validate_background_job(fun): @@ -97,3 +102,509 @@ def recluster_project(project_id, min_cluster_size): print("Project ID: {}".format(project_id)) print("Done.") + + +# =============================================================================== +# Upload Pipeline Background Jobs +# =============================================================================== + +@rq.job(timeout=3600) # 1 hour timeout +def extract_features_job(filename, parameters=None): + """ + Background job for extracting features from uploaded archive using MorphoCluster's real feature extraction. + """ + print(f"Starting feature extraction for {filename}") + + # Get current job for progress updates + from rq import get_current_job + from morphocluster.processing.extract_features import extract_features + import zipfile + + job = get_current_job() + + if parameters is None: + parameters = {} + + # Create application context for Flask app access + from morphocluster import create_app + app_instance = create_app() + with app_instance.app_context(): + try: + files_dir = Path(app_instance.config["FILES_DIR"]) + archive_path = files_dir / filename + + if not archive_path.exists(): + raise FileNotFoundError(f"Archive {filename} not found") + + # Create features output filename + features_filename = f"{archive_path.stem}_features.h5" + features_path = archive_path.parent / features_filename + + # Step 1: Validate archive + job.meta['status'] = 'validating' + job.meta['progress'] = 5 + job.meta['current_step'] = 'Validating archive structure...' + job.save_meta() + + # Check if archive has index.csv + with zipfile.ZipFile(archive_path, 'r') as zip_file: + file_list = zip_file.namelist() + print(f"Archive contents: {file_list[:10]}...") # Show first 10 files for debugging + + if 'index.csv' not in file_list: + # Check if this is an unconverted EcoTaxa file - suggest conversion + ecotaxa_files = [f for f in file_list if f.startswith('ecotaxa_') and f.endswith('.tsv')] + if ecotaxa_files: + raise ValueError(f"Archive appears to be in EcoTaxa format (found {ecotaxa_files[0]}). Please convert it first.") + else: + raise ValueError(f"Archive must contain index.csv file. Found files: {', '.join(file_list[:5])}") + + image_files = [f for f in file_list if f.lower().endswith(('.jpg', '.jpeg', '.png', '.tiff', '.tif'))] + total_images = len(image_files) + + print(f"Archive validation passed. Found {total_images} images") + + # Step 2: Setup parameters + job.meta['progress'] = 10 + job.meta['current_step'] = 'Setting up feature extraction parameters...' 
+ job.save_meta() + + # Extract parameters with defaults + normalize = parameters.get('normalize', True) + batch_size = parameters.get('batch_size', 512) + model_file = parameters.get('model_file', None) + + # Set default model file if not specified + if model_file is None: + model_file = '/code/data/model_state.pth' + + # Parse input_mean and input_std - handle both string and list formats + def parse_mean_std(value, default): + if isinstance(value, str): + if value.strip(): + return tuple(map(float, value.split(','))) + else: + return default + elif isinstance(value, (list, tuple)): + return tuple(value) + else: + return default + + input_mean = parse_mean_std(parameters.get('input_mean'), (0, 0, 0)) + input_std = parse_mean_std(parameters.get('input_std'), (1, 1, 1)) + + print(f"Using parameters: normalize={normalize}, batch_size={batch_size}, model_file={model_file}") + print(f"Input normalization: mean={input_mean}, std={input_std}") + + # Step 3: Start feature extraction + job.meta['progress'] = 15 + job.meta['current_step'] = 'Starting feature extraction (this may take several minutes)...' + job.meta['total_images'] = total_images + job.save_meta() + + # Run MorphoCluster's real feature extraction + extract_features( + archive_fn=str(archive_path), + features_fn=str(features_path), + parameters_fn=model_file, # None for pretrained ImageNet + normalize=normalize, + batch_size=batch_size, + cuda=True, # Use GPU if available + input_mean=input_mean, + input_std=input_std + ) + + # Step 4: Complete + job.meta['status'] = 'completed' + job.meta['progress'] = 100 + job.meta['current_step'] = 'Feature extraction completed' + job.meta['completed_at'] = dt.datetime.now().isoformat() + + # Create result with actual feature file info + result = { + 'feature_file': features_filename, + 'feature_path': str(features_path), + 'total_images': total_images, + 'feature_dimensions': 32, # ResNet18 with 32-dim bottleneck + 'model_used': f'ResNet18 with 32-dim bottleneck: {model_file}', + 'normalize': normalize, + 'batch_size': batch_size + } + + job.meta['result'] = result + job.save_meta() + + print(f"Feature extraction completed for {filename}") + print(f"Features saved to: {features_path}") + return result + + except Exception as e: + print(f"Feature extraction failed: {str(e)}") + job.meta['status'] = 'failed' + job.meta['error_message'] = str(e) + job.meta['failed_at'] = dt.datetime.now().isoformat() + job.save_meta() + raise + + +@rq.job(timeout=1800) # 30 minutes timeout +def convert_ecotaxa_job(filename, parameters=None): + """ + Background job for converting EcoTaxa format to standard format. + Uses MorphoCluster's existing fix_ecotaxa functionality. + """ + print(f"Starting EcoTaxa conversion for {filename}") + + from rq import get_current_job + import shutil + + job = get_current_job() + + if parameters is None: + parameters = {} + + # Create application context for Flask app access + from morphocluster import create_app + app_instance = create_app() + with app_instance.app_context(): + try: + archive_path = Path(app_instance.config["FILES_DIR"]) / filename + + if not archive_path.exists(): + raise FileNotFoundError(f"Archive {filename} not found") + + # Step 1: Analyze parameters + job.meta['status'] = 'analyzing' + job.meta['progress'] = 10 + job.meta['current_step'] = 'Analyzing EcoTaxa format and parameters...' 
+ job.save_meta() + + encoding = parameters.get('encoding') + delimiter = parameters.get('delimiter') + force = parameters.get('force', False) + + # Step 2: Create working copy for conversion + job.meta['progress'] = 20 + job.meta['current_step'] = 'Creating working copy...' + job.save_meta() + + # Create a copy to work on (fix_ecotaxa modifies in place) + work_path = archive_path.with_suffix('.converting.zip') + shutil.copy2(archive_path, work_path) + + # Step 3: Run EcoTaxa conversion using existing MorphoCluster function + job.meta['progress'] = 40 + job.meta['current_step'] = 'Converting EcoTaxa format to standard format...' + job.save_meta() + + try: + # Call fix_ecotaxa function directly (it's a Click command) + from click.testing import CliRunner + from morphocluster.scripts import fix_ecotaxa + + runner = CliRunner() + args = [str(work_path)] + if encoding: + args.extend(['--encoding', encoding]) + if delimiter: + args.extend(['--delimiter', delimiter]) + if force: + args.append('--force') + + result = runner.invoke(fix_ecotaxa, args) + if result.exit_code != 0: + raise RuntimeError(f"EcoTaxa conversion failed: {result.output}") + except Exception as conversion_error: + # Clean up working file + if work_path.exists(): + work_path.unlink() + raise conversion_error + + # Step 4: Validate conversion result + job.meta['progress'] = 80 + job.meta['current_step'] = 'Validating converted archive...' + job.save_meta() + + # Check that index.csv was created + import zipfile + with zipfile.ZipFile(work_path, 'r') as zf: + if 'index.csv' not in zf.namelist(): + raise ValueError("Conversion failed: index.csv not created") + + # Step 5: Replace original with converted version + job.meta['progress'] = 95 + job.meta['current_step'] = 'Finalizing converted archive...' + job.save_meta() + + # Move converted file to final location + converted_path = archive_path.with_name(f"{archive_path.stem}_converted{archive_path.suffix}") + work_path.rename(converted_path) + + # Complete + job.meta['status'] = 'completed' + job.meta['progress'] = 100 + job.meta['current_step'] = 'EcoTaxa conversion completed' + job.meta['completed_at'] = dt.datetime.now().isoformat() + job.meta['result'] = { + 'converted_file': converted_path.name, + 'original_file': filename, + 'encoding': encoding, + 'delimiter': delimiter, + 'conversion_method': 'morphocluster.scripts.fix_ecotaxa' + } + job.save_meta() + + print(f"EcoTaxa conversion completed: {filename} -> {converted_path.name}") + return job.meta['result'] + + except Exception as e: + print(f"EcoTaxa conversion failed: {str(e)}") + job.meta['status'] = 'failed' + job.meta['error_message'] = str(e) + job.meta['failed_at'] = dt.datetime.now().isoformat() + job.save_meta() + raise + + +@rq.job(timeout=7200) # 2 hours timeout +def initial_clustering_job(archive_name, feature_file, parameters=None): + """ + Background job for initial clustering to create a new MorphoCluster project. 
+ """ + print(f"Starting initial clustering for {archive_name}") + + from rq import get_current_job + + job = get_current_job() + + if parameters is None: + parameters = {} + + # Create application context for Flask app access + from morphocluster import create_app + app_instance = create_app() + with app_instance.app_context(): + try: + files_dir = Path(app_instance.config["FILES_DIR"]) + archive_path = files_dir / archive_name + feature_path = files_dir / feature_file + + if not archive_path.exists(): + raise FileNotFoundError(f"Archive {archive_name} not found") + if not feature_path.exists(): + raise FileNotFoundError(f"Feature file {feature_file} not found") + + # Step 1: Setup parameters + job.meta['status'] = 'setting_up' + job.meta['progress'] = 10 + job.meta['current_step'] = 'Setting up clustering parameters...' + job.save_meta() + + # Extract parameters with defaults + project_name = parameters.get('project_name', f"Project-{archive_path.stem}") + description = parameters.get('description', '') + min_cluster_size = parameters.get('min_cluster_size', 128) + min_samples = parameters.get('min_samples', 1) + cluster_selection_method = parameters.get('cluster_selection_method', 'leaf') + sample_size = parameters.get('sample_size', 0) # 0 = use all + keep_unexplored_ratio = parameters.get('keep_unexplored_ratio', 0.0) + + print(f"Clustering parameters: min_cluster_size={min_cluster_size}, method={cluster_selection_method}") + + # Step 2: Extract images from archive + job.meta['progress'] = 15 + job.meta['current_step'] = 'Extracting images from archive...' + job.save_meta() + + import zipfile + import pandas as pd + import h5py + import shutil + from morphocluster import models + + # Create images directory for this archive + images_dir = Path(app_instance.config["IMAGES_DIR"]) + archive_images_dir = images_dir / archive_path.stem + archive_images_dir.mkdir(parents=True, exist_ok=True) + + # Read index.csv from archive to get object_id and path mappings + with zipfile.ZipFile(archive_path, 'r') as zf: + with zf.open('index.csv') as fp: + archive_df = pd.read_csv(fp, dtype=str, usecols=["object_id", "path"]) + + # Extract image files + print(f"Extracting {len(archive_df)} images to {archive_images_dir}") + for _, row in archive_df.iterrows(): + image_path = row['path'] + if image_path in zf.namelist(): + # Extract to the archive-specific directory + extracted_path = zf.extract(image_path, archive_images_dir) + + # Move to flat structure if needed (some archives have subdirectories) + final_path = archive_images_dir / Path(image_path).name + if Path(extracted_path) != final_path: + shutil.move(extracted_path, final_path) + + # Step 3: Load objects from archive into database + job.meta['progress'] = 25 + job.meta['current_step'] = 'Loading objects into database...' 
+ job.save_meta() + + # Load feature vectors from H5 file + with h5py.File(feature_path, 'r') as h5f: + feature_object_ids = h5f['object_id'][:] + features = h5f['features'][:] + + # Convert bytes to strings if necessary + if hasattr(feature_object_ids[0], 'decode'): + feature_object_ids = [oid.decode('utf-8') for oid in feature_object_ids] + else: + feature_object_ids = list(feature_object_ids) + + feature_dims = features.shape[1] if len(features.shape) > 1 else len(features[0]) if len(features) > 0 else 0 + print(f"Archive contains {len(archive_df)} objects, features for {len(feature_object_ids)} objects") + print(f"Feature dimensions: {feature_dims}") + + # Step 3: Insert objects into database with vectors + job.meta['progress'] = 30 + job.meta['current_step'] = 'Inserting objects into database...' + job.save_meta() + + # Create object data for database insertion + object_data = [] + feature_dict = dict(zip(feature_object_ids, features)) + + for _, row in archive_df.iterrows(): + object_id = row['object_id'] + original_path = row['path'] + # Update path to point to extracted image in archive subdirectory + extracted_path = f"{archive_path.stem}/{Path(original_path).name}" + vector = feature_dict.get(object_id) + + if vector is not None: + object_data.append({ + 'object_id': object_id, + 'path': extracted_path, # Path relative to IMAGES_DIR + 'vector': vector # Keep as numpy array - should be 32 dimensions now + }) + + # Insert objects into database + with database.engine.connect() as conn: + with conn.begin(): + # Check if objects already exist to avoid duplicates + existing_objects = conn.execute( + models.objects.select().where( + models.objects.c.object_id.in_([obj['object_id'] for obj in object_data]) + ) + ).fetchall() + existing_object_ids = {obj.object_id for obj in existing_objects} + + # Only insert new objects + new_objects = [obj for obj in object_data if obj['object_id'] not in existing_object_ids] + + if new_objects: + print(f"Inserting {len(new_objects)} new objects into database") + conn.execute(models.objects.insert(), new_objects) + else: + print("All objects already exist in database") + + # Step 4: Initialize clustering + job.meta['progress'] = 40 + job.meta['current_step'] = 'Initializing clustering algorithm...' + job.save_meta() + + recluster = Recluster() + + # Step 5: Load features + job.meta['progress'] = 50 + job.meta['current_step'] = 'Loading extracted features...' + job.save_meta() + + recluster.load_features(str(feature_path)) + + # Step 6: Skip init_tree() - let clustering create the tree structure + job.meta['progress'] = 60 + job.meta['current_step'] = 'Preparing clustering...' + job.save_meta() + + # Note: Not calling recluster.init_tree() - this was interfering with clustering + + # Step 7: Run clustering + job.meta['progress'] = 70 + job.meta['current_step'] = 'Running HDBSCAN clustering (this may take several minutes)...' + job.save_meta() + + # Apply sample size and keep_unexplored_ratio if specified + cluster_kwargs = { + 'min_cluster_size': min_cluster_size, + 'min_samples': min_samples, + 'cluster_selection_method': cluster_selection_method, + } + + if sample_size > 0: + cluster_kwargs['sample_size'] = sample_size + print(f"Using sample size: {sample_size}") + + if keep_unexplored_ratio > 0: + cluster_kwargs['keep_unexplored'] = keep_unexplored_ratio + + recluster.cluster(**cluster_kwargs) + + # Step 8: Get the clustered tree + job.meta['progress'] = 80 + job.meta['current_step'] = 'Building project tree structure...' 
+ job.save_meta() + + # Get the first (and only) tree from recluster + tree = recluster.trees[0] + + # Step 9: Load into database + job.meta['progress'] = 90 + job.meta['current_step'] = 'Creating project in database...' + job.save_meta() + + with database.engine.connect() as conn: + db_tree = Tree(conn) + + with conn.begin(): + project_id = db_tree.load_project(project_name, tree) + root_id = db_tree.get_root_id(project_id) + + print("Consolidating tree structure...") + db_tree.consolidate_node(root_id) + + # Step 10: Complete + job.meta['status'] = 'completed' + job.meta['progress'] = 100 + job.meta['current_step'] = 'Project created successfully' + job.meta['completed_at'] = dt.datetime.now().isoformat() + + # Get final statistics + cluster_count = len(tree.nodes) # Number of nodes/clusters + object_count = len(tree.objects) # Number of objects + + result = { + 'project_id': project_id, + 'project_name': project_name, + 'root_id': root_id, + 'cluster_count': cluster_count, + 'object_count': object_count, + 'min_cluster_size': min_cluster_size, + 'cluster_selection_method': cluster_selection_method, + 'project_url': f'/projects/{project_id}' + } + + job.meta['result'] = result + job.save_meta() + + print(f"Initial clustering completed for {archive_name}") + print(f"Created project '{project_name}' with {cluster_count} clusters and {object_count} objects") + return result + + except Exception as e: + print(f"Initial clustering failed: {str(e)}") + job.meta['status'] = 'failed' + job.meta['error_message'] = str(e) + job.meta['failed_at'] = dt.datetime.now().isoformat() + job.save_meta() + raise diff --git a/morphocluster/frontend/src/components/ClusterModal.vue b/morphocluster/frontend/src/components/ClusterModal.vue new file mode 100644 index 0000000..3ccb84d --- /dev/null +++ b/morphocluster/frontend/src/components/ClusterModal.vue @@ -0,0 +1,360 @@ + + + + + \ No newline at end of file diff --git a/morphocluster/frontend/src/components/FeatureModal.vue b/morphocluster/frontend/src/components/FeatureModal.vue index 1cd0cce..9813d2c 100644 --- a/morphocluster/frontend/src/components/FeatureModal.vue +++ b/morphocluster/frontend/src/components/FeatureModal.vue @@ -273,25 +273,19 @@ export default { showAdvanced: false, customModelFile: null, parameters: { - model: 'resnet50', + model: 'resnet18', custom_architecture: '', batch_size: 512, normalize: true, device: 'auto', - input_mean: '', - input_std: '', + input_mean: '0.485,0.456,0.406', + input_std: '0.229,0.224,0.225', image_size: 224, num_workers: 0, output_format: 'hdf5' }, modelOptions: [ - { value: 'resnet50', text: 'ResNet-50 (ImageNet)' }, - { value: 'resnet101', text: 'ResNet-101 (ImageNet)' }, - { value: 'vgg16', text: 'VGG-16 (ImageNet)' }, - { value: 'vgg19', text: 'VGG-19 (ImageNet)' }, - { value: 'densenet121', text: 'DenseNet-121 (ImageNet)' }, - { value: 'mobilenet_v2', text: 'MobileNet V2 (ImageNet)' }, - { value: 'efficientnet_b0', text: 'EfficientNet B0 (ImageNet)' }, + { value: 'resnet18', text: 'ResNet-18 (ImageNet) - Default' }, { value: 'custom', text: 'Upload Custom Model...' 
} ], architectureOptions: [ diff --git a/morphocluster/frontend/src/components/JobStatus.vue b/morphocluster/frontend/src/components/JobStatus.vue index fbd8150..22714a7 100644 --- a/morphocluster/frontend/src/components/JobStatus.vue +++ b/morphocluster/frontend/src/components/JobStatus.vue @@ -10,10 +10,11 @@ v-for="job in jobs" :key="job.id" class="job-item" - :class="{ + :class="{ 'job-completed': job.status === 'completed', 'job-failed': job.status === 'failed', - 'job-running': job.status === 'running' + 'job-running': job.status === 'running', + 'job-queued': job.status === 'queued' }" >
@@ -38,7 +39,7 @@
             variant="outline-secondary"
             @click="removeJob(job.id)"
           >
-
+            ×
@@ -141,7 +142,8 @@ export default { jobs: [], showLogs: false, refreshTimer: null, - isLoading: false + isLoading: false, + removedJobIds: new Set() }; }, computed: { @@ -150,6 +152,7 @@ export default { } }, async mounted() { + this.loadRemovedJobIds(); await this.fetchJobs(); if (this.autoRefresh) { this.startRefresh(); @@ -159,14 +162,36 @@ export default { this.stopRefresh(); }, methods: { + loadRemovedJobIds() { + try { + const stored = localStorage.getItem('removedJobIds'); + if (stored) { + this.removedJobIds = new Set(JSON.parse(stored)); + } + } catch (error) { + console.error('Failed to load removed job IDs:', error); + this.removedJobIds = new Set(); + } + }, + + saveRemovedJobIds() { + try { + localStorage.setItem('removedJobIds', JSON.stringify([...this.removedJobIds])); + } catch (error) { + console.error('Failed to save removed job IDs:', error); + } + }, async fetchJobs() { if (this.isLoading) return; this.isLoading = true; try { const response = await this.$axios.get('/api/jobs/user'); - const newJobs = response.data; - + const allJobs = response.data; + + // Filter out manually removed jobs + const newJobs = allJobs.filter(job => !this.removedJobIds.has(job.id)); + // Check for status changes this.jobs.forEach(oldJob => { const newJob = newJobs.find(j => j.id === oldJob.id); @@ -178,7 +203,17 @@ export default { } } }); - + + // Also check for newly completed jobs that weren't in the old list + newJobs.forEach(newJob => { + const oldJob = this.jobs.find(j => j.id === newJob.id); + if (!oldJob && newJob.status === 'completed') { + this.$emit('job-completed', newJob); + } else if (!oldJob && newJob.status === 'failed') { + this.$emit('job-failed', newJob); + } + }); + this.jobs = newJobs; } catch (error) { console.error('Failed to fetch jobs:', error); @@ -202,6 +237,11 @@ export default { }, removeJob(jobId) { + // Add to removed set so it doesn't reappear + this.removedJobIds.add(jobId); + this.saveRemovedJobIds(); + + // Remove from current jobs array const index = this.jobs.findIndex(j => j.id === jobId); if (index !== -1) { this.jobs.splice(index, 1); @@ -209,6 +249,15 @@ export default { }, clearCompletedJobs() { + // Add completed/failed jobs to removed set + this.jobs.forEach(job => { + if (['completed', 'failed'].includes(job.status)) { + this.removedJobIds.add(job.id); + } + }); + this.saveRemovedJobIds(); + + // Filter out completed/failed jobs this.jobs = this.jobs.filter(job => !['completed', 'failed'].includes(job.status)); }, @@ -250,7 +299,7 @@ export default { getJobDetails(job) { if (job.job_type === 'format_conversion') { - return `Archive: ${job.parameters?.archive_name || 'Unknown'}`; + return `Archive: ${job.archive_name || job.parameters?.archive_name || 'Unknown'}`; } else if (job.job_type === 'feature_extraction') { return `Model: ${job.parameters?.model || 'ImageNet'}, Batch: ${job.parameters?.batch_size || 512}`; } else if (job.job_type === 'initial_clustering' || job.job_type === 'reclustering') { @@ -262,6 +311,7 @@ export default { getStatusIcon(status) { const icons = { 'pending': 'mdi mdi-clock-outline text-warning', + 'queued': 'mdi mdi-clock-outline text-info', 'running': 'mdi mdi-loading mdi-spin text-primary', 'completed': 'mdi mdi-check-circle text-success', 'failed': 'mdi mdi-alert-circle text-danger', @@ -273,6 +323,7 @@ export default { getStatusText(status) { const texts = { 'pending': 'Pending', + 'queued': 'Queued', 'running': 'Running', 'completed': 'Completed', 'failed': 'Failed', @@ -308,6 +359,8 @@ export default { border: 1px 
solid #dee2e6; border-radius: 8px; background: white; + max-height: 600px; + overflow-y: auto; } .no-jobs { @@ -345,6 +398,11 @@ export default { background-color: #f8f9ff; } +.job-item.job-queued { + border-left: 4px solid #17a2b8; + background-color: #f0f9ff; +} + .job-header { display: flex; justify-content: space-between; diff --git a/morphocluster/frontend/src/components/UploadZone.vue b/morphocluster/frontend/src/components/UploadZone.vue index 0cc327f..10671b0 100644 --- a/morphocluster/frontend/src/components/UploadZone.vue +++ b/morphocluster/frontend/src/components/UploadZone.vue @@ -220,6 +220,7 @@ export default { this.$emit('upload-start', files); try { + console.log('UploadZone: Starting axios post to', this.uploadUrl); const response = await axios.post(this.uploadUrl, formData, { headers: { 'Content-Type': 'multipart/form-data', @@ -229,22 +230,29 @@ export default { this.updateProgress(progressEvent); }, }); - + + console.log('UploadZone: Axios post completed, response:', response); + this.uploadedFiles = files.map(file => ({ name: file.name, size: file.size, type: file.type })); - + + console.log('UploadZone: Set uploadedFiles:', this.uploadedFiles); + this.uploadComplete = true; this.isUploading = false; - + + console.log('UploadZone: About to emit upload-complete event'); this.$emit('upload-complete', { files: this.uploadedFiles, response: response.data }); + console.log('UploadZone: Emitted upload-complete event'); } catch (error) { + console.error('UploadZone: Error during upload:', error); this.isUploading = false; if (axios.isCancel(error)) { diff --git a/morphocluster/frontend/src/main.js b/morphocluster/frontend/src/main.js index 9061aac..4ac7433 100644 --- a/morphocluster/frontend/src/main.js +++ b/morphocluster/frontend/src/main.js @@ -1,6 +1,7 @@ import { createApp } from 'vue' import App from './App.vue' import router from './router' +import axios from 'axios' // Bootstrap Vue 3 import BootstrapVueNext from 'bootstrap-vue-next' @@ -12,6 +13,9 @@ import './assets/styles.css' const app = createApp(App) +// Configure axios +app.config.globalProperties.$axios = axios + app.use(router) app.use(BootstrapVueNext) diff --git a/morphocluster/frontend/src/views/Approve.vue b/morphocluster/frontend/src/views/Approve.vue index 5d313ec..776b77e 100644 --- a/morphocluster/frontend/src/views/Approve.vue +++ b/morphocluster/frontend/src/views/Approve.vue @@ -281,6 +281,14 @@ export default { // Should members_url be updated (with unique id etc.) on response? var updateMembersUrl = false; + // Guard against null node + if (!this.node) { + if ($state && $state.complete) { + $state.complete(); + } + return; + } + if (!this.members_url) { const nodes = this.node.children; this.members_url = `/api/nodes/${ @@ -402,6 +410,12 @@ export default { moveupMember(member) { console.log("Remove", this.getUniqueId(member)); + // Guard against null node + if (!this.node || !this.node.parent_id) { + console.error("Cannot move member: node or parent_id is null"); + return; + } + // TODO: Also reject members. 
api.nodeAdoptMembers(this.node.parent_id, [member]) .then(() => { diff --git a/morphocluster/frontend/src/views/Project.vue b/morphocluster/frontend/src/views/Project.vue index 98952e7..9660b58 100644 --- a/morphocluster/frontend/src/views/Project.vue +++ b/morphocluster/frontend/src/views/Project.vue @@ -7,7 +7,7 @@ - + + diff --git a/morphocluster/frontend/src/views/Upload.vue b/morphocluster/frontend/src/views/Upload.vue index f3c9ffc..1f09ca4 100644 --- a/morphocluster/frontend/src/views/Upload.vue +++ b/morphocluster/frontend/src/views/Upload.vue @@ -13,6 +13,9 @@ + @@ -49,12 +52,12 @@ v-for="archive in uploadedArchives" :key="archive.id" class="archive-item" - :class="{ 'needs-conversion': archive.needsConversion }" + :class="{ 'needs-conversion': archive.needs_conversion }" >
-            {{ archive.name }}
-            {{ formatBytes(archive.size) }}
+            {{ archive.original_filename || archive.filename || 'Unknown' }}
+            {{ formatBytes(archive.file_size) || 'Size unknown' }}
             {{ getArchiveStatusText(archive.status) }}
-            {{ archive.format }}
+            {{ getArchiveFormat(archive) }}
-
+
             This archive appears to be in EcoTaxa format and needs conversion.