From d62e6d1488a636510addfb786e095ae31d24b6bb Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 1 Apr 2026 10:36:28 -0400
Subject: [PATCH 01/61] fix: limit document text sent to LLM; rebuild participants.tsv

---
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 197 ++++++++++++++----
 .../utils/filenameTokenizer.ts                | 116 ++++++++++-
 .../DatasetOrganizer/utils/llmPrompts.ts      |   6 +-
 3 files changed, 265 insertions(+), 54 deletions(-)
diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index d9d6366..a8fd052 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -184,6 +184,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
       });
 
       setEvidenceBundle(bundle);
+      setSubjectAnalysis(null); // reset cached subject analysis when a new evidence bundle is set
       downloadJSON(bundle, "evidence_bundle.json");
       setStatus("✓ Evidence bundle generated and downloaded!");
     } catch (err: any) {
@@ -380,6 +381,43 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
         setStatus("3/3 Generating participants.tsv...");
         const partsPrompt = getParticipantsPrompt(userText);
 
+        // Compute subject analysis before the try block so it is in scope for both try and catch
+        const currentSubjectAnalysis = extractSubjectAnalysis(
+          evidenceBundle?.all_files || [],
+          evidenceBundle?.user_hints?.n_subjects,
+          evidenceBundle?.filename_analysis?.python_statistics
+            ?.dominant_prefixes
+        );
+
+        console.log("=== PARTICIPANTS DEBUG ===");
+        console.log("method:", currentSubjectAnalysis?.method);
+        console.log("subject_count:", currentSubjectAnalysis?.subject_count);
+        console.log(
+          "id_mapping:",
+          currentSubjectAnalysis?.id_mapping?.id_mapping
+        );
+        console.log(
+          "reverse_mapping:",
+          currentSubjectAnalysis?.id_mapping?.reverse_mapping
+        );
+        console.log(
+          "subject_records sample:",
+          currentSubjectAnalysis?.subject_records?.slice(0, 3)
+        );
+        const idMap = currentSubjectAnalysis?.id_mapping?.id_mapping;
+        const expectedCount = evidenceBundle?.user_hints?.n_subjects;
+        const subjectLabels: string[] =
+          idMap &&
+          Object.keys(idMap).length > 0 &&
+          (!expectedCount || Object.keys(idMap).length === expectedCount)
+            ? Object.values(idMap).map((id: string) => `sub-${id}`)
+            : Array.from(
+                {
+                  length: expectedCount || Object.keys(idMap || {}).length || 1,
+                },
+                (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
+              );
+
         let partsResponse;
         if (currentProvider.isAnthropic) {
           partsResponse = await fetch(currentProvider.baseUrl, {
@@ -435,52 +473,130 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
           : partsData.choices[0].message.content;
 
         // Build TSV from schema
+        // try {
+        //   const schemaText = participantsRaw
+        //     .replace(/^```json\n?/g, "")
+        //     .replace(/\n?```$/g, "")
+        //     .trim();
+        //   const schema = JSON.parse(schemaText);
+        //   const columns: string[] = schema.columns.map((c: any) => c.name);
+
+        //   // Get subject IDs from evidence bundle (extracted by Python-style analysis)
+        //   // const idMapping =
+        //   //   evidenceBundle?.subject_analysis?.id_mapping?.id_mapping;
+        //   // const subjectLabels: string[] = idMapping
+        //   //   ? Object.values(idMapping).map((id) => `sub-${id}`)
+        //   //   : ["sub-01"]; // fallback if no subject analysis
+        //   // Get subject IDs from subjectAnalysis state (computed at plan stage)
+        //   // Fall back to computing fresh if plan hasn't been run yet
+        //   const currentSubjectAnalysis =
+        //     subjectAnalysis ||
+        //     extractSubjectAnalysis(
+        //       evidenceBundle?.all_files || [],
+        //       evidenceBundle?.user_hints?.n_subjects,
+        //       evidenceBundle?.filename_analysis?.python_statistics
+        //         ?.dominant_prefixes
+        //     );
+        //   const idMap = currentSubjectAnalysis?.id_mapping?.id_mapping;
+        //   const subjectLabels: string[] =
+        //     idMap && Object.keys(idMap).length > 0
+        //       ? Object.values(idMap).map((id) => `sub-${id}`)
+        //       : Array.from(
+        //           { length: evidenceBundle?.user_hints?.n_subjects || 1 },
+        //           (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
+        //         );
+
+        //   const header = columns.join("\t");
+        //   // ====origin====
+        //   // const rows = subjectLabels.map((subId) =>
+        //   //   columns
+        //   //     .map((col: string) => (col === "participant_id" ? subId : "n/a"))
+        //   //     .join("\t")
+        //   // );
+        //   //====== end ======
+        //   // =====update start=====
+        //   const reverseMap =
+        //     currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
+        //   const subjectRecords = currentSubjectAnalysis?.subject_records || [];
+
+        //   const rows = subjectLabels.map((subId) => {
+        //     const bareId = subId.replace(/^sub-/, "");
+        //     const originalId = reverseMap[bareId];
+        //     const record = subjectRecords.find(
+        //       (r: any) => r.original_id === originalId
+        //     );
+        //     return columns
+        //       .map((col: string) => {
+        //         if (col === "participant_id") return subId;
+        //         if (col === "original_id") return originalId || "n/a";
+        //         if (col === "group") return (record as any)?.group || "n/a";
+        //         return "n/a";
+        //       })
+        //       .join("\t");
+        //   });
+        //   //====update end======
+        //   participantsContent = [header, ...rows].join("\n");
+        // } catch (e) {
+        //   // Fallback: LLM didn't return valid JSON schema, use raw content
+        //   participantsContent = participantsRaw
+        //     .replace(/^```\n?/g, "")
+        //     .replace(/\n?```$/g, "")
+        //     .trim();
+        // }
+        // Build TSV from schema + subject analysis
+        // Mirrors _generate_participants_tsv_from_python() in planner.py
         try {
           const schemaText = participantsRaw
             .replace(/^```json\n?/g, "")
             .replace(/\n?```$/g, "")
             .trim();
           const schema = JSON.parse(schemaText);
-          const columns: string[] = schema.columns.map((c: any) => c.name);
-
-          // Get subject IDs from evidence bundle (extracted by Python-style analysis)
-          // const idMapping =
-          //   evidenceBundle?.subject_analysis?.id_mapping?.id_mapping;
-          // const subjectLabels: string[] = idMapping
-          //   ? Object.values(idMapping).map((id) => `sub-${id}`)
-          //   : ["sub-01"]; // fallback if no subject analysis
-          // Get subject IDs from subjectAnalysis state (computed at plan stage)
-          // Fall back to computing fresh if plan hasn't been run yet
-          const currentSubjectAnalysis =
-            subjectAnalysis ||
-            extractSubjectAnalysis(
-              evidenceBundle?.all_files || [],
-              evidenceBundle?.user_hints?.n_subjects,
-              evidenceBundle?.filename_analysis?.python_statistics
-                ?.dominant_prefixes
+
+          // LLM decides extra demographic columns (sex, age, group etc.)
+          // but we always add participant_id and original_id ourselves
+          const extraColumns: string[] = schema.columns
+            .map((c: any) => c.name)
+            .filter(
+              (name: string) =>
+                name !== "participant_id" && name !== "original_id"
             );
-          const idMap = currentSubjectAnalysis?.id_mapping?.id_mapping;
-          const subjectLabels: string[] =
-            idMap && Object.keys(idMap).length > 0
-              ? Object.values(idMap).map((id) => `sub-${id}`)
-              : Array.from(
-                  { length: evidenceBundle?.user_hints?.n_subjects || 1 },
-                  (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
-                );
+
+          // Always start with participant_id and original_id
+          const columns = ["participant_id", "original_id", ...extraColumns];
+
+          const reverseMap =
+            currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
+          const subjectRecords = currentSubjectAnalysis?.subject_records || [];
 
           const header = columns.join("\t");
-          const rows = subjectLabels.map((subId) =>
-            columns
-              .map((col: string) => (col === "participant_id" ? subId : "n/a"))
-              .join("\t")
-          );
+          const rows = subjectLabels.map((subId) => {
+            const bareId = subId.replace(/^sub-/, "");
+            const originalId = reverseMap[bareId] || "n/a";
+            const record = subjectRecords.find(
+              (r: any) => r.original_id === originalId
+            );
+            return columns
+              .map((col: string) => {
+                if (col === "participant_id") return subId;
+                if (col === "original_id") return originalId;
+                if (col === "group") return (record as any)?.group || "n/a";
+                return "n/a";
+              })
+              .join("\t");
+          });
+
           participantsContent = [header, ...rows].join("\n");
         } catch (e) {
-          // Fallback: LLM didn't return valid JSON schema, use raw content
-          participantsContent = participantsRaw
-            .replace(/^```\n?/g, "")
-            .replace(/\n?```$/g, "")
-            .trim();
+          // Fallback: generate minimal TSV directly from subject analysis
+          const reverseMap =
+            currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
+          const header = "participant_id\toriginal_id";
+          const rows = subjectLabels.map((subId) => {
+            const bareId = subId.replace(/^sub-/, "");
+            const originalId = reverseMap[bareId] || "n/a";
+            return `${subId}\t${originalId}`;
+          });
+          participantsContent = [header, ...rows].join("\n");
         }
       }
       // ==========================================
@@ -632,11 +748,6 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
     const filePatterns = analyzeFilePatterns(files);
     const userContext = getUserContext(files);
     const annotations = getFileAnnotations(files);
-    // console.log("=== PROMPT BEING SENT TO LLM ===");
-    // console.log(fileSummary);
-    // console.log(filePatterns);
-    // console.log(userContext);
-    // console.log("=================================");
 
     // UPDATED: Improved prompt that uses trio files
     const prompt = getConversionScriptPrompt(
@@ -788,6 +899,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
       userNSubjects,
       dominantPrefixes
     );
+
     setSubjectAnalysis(computedSubjectAnalysis);
 
     const fileSummary = buildFileSummary(files);
@@ -801,11 +913,6 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
         .map((s: any) => `  - ${s.relpath}`)
         .join("\n") || "";
 
-    // console.log("=== SAMPLE FILES ===");
-    // console.log(sampleFiles);
-    // console.log("=== COUNTS BY EXT ===");
-    // console.log(evidenceBundle?.counts_by_ext);
-
     const prompt = getBIDSPlanPrompt(
       fileSummary,
       filePatterns,
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
index 1c1820b..4708c13 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
@@ -7,6 +7,7 @@ export interface SubjectRecord {
   site: string | null;
   pattern_name: string;
   file_count: number;
+  group?: string;
 }
 
 export interface SubjectAnalysis {
@@ -359,14 +360,52 @@ const extractNumericIdFromIdentifier = (identifier: string): string | null => {
 
 // ── Step 1: Directory structure patterns
 // Mirrors _extract_subjects_from_directory_structure() in planner.py
+const SKIP_DIRS = new Set([
+  "anat",
+  "func",
+  "dwi",
+  "fmap",
+  "nirs",
+  "meg",
+  "eeg",
+  "beh",
+  "perf",
+  "derivatives",
+  "sourcedata",
+  "stimuli",
+  "walking",
+  "resting",
+  "resting_state",
+  "run",
+  "ses",
+  "pd",
+  "control",
+  "hc",
+  "task",
+  "sub",
+  "dataset",
+  "data",
+  "raw",
+  "bids",
+  "output",
+  "outputs",
+  "staging",
+  "_staging",
+  "mri",
+  "fnirs",
+  "edf",
+  "dicom",
+]);
+
 const extractFromDirectoryStructure = (
   allFiles: string[]
 ): Omit<SubjectAnalysis, "id_mapping"> | null => {
   const patterns: Array<[RegExp, boolean, number, number | null, string]> = [
-    [/^([A-Za-z]+)_sub(\d+)$/i, true, 2, 1, "site_prefixed"],
-    [/^sub-(\w+)$/, false, 1, null, "standard_bids"], // directory named sub-01
-    [/^subject[_-]?(\d+)$/i, false, 1, null, "simple"],
-    [/^\d{3,}$/, false, 1, null, "numeric_only"], // directory named 001
+    [/^([A-Za-z]+)_sub(\d+)$/i, true, 2, 1, "site_prefixed"], // Beijing_sub82352
+    [/^sub-(\w+)$/, false, 1, null, "standard_bids"], // sub-01
+    [/^subject[_-]?(\d+)$/i, false, 1, null, "simple"], // subject_01
+    [/^\d{3,}$/, false, 1, null, "numeric_only"], // 001
+    [/^([A-Za-z]+\d+)$/, false, 1, null, "alphanum_id"], // PD01, Control01, HC03
   ];
 
   const subjectRecords: SubjectRecord[] = [];
@@ -374,11 +413,14 @@ const extractFromDirectoryStructure = (
 
   for (const filepath of allFiles) {
     const parts = filepath.split("/");
-    // Only check the first 2 path parts (directory levels), not the filename
-    // mirrors: for part in parts[:2]
-    const dirsOnly = parts.slice(0, Math.min(2, parts.length - 1)); // exclude filename
+    // Check ALL directory levels (not just first 2)
+    const dirsOnly = parts.slice(0, parts.length - 1);
+    // const dirsOnly = parts.slice(0, Math.min(2, parts.length - 1)); // only first 2 levels
 
     for (const part of dirsOnly) {
+      // NOTE: the SKIP_DIRS filter for known non-subject directory names is currently disabled
+      // if (SKIP_DIRS.has(part.toLowerCase())) continue;
+
       for (const [
         regex,
         hasSite,
@@ -393,7 +435,7 @@ const extractFromDirectoryStructure = (
           seenIds.add(originalId);
           subjectRecords.push({
             original_id: originalId,
-            numeric_id: match[idGroup],
+            numeric_id: match[idGroup] || match[0],
             site: hasSite && siteGroup ? match[siteGroup] : null,
             pattern_name: patternName,
             file_count: 0,
@@ -407,11 +449,41 @@ const extractFromDirectoryStructure = (
   if (subjectRecords.length === 0) return null;
 
   subjectRecords.sort((a, b) => {
+    // const na = parseInt(a.numeric_id) || 0;
+    // const nb = parseInt(b.numeric_id) || 0;
+    // return na - nb;
+    const aMatch = a.original_id.match(/^([A-Za-z]+)(\d+)$/);
+    const bMatch = b.original_id.match(/^([A-Za-z]+)(\d+)$/);
+
+    if (aMatch && bMatch) {
+      const prefixCompare = aMatch[1].localeCompare(bMatch[1]);
+      if (prefixCompare !== 0) return prefixCompare;
+      return parseInt(aMatch[2]) - parseInt(bMatch[2]);
+    }
+
     const na = parseInt(a.numeric_id) || 0;
     const nb = parseInt(b.numeric_id) || 0;
     return na - nb;
   });
 
+  // (Currently disabled) Build group map: subject originalId → parent directory name
+  // const groupMap: Record<string, string> = {};
+  // for (const filepath of allFiles) {
+  //   const parts = filepath.split("/");
+  //   for (let i = 1; i < parts.length - 1; i++) {
+  //     if (seenIds.has(parts[i]) && !SKIP_DIRS.has(parts[i - 1].toLowerCase())) {
+  //       groupMap[parts[i]] = parts[i - 1];
+  //     }
+  //   }
+  // }
+
+  // // Attach group to each record
+  // for (const rec of subjectRecords) {
+  //   if (groupMap[rec.original_id]) {
+  //     rec.group = groupMap[rec.original_id];
+  //   }
+  // }
+
   return {
     success: true,
     method: "directory_structure",
@@ -551,6 +623,34 @@ export const extractSubjectAnalysis = (
       python_generated_filename_rules: [],
     };
   }
+  // bug fix for subject mapping
+  // === original
+  // const idMapping = generateIdMapping(subjectInfo);
+  // return { ...subjectInfo, id_mapping: idMapping };
+  // ==== end
+  // ==== updates
+  // CRITICAL: n_subjects is authoritative (mirrors planner.py PROMPT_BIDS_PLAN)
+  // If analysis count doesn't match user input, fall back to sequential numbering
+  const expectedCount = userNSubjects;
+  if (expectedCount && subjectInfo.subject_count !== expectedCount) {
+    const idMap: Record<string, string> = {};
+    const reverseMap: Record<string, string> = {};
+    for (let i = 1; i <= expectedCount; i++) {
+      const bidsId = String(i).padStart(2, "0");
+      idMap[`sub-${bidsId}`] = bidsId;
+      reverseMap[bidsId] = `sub-${bidsId}`;
+    }
+    return {
+      ...subjectInfo,
+      subject_count: expectedCount,
+      id_mapping: {
+        id_mapping: idMap,
+        reverse_mapping: reverseMap,
+        strategy_used: "numeric_fallback",
+        metadata_columns: [],
+      },
+    };
+  }
 
   const idMapping = generateIdMapping(subjectInfo);
   return { ...subjectInfo, id_mapping: idMapping };
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts
index 6d6a796..be03f83 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts
@@ -9,9 +9,13 @@ export const getDatasetDescriptionPrompt = (
   evidenceBundle?: any
 ): string => {
   const documentsContext =
+    // evidenceBundle?.documents
+    //   ?.map((d: any) => `[${d.filename}]:\n${d.content}`)
+    //   .join("\n\n") || "";
     evidenceBundle?.documents
-      ?.map((d: any) => `[${d.filename}]:\n${d.content}`)
+      ?.map((d: any) => `[${d.filename}]:\n${(d.content || "").slice(0, 500)}`)
       .join("\n\n") || "";
+
   return `You are a BIDS dataset_description.json generator.
   
   CRITICAL: Use the following user-provided content to extract dataset information!

From 843f0a21d95bc273bb2374f57647a6b6bc69cd95 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 1 Apr 2026 15:05:56 -0400
Subject: [PATCH 02/61] fix: resolve leaks in previewModal 3D viewer

---
 src/components/PreviewModal.tsx |  36 +-
 src/utils/preview.js            | 600 +++++++++++++++++++++++---------
 2 files changed, 454 insertions(+), 182 deletions(-)

diff --git a/src/components/PreviewModal.tsx b/src/components/PreviewModal.tsx
index 4a3ce82..bf81318 100644
--- a/src/components/PreviewModal.tsx
+++ b/src/components/PreviewModal.tsx
@@ -28,30 +28,14 @@ const PreviewModal: React.FC<{
   // fix end---------------------
 
   useEffect(() => {
-    if (!isOpen) return;
-    //add spinner
-    // if (!isOpen || isLoading) return;
-
-    // fix start-----------: Get the container element from the ref.
-    // const container = canvasContainerRef.current;
-    // if (!container) {
-    //   // This can happen briefly on the first render, so we just wait for the next render.
-    //   return;
-    // }
-    // // 3. Check for the required legacy functions on the window object.
-    // if (
-    //   typeof window.previewdata !== "function" ||
-    //   typeof window.initcanvas_with_container !== "function"
-    // ) {
-    //   console.error(
-    //     "❌ Legacy preview script functions are not available on the window object."
-    //   );
-    //   return;
-    // }
-
-    // window.previewdata(dataKey, previewIndex, isInternal, false);
-    // fix end---------------------------------
-    // clear old canvas
+    // if (!isOpen) return;
+    if (!isOpen) {
+      // Modal just closed — clean up Three.js immediately
+      if (typeof window.destroyPreview === "function") {
+        window.destroyPreview();
+      }
+      return;
+    }
     const canvasDiv = document.getElementById("canvas");
     if (canvasDiv)
       while (canvasDiv.firstChild) canvasDiv.removeChild(canvasDiv.firstChild);
@@ -69,6 +53,10 @@ const PreviewModal: React.FC<{
 
     return () => {
       clearInterval(interval);
+      // Effect cleanup (runs on dependency change and on unmount) — clean up Three.js
+      if (typeof window.destroyPreview === "function") {
+        window.destroyPreview();
+      }
     };
   }, [isOpen, dataKey, previewIndex, isInternal]);
 
diff --git a/src/utils/preview.js b/src/utils/preview.js
index 912c8f8..496e855 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -74,18 +74,55 @@ var typedfun = {
   BigUint64Array: null,
 };
 
+// function destroyPreview() {
+//   if (window.scene) {
+//     while (window.scene.children.length > 0) {
+//       const obj = window.scene.children[0];
+//       window.scene.remove(obj);
+//       if (obj.geometry) obj.geometry.dispose();
+//       if (obj.material) obj.material.dispose();
+//     }
+//   }
+
+//   if (window.renderer && window.renderer.domElement) {
+//     window.renderer.domElement.remove();
+//     window.renderer.dispose();
+//   }
+
+//   window.scene = undefined;
+//   window.camera = undefined;
+//   window.renderer = undefined;
+//   window.controls = undefined;
+//   window.reqid = undefined;
+// }
 function destroyPreview() {
+  // Cancel animation loop first
+  if (reqid !== undefined) {
+    cancelAnimationFrame(reqid);
+    reqid = undefined;
+    window.reqid = undefined;
+  }
+
   if (window.scene) {
     while (window.scene.children.length > 0) {
       const obj = window.scene.children[0];
       window.scene.remove(obj);
       if (obj.geometry) obj.geometry.dispose();
-      if (obj.material) obj.material.dispose();
+      if (obj.material) {
+        // Dispose any textures stored in shader uniforms
+        if (obj.material.uniforms) {
+          Object.values(obj.material.uniforms).forEach((u) => {
+            if (u.value && u.value.isTexture) u.value.dispose();
+          });
+        }
+        obj.material.dispose();
+      }
     }
   }
 
   if (window.renderer && window.renderer.domElement) {
     window.renderer.domElement.remove();
+    window.renderer.forceContextLoss();
     window.renderer.dispose();
   }
 
@@ -93,7 +130,9 @@ function destroyPreview() {
   window.camera = undefined;
   window.renderer = undefined;
   window.controls = undefined;
-  window.reqid = undefined;
+  lastvolume = null;
+  lastvolumedata = null;
+  texture = undefined;
 }
 
 function drawpreview(cfg) {
@@ -967,183 +1006,428 @@ function initcanvas() {
     panel.appendChild(stats.domElement);
   }
 
-  $("#camera-near").on("input", function () {
-    camera.near = parseFloat($(this).val());
-    renderer.render(scene, camera);
-    controls.update();
-    renderer.updateComplete = false;
-  });
+  // $("#camera-near").on("input", function () {
+  //   camera.near = parseFloat($(this).val());
+  //   renderer.render(scene, camera);
+  //   controls.update();
+  //   renderer.updateComplete = false;
+  // });
 
-  $("#camera-far").on("input", function () {
-    camera.far = parseFloat($(this).val());
-    renderer.render(scene, camera);
-    controls.update();
-    renderer.updateComplete = false;
-  });
+  // $("#camera-far").on("input", function () {
+  //   camera.far = parseFloat($(this).val());
+  //   renderer.render(scene, camera);
+  //   controls.update();
+  //   renderer.updateComplete = false;
+  // });
 
-  $("#clim-low").on("input", function () {
-    $(this).prop(
-      "title",
-      "" +
-        $(this).val() +
-        " [" +
-        $(this).prop("min") +
-        "," +
-        $(this).prop("max") +
-        "]"
-    );
-    if (lastvolume !== null) {
-      let val = lastvolume.material.uniforms["u_clim"].value;
-      lastvolume.material.uniforms["u_clim"].value.set(
-        parseFloat($(this).val()),
-        val.y
-      );
-      renderer.updateComplete = false;
-    }
-  });
+  // $("#clim-low").on("input", function () {
+  //   $(this).prop(
+  //     "title",
+  //     "" +
+  //       $(this).val() +
+  //       " [" +
+  //       $(this).prop("min") +
+  //       "," +
+  //       $(this).prop("max") +
+  //       "]"
+  //   );
+  //   if (lastvolume !== null) {
+  //     let val = lastvolume.material.uniforms["u_clim"].value;
+  //     lastvolume.material.uniforms["u_clim"].value.set(
+  //       parseFloat($(this).val()),
+  //       val.y
+  //     );
+  //     renderer.updateComplete = false;
+  //   }
+  // });
 
-  $("#clim-hi").on("input", function () {
-    $(this).prop(
-      "title",
-      "" +
-        $(this).val() +
-        " [" +
-        $(this).prop("min") +
-        "," +
-        $(this).prop("max") +
-        "]"
-    );
-    if (lastvolume !== null) {
-      let val = lastvolume.material.uniforms["u_clim"].value;
-      lastvolume.material.uniforms["u_clim"].value.set(
-        val.x,
-        parseFloat($(this).val())
-      );
-      renderer.updateComplete = false;
-    }
-  });
+  // $("#clim-hi").on("input", function () {
+  //   $(this).prop(
+  //     "title",
+  //     "" +
+  //       $(this).val() +
+  //       " [" +
+  //       $(this).prop("min") +
+  //       "," +
+  //       $(this).prop("max") +
+  //       "]"
+  //   );
+  //   if (lastvolume !== null) {
+  //     let val = lastvolume.material.uniforms["u_clim"].value;
+  //     lastvolume.material.uniforms["u_clim"].value.set(
+  //       val.x,
+  //       parseFloat($(this).val())
+  //     );
+  //     renderer.updateComplete = false;
+  //   }
+  // });
 
-  $("#isothreshold").on("input", function () {
-    $(this).prop(
-      "title",
-      "" +
-        $(this).val() +
-        " [" +
-        $(this).prop("min") +
-        "," +
-        $(this).prop("max") +
-        "]"
-    );
-    if (lastvolume !== null) {
-      let val = lastvolume.material.uniforms["u_renderthreshold"].value;
-      lastvolume.material.uniforms["u_renderthreshold"].value = parseFloat(
-        $(this).val()
-      );
-      renderer.updateComplete = false;
-    }
-  });
+  // $("#isothreshold").on("input", function () {
+  //   $(this).prop(
+  //     "title",
+  //     "" +
+  //       $(this).val() +
+  //       " [" +
+  //       $(this).prop("min") +
+  //       "," +
+  //       $(this).prop("max") +
+  //       "]"
+  //   );
+  //   if (lastvolume !== null) {
+  //     let val = lastvolume.material.uniforms["u_renderthreshold"].value;
+  //     lastvolume.material.uniforms["u_renderthreshold"].value = parseFloat(
+  //       $(this).val()
+  //     );
+  //     renderer.updateComplete = false;
+  //   }
+  // });
 
-  $("#mip-radio-button").on("change", function () {
-    if (lastvolume !== null) {
-      const unfs = lastvolume.material.uniforms;
-      lastvolume.material = new THREE.ShaderMaterial({
-        uniforms: THREE.UniformsUtils.clone(MipRenderShader.uniforms),
-        vertexShader: MipRenderShader.vertexShader,
-        fragmentShader: MipRenderShader.fragmentShader,
-        side: THREE.BackSide,
-      });
-      lastvolume.material.uniforms = unfs;
-      renderer.updateComplete = false;
-    }
-  });
+  // $("#mip-radio-button").on("change", function () {
+  //   if (lastvolume !== null) {
+  //     const unfs = lastvolume.material.uniforms;
+  //     lastvolume.material = new THREE.ShaderMaterial({
+  //       uniforms: THREE.UniformsUtils.clone(MipRenderShader.uniforms),
+  //       vertexShader: MipRenderShader.vertexShader,
+  //       fragmentShader: MipRenderShader.fragmentShader,
+  //       side: THREE.BackSide,
+  //     });
+  //     lastvolume.material.uniforms = unfs;
+  //     renderer.updateComplete = false;
+  //   }
+  // });
 
-  $("#iso-radio-button").on("change", function () {
-    if (lastvolume !== null) {
-      const unfs = lastvolume.material.uniforms;
-      lastvolume.material = new THREE.ShaderMaterial({
-        uniforms: THREE.UniformsUtils.clone(IsoRenderShader.uniforms),
-        vertexShader: IsoRenderShader.vertexShader,
-        fragmentShader: IsoRenderShader.fragmentShader,
-        side: THREE.BackSide,
-      });
-      lastvolume.material.uniforms = unfs;
-      renderer.updateComplete = false;
-    }
-  });
+  // $("#iso-radio-button").on("change", function () {
+  //   if (lastvolume !== null) {
+  //     const unfs = lastvolume.material.uniforms;
+  //     lastvolume.material = new THREE.ShaderMaterial({
+  //       uniforms: THREE.UniformsUtils.clone(IsoRenderShader.uniforms),
+  //       vertexShader: IsoRenderShader.vertexShader,
+  //       fragmentShader: IsoRenderShader.fragmentShader,
+  //       side: THREE.BackSide,
+  //     });
+  //     lastvolume.material.uniforms = unfs;
+  //     renderer.updateComplete = false;
+  //   }
+  // });
 
-  $("#interp-radio-button").on("change", function () {
-    if (lastvolume !== null) {
-      const unfs = lastvolume.material.uniforms;
-      lastvolume.material = new THREE.RawShaderMaterial(InterpRenderShader());
-      lastvolume.material.uniforms = unfs;
-      lastvolume.material.uniforms.cameraPos.value.copy(camera.position);
-      renderer.updateComplete = false;
-    }
-  });
+  // $("#interp-radio-button").on("change", function () {
+  //   if (lastvolume !== null) {
+  //     const unfs = lastvolume.material.uniforms;
+  //     lastvolume.material = new THREE.RawShaderMaterial(InterpRenderShader());
+  //     lastvolume.material.uniforms = unfs;
+  //     lastvolume.material.uniforms.cameraPos.value.copy(camera.position);
+  //     renderer.updateComplete = false;
+  //   }
+  // });
 
-  $("#cross-x-low").on("input", function () {
-    setcrosssectionsizes(this);
-  });
+  // $("#cross-x-low").on("input", function () {
+  //   setcrosssectionsizes(this);
+  // });
 
-  $("#cross-y-low").on("input", function () {
-    setcrosssectionsizes(this);
-  });
+  // $("#cross-y-low").on("input", function () {
+  //   setcrosssectionsizes(this);
+  // });
 
-  $("#cross-z-low").on("input", function () {
-    setcrosssectionsizes(this);
-  });
+  // $("#cross-z-low").on("input", function () {
+  //   setcrosssectionsizes(this);
+  // });
 
-  $("#cross-x-hi").on("input", function () {
-    setcrosssectionsizes(this);
-  });
+  // $("#cross-x-hi").on("input", function () {
+  //   setcrosssectionsizes(this);
+  // });
 
-  $("#cross-y-hi").on("input", function () {
-    setcrosssectionsizes(this);
-  });
+  // $("#cross-y-hi").on("input", function () {
+  //   setcrosssectionsizes(this);
+  // });
 
-  $("#cross-z-hi").on("input", function () {
-    setcrosssectionsizes(this);
-  });
+  // $("#cross-z-hi").on("input", function () {
+  //   setcrosssectionsizes(this);
+  // });
 
-  $("#x_thickness, #y_thickness, #z_thickness").on("input", function () {
-    let eid = $(this).attr("id");
-    let linkedeid1 = eid.replace(/_thickness/, "-low").replace(/^/, "cross-");
-    let linkedeid2 = eid.replace(/_thickness/, "-hi").replace(/^/, "cross-");
-    if ($(this).val() == 0) {
-      $("#" + linkedeid1).val(0);
-      $("#" + linkedeid2).val(1);
-    } else {
-      $("#" + linkedeid1).val(
-        ($("#" + linkedeid1).val() + $("#" + linkedeid2).val()) * 0.5
+  // $("#x_thickness, #y_thickness, #z_thickness").on("input", function () {
+  //   let eid = $(this).attr("id");
+  //   let linkedeid1 = eid.replace(/_thickness/, "-low").replace(/^/, "cross-");
+  //   let linkedeid2 = eid.replace(/_thickness/, "-hi").replace(/^/, "cross-");
+  //   if ($(this).val() == 0) {
+  //     $("#" + linkedeid1).val(0);
+  //     $("#" + linkedeid2).val(1);
+  //   } else {
+  //     $("#" + linkedeid1).val(
+  //       ($("#" + linkedeid1).val() + $("#" + linkedeid2).val()) * 0.5
+  //     );
+  //   }
+  //   setcrosssectionsizes($("#" + linkedeid1));
+  // });
+
+  // $("#pos-x-view").on("click", function () {
+  //   setControlAngles((Math.PI * 90) / 180, (Math.PI * 90) / 180);
+  //   renderer.updateComplete = false;
+  // });
+
+  // $("#neg-x-view").on("click", function () {
+  //   setControlAngles((Math.PI * 90) / 180, (Math.PI * 270) / 180);
+  // });
+
+  // $("#pos-y-view").on("click", function () {
+  //   setControlAngles((Math.PI * 90) / 180, (Math.PI * 180) / 180);
+  // });
+
+  // $("#neg-y-view").on("click", function () {
+  //   setControlAngles((Math.PI * 90) / 180, (Math.PI * 0) / 180);
+  // });
+
+  // $("#pos-z-view").on("click", function () {
+  //   setControlAngles(0, 0);
+  // });
+
+  // $("#neg-z-view").on("click", function () {
+  //   setControlAngles((Math.PI * 180) / 180, 0);
+  // });
+
+  $("#camera-near")
+    .off("input")
+    .on("input", function () {
+      camera.near = parseFloat($(this).val());
+      renderer.render(scene, camera);
+      controls.update();
+      renderer.updateComplete = false;
+    });
+
+  $("#camera-far")
+    .off("input")
+    .on("input", function () {
+      camera.far = parseFloat($(this).val());
+      renderer.render(scene, camera);
+      controls.update();
+      renderer.updateComplete = false;
+    });
+
+  $("#clim-low")
+    .off("input")
+    .on("input", function () {
+      $(this).prop(
+        "title",
+        "" +
+          $(this).val() +
+          " [" +
+          $(this).prop("min") +
+          "," +
+          $(this).prop("max") +
+          "]"
       );
-    }
-    setcrosssectionsizes($("#" + linkedeid1));
-  });
+      if (lastvolume !== null) {
+        let val = lastvolume.material.uniforms["u_clim"].value;
+        lastvolume.material.uniforms["u_clim"].value.set(
+          parseFloat($(this).val()),
+          val.y
+        );
+        renderer.updateComplete = false;
+      }
+    });
 
-  $("#pos-x-view").on("click", function () {
-    setControlAngles((Math.PI * 90) / 180, (Math.PI * 90) / 180);
-    renderer.updateComplete = false;
-  });
+  $("#clim-hi")
+    .off("input")
+    .on("input", function () {
+      $(this).prop(
+        "title",
+        "" +
+          $(this).val() +
+          " [" +
+          $(this).prop("min") +
+          "," +
+          $(this).prop("max") +
+          "]"
+      );
+      if (lastvolume !== null) {
+        let val = lastvolume.material.uniforms["u_clim"].value;
+        lastvolume.material.uniforms["u_clim"].value.set(
+          val.x,
+          parseFloat($(this).val())
+        );
+        renderer.updateComplete = false;
+      }
+    });
 
-  $("#neg-x-view").on("click", function () {
-    setControlAngles((Math.PI * 90) / 180, (Math.PI * 270) / 180);
-  });
+  $("#isothreshold")
+    .off("input")
+    .on("input", function () {
+      $(this).prop(
+        "title",
+        "" +
+          $(this).val() +
+          " [" +
+          $(this).prop("min") +
+          "," +
+          $(this).prop("max") +
+          "]"
+      );
+      if (lastvolume !== null) {
+        lastvolume.material.uniforms["u_renderthreshold"].value = parseFloat(
+          $(this).val()
+        );
+        renderer.updateComplete = false;
+      }
+    });
 
-  $("#pos-y-view").on("click", function () {
-    setControlAngles((Math.PI * 90) / 180, (Math.PI * 180) / 180);
-  });
+  $("#mip-radio-button")
+    .off("change")
+    .on("change", function () {
+      if (lastvolume !== null) {
+        const unfs = lastvolume.material.uniforms;
+        lastvolume.material = new THREE.ShaderMaterial({
+          uniforms: THREE.UniformsUtils.clone(MipRenderShader.uniforms),
+          vertexShader: MipRenderShader.vertexShader,
+          fragmentShader: MipRenderShader.fragmentShader,
+          side: THREE.BackSide,
+        });
+        lastvolume.material.uniforms = unfs;
+        renderer.updateComplete = false;
+      }
+    });
 
-  $("#neg-y-view").on("click", function () {
-    setControlAngles((Math.PI * 90) / 180, (Math.PI * 0) / 180);
-  });
+  $("#iso-radio-button")
+    .off("change")
+    .on("change", function () {
+      if (lastvolume !== null) {
+        const unfs = lastvolume.material.uniforms;
+        lastvolume.material = new THREE.ShaderMaterial({
+          uniforms: THREE.UniformsUtils.clone(IsoRenderShader.uniforms),
+          vertexShader: IsoRenderShader.vertexShader,
+          fragmentShader: IsoRenderShader.fragmentShader,
+          side: THREE.BackSide,
+        });
+        lastvolume.material.uniforms = unfs;
+        renderer.updateComplete = false;
+      }
+    });
 
-  $("#pos-z-view").on("click", function () {
-    setControlAngles(0, 0);
-  });
+  $("#interp-radio-button")
+    .off("change")
+    .on("change", function () {
+      if (lastvolume !== null) {
+        const unfs = lastvolume.material.uniforms;
+        lastvolume.material = new THREE.RawShaderMaterial(InterpRenderShader());
+        lastvolume.material.uniforms = unfs;
+        lastvolume.material.uniforms.cameraPos.value.copy(camera.position);
+        renderer.updateComplete = false;
+      }
+    });
 
-  $("#neg-z-view").on("click", function () {
-    setControlAngles((Math.PI * 180) / 180, 0);
-  });
+  $("#cross-x-low")
+    .off("input")
+    .on("input", function () {
+      setcrosssectionsizes(this);
+    });
+  $("#cross-y-low")
+    .off("input")
+    .on("input", function () {
+      setcrosssectionsizes(this);
+    });
+  $("#cross-z-low")
+    .off("input")
+    .on("input", function () {
+      setcrosssectionsizes(this);
+    });
+  $("#cross-x-hi")
+    .off("input")
+    .on("input", function () {
+      setcrosssectionsizes(this);
+    });
+  $("#cross-y-hi")
+    .off("input")
+    .on("input", function () {
+      setcrosssectionsizes(this);
+    });
+  $("#cross-z-hi")
+    .off("input")
+    .on("input", function () {
+      setcrosssectionsizes(this);
+    });
+
+  $("#x_thickness, #y_thickness, #z_thickness")
+    .off("input")
+    .on("input", function () {
+      // Map "<axis>_thickness" to its linked "cross-<axis>-low" / "-hi" sliders.
+      const axis = $(this).attr("id").replace(/_thickness/, "");
+      const low = $("#cross-" + axis + "-low");
+      const hi = $("#cross-" + axis + "-hi");
+      if ($(this).val() == 0) {
+        low.val(0);
+        hi.val(1);
+      } else {
+        // .val() returns strings: parse before adding, otherwise "+" concatenates.
+        low.val((parseFloat(low.val()) + parseFloat(hi.val())) * 0.5);
+      }
+      setcrosssectionsizes(low);
+    });
+
+  $("#pos-x-view")
+    .off("click")
+    .on("click", function () {
+      setControlAngles((Math.PI * 90) / 180, (Math.PI * 90) / 180);
+      renderer.updateComplete = false;
+    });
+  $("#neg-x-view")
+    .off("click")
+    .on("click", function () {
+      setControlAngles((Math.PI * 90) / 180, (Math.PI * 270) / 180);
+    });
+  $("#pos-y-view")
+    .off("click")
+    .on("click", function () {
+      setControlAngles((Math.PI * 90) / 180, (Math.PI * 180) / 180);
+    });
+  $("#neg-y-view")
+    .off("click")
+    .on("click", function () {
+      setControlAngles((Math.PI * 90) / 180, (Math.PI * 0) / 180);
+    });
+  $("#pos-z-view")
+    .off("click")
+    .on("click", function () {
+      setControlAngles(0, 0);
+    });
+  $("#neg-z-view")
+    .off("click")
+    .on("click", function () {
+      setControlAngles((Math.PI * 180) / 180, 0);
+    });
+
+  $("#cross-t")
+    .off("mouseup")
+    .on("mouseup", function () {
+      $(this).prop(
+        "title",
+        "" +
+          $(this).val() +
+          " [" +
+          $(this).prop("min") +
+          "," +
+          $(this).prop("max") +
+          "]"
+      );
+      if (lastvolume !== null && lastvolumedata !== undefined) {
+        let dim = lastvolumedim;
+        let offset =
+          Math.min($(this).val(), dim[3] - 2) * dim[0] * dim[1] * dim[2];
+        let texture = new THREE.Data3DTexture(
+          lastvolumedata.selection.data.slice(
+            offset - 1,
+            offset + dim[0] * dim[1] * dim[2] - 1
+          ),
+          dim[0],
+          dim[1],
+          dim[2]
+        );
+        texture.format = THREE.RedFormat;
+        texture.type = texture_dtype[lastvolumedata.dtype];
+        texture.minFilter = texture.magFilter = THREE.LinearFilter;
+        texture.unpackAlignment = 1;
+        texture.needsUpdate = true;
+        lastvolume.material.uniforms["u_data"].value = texture;
+        renderer.updateComplete = false;
+      }
+    });
 
   $("#cross-t").on("mouseup", function () {
     $(this).prop(

From e54ea6f058496d17201552a454f8c83d3e9458fe Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 2 Apr 2026 09:32:15 -0400
Subject: [PATCH 03/61] fix: resolve memory leaks in 2D plot viewer

---
 src/utils/preview.js | 37 +++++++++++++++++++++++++++----------
 1 file changed, 27 insertions(+), 10 deletions(-)

diff --git a/src/utils/preview.js b/src/utils/preview.js
index 496e855..02f3908 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -33,6 +33,7 @@ var lastvolume = null;
 var lastvolumedata = null;
 var lastvolumedim = [];
 var lastclim = 0;
+var uplotInstance = null;
 var reqid = undefined;
 
 var canvas = null;
@@ -133,6 +134,12 @@ function destroyPreview() {
   lastvolume = null;
   lastvolumedata = null;
   texture = undefined;
+
+  if (uplotInstance !== null) {
+    uplotInstance.destroy();
+    uplotInstance = null;
+  }
+  $("#chartpanel").hide().html("");
 }
 
 function drawpreview(cfg) {
@@ -428,22 +435,32 @@ function dopreview(key, idx, isinternal, hastime) {
             ? "y" + i
             : hastime[i];
       }
-      let u = new uPlot(opts, plotdata, document.getElementById("plotchart"));
+      // let u = new uPlot(opts, plotdata, document.getElementById("plotchart"));
+      if (uplotInstance !== null) {
+        uplotInstance.destroy();
+        uplotInstance = null;
+      }
+      uplotInstance = new uPlot(
+        opts,
+        plotdata,
+        document.getElementById("plotchart")
+      );
     } else {
-      let u = new uPlot(
+      // let u = new uPlot(
+      //   opts,
+      //   [[...Array(dataroot.length).keys()], dataroot],
+      //   document.getElementById("plotchart")
+      // );
+      if (uplotInstance !== null) {
+        uplotInstance.destroy();
+        uplotInstance = null;
+      }
+      uplotInstance = new uPlot(
         opts,
         [[...Array(dataroot.length).keys()], dataroot],
         document.getElementById("plotchart")
       );
     }
-    // add spinner
-    // --- NEW LOGIC for 2D plot ---
-    // Signal that the 2D plot has just been created and is now visible.
-    // if (typeof window.__onPreviewReady === "function") {
-    //   window.__onPreviewReady();
-    //   window.__onPreviewReady = null; // Clean up to prevent accidental re-firing
-    // }
-    // --- END NEW LOGIC ---
 
     // for spinner
     // --- Signal React that 2D preview is ready ---

From ecf15ebf7146590eb57dcf4d1988290b8aab6bf5 Mon Sep 17 00:00:00 2001
From: Qianqian Fang <fangqq@gmail.com>
Date: Thu, 2 Apr 2026 11:44:01 -0400
Subject: [PATCH 04/61] [debug] print github action server IP

---
 .github/workflows/build-deploy-zodiac.yml | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/.github/workflows/build-deploy-zodiac.yml b/.github/workflows/build-deploy-zodiac.yml
index 57a049d..d6d86e6 100644
--- a/.github/workflows/build-deploy-zodiac.yml
+++ b/.github/workflows/build-deploy-zodiac.yml
@@ -18,6 +18,9 @@ jobs:
       - name: Check out the repository
         uses: actions/checkout@v3
 
+      - name: Check IP
+        run: curl https://api.ipify.org
+
       - name: Install dependencies
         run: yarn install --frozen-lockfile
 

From 66f6e435ead30e55958fba297e4255b34a2283e9 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 2 Apr 2026 13:51:51 -0400
Subject: [PATCH 05/61] feat: add executorHelpers and plannerHelpers

---
 .../DatasetOrganizer/utils/executorHelpers.ts | 522 ++++++++++++++++++
 .../DatasetOrganizer/utils/fileAnalyzers.ts   | 332 ++---------
 .../utils/filenameTokenizer.ts                | 505 +++++++++++++++--
 .../DatasetOrganizer/utils/plannerHelpers.ts  |   0
 4 files changed, 1030 insertions(+), 329 deletions(-)
 create mode 100644 src/components/User/Dashboard/DatasetOrganizer/utils/executorHelpers.ts
 create mode 100644 src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts

diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/executorHelpers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/executorHelpers.ts
new file mode 100644
index 0000000..782dee5
--- /dev/null
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/executorHelpers.ts
@@ -0,0 +1,522 @@
+// src/components/DatasetOrganizer/utils/executorHelpers.ts
+//
+// Portable helper functions from autobidsify/converters/executor.py
+//
+// What is NOT here (intentionally — requires server-side CLI):
+//   execute_bids_plan()       — file copy/conversion operations
+//   convert_mat_to_snirf()    — binary .mat read + .snirf write
+//   run_dcm2niix_batch()      — dcm2niix subprocess
+//   convert_jnifti_to_nifti() — nibabel NIfTI write
+//
+// What IS here (useful client-side for plan validation + preview):
+//   sanitizeBidsLabel()       mirrors _sanitize_bids_label()
+//   normalizeFilename()       mirrors _normalize_filename()
+//   extractAcqLabel()         mirrors _extract_acq_label()
+//   selectPreferredFile()     mirrors _select_preferred_file()
+//   matchGlobPattern()        mirrors _match_glob_pattern()
+//   inferScanType()           mirrors infer_scan_type_from_filepath()
+//   inferSubdirectory()       mirrors infer_subdirectory_from_suffix()
+//   categorizeScanType()      mirrors categorize_scan_type()
+//   analyzeFilepathUniversal() mirrors analyze_filepath_universal()
+//   validatePlanCoverage()    NEW — uses matchGlobPattern to check LLM patterns
+
+// ============================================================================
+// sanitizeBidsLabel()
+// Mirrors _sanitize_bids_label() in executor.py
+// Drops every character outside [a-zA-Z0-9] from a BIDS entity value,
+// e.g. "mental_arithmetic" → "mentalarithmetic"
+// ============================================================================
+
+export const sanitizeBidsLabel = (label: string): string =>
+  label.split(/[^a-zA-Z0-9]+/).join("");
+
+// ============================================================================
+// normalizeFilename()
+// Mirrors _normalize_filename() in executor.py
+//
+// Strips extensions and trailing sequence numbers.
+// Used to identify DICOM series and detect format duplicates.
+//
+// Examples:
+//   "VHFCT1mm-Hip (134).dcm"       → "vhfct1mm-hip"
+//   "scan_mprage_anonymized.nii.gz" → "scan_mprage_anonymized"
+//   "scan_001.dcm"                  → "scan"
+// ============================================================================
+
+export const normalizeFilename = (filepath: string): string => {
+  // Work on the basename only; directory components are ignored.
+  let stem = filepath.slice(filepath.lastIndexOf("/") + 1);
+
+  // Peel dot-suffixes right-to-left while the last one is at most 6 chars.
+  let dot = stem.lastIndexOf(".");
+  while (dot !== -1 && stem.length - dot - 1 <= 6) {
+    stem = stem.slice(0, dot);
+    dot = stem.lastIndexOf(".");
+  }
+
+  // Drop a trailing " (N)" counter first, then a trailing _NNN / -NNN index.
+  const withoutCounter = stem.replace(/\s*\(\d+\)\s*$/, "");
+  return withoutCounter.replace(/[_\-]\d+$/, "").trim().toLowerCase();
+};
+
+// ============================================================================
+// extractAcqLabel()
+// Mirrors _extract_acq_label() in executor.py
+//
+// Derives a short, clean acq- label from a normalized DICOM filename.
+// Keeps the last meaningful alphabetic token (body part or scan descriptor).
+//
+// Examples (tokens are maximal runs of a-z, so digits, "-" and "_" split them):
+//   "vhfct1mm-ankle" → "ankle"
+//   "vhfct1mm-head"  → "head"
+//   "vhmct1mm-hip"   → "hip"
+//   "scan_mprage"    → "mprage"
+// ============================================================================
+
+export const extractAcqLabel = (normalizedFname: string): string => {
+  // Tokens in this set are never returned as the label.
+  const noise = new Set(["vhf", "vhm", "ct", "mr", "mri", "mm", "scan", "the"]);
+  const words = normalizedFname.match(/[a-z]+/g) || [];
+  // Walk backwards: the last token of 3+ letters that is not noise wins.
+  for (let i = words.length - 1; i >= 0; i--) {
+    if (words[i].length > 2 && !noise.has(words[i])) return words[i];
+  }
+  return normalizedFname.slice(0, 20); // nothing usable: first 20 chars
+};
+
+// ============================================================================
+// selectPreferredFile()
+// Mirrors _select_preferred_file() in executor.py
+//
+// Priority: NIfTI dir > non-BRIK > shortest path > alphabetical
+// ============================================================================
+
+export const selectPreferredFile = (files: string[]): string | null => {
+  if (files.length <= 1) return files.length === 1 ? files[0] : null;
+
+  // Sort key, lowest wins: nifti dir, then no brik dir, then shallowest path.
+  const ranked = files.map((path) => {
+    const segments = path.toLowerCase().split("/");
+    return {
+      path,
+      notNifti: segments.some((s) => s.includes("nifti")) ? 0 : 1,
+      brik: segments.some((s) => s.includes("brik")) ? 1 : 0,
+      depth: segments.length,
+    };
+  });
+
+  ranked.sort(
+    (a, b) =>
+      a.notNifti - b.notNifti ||
+      a.brik - b.brik ||
+      a.depth - b.depth ||
+      a.path.localeCompare(b.path) // final tie-break: alphabetical
+  );
+  return ranked[0].path;
+};
+
+// ============================================================================
+// matchGlobPattern()
+// Mirrors _match_glob_pattern() in executor.py
+//
+// Supported patterns:
+//   "**/*.nii.gz"  → any .nii.gz at any depth
+//   "**/BRIK/**"   → any file inside a BRIK directory
+//   "*token*"      → filepath contains token
+//   "*.ext"        → filename ends with extension
+//   "token*"       → filename starts with token
+//   "plain"        → substring anywhere in path (fallback)
+// ============================================================================
+
+export const matchGlobPattern = (
+  filepath: string,
+  pattern: string
+): boolean => {
+  // Matching is case-insensitive: both sides are lower-cased up front.
+  const path = filepath.toLowerCase();
+  const glob = pattern.toLowerCase();
+  const segments = path.split("/");
+  const basename = segments[segments.length - 1];
+  const anyDepth = glob.startsWith("**/");
+
+  if (anyDepth && glob.endsWith("/**")) {
+    // "**/dir/**": some directory component (basename excluded) equals dir.
+    const dir = glob.slice(3, -3);
+    return segments.slice(0, -1).some((segment) => segment === dir);
+  }
+
+  if (anyDepth) {
+    // "**/*.ext": path ends with ".ext"; other "**/rest": path contains rest.
+    const rest = glob.slice(3);
+    return rest.startsWith("*.")
+      ? path.endsWith(rest.slice(1))
+      : path.includes(rest);
+  }
+
+  if (glob.startsWith("*") && glob.endsWith("*")) {
+    // "*token*" (and a bare "*"): token occurs anywhere in the full path.
+    return path.includes(glob.slice(1, -1));
+  }
+
+  if (glob.startsWith("*.")) {
+    // "*.ext": only the basename is tested.
+    return basename.endsWith(glob.slice(1));
+  }
+
+  // "token*": basename prefix. No wildcard at all: plain substring of the path.
+  return glob.endsWith("*")
+    ? basename.startsWith(glob.slice(0, -1))
+    : path.includes(glob);
+};
+
+// ============================================================================
+// inferScanType()
+// Mirrors infer_scan_type_from_filepath() in executor.py
+// Returns the BIDS suffix, target subdirectory and category for one file.
+// Priority (first hit wins; rules that throw or do not match are skipped):
+//   1. LLM filename_rules from BIDSPlan (match_pattern + bids_template)
+//   2. BIDS entities / keywords in the filename (ses-, task-, acq-, run-)
+//   3. Keyword detection in path
+//   4. Extension fallback, else suffix "unknown" in anat/
+// ============================================================================
+
+interface ScanTypeResult {
+  suffix: string;
+  subdirectory: string;
+  category: string;
+}
+
+export const inferScanType = (
+  filepath: string,
+  filenameRules: any[] = []
+): ScanTypeResult => {
+  const pathLower = filepath.toLowerCase();
+  const filename = filepath.split("/").pop()!;
+  const fnameLow = filename.toLowerCase();
+
+  // ── Priority 1: LLM filename_rules ──────────────────────────────────
+  for (const rule of filenameRules) {
+    try {
+      const mp = (rule.match_pattern || "").replace(/\\\\/g, "\\");
+      if (!new RegExp(mp, "i").test(filename)) continue;
+
+      const template: string = rule.bids_template || "";
+      const m = template.match(/sub-[^_]+_(.*?)\.(nii\.gz|snirf|nii)/);
+      if (!m) continue;
+
+      let raw = m[1];
+      // Remove placeholder entities
+      raw = raw
+        .replace(/ses-X_?/g, "")
+        .replace(/task-X_?/g, "")
+        .replace(/^_|_$/g, "");
+
+      // Remove spurious ses- if no ses- dir in path
+      if (
+        /ses-[A-Za-z0-9]+/.test(raw) &&
+        !/\/ses-[A-Za-z0-9]+\//.test(filepath)
+      ) {
+        raw = raw.replace(/ses-[A-Za-z0-9]+_?/g, "").replace(/^_|_$/g, "");
+      }
+
+      if (raw) {
+        // Sanitize entity values (mirrors _sanitize_suffix() in executor.py).
+        // Final _suffix may hold digits: "acq-head_neck_T1w" → "acq-headneck_T1w"
+        raw = raw.replace(
+          /([a-zA-Z]+-)(.+?)(?=_[a-zA-Z]+-|_[a-zA-Z0-9]+$|$)/g,
+          (_match, key, val) => key + sanitizeBidsLabel(val)
+        );
+        const subdir = inferSubdirectory(raw);
+        return {
+          suffix: raw,
+          subdirectory: subdir,
+          category: categorizeScanType(raw),
+        };
+      }
+    } catch {
+      continue;
+    }
+  }
+
+  // ── Priority 2: BIDS entities already in filename ────────────────────
+  const entities: Record<string, string> = {};
+  for (const [key, pattern] of [
+    ["ses", /ses-([A-Za-z0-9]+)/],
+    ["task", /task-([A-Za-z0-9]+)/],
+    ["acq", /acq-([A-Za-z0-9]+)/],
+    ["run", /run-([A-Za-z0-9]+)/],
+  ] as [string, RegExp][]) {
+    const match = filename.match(pattern);
+    if (match) entities[key] = match[1];
+  }
+
+  // Infer task from filename keywords when no task- entity present
+  if (!entities.task) {
+    const nameNoExt = fnameLow.replace(/\.[^.]+$/, "");
+    if (/rest|resting/.test(nameNoExt)) entities.task = "rest";
+    else if (/finger|tapping|fingertap/.test(nameNoExt))
+      entities.task = "fingertapping";
+    else if (/walking|walk/.test(nameNoExt)) entities.task = "walking";
+    else if (/motor|tap/.test(nameNoExt)) entities.task = "motor";
+  }
+
+  let modalityLabel: string | null = null;
+  let subdir = "anat";
+
+  if (fnameLow.endsWith(".snirf") || fnameLow.includes("nirs")) {
+    modalityLabel = "nirs";
+    subdir = "nirs";
+  } else if (/t1w|t1/.test(fnameLow)) {
+    modalityLabel = "T1w";
+    subdir = "anat";
+  } else if (/t2w|t2/.test(fnameLow)) {
+    modalityLabel = "T2w";
+    subdir = "anat";
+  } else if (/bold|func/.test(fnameLow)) {
+    modalityLabel = "bold";
+    subdir = "func";
+  } else if (/dwi/.test(fnameLow)) {
+    modalityLabel = "dwi";
+    subdir = "dwi";
+  }
+
+  // BIDS rule: task-* scans go in func/ (unless nirs)
+  if (subdir !== "nirs" && (entities.task || pathLower.includes("func/"))) {
+    subdir = "func";
+    if (!modalityLabel) modalityLabel = "bold";
+  }
+
+  if (Object.keys(entities).length > 0 || modalityLabel) {
+    const parts: string[] = [];
+    for (const key of ["ses", "task", "acq", "run"]) {
+      if (entities[key])
+        parts.push(`${key}-${sanitizeBidsLabel(entities[key])}`);
+    }
+    if (modalityLabel) parts.push(modalityLabel);
+    if (parts.length > 0) {
+      const suffix = parts.join("_");
+      return {
+        suffix,
+        subdirectory: subdir,
+        category: categorizeScanType(suffix),
+      };
+    }
+  }
+
+  // ── Priority 3: Heuristic path keywords ─────────────────────────────
+  if (/anat|mprage|t1w/.test(pathLower))
+    return { suffix: "T1w", subdirectory: "anat", category: "anatomical" };
+  if (/func|bold/.test(pathLower)) {
+    const m = pathLower.match(/task[_-]([a-z0-9]+)/);
+    const suffix = m ? `task-${m[1]}_bold` : "task-rest_bold";
+    return { suffix, subdirectory: "func", category: "functional" };
+  }
+  if (pathLower.includes("rest"))
+    return {
+      suffix: "task-rest_bold",
+      subdirectory: "func",
+      category: "functional",
+    };
+  if (/nirs|fnirs|\.snirf/.test(pathLower))
+    return { suffix: "nirs", subdirectory: "nirs", category: "functional" };
+  if (pathLower.includes("dwi"))
+    return { suffix: "dwi", subdirectory: "dwi", category: "diffusion" };
+
+  // ── Priority 4: Extension fallback ──────────────────────────────────
+  if (fnameLow.endsWith(".snirf"))
+    return { suffix: "nirs", subdirectory: "nirs", category: "functional" };
+  if (fnameLow.endsWith(".nii") || fnameLow.endsWith(".nii.gz"))
+    return { suffix: "T1w", subdirectory: "anat", category: "anatomical" };
+
+  return { suffix: "unknown", subdirectory: "anat", category: "unknown" };
+};
+
+// ============================================================================
+// inferSubdirectory()
+// Mirrors infer_subdirectory_from_suffix() in executor.py
+// ============================================================================
+
+export const inferSubdirectory = (suffix: string): string => {
+  const lowered = suffix.toLowerCase();
+  const has = (keyword: string): boolean => lowered.includes(keyword);
+  // Checked in priority order; "anat" is both the T1w/T2w answer and default.
+  if (has("t1w") || has("t2w")) return "anat";
+  if (has("bold")) return "func";
+  return has("nirs") ? "nirs" : has("dwi") ? "dwi" : "anat";
+};
+
+// ============================================================================
+// categorizeScanType()
+// Mirrors categorize_scan_type() in executor.py
+// ============================================================================
+
+export const categorizeScanType = (suffix: string): string => {
+  const lowered = suffix.toLowerCase();
+  // Case-insensitive keyword tests; the first matching group decides.
+  if (/t1w|t2w/.test(lowered)) return "anatomical";
+  if (/bold|nirs/.test(lowered)) return "functional";
+  return lowered.includes("dwi") ? "diffusion" : "unknown";
+};
+
+// ============================================================================
+// analyzeFilepathUniversal()
+// Mirrors analyze_filepath_universal() in executor.py
+// Plan preview: BIDS subject ID and output filename for one source file.
+// Subject lookup: rule.match globs > rule.original > rule.prefix >
+// "sub-XX" path component > "unknown"; extension follows `modality`.
+// ============================================================================
+
+export interface FilepathAnalysis {
+  subject_id: string;
+  scan_type_suffix: string;
+  bids_filename: string;
+  subdirectory: string;
+  scan_category: string;
+  original_filepath: string;
+  modality: string;
+}
+
+export const analyzeFilepathUniversal = (
+  filepath: string,
+  assignmentRules: any[],
+  filenameRules: any[],
+  modality: string = "mri"
+): FilepathAnalysis => {
+  const filename = filepath.split("/").pop()!;
+  const pathParts = filepath.split("/");
+  let subjectId: string | null = null;
+
+  // Priority 1: match glob patterns
+  for (const rule of assignmentRules) {
+    for (const pat of rule.match || []) {
+      if (matchGlobPattern(filepath, pat)) {
+        subjectId = rule.subject;
+        break;
+      }
+    }
+    if (subjectId) break;
+  }
+
+  // Priority 2: original substring match
+  if (!subjectId) {
+    for (const rule of assignmentRules) {
+      const orig: string = rule.original || "";
+      if (orig && filepath.toLowerCase().includes(orig.toLowerCase())) {
+        subjectId = rule.subject;
+        break;
+      }
+    }
+  }
+
+  // Priority 3: prefix match
+  if (!subjectId) {
+    for (const rule of assignmentRules) {
+      const pfx: string = rule.prefix || "";
+      if (pfx && filename.toLowerCase().startsWith(pfx.toLowerCase())) {
+        subjectId = rule.subject;
+        break;
+      }
+    }
+  }
+
+  // Priority 4: sub-XX already in path (label = alphanumerics only, so it
+  // stops at "_" and "sub-01_T1w.nii.gz" yields "01", not "01_T1w")
+  if (!subjectId) {
+    for (const part of pathParts) {
+      const m = part.match(/sub[_-]?([a-z0-9]+)/i);
+      if (m) {
+        subjectId = m[1];
+        break;
+      }
+    }
+  }
+
+  // Fallback
+  if (!subjectId) subjectId = "unknown";
+  // Strip accidental sub- prefix
+  if (subjectId.startsWith("sub-")) subjectId = subjectId.slice(4);
+
+  const scanInfo = inferScanType(filepath, filenameRules);
+  const ext = modality === "nirs" ? ".snirf" : ".nii.gz";
+  const bidsFilename = `sub-${subjectId}_${scanInfo.suffix}${ext}`;
+
+  return {
+    subject_id: subjectId,
+    scan_type_suffix: scanInfo.suffix,
+    bids_filename: bidsFilename,
+    subdirectory: scanInfo.subdirectory,
+    scan_category: scanInfo.category,
+    original_filepath: filepath,
+    modality,
+  };
+};
+
+// ============================================================================
+// validatePlanCoverage()
+// NEW — not in Python (Python validates at runtime, we validate at plan-time)
+//
+// Checks that the LLM's match patterns in BIDSPlan actually cover the
+// sample files from the evidence bundle. Warns about uncovered files.
+//
+// Used in plannerHelpers.ts after buildBidsPlan() to surface issues
+// before the user downloads the ZIP.
+// ============================================================================
+
+export interface PlanCoverageResult {
+  covered: string[];
+  uncovered: string[];
+  coveragePercent: number;
+  warnings: string[];
+}
+
+export const validatePlanCoverage = (
+  sampleFiles: string[],
+  mappings: any[]
+): PlanCoverageResult => {
+  // Number of uncovered paths that are spelled out in the warnings.
+  const MAX_LISTED = 5;
+
+  // A mapping claims a file when none of its exclude globs hit and at least
+  // one of its match globs does; a missing list behaves like an empty one.
+  const claims = (mapping: any, filepath: string): boolean => {
+    const excludes: string[] = mapping.exclude || [];
+    const patterns: string[] = mapping.match || [];
+    return (
+      !excludes.some((glob) => matchGlobPattern(filepath, glob)) &&
+      patterns.some((glob) => matchGlobPattern(filepath, glob))
+    );
+  };
+
+  // Partition the samples, keeping their input order inside each bucket.
+  const covered: string[] = [];
+  const uncovered: string[] = [];
+  sampleFiles.forEach((filepath) => {
+    const bucket = mappings.some((mapping) => claims(mapping, filepath))
+      ? covered
+      : uncovered;
+    bucket.push(filepath);
+  });
+
+  // One summary line, up to MAX_LISTED offenders, then a count of the rest.
+  const warnings: string[] = [];
+  const hidden = uncovered.length - MAX_LISTED;
+  if (uncovered.length > 0) {
+    warnings.push(
+      `${uncovered.length} sample file(s) not covered by any mapping pattern.`,
+      ...uncovered.slice(0, MAX_LISTED).map((f) => `  Uncovered: ${f}`)
+    );
+    if (hidden > 0) warnings.push(`  ... and ${hidden} more`);
+  }
+
+  // With no samples there is nothing left uncovered, so coverage is 100%.
+  const total = sampleFiles.length;
+  const coveragePercent =
+    total === 0 ? 100 : Math.round((covered.length / total) * 100);
+
+  return {
+    covered,
+    uncovered,
+    coveragePercent,
+    warnings,
+  };
+};
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts
index 76142c0..c3c89b0 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts
@@ -1,54 +1,60 @@
 // src/components/DatasetOrganizer/utils/fileAnalyzers.ts
+// VFS adapter layer because NeuroJSON.io needs to work with FileItem[] objects
+//  No single Python mirror. Functions map to:
+//   categorizeFile()       → executor.py (infer_subdirectory_from_suffix, categorize_scan_type)
+//   detectModality()       → evidence.py (detect_kind) + constants.py (MODALITY_*)
+//   getCountsByExtension() → evidence.py (by_ext dict construction)
+//   getUserContextText()   → evidence.py (_extract_document_content + documents[] assembly)
 import { FileItem } from "redux/projects/types/projects.interface";
 
-/**
- * Categorize a file based on its name and type
- * Returns detailed scan category (anatomical-T1w, functional-bold, etc.)
- */
+// ============================================================================
+// categorizeFile()
+// UI display function — determines file label/color in FileTree.
+//
+// NOT the same as inferScanType() in executorHelpers.ts:
+//   categorizeFile()  → "what to show in the UI"
+//   inferScanType()   → "what BIDS filename to generate"
+//
+// Partial mirror of executor.py → infer_subdirectory_from_suffix()
+//                               + categorize_scan_type()
+// ============================================================================
 export const categorizeFile = (file: FileItem): string => {
   const name = file.name.toLowerCase();
 
   // Functional scans (task-based)
-  if (name.includes("task-") && name.includes("bold")) {
-    return "functional-bold";
-  }
-  if (name.endsWith(".snirf")) {
-    return "functional-nirs";
-  }
-
+  if (name.includes("task-") && name.includes("bold")) return "functional-bold";
+  if (name.endsWith(".snirf")) return "functional-nirs";
   if (name.endsWith(".nirs")) return "functional-nirs";
   if (name.endsWith(".mat")) return "functional-nirs";
 
   // Anatomical scans
-  if (name.includes("t1w")) {
-    return "anatomical-T1w";
-  }
-  if (name.includes("t2w") || name.includes("inplanet2")) {
+  if (name.includes("t1w")) return "anatomical-T1w";
+  if (name.includes("t2w") || name.includes("inplanet2"))
     return "anatomical-T2w";
-  }
-  if (name.includes("flair")) {
-    return "anatomical-FLAIR";
-  }
-
+  if (name.includes("flair")) return "anatomical-FLAIR";
   if (name.endsWith(".dcm")) return "anatomical-dicom";
 
+  // JNIfTI — mirrors JNIFTI_EXT in constants.py: {'.jnii', '.bnii'}
+  if (name.endsWith(".jnii") || name.endsWith(".bnii"))
+    return "anatomical-jnifti";
+
   // Diffusion
-  if (name.includes("dwi") || name.includes("diffusion")) {
-    return "diffusion";
-  }
+  if (name.includes("dwi") || name.includes("diffusion")) return "diffusion";
 
   // Field maps
-  if (name.includes("fieldmap") || name.includes("fmap")) {
-    return "fieldmap";
-  }
+  if (name.includes("fieldmap") || name.includes("fmap")) return "fieldmap";
 
-  // Fall back to file type
+  // Array/HDF5 (non-SNIRF)
+  if (name.endsWith(".h5") || name.endsWith(".hdf5")) return "array";
+
+  // Fall back to fileType from fileProcessors.ts
   return file.fileType || "unknown";
 };
 
-/**
- * Detect modality from file collection
- */
+// ============================================================================
+// Detect modality from file collection
+// Rough equivalent of evidence.py → detect_kind() + constants.py MODALITY_*
+// ============================================================================
 export const detectModality = (files: FileItem[]): string => {
   const counts: Record<string, number> = {};
   files.forEach((f) => {
@@ -57,31 +63,29 @@ export const detectModality = (files: FileItem[]): string => {
   });
 
   if (counts.nifti > 0 || counts.dicom > 0) return "mri";
+  // FIX: fileProcessors.ts returns "nirs" for .nirs files, not "homer3"
   if (
     counts.hdf5 > 0 ||
     counts.matlab > 0 ||
-    counts.homer3 > 0 ||
+    counts.nirs > 0 ||
     files.some((f) => f.name.endsWith(".snirf"))
   )
     return "nirs";
   return "mixed";
 };
 
-/**
- * Get file extension counts
- */
+// ============================================================================
+// Get file extension counts
+// Mirrors evidence.py → by_ext dict construction.
+// Uses ".nii.gz" as a single key — mirrors Python: p.name.lower().endswith(".nii.gz")
+// ============================================================================
 export const getCountsByExtension = (
   files: FileItem[]
 ): Record<string, number> => {
   const counts: Record<string, number> = {};
-  // files.forEach((f) => {
-  //   const ext = f.fileType || "unknown";
-  //   counts[ext] = (counts[ext] || 0) + 1;
-  // });
   files
     .filter((f) => f.source === "user" && f.type === "file")
     .forEach((f) => {
-      // Mirror Python: use ".nii.gz" as a single key for .nii.gz files
       const name = f.name.toLowerCase();
       const ext = name.endsWith(".nii.gz")
         ? ".nii.gz"
@@ -91,9 +95,13 @@ export const getCountsByExtension = (
   return counts;
 };
 
-/**
- * Extract user context from metadata files
- */
+// ============================================================================
+// Extract user context from metadata files
+// Partial mirror of evidence.py → _extract_document_content() +
+// the documents[] assembly in _build_evidence_bundle_internal().
+//
+// Python reads files from disk; this reads from VFS FileItem.content.
+// ============================================================================
 export const getUserContextText = (files: FileItem[]): string => {
   const readme = files.find((f) => f.name.toLowerCase().includes("readme"));
   const instructions = files.find(
@@ -130,243 +138,3 @@ export const getUserContextText = (files: FileItem[]): string => {
   });
   return parts.join("\n\n");
 };
-
-/** (not using yet)
- * Analyze filename patterns to detect subjects
- * (Simplified version inspired by auto-bidsify's filename_tokenizer)
- */
-export const analyzeFilenamePatterns = (
-  files: FileItem[]
-): {
-  subjectCount: number;
-  subjectIds: string[];
-  hasRunNumbers: boolean;
-  hasTaskNames: boolean;
-} => {
-  const dataFiles = files.filter((f) => f.type === "file" && !f.isUserMeta);
-  const subjectIds = new Set<string>();
-  let hasRunNumbers = false;
-  let hasTaskNames = false;
-
-  dataFiles.forEach((f) => {
-    const name = f.name;
-
-    // Extract subject ID (sub-01, sub-02, etc.)
-    const subMatch = name.match(/sub-(\d+)/i);
-    if (subMatch) {
-      subjectIds.add(subMatch[1]);
-    }
-
-    // Check for run numbers
-    if (name.includes("_run-")) {
-      hasRunNumbers = true;
-    }
-
-    // Check for task names
-    if (name.includes("task-")) {
-      hasTaskNames = true;
-    }
-  });
-
-  return {
-    subjectCount: subjectIds.size,
-    subjectIds: Array.from(subjectIds).sort(),
-    hasRunNumbers,
-    hasTaskNames,
-  };
-};
-
-// add to fileAnalyzers.ts
-
-// export interface SubjectRecord {
-//   original_id: string;
-//   numeric_id: string;
-//   site: string | null;
-//   pattern_name: string;
-//   file_count: number;
-// }
-
-// export interface SubjectAnalysis {
-//   success: boolean;
-//   method: string;
-//   subject_records: SubjectRecord[];
-//   subject_count: number;
-//   has_site_info: boolean;
-//   variants_by_subject: Record<string, any>;
-//   python_generated_filename_rules: any[];
-//   id_mapping: {
-//     id_mapping: Record<string, string>;
-//     reverse_mapping: Record<string, string>;
-//     strategy_used: string;
-//     metadata_columns: string[];
-//   };
-// }
-
-// // mirrors _extract_subjects_from_directory_structure
-// const extractFromDirectoryStructure = (
-//   allFiles: string[]
-// ): Omit<SubjectAnalysis, "id_mapping"> | null => {
-//   const patterns: Array<[RegExp, boolean, number, number | null, string]> = [
-//     [/^([A-Za-z]+)_sub(\d+)$/i, true, 2, 1, "site_prefixed"],
-//     [/^sub-(\d+)$/i, false, 1, null, "standard_bids"],
-//     [/^subject[_-]?(\d+)$/i, false, 1, null, "simple"],
-//     [/^(\d{3,})$/, false, 1, null, "numeric_only"],
-//   ];
-
-//   const subjectRecords: SubjectRecord[] = [];
-//   const seenIds = new Set<string>();
-
-//   for (const filepath of allFiles) {
-//     const parts = filepath.split("/");
-//     for (const part of parts.slice(0, 2)) {
-//       for (const [
-//         regex,
-//         hasSite,
-//         idGroup,
-//         siteGroup,
-//         patternName,
-//       ] of patterns) {
-//         const match = part.match(regex);
-//         if (match) {
-//           const originalId = match[0];
-//           if (seenIds.has(originalId)) break;
-//           seenIds.add(originalId);
-//           subjectRecords.push({
-//             original_id: originalId,
-//             numeric_id: match[idGroup],
-//             site: hasSite && siteGroup ? match[siteGroup] : null,
-//             pattern_name: patternName,
-//             file_count: 0,
-//           });
-//           break;
-//         }
-//       }
-//     }
-//   }
-
-//   if (subjectRecords.length === 0) return null;
-
-//   subjectRecords.sort((a, b) => {
-//     const na = parseInt(a.numeric_id) || 0;
-//     const nb = parseInt(b.numeric_id) || 0;
-//     return na - nb;
-//   });
-
-//   return {
-//     success: true,
-//     method: "directory_structure",
-//     subject_records: subjectRecords,
-//     subject_count: subjectRecords.length,
-//     has_site_info: subjectRecords.some((r) => r.site !== null),
-//     variants_by_subject: {},
-//     python_generated_filename_rules: [],
-//   };
-// };
-
-// // mirrors _extract_subjects_from_flat_filenames
-// const extractFromFlatFilenames = (
-//   allFiles: string[]
-// ): Omit<SubjectAnalysis, "id_mapping"> | null => {
-//   const identifierToFiles: Record<string, string[]> = {};
-
-//   for (const filepath of allFiles) {
-//     const filename = filepath.split("/").pop() || "";
-//     const nameNoExt = filename
-//       .replace(/\.[^/.]+$/, "")
-//       .replace(/\.nii\.gz$/, "");
-//     const match = nameNoExt.match(/^([A-Za-z0-9\-]+)/);
-//     if (match) {
-//       const identifier = match[1];
-//       if (!identifierToFiles[identifier]) identifierToFiles[identifier] = [];
-//       identifierToFiles[identifier].push(filepath);
-//     }
-//   }
-
-//   if (Object.keys(identifierToFiles).length === 0) return null;
-
-//   const extractNumeric = (id: string): number => {
-//     const nums = id.match(/\d+/g);
-//     return nums ? parseInt(nums[nums.length - 1]) : 999999;
-//   };
-
-//   const sortedIdentifiers = Object.keys(identifierToFiles).sort(
-//     (a, b) => extractNumeric(a) - extractNumeric(b)
-//   );
-
-//   const subjectRecords: SubjectRecord[] = sortedIdentifiers.map((id, i) => ({
-//     original_id: id,
-//     numeric_id: String(i + 1),
-//     site: null,
-//     pattern_name: "dominant_prefix",
-//     file_count: identifierToFiles[id].length,
-//   }));
-
-//   return {
-//     success: true,
-//     method: "dominant_prefix_fallback",
-//     subject_records: subjectRecords,
-//     subject_count: subjectRecords.length,
-//     has_site_info: false,
-//     variants_by_subject: {},
-//     python_generated_filename_rules: [],
-//   };
-// };
-
-// // mirrors _generate_subject_id_mapping
-// const generateIdMapping = (
-//   subjectInfo: Omit<SubjectAnalysis, "id_mapping">
-// ): SubjectAnalysis["id_mapping"] => {
-//   const records = subjectInfo.subject_records;
-//   const idMapping: Record<string, string> = {};
-//   const reverseMapping: Record<string, string> = {};
-
-//   // detect already-BIDS format (sub-01, sub-02...)
-//   const allAlreadyBids = records.every((r) => /^sub-\w+$/i.test(r.original_id));
-
-//   if (allAlreadyBids) {
-//     for (const rec of records) {
-//       const bidsId = rec.original_id.replace(/^sub-/i, "");
-//       idMapping[rec.original_id] = bidsId;
-//       reverseMapping[bidsId] = rec.original_id;
-//     }
-//     return {
-//       id_mapping: idMapping,
-//       reverse_mapping: reverseMapping,
-//       strategy_used: "already_bids",
-//       metadata_columns: [],
-//     };
-//   }
-
-//   // numeric strategy
-//   for (let i = 0; i < records.length; i++) {
-//     const orig = records[i].original_id;
-//     const bidsId = String(i + 1);
-//     idMapping[orig] = bidsId;
-//     reverseMapping[bidsId] = orig;
-//   }
-
-//   return {
-//     id_mapping: idMapping,
-//     reverse_mapping: reverseMapping,
-//     strategy_used: "numeric",
-//     metadata_columns: ["original_id"],
-//   };
-// };
-
-// // main export — call this from llmHelpers
-// export const extractSubjectAnalysis = (allFiles: string[]): SubjectAnalysis => {
-//   const fromDir = extractFromDirectoryStructure(allFiles);
-//   const base = fromDir ??
-//     extractFromFlatFilenames(allFiles) ?? {
-//       success: false,
-//       method: "none",
-//       subject_records: [],
-//       subject_count: 0,
-//       has_site_info: false,
-//       variants_by_subject: {},
-//       python_generated_filename_rules: [],
-//     };
-
-//   const idMapping = generateIdMapping(base);
-//   return { ...base, id_mapping: idMapping };
-// };
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
index 4708c13..24aa930 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
@@ -1,6 +1,6 @@
 // src/components/DatasetOrganizer/utils/filenameTokenizer.ts
-// Port of autobidsify's filename_tokenizer.py
-// Philosophy: Python stats → dominant prefixes → subject IDs (no LLM needed for this part)
+// Mirrors filename_tokenizer.py
+
 export interface SubjectRecord {
   original_id: string;
   numeric_id: string;
@@ -52,40 +52,21 @@ const COMMON_WORDS = new Set([
   "experiment",
 ]);
 
+const DATA_EXTENSIONS =
+  /\.(snirf|nii|nii\.gz|dcm|mat|nirs|jnii|bnii|h5|hdf5|edf|bdf)$/i;
+
 // ============================================================================
-// FilenameTokenizer — mirrors FilenameTokenizer class in filename_tokenizer.py
+// FilenamePatternAnalyzer — mirrors FilenameTokenizer class
 // ============================================================================
-
-/**
- * Advanced split: CamelCase + number boundaries
- * "VHMCT" → ["VHM", "CT"]
- * "CT1mm" → ["CT", "1", "mm"]
- * "sub82352" → ["sub", "82352"]
- */
-const splitAdvanced = (text: string): string[] => {
-  if (!text) return [];
-
-  // Keep known neuroimaging terms together
-  if (NEUROIMAGING_TERMS.has(text)) return [text];
-
-  // Split on type boundaries:
-  // - Uppercase sequence before uppercase+lowercase: "VHM" before "CT"
-  // - CamelCase: uppercase followed by lowercase
-  // - Letter/digit boundaries
-  const pattern = /([A-Z]+(?=[A-Z][a-z]|\b|[0-9])|[A-Z][a-z]+|[a-z]+|[0-9]+)/g;
-  const tokens = text.match(pattern) || [];
-  return tokens.filter((t) => t.length > 0);
-};
-
-/**
+/*
  * Tokenize a filename into meaningful tokens.
- * Mirrors FilenameTokenizer.tokenize() in filename_tokenizer.py
  *
  * Examples:
  *   "VHMCT1mm-Hip (134).dcm" → ["VHM", "CT", "1", "mm", "Hip", "134"]
  *   "Beijing_sub82352"       → ["Beijing", "sub", "82352"]
  *   "scan_001_T1w.nii"       → ["scan", "001", "T1w"]
  */
+
 export const tokenizeFilename = (filename: string): string[] => {
   // Step 1: Remove all extensions (up to 6 chars)
   let name = filename;
@@ -111,28 +92,60 @@ export const tokenizeFilename = (filename: string): string[] => {
   return tokens.filter((t) => t.trim().length >= 1);
 };
 
+/*
+ * Advanced split: CamelCase + number boundaries
+ * "VHMCT" → ["VHM", "CT"]
+ * "CT1mm" → ["CT", "1", "mm"]
+ * "sub82352" → ["sub", "82352"]
+ */
+const splitAdvanced = (text: string): string[] => {
+  if (!text) return [];
+
+  // Keep known neuroimaging terms together
+  if (NEUROIMAGING_TERMS.has(text)) return [text];
+
+  // Split on type boundaries:
+  // - Uppercase sequence before uppercase+lowercase: "VHM" before "CT"
+  // - CamelCase: uppercase followed by lowercase
+  // - Letter/digit boundaries
+  const pattern = /([A-Z]+(?=[A-Z][a-z]|\b|[0-9])|[A-Z][a-z]+|[a-z]+|[0-9]+)/g;
+  const tokens = text.match(pattern) || [];
+  return tokens.filter((t) => t.length > 0);
+};
+
 // ============================================================================
 // FilenamePatternAnalyzer — mirrors FilenamePatternAnalyzer class
 // ============================================================================
 
+interface TokenStatistics {
+  totalFiles: number;
+  tokenFrequency: Record<string, number>;
+  prefixFrequency: Record<string, number>;
+  dominantPrefixes: DominantPrefix[];
+  tokenPositions: Record<number, Record<string, number>>; // NEW — mirrors token_positions
+  insights: string[]; // NEW — mirrors _generate_insights()
+  uniqueTokenCount: number; // NEW
+  uniquePrefixCount: number; // NEW
+}
+
 interface DominantPrefix {
   prefix: string;
   count: number;
   percentage: number;
 }
 
-interface TokenStatistics {
-  totalFiles: number;
-  tokenFrequency: Record<string, number>;
-  prefixFrequency: Record<string, number>;
-  dominantPrefixes: DominantPrefix[];
+interface LLMPayload {
+  task: string;
+  statistics: TokenStatistics;
+  filenameSamples: string[];
+  userHints: Record<string, any>;
+  instructions: string;
 }
 
-/**
- * Find dominant prefixes — tokens appearing in >5% of files
- * that are not common words.
- * Mirrors FilenamePatternAnalyzer._find_dominant_prefixes()
- */
+// ─────────────────────────────────────────────────────────────────────────────
+// Mirrors FilenamePatternAnalyzer._find_dominant_prefixes()
+// ─────────────────────────────────────────────────────────────────────────────
+
 const findDominantPrefixes = (
   prefixCounter: Record<string, number>,
   totalFiles: number
@@ -154,18 +167,109 @@ const findDominantPrefixes = (
     }));
 };
 
-/**
- * Analyze token statistics across all filenames.
- * Mirrors FilenamePatternAnalyzer.analyze_token_statistics()
- */
+// ─────────────────────────────────────────────────────────────────────────────
+// _generate_insights()
+// Mirrors FilenamePatternAnalyzer._generate_insights()
+// ─────────────────────────────────────────────────────────────────────────────
+
+const generateInsights = (
+  allTokens: Record<string, number>,
+  prefixTokens: Record<string, number>,
+  dominantPrefixes: DominantPrefix[]
+): string[] => {
+  const insights: string[] = [];
+  const uniqueTokenCount = Object.keys(allTokens).length;
+
+  // Insight 1: token diversity
+  if (uniqueTokenCount < 20) {
+    insights.push(
+      `Low token diversity: only ${uniqueTokenCount} unique tokens across all files`
+    );
+  } else if (uniqueTokenCount > 100) {
+    insights.push(
+      `High token diversity: ${uniqueTokenCount} unique tokens detected`
+    );
+  }
+
+  // Insight 2: prefix distribution
+  if (dominantPrefixes.length === 0) {
+    insights.push("No dominant filename prefixes detected");
+  } else if (dominantPrefixes.length === 1) {
+    const p = dominantPrefixes[0];
+    insights.push(
+      `Single dominant prefix '${p.prefix}' in ${p.percentage}% of files`
+    );
+  } else if (dominantPrefixes.length === 2) {
+    const [p1, p2] = dominantPrefixes;
+    insights.push(
+      `Two major prefixes detected: '${p1.prefix}' (${p1.percentage}%) and '${p2.prefix}' (${p2.percentage}%)`
+    );
+  } else {
+    insights.push(
+      `${dominantPrefixes.length} dominant prefixes detected, suggesting possible subject groupings`
+    );
+  }
+
+  // Insight 3: most common tokens
+  const topTokens = Object.entries(allTokens)
+    .sort((a, b) => b[1] - a[1])
+    .slice(0, 3);
+  if (topTokens.length > 0) {
+    const commonList = topTokens.map(([t, c]) => `'${t}' (${c})`).join(", ");
+    insights.push(`Most frequent tokens: ${commonList}`);
+  }
+
+  return insights;
+};
+
+// ─────────────────────────────────────────────────────────────────────────────
+// _sample_diverse_filenames()
+// Mirrors FilenamePatternAnalyzer._sample_diverse_filenames()
+// ─────────────────────────────────────────────────────────────────────────────
+
+const sampleDiverseFilenames = (
+  filenames: string[],
+  maxSamples: number = 30
+): string[] => {
+  if (filenames.length <= maxSamples) return [...filenames].sort();
+
+  // Group by first token (mirrors Python: prefix_groups[prefix].append(filename))
+  const prefixGroups: Record<string, string[]> = {};
+  for (const filename of filenames) {
+    const tokens = tokenizeFilename(filename);
+    const prefix = tokens.length > 0 ? tokens[0] : "none";
+    if (!prefixGroups[prefix]) prefixGroups[prefix] = [];
+    prefixGroups[prefix].push(filename);
+  }
+
+  const groupCount = Object.keys(prefixGroups).length;
+  const samplesPerGroup = Math.max(1, Math.floor(maxSamples / groupCount));
+
+  const samples: string[] = [];
+  for (const prefix of Object.keys(prefixGroups).sort()) {
+    const groupFiles = prefixGroups[prefix];
+    const n = Math.min(groupFiles.length, samplesPerGroup);
+    samples.push(...[...groupFiles].sort().slice(0, n));
+    if (samples.length >= maxSamples) break;
+  }
+
+  return samples.slice(0, maxSamples);
+};
+
+// ─────────────────────────────────────────────────────────────────────────────
+// analyze_token_statistics()
+// Mirrors FilenamePatternAnalyzer.analyze_token_statistics()
+// ─────────────────────────────────────────────────────────────────────────────
+
 export const analyzeTokenStatistics = (
   filenames: string[]
 ): TokenStatistics => {
   const allTokens: Record<string, number> = {};
-  const prefixTokens: Record<string, number> = {}; // first token only
+  const prefixTokens: Record<string, number> = {};
+  const positionTokens: Record<number, Record<string, number>> = {};
 
   for (const filename of filenames) {
-    // Extract just filename from path
+    // Mirror Python __init__: strip to just filename if path provided
     const fname = filename.includes("/")
       ? filename.split("/").pop()!
       : filename;
@@ -177,23 +281,331 @@ export const analyzeTokenStatistics = (
       allTokens[token] = (allTokens[token] || 0) + 1;
     }
 
-    // CRITICAL: use first TOKEN as prefix (not regex match)
+    // CRITICAL: use first TOKEN as prefix (not regex)
     if (tokens.length > 0) {
       const firstToken = tokens[0];
       prefixTokens[firstToken] = (prefixTokens[firstToken] || 0) + 1;
     }
+
+    // NEW: count tokens by position — mirrors position_tokens[i][token] += 1
+    tokens.forEach((token, i) => {
+      if (!positionTokens[i]) positionTokens[i] = {};
+      positionTokens[i][token] = (positionTokens[i][token] || 0) + 1;
+    });
+  }
+
+  // Cap frequencies — mirrors .most_common(50) / .most_common(20)
+  const tokenFrequency = Object.fromEntries(
+    Object.entries(allTokens)
+      .sort((a, b) => b[1] - a[1])
+      .slice(0, 50)
+  );
+  const prefixFrequency = Object.fromEntries(
+    Object.entries(prefixTokens)
+      .sort((a, b) => b[1] - a[1])
+      .slice(0, 20)
+  );
+
+  // Cap each position bucket at top 10 — mirrors .most_common(10)
+  const tokenPositions: Record<number, Record<string, number>> = {};
+  for (const [pos, counter] of Object.entries(positionTokens)) {
+    tokenPositions[Number(pos)] = Object.fromEntries(
+      Object.entries(counter)
+        .sort((a, b) => b[1] - a[1])
+        .slice(0, 10)
+    );
   }
 
   const dominantPrefixes = findDominantPrefixes(prefixTokens, filenames.length);
+  const insights = generateInsights(allTokens, prefixTokens, dominantPrefixes);
 
   return {
     totalFiles: filenames.length,
-    tokenFrequency: allTokens,
-    prefixFrequency: prefixTokens,
+    tokenFrequency,
+    prefixFrequency,
     dominantPrefixes,
+    tokenPositions, // NEW
+    insights, // NEW
+    uniqueTokenCount: Object.keys(allTokens).length, // NEW
+    uniquePrefixCount: Object.keys(prefixTokens).length, // NEW
+  };
+};
+
+// ─────────────────────────────────────────────────────────────────────────────
+// build_llm_payload()
+// Mirrors FilenamePatternAnalyzer.build_llm_payload()
+// ─────────────────────────────────────────────────────────────────────────────
+
+export const buildLLMPayload = (
+  filenames: string[],
+  userHints: Record<string, any>,
+  maxSamples: number = 30
+): LLMPayload => {
+  const stats = analyzeTokenStatistics(filenames);
+  const filenameSamples = sampleDiverseFilenames(filenames, maxSamples);
+
+  return {
+    task: "subject_identification",
+    statistics: stats,
+    filenameSamples,
+    userHints,
+    instructions:
+      "Analyze the filename token statistics and samples. " +
+      "Determine how to group files by subject. " +
+      "The 'dominant_prefixes' may indicate subject identifiers. " +
+      "The 'insights' provide observations. " +
+      "User hint 'n_subjects' can help validate your hypothesis.",
+  };
+};
+
+/**
+ * Analyze token statistics across all filenames.
+ * Mirrors FilenamePatternAnalyzer.analyze_token_statistics()
+ */
+// export const analyzeTokenStatistics = (
+//   filenames: string[]
+// ): TokenStatistics => {
+//   const allTokens: Record<string, number> = {};
+//   const prefixTokens: Record<string, number> = {}; // first token only
+
+//   for (const filename of filenames) {
+//     // Extract just filename from path
+//     const fname = filename.includes("/")
+//       ? filename.split("/").pop()!
+//       : filename;
+
+//     const tokens = tokenizeFilename(fname);
+
+//     // Count all tokens
+//     for (const token of tokens) {
+//       allTokens[token] = (allTokens[token] || 0) + 1;
+//     }
+
+//     // CRITICAL: use first TOKEN as prefix (not regex match)
+//     if (tokens.length > 0) {
+//       const firstToken = tokens[0];
+//       prefixTokens[firstToken] = (prefixTokens[firstToken] || 0) + 1;
+//     }
+//   }
+
+//   const dominantPrefixes = findDominantPrefixes(prefixTokens, filenames.length);
+
+//   return {
+//     totalFiles: filenames.length,
+//     tokenFrequency: allTokens,
+//     prefixFrequency: prefixTokens,
+//     dominantPrefixes,
+//   };
+// };
+
+/*
+ * Find dominant prefixes — tokens appearing in >5% of files
+ * that are not common words.
+ * Mirrors FilenamePatternAnalyzer._find_dominant_prefixes()
+ */
+// const findDominantPrefixes = (
+//   prefixCounter: Record<string, number>,
+//   totalFiles: number
+// ): DominantPrefix[] => {
+//   const threshold = totalFiles * 0.05; // 5% threshold
+
+//   return Object.entries(prefixCounter)
+//     .filter(([prefix, count]) => {
+//       if (count < threshold) return false;
+//       if (COMMON_WORDS.has(prefix.toLowerCase())) return false;
+//       return true;
+//     })
+//     .sort((a, b) => b[1] - a[1])
+//     .slice(0, 20)
+//     .map(([prefix, count]) => ({
+//       prefix,
+//       count,
+//       percentage: Math.round((count / totalFiles) * 1000) / 10,
+//     }));
+// };
+
+// ============================================================================
+// Integration Functions
+// Mirrors analyze_filenames_for_subjects() + _generate_recommendation() in filename_tokenizer.py
+// ============================================================================
+
+export interface FilenameAnalysisResult {
+  python_statistics: TokenStatistics;
+  llm_payload: LLMPayload;
+  confidence: "high" | "medium" | "low" | "none";
+  recommendation: string;
+}
+
+/**
+ * Main entry point: analyze filenames to detect subject groupings.
+ * Mirrors analyze_filenames_for_subjects() in filename_tokenizer.py
+ *
+ * Called from buildEvidenceBundle() in llmHelpers.ts — replaces the
+ * manual filenameAnalysis block that was built inline there.
+ */
+export const analyzeFilenamesForSubjects = (
+  allFiles: string[],
+  userHints: Record<string, any>
+): FilenameAnalysisResult => {
+  // Mirror Python: extract just filenames, not full paths
+  const filenames = allFiles.map((f) =>
+    f.includes("/") ? f.split("/").pop()! : f
+  );
+
+  const stats = analyzeTokenStatistics(filenames);
+  const llmPayload = buildLLMPayload(filenames, userHints, 30);
+
+  // Assess confidence — mirrors Python confidence logic exactly
+  const dominantCount = stats.dominantPrefixes.length;
+  const userNSubjects: number | null = userHints?.n_subjects ?? null;
+
+  let confidence: "high" | "medium" | "low" | "none" = "none";
+  if (dominantCount > 0) {
+    if (userNSubjects && dominantCount === userNSubjects) {
+      confidence = "high";
+    } else if (dominantCount >= 2 && dominantCount <= 10) {
+      confidence = "medium";
+    } else {
+      confidence = "low";
+    }
+  }
+
+  const recommendation = generateRecommendation(stats, userHints);
+
+  return {
+    python_statistics: stats,
+    llm_payload: llmPayload,
+    confidence,
+    recommendation,
   };
 };
 
+/**
+ * Mirrors _generate_recommendation() in filename_tokenizer.py
+ */
+const generateRecommendation = (
+  stats: TokenStatistics,
+  userHints: Record<string, any>
+): string => {
+  const dominantPrefixes = stats.dominantPrefixes;
+  const userNSubjects: number | null = userHints?.n_subjects ?? null;
+
+  if (dominantPrefixes.length === 0) {
+    return (
+      "No clear filename patterns detected. " +
+      "Recommend using --describe to explain subject identification."
+    );
+  }
+
+  if (userNSubjects && dominantPrefixes.length === userNSubjects) {
+    const prefixesStr = dominantPrefixes.map((p) => p.prefix).join(", ");
+    return (
+      `HIGH CONFIDENCE: Detected ${dominantPrefixes.length} dominant prefixes ` +
+      `(${prefixesStr}) matching user hint of ${userNSubjects} subjects.`
+    );
+  }
+
+  if (dominantPrefixes.length >= 2 && dominantPrefixes.length <= 5) {
+    return (
+      `MEDIUM CONFIDENCE: Detected ${dominantPrefixes.length} potential subject groups. ` +
+      `Will send to LLM for validation.`
+    );
+  }
+
+  return (
+    `LOW CONFIDENCE: Found ${dominantPrefixes.length} prefix patterns, ` +
+    `which may or may not represent subjects. LLM will analyze.`
+  );
+};
+
+// ============================================================================
+// SubjectGroupingDecision
+// Mirrors SubjectGroupingDecision class in filename_tokenizer.py
+// Not used in runtime flow — used as typed helpers when parsing LLM responses
+// ============================================================================
+
+export interface PrefixMappingDecision {
+  method: "prefix_based";
+  description: string;
+  rules: Array<{
+    prefix: string;
+    maps_to_subject: string;
+    match_pattern: string;
+  }>;
+  participant_metadata: Record<string, Record<string, any>>;
+}
+
+export interface SequentialAssignmentDecision {
+  method: "sequential";
+  n_subjects: number;
+  note: string;
+}
+
+export interface BlockingQuestionDecision {
+  method: "blocked";
+  reason: string;
+  question: {
+    type: string;
+    severity: string;
+    message: string;
+    options: string[];
+  };
+}
+
+export type SubjectGroupingDecision =
+  | PrefixMappingDecision
+  | SequentialAssignmentDecision
+  | BlockingQuestionDecision;
+
+/**
+ * Mirrors SubjectGroupingDecision.create_prefix_mapping()
+ */
+export const createPrefixMapping = (
+  prefixToSubject: Record<string, string>,
+  metadata?: Record<string, Record<string, any>>
+): PrefixMappingDecision => ({
+  method: "prefix_based",
+  description: `Files grouped by ${
+    Object.keys(prefixToSubject).length
+  } filename prefixes`,
+  rules: Object.entries(prefixToSubject).map(([prefix, subjId]) => ({
+    prefix,
+    maps_to_subject: subjId,
+    match_pattern: `${prefix}*`,
+  })),
+  participant_metadata: metadata ?? {},
+});
+
+/**
+ * Mirrors SubjectGroupingDecision.create_sequential_assignment()
+ */
+export const createSequentialAssignment = (
+  nSubjects: number
+): SequentialAssignmentDecision => ({
+  method: "sequential",
+  n_subjects: nSubjects,
+  note:
+    "No clear subject grouping pattern detected in filenames. " +
+    "Assigning sequential IDs based on file order or user hint.",
+});
+
+/**
+ * Mirrors SubjectGroupingDecision.create_blocking_question()
+ */
+export const createBlockingQuestion = (
+  reason: string,
+  options: string[]
+): BlockingQuestionDecision => ({
+  method: "blocked",
+  reason,
+  question: {
+    type: "subject_grouping",
+    severity: "block",
+    message: reason,
+    options,
+  },
+});
+
 // ============================================================================
 // extractSubjectAnalysis — mirrors build_bids_plan()'s subject extraction
 // ============================================================================
@@ -495,7 +907,6 @@ const extractFromDirectoryStructure = (
   };
 };
 
-const DATA_EXTENSIONS = /\.(snirf|nii|nii\.gz|dcm|mat|nirs|h5|hdf5|edf|bdf)$/i;
 const TRIO_FILENAMES = new Set([
   "dataset_description.json",
   "participants.tsv",
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
new file mode 100644
index 0000000..e69de29

From edb2a8f9b4291eb30e91a79dbefad237e123378b Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 3 Apr 2026 17:40:39 -0400
Subject: [PATCH 06/61] feat: reorganize the code for integrated autobidsify

---
 package.json                                  |    1 +
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 1384 ++++++++---------
 .../DatasetOrganizer/utils/fileAnalyzers.ts   |  205 ++-
 .../DatasetOrganizer/utils/fileProcessors.ts  |   68 +-
 .../utils/filenameTokenizer.ts                |  588 -------
 .../Dashboard/DatasetOrganizer/utils/llm.ts   |  963 ++++++++++++
 .../DatasetOrganizer/utils/llmHelpers.ts      |  983 +++++++-----
 .../DatasetOrganizer/utils/llmPrompts.ts      |  619 +-------
 .../DatasetOrganizer/utils/plannerHelpers.ts  |  870 +++++++++++
 .../DatasetOrganizer/utils/trioHelpers.ts     |  762 +++++++++
 src/services/ollama.service.ts                |   17 +-
 yarn.lock                                     |    5 +
 12 files changed, 4221 insertions(+), 2244 deletions(-)
 create mode 100644 src/components/User/Dashboard/DatasetOrganizer/utils/llm.ts
 create mode 100644 src/components/User/Dashboard/DatasetOrganizer/utils/trioHelpers.ts

diff --git a/package.json b/package.json
index 1f8144e..6f414ef 100644
--- a/package.json
+++ b/package.json
@@ -63,6 +63,7 @@
   "devDependencies": {
     "@babel/plugin-proposal-private-property-in-object": "^7.21.11",
     "@trivago/prettier-plugin-sort-imports": "^4.2.0",
+    "@types/js-yaml": "^4.0.9",
     "@types/node": "^20.5.7",
     "@types/pako": "^2.0.3",
     "@typescript-eslint/eslint-plugin": "^5.31.0",
diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index a8fd052..9658ec6 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -1,23 +1,12 @@
 import { generateId } from "./utils/fileProcessors";
-import { extractSubjectAnalysis } from "./utils/filenameTokenizer";
-//add
+import { LLMConfig } from "./utils/llm";
 import {
-  buildFileSummary,
-  analyzeFilePatterns,
-  getUserContext,
-  getFileAnnotations,
-  downloadJSON,
   buildEvidenceBundle,
-  extractSubjectsFromFiles,
   buildIngestInfo,
+  downloadJSON,
 } from "./utils/llmHelpers";
-import {
-  getDatasetDescriptionPrompt,
-  getReadmePrompt,
-  getParticipantsPrompt,
-  getConversionScriptPrompt,
-  getBIDSPlanPrompt,
-} from "./utils/llmPrompts";
+import { buildBidsPlan } from "./utils/plannerHelpers";
+import { generateTrioFiles } from "./utils/trioHelpers";
 import {
   Close,
   ContentCopy,
@@ -40,10 +29,12 @@ import {
   Alert,
 } from "@mui/material";
 import { Colors } from "design/theme";
+import { dump as yamlDump } from "js-yaml";
 import JSZip from "jszip";
 import React, { useState, useEffect } from "react";
 import { FileItem } from "redux/projects/types/projects.interface";
-import { OllamaService } from "services/ollama.service";
+
+// import { OllamaService } from "services/ollama.service";
 
 interface LLMPanelProps {
   files: FileItem[];
@@ -158,6 +149,16 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
   const [panelHeight, setPanelHeight] = useState<number>(450);
   const [isResizing, setIsResizing] = useState(false);
 
+  // Build the LLMConfig handed to helper calls (e.g. as `llmConfig` to generateTrioFiles) — mirrors autobidsify CLI arg assembly
+  const buildLLMConfig = (): LLMConfig => ({
+    provider, // provider, model and apiKey are read from the enclosing component scope at call time
+    model,
+    apiKey,
+    baseUrl: currentProvider.baseUrl, // endpoint and flags are taken from the currentProvider entry
+    isAnthropic: currentProvider.isAnthropic,
+    noApiKey: currentProvider.noApiKey,
+  });
+
   // ========================================================================
   // BUTTON 1: GENERATE EVIDENCE BUNDLE
   // ========================================================================
@@ -202,406 +203,27 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
       setError("Please generate evidence bundle first");
       return;
     }
-
     if (!currentProvider.noApiKey && !apiKey.trim()) {
       setError("Please enter an API key");
       return;
     }
 
-    // Create abort controller
     const controller = new AbortController();
     setAbortController(controller);
-
     setGeneratingTrio(true);
     setError(null);
     setStatus("Generating BIDS trio files...");
 
     try {
-      const userText = evidenceBundle.user_hints.user_text || "";
-
-      // ==========================================
-      // Call 1: Generate dataset_description.json
-      // ==========================================
-      let datasetDesc: any;
-      if (evidenceBundle.trio_found?.["dataset_description.json"]) {
-        setStatus("1/3 dataset_description.json already exists, skipping...");
-        const existing = files.find(
-          (f) => f.source === "user" && f.name === "dataset_description.json"
-        );
-        datasetDesc = existing?.content ? JSON.parse(existing.content) : {};
-      } else {
-        setStatus("1/3 Generating dataset_description.json...");
-        const ddPrompt = getDatasetDescriptionPrompt(userText, evidenceBundle);
-
-        let ddResponse;
-        if (currentProvider.isAnthropic) {
-          ddResponse = await fetch(currentProvider.baseUrl, {
-            method: "POST",
-            signal: controller.signal,
-            headers: {
-              "Content-Type": "application/json",
-              "x-api-key": apiKey,
-              "anthropic-version": "2023-06-01",
-            },
-            body: JSON.stringify({
-              model,
-              max_tokens: 2048,
-              messages: [{ role: "user", content: ddPrompt }],
-            }),
-          });
-        } else if (provider === "ollama") {
-          // const ollamaBaseUrl = ollamaUrl || "http://localhost:11434";
-          // ddResponse = await fetch(`${ollamaBaseUrl}/v1/chat/completions`, {
-          //   method: "POST",
-          //   signal: controller.signal,
-          //   headers: { "Content-Type": "application/json" },
-          //   body: JSON.stringify({
-          //     model,
-          //     messages: [{ role: "user", content: ddPrompt }],
-          //     stream: false,
-          //   }),
-          // });
-          ddResponse = await OllamaService.chat(model, [
-            { role: "user", content: ddPrompt },
-          ]);
-        } else {
-          ddResponse = await fetch(currentProvider.baseUrl, {
-            method: "POST",
-            signal: controller.signal,
-            headers: {
-              "Content-Type": "application/json",
-              Authorization: `Bearer ${apiKey}`,
-            },
-            body: JSON.stringify({
-              model,
-              messages: [{ role: "user", content: ddPrompt }],
-              max_tokens: 2048,
-            }),
-          });
-        }
-
-        // const ddData = await ddResponse.json();
-        const ddData =
-          provider === "ollama" ? ddResponse : await ddResponse.json();
-        let ddText = currentProvider.isAnthropic
-          ? ddData.content[0].text
-          : ddData.choices[0].message.content;
-
-        // Clean up markdown fences
-        ddText = ddText
-          .replace(/^```json\n?/g, "")
-          .replace(/\n?```$/g, "")
-          .trim();
-        datasetDesc = JSON.parse(ddText);
-      }
-
-      // ==========================================
-      // Call 2: Generate README.md
-      // ==========================================
-      let readmeContent: string;
-      if (evidenceBundle.trio_found?.["README.md"]) {
-        setStatus("2/3 README.md already exists, skipping...");
-        const existing = files.find(
-          (f) =>
-            f.source === "user" &&
-            ["README.md", "README.txt", "README.rst", "readme.md"].includes(
-              f.name
-            )
-        );
-        readmeContent = existing?.content || "";
-      } else {
-        setStatus("2/3 Generating README.md...");
-        const readmePrompt = getReadmePrompt(userText);
-
-        let readmeResponse;
-        if (currentProvider.isAnthropic) {
-          readmeResponse = await fetch(currentProvider.baseUrl, {
-            method: "POST",
-            signal: controller.signal,
-            headers: {
-              "Content-Type": "application/json",
-              "x-api-key": apiKey,
-              "anthropic-version": "2023-06-01",
-            },
-            body: JSON.stringify({
-              model,
-              max_tokens: 2048,
-              messages: [{ role: "user", content: readmePrompt }],
-            }),
-          });
-        } else if (provider === "ollama") {
-          // const ollamaBaseUrl = ollamaUrl || "http://localhost:11434";
-          // readmeResponse = await fetch(`${ollamaBaseUrl}/v1/chat/completions`, {
-          //   method: "POST",
-          //   signal: controller.signal,
-          //   headers: { "Content-Type": "application/json" },
-          //   body: JSON.stringify({
-          //     model,
-          //     messages: [{ role: "user", content: readmePrompt }],
-          //     stream: false,
-          //   }),
-          // });
-          readmeResponse = await OllamaService.chat(model, [
-            { role: "user", content: readmePrompt },
-          ]);
-        } else {
-          readmeResponse = await fetch(currentProvider.baseUrl, {
-            method: "POST",
-            signal: controller.signal,
-            headers: {
-              "Content-Type": "application/json",
-              Authorization: `Bearer ${apiKey}`,
-            },
-            body: JSON.stringify({
-              model,
-              messages: [{ role: "user", content: readmePrompt }],
-              max_tokens: 2048,
-            }),
-          });
-        }
-
-        // const readmeData = await readmeResponse.json();
-        const readmeData =
-          provider === "ollama" ? readmeResponse : await readmeResponse.json();
-        readmeContent = currentProvider.isAnthropic
-          ? readmeData.content[0].text
-          : readmeData.choices[0].message.content;
-      }
-      // ==========================================
-      // Call 3: Generate participants.tsv
-      // ==========================================
-      let participantsContent: string;
-      if (evidenceBundle.trio_found?.["participants.tsv"]) {
-        setStatus("3/3 participants.tsv already exists, skipping...");
-        const existing = files.find(
-          (f) => f.source === "user" && f.name === "participants.tsv"
-        );
-        participantsContent = existing?.content || "";
-      } else {
-        setStatus("3/3 Generating participants.tsv...");
-        const partsPrompt = getParticipantsPrompt(userText);
-
-        // ← ADD HERE: compute subject analysis before try block so it's in scope
-        const currentSubjectAnalysis = extractSubjectAnalysis(
-          evidenceBundle?.all_files || [],
-          evidenceBundle?.user_hints?.n_subjects,
-          evidenceBundle?.filename_analysis?.python_statistics
-            ?.dominant_prefixes
-        );
+      const { datasetDesc, readmeContent, participantsTsv, skipped } =
+        await generateTrioFiles({
+          evidenceBundle,
+          files,
+          llmConfig: buildLLMConfig(),
+          signal: controller.signal,
+          onStatus: setStatus,
+        });
 
-        console.log("=== PARTICIPANTS DEBUG ===");
-        console.log("method:", currentSubjectAnalysis?.method);
-        console.log("subject_count:", currentSubjectAnalysis?.subject_count);
-        console.log(
-          "id_mapping:",
-          currentSubjectAnalysis?.id_mapping?.id_mapping
-        );
-        console.log(
-          "reverse_mapping:",
-          currentSubjectAnalysis?.id_mapping?.reverse_mapping
-        );
-        console.log(
-          "subject_records sample:",
-          currentSubjectAnalysis?.subject_records?.slice(0, 3)
-        );
-        const idMap = currentSubjectAnalysis?.id_mapping?.id_mapping;
-        const expectedCount = evidenceBundle?.user_hints?.n_subjects;
-        const subjectLabels: string[] =
-          idMap &&
-          Object.keys(idMap).length > 0 &&
-          (!expectedCount || Object.keys(idMap).length === expectedCount)
-            ? Object.values(idMap).map((id: string) => `sub-${id}`)
-            : Array.from(
-                {
-                  length: expectedCount || Object.keys(idMap || {}).length || 1,
-                },
-                (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
-              );
-
-        let partsResponse;
-        if (currentProvider.isAnthropic) {
-          partsResponse = await fetch(currentProvider.baseUrl, {
-            method: "POST",
-            signal: controller.signal,
-            headers: {
-              "Content-Type": "application/json",
-              "x-api-key": apiKey,
-              "anthropic-version": "2023-06-01",
-            },
-            body: JSON.stringify({
-              model,
-              max_tokens: 1024,
-              messages: [{ role: "user", content: partsPrompt }],
-            }),
-          });
-        } else if (provider === "ollama") {
-          // const ollamaBaseUrl = ollamaUrl || "http://localhost:11434";
-          // partsResponse = await fetch(`${ollamaBaseUrl}/v1/chat/completions`, {
-          //   method: "POST",
-          //   signal: controller.signal,
-          //   headers: { "Content-Type": "application/json" },
-          //   body: JSON.stringify({
-          //     model,
-          //     messages: [{ role: "user", content: partsPrompt }],
-          //     stream: false,
-          //   }),
-          // });
-          partsResponse = await OllamaService.chat(model, [
-            { role: "user", content: partsPrompt },
-          ]);
-        } else {
-          partsResponse = await fetch(currentProvider.baseUrl, {
-            method: "POST",
-            signal: controller.signal,
-            headers: {
-              "Content-Type": "application/json",
-              Authorization: `Bearer ${apiKey}`,
-            },
-            body: JSON.stringify({
-              model,
-              messages: [{ role: "user", content: partsPrompt }],
-              max_tokens: 1024,
-            }),
-          });
-        }
-
-        // const partsData = await partsResponse.json();
-        const partsData =
-          provider === "ollama" ? partsResponse : await partsResponse.json();
-        const participantsRaw = currentProvider.isAnthropic
-          ? partsData.content[0].text
-          : partsData.choices[0].message.content;
-
-        // Build TSV from schema
-        // try {
-        //   const schemaText = participantsRaw
-        //     .replace(/^```json\n?/g, "")
-        //     .replace(/\n?```$/g, "")
-        //     .trim();
-        //   const schema = JSON.parse(schemaText);
-        //   const columns: string[] = schema.columns.map((c: any) => c.name);
-
-        //   // Get subject IDs from evidence bundle (extracted by Python-style analysis)
-        //   // const idMapping =
-        //   //   evidenceBundle?.subject_analysis?.id_mapping?.id_mapping;
-        //   // const subjectLabels: string[] = idMapping
-        //   //   ? Object.values(idMapping).map((id) => `sub-${id}`)
-        //   //   : ["sub-01"]; // fallback if no subject analysis
-        //   // Get subject IDs from subjectAnalysis state (computed at plan stage)
-        //   // Fall back to computing fresh if plan hasn't been run yet
-        //   const currentSubjectAnalysis =
-        //     subjectAnalysis ||
-        //     extractSubjectAnalysis(
-        //       evidenceBundle?.all_files || [],
-        //       evidenceBundle?.user_hints?.n_subjects,
-        //       evidenceBundle?.filename_analysis?.python_statistics
-        //         ?.dominant_prefixes
-        //     );
-        //   const idMap = currentSubjectAnalysis?.id_mapping?.id_mapping;
-        //   const subjectLabels: string[] =
-        //     idMap && Object.keys(idMap).length > 0
-        //       ? Object.values(idMap).map((id) => `sub-${id}`)
-        //       : Array.from(
-        //           { length: evidenceBundle?.user_hints?.n_subjects || 1 },
-        //           (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
-        //         );
-
-        //   const header = columns.join("\t");
-        //   // ====origin====
-        //   // const rows = subjectLabels.map((subId) =>
-        //   //   columns
-        //   //     .map((col: string) => (col === "participant_id" ? subId : "n/a"))
-        //   //     .join("\t")
-        //   // );
-        //   //====== end ======
-        //   // =====update start=====
-        //   const reverseMap =
-        //     currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
-        //   const subjectRecords = currentSubjectAnalysis?.subject_records || [];
-
-        //   const rows = subjectLabels.map((subId) => {
-        //     const bareId = subId.replace(/^sub-/, "");
-        //     const originalId = reverseMap[bareId];
-        //     const record = subjectRecords.find(
-        //       (r: any) => r.original_id === originalId
-        //     );
-        //     return columns
-        //       .map((col: string) => {
-        //         if (col === "participant_id") return subId;
-        //         if (col === "original_id") return originalId || "n/a";
-        //         if (col === "group") return (record as any)?.group || "n/a";
-        //         return "n/a";
-        //       })
-        //       .join("\t");
-        //   });
-        //   //====update end======
-        //   participantsContent = [header, ...rows].join("\n");
-        // } catch (e) {
-        //   // Fallback: LLM didn't return valid JSON schema, use raw content
-        //   participantsContent = participantsRaw
-        //     .replace(/^```\n?/g, "")
-        //     .replace(/\n?```$/g, "")
-        //     .trim();
-        // }
-        // Build TSV from schema + subject analysis
-        // Mirrors _generate_participants_tsv_from_python() in planner.py
-        try {
-          const schemaText = participantsRaw
-            .replace(/^```json\n?/g, "")
-            .replace(/\n?```$/g, "")
-            .trim();
-          const schema = JSON.parse(schemaText);
-
-          // LLM decides extra demographic columns (sex, age, group etc.)
-          // but we always add participant_id and original_id ourselves
-          const extraColumns: string[] = schema.columns
-            .map((c: any) => c.name)
-            .filter(
-              (name: string) =>
-                name !== "participant_id" && name !== "original_id"
-            );
-
-          // Always start with participant_id and original_id
-          const columns = ["participant_id", "original_id", ...extraColumns];
-
-          const reverseMap =
-            currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
-          const subjectRecords = currentSubjectAnalysis?.subject_records || [];
-
-          const header = columns.join("\t");
-          const rows = subjectLabels.map((subId) => {
-            const bareId = subId.replace(/^sub-/, "");
-            const originalId = reverseMap[bareId] || "n/a";
-            const record = subjectRecords.find(
-              (r: any) => r.original_id === originalId
-            );
-            return columns
-              .map((col: string) => {
-                if (col === "participant_id") return subId;
-                if (col === "original_id") return originalId;
-                if (col === "group") return (record as any)?.group || "n/a";
-                return "n/a";
-              })
-              .join("\t");
-          });
-
-          participantsContent = [header, ...rows].join("\n");
-        } catch (e) {
-          // Fallback: generate minimal TSV directly from subject analysis
-          const reverseMap =
-            currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
-          const header = "participant_id\toriginal_id";
-          const rows = subjectLabels.map((subId) => {
-            const bareId = subId.replace(/^sub-/, "");
-            const originalId = reverseMap[bareId] || "n/a";
-            return `${subId}\t${originalId}`;
-          });
-          participantsContent = [header, ...rows].join("\n");
-        }
-      }
-      // ==========================================
-      // Add trio files to Virtual File System
-      // ==========================================
       const timestamp = new Date().toLocaleString();
       const trioFiles: FileItem[] = [
         {
@@ -621,10 +243,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
           name: "README.md",
           type: "file",
           fileType: "meta",
-          content: readmeContent
-            .replace(/^```markdown\n?/g, "")
-            .replace(/\n?```$/g, "")
-            .trim(),
+          content: readmeContent,
           contentType: "text",
           isUserMeta: true,
           parentId: null,
@@ -636,10 +255,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
           name: "participants.tsv",
           type: "file",
           fileType: "meta",
-          content: participantsContent
-            .replace(/^```\n?/g, "")
-            .replace(/\n?```$/g, "")
-            .trim(),
+          content: participantsTsv,
           contentType: "text",
           isUserMeta: true,
           parentId: null,
@@ -647,32 +263,27 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
           generatedAt: timestamp,
         },
       ];
-      // replace existing trio files, add if not exist
+
       updateFiles((prev) => {
         const trioNames = [
           "dataset_description.json",
           "README.md",
           "participants.tsv",
         ];
-
-        // Remove old AI generated trio files
         const withoutOldTrio = prev.filter(
           (f) => !(f.source === "ai" && trioNames.includes(f.name))
         );
-
-        // Add new trio files
-        // return [...withoutOldTrio, ...trioFiles];
-
-        // Only add AI-generated files for ones that weren't user-uploaded
-        const newTrioFiles = trioFiles.filter(
-          (tf) =>
-            !evidenceBundle.trio_found?.[
-              tf.name as keyof typeof evidenceBundle.trio_found
-            ]
-        );
-
+        // Only add AI files for ones that weren't user-uploaded (skipped=true means user-uploaded)
+        const newTrioFiles = trioFiles.filter((tf) => {
+          if (tf.name === "dataset_description.json")
+            return !skipped.datasetDesc;
+          if (tf.name === "README.md") return !skipped.readme;
+          if (tf.name === "participants.tsv") return !skipped.participants;
+          return true;
+        });
         return [...withoutOldTrio, ...newTrioFiles];
       });
+
       setTrioGenerated(true);
       setStatus(
         "✓ BIDS trio files generated and added to Virtual File System!"
@@ -686,9 +297,469 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
       }
     } finally {
       setGeneratingTrio(false);
-      setAbortController(null); // Clear controller
+      setAbortController(null);
     }
   };
+  // const handleGenerateTrio = async () => {
+  //   if (!evidenceBundle) {
+  //     setError("Please generate evidence bundle first");
+  //     return;
+  //   }
+
+  //   if (!currentProvider.noApiKey && !apiKey.trim()) {
+  //     setError("Please enter an API key");
+  //     return;
+  //   }
+
+  //   // Create abort controller
+  //   const controller = new AbortController();
+  //   setAbortController(controller);
+
+  //   setGeneratingTrio(true);
+  //   setError(null);
+  //   setStatus("Generating BIDS trio files...");
+
+  //   try {
+  //     const userText = evidenceBundle.user_hints.user_text || "";
+
+  //     // ==========================================
+  //     // Call 1: Generate dataset_description.json
+  //     // ==========================================
+  //     let datasetDesc: any;
+  //     if (evidenceBundle.trio_found?.["dataset_description.json"]) {
+  //       setStatus("1/3 dataset_description.json already exists, skipping...");
+  //       const existing = files.find(
+  //         (f) => f.source === "user" && f.name === "dataset_description.json"
+  //       );
+  //       datasetDesc = existing?.content ? JSON.parse(existing.content) : {};
+  //     } else {
+  //       setStatus("1/3 Generating dataset_description.json...");
+  //       const ddPrompt = getDatasetDescriptionPrompt(userText, evidenceBundle);
+
+  //       let ddResponse;
+  //       if (currentProvider.isAnthropic) {
+  //         ddResponse = await fetch(currentProvider.baseUrl, {
+  //           method: "POST",
+  //           signal: controller.signal,
+  //           headers: {
+  //             "Content-Type": "application/json",
+  //             "x-api-key": apiKey,
+  //             "anthropic-version": "2023-06-01",
+  //           },
+  //           body: JSON.stringify({
+  //             model,
+  //             max_tokens: 2048,
+  //             messages: [{ role: "user", content: ddPrompt }],
+  //           }),
+  //         });
+  //       } else if (provider === "ollama") {
+
+  //         ddResponse = await OllamaService.chat(model, [
+  //           { role: "user", content: ddPrompt },
+  //         ]);
+  //       } else {
+  //         ddResponse = await fetch(currentProvider.baseUrl, {
+  //           method: "POST",
+  //           signal: controller.signal,
+  //           headers: {
+  //             "Content-Type": "application/json",
+  //             Authorization: `Bearer ${apiKey}`,
+  //           },
+  //           body: JSON.stringify({
+  //             model,
+  //             messages: [{ role: "user", content: ddPrompt }],
+  //             max_tokens: 2048,
+  //           }),
+  //         });
+  //       }
+
+  //       // const ddData = await ddResponse.json();
+  //       const ddData =
+  //         provider === "ollama" ? ddResponse : await ddResponse.json();
+  //       let ddText = currentProvider.isAnthropic
+  //         ? ddData.content[0].text
+  //         : ddData.choices[0].message.content;
+
+  //       // Clean up markdown fences
+  //       ddText = ddText
+  //         .replace(/^```json\n?/g, "")
+  //         .replace(/\n?```$/g, "")
+  //         .trim();
+  //       datasetDesc = JSON.parse(ddText);
+  //     }
+
+  //     // ==========================================
+  //     // Call 2: Generate README.md
+  //     // ==========================================
+  //     let readmeContent: string;
+  //     if (evidenceBundle.trio_found?.["README.md"]) {
+  //       setStatus("2/3 README.md already exists, skipping...");
+  //       const existing = files.find(
+  //         (f) =>
+  //           f.source === "user" &&
+  //           ["README.md", "README.txt", "README.rst", "readme.md"].includes(
+  //             f.name
+  //           )
+  //       );
+  //       readmeContent = existing?.content || "";
+  //     } else {
+  //       setStatus("2/3 Generating README.md...");
+  //       const readmePrompt = getReadmePrompt(userText);
+
+  //       let readmeResponse;
+  //       if (currentProvider.isAnthropic) {
+  //         readmeResponse = await fetch(currentProvider.baseUrl, {
+  //           method: "POST",
+  //           signal: controller.signal,
+  //           headers: {
+  //             "Content-Type": "application/json",
+  //             "x-api-key": apiKey,
+  //             "anthropic-version": "2023-06-01",
+  //           },
+  //           body: JSON.stringify({
+  //             model,
+  //             max_tokens: 2048,
+  //             messages: [{ role: "user", content: readmePrompt }],
+  //           }),
+  //         });
+  //       } else if (provider === "ollama") {
+
+  //         readmeResponse = await OllamaService.chat(model, [
+  //           { role: "user", content: readmePrompt },
+  //         ]);
+  //       } else {
+  //         readmeResponse = await fetch(currentProvider.baseUrl, {
+  //           method: "POST",
+  //           signal: controller.signal,
+  //           headers: {
+  //             "Content-Type": "application/json",
+  //             Authorization: `Bearer ${apiKey}`,
+  //           },
+  //           body: JSON.stringify({
+  //             model,
+  //             messages: [{ role: "user", content: readmePrompt }],
+  //             max_tokens: 2048,
+  //           }),
+  //         });
+  //       }
+
+  //       const readmeData =
+  //         provider === "ollama" ? readmeResponse : await readmeResponse.json();
+  //       readmeContent = currentProvider.isAnthropic
+  //         ? readmeData.content[0].text
+  //         : readmeData.choices[0].message.content;
+  //     }
+  //     // ==========================================
+  //     // Call 3: Generate participants.tsv
+  //     // ==========================================
+  //     let participantsContent: string;
+  //     if (evidenceBundle.trio_found?.["participants.tsv"]) {
+  //       setStatus("3/3 participants.tsv already exists, skipping...");
+  //       const existing = files.find(
+  //         (f) => f.source === "user" && f.name === "participants.tsv"
+  //       );
+  //       participantsContent = existing?.content || "";
+  //     } else {
+  //       setStatus("3/3 Generating participants.tsv...");
+  //       const partsPrompt = getParticipantsPrompt(userText);
+
+  //       const currentSubjectAnalysis = extractSubjectAnalysis(
+  //         evidenceBundle?.all_files || [],
+  //         evidenceBundle?.user_hints?.n_subjects,
+  //         evidenceBundle?.filename_analysis?.python_statistics
+  //           ?.dominant_prefixes
+  //       );
+
+  //       console.log("=== PARTICIPANTS DEBUG ===");
+  //       console.log("method:", currentSubjectAnalysis?.method);
+  //       console.log("subject_count:", currentSubjectAnalysis?.subject_count);
+  //       console.log(
+  //         "id_mapping:",
+  //         currentSubjectAnalysis?.id_mapping?.id_mapping
+  //       );
+  //       console.log(
+  //         "reverse_mapping:",
+  //         currentSubjectAnalysis?.id_mapping?.reverse_mapping
+  //       );
+  //       console.log(
+  //         "subject_records sample:",
+  //         currentSubjectAnalysis?.subject_records?.slice(0, 3)
+  //       );
+  //       const idMap = currentSubjectAnalysis?.id_mapping?.id_mapping;
+  //       const expectedCount = evidenceBundle?.user_hints?.n_subjects;
+  //       const subjectLabels: string[] =
+  //         idMap &&
+  //         Object.keys(idMap).length > 0 &&
+  //         (!expectedCount || Object.keys(idMap).length === expectedCount)
+  //           ? Object.values(idMap).map((id: string) => `sub-${id}`)
+  //           : Array.from(
+  //               {
+  //                 length: expectedCount || Object.keys(idMap || {}).length || 1,
+  //               },
+  //               (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
+  //             );
+
+  //       let partsResponse;
+  //       if (currentProvider.isAnthropic) {
+  //         partsResponse = await fetch(currentProvider.baseUrl, {
+  //           method: "POST",
+  //           signal: controller.signal,
+  //           headers: {
+  //             "Content-Type": "application/json",
+  //             "x-api-key": apiKey,
+  //             "anthropic-version": "2023-06-01",
+  //           },
+  //           body: JSON.stringify({
+  //             model,
+  //             max_tokens: 1024,
+  //             messages: [{ role: "user", content: partsPrompt }],
+  //           }),
+  //         });
+  //       } else if (provider === "ollama") {
+
+  //         partsResponse = await OllamaService.chat(model, [
+  //           { role: "user", content: partsPrompt },
+  //         ]);
+  //       } else {
+  //         partsResponse = await fetch(currentProvider.baseUrl, {
+  //           method: "POST",
+  //           signal: controller.signal,
+  //           headers: {
+  //             "Content-Type": "application/json",
+  //             Authorization: `Bearer ${apiKey}`,
+  //           },
+  //           body: JSON.stringify({
+  //             model,
+  //             messages: [{ role: "user", content: partsPrompt }],
+  //             max_tokens: 1024,
+  //           }),
+  //         });
+  //       }
+
+  //       // const partsData = await partsResponse.json();
+  //       const partsData =
+  //         provider === "ollama" ? partsResponse : await partsResponse.json();
+  //       const participantsRaw = currentProvider.isAnthropic
+  //         ? partsData.content[0].text
+  //         : partsData.choices[0].message.content;
+
+  //       // Build TSV from schema
+  //       // try {
+  //       //   const schemaText = participantsRaw
+  //       //     .replace(/^```json\n?/g, "")
+  //       //     .replace(/\n?```$/g, "")
+  //       //     .trim();
+  //       //   const schema = JSON.parse(schemaText);
+  //       //   const columns: string[] = schema.columns.map((c: any) => c.name);
+
+  //       //   // Get subject IDs from evidence bundle (extracted by Python-style analysis)
+  //       //   // const idMapping =
+  //       //   //   evidenceBundle?.subject_analysis?.id_mapping?.id_mapping;
+  //       //   // const subjectLabels: string[] = idMapping
+  //       //   //   ? Object.values(idMapping).map((id) => `sub-${id}`)
+  //       //   //   : ["sub-01"]; // fallback if no subject analysis
+  //       //   // Get subject IDs from subjectAnalysis state (computed at plan stage)
+  //       //   // Fall back to computing fresh if plan hasn't been run yet
+  //       //   const currentSubjectAnalysis =
+  //       //     subjectAnalysis ||
+  //       //     extractSubjectAnalysis(
+  //       //       evidenceBundle?.all_files || [],
+  //       //       evidenceBundle?.user_hints?.n_subjects,
+  //       //       evidenceBundle?.filename_analysis?.python_statistics
+  //       //         ?.dominant_prefixes
+  //       //     );
+  //       //   const idMap = currentSubjectAnalysis?.id_mapping?.id_mapping;
+  //       //   const subjectLabels: string[] =
+  //       //     idMap && Object.keys(idMap).length > 0
+  //       //       ? Object.values(idMap).map((id) => `sub-${id}`)
+  //       //       : Array.from(
+  //       //           { length: evidenceBundle?.user_hints?.n_subjects || 1 },
+  //       //           (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
+  //       //         );
+
+  //       //   const header = columns.join("\t");
+  //       //   // ====origin====
+  //       //   // const rows = subjectLabels.map((subId) =>
+  //       //   //   columns
+  //       //   //     .map((col: string) => (col === "participant_id" ? subId : "n/a"))
+  //       //   //     .join("\t")
+  //       //   // );
+  //       //   //====== end ======
+  //       //   // =====update start=====
+  //       //   const reverseMap =
+  //       //     currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
+  //       //   const subjectRecords = currentSubjectAnalysis?.subject_records || [];
+
+  //       //   const rows = subjectLabels.map((subId) => {
+  //       //     const bareId = subId.replace(/^sub-/, "");
+  //       //     const originalId = reverseMap[bareId];
+  //       //     const record = subjectRecords.find(
+  //       //       (r: any) => r.original_id === originalId
+  //       //     );
+  //       //     return columns
+  //       //       .map((col: string) => {
+  //       //         if (col === "participant_id") return subId;
+  //       //         if (col === "original_id") return originalId || "n/a";
+  //       //         if (col === "group") return (record as any)?.group || "n/a";
+  //       //         return "n/a";
+  //       //       })
+  //       //       .join("\t");
+  //       //   });
+  //       //   //====update end======
+  //       //   participantsContent = [header, ...rows].join("\n");
+  //       // } catch (e) {
+  //       //   // Fallback: LLM didn't return valid JSON schema, use raw content
+  //       //   participantsContent = participantsRaw
+  //       //     .replace(/^```\n?/g, "")
+  //       //     .replace(/\n?```$/g, "")
+  //       //     .trim();
+  //       // }
+  //       // Build TSV from schema + subject analysis
+  //       // Mirrors _generate_participants_tsv_from_python() in planner.py
+  //       try {
+  //         const schemaText = participantsRaw
+  //           .replace(/^```json\n?/g, "")
+  //           .replace(/\n?```$/g, "")
+  //           .trim();
+  //         const schema = JSON.parse(schemaText);
+
+  //         // LLM decides extra demographic columns (sex, age, group etc.)
+  //         // but we always add participant_id and original_id ourselves
+  //         const extraColumns: string[] = schema.columns
+  //           .map((c: any) => c.name)
+  //           .filter(
+  //             (name: string) =>
+  //               name !== "participant_id" && name !== "original_id"
+  //           );
+
+  //         // Always start with participant_id and original_id
+  //         const columns = ["participant_id", "original_id", ...extraColumns];
+
+  //         const reverseMap =
+  //           currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
+  //         const subjectRecords = currentSubjectAnalysis?.subject_records || [];
+
+  //         const header = columns.join("\t");
+  //         const rows = subjectLabels.map((subId) => {
+  //           const bareId = subId.replace(/^sub-/, "");
+  //           const originalId = reverseMap[bareId] || "n/a";
+  //           const record = subjectRecords.find(
+  //             (r: any) => r.original_id === originalId
+  //           );
+  //           return columns
+  //             .map((col: string) => {
+  //               if (col === "participant_id") return subId;
+  //               if (col === "original_id") return originalId;
+  //               if (col === "group") return (record as any)?.group || "n/a";
+  //               return "n/a";
+  //             })
+  //             .join("\t");
+  //         });
+
+  //         participantsContent = [header, ...rows].join("\n");
+  //       } catch (e) {
+  //         // Fallback: generate minimal TSV directly from subject analysis
+  //         const reverseMap =
+  //           currentSubjectAnalysis?.id_mapping?.reverse_mapping || {};
+  //         const header = "participant_id\toriginal_id";
+  //         const rows = subjectLabels.map((subId) => {
+  //           const bareId = subId.replace(/^sub-/, "");
+  //           const originalId = reverseMap[bareId] || "n/a";
+  //           return `${subId}\t${originalId}`;
+  //         });
+  //         participantsContent = [header, ...rows].join("\n");
+  //       }
+  //     }
+  //     // ==========================================
+  //     // Add trio files to Virtual File System
+  //     // ==========================================
+  //     const timestamp = new Date().toLocaleString();
+  //     const trioFiles: FileItem[] = [
+  //       {
+  //         id: generateId(),
+  //         name: "dataset_description.json",
+  //         type: "file",
+  //         fileType: "meta",
+  //         content: JSON.stringify(datasetDesc, null, 2),
+  //         contentType: "text",
+  //         isUserMeta: true,
+  //         parentId: null,
+  //         source: "ai",
+  //         generatedAt: timestamp,
+  //       },
+  //       {
+  //         id: generateId(),
+  //         name: "README.md",
+  //         type: "file",
+  //         fileType: "meta",
+  //         content: readmeContent
+  //           .replace(/^```markdown\n?/g, "")
+  //           .replace(/\n?```$/g, "")
+  //           .trim(),
+  //         contentType: "text",
+  //         isUserMeta: true,
+  //         parentId: null,
+  //         source: "ai",
+  //         generatedAt: timestamp,
+  //       },
+  //       {
+  //         id: generateId(),
+  //         name: "participants.tsv",
+  //         type: "file",
+  //         fileType: "meta",
+  //         content: participantsContent
+  //           .replace(/^```\n?/g, "")
+  //           .replace(/\n?```$/g, "")
+  //           .trim(),
+  //         contentType: "text",
+  //         isUserMeta: true,
+  //         parentId: null,
+  //         source: "ai",
+  //         generatedAt: timestamp,
+  //       },
+  //     ];
+  //     // replace existing trio files, add if not exist
+  //     updateFiles((prev) => {
+  //       const trioNames = [
+  //         "dataset_description.json",
+  //         "README.md",
+  //         "participants.tsv",
+  //       ];
+
+  //       // Remove old AI generated trio files
+  //       const withoutOldTrio = prev.filter(
+  //         (f) => !(f.source === "ai" && trioNames.includes(f.name))
+  //       );
+
+  //       // Add new trio files
+  //       // return [...withoutOldTrio, ...trioFiles];
+
+  //       // Only add AI-generated files for ones that weren't user-uploaded
+  //       const newTrioFiles = trioFiles.filter(
+  //         (tf) =>
+  //           !evidenceBundle.trio_found?.[
+  //             tf.name as keyof typeof evidenceBundle.trio_found
+  //           ]
+  //       );
+
+  //       return [...withoutOldTrio, ...newTrioFiles];
+  //     });
+  //     setTrioGenerated(true);
+  //     setStatus(
+  //       "✓ BIDS trio files generated and added to Virtual File System!"
+  //     );
+  //   } catch (err: any) {
+  //     if (err.name === "AbortError") {
+  //       setStatus("❌ Generation cancelled");
+  //     } else {
+  //       setError(err.message || "Failed to generate trio files");
+  //       setStatus("❌ Error generating trio files");
+  //     }
+  //   } finally {
+  //     setGeneratingTrio(false);
+  //     setAbortController(null); // Clear controller
+  //   }
+  // };
 
   const handleMouseDown = (e: React.MouseEvent) => {
     setIsResizing(true);
@@ -725,312 +796,222 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
 
   const currentProvider = llmProviders[provider];
 
-  const handleGenerate = async () => {
+  const handleGeneratePlan = async () => {
     if (!currentProvider.noApiKey && !apiKey.trim()) {
       setError("Please enter an API key");
       return;
     }
-
     if (!baseDirectoryPath.trim()) {
       setError("Please enter a base directory path");
       return;
     }
 
-    // Create abort controller
     const controller = new AbortController();
     setAbortController(controller);
-
     setLoading(true);
     setError(null);
-    setStatus(`Generating script using ${currentProvider.name}...`);
-
-    const fileSummary = buildFileSummary(files);
-    const filePatterns = analyzeFilePatterns(files);
-    const userContext = getUserContext(files);
-    const annotations = getFileAnnotations(files);
-
-    // UPDATED: Improved prompt that uses trio files
-    const prompt = getConversionScriptPrompt(
-      baseDirectoryPath,
-      fileSummary,
-      filePatterns,
-      userContext,
-      annotations
-    );
+    setStatus(`Generating BIDSPlan.yaml using ${currentProvider.name}...`);
 
     try {
-      let response;
-
-      if (provider === "ollama") {
-        // const ollamaBaseUrl = ollamaUrl || "http://localhost:11434";
-        // response = await fetch(`${ollamaBaseUrl}/v1/chat/completions`, {
-        //   method: "POST",
-        //   signal: controller.signal,
-        //   headers: {
-        //     "Content-Type": "application/json",
-        //   },
-        //   body: JSON.stringify({
-        //     model,
-        //     messages: [
-        //       {
-        //         role: "system",
-        //         content:
-        //           "You are a neuroimaging data expert specializing in BIDS format conversion. Output only Python code without markdown fences or explanations.",
-        //       },
-        //       { role: "user", content: prompt },
-        //     ],
-        //     stream: false,
-        //   }),
-        // });
-        response = await OllamaService.chat(model, [
-          {
-            role: "system",
-            content:
-              "You are a neuroimaging data expert specializing in BIDS format conversion. Output only Python code without markdown fences or explanations.",
-          },
-          { role: "user", content: prompt },
-        ]);
-      } else if (currentProvider.isAnthropic) {
-        response = await fetch(currentProvider.baseUrl, {
-          method: "POST",
-          signal: controller.signal,
-          headers: {
-            "Content-Type": "application/json",
-            "x-api-key": apiKey,
-            "anthropic-version": "2023-06-01",
-          },
-          body: JSON.stringify({
-            model,
-            max_tokens: 4096,
-            messages: [{ role: "user", content: prompt }],
-          }),
-        });
-      } else {
-        const headers: Record<string, string> = {
-          "Content-Type": "application/json",
-        };
-
-        if (!currentProvider.noApiKey) {
-          headers["Authorization"] = `Bearer ${apiKey}`;
-        }
+      const {
+        planYaml,
+        subjectAnalysis: sa,
+        participantsTsv,
+        coverageWarnings,
+      } = await buildBidsPlan({
+        evidenceBundle,
+        llmConfig: buildLLMConfig(),
+        signal: controller.signal,
+        onStatus: setStatus,
+      });
 
-        response = await fetch(currentProvider.baseUrl, {
-          method: "POST",
-          signal: controller.signal,
-          headers,
-          body: JSON.stringify({
-            model,
-            messages: [
-              {
-                role: "system",
-                content:
-                  "You are a neuroimaging data expert specializing in BIDS format conversion. Output only Python code without markdown fences or explanations.",
-              },
-              { role: "user", content: prompt },
-            ],
-            max_tokens: 4096,
-            temperature: 0.7,
-          }),
+      // Store subject analysis for ZIP packaging
+      setSubjectAnalysis(sa);
+
+      // Dump final YAML string (planYaml is raw string from LLM, already cleaned)
+      setBidsPlan(planYaml);
+
+      // Update participants.tsv in VFS with the full version from the plan stage
+      if (participantsTsv) {
+        const timestamp = new Date().toLocaleString();
+        updateFiles((prev) => {
+          const withoutOld = prev.filter(
+            (f) => !(f.source === "ai" && f.name === "participants.tsv")
+          );
+          return [
+            ...withoutOld,
+            {
+              id: generateId(),
+              name: "participants.tsv",
+              type: "file" as const,
+              fileType: "meta",
+              content: participantsTsv,
+              contentType: "text",
+              isUserMeta: true,
+              parentId: null,
+              source: "ai" as const,
+              generatedAt: timestamp,
+            },
+          ];
         });
       }
 
-      // const data = await response.json();
-      const data = provider === "ollama" ? response : await response.json();
-
-      // if (!response.ok) {
-      //   throw new Error(data.error?.message || "Failed to generate script");
-      // }
-      if (!response.ok && provider !== "ollama") {
-        throw new Error(data.error?.message || "Failed to generate script");
+      if (coverageWarnings.length > 0) {
+        setStatus(
+          `✓ BIDSPlan.yaml generated (${coverageWarnings.length} coverage warning(s) — check console)`
+        );
+      } else {
+        setStatus(`✓ BIDSPlan.yaml generated using ${currentProvider.name}`);
       }
-
-      // let script = "";
-      // if (currentProvider.isAnthropic) {
-      //   script = data.content[0].text;
-      // } else {
-      //   script = data.choices[0].message.content;
-      // }
-      let script = currentProvider.isAnthropic
-        ? data.content[0].text
-        : data.choices[0].message.content;
-
-      // Clean up markdown fences if AI included them anyway
-      script = script.replace(/^```python\n?/g, "").replace(/\n?```$/g, "");
-
-      setGeneratedScript(script);
-      setStatus(`✓ Script generated using ${currentProvider.name}`);
     } catch (err: any) {
       if (err.name === "AbortError") {
         setStatus("❌ Generation cancelled");
       } else {
-        setError(err.message || "Failed to generate script");
-        setStatus("❌ Error generating script");
+        setError(err.message || "Failed to generate BIDSPlan");
+        setStatus("❌ Error generating BIDSPlan");
       }
     } finally {
       setLoading(false);
-      setAbortController(null); // Clear controller
+      setAbortController(null);
     }
   };
+  // const handleGeneratePlan = async () => {
+  //   if (!currentProvider.noApiKey && !apiKey.trim()) {
+  //     setError("Please enter an API key");
+  //     return;
+  //   }
+  //   if (!baseDirectoryPath.trim()) {
+  //     setError("Please enter a base directory path");
+  //     return;
+  //   }
 
-  const handleGeneratePlan = async () => {
-    if (!currentProvider.noApiKey && !apiKey.trim()) {
-      setError("Please enter an API key");
-      return;
-    }
-    if (!baseDirectoryPath.trim()) {
-      setError("Please enter a base directory path");
-      return;
-    }
-
-    const controller = new AbortController();
-    setAbortController(controller);
-    setLoading(true);
-    setError(null);
-    setStatus(`Generating BIDSPlan.yaml using ${currentProvider.name}...`);
-
-    // ── Compute subject analysis (mirrors planner.py Step 1)
-    const allFiles = evidenceBundle?.all_files || [];
-    const userNSubjects = evidenceBundle?.user_hints?.n_subjects;
-    const dominantPrefixes =
-      evidenceBundle?.filename_analysis?.python_statistics?.dominant_prefixes;
-
-    const computedSubjectAnalysis = extractSubjectAnalysis(
-      allFiles,
-      userNSubjects,
-      dominantPrefixes
-    );
-
-    setSubjectAnalysis(computedSubjectAnalysis);
-
-    const fileSummary = buildFileSummary(files);
-    const filePatterns = analyzeFilePatterns(files);
-    const userContext = getUserContext(files);
-    // const subjectInfo = extractSubjectsFromFiles(files);
-    const subjectInfo = computedSubjectAnalysis;
-    const sampleFiles =
-      evidenceBundle?.samples
-        ?.slice(0, 10)
-        .map((s: any) => `  - ${s.relpath}`)
-        .join("\n") || "";
-
-    const prompt = getBIDSPlanPrompt(
-      fileSummary,
-      filePatterns,
-      userContext,
-      {
-        subjects: Object.entries(
-          computedSubjectAnalysis.id_mapping.id_mapping
-        ).map(([originalId, bidsId]) => ({ originalId, bidsId })),
-        strategy: computedSubjectAnalysis.id_mapping.strategy_used,
-      },
-      evidenceBundle?.counts_by_ext || {},
-      sampleFiles,
-      evidenceBundle
-    );
-
-    try {
-      let response;
-
-      if (provider === "ollama") {
-        // const ollamaBaseUrl = ollamaUrl || "http://localhost:11434";
-        // response = await fetch(`${ollamaBaseUrl}/v1/chat/completions`, {
-        //   method: "POST",
-        //   signal: controller.signal,
-        //   headers: { "Content-Type": "application/json" },
-        //   body: JSON.stringify({
-        //     model,
-        //     messages: [
-        //       {
-        //         role: "system",
-        //         content:
-        //           "You are a BIDS dataset architect. Output only valid YAML without markdown fences or explanations.",
-        //       },
-        //       { role: "user", content: prompt },
-        //     ],
-        //     stream: false,
-        //   }),
-        // });
-        response = await OllamaService.chat(model, [
-          {
-            role: "system",
-            content:
-              "You are a BIDS dataset architect. Output only valid YAML without markdown fences or explanations.",
-          },
-          { role: "user", content: prompt },
-        ]);
-      } else if (currentProvider.isAnthropic) {
-        response = await fetch(currentProvider.baseUrl, {
-          method: "POST",
-          signal: controller.signal,
-          headers: {
-            "Content-Type": "application/json",
-            "x-api-key": apiKey,
-            "anthropic-version": "2023-06-01",
-          },
-          body: JSON.stringify({
-            model,
-            max_tokens: 2048,
-            messages: [{ role: "user", content: prompt }],
-          }),
-        });
-      } else {
-        response = await fetch(currentProvider.baseUrl, {
-          method: "POST",
-          signal: controller.signal,
-          headers: {
-            "Content-Type": "application/json",
-            Authorization: `Bearer ${apiKey}`,
-          },
-          body: JSON.stringify({
-            model,
-            messages: [
-              {
-                role: "system",
-                content:
-                  "You are a BIDS dataset architect. Output only valid YAML without markdown fences or explanations.",
-              },
-              { role: "user", content: prompt },
-            ],
-            max_tokens: 2048,
-            temperature: 0.15,
-          }),
-        });
-      }
-
-      // const data = await response.json();
+  //   const controller = new AbortController();
+  //   setAbortController(controller);
+  //   setLoading(true);
+  //   setError(null);
+  //   setStatus(`Generating BIDSPlan.yaml using ${currentProvider.name}...`);
+
+  //   // ── Compute subject analysis (mirrors planner.py Step 1)
+  //   const allFiles = evidenceBundle?.all_files || [];
+  //   const userNSubjects = evidenceBundle?.user_hints?.n_subjects;
+  //   const dominantPrefixes =
+  //     evidenceBundle?.filename_analysis?.python_statistics?.dominant_prefixes;
+
+  //   const computedSubjectAnalysis = extractSubjectAnalysis(
+  //     allFiles,
+  //     userNSubjects,
+  //     dominantPrefixes
+  //   );
 
-      // if (!response.ok) {
-      //   throw new Error(data.error?.message || "Failed to generate BIDSPlan");
-      // }
-      const data = provider === "ollama" ? response : await response.json();
-      if (!response.ok && provider !== "ollama") {
-        throw new Error(data.error?.message || "Failed to generate BIDSPlan");
-      }
+  //   setSubjectAnalysis(computedSubjectAnalysis);
+
+  //   const fileSummary = buildFileSummary(files);
+  //   const filePatterns = analyzeFilePatterns(files);
+  //   const userContext = getUserContext(files);
+  //   // const subjectInfo = extractSubjectsFromFiles(files);
+  //   const subjectInfo = computedSubjectAnalysis;
+  //   const sampleFiles =
+  //     evidenceBundle?.samples
+  //       ?.slice(0, 10)
+  //       .map((s: any) => `  - ${s.relpath}`)
+  //       .join("\n") || "";
+
+  //   const prompt = getBIDSPlanPrompt(
+  //     fileSummary,
+  //     filePatterns,
+  //     userContext,
+  //     {
+  //       subjects: Object.entries(
+  //         computedSubjectAnalysis.id_mapping.id_mapping
+  //       ).map(([originalId, bidsId]) => ({ originalId, bidsId })),
+  //       strategy: computedSubjectAnalysis.id_mapping.strategy_used,
+  //     },
+  //     evidenceBundle?.counts_by_ext || {},
+  //     sampleFiles,
+  //     evidenceBundle
+  //   );
 
-      let plan = currentProvider.isAnthropic
-        ? data.content[0].text
-        : data.choices[0].message.content;
+  //   try {
+  //     let response;
+
+  //     if (provider === "ollama") {
+
+  //       response = await OllamaService.chat(model, [
+  //         {
+  //           role: "system",
+  //           content:
+  //             "You are a BIDS dataset architect. Output only valid YAML without markdown fences or explanations.",
+  //         },
+  //         { role: "user", content: prompt },
+  //       ]);
+  //     } else if (currentProvider.isAnthropic) {
+  //       response = await fetch(currentProvider.baseUrl, {
+  //         method: "POST",
+  //         signal: controller.signal,
+  //         headers: {
+  //           "Content-Type": "application/json",
+  //           "x-api-key": apiKey,
+  //           "anthropic-version": "2023-06-01",
+  //         },
+  //         body: JSON.stringify({
+  //           model,
+  //           max_tokens: 2048,
+  //           messages: [{ role: "user", content: prompt }],
+  //         }),
+  //       });
+  //     } else {
+  //       response = await fetch(currentProvider.baseUrl, {
+  //         method: "POST",
+  //         signal: controller.signal,
+  //         headers: {
+  //           "Content-Type": "application/json",
+  //           Authorization: `Bearer ${apiKey}`,
+  //         },
+  //         body: JSON.stringify({
+  //           model,
+  //           messages: [
+  //             {
+  //               role: "system",
+  //               content:
+  //                 "You are a BIDS dataset architect. Output only valid YAML without markdown fences or explanations.",
+  //             },
+  //             { role: "user", content: prompt },
+  //           ],
+  //           max_tokens: 2048,
+  //           temperature: 0.15,
+  //         }),
+  //       });
+  //     }
 
-      // Clean up markdown fences if present
-      plan = plan
-        .replace(/^```yaml\n?/g, "")
-        .replace(/\n?```$/g, "")
-        .trim();
+  //     const data = provider === "ollama" ? response : await response.json();
+  //     if (!response.ok && provider !== "ollama") {
+  //       throw new Error(data.error?.message || "Failed to generate BIDSPlan");
+  //     }
 
-      setBidsPlan(plan);
-      setStatus(`✓ BIDSPlan.yaml generated using ${currentProvider.name}`);
-    } catch (err: any) {
-      if (err.name === "AbortError") {
-        setStatus("❌ Generation cancelled");
-      } else {
-        setError(err.message || "Failed to generate BIDSPlan");
-        setStatus("❌ Error generating BIDSPlan");
-      }
-    } finally {
-      setLoading(false);
-      setAbortController(null);
-    }
-  };
+  //     let plan = currentProvider.isAnthropic
+  //       ? data.content[0].text
+  //       : data.choices[0].message.content;
+
+  //     // Clean up markdown fences if present
+  //     plan = plan
+  //       .replace(/^```yaml\n?/g, "")
+  //       .replace(/\n?```$/g, "")
+  //       .trim();
+
+  //     setBidsPlan(plan);
+  //     setStatus(`✓ BIDSPlan.yaml generated using ${currentProvider.name}`);
+  //   } catch (err: any) {
+  //     if (err.name === "AbortError") {
+  //       setStatus("❌ Generation cancelled");
+  //     } else {
+  //       setError(err.message || "Failed to generate BIDSPlan");
+  //       setStatus("❌ Error generating BIDSPlan");
+  //     }
+  //   } finally {
+  //     setLoading(false);
+  //     setAbortController(null);
+  //   }
+  // };
 
   const handleDownloadPlan = () => {
     const blob = new Blob([bidsPlan], { type: "text/yaml" });
@@ -1518,7 +1499,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
                 )}
               </FormControl>
 
-              {/* <TextField
+              <TextField
                 label="Describe your dataset (optional)"
                 placeholder='e.g. "DICOM files from 2 subjects, one male one female"'
                 value={describeText}
@@ -1526,7 +1507,8 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
                 size="small"
                 multiline
                 rows={2}
-              /> */}
+                sx={{ mb: 1 }}
+              />
               <Button
                 fullWidth
                 size="small"
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts
index c3c89b0..8318a87 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/fileAnalyzers.ts
@@ -18,37 +18,106 @@ import { FileItem } from "redux/projects/types/projects.interface";
 // Partial mirror of executor.py → infer_subdirectory_from_suffix()
 //                               + categorize_scan_type()
 // ============================================================================
+// export const categorizeFile = (file: FileItem): string => {
+//   const name = file.name.toLowerCase();
+
+//   // Functional scans (task-based)
+//   if (name.includes("task-") && name.includes("bold")) return "functional-bold";
+//   if (name.endsWith(".snirf")) return "functional-nirs";
+//   if (name.endsWith(".nirs")) return "functional-nirs";
+//   if (name.endsWith(".mat")) return "functional-nirs";
+
+//   // Anatomical scans
+//   if (name.includes("t1w")) return "anatomical-T1w";
+//   if (name.includes("t2w") || name.includes("inplanet2"))
+//     return "anatomical-T2w";
+//   if (name.includes("flair")) return "anatomical-FLAIR";
+//   if (name.endsWith(".dcm")) return "anatomical-dicom";
+
+//   // JNIfTI — mirrors JNIFTI_EXT in constants.py: {'.jnii', '.bnii'}
+//   if (name.endsWith(".jnii") || name.endsWith(".bnii"))
+//     return "anatomical-jnifti";
+
+//   // Diffusion
+//   if (name.includes("dwi") || name.includes("diffusion")) return "diffusion";
+
+//   // Field maps
+//   if (name.includes("fieldmap") || name.includes("fmap")) return "fieldmap";
+
+//   // Array/HDF5 (non-SNIRF)
+//   if (name.endsWith(".h5") || name.endsWith(".hdf5")) return "array";
+
+//   // Fall back to fileType from fileProcessors.ts
+//   return file.fileType || "unknown";
+// };
+
 export const categorizeFile = (file: FileItem): string => {
   const name = file.name.toLowerCase();
 
-  // Functional scans (task-based)
-  if (name.includes("task-") && name.includes("bold")) return "functional-bold";
-  if (name.endsWith(".snirf")) return "functional-nirs";
-  if (name.endsWith(".nirs")) return "functional-nirs";
-  if (name.endsWith(".mat")) return "functional-nirs";
+  // Mirror detect_kind() priority order exactly:
+  // user_trio → jnifti → nirs → mri → table → array → text_doc → document → archive → other
+
+  // user_trio
+  if (
+    [
+      "dataset_description.json",
+      "participants.tsv",
+      "readme.md",
+      "readme.txt",
+      "readme.rst",
+      "readme",
+    ].includes(name)
+  )
+    return "user_trio";
+
+  // jnifti
+  if (name.endsWith(".jnii") || name.endsWith(".bnii")) return "jnifti";
+
+  // nirs — mirrors NIRS_EXT = {'.snirf', '.nirs', '.mat'}
+  if (
+    name.endsWith(".snirf") ||
+    name.endsWith(".nirs") ||
+    name.endsWith(".mat")
+  )
+    return "nirs";
+
+  // mri — mirrors MRI_EXT = {'.nii', '.dcm'} + .nii.gz
+  if (
+    name.endsWith(".nii.gz") ||
+    name.endsWith(".nii") ||
+    name.endsWith(".dcm")
+  )
+    return "mri";
 
-  // Anatomical scans
-  if (name.includes("t1w")) return "anatomical-T1w";
-  if (name.includes("t2w") || name.includes("inplanet2"))
-    return "anatomical-T2w";
-  if (name.includes("flair")) return "anatomical-FLAIR";
-  if (name.endsWith(".dcm")) return "anatomical-dicom";
+  // table
+  if ([".csv", ".tsv", ".xlsx", ".xls"].some((e) => name.endsWith(e)))
+    return "table";
 
-  // JNIfTI — mirrors JNIFTI_EXT in constants.py: {'.jnii', '.bnii'}
-  if (name.endsWith(".jnii") || name.endsWith(".bnii"))
-    return "anatomical-jnifti";
+  // array — mirrors ARRAY_EXT = {'.h5', '.hdf5', '.npy', '.npz'}
+  if ([".h5", ".hdf5", ".npy", ".npz"].some((e) => name.endsWith(e)))
+    return "array";
 
-  // Diffusion
-  if (name.includes("dwi") || name.includes("diffusion")) return "diffusion";
+  // text_doc — mirrors TEXT_EXT = {'.txt', '.md', '.rst', '.html', '.htm', '.log'}
+  if (
+    [".txt", ".md", ".rst", ".html", ".htm", ".log"].some((e) =>
+      name.endsWith(e)
+    )
+  )
+    return "text_doc";
 
-  // Field maps
-  if (name.includes("fieldmap") || name.includes("fmap")) return "fieldmap";
+  // document — mirrors DOC_EXT = {'.pdf', '.docx', '.doc', '.pptx', '.ppt', '.odt'}
+  if (
+    [".pdf", ".docx", ".doc", ".pptx", ".ppt", ".odt"].some((e) =>
+      name.endsWith(e)
+    )
+  )
+    return "document";
 
-  // Array/HDF5 (non-SNIRF)
-  if (name.endsWith(".h5") || name.endsWith(".hdf5")) return "array";
+  // archive
+  if ([".zip", ".tar", ".tgz", ".tar.gz"].some((e) => name.endsWith(e)))
+    return "archive";
 
-  // Fall back to fileType from fileProcessors.ts
-  return file.fileType || "unknown";
+  return "other";
 };
 
 // ============================================================================
@@ -102,19 +171,75 @@ export const getCountsByExtension = (
 //
 // Python reads files from disk; this reads from VFS FileItem.content.
 // ============================================================================
+// export const getUserContextText = (files: FileItem[]): string => {
+//   const readme = files.find((f) => f.name.toLowerCase().includes("readme"));
+//   const instructions = files.find(
+//     (f) =>
+//       f.name.toLowerCase().includes("conversion") ||
+//       f.name.toLowerCase().includes("instruction")
+//   );
+//   const participants = files.find((f) =>
+//     f.name.toLowerCase().includes("participant")
+//   );
+
+//   const datasetDescription = files.find(
+//     (f) => f.name.toLowerCase() === "dataset_description.json"
+//   );
+
+//   const pdfsAndDocs = files.filter(
+//     (f) =>
+//       f.source === "user" &&
+//       f.fileType === "office" &&
+//       f.content?.trim() &&
+//       f.name.toLowerCase() !== "participants.tsv" // already handled
+//   );
+//   const textFiles = files.filter(
+//     (f) =>
+//       f.source === "user" &&
+//       f.fileType === "text" &&
+//       f.content?.trim() &&
+//       ![
+//         "readme",
+//         "participants.tsv",
+//         "dataset_description.json",
+//         "readme.md",
+//         "readme.txt",
+//       ].includes(f.name.toLowerCase()) &&
+//       f.isUserMeta === true // only user-added meta files, not data sidecars
+//   );
+//   textFiles.forEach((f) => {
+//     parts.push(`TEXT FILE [${f.name}]:\n${f.content!.slice(0, 3000)}`);
+//   });
+
+//   const parts = [];
+//   if (datasetDescription?.content)
+//     parts.push(`DATASET DESCRIPTION:\n${datasetDescription.content}`);
+//   if (readme?.content) parts.push(`README:\n${readme.content}`);
+//   if (instructions?.content)
+//     parts.push(`INSTRUCTIONS:\n${instructions.content}`);
+//   if (participants?.content)
+//     parts.push(`PARTICIPANTS:\n${participants.content}`);
+//   pdfsAndDocs.forEach((f) => {
+//     parts.push(`DOCUMENT [${f.name}]:\n${f.content!.slice(0, 3000)}`);
+//   });
+//   return parts.join("\n\n");
+// };
 export const getUserContextText = (files: FileItem[]): string => {
-  const readme = files.find((f) => f.name.toLowerCase().includes("readme"));
+  const readme = files.find(
+    (f) => f.source === "user" && f.name.toLowerCase().includes("readme")
+  );
   const instructions = files.find(
     (f) =>
-      f.name.toLowerCase().includes("conversion") ||
-      f.name.toLowerCase().includes("instruction")
+      f.source === "user" &&
+      (f.name.toLowerCase().includes("conversion") ||
+        f.name.toLowerCase().includes("instruction"))
   );
-  const participants = files.find((f) =>
-    f.name.toLowerCase().includes("participant")
+  const participants = files.find(
+    (f) => f.source === "user" && f.name.toLowerCase().includes("participant")
   );
-
   const datasetDescription = files.find(
-    (f) => f.name.toLowerCase() === "dataset_description.json"
+    (f) =>
+      f.source === "user" && f.name.toLowerCase() === "dataset_description.json"
   );
 
   const pdfsAndDocs = files.filter(
@@ -122,10 +247,24 @@ export const getUserContextText = (files: FileItem[]): string => {
       f.source === "user" &&
       f.fileType === "office" &&
       f.content?.trim() &&
-      f.name.toLowerCase() !== "participants.tsv" // already handled
+      f.name.toLowerCase() !== "participants.tsv"
+  );
+  const textFiles = files.filter(
+    (f) =>
+      f.source === "user" &&
+      f.fileType === "text" &&
+      f.content?.trim() &&
+      ![
+        "readme",
+        "participants.tsv",
+        "dataset_description.json",
+        "readme.md",
+        "readme.txt",
+      ].includes(f.name.toLowerCase()) &&
+      f.isUserMeta === true
   );
 
-  const parts = [];
+  const parts: string[] = [];
   if (datasetDescription?.content)
     parts.push(`DATASET DESCRIPTION:\n${datasetDescription.content}`);
   if (readme?.content) parts.push(`README:\n${readme.content}`);
@@ -136,5 +275,9 @@ export const getUserContextText = (files: FileItem[]): string => {
   pdfsAndDocs.forEach((f) => {
     parts.push(`DOCUMENT [${f.name}]:\n${f.content!.slice(0, 3000)}`);
   });
+  textFiles.forEach((f) => {
+    parts.push(`TEXT FILE [${f.name}]:\n${f.content!.slice(0, 3000)}`);
+  });
+
   return parts.join("\n\n");
 };
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/fileProcessors.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/fileProcessors.ts
index b51d150..9897b15 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/fileProcessors.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/fileProcessors.ts
@@ -118,12 +118,32 @@ export const processFile = async (
       }
       entry.contentType = "hdf5";
     } else if (fileType === "neurojsonText") {
-      // Extract NeuroJSON text
       const text = await file.text();
-      // entry.content = text.slice(0, 5000);
       try {
         const json = JSON.parse(text);
-        entry.content = JSON.stringify(json, null, 2).slice(0, 5000);
+        // JNIfTI files — extract NIFTIHeader only, mirrors _extract_jnifti_header()
+        if (
+          file.name.toLowerCase().endsWith(".jnii") ||
+          file.name.toLowerCase().endsWith(".bnii")
+        ) {
+          const hdr = json?.NIFTIHeader ?? {};
+          const result: Record<string, any> = {};
+          for (const field of [
+            "Dim",
+            "VoxelSize",
+            "DataType",
+            "Intent",
+            "QForm",
+            "SForm",
+            "Description",
+            "NIIFormat",
+          ]) {
+            if (hdr[field] !== undefined) result[field] = hdr[field];
+          }
+          entry.content = JSON.stringify(result, null, 2);
+        } else {
+          entry.content = JSON.stringify(json, null, 2).slice(0, 5000);
+        }
       } catch (e) {
         entry.content = text.slice(0, 5000);
       }
@@ -344,9 +364,29 @@ export const processZip = async (
       else if (fileType === "neurojsonText") {
         try {
           const text = await zipEntry.async("text");
-          // entry.content = text.slice(0, 5000);
           const json = JSON.parse(text);
-          entry.content = JSON.stringify(json, null, 2).slice(0, 5000);
+          if (
+            fileName.toLowerCase().endsWith(".jnii") ||
+            fileName.toLowerCase().endsWith(".bnii")
+          ) {
+            const hdr = json?.NIFTIHeader ?? {};
+            const result: Record<string, any> = {};
+            for (const field of [
+              "Dim",
+              "VoxelSize",
+              "DataType",
+              "Intent",
+              "QForm",
+              "SForm",
+              "Description",
+              "NIIFormat",
+            ]) {
+              if (hdr[field] !== undefined) result[field] = hdr[field];
+            }
+            entry.content = JSON.stringify(result, null, 2);
+          } else {
+            entry.content = JSON.stringify(json, null, 2).slice(0, 5000);
+          }
           entry.contentType = "neurojson";
         } catch (e: any) {
           entry.content = `Error: ${e.message}`;
@@ -755,6 +795,14 @@ const parseDicomHeader = (buffer: ArrayBuffer): string => {
     const manufacturer = getString("x00080070");
     const rows = getString("x00280010");
     const cols = getString("x00280011");
+    const repetitionTime = getString("x00180080");
+    const echoTime = getString("x00180081");
+    const flipAngle = getString("x00181314");
+    const sliceThickness = getString("x00180050");
+    const magneticFieldStrength = getString("x00180087");
+    const manufacturerModel = getString("x00081090");
+    const softwareVersions = getString("x00181020");
+    const acquisitionDate = getString("x00080022");
 
     const lines = [`DICOM File`, `─`.repeat(50)];
 
@@ -767,7 +815,15 @@ const parseDicomHeader = (buffer: ArrayBuffer): string => {
     if (patientAge) lines.push(`Age: ${patientAge}`);
     if (manufacturer) lines.push(`Scanner: ${manufacturer}`);
     if (rows && cols) lines.push(`Image Size: ${rows} × ${cols}`);
-
+    if (repetitionTime) lines.push(`RepetitionTime: ${repetitionTime}`);
+    if (echoTime) lines.push(`EchoTime: ${echoTime}`);
+    if (flipAngle) lines.push(`FlipAngle: ${flipAngle}`);
+    if (sliceThickness) lines.push(`SliceThickness: ${sliceThickness}`);
+    if (magneticFieldStrength)
+      lines.push(`MagneticFieldStrength: ${magneticFieldStrength}`);
+    if (manufacturerModel) lines.push(`Model: ${manufacturerModel}`);
+    if (softwareVersions) lines.push(`SoftwareVersions: ${softwareVersions}`);
+    if (acquisitionDate) lines.push(`AcquisitionDate: ${acquisitionDate}`);
     return lines.join("\n");
   } catch (e: any) {
     return `DICOM File\nSize: ${(buffer.byteLength / 1024).toFixed(
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
index 24aa930..cc30bc8 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/filenameTokenizer.ts
@@ -358,72 +358,6 @@ export const buildLLMPayload = (
   };
 };
 
-/**
- * Analyze token statistics across all filenames.
- * Mirrors FilenamePatternAnalyzer.analyze_token_statistics()
- */
-// export const analyzeTokenStatistics = (
-//   filenames: string[]
-// ): TokenStatistics => {
-//   const allTokens: Record<string, number> = {};
-//   const prefixTokens: Record<string, number> = {}; // first token only
-
-//   for (const filename of filenames) {
-//     // Extract just filename from path
-//     const fname = filename.includes("/")
-//       ? filename.split("/").pop()!
-//       : filename;
-
-//     const tokens = tokenizeFilename(fname);
-
-//     // Count all tokens
-//     for (const token of tokens) {
-//       allTokens[token] = (allTokens[token] || 0) + 1;
-//     }
-
-//     // CRITICAL: use first TOKEN as prefix (not regex match)
-//     if (tokens.length > 0) {
-//       const firstToken = tokens[0];
-//       prefixTokens[firstToken] = (prefixTokens[firstToken] || 0) + 1;
-//     }
-//   }
-
-//   const dominantPrefixes = findDominantPrefixes(prefixTokens, filenames.length);
-
-//   return {
-//     totalFiles: filenames.length,
-//     tokenFrequency: allTokens,
-//     prefixFrequency: prefixTokens,
-//     dominantPrefixes,
-//   };
-// };
-
-/*
- * Find dominant prefixes — tokens appearing in >5% of files
- * that are not common words.
- * Mirrors FilenamePatternAnalyzer._find_dominant_prefixes()
- */
-// const findDominantPrefixes = (
-//   prefixCounter: Record<string, number>,
-//   totalFiles: number
-// ): DominantPrefix[] => {
-//   const threshold = totalFiles * 0.05; // 5% threshold
-
-//   return Object.entries(prefixCounter)
-//     .filter(([prefix, count]) => {
-//       if (count < threshold) return false;
-//       if (COMMON_WORDS.has(prefix.toLowerCase())) return false;
-//       return true;
-//     })
-//     .sort((a, b) => b[1] - a[1])
-//     .slice(0, 20)
-//     .map(([prefix, count]) => ({
-//       prefix,
-//       count,
-//       percentage: Math.round((count / totalFiles) * 1000) / 10,
-//     }));
-// };
-
 // ============================================================================
 // Integration Functions
 // Mirrors analyze_filenames_for_subjects() + _generate_recommendation() in filename_tokenizer.py
@@ -605,525 +539,3 @@ export const createBlockingQuestion = (
     options,
   },
 });
-
-// ============================================================================
-// extractSubjectAnalysis — mirrors build_bids_plan()'s subject extraction
-// ============================================================================
-
-/**
- * Full subject extraction mirroring autobidsify's judgment sequence:
- *
- * 1. Try directory structure patterns (sub-01, subject_01, site_sub01, 001)
- * 2. If fails → try filename token statistics (dominant prefix approach)
- * 3. Generate ID mapping (already_bids / numeric / semantic)
- */
-// export const extractSubjectAnalysis = (allFiles: string[], userNSubjects?: number | null, dominantPrefixes?: { prefix: string; count: number; percentage: number }[]): SubjectAnalysis => {
-//   // ── Step 1: Try directory structure (mirrors _extract_subjects_from_directory_structure)
-//   const fromDir = extractFromDirectoryStructure(allFiles);
-//   if (fromDir && fromDir.subject_records.length > 0) {
-//     const idMapping = generateIdMapping(fromDir);
-//     return { ...fromDir, id_mapping: idMapping };
-//   }
-
-//   // ── Step 2: Filename token statistics (mirrors filename_tokenizer approach)
-//   const fromTokens = extractFromTokenStatistics(allFiles);
-//   if (fromTokens && fromTokens.subject_records.length > 0) {
-//     const idMapping = generateIdMapping(fromTokens);
-//     return { ...fromTokens, id_mapping: idMapping };
-//   }
-
-//   // ── Fallback: empty result
-//   return {
-//     success: false,
-//     method: "none",
-//     subject_records: [],
-//     subject_count: 0,
-//     has_site_info: false,
-//     variants_by_subject: {},
-//     python_generated_filename_rules: [],
-//     id_mapping: {
-//       id_mapping: {},
-//       reverse_mapping: {},
-//       strategy_used: "none",
-//       metadata_columns: [],
-//     },
-//   };
-// };
-
-// ── Step 1: Directory structure patterns
-// Mirrors _extract_subjects_from_directory_structure() in planner.py
-// const extractFromDirectoryStructure = (
-//   allFiles: string[]
-// ): Omit<SubjectAnalysis, "id_mapping"> | null => {
-//   const patterns: Array<[RegExp, boolean, number, number | null, string]> = [
-//     [/^([A-Za-z]+)_sub(\d+)$/i, true, 2, 1, "site_prefixed"],
-//     [/^sub-(\w+)$/i, false, 1, null, "standard_bids"],
-//     [/^subject[_-]?(\d+)$/i, false, 1, null, "simple"],
-//     [/^(\d{3,})$/, false, 1, null, "numeric_only"],
-//   ];
-
-//   const subjectRecords: SubjectRecord[] = [];
-//   const seenIds = new Set<string>();
-
-//   for (const filepath of allFiles) {
-//     const parts = filepath.split("/");
-//     for (const part of parts.slice(0, 2)) {
-//       for (const [
-//         regex,
-//         hasSite,
-//         idGroup,
-//         siteGroup,
-//         patternName,
-//       ] of patterns) {
-//         const match = part.match(regex);
-//         if (match) {
-//           const originalId = match[0];
-//           if (seenIds.has(originalId)) break;
-//           seenIds.add(originalId);
-//           subjectRecords.push({
-//             original_id: originalId,
-//             numeric_id: match[idGroup],
-//             site: hasSite && siteGroup ? match[siteGroup] : null,
-//             pattern_name: patternName,
-//             file_count: 0,
-//           });
-//           break;
-//         }
-//       }
-//     }
-//   }
-
-//   if (subjectRecords.length === 0) return null;
-
-//   subjectRecords.sort((a, b) => {
-//     const na = parseInt(a.numeric_id) || 0;
-//     const nb = parseInt(b.numeric_id) || 0;
-//     return na - nb;
-//   });
-
-//   return {
-//     success: true,
-//     method: "directory_structure",
-//     subject_records: subjectRecords,
-//     subject_count: subjectRecords.length,
-//     has_site_info: subjectRecords.some((r) => r.site !== null),
-//     variants_by_subject: {},
-//     python_generated_filename_rules: [],
-//   };
-// };
-
-// ── Step 2: Token statistics (dominant prefix approach)
-// Mirrors FilenamePatternAnalyzer + analyze_filenames_for_subjects() in filename_tokenizer.py
-// const extractFromTokenStatistics = (
-//   allFiles: string[]
-// ): Omit<SubjectAnalysis, "id_mapping"> | null => {
-//   // Extract just filenames (not full paths) — mirrors filename_tokenizer.py line:
-//   // filenames = [f.split('/')[-1] for f in all_files]
-//   const filenames = allFiles.map((f) =>
-//     f.includes("/") ? f.split("/").pop()! : f
-//   );
-
-//   const stats = analyzeTokenStatistics(filenames);
-
-//   if (stats.dominantPrefixes.length === 0) return null;
-
-//   // Count files per prefix
-//   const prefixFileCounts: Record<string, number> = {};
-//   for (const filename of filenames) {
-//     const tokens = tokenizeFilename(filename);
-//     if (tokens.length > 0) {
-//       const first = tokens[0];
-//       if (stats.dominantPrefixes.some((p) => p.prefix === first)) {
-//         prefixFileCounts[first] = (prefixFileCounts[first] || 0) + 1;
-//       }
-//     }
-//   }
-
-//   const subjectRecords: SubjectRecord[] = stats.dominantPrefixes.map(
-//     (p, i) => ({
-//       original_id: p.prefix,
-//       numeric_id: String(i + 1),
-//       site: null,
-//       pattern_name: "dominant_prefix",
-//       file_count: prefixFileCounts[p.prefix] || p.count,
-//     })
-//   );
-
-//   return {
-//     success: true,
-//     method: "dominant_prefix_fallback",
-//     subject_records: subjectRecords,
-//     subject_count: subjectRecords.length,
-//     has_site_info: false,
-//     variants_by_subject: {},
-//     python_generated_filename_rules: [],
-//   };
-// };
-
-/**
- * Mirrors _extract_numeric_id_from_identifier() in planner.py
- * BZZ003 → "003", sub-01 → "01", patient021 → "021"
- */
-const extractNumericIdFromIdentifier = (identifier: string): string | null => {
-  const numbers = identifier.match(/\d+/g);
-  if (!numbers) return null;
-  return numbers[numbers.length - 1]; // last numeric sequence, preserving leading zeros
-};
-
-// ── Step 1: Directory structure patterns
-// Mirrors _extract_subjects_from_directory_structure() in planner.py
-const SKIP_DIRS = new Set([
-  "anat",
-  "func",
-  "dwi",
-  "fmap",
-  "nirs",
-  "meg",
-  "eeg",
-  "beh",
-  "perf",
-  "derivatives",
-  "sourcedata",
-  "stimuli",
-  "walking",
-  "resting",
-  "resting_state",
-  "run",
-  "ses",
-  "pd",
-  "control",
-  "hc",
-  "task",
-  "sub",
-  "dataset",
-  "data",
-  "raw",
-  "bids",
-  "output",
-  "outputs",
-  "staging",
-  "_staging",
-  "mri",
-  "fnirs",
-  "edf",
-  "dicom",
-]);
-
-const extractFromDirectoryStructure = (
-  allFiles: string[]
-): Omit<SubjectAnalysis, "id_mapping"> | null => {
-  const patterns: Array<[RegExp, boolean, number, number | null, string]> = [
-    [/^([A-Za-z]+)_sub(\d+)$/i, true, 2, 1, "site_prefixed"], // Beijing_sub82352
-    [/^sub-(\w+)$/, false, 1, null, "standard_bids"], // sub-01
-    [/^subject[_-]?(\d+)$/i, false, 1, null, "simple"], // subject_01
-    [/^\d{3,}$/, false, 1, null, "numeric_only"], // 001
-    [/^([A-Za-z]+\d+)$/, false, 1, null, "alphanum_id"], // PD01, Control01, HC03
-  ];
-
-  const subjectRecords: SubjectRecord[] = [];
-  const seenIds = new Set<string>();
-
-  for (const filepath of allFiles) {
-    const parts = filepath.split("/");
-    // Check ALL directory levels (not just first 2)
-    const dirsOnly = parts.slice(0, parts.length - 1);
-    // const dirsOnly = parts.slice(0, Math.min(2, parts.length - 1)); // only first 2 levels
-
-    for (const part of dirsOnly) {
-      // Skip known non-subject directory names
-      // if (SKIP_DIRS.has(part.toLowerCase())) continue;
-
-      for (const [
-        regex,
-        hasSite,
-        idGroup,
-        siteGroup,
-        patternName,
-      ] of patterns) {
-        const match = part.match(regex);
-        if (match) {
-          const originalId = match[0];
-          if (seenIds.has(originalId)) break;
-          seenIds.add(originalId);
-          subjectRecords.push({
-            original_id: originalId,
-            numeric_id: match[idGroup] || match[0],
-            site: hasSite && siteGroup ? match[siteGroup] : null,
-            pattern_name: patternName,
-            file_count: 0,
-          });
-          break;
-        }
-      }
-    }
-  }
-
-  if (subjectRecords.length === 0) return null;
-
-  subjectRecords.sort((a, b) => {
-    // const na = parseInt(a.numeric_id) || 0;
-    // const nb = parseInt(b.numeric_id) || 0;
-    // return na - nb;
-    const aMatch = a.original_id.match(/^([A-Za-z]+)(\d+)$/);
-    const bMatch = b.original_id.match(/^([A-Za-z]+)(\d+)$/);
-
-    if (aMatch && bMatch) {
-      const prefixCompare = aMatch[1].localeCompare(bMatch[1]);
-      if (prefixCompare !== 0) return prefixCompare;
-      return parseInt(aMatch[2]) - parseInt(bMatch[2]);
-    }
-
-    const na = parseInt(a.numeric_id) || 0;
-    const nb = parseInt(b.numeric_id) || 0;
-    return na - nb;
-  });
-
-  // Build group map: subject originalId → parent directory name
-  // const groupMap: Record<string, string> = {};
-  // for (const filepath of allFiles) {
-  //   const parts = filepath.split("/");
-  //   for (let i = 1; i < parts.length - 1; i++) {
-  //     if (seenIds.has(parts[i]) && !SKIP_DIRS.has(parts[i - 1].toLowerCase())) {
-  //       groupMap[parts[i]] = parts[i - 1];
-  //     }
-  //   }
-  // }
-
-  // // Attach group to each record
-  // for (const rec of subjectRecords) {
-  //   if (groupMap[rec.original_id]) {
-  //     rec.group = groupMap[rec.original_id];
-  //   }
-  // }
-
-  return {
-    success: true,
-    method: "directory_structure",
-    subject_records: subjectRecords,
-    subject_count: subjectRecords.length,
-    has_site_info: subjectRecords.some((r) => r.site !== null),
-    variants_by_subject: {},
-    python_generated_filename_rules: [],
-  };
-};
-
-const TRIO_FILENAMES = new Set([
-  "dataset_description.json",
-  "participants.tsv",
-  "readme.md",
-  "readme.txt",
-  "readme.rst",
-  "readme",
-]);
-// ── Step 2: Flat filename identifier extraction
-// Mirrors _extract_subjects_from_flat_filenames() in planner.py
-// KEY DIFFERENCE from old version: uses base identifier (before first _)
-// not tokenizer dominant prefixes
-const extractFromFlatFilenames = (
-  allFiles: string[]
-): Omit<SubjectAnalysis, "id_mapping"> | null => {
-  const identifierToFiles: Record<string, string[]> = {};
-
-  for (const filepath of allFiles) {
-    const filename = filepath.split("/").pop()!;
-
-    // Skip trio files
-    if (TRIO_FILENAMES.has(filename.toLowerCase())) continue;
-    // Skip non-data files (PDFs, docs, JSONs that aren't data)
-    if (!DATA_EXTENSIONS.test(filename)) continue;
-    // Remove extension(s): sub-01_ses-left2s_task-FRESHMOTOR_nirs.snirf → sub-01_ses-left2s_task-FRESHMOTOR_nirs
-    const nameNoExt = filename.replace(/(\.[^.]+)+$/, "");
-
-    // Extract base identifier — alphanumeric before first underscore
-    // sub-01_ses-left2s → sub-01
-    // BZZ003_rest → BZZ003
-    // VHMCT1mm-Hip → VHMCT1mm-Hip (no underscore, take full name)
-    const match = nameNoExt.match(/^([A-Za-z0-9\-]+)/);
-    if (match) {
-      const identifier = match[1];
-      if (!identifierToFiles[identifier]) identifierToFiles[identifier] = [];
-      identifierToFiles[identifier].push(filepath);
-    }
-  }
-
-  if (Object.keys(identifierToFiles).length === 0) return null;
-
-  // Sort by extracted numeric ID if possible (mirrors sort_key in planner.py)
-  const sortedIdentifiers = Object.keys(identifierToFiles).sort((a, b) => {
-    const na = extractNumericIdFromIdentifier(a);
-    const nb = extractNumericIdFromIdentifier(b);
-    if (na && nb) return parseInt(na) - parseInt(nb);
-    return a.localeCompare(b);
-  });
-
-  const subjectRecords: SubjectRecord[] = sortedIdentifiers.map(
-    (identifier, i) => ({
-      original_id: identifier,
-      numeric_id: String(i + 1),
-      site: null,
-      pattern_name: "filename_identifier",
-      file_count: identifierToFiles[identifier].length,
-    })
-  );
-
-  return {
-    success: true,
-    method: "flat_filename_identifiers",
-    subject_records: subjectRecords,
-    subject_count: subjectRecords.length,
-    has_site_info: false,
-    variants_by_subject: {},
-    python_generated_filename_rules: [],
-  };
-};
-
-export const extractSubjectAnalysis = (
-  allFiles: string[],
-  userNSubjects?: number | null,
-  dominantPrefixes?: { prefix: string; count: number; percentage: number }[]
-): SubjectAnalysis => {
-  // Step 1: directory structure
-  let subjectInfo = extractFromDirectoryStructure(allFiles);
-
-  // Step 2: flat filename fallback
-  if (!subjectInfo || subjectInfo.subject_records.length === 0) {
-    subjectInfo = extractFromFlatFilenames(allFiles);
-  }
-
-  if (!subjectInfo || subjectInfo.subject_records.length === 0) {
-    return {
-      success: false,
-      method: "none",
-      subject_records: [],
-      subject_count: 0,
-      has_site_info: false,
-      variants_by_subject: {},
-      python_generated_filename_rules: [],
-      id_mapping: {
-        id_mapping: {},
-        reverse_mapping: {},
-        strategy_used: "none",
-        metadata_columns: [],
-      },
-    };
-  }
-
-  // ── CRITICAL validation: mirrors planner.py lines 190-215
-  // If extracted count doesn't match user hint but dominant prefixes do,
-  // fall back to dominant prefixes (handles VHM/VHF body-part over-extraction)
-  const pythonCount = subjectInfo.subject_count;
-  if (
-    userNSubjects &&
-    pythonCount !== userNSubjects &&
-    dominantPrefixes &&
-    dominantPrefixes.length === userNSubjects
-  ) {
-    subjectInfo = {
-      success: true,
-      method: "dominant_prefix_fallback",
-      subject_records: dominantPrefixes.map((p, i) => ({
-        original_id: p.prefix,
-        numeric_id: String(i + 1),
-        site: null,
-        pattern_name: "dominant_prefix",
-        file_count: p.count,
-      })),
-      subject_count: dominantPrefixes.length,
-      has_site_info: false,
-      variants_by_subject: {},
-      python_generated_filename_rules: [],
-    };
-  }
-  // bug fix for subject mapping
-  // === original
-  // const idMapping = generateIdMapping(subjectInfo);
-  // return { ...subjectInfo, id_mapping: idMapping };
-  // ==== end
-  // ==== updates
-  // CRITICAL: n_subjects is authoritative (mirrors planner.py PROMPT_BIDS_PLAN)
-  // If analysis count doesn't match user input, fall back to sequential numbering
-  const expectedCount = userNSubjects;
-  if (expectedCount && subjectInfo.subject_count !== expectedCount) {
-    const idMap: Record<string, string> = {};
-    const reverseMap: Record<string, string> = {};
-    for (let i = 1; i <= expectedCount; i++) {
-      const bidsId = String(i).padStart(2, "0");
-      idMap[`sub-${bidsId}`] = bidsId;
-      reverseMap[bidsId] = `sub-${bidsId}`;
-    }
-    return {
-      ...subjectInfo,
-      subject_count: expectedCount,
-      id_mapping: {
-        id_mapping: idMap,
-        reverse_mapping: reverseMap,
-        strategy_used: "numeric_fallback",
-        metadata_columns: [],
-      },
-    };
-  }
-
-  const idMapping = generateIdMapping(subjectInfo);
-  return { ...subjectInfo, id_mapping: idMapping };
-};
-
-// ── ID mapping — mirrors _generate_subject_id_mapping() in planner.py
-const generateIdMapping = (
-  subjectInfo: Omit<SubjectAnalysis, "id_mapping">
-): SubjectAnalysis["id_mapping"] => {
-  const records = subjectInfo.subject_records;
-  const idMapping: Record<string, string> = {};
-  const reverseMapping: Record<string, string> = {};
-
-  // Detect already-BIDS format (sub-01, sub-02...)
-  const allAlreadyBids = records.every((r) => /^sub-\w+$/i.test(r.original_id));
-
-  if (allAlreadyBids) {
-    for (const rec of records) {
-      const bidsId = rec.original_id.replace(/^sub-/i, "");
-      idMapping[rec.original_id] = bidsId;
-      reverseMapping[bidsId] = rec.original_id;
-    }
-    return {
-      id_mapping: idMapping,
-      reverse_mapping: reverseMapping,
-      strategy_used: "already_bids",
-      metadata_columns: [],
-    };
-  }
-
-  // Numeric strategy: try to extract trailing numbers first
-  // BZZ003 → "003", patient021 → "021" (mirrors _extract_numeric_id_from_identifier)
-  const extractedNumbers: Record<string, string> = {};
-  for (const rec of records) {
-    const nums = rec.original_id.match(/\d+/g);
-    if (nums) extractedNumbers[rec.original_id] = nums[nums.length - 1];
-  }
-
-  const numericValues = Object.values(extractedNumbers);
-  const allUnique = new Set(numericValues).size === numericValues.length;
-
-  if (Object.keys(extractedNumbers).length === records.length && allUnique) {
-    // Use extracted numeric IDs (preserving leading zeros)
-    for (const rec of records) {
-      const bidsId = extractedNumbers[rec.original_id];
-      idMapping[rec.original_id] = bidsId;
-      reverseMapping[bidsId] = rec.original_id;
-    }
-  } else {
-    // Fall back to sequential numbering
-    for (let i = 0; i < records.length; i++) {
-      const orig = records[i].original_id;
-      const bidsId = String(i + 1);
-      idMapping[orig] = bidsId;
-      reverseMapping[bidsId] = orig;
-    }
-  }
-
-  return {
-    id_mapping: idMapping,
-    reverse_mapping: reverseMapping,
-    strategy_used: "numeric",
-    metadata_columns: ["original_id"],
-  };
-};
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/llm.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/llm.ts
new file mode 100644
index 0000000..4e17c34
--- /dev/null
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/llm.ts
@@ -0,0 +1,963 @@
+// src/components/User/Dashboard/DatasetOrganizer/utils/llm.ts
+//
+// Mirrors autobidsify/llm.py
+// Unified LLM caller supporting OpenAI, Qwen (Ollama), Anthropic, Groq, OpenRouter.
+//
+// Python equivalents:
+//   LLMHardFail                  → LLMHardFail class
+//   isQwenModel()                → is_qwen_model()
+//   isOpenAIModel()              → is_openai_model()
+//   isReasoningModel()           → is_reasoning_model()
+//   inferQwenTemperature()       → _infer_qwen_temperature()
+//   callLLM()                    → _call_llm()
+//   PROMPT_TRIO_DATASET_DESC     → PROMPT_TRIO_DATASET_DESC
+//   PROMPT_TRIO_README           → PROMPT_TRIO_README
+//   (no TS constant)             → PROMPT_TRIO_PARTICIPANTS (participants step no longer calls the LLM)
+//   PROMPT_BIDS_PLAN             → PROMPT_BIDS_PLAN
+//   PROMPT_MAT_SNIRF_MAPPING     → PROMPT_MAT_SNIRF_MAPPING
+//   llmTrioDatasetDescription()  → llm_trio_dataset_description()
+//   llmTrioReadme()              → llm_trio_readme()
+//   llmTrioParticipants()        → llm_trio_participants()  (kept only as commented-out code)
+//   llmBidsPlan()                → llm_bids_plan()
+//   llmMapMatToSnirf()           → llm_map_mat_to_snirf()
+//
+// DIFFERENCES FROM llm.py — flagged inline with "TS addition" / "TS-only" comments
+import { OllamaService } from "services/ollama.service";
+
+// ============================================================================
+// LLMHardFail
+// Mirrors LLMHardFail exception class in llm.py
+// `message` is the raw detail text; `step` and `error_type` identify the failure.
+// ============================================================================
+
+export class LLMHardFail extends Error {
+  step: string;
+  error_type: string;
+  constructor(step: string, errorType: string, message: string) {
+    super(`[${step}] ${errorType}: ${message}`);
+    this.name = "LLMHardFail"; // so String(e) and logs do not show a bare "Error"
+    this.step = step;
+    this.error_type = errorType;
+    this.message = message; // overwrites the formatted text given to super()
+  }
+}
+
+// ============================================================================
+// Provider detection
+// Mirrors is_qwen_model(), is_openai_model(), is_reasoning_model()
+// ============================================================================
+
+// Case-insensitive test: does `model` start with any of `prefixes`?
+const hasModelPrefix = (model: string, prefixes: string[]): boolean =>
+  prefixes.some((prefix) => model.toLowerCase().startsWith(prefix));
+
+export const isQwenModel = (model: string): boolean =>
+  hasModelPrefix(model, ["qwen"]);
+
+export const isOpenAIModel = (model: string): boolean =>
+  hasModelPrefix(model, ["gpt", "o1", "o3"]);
+
+export const isReasoningModel = (model: string): boolean =>
+  hasModelPrefix(model, ["o1", "o3", "gpt-5"]);
+
+// TS addition: Python covers OpenAI + Qwen; TS adds Anthropic, Groq, OpenRouter.
+export const isAnthropicModel = (model: string): boolean =>
+  hasModelPrefix(model, ["claude"]);
+
+// ============================================================================
+// Temperature inference for Qwen
+// Mirrors _infer_qwen_temperature() in llm.py
+// ============================================================================
+
+export const inferQwenTemperature = (
+  model: string,
+  baseTemperature: number | null
+): number | null => {
+  // null means no temperature was requested; pass that through unchanged.
+  if (baseTemperature === null) return null;
+  const lowered = model.toLowerCase();
+  const mentions = (keywords: string[]): boolean =>
+    keywords.some((keyword) => lowered.includes(keyword));
+  // think/careful/compare/reason in the name: cap the temperature at 0.15.
+  if (mentions(["think", "careful", "compare", "reason"]))
+    return Math.min(baseTemperature, 0.15);
+  // next/fast/turbo/lite: floor of 0.4; any other name: floor of 0.3.
+  const floor = mentions(["next", "fast", "turbo", "lite"]) ? 0.4 : 0.3;
+  return Math.max(baseTemperature, floor);
+};
+
+// ============================================================================
+// LLM config type
+// TS-only: Python uses env vars + CLI args; TS gets config from UI state
+// ============================================================================
+
+export interface LLMConfig {
+  provider: string; // "ollama" sends callLLM down the OllamaService path
+  model: string; // model name sent in the request; its prefix also drives routing
+  apiKey: string; // sent as x-api-key (Anthropic) or Bearer token (OpenAI-compatible)
+  baseUrl: string; // URL callLLM POSTs to on the Anthropic and OpenAI-compatible paths
+  isAnthropic?: boolean; // forces the Anthropic request format regardless of model name
+  noApiKey?: boolean; // omit the Authorization header on the OpenAI-compatible path
+}
+
+// ============================================================================
+// callLLM()
+// Mirrors _call_llm() unified entry point in llm.py
+//
+// Routes to Ollama (provider "ollama" or qwen*), then Anthropic (isAnthropic or
+// claude*; TS only), else an OpenAI-compatible endpoint (OpenAI/Groq/OpenRouter).
+// Resolves with the trimmed reply; failures and empty replies throw LLMHardFail.
+// ============================================================================
+
+// Error text for a non-2xx response; the body may not be JSON (e.g. HTML 502).
+const readErrorMessage = async (res: Response): Promise<string> => {
+  const fallback = `HTTP ${res.status} ${res.statusText}`.trim();
+  try {
+    return (await res.json())?.error?.message ?? fallback;
+  } catch {
+    return fallback;
+  }
+};
+
+export const callLLM = async (
+  systemPrompt: string,
+  userPayload: string,
+  step: string,
+  llmConfig: LLMConfig,
+  temperature: number | null = null,
+  signal?: AbortSignal
+): Promise<string> => {
+  const { provider, model, apiKey, baseUrl, isAnthropic, noApiKey } = llmConfig;
+
+  // ── Qwen via Ollama proxy ─────────────────────────────────────────
+  // Mirrors _call_qwen() (Python: local Ollama / REST API / DashScope). TS only
+  // uses the REST proxy (OllamaService routes to jin.neu.edu:11434).
+  // NOTE(review): `signal` is not forwarded to OllamaService.chat on this path.
+  if (provider === "ollama" || isQwenModel(model)) {
+    const temp = inferQwenTemperature(model, temperature);
+    try {
+      const res = await OllamaService.chat(
+        model,
+        [
+          { role: "system", content: systemPrompt },
+          { role: "user", content: userPayload },
+        ],
+        temp ?? undefined
+      );
+      const content = res?.choices?.[0]?.message?.content ?? "";
+      if (content.trim()) return content.trim();
+      throw new LLMHardFail(
+        step,
+        "EmptyResponse",
+        "Ollama returned empty content"
+      );
+    } catch (e) {
+      if (e instanceof LLMHardFail) throw e;
+      const msg = String(e).toLowerCase();
+      if (msg.includes("connection") || msg.includes("refused"))
+        throw new LLMHardFail(
+          step,
+          "OllamaNotRunning",
+          "Cannot connect to Ollama proxy"
+        );
+      throw new LLMHardFail(step, "QwenError", String(e));
+    }
+  }
+
+  // ── Anthropic Claude ──────────────────────────────────────────────
+  // TS addition — not in Python llm.py
+  if (isAnthropic || isAnthropicModel(model)) {
+    try {
+      const res = await fetch(baseUrl, {
+        method: "POST",
+        signal,
+        headers: {
+          "Content-Type": "application/json",
+          "x-api-key": apiKey,
+          "anthropic-version": "2023-06-01",
+        },
+        body: JSON.stringify({
+          model,
+          max_tokens: isReasoningModel(model) ? 32000 : 16000,
+          messages: [
+            { role: "user", content: `${systemPrompt}\n\n${userPayload}` },
+          ],
+        }),
+      });
+      // Check the status before parsing: error bodies are not always JSON.
+      if (!res.ok)
+        throw new LLMHardFail(
+          step,
+          "AnthropicError",
+          await readErrorMessage(res)
+        );
+      const data = await res.json();
+      const content = data?.content?.[0]?.text ?? "";
+      if (content.trim()) return content.trim();
+      throw new LLMHardFail(
+        step,
+        "EmptyResponse",
+        "Anthropic returned empty content"
+      );
+    } catch (e) {
+      if (e instanceof LLMHardFail) throw e;
+      throw new LLMHardFail(step, "AnthropicError", String(e));
+    }
+  }
+
+  // ── OpenAI-compatible (OpenAI, Groq, OpenRouter) ──────────────────
+  // Mirrors _call_openai() in llm.py.
+  // Groq and OpenRouter use the same OpenAI-compatible API format.
+  try {
+    // Mirrors llm.py: reasoning models get 32000 tokens and no temperature.
+    const reasoning = isReasoningModel(model);
+    const params: Record<string, any> = {
+      model,
+      messages: [
+        { role: "system", content: systemPrompt },
+        { role: "user", content: userPayload },
+      ],
+      max_completion_tokens: reasoning ? 32000 : 16000,
+    };
+    if (!reasoning && temperature !== null) params.temperature = temperature;
+
+    const res = await fetch(baseUrl, {
+      method: "POST",
+      signal,
+      headers: {
+        "Content-Type": "application/json",
+        ...(noApiKey ? {} : { Authorization: `Bearer ${apiKey}` }),
+      },
+      body: JSON.stringify(params),
+    });
+    // Check the status before parsing: error bodies are not always JSON.
+    if (!res.ok)
+      throw new LLMHardFail(step, "OpenAIError", await readErrorMessage(res));
+    const data = await res.json();
+    const content = data?.choices?.[0]?.message?.content ?? "";
+    if (content.trim()) return content.trim();
+    throw new LLMHardFail(
+      step,
+      "EmptyResponse",
+      "OpenAI returned empty content"
+    );
+  } catch (e) {
+    if (e instanceof LLMHardFail) throw e;
+    throw new LLMHardFail(step, "UnexpectedError", String(e));
+  }
+};
+
+// ============================================================================
+// Prompts
+// Mirrors all PROMPT_* constants in llm.py
+// These are the EXACT strings from llm.py — no changes.
+// ============================================================================
+
+export const PROMPT_TRIO_DATASET_DESC = `You are a BIDS dataset_description.json metadata extractor.
+
+═══════════════════════════════════════════════════════
+YOUR JOB
+═══════════════════════════════════════════════════════
+
+Extract dataset metadata from the input. Return ONLY valid JSON, no markdown.
+
+═══════════════════════════════════════════════════════
+CRITICAL RULES
+═══════════════════════════════════════════════════════
+
+1. LICENSE — output as "raw_license" (plain string, NOT normalized):
+   - Copy exactly what the user wrote, e.g. "CC0", "CC BY 4.0",
+     "Creative Commons Zero", "public domain", "MIT license"
+   - Do NOT try to normalize or format it — Python will do that
+   - If the user wrote "License: CC0" → raw_license: "CC0"
+   - If the document says "released under Creative Commons" → raw_license: "Creative Commons"
+   - If no license mentioned anywhere → omit raw_license
+
+2. AUTHORS — extract from ALL available sources:
+   - Search in order: user_hints.user_text → documents[]
+   - Look for: explicit author lists, citation patterns, "Created by",
+     "Principal Investigator", "Contact", "Contributors" sections
+   - If full names are available, use them: ["Last FM", "Last FM"]
+   - If only "et al." citation exists, keep first author + et al.: ["Shafto MA et al."]
+   - Do NOT infer, guess, or use outside knowledge to expand author lists
+   - Do NOT fabricate names not present in any input source
+   - If no author information found anywhere, omit Authors field entirely
+
+   EXAMPLES (follow exactly):
+
+   Input: "Smith et al. (2023). A neuroimaging study..."
+   Output: "Authors": ["Smith et al."]
+
+   Input: "Created by John Doe, Jane Smith and Bob Lee"
+   Output: "Authors": ["John Doe", "Jane Smith", "Bob Lee"]
+
+   Input: "Data collected by the CamCAN team. Contact: info@cam.ac.uk"
+   Output: (omit Authors field)
+
+   Input: "Shafto et al. (2014). The Cambridge Centre for Ageing..."
+   Output: "Authors": ["Shafto et al."]
+
+3. NAME — infer from context:
+   - Look for explicit dataset name in user_hints.user_text
+   - If not found, infer from the scientific context
+   - Keep it short and descriptive
+
+4. MISSING FIELDS — omit rather than guess:
+   - If you cannot determine a field with reasonable confidence, omit it
+   - Never invent information not present in the input
+
+═══════════════════════════════════════════════════════
+OUTPUT FORMAT
+═══════════════════════════════════════════════════════
+
+{
+  "dataset_description": {
+    "Name": "...",
+    "BIDSVersion": "1.10.0",
+    "DatasetType": "raw",
+    "Authors": ["First Last", "First Last"]
+  },
+  "raw_license": "CC0",
+  "extraction_log": {
+    "Name": "inferred from user_text: '...'",
+    "raw_license": "found in user_text: 'License: CC0'",
+    "Authors": "extracted from citation in user_text"
+  },
+  "questions": []
+}
+
+Notes:
+- raw_license goes at the TOP LEVEL (not inside dataset_description)
+- dataset_description should NOT contain a "License" field — Python adds it after normalization
+- BIDSVersion must always be "1.10.0"
+- DatasetType must always be "raw"
+- Output ONLY valid JSON, no extra text, no markdown fences
+
+FIELD SOURCE RULES (STRICT - violations cause data integrity failure):
+┌─────────────────┬────────────────────────────────────────────────────┐
+│ Field           │ Allowed sources                                    │
+├─────────────────┼────────────────────────────────────────────────────┤
+│ Authors         │ user_hints.user_text or documents[] ONLY           │
+│                 │ NEVER use training knowledge to expand et al.      │
+│ raw_license     │ user_hints.user_text or documents[] ONLY           │
+│ Name            │ may infer from context if not explicit             │
+│ BIDSVersion     │ always "1.10.0" (fixed)                            │
+│ DatasetType     │ always "raw" (fixed)                               │
+└─────────────────┴────────────────────────────────────────────────────┘`;
+
+export const PROMPT_TRIO_README = `Generate README.md for BIDS dataset.
+
+CRITICAL: Use user_hints.user_text as primary source for README content.
+
+Create comprehensive README with sections:
+- Overview
+- Dataset Description
+- Data Acquisition
+- File Organization
+- Usage Notes
+- References
+
+Output: Direct Markdown text (no JSON wrapper)`;
+
+export const PROMPT_BIDS_PLAN = `You are a BIDS dataset architect with complete decision-making authority.
+
+═══════════════════════════════════════════════════════════════════════
+SUPPORTED FORMATS AND CONVERSION RULES
+═══════════════════════════════════════════════════════════════════════
+
+MRI FORMATS (modality: mri):
+  • DICOM (.dcm)           → convert_to: nifti   (dcm2niix)
+  • NIfTI (.nii, .nii.gz)  → format_ready: true  (copy directly)
+  • JNIfTI (.jnii, .bnii)  → convert_to: nifti
+
+fNIRS FORMATS (modality: nirs):
+  • SNIRF (.snirf)         → format_ready: true  (copy directly)
+  • Homer3 (.nirs)         → convert_to: snirf
+  • MATLAB (.mat)          → convert_to: snirf
+
+═══════════════════════════════════════════════════════════════════════
+SUBJECT IDENTIFICATION — MOST IMPORTANT STEP
+═══════════════════════════════════════════════════════════════════════
+
+Your first job is to correctly identify all subjects from the file list.
+The dataset may use ANY of the following structures:
+
+STRUCTURE 1 — Already BIDS (sub-XX directories)
+  sub-01/nirs/sub-01_task-rest_nirs.snirf
+  sub-02/nirs/sub-02_task-rest_nirs.snirf
+  → Use 'already_bids' strategy. Strip 'sub-' prefix.
+
+STRUCTURE 2 — Site-prefixed directories
+  Beijing_sub82352/anat/scan.nii.gz
+  Newark_sub41006/anat/scan.nii.gz
+  → Use directory names as subject identifiers.
+
+STRUCTURE 3 — Flat files with numeric suffix
+  VHMCT1mm-Hip (134).dcm  (prefix VHM = subject 1)
+  VHFCT1mm-Hip (45).dcm   (prefix VHF = subject 2)
+  → Use filename prefix as subject identifier.
+
+STRUCTURE 4 — Group/subject nested directories
+  PD/PD_01.snirf
+  PD/PD_02.snirf
+  control/control_01.snirf
+  control/control_20.snirf
+  → Each unique filename base (PD_01, PD_02 ... control_01 ... control_20)
+    is ONE subject. The parent directory (PD / control) is the GROUP,
+    not the subject. Add 'group' column to participant_metadata.
+  → Assign numeric IDs: PD_01→1, PD_02→2 ... control_01→21 ... control_20→40
+
+STRUCTURE 5 — Task/group/subject nested directories
+  walking/PD/PD_01.snirf
+  walking/control/control_01.snirf
+  → Same as Structure 4. Ignore the task-level directory when identifying subjects.
+    The task name goes into the BIDS filename (task-walking), not the subject ID.
+
+STRUCTURE 6 — Pure numeric directories
+  001/scan.dcm
+  002/scan.dcm
+  → Use directory number as subject ID.
+
+CRITICAL RULES FOR SUBJECT COUNTING:
+1. python_subject_analysis.subject_count is a HINT, not authoritative.
+2. user_hints.n_subjects is the AUTHORITATIVE count.
+   If provided, your assignment_rules MUST produce exactly that many subjects.
+3. Count the actual unique files/directories to determine the true number.
+4. For group/subject nested structures: count UNIQUE FILES, not directories.
+   (PD/ and control/ are 2 directories but may contain 40 subjects total)
+
+═══════════════════════════════════════════════════════════════════════
+GROUP METADATA
+═══════════════════════════════════════════════════════════════════════
+
+When the dataset has clinically meaningful groups (PD vs control,
+patient vs healthy, treated vs untreated):
+- Add a 'group' column to participant_metadata for EVERY subject.
+- Use the exact group label from the directory or filename.
+
+Example for PD dataset with 40 subjects:
+  participant_metadata:
+    '1':  {original_id: 'PD_01',      group: 'PD'}
+    '2':  {original_id: 'PD_02',      group: 'PD'}
+    ...
+    '21': {original_id: 'control_01', group: 'control'}
+    ...
+    '40': {original_id: 'control_20', group: 'control'}
+
+═══════════════════════════════════════════════════════════════════════
+ASSIGNMENT RULES
+═══════════════════════════════════════════════════════════════════════
+
+Each rule maps source files to one BIDS subject ID.
+
+CRITICAL: 'subject' field must be BARE ID — no 'sub-' prefix.
+  ✓ subject: '1'      → executor creates sub-1
+  ✗ subject: 'sub-1'  → executor creates sub-sub-1
+
+For group/subject nested structures, use the filename as the match token:
+  assignment_rules:
+    - subject: '1'
+      original: 'PD_01'
+      match: ['*PD_01*']
+    - subject: '21'
+      original: 'control_01'
+      match: ['*control_01*']
+
+For prefix-based flat structures:
+  assignment_rules:
+    - subject: '1'
+      original: 'VHM'
+      match: ['*VHM*']
+    - subject: '2'
+      original: 'VHF'
+      match: ['*VHF*']
+
+═══════════════════════════════════════════════════════════════════════
+FORMAT_READY AND CONVERT_TO RULES
+═══════════════════════════════════════════════════════════════════════
+
+format_ready: true  → .nii/.nii.gz (MRI) or .snirf (fNIRS) — copy directly
+format_ready: false → needs conversion:
+  .dcm / .jnii / .bnii → convert_to: nifti
+  .mat / .nirs         → convert_to: snirf
+convert_to: "none"   → only when format_ready: true
+
+═══════════════════════════════════════════════════════════════════════
+FILENAME RULES — TASK INFERENCE
+═══════════════════════════════════════════════════════════════════════
+
+For fNIRS: infer task name from directory structure or user description.
+  walking/ directory → task-walking
+  fingertapping/ or tapping/ → task-fingertapping
+  resting/ or rest/ → task-rest
+
+For MRI: use acq- to distinguish different scan series from same subject.
+  VHFCT1mm-Ankle.dcm → acq-ankle_T1w
+  VHFCT1mm-Head.dcm  → acq-head_T1w
+
+═══════════════════════════════════════════════════════════════════════
+OUTPUT FORMAT
+═══════════════════════════════════════════════════════════════════════
+
+subjects:
+  labels: [list of bare BIDS IDs, e.g. ['1','2',...,'40']]
+  count: N
+  source: llm_analysis
+  id_strategy: numeric / semantic / already_bids
+
+assignment_rules:
+  - subject: 'bare_id'
+    original: 'exact_identifier_from_filename_or_dirname'
+    match: ['*identifier*']
+
+participant_metadata:
+  'bare_id':
+    original_id: 'xxx'
+    group: 'PD'          # if applicable
+    sex: 'M'             # if available
+    age: '65'            # if available
+
+mappings:
+  - modality: nirs
+    match: ['**/*.snirf']
+    exclude: []
+    format_ready: true
+    convert_to: none
+    filename_rules:
+      - match_pattern: '.*'
+        bids_template: 'sub-X_task-walking_nirs.snirf'
+
+OUTPUT: Raw YAML only (no markdown, no explanation)`;
+
+export const PROMPT_MAT_SNIRF_MAPPING = `You are an fNIRS data format expert.
+
+You will receive a JSON summary of one or more MATLAB .mat files from the
+same structural group. The summary contains a "flat_vars" dict where all
+scipy struct wrappers have already been unwrapped — what you see reflects
+the actual data shape and content.
+
+flat_vars key conventions:
+- Top-level variable:     "d", "t", "fs"
+- Struct field:           "dat.signal", "SD.Lambda", "dat.fs"
+- "likely_data": true     marks tall 2D float arrays (n_samples > n_channels)
+- "value"                 means scalar
+- "values"                means small array with known content
+- "string_array" dtype    means channel labels or string metadata
+
+Use flat_vars keys EXACTLY as they appear. Do not invent new paths.
+
+═══════════════════════════════════════════════════════════
+SNIRF REQUIRED FIELDS
+═══════════════════════════════════════════════════════════
+
+dataTimeSeries  — 2D float (n_samples × n_channels)
+time            — 1D float (n_samples,), unit: seconds
+wavelengths     — 1D array of wavelength values in nm
+measurementList — per-channel source/detector/wavelength/dataType indices
+
+═══════════════════════════════════════════════════════════
+DATA ASSEMBLY TYPES
+═══════════════════════════════════════════════════════════
+
+Choose the correct type based on how the data is stored:
+
+TYPE 1 — "single": data is in one variable (most common)
+  Use when: one tall 2D array holds all channels
+  Example: Homer3 "d", or "dat.signal"
+  {
+    "type": "single",
+    "var": "d",
+    "transpose": false
+  }
+  Set transpose: true if shape is (n_channels, n_samples) instead of (n_samples, n_channels)
+  FORBIDDEN: Do NOT use array indexing syntax like "data.values[0]" or "data[0]".
+  The Python executor does not support cell array indexing.
+  Only dot-notation paths are supported: "data.X", "dat.signal", "SD.Lambda".
+
+  CRITICAL — struct variables: if the top-level variable is a MATLAB struct
+  (i.e. flat_vars shows sub-fields like "data.X", "data.fs", "data.trial"),
+  you MUST use the full dot-notation path to the numeric field, NOT the
+  struct variable name itself.
+
+  Example: flat_vars shows:
+    "data.X":     {"shape": [N, C], "likely_data": true}
+    "data.fs":    {"value": 10.0}
+    "data.trial": {"shape": [1, 75]}
+  Correct:   "var": "data.X"     ← full dot-notation path
+  WRONG:     "var": "data"       ← this is the struct, not the data array
+
+  Similarly for time:
+    "data.fs" is a scalar → use as fs_var in time_assembly
+    Correct: {"type": "generate", "fs_var": "data.fs"}
+
+TYPE 2 — "stack_columns": data split across ch1, ch2, ... chN variables
+  Use when: flat_vars contains many variables named ch1, ch2, ch3 ... chN
+  each being a 1D or column vector of the same length
+  {
+    "type": "stack_columns",
+    "var_pattern": "ch",
+    "var_range": [1, 40]
+  }
+  var_pattern: the common prefix (e.g. "ch", "channel", "nirs")
+  var_range: [first_index, last_index] inclusive
+  Use "vars" list instead of var_pattern+var_range if naming is non-numeric:
+  {
+    "type": "stack_columns",
+    "vars": ["left_pfc", "right_pfc", "motor"]
+  }
+
+TYPE 3 — "hbo_hbr": HbO and HbR stored as separate matrices
+  Use when: two 2D arrays named HbO/HbR or oxy/deoxy exist with same shape
+  {
+    "type": "hbo_hbr",
+    "hbo_var": "HbO",
+    "hbr_var": "HbR"
+  }
+  Result: columns are concatenated [HbO | HbR] → (n_samples, n_channels)
+
+═══════════════════════════════════════════════════════════
+TIME ASSEMBLY TYPES
+═══════════════════════════════════════════════════════════
+
+TYPE 1 — "var": time vector exists as a variable
+  {
+    "type": "var",
+    "var": "t"
+  }
+
+TYPE 2 — "generate": no time variable, generate from sampling rate
+  Prefer fs_var (read from file) over fs_value (hardcoded)
+  {
+    "type": "generate",
+    "fs_var": "dat.fs",
+    "fs_value": 13.33
+  }
+  If neither fs_var nor fs_value is known, set fs_value to null
+  (executor will default to 10.0 Hz)
+
+═══════════════════════════════════════════════════════════
+WAVELENGTHS ASSEMBLY TYPES
+═══════════════════════════════════════════════════════════
+
+TYPE 1 — "var": wavelengths stored in a variable
+  {
+    "type": "var",
+    "var": "SD.Lambda"
+  }
+
+TYPE 2 — "value": hardcode the values
+  Use when no wavelength variable found, or data is already concentration (HbO/HbR)
+  {
+    "type": "value",
+    "values": [760, 850]
+  }
+
+═══════════════════════════════════════════════════════════
+OTHER FIELDS
+═══════════════════════════════════════════════════════════
+
+measlist_var:
+  2D array shape (n_channels, 4), cols = [srcIdx, detIdx, aux, dataTypeCode]
+  Common: "SD.MeasList"
+  null if not found
+
+n_sources_var:
+  dot-notation path to a scalar variable whose value is the number of sources (optodes).
+  Look in flat_vars for a key whose:
+    - value is a small integer (typically 2–64)
+    - name semantically suggests source count: contains "nSrc", "nSource", "source",
+      "Src", "nS" or similar
+  Use the EXACT key as it appears in flat_vars. Do NOT invent paths.
+  null if no such variable found.
+
+n_detectors_var:
+  dot-notation path to a scalar variable whose value is the number of detectors (optodes).
+  Look in flat_vars for a key whose:
+    - value is a small integer (typically 2–64)
+    - name semantically suggests detector count: contains "nDet", "nDetector",
+      "detector", "Det", "nD" or similar
+  Use the EXACT key as it appears in flat_vars. Do NOT invent paths.
+  null if no such variable found.
+
+data_type_code:
+  1 = raw intensity (default)
+  2 = dOD (optical density change)
+  4 = HbO/HbR concentration
+  Set to 4 if data_assembly type is "hbo_hbr" or var names suggest concentration
+
+confidence: "high" | "medium" | "low"
+
+═══════════════════════════════════════════════════════
+DECISION GUIDE
+═══════════════════════════════════════════════════════
+
+Step 0 — Detect multi-block structure:
+  Use "top_level_shapes" (NOT flat_vars) to detect multi-block structures.
+  top_level_shapes shows the RAW shape of each variable BEFORE any unwrapping,
+  which is the only reliable way to see that e.g. "data" is a (1,4) cell array.
+
+  Detection rule — ALL three conditions must be true:
+    1. top_level_shapes[key].is_object == true
+    2. top_level_shapes[key].shape == [1, N] with N > 1
+    3. flat_vars contains sub-fields of that key (e.g. "data.X", "data.fs")
+       meaning each element of the cell array is a struct with data fields
+
+  If all three conditions are met:
+    → n_blocks = N  (the second dimension of the shape)
+    → block_data_field = the sub-field name holding the signal matrix
+      (look for the tall 2D array in flat_vars, e.g. "data.X" with likely_data=true)
+    → data_assembly.var = full dot-notation path to signal field in ONE block
+      (e.g. "data.X") — the executor iterates over blocks automatically
+
+  If the top-level variable is a plain 2D float matrix: n_blocks=1.
+  If uncertain: n_blocks=1  (safe default — no data is lost).
+
+  EXAMPLES:
+    top_level_shapes: {"data": {"shape": [1,4], "is_object": true, "is_struct": false}}
+    flat_vars has: "data.X" (likely_data=true), "data.fs" (scalar), "data.trial"
+    → n_blocks=4, block_data_field="X", data_assembly.var="data.X"
+
+    top_level_shapes: {"d": {"shape": [3000, 52], "is_object": false}}
+    → n_blocks=1, standard single-block processing
+
+Step 1 — Identify data_assembly type:
+  - Is there one tall 2D float array?        → "single"
+  - Are there many ch1...chN variables?      → "stack_columns"
+  - Are there HbO and HbR arrays?            → "hbo_hbr"
+
+Step 2 — Identify time_assembly type:
+  - Is there a 1D array matching n_samples?  → "var"
+  - Is there a scalar fs/Fs/srate?           → "generate" with fs_var
+  - Neither?                                 → "generate" with fs_value from notes or null
+
+Step 3 — Identify wavelengths_assembly type:
+  - Is there a small float array 600-1000?   → "var"
+  - No wavelength info found?                → "value" with [760, 850]
+
+Step 4 — Set data_type_code:
+  - Raw NIR intensity data                   → 1
+  - Optical density (log ratio)              → 2
+  - Hemoglobin concentration (HbO/HbR)       → 4
+
+═══════════════════════════════════════════════════════════
+OUTPUT FORMAT — JSON only, no markdown, no explanation
+═══════════════════════════════════════════════════════════
+
+{
+  "data_assembly": {
+    "type": "single",
+    "var": "d",
+    "transpose": false
+  },
+  "time_assembly": {
+    "type": "var",
+    "var": "t"
+  },
+  "wavelengths_assembly": {
+    "type": "var",
+    "var": "SD.Lambda"
+  },
+  "wavelengths_default": [760, 850],
+  "measlist_var": "SD.MeasList",
+  "n_sources_var": null,
+  "n_detectors_var": null,
+  "n_blocks": 1,
+  "block_data_field": null,
+  "data_type_code": 1,
+  "notes": "Homer3 format: standard d/t/SD structure detected",
+  "confidence": "high"
+}
+
+Additional examples:
+
+stack_columns case (ch1...ch40):
+{
+  "data_assembly": {
+    "type": "stack_columns",
+    "var_pattern": "ch",
+    "var_range": [1, 40]
+  },
+  "time_assembly": {
+    "type": "generate",
+    "fs_var": "nfo.fs",
+    "fs_value": 13.33
+  },
+  "wavelengths_assembly": {
+    "type": "value",
+    "values": [760, 850]
+  },
+  "wavelengths_default": [760, 850],
+  "measlist_var": null,
+  "n_sources_var": null,
+  "n_detectors_var": null,
+  "n_blocks": 1,
+  "block_data_field": null,
+  "data_type_code": 4,
+  "notes": "Data split across 40 channel variables ch1-ch40, concentration format",
+  "confidence": "medium"
+}
+
+hbo_hbr case:
+{
+  "data_assembly": {
+    "type": "hbo_hbr",
+    "hbo_var": "HbO",
+    "hbr_var": "HbR"
+  },
+  "time_assembly": {
+    "type": "var",
+    "var": "time"
+  },
+  "wavelengths_assembly": {
+    "type": "value",
+    "values": [760, 850]
+  },
+  "wavelengths_default": [760, 850],
+  "measlist_var": null,
+  "n_sources_var": null,
+  "n_detectors_var": null,
+  "n_blocks": 1,
+  "block_data_field": null,
+  "data_type_code": 4,
+  "notes": "HbO and HbR stored separately, will be concatenated column-wise",
+  "confidence": "high"
+}`;
+
+// ============================================================================
+// Public LLM call wrappers
+// Mirrors llm_trio_dataset_description(), llm_bids_plan(), etc. in llm.py
+// Each function mirrors its Python counterpart including temperature.
+// ============================================================================
+
+/**
+ * dataset_description.json extraction; resolves with callLLM's trimmed reply text.
+ */
+export const llmTrioDatasetDescription = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> => {
+  const stepLabel = "Trio_DatasetDesc";
+  const temperature = 0.1;
+  const prompt = PROMPT_TRIO_DATASET_DESC;
+  return callLLM(prompt, payload, stepLabel, llmConfig, temperature, signal);
+};
+/** README.md generation: PROMPT_TRIO_README, step "Trio_README", temperature 0.4. */
+export const llmTrioReadme = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> =>
+  callLLM(PROMPT_TRIO_README, payload, "Trio_README", llmConfig, 0.4, signal);
+
+// generate_participants no longer calls the LLM at all — it just generates simple sequential IDs and defers to the plan stage for complex datasets.
+// export const llmTrioParticipants = (
+//   payload: string,
+//   llmConfig: LLMConfig,
+//   signal?: AbortSignal
+// ): Promise<string> =>
+//   callLLM(PROMPT_TRIO_PARTICIPANTS, payload, "Trio_Participants", llmConfig, 0.2, signal);
+/** BIDS plan generation: PROMPT_BIDS_PLAN, step "BIDSPlan", temperature 0.15. */
+export const llmBidsPlan = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> =>
+  callLLM(PROMPT_BIDS_PLAN, payload, "BIDSPlan", llmConfig, 0.15, signal);
+
+/**
+ * .mat → SNIRF field mapping; resolves with callLLM's trimmed reply text.
+ */
+export const llmMapMatToSnirf = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> => {
+  const stepLabel = "MAT_SNIRF_Mapping";
+  const temperature = 0.05;
+  const prompt = PROMPT_MAT_SNIRF_MAPPING;
+  return callLLM(prompt, payload, stepLabel, llmConfig, temperature, signal);
+};
+
+// The Python prompts for these stages are themselves near-empty stubs:
+// the stages are not yet functional in autobidsify either, so the prompts
+// and wrappers below are only scaffolding for a future implementation.
+export const PROMPT_NIRS_DRAFT = `fNIRS-to-SNIRF mapper (Draft).
+  Output JSON (ONLY valid JSON):
+  {
+    "draft": {...},
+    "confidence": 0.8,
+    "questions": [...]
+  }`;
+
+export const PROMPT_NIRS_NORMALIZE = `fNIRS-to-SNIRF mapper (Normalize).
+  Output JSON (ONLY valid JSON):
+  {
+    "normalized": {...},
+    "questions": [...]
+  }`;
+
+export const PROMPT_MRI_VOXEL_DRAFT = `MRI voxelization planner (Draft).
+  Output JSON (ONLY valid JSON):
+  {
+    "volume_candidates": [...],
+    "meta_candidates": {...},
+    "confidence": 0.8
+  }`;
+
+export const PROMPT_MRI_VOXEL_FINAL = `MRI voxelization planner (Final).
+  Output JSON (ONLY valid JSON):
+  {
+    "conversions": [...],
+    "questions": []
+  }`;
+/** fNIRS draft stage (stub prompt): PROMPT_NIRS_DRAFT, step "NIRS_Draft", temperature 0.2. */
+export const llmNirsDraft = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> =>
+  callLLM(PROMPT_NIRS_DRAFT, payload, "NIRS_Draft", llmConfig, 0.2, signal);
+
+/**
+ * fNIRS normalize stage (stub prompt); resolves with callLLM's trimmed reply text.
+ */
+export const llmNirsNormalize = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> => {
+  const stepLabel = "NIRS_Normalize";
+  const temperature = 0.1;
+  const prompt = PROMPT_NIRS_NORMALIZE;
+  return callLLM(prompt, payload, stepLabel, llmConfig, temperature, signal);
+};
+
+/**
+ * MRI voxelization draft stage (stub prompt); resolves with callLLM's trimmed reply.
+ */
+export const llmMriVoxelDraft = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> => {
+  const stepLabel = "MRI_Voxel_Draft";
+  const temperature = 0.2;
+  const prompt = PROMPT_MRI_VOXEL_DRAFT;
+  return callLLM(prompt, payload, stepLabel, llmConfig, temperature, signal);
+};
+
+/**
+ * MRI voxelization final stage (stub prompt); resolves with callLLM's trimmed reply.
+ */
+export const llmMriVoxelFinal = (
+  payload: string,
+  llmConfig: LLMConfig,
+  signal?: AbortSignal
+): Promise<string> => {
+  const stepLabel = "MRI_Voxel_Final";
+  const temperature = 0.1;
+  const prompt = PROMPT_MRI_VOXEL_FINAL;
+  return callLLM(prompt, payload, stepLabel, llmConfig, temperature, signal);
+};
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/llmHelpers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/llmHelpers.ts
index 3f2a6a1..0bbbea2 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/llmHelpers.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/llmHelpers.ts
@@ -6,14 +6,304 @@ import {
   getUserContextText,
 } from "./fileAnalyzers";
 import {
-  extractSubjectAnalysis,
+  analyzeFilenamesForSubjects,
   analyzeTokenStatistics,
 } from "./filenameTokenizer";
 import { FileItem } from "redux/projects/types/projects.interface";
 
-/**
- * Build structured file summary for LLM
- */
+// ============================================================================
+// FileStructureAnalyzer
+// Mirrors universal_core.py FileStructureAnalyzer
+// Works on allFiles: string[] (relative paths) from VFS
+// ============================================================================
+
+// Summarises the directory layout implied by a list of relative file paths.
+//
+// allFiles: paths separated by "/"; the last segment is the file name and
+//           every earlier segment is a directory.
+// Returns:
+//   max_depth           deepest directory nesting seen (0 for an empty list)
+//   depth_distribution  number of files at each nesting depth
+//   unique_dir_names    up to 100 distinct directory names, sorted
+//   dir_level_patterns  per nesting level, up to 20 sorted directory names
+//   total_unique_dirs   number of distinct directory names (uncapped)
+//   structure_template  coarse label for the layout (see below)
+const analyzeDirectoryStructure = (allFiles: string[]): Record<string, any> => {
+  const filesPerDepth: Record<number, number> = {};
+  const allDirNames = new Set<string>();
+  const dirsByLevel: Record<number, Set<string>> = {};
+
+  allFiles.forEach((relPath) => {
+    // Everything except the final segment is a directory component.
+    const dirSegments = relPath.split("/").slice(0, -1);
+    const depth = dirSegments.length;
+    filesPerDepth[depth] = (filesPerDepth[depth] || 0) + 1;
+
+    dirSegments.forEach((dirName, level) => {
+      allDirNames.add(dirName);
+      dirsByLevel[level] = dirsByLevel[level] || new Set();
+      dirsByLevel[level].add(dirName);
+    });
+  });
+
+  // Infer structure template — mirrors _infer_structure_template().
+  // Only the first 10 top-level directories (in first-seen order) are checked
+  // for the substring "sub".
+  const topLevelSample = dirsByLevel[0]
+    ? Array.from(dirsByLevel[0]).slice(0, 10)
+    : [];
+  const looksLikeSubjects = topLevelSample.some((name) =>
+    name.toLowerCase().includes("sub")
+  );
+  const levelCount = Object.keys(dirsByLevel).length;
+
+  const subjectTemplates: Record<number, string> = {
+    1: "{subject}",
+    2: "{subject}/{scantype}",
+    3: "{subject}/{scantype}/{format}",
+  };
+
+  let template: string;
+  if (looksLikeSubjects) {
+    template = subjectTemplates[levelCount] ?? "{subject}/nested";
+  } else if (levelCount > 0) {
+    template = `custom_${levelCount}_levels`;
+  } else {
+    template = "flat";
+  }
+
+  const levelSamples = Object.fromEntries(
+    Object.entries(dirsByLevel).map(([level, names]) => [
+      level,
+      Array.from(names).sort().slice(0, 20),
+    ])
+  );
+
+  return {
+    max_depth: Math.max(0, ...Object.keys(filesPerDepth).map(Number)),
+    depth_distribution: filesPerDepth,
+    unique_dir_names: Array.from(allDirNames).sort().slice(0, 100),
+    dir_level_patterns: levelSamples,
+    total_unique_dirs: allDirNames.size,
+    structure_template: template,
+  };
+};
+
+// Looks for a subject-ID naming scheme in the top-level directory names and in
+// the file basenames, scores every scheme that matched at least once, and
+// reports the best one.
+//
+// allFiles: relative paths separated by "/".
+// userHint: expected number of subjects, or null (or 0) when unknown;
+//           candidates whose ID count equals or is close to it score higher.
+// Returns { candidates, best_candidate, confidence, total_candidates_evaluated }
+// where `candidates` holds at most the 5 highest-scoring schemes. When nothing
+// matches, best_candidate is null and confidence is "none".
+const detectSubjectIdentifiers = (
+  allFiles: string[],
+  userHint: number | null
+): Record<string, any> => {
+  const fileCount = allFiles.length;
+
+  // Top-level directory of every path that has one, in first-seen order.
+  const topDirs: string[] = [
+    ...new Set(
+      allFiles
+        .map((path) => path.split("/"))
+        .filter((segments) => segments.length > 1)
+        .map((segments) => segments[0])
+    ),
+  ];
+  const baseNames = allFiles.map((path) => path.split("/").pop()!);
+
+  // Picker returning capture group `group` of `re`, or null when `re` misses.
+  const capture =
+    (re: RegExp, group: number) =>
+    (name: string): string | null => {
+      const m = name.match(re);
+      return m ? m[group] : null;
+    };
+  // Picker returning the name itself when `re` matches it, else null.
+  const wholeName =
+    (re: RegExp) =>
+    (name: string): string | null =>
+      re.test(name) ? name : null;
+  // Distinct non-null values produced by `pick` over `names`.
+  const collectIds = (
+    names: string[],
+    pick: (name: string) => string | null
+  ): Set<string> => {
+    const ids = new Set<string>();
+    for (const name of names) {
+      const id = pick(name);
+      if (id !== null) ids.add(id);
+    }
+    return ids;
+  };
+
+  const candidates: any[] = [];
+  // Records a candidate scheme, but only if it produced at least one ID.
+  // avg_files_per_subject divides the total file count (not just the matching
+  // files) by the number of distinct IDs.
+  const addCandidate = (
+    ids: Set<string>,
+    descriptor: Record<string, any>,
+    metadata: Record<string, any>
+  ): void => {
+    if (ids.size === 0) return;
+    candidates.push({
+      ...descriptor,
+      count: ids.size,
+      sample_ids: [...ids].sort().slice(0, 10),
+      metadata,
+      avg_files_per_subject: fileCount / ids.size,
+    });
+  };
+
+  // Pattern 1: Site_subID (e.g. Beijing_sub82352)
+  addCandidate(
+    collectIds(topDirs, capture(/^([A-Za-z]+)_sub(\d+)$/i, 2)),
+    {
+      type: "directory_pattern",
+      pattern_name: "site_sub_id",
+      pattern_display: "{site}_sub{id}",
+      extraction_regex: "([A-Za-z]+)_sub(\\d+)",
+      subject_group: 2,
+      site_group: 1,
+    },
+    { has_site: true }
+  );
+
+  // Pattern 2: sub-ID or subID (BIDS standard)
+  addCandidate(
+    collectIds(topDirs, capture(/^sub-?(\w+)$/i, 1)),
+    {
+      type: "directory_pattern",
+      pattern_name: "bids_standard",
+      pattern_display: "sub-{id}",
+      extraction_regex: "sub-?(\\w+)",
+      subject_group: 1,
+      site_group: null,
+    },
+    { has_site: false }
+  );
+
+  // Pattern 3: Numeric directories (e.g. 001, 025)
+  addCandidate(
+    collectIds(topDirs, wholeName(/^\d{2,6}$/)),
+    {
+      type: "directory_pattern",
+      pattern_name: "numeric_only",
+      pattern_display: "{id}",
+      extraction_regex: "^(\\d+)$",
+      subject_group: 1,
+      site_group: null,
+    },
+    { numeric_only: true }
+  );
+
+  // Pattern 4: patient_ID or subject_ID in filenames
+  addCandidate(
+    collectIds(baseNames, capture(/(?:patient|subject)[_-]?(\d+)/i, 1)),
+    {
+      type: "filename_pattern",
+      pattern_name: "patient_or_subject_id",
+      pattern_display: "{prefix}_{id}",
+      extraction_regex: "(?:patient|subject)[_-]?(\\d+)",
+      subject_group: 1,
+      site_group: null,
+    },
+    {}
+  );
+
+  // Pattern 5: Alphanumeric IDs (PD01, Control01, HC03)
+  addCandidate(
+    collectIds(topDirs, wholeName(/^[A-Za-z]+\d+$/)),
+    {
+      type: "directory_pattern",
+      pattern_name: "alphanum_id",
+      pattern_display: "{prefix}{id}",
+      extraction_regex: "^([A-Za-z]+)(\\d+)$",
+      subject_group: 2,
+      site_group: null,
+    },
+    {}
+  );
+
+  if (candidates.length === 0) {
+    return {
+      best_candidate: null,
+      confidence: "none",
+      candidates: [],
+      total_candidates_evaluated: 0,
+    };
+  }
+
+  // Score candidates — mirrors _score_identifier_candidate().
+  // Agreement with the user's subject count (only when a hint was given).
+  const hintBonus = (count: number): number => {
+    if (!userHint) return 0;
+    if (count === userHint) return 50;
+    const gap = Math.abs(count - userHint);
+    if (gap <= 2) return 30;
+    if (gap <= 5) return 10;
+    return 0;
+  };
+  // More files per subject scores higher.
+  const densityBonus = (avg: number): number =>
+    avg >= 5 ? 20 : avg >= 2 ? 15 : avg >= 1 ? 5 : 0;
+  // Subject counts of 2-200 score highest, 201-500 a little, others nothing.
+  const sizeBonus = (count: number): number =>
+    count >= 2 && count <= 200 ? 15 : count > 200 && count <= 500 ? 5 : 0;
+
+  for (const cand of candidates) {
+    cand.score =
+      hintBonus(cand.count) +
+      densityBonus(cand.avg_files_per_subject) +
+      sizeBonus(cand.count) +
+      (cand.type === "directory_pattern" ? 10 : 0) +
+      (cand.metadata?.has_site ? 5 : 0);
+  }
+
+  // Highest score first; equal scores keep the pattern order above.
+  candidates.sort((a, b) => b.score - a.score);
+  const [best] = candidates;
+
+  const confidence: "high" | "medium" | "low" | "none" =
+    best.score > 80 ? "high" : best.score > 60 ? "medium" : "low";
+
+  return {
+    candidates: candidates.slice(0, 5),
+    best_candidate: best,
+    confidence,
+    total_candidates_evaluated: candidates.length,
+  };
+};
+
+// Finds file names (last path segment) that occur under more than one path.
+//
+// allFiles: relative paths separated by "/".
+// Returns an object mapping each duplicated file name to every path that ends
+// in it, in input order. Names that occur only once are omitted.
+const detectDuplicateFilenames = (
+  allFiles: string[]
+): Record<string, string[]> => {
+  // A Map is used instead of a plain object so that file names equal to
+  // Object.prototype members ("constructor", "toString", ...) are ordinary
+  // keys. With `{}` the lookup returned the inherited function, the "not seen
+  // yet" check was skipped, and push() threw a TypeError.
+  const pathsByName = new Map<string, string[]>();
+  for (const filepath of allFiles) {
+    // split() always yields at least one element, so pop() is never undefined.
+    const filename = filepath.split("/").pop()!;
+    const bucket = pathsByName.get(filename);
+    if (bucket) bucket.push(filepath);
+    else pathsByName.set(filename, [filepath]);
+  }
+  // Object.fromEntries defines own properties, so even "__proto__" is safe.
+  return Object.fromEntries(
+    [...pathsByName].filter(([, paths]) => paths.length > 1)
+  );
+};
+
+// Builds a compact per-subject view of the directory tree, treating the first
+// path segment as the subject directory.
+//
+// allFiles:    relative paths separated by "/"; paths without a directory
+//              component are ignored.
+// maxSubjects: upper bound on how many subject directories are included in
+//              the samples (default 50).
+// Returns:
+//   subject_structure_samples  subject dir -> sub-path -> up to 5 file-name
+//                              patterns ("root" stands for files directly
+//                              inside the subject directory)
+//   total_subjects_detected    number of distinct first-level directories
+//   sampled_subjects           number of subjects present in the samples
+const buildDirectoryTreeSummary = (
+  allFiles: string[],
+  maxSubjects: number = 50
+): Record<string, any> => {
+  // Maps (not plain objects) hold the intermediate structure so directory
+  // names such as "constructor" or "toString" are ordinary keys. With `{}`
+  // those names resolved to inherited Object.prototype members, which dropped
+  // the subject from the result or threw a TypeError.
+  const structureBySubject = new Map<string, Map<string, string[]>>();
+
+  for (const filepath of allFiles) {
+    const parts = filepath.split("/");
+    if (parts.length < 2) continue;
+    const subjectDir = parts[0];
+    const remainingPath = parts.slice(1, -1).join("/") || "root";
+    const filename = parts[parts.length - 1];
+    // Collapse digit runs to "N" and drop parenthesised groups (with any
+    // whitespace before them) so files differing only by number share one
+    // pattern.
+    const pattern = filename.replace(/\d+/g, "N").replace(/\s*\([^)]*\)/g, "");
+
+    let subPaths = structureBySubject.get(subjectDir);
+    if (!subPaths) {
+      subPaths = new Map<string, string[]>();
+      structureBySubject.set(subjectDir, subPaths);
+    }
+    let patterns = subPaths.get(remainingPath);
+    if (!patterns) {
+      patterns = [];
+      subPaths.set(remainingPath, patterns);
+    }
+    if (!patterns.includes(pattern)) patterns.push(pattern);
+  }
+
+  const allSubjects = [...structureBySubject.keys()].sort();
+  let sampledSubjects = allSubjects;
+  if (allSubjects.length > maxSubjects) {
+    // Sample from the start, middle and end of the sorted list, de-duplicate,
+    // then cap at maxSubjects.
+    const mid = Math.floor(allSubjects.length / 2);
+    sampledSubjects = [
+      ...allSubjects.slice(0, 15),
+      ...allSubjects.slice(mid - 10, mid + 10),
+      ...allSubjects.slice(-15),
+    ]
+      .filter((v, i, a) => a.indexOf(v) === i)
+      .slice(0, maxSubjects);
+  }
+
+  // Object.fromEntries defines own properties, so no key can reach the
+  // prototype chain of the returned objects.
+  const summary: Record<string, any> = Object.fromEntries(
+    sampledSubjects.map((subject) => {
+      const subPaths =
+        structureBySubject.get(subject) ?? new Map<string, string[]>();
+      return [
+        subject,
+        Object.fromEntries(
+          [...subPaths].map(([path, patterns]) => [path, patterns.slice(0, 5)])
+        ),
+      ];
+    })
+  );
+
+  return {
+    subject_structure_samples: summary,
+    total_subjects_detected: allSubjects.length,
+    sampled_subjects: sampledSubjects.length,
+  };
+};
+
+// ============================================================================
+// TS-only UI helpers
+// ============================================================================
+
+// Build structured file summary for LLM
 export const buildFileSummary = (files: FileItem[]): string => {
   let summary = "";
 
@@ -66,14 +356,6 @@ export const buildFileSummary = (files: FileItem[]): string => {
     hdf5: "format: SNIRF → format_ready: true",
   };
 
-  // dataFiles.forEach((f) => {
-  //   const category = categorizeFile(f);
-  //   const fmt = formatLabel[f.fileType || ""] || ""; // add
-  //   summary += `  - ${f.name} [${category}]`;
-  //   if (fmt) summary += ` <${fmt}>`; // add
-  //   if (f.sourcePath) summary += ` (${f.sourcePath})`;
-  //   summary += "\n";
-  // });
   const byType: Record<string, typeof dataFiles> = {};
   dataFiles.forEach((f) => {
     const key = f.fileType || "other";
@@ -107,75 +389,71 @@ export const buildFileSummary = (files: FileItem[]): string => {
 /**
  * Analyze file patterns
  */
-export const analyzeFilePatterns = (files: FileItem[]): string => {
-  const dataFiles = files.filter((f) => f.type === "file" && !f.isUserMeta);
-  const filenames = dataFiles.map((f) => f.name);
-
-  const extensions = [
-    ...new Set(
-      filenames.map((name) => {
-        const parts = name.toLowerCase().split(".");
-        return parts.length > 1 ? parts[parts.length - 1] : "none";
-      })
-    ),
-  ];
-
-  // Categorize files
-  const categorized: Record<string, string[]> = {
-    anatomical: [],
-    functional: [],
-    diffusion: [],
-    other: [],
-  };
-
-  dataFiles.forEach((f) => {
-    const category = categorizeFile(f);
-    if (category.startsWith("anatomical")) {
-      categorized.anatomical.push(f.name);
-    } else if (category.startsWith("functional")) {
-      categorized.functional.push(f.name);
-    } else if (category.includes("diffusion")) {
-      categorized.diffusion.push(f.name);
-    } else {
-      categorized.other.push(f.name);
-    }
-  });
-
-  return `
-FILENAME ANALYSIS:
-${"=".repeat(70)}
-Total data files: ${dataFiles.length}
-File types: ${extensions.join(", ")}
-
-File Categories:
-  Anatomical scans: ${categorized.anatomical.length}
-  Functional scans: ${categorized.functional.length}
-  Diffusion scans: ${categorized.diffusion.length}
-  Other files: ${categorized.other.length}
-
-Sample filenames (first 10):
-${filenames
-  .slice(0, 10)
-  .map((name) => `  - ${name}`)
-  .join("\n")}
-${
-  filenames.length > 10 ? `\n  ... and ${filenames.length - 10} more files` : ""
-}
-`;
-};
-
-/**
- * Get user context (README, instructions, participant info)
- */
-export const getUserContext = (files: FileItem[]): string => {
-  const userText = getUserContextText(files);
-  if (!userText) return "No user-provided context available.";
-  return `USER-PROVIDED CONTEXT:\n${"=".repeat(70)}\n${userText}`;
-};
-
-/**
- * Get file annotations (notes)
- */
+// export const analyzeFilePatterns = (files: FileItem[]): string => {
+//   const dataFiles = files.filter((f) => f.type === "file" && !f.isUserMeta);
+//   const filenames = dataFiles.map((f) => f.name);
+
+//   const extensions = [
+//     ...new Set(
+//       filenames.map((name) => {
+//         const parts = name.toLowerCase().split(".");
+//         return parts.length > 1 ? parts[parts.length - 1] : "none";
+//       })
+//     ),
+//   ];
+
+//   // Categorize files
+//   const categorized: Record<string, string[]> = {
+//     anatomical: [],
+//     functional: [],
+//     diffusion: [],
+//     other: [],
+//   };
+
+//   dataFiles.forEach((f) => {
+//     const category = categorizeFile(f);
+//     if (category === "mri" || category === "jnifti") {
+//       categorized.anatomical.push(f.name);
+//     } else if (category === "nirs") {
+//       categorized.functional.push(f.name);
+//     } else if (category === "array") {
+//       categorized.diffusion.push(f.name);
+//     } else {
+//       categorized.other.push(f.name);
+//     }
+//   });
+
+//   return `
+// FILENAME ANALYSIS:
+// ${"=".repeat(70)}
+// Total data files: ${dataFiles.length}
+// File types: ${extensions.join(", ")}
+
+// File Categories:
+//   Anatomical scans: ${categorized.anatomical.length}
+//   Functional scans: ${categorized.functional.length}
+//   Diffusion scans: ${categorized.diffusion.length}
+//   Other files: ${categorized.other.length}
+
+// Sample filenames (first 10):
+// ${filenames
+//   .slice(0, 10)
+//   .map((name) => `  - ${name}`)
+//   .join("\n")}
+// ${
+//   filenames.length > 10 ? `\n  ... and ${filenames.length - 10} more files` : ""
+// }
+// `;
+// };
+
+// Get user context (README, instructions, participant info)
+// export const getUserContext = (files: FileItem[]): string => {
+//   const userText = getUserContextText(files);
+//   if (!userText) return "No user-provided context available.";
+//   return `USER-PROVIDED CONTEXT:\n${"=".repeat(70)}\n${userText}`;
+// };
+
+// Get file annotations (notes)
 export const getFileAnnotations = (files: FileItem[]): string => {
   const filesWithNotes = files.filter((f) => f.note);
   if (filesWithNotes.length === 0) return "";
@@ -201,225 +479,90 @@ export const downloadJSON = (data: any, filename: string) => {
   URL.revokeObjectURL(url);
 };
 
-/**
- * Download text file(not using this function yet)
- */
-export const downloadText = (text: string, filename: string) => {
-  const blob = new Blob([text], { type: "text/plain" });
-  const url = URL.createObjectURL(blob);
-  const a = document.createElement("a");
-  a.href = url;
-  a.download = filename;
-  a.click();
-  URL.revokeObjectURL(url);
-};
-
-/**
- * Build evidence bundle structure
- */
-export const buildEvidenceBundle = (
-  files: FileItem[],
-  baseDirectoryPath: string,
-  userOverrides?: {
-    nSubjects: number | null;
-    modalityHint: string;
-    describeText: string;
-  }
-): any => {
-  const counts = getCountsByExtension(files);
-  const userText = getUserContextText(files);
-
-  // add for samples ---start---
-  const dataFiles = files.filter(
-    (f) => f.source === "user" && f.type === "file"
-  );
-
-  // Mirror autobidsify's _intelligent_file_sampling()
-  // Group by file type, take up to 5 samples per type
-  const samplesByType: Record<string, FileItem[]> = {};
+// ============================================================================
+// Functions mirroring evidence.py
+// ============================================================================
+
+// ============================================================================
+// detect_kind from evidence.py maps to categorizeFile in fileAnalyzers.ts
+// ============================================================================
+
+// ============================================================================
+// Intelligent file sampling — mirrors _intelligent_file_sampling() in evidence.py
+// Groups files by extension then by filename pattern, samples up to 5 per extension.
+// ============================================================================
+
+const intelligentFileSampling = (
+  dataFiles: FileItem[],
+  targetSamplesPerExt: number = 5
+): FileItem[] => {
+  // Group by extension — mirrors by_ext in Python
+  const byExt: Record<string, FileItem[]> = {};
   dataFiles.forEach((f) => {
-    const key = f.fileType || "other";
-    if (!samplesByType[key]) samplesByType[key] = [];
-    if (samplesByType[key].length < 5) {
-      samplesByType[key].push(f);
-    }
+    const name = f.name.toLowerCase();
+    const ext = name.endsWith(".nii.gz")
+      ? ".nii.gz"
+      : "." + (name.split(".").pop() || "other");
+    if (!byExt[ext]) byExt[ext] = [];
+    byExt[ext].push(f);
   });
 
-  const samples = Object.values(samplesByType)
-    .flat()
-    .map((f) => ({
-      relpath: f.sourcePath || f.name,
-      filename: f.name,
-      suffix: f.name.split(".").pop() || "",
-      kind: f.fileType || "other",
-      size: 0,
-    }));
+  const sampledFiles: FileItem[] = [];
 
-  // ----end---
-
-  // add this for subject_analysis.json
-  // const allFiles = files
-  //   .filter((f) => f.source === "user" && f.type === "file")
-  //   .map((f) => f.sourcePath || f.name);
-  const allFiles = files
-    .filter((f) => f.source === "user" && f.type === "file")
-    .map((f) => {
-      const path = f.sourcePath || f.name;
-      // Strip leading folder name — mirrors Python's relative-to-data_root paths
-      // "1-FRESH-Motor-snirf/sub-01_ses-..." → "sub-01_ses-..."
-      const parts = path.split("/");
-      return parts.length > 1 ? parts.slice(1).join("/") : path;
+  Object.entries(byExt).forEach(([ext, fileList]) => {
+    // Group by filename pattern — mirrors pattern_groups in Python
+    const patternGroups: Record<string, FileItem[]> = {};
+    fileList.forEach((f) => {
+      const pattern = f.name.replace(/\d+/g, "N").replace(/\s*\([^)]*\)/g, "");
+      if (!patternGroups[pattern]) patternGroups[pattern] = [];
+      patternGroups[pattern].push(f);
     });
 
-  const subjectAnalysis = extractSubjectAnalysis(allFiles);
-  // ← end
+    const nPatterns = Object.keys(patternGroups).length;
+    const spp = Math.max(1, Math.floor(targetSamplesPerExt / nPatterns));
 
-  // ── filename analysis (must come AFTER subjectAnalysis)
-  const justFilenames = allFiles.map((f) =>
-    f.includes("/") ? f.split("/").pop()! : f
-  );
-  const tokenStats = analyzeTokenStatistics(justFilenames);
-  const dominantCount = tokenStats.dominantPrefixes.length;
-  const userNSubjects = subjectAnalysis.subject_count || null;
-  let filenameConfidence: "high" | "medium" | "low" | "none" = "none";
-  if (dominantCount > 0) {
-    if (userNSubjects && dominantCount === userNSubjects)
-      filenameConfidence = "high";
-    else if (dominantCount >= 2 && dominantCount <= 10)
-      filenameConfidence = "medium";
-    else filenameConfidence = "low";
-  }
-  const filenameAnalysis = {
-    python_statistics: {
-      total_files: tokenStats.totalFiles,
-      token_frequency: tokenStats.tokenFrequency,
-      prefix_frequency: tokenStats.prefixFrequency,
-      dominant_prefixes: tokenStats.dominantPrefixes,
-      unique_token_count: Object.keys(tokenStats.tokenFrequency).length,
-      unique_prefix_count: Object.keys(tokenStats.prefixFrequency).length,
-    },
-    confidence: filenameConfidence,
-    recommendation: buildFilenameRecommendation(
-      tokenStats.dominantPrefixes,
-      userNSubjects
-    ),
-  };
+    let extSamples: FileItem[] = [];
+    const extSampledSet = new Set<string>();
 
-  // subject count decision logic:
-  const finalSubjectCount =
-    userOverrides?.nSubjects ?? // user wins
-    subjectAnalysis.subject_count ??
-    tokenStats.dominantPrefixes.length ??
-    null;
+    // Take spp files from each pattern group
+    Object.values(patternGroups).forEach((group) => {
+      group.slice(0, spp).forEach((f) => {
+        extSamples.push(f);
+        extSampledSet.add(f.id);
+      });
+    });
 
-  const participantEvidence = buildParticipantMetadataEvidence(
-    allFiles,
-    // pass the already-built documents array
-    files
-      .filter(
-        (f) => f.source === "user" && f.content && f.content.trim().length > 0
-      )
-      .map((f) => ({
-        relpath: f.sourcePath || f.name,
-        filename: f.name,
-        content: f.content || "",
-      }))
-  );
+    // Top-up to targetSamplesPerExt if under
+    if (extSamples.length < targetSamplesPerExt) {
+      const sorted = [...Object.values(patternGroups)].sort(
+        (a, b) => b.length - a.length
+      );
+      for (const group of sorted) {
+        if (extSamples.length >= targetSamplesPerExt) break;
+        for (const f of group) {
+          if (extSamples.length >= targetSamplesPerExt) break;
+          if (!extSampledSet.has(f.id)) {
+            extSamples.push(f);
+            extSampledSet.add(f.id);
+          }
+        }
+      }
+    }
 
-  return {
-    root: baseDirectoryPath,
-    counts_by_ext: counts,
-    samples,
-    all_files: allFiles,
-    filename_analysis: filenameAnalysis, // NEW
-    participant_metadata_evidence: participantEvidence, // NEW
-    subject_detection: {
-      method: "hybrid_analysis",
-      path_based_count: subjectAnalysis.subject_count,
-      path_based_confidence: subjectAnalysis.success ? "medium" : "none",
-      filename_based_count: tokenStats.dominantPrefixes.length,
-      filename_based_confidence: filenameConfidence,
-      final_count: finalSubjectCount,
-      count_source:
-        userOverrides?.nSubjects != null
-          ? "user_provided"
-          : subjectAnalysis.success
-          ? subjectAnalysis.method
-          : "filename_based",
-      best_pattern: subjectAnalysis.subject_records[0]?.pattern_name || "none",
-    },
-    documents: files
-      .filter((f) => {
-        if (f.source !== "user") return false; // exclude AI files
-        if (!f.content || f.content.trim().length === 0) return false;
-
-        // ✅ Text files - primary source
-        if (["text", "office", "meta"].includes(f.fileType || "")) return true;
-
-        // ✅ NIfTI headers - useful for LLM to understand scan parameters
-        if (f.fileType === "nifti" && f.contentType === "nifti") return true;
-
-        // ✅ HDF5/SNIRF structure - useful for fNIRS datasets
-        if (f.fileType === "hdf5" && f.contentType === "hdf5") return true;
-
-        // ✅ NeuroJSON - already JSON text
-        if (f.fileType === "neurojsonText") return true;
-
-        // ✅ Catch undefined fileType but has content (your current bug)
-        if (f.fileType === undefined && f.content) return true;
-
-        return false;
-      })
-      .map((f) => ({
-        relpath: f.sourcePath || f.name,
-        filename: f.name,
-        type: f.fileType || "unknown",
-        content: f.content || "",
-        purpose: "experimental_protocol_or_metadata",
-      })),
-    user_hints: {
-      user_text: userText,
-      modality_hint: userOverrides?.modalityHint || detectModality(files),
-      n_subjects: finalSubjectCount,
-    },
-    // subject_analysis: subjectAnalysis,
-    trio_found: {
-      "dataset_description.json": files.some(
-        (f) => f.source === "user" && f.name === "dataset_description.json"
-      ),
-      "README.md": files.some(
-        (f) =>
-          f.source === "user" &&
-          (f.name === "README.md" ||
-            f.name === "README.txt" ||
-            f.name === "README.rst" ||
-            f.name === "readme.md")
-      ),
-      "participants.tsv": files.some(
-        (f) => f.source === "user" && f.name === "participants.tsv"
-      ),
-    },
-  };
-};
+    sampledFiles.push(...extSamples);
+  });
 
-const buildFilenameRecommendation = (
-  dominantPrefixes: { prefix: string; count: number; percentage: number }[],
-  userNSubjects: number | null
-): string => {
-  if (dominantPrefixes.length === 0)
-    return "No clear filename patterns detected. Recommend user describe subject identification.";
-  if (userNSubjects && dominantPrefixes.length === userNSubjects) {
-    const prefixStr = dominantPrefixes.map((p) => p.prefix).join(", ");
-    return `HIGH CONFIDENCE: Detected ${dominantPrefixes.length} dominant prefixes (${prefixStr}) matching user hint of ${userNSubjects} subjects.`;
-  }
-  if (dominantPrefixes.length >= 2 && dominantPrefixes.length <= 5)
-    return `MEDIUM CONFIDENCE: Detected ${dominantPrefixes.length} potential subject groups. Will send to LLM for validation.`;
-  return `LOW CONFIDENCE: Found ${dominantPrefixes.length} prefix patterns, which may or may not represent subjects. LLM will analyze.`;
+  return sampledFiles;
 };
 
+// ============================================================================
+// Mirrors _collect_participant_metadata_evidence() in evidence.py
+// ============================================================================
+
 const buildParticipantMetadataEvidence = (
   allFiles: string[],
-  documents: { relpath: string; filename: string; content: string }[]
+  documents: { relpath: string; filename: string; content: string }[],
+  files: FileItem[]
 ): Record<string, any> => {
   const evidence: Record<string, any> = {};
 
@@ -457,6 +600,25 @@ const buildParticipantMetadataEvidence = (
   // Evidence 2: DICOM headers (already extracted into documents content)
   // Skip re-reading — not feasible client-side
 
+  const dicomFiles = files.filter(
+    (f) => f.source === "user" && f.fileType === "dicom" && f.content
+  );
+  if (dicomFiles.length > 0) {
+    const dicomSamples = dicomFiles.slice(0, 10).map((f) => ({
+      filename: f.name,
+      extracted_header: f.content?.slice(0, 300) || "",
+    }));
+    evidence.dicom_headers = {
+      found: true,
+      sampled_count: dicomSamples.length,
+      total_dicom_files: dicomFiles.length,
+      samples: dicomSamples,
+      note: "DICOM headers extracted client-side",
+    };
+  } else {
+    evidence.dicom_headers = { found: false };
+  }
+
   // Evidence 3: filename semantic patterns
   const genderKws = [
     "male",
@@ -606,81 +768,200 @@ const buildParticipantMetadataEvidence = (
   return evidence;
 };
 
-/**
- * Extract subject identifiers from file list
- * Mirrors autobidsify's _extract_subjects_from_flat_filenames()
- */
-export const extractSubjectsFromFiles = (
-  files: FileItem[]
-): {
-  subjects: { originalId: string; bidsId: string }[];
-  strategy: string;
-} => {
+// ============================================================================
+// Build evidence bundle structure
+// Mirrors _build_evidence_bundle_internal() and build_evidence_bundle() in evidence.py
+// ============================================================================
+
+export const buildEvidenceBundle = (
+  files: FileItem[],
+  baseDirectoryPath: string,
+  userOverrides?: {
+    nSubjects: number | null;
+    modalityHint: string;
+    describeText: string;
+  }
+): any => {
+  const counts = getCountsByExtension(files);
+  // Combined context: the user's description (when given) first, then the text from getUserContextText(files).
+  const fileContextText = getUserContextText(files);
+  const userText = [userOverrides?.describeText?.trim(), fileContextText]
+    .filter(Boolean)
+    .join("\n\n");
+
+  // Build the "samples" section from a sampled subset of the user-provided files.
   const dataFiles = files.filter(
     (f) => f.source === "user" && f.type === "file"
   );
 
-  // Count occurrences of each base identifier
-  const identifierCounts: Record<string, number> = {};
-  // dataFiles.forEach((f) => {
-  //   const nameNoExt = f.name.replace(/\.[^/.]+$/, "").replace(/\.nii$/, "");
-  //   const match = nameNoExt.match(/^([A-Za-z0-9\-]+)/);
-  //   if (match) {
-  //     const id = match[1];
-  //     identifierCounts[id] = (identifierCounts[id] || 0) + 1;
-  //   }
-  // });
-  dataFiles.forEach((f) => {
-    const nameNoExt = f.name
-      .replace(/\.nii\.gz$/i, "")
-      .replace(/\.[^/.]+$/, "")
-      .replace(/\s*\([^)]*\)/, ""); // remove (309) etc.
-
-    // Split on first digit sequence or underscore — take prefix only
-    // VHMCT1mm → VHMCT, sub-01 → sub-01, BZZ003 → BZZ
-    const match = nameNoExt.match(/^([A-Za-z]+(?:-[A-Za-z]+)*)/);
-    if (match) {
-      const id = match[1];
-      identifierCounts[id] = (identifierCounts[id] || 0) + 1;
-    }
+  const sampledFiles = intelligentFileSampling(dataFiles);
+  const samples = sampledFiles.map((f) => ({
+    relpath: f.sourcePath || f.name,
+    filename: f.name,
+    suffix: f.name.split(".").pop() || "",
+    kind: categorizeFile(f),
+    size: 0,
+    header_info: f.content ? { raw: f.content.slice(0, 500) } : undefined,
+  }));
+
+  const allFiles = files
+    .filter((f) => f.source === "user" && f.type === "file")
+    .map((f) => {
+      const path = f.sourcePath || f.name;
+      // Strip leading folder name — mirrors Python's relative-to-data_root paths
+      // "1-FRESH-Motor-snirf/sub-01_ses-..." → "sub-01_ses-..."
+      const parts = path.split("/");
+      return parts.length > 1 ? parts.slice(1).join("/") : path;
+    });
+
+  // ── FileStructureAnalyzer — mirrors universal_core.py
+  const dirStructure = analyzeDirectoryStructure(allFiles);
+  const subjectDetectionResult = detectSubjectIdentifiers(
+    allFiles,
+    userOverrides?.nSubjects ?? null
+  );
+  const duplicates = detectDuplicateFilenames(allFiles);
+  const treeSummary = buildDirectoryTreeSummary(allFiles, 50);
+  const pathBasedCount = subjectDetectionResult.best_candidate?.count ?? 0;
+  const pathBasedConfidence = subjectDetectionResult.confidence;
+
+  const filenameAnalysisRaw = analyzeFilenamesForSubjects(allFiles, {
+    n_subjects: userOverrides?.nSubjects ?? null,
+    user_text: userOverrides?.describeText ?? "",
   });
+  const { llm_payload, ...filenameAnalysis } = filenameAnalysisRaw;
+  const tokenStats = filenameAnalysis.python_statistics;
+  const filenameConfidence = filenameAnalysis.confidence;
 
-  // Sort by frequency — most common identifiers are likely subjects
-  // const sorted = Object.entries(identifierCounts).sort((a, b) => b[1] - a[1]);
-
-  // Step 2: Keep only identifiers that appear in multiple files
-  // (single-file identifiers are likely body parts, not subjects)
-  const totalFiles = dataFiles.length;
-  const threshold = Math.max(2, Math.floor(totalFiles * 0.05)); // at least 5% of files
-
-  const filtered = Object.entries(identifierCounts)
-    .filter(([, count]) => count >= threshold)
-    .sort((a, b) => b[1] - a[1]);
-
-  // If filtering leaves nothing, fall back to all identifiers
-  const candidates =
-    filtered.length > 0
-      ? filtered
-      : Object.entries(identifierCounts).sort((a, b) => b[1] - a[1]);
-  // Step 3: Use numeric strategy for >10 subjects
-  const strategy = candidates.length > 10 ? "numeric" : "numeric";
-  // const strategy = sorted.length > 10 ? "numeric" : "semantic";
-
-  // const subjects = sorted.map(([originalId], i) => ({
-  //   originalId,
-  //   bidsId:
-  //     strategy === "numeric"
-  //       ? String(i + 1)
-  //       : originalId.replace(/[^a-zA-Z0-9]/g, ""),
-  // }));
-  const subjects = candidates.map(([originalId], i) => ({
-    originalId,
-    bidsId: String(i + 1),
-  }));
+  // subject count decision logic:
+  let finalSubjectCount: number | null;
+  let countSource: string;
+
+  if (userOverrides?.nSubjects != null) {
+    finalSubjectCount = userOverrides.nSubjects;
+    countSource = "user_provided";
+  } else if (pathBasedConfidence === "high") {
+    finalSubjectCount = pathBasedCount;
+    countSource = "path_based_high_confidence";
+  } else if (
+    (filenameConfidence === "high" || filenameConfidence === "medium") &&
+    pathBasedCount === 0
+  ) {
+    finalSubjectCount = tokenStats.dominantPrefixes.length;
+    countSource = "filename_based";
+  } else if (pathBasedCount > 0) {
+    finalSubjectCount = pathBasedCount;
+    countSource = "path_based";
+  } else {
+    finalSubjectCount = 1;
+    countSource = "fallback";
+  }
+
+  const documents = files
+    .filter((f) => {
+      if (f.source !== "user") return false;
+      if (!f.content || f.content.trim().length === 0) return false;
+      if (["text", "office", "meta"].includes(f.fileType || "")) return true;
+      if (f.fileType === "nifti" && f.contentType === "nifti") return true;
+      if (f.fileType === "hdf5" && f.contentType === "hdf5") return true;
+      if (f.fileType === "neurojsonText") return true;
+      if (f.fileType === undefined && f.content) return true;
+      return false;
+    })
+    .map((f) => ({
+      relpath: f.sourcePath || f.name,
+      filename: f.name,
+      type: f.fileType || "unknown",
+      content: f.content || "",
+      purpose: "experimental_protocol_or_metadata",
+    }));
+
+  const participantEvidence = buildParticipantMetadataEvidence(
+    allFiles,
+    documents,
+    files
+  );
 
-  return { subjects, strategy };
+  return {
+    root: baseDirectoryPath,
+    counts_by_ext: counts,
+    samples,
+    all_files: allFiles,
+    filename_analysis: filenameAnalysis, // NEW
+    participant_metadata_evidence: participantEvidence, // NEW
+    subject_detection: {
+      method: "hybrid_analysis",
+      path_based_count: pathBasedCount,
+      path_based_confidence: pathBasedConfidence,
+      filename_based_count: tokenStats.dominantPrefixes.length,
+      filename_based_confidence: filenameConfidence,
+      final_count: finalSubjectCount,
+      count_source: countSource,
+      best_pattern:
+        subjectDetectionResult.best_candidate?.pattern_display || "none",
+    },
+    structure_analysis: {
+      directory_structure: dirStructure,
+      subject_detection: subjectDetectionResult,
+      duplicate_files: Object.fromEntries(
+        Object.entries(duplicates).slice(0, 20)
+      ),
+      tree_summary_for_llm: treeSummary,
+      analyzer_confidence: subjectDetectionResult.confidence,
+    },
+
+    documents: documents,
+    document_summary: {
+      total_documents: documents.length,
+      document_types: [...new Set(documents.map((d) => d.type))],
+      total_text_length: documents.reduce(
+        (sum, d) => sum + d.content.length,
+        0
+      ),
+    },
+    sampling_strategy: {
+      method: "pattern_based",
+      target_per_ext: 5,
+      total_files_sampled: sampledFiles.length,
+    },
+    user_hints: {
+      user_text: userText,
+      modality_hint: userOverrides?.modalityHint || detectModality(files),
+      n_subjects: finalSubjectCount,
+    },
+    trio_found: {
+      "dataset_description.json": files.some(
+        (f) => f.source === "user" && f.name === "dataset_description.json"
+      ),
+      "README.md": files.some(
+        (f) =>
+          f.source === "user" &&
+          (f.name === "README.md" ||
+            f.name === "README.txt" ||
+            f.name === "README.rst" ||
+            f.name === "readme.md")
+      ),
+      "participants.tsv": files.some(
+        (f) => f.source === "user" && f.name === "participants.tsv"
+      ),
+    },
+    trio_promoted: {
+      dataset_description: [],
+      readme: [],
+      participants: [],
+    },
+    data_source: {
+      type: "directory",
+      original_path: baseDirectoryPath,
+      actual_path: baseDirectoryPath,
+    },
+  };
 };
 
+// ============================================================================
+// Mirrors ingest_data() in ingest.py
+// ============================================================================
+
 export const buildIngestInfo = (
   baseDirectoryPath: string
   // outputDir: string
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts
index be03f83..22c635a 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/llmPrompts.ts
@@ -1,177 +1,21 @@
 // src/components/DatasetOrganizer/utils/llmPrompts.ts
+//
+// NeuroJSON.io-only prompts — functions that have no Python equivalent.
+//
+// All PROMPT_* constants and LLM wrapper functions now live in llm.ts,
+// mirroring autobidsify's llm.py where prompts and callers are co-located.
+//
+// This file only contains:
+//   getConversionScriptPrompt() — generates a standalone Python conversion
+//   script from the user's file structure. Autobidsify IS the conversion
+//   script, so this feature has no Python equivalent.
+
+// ============================================================================
+// getConversionScriptPrompt()
+// NeuroJSON.io-only — no Python equivalent in autobidsify.
+// Called by LLMPanel.tsx → handleGenerate() ("Generate Script" button)
+// ============================================================================
 
-/**
- * Prompt for dataset_description.json generation
- * Based on auto-bidsify's PROMPT_TRIO_DATASET_DESC
- */
-export const getDatasetDescriptionPrompt = (
-  userText: string,
-  evidenceBundle?: any
-): string => {
-  const documentsContext =
-    // evidenceBundle?.documents
-    //   ?.map((d: any) => `[${d.filename}]:\n${d.content}`)
-    //   .join("\n\n") || "";
-    evidenceBundle?.documents
-      ?.map((d: any) => `[${d.filename}]:\n${(d.content || "").slice(0, 500)}`)
-      .join("\n\n") || "";
-
-  return `You are a BIDS dataset_description.json generator.
-  
-  CRITICAL: Use the following user-provided content to extract dataset information!
-  
-  USER-PROVIDED CONTENT:
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  ${userText || "(no readme/instructions provided)"}
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-
-   ALL UPLOADED DOCUMENTS (search these for dataset name, authors, etc.):
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  ${documentsContext || "(no documents)"}
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-
-  Also consider the dataset folder name for clues about the dataset name:
-  File paths start with: ${evidenceBundle?.root || ""}
-  
-  CRITICAL RULES:
-  - Authors MUST be array: ["Name 1", "Name 2", "Name 3"]
-  - DO NOT include empty strings "" or empty arrays []
-  - DO NOT use placeholders like "Extract" or "Dataset Name"
-  - Extract ACTUAL dataset name from content
-  - License: use "PD" if not specified, normalize "CC BY 4.0" to "CC-BY-4.0"
-  
-  Extract from user-provided content:
-  - Dataset name (look for study title, project name, experiment name)
-  - Authors/institutions mentioned
-  - Funding sources (if mentioned)
-  - License information
-  
-  Output ONLY valid JSON (no markdown fences, no explanations):
-  {
-    "Name": "Actual Dataset Name Here",
-    "BIDSVersion": "1.10.0",
-    "DatasetType": "raw",
-    "License": "PD",
-    "Authors": ["Actual Author Name"]
-  }`;
-};
-
-/**
- * Prompt for README.md generation
- * Based on auto-bidsify's PROMPT_TRIO_README
- */
-export const getReadmePrompt = (userText: string): string => {
-  return `Generate a comprehensive BIDS README.md file.
-  
-  CRITICAL: Use the following user-provided content as the PRIMARY source!
-  
-  USER-PROVIDED CONTENT:
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  ${userText}
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  
-  Create a comprehensive README with these sections:
-  - ## Overview (extract from user content)
-  - ## Dataset Description (expand on user content)
-  - ## Data Acquisition (if information available)
-  - ## File Organization (describe BIDS structure)
-  - ## Usage Notes
-  - ## References (if mentioned in user content)
-  
-  Use the user-provided content to inform ALL sections.
-  Expand and structure the information, but stay true to the original content.
-  
-  OUTPUT: Direct Markdown text only (no JSON wrapper, no code fences)`;
-};
-
-/**
- * Prompt for participants.tsv generation
- * Based on auto-bidsify's PROMPT_TRIO_PARTICIPANTS
- */
-export const getParticipantsPrompt = (userText: string): string => {
-  return `You are a BIDS participants.tsv column schema generator.
-
-USER-PROVIDED CONTENT:
-━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-${userText}
-━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-
-YOUR JOB: Decide which columns belong in participants.tsv based ONLY on what is explicitly stated in the user content above.
-
-STRICT RULES:
-- participant_id is ALWAYS required
-- ONLY add columns for demographics EXPLICITLY mentioned in the content
-- DO NOT invent age, sex, handedness, or any column not directly stated
-- If no demographic info is mentioned, return ONLY participant_id
-
-Output ONLY valid JSON (no markdown fences, no explanation):
-{
-  "columns": [
-    {"name": "participant_id", "required": true}
-  ]
-}
-
-Examples:
-- Content mentions "1 male, 1 female" → add {"name": "sex", "levels": ["M", "F"]}
-- Content mentions "patients and controls" → add {"name": "group", "levels": ["patient", "control"]}
-- Content mentions nothing about demographics → return only participant_id
-`;
-};
-
-// export const getParticipantsPrompt = (userText: string): string => {
-//   return `Generate a BIDS participants.tsv file.
-
-//   CRITICAL: Extract participant metadata from the following user-provided content!
-
-//   USER-PROVIDED CONTENT:
-//   ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-//   ${userText}
-//   ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-
-//   STRICT RULES:
-//   - First column MUST be "participant_id"
-//   - Use tab (\\t) as delimiter
-//   - ONLY include columns for data EXPLICITLY mentioned in the user content above
-//   - DO NOT invent or assume age, sex, handedness, or any other column unless it is directly stated in the content
-//   - If no demographic data is mentioned, output ONLY participant_id column
-//   - If only subject IDs are known, output the minimal form below
-
-//   MINIMAL FORM (use this when no demographics are mentioned):
-//   participant_id
-//   sub-01
-//   sub-02
-
-//   Extract participant information:
-//   - Subject IDs (look for "sub-01", "2 subjects", "participants: sub-01 and sub-02", etc.)
-//   - Demographics if available:
-//     - "1 male, 1 female" → sex column: M, F
-//     - "ages 25-65" → age column
-//     - "patients and controls" → group column
-//     - "right-handed" → handedness column
-
-//   Rules:
-//   - First column MUST be "participant_id"
-//   - Use tab (\\t) as delimiter
-//   - Include only columns with actual data (no empty columns)
-//   - If only subject IDs known, output: participant_id\\nsub-01\\nsub-02
-
-//   Examples:
-//   - If text says "2 subjects: sub-01 and sub-02" with no demographics:
-//     participant_id
-//     sub-01
-//     sub-02
-
-//   - If text says "sub-01 (25y, male), sub-02 (30y, female)":
-//     participant_id\\tage\\tsex
-//     sub-01\\t25\\tM
-//     sub-02\\t30\\tF
-
-//   OUTPUT: Direct TSV text only (no JSON, no code fences, no markdown)`;
-// };
-
-/**
- * Main prompt for BIDS conversion script generation
- */
 export const getConversionScriptPrompt = (
   baseDirectoryPath: string,
   fileSummary: string,
@@ -180,188 +24,12 @@ export const getConversionScriptPrompt = (
   annotations: string
 ): string => {
   return `You are a BIDS conversion expert specializing in neuroimaging data.
-  
-  ╔════════════════════════════════════════════════════════════════╗
-  ║ TASK: Generate Python script to convert dataset to BIDS       ║
-  ╚════════════════════════════════════════════════════════════════╝
-  
-  BASE DIRECTORY: ${baseDirectoryPath}
-  
-  ${fileSummary}
-  
-  ${filePatterns}
-  
-  ${userContext}
-  
-  ${annotations}
-  
-  CRITICAL FILE CATEGORIZATION RULES:
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  Files are marked with categories. YOU MUST respect these categories:
-  
-  - [anatomical-T1w] → Goes to sub-XX/anat/ folder, rename to sub-XX_T1w.nii.gz
-  - [anatomical-T2w] → Goes to sub-XX/anat/ folder, rename to sub-XX_T2w.nii.gz
-  - [functional-bold] → Goes to sub-XX/func/ folder, rename to sub-XX_task-<name>_run-XX_bold.nii.gz
-  - [functional-nirs] → Goes to sub-XX/func/ folder, rename to sub-XX_task-<name>_nirs.snirf
-  - [anatomical-dicom] → Convert to NIfTI using dcm2niix, then goes to sub-XX/anat/
-  - [diffusion] → Goes to sub-XX/dwi/ folder
-  - [fieldmap] → Goes to sub-XX/fmap/ folder
-
-  FORMAT CONVERSION RULES:
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  Some files require conversion before copying to BIDS:
-  
-  - <format: DICOM → convert_to: nifti (dcm2niix)>
-      → Run: subprocess.run(['dcm2niix', '-o', dest_dir, '-f', bids_filename, src_file])
-      → Output goes to sub-XX/anat/
-  
-  - <format: MATLAB → convert_to: snirf>
-      → Use MNE-Python: mne.export.export_raw(dst, raw, fmt='snirf')
-      → OR note in script that manual conversion is needed
-      → Output goes to sub-XX/nirs/
-  
-  - <format: Homer3 → convert_to: snirf>
-      → Same as MATLAB conversion above
-      → Output goes to sub-XX/nirs/
-  
-  - <format: NIfTI → format_ready: true>
-      → Direct copy, no conversion needed
-  
-  - <format: SNIRF → format_ready: true>
-      → Direct copy, no conversion needed
-  
-  FILENAME-BASED DETECTION (if category unclear):
-  - Contains "task-" AND "bold" → ALWAYS functional (func/ folder)
-  - Contains "T1w" → ALWAYS anatomical (anat/ folder)
-  - Contains "T2w" OR "inplaneT2" → ALWAYS anatomical (anat/ folder)
-  - Ends with ".snirf" → ALWAYS functional (func/ folder)
-  - Ends with ".dcm" → ALWAYS needs dcm2niix conversion → anat/ folder
-  - Ends with ".mat" → ALWAYS needs snirf conversion → nirs/ folder  
-  - Ends with ".nirs" → ALWAYS needs snirf conversion → nirs/ folder
-  
-  ⚠️ CRITICAL: NEVER put task-based files in anat/ folder!
-  ⚠️ CRITICAL: NEVER put T1w/T2w files in func/ folder!
-  
-  CRITICAL INSTRUCTIONS:
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  
-  1. The BIDS metadata files (dataset_description.json, README.md, participants.tsv)
-     have ALREADY been generated above. Your script MUST:
-     ✓ Use the EXACT content from dataset_description.json (copy it verbatim)
-     ✓ Use the EXACT participant IDs from participants.tsv
-     ✓ Write these files as-is to the BIDS directory
-  
-  2. All file paths are RELATIVE to base directory: ${baseDirectoryPath}
-     When accessing files: os.path.join(base_dir, relative_path)
-     
-     Example:
-     File shown as: "Balloon Analog Risk-taking Task/sub-01_T1w.nii.gz"
-     Full path: os.path.join('${baseDirectoryPath}', 'Balloon Analog Risk-taking Task', 'sub-01_T1w.nii.gz')
-  
-  3. BIDS directory structure to create:
-     bids_dataset/
-     ├── dataset_description.json  ← Write exact content from above
-     ├── README.md                  ← Write exact content from above
-     ├── participants.tsv           ← Write exact content from above
-     └── sub-XX/
-         ├── anat/                  ← Anatomical scans only!
-         │   ├── sub-XX_T1w.nii.gz
-         │   └── sub-XX_T2w.nii.gz
-         └── func/                  ← Functional scans only!
-             └── sub-XX_task-<name>_run-XX_bold.nii.gz
-  
-  4. For EACH data file, you must:
-     a) Extract subject ID from filename (e.g., "sub-01" from "sub-01_T1w.nii.gz")
-     b) Determine modality from file category:
-        - [anatomical-*] → modality = 'anat'
-        - [functional-*] → modality = 'func'
-        - [diffusion] → modality = 'dwi'
-     c) Construct source path including any parent folders
-     d) Create destination path: bids_dir/sub-XX/modality/new_filename
-     e) Copy the file
-     f) Create JSON sidecar (for imaging files)
-  
-  5. Handle run numbers correctly:
-     - Functional scans often have run-01, run-02, run-03
-     - Extract run number ONLY from files that have "_run-" in filename
-     - Anatomical scans typically don't have run numbers
-  
-  6. Error handling:
-     - Wrap file operations in try-except
-     - Print progress messages
-     - Print errors but continue processing
-  
-  OUTPUT REQUIREMENTS:
-  ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-  Generate a complete, runnable Python script that:
-  - Imports: os, shutil, json, pathlib
-  - Defines base_dir and bids_dir
-  - Creates BIDS directory structure (based on participants.tsv)
-  - Writes the three metadata files (exact content from above)
-  - Loops through data files and processes each one
-  - Includes clear comments explaining each step
-  - Has error handling and progress messages
-  
-  OUTPUT ONLY THE PYTHON SCRIPT (no markdown code fences, no explanations before or after).`;
-};
-
-/**
- * Prompt for BIDSPlan.yaml generation
- * Based on autobidsify's PROMPT_BIDS_PLAN
- */
-export const getBIDSPlanPrompt = (
-  fileSummary: string,
-  filePatterns: string,
-  userContext: string,
-  subjectInfo: {
-    subjects: { originalId: string; bidsId: string }[];
-    strategy: string;
-  },
-  countsByExt: Record<string, number>,
-  sampleFiles: string,
-  evidenceBundle: any
-): string => {
-  const subjectAnalysis = evidenceBundle.subject_analysis;
-  const assignmentRules = subjectInfo.subjects
-    .slice(0, 50) // cap at 50
-    .map(
-      (s) =>
-        `- match:\n  - '*${s.originalId}*'\n  original: ${s.originalId}\n  subject: '${s.bidsId}'`
-    )
-    .join("\n");
-
-  const subjectLabels = subjectInfo.subjects
-    .slice(0, 50)
-    .map((s) => `  - '${s.bidsId}'`)
-    .join("\n");
 
-  const participantMetadata = subjectInfo.subjects
-    .slice(0, 50)
-    .map((s) => `  '${s.bidsId}':\n    original_id: ${s.originalId}`)
-    .join("\n");
+╔════════════════════════════════════════════════════════════════╗
+║ TASK: Generate Python script to convert dataset to BIDS       ║
+╚════════════════════════════════════════════════════════════════╝
 
-  const countsText = Object.entries(countsByExt)
-    .map(([ext, count]) => `  ${ext}: ${count} files`)
-    .join("\n");
-
-  const pythonSubjectAnalysisText = subjectAnalysis
-    ? `\nPYTHON SUBJECT ANALYSIS (for context only — do NOT re-detect subjects):\n${JSON.stringify(
-        {
-          method: subjectAnalysis.method,
-          subject_count: subjectAnalysis.subject_count,
-          subject_examples: (subjectAnalysis.subject_records || [])
-            .slice(0, 5)
-            .map((r: any) => ({
-              original: r.original_id,
-              file_count: r.file_count,
-            })),
-        },
-        null,
-        2
-      )}\n`
-    : "";
-
-  return `You are a BIDS dataset architect. Generate a BIDSPlan.yaml file.
+BASE DIRECTORY: ${baseDirectoryPath}
 
 ${fileSummary}
 
@@ -369,216 +37,49 @@ ${filePatterns}
 
 ${userContext}
 
-${pythonSubjectAnalysisText}
-
-CONVERSION RULES (CRITICAL):
-- .dcm  → format_ready: false, convert_to: nifti,  modality: mri
-- .nii/.nii.gz → format_ready: true,  convert_to: none,  modality: mri
-- .jnii/.bnii  → format_ready: false, convert_to: nifti,  modality: mri
-- .mat  → format_ready: false, convert_to: snirf, modality: nirs
-- .nirs → format_ready: false, convert_to: snirf, modality: nirs
-- .snirf → format_ready: true, convert_to: none,  modality: nirs
-
-YOUR ONLY JOB: Generate the mappings section based on the file types present.
-Copy assignment_rules, participant_metadata, and subjects sections EXACTLY as shown in the OUTPUT below.
-
-OUTPUT (Raw YAML only, no markdown, no explanation):
-
-assignment_rules:
-${assignmentRules}
-
-FILE EXTENSION COUNTS (use these to determine which mappings to generate):
-${countsText}
-
-SAMPLE FILENAMES (use these to determine correct bids_template and match_pattern):
-${sampleFiles}
-
-MAPPINGS FORMAT (ONE entry per file extension, use glob patterns NOT individual filenames):
+${annotations}
 
-Example 1 - DICOM:
-  mappings:
-  - modality: mri
-    match: ['*.dcm', '**/*.dcm']
-    format_ready: false
-    convert_to: nifti
-    filename_rules:
-      - match_pattern: '.*'
-        bids_template: 'sub-X_T1w.nii.gz'
+CRITICAL FILE CATEGORIZATION RULES:
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+- [anatomical-T1w]    → sub-XX/anat/sub-XX_T1w.nii.gz
+- [anatomical-T2w]    → sub-XX/anat/sub-XX_T2w.nii.gz
+- [functional-bold]   → sub-XX/func/sub-XX_task-<n>_run-XX_bold.nii.gz
+- [functional-nirs]   → sub-XX/nirs/sub-XX_task-<n>_nirs.snirf
+- [anatomical-dicom]  → convert with dcm2niix → sub-XX/anat/
+- [anatomical-jnifti] → convert with jnifti_converter → sub-XX/anat/
+- [diffusion]         → sub-XX/dwi/
+- [fieldmap]          → sub-XX/fmap/
+
+FORMAT CONVERSION RULES:
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+- <format: DICOM → convert_to: nifti>
+    → subprocess.run(['dcm2niix', '-o', dest_dir, '-f', bids_filename, src_file])
+- <format: MATLAB → convert_to: snirf>
+    → Use MNE-Python or note manual conversion needed → sub-XX/nirs/
+- <format: Homer3 → convert_to: snirf>
+    → Same as MATLAB → sub-XX/nirs/
+- <format: NIfTI → format_ready: true>   → direct copy
+- <format: SNIRF → format_ready: true>   → direct copy
+
+⚠️ NEVER put task-based files in anat/ folder!
+⚠️ NEVER put T1w/T2w files in func/ folder!
+
+CRITICAL INSTRUCTIONS:
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+1. BIDS metadata files (dataset_description.json, README.md, participants.tsv)
+   have ALREADY been generated. Script MUST use their EXACT content.
 
-Example 2 - fNIRS .mat:
-  mappings:
-  - modality: nirs
-    match: ['*.mat', '**/*.mat']
-    format_ready: false
-    convert_to: snirf
-    filename_rules:
-      - match_pattern: '.*'
-        bids_template: 'sub-X_task-rest_nirs.snirf'
+2. All paths are RELATIVE to: ${baseDirectoryPath}
+   Access with: os.path.join('${baseDirectoryPath}', relative_path)
 
-Example 3 - Mixed:
-  mappings:
-  - modality: mri
-    match: ['*.nii.gz']
-    format_ready: true
-    convert_to: none
-    filename_rules:
-      - match_pattern: '.*T1.*'
-        bids_template: 'sub-X_T1w.nii.gz'
-  - modality: nirs
-    match: ['*.mat']
-    format_ready: false
-    convert_to: snirf
-    filename_rules:
-      - match_pattern: '.*'
-        bids_template: 'sub-X_task-rest_nirs.snirf'
+3. For EACH data file:
+   a) Extract subject ID from filename
+   b) Determine modality from file category
+   c) Create destination: bids_dir/sub-XX/modality/new_filename
+   d) Copy the file
+   e) Create JSON sidecar for imaging files
 
-participant_metadata:
-${participantMetadata}
+4. Error handling: wrap in try-except, print progress, continue on errors
 
-subjects:
-  count: ${subjectInfo.subjects.length}
-  id_strategy: ${subjectInfo.strategy}
-  labels:
-${subjectLabels}
-  source: python_extracted`;
+OUTPUT ONLY THE PYTHON SCRIPT (no markdown code fences, no explanations).`;
 };
-
-/**
- * Prompt for BIDSPlan.yaml generation
- * Mirrors autobidsify's PROMPT_BIDS_PLAN + build_bids_plan()'s optimized_bundle
- */
-// export const getBIDSPlanPrompt = (evidenceBundle: any): string => {
-//   // ── Pull subject analysis from evidence bundle (generated by extractSubjectAnalysis)
-//   const subjectAnalysis = evidenceBundle.subject_analysis;
-//   const idMapping: Record<string, string> =
-//     subjectAnalysis?.id_mapping?.id_mapping || {};
-//   const subjectRecords: any[] = subjectAnalysis?.subject_records || [];
-
-//   // ── Build assignment_rules (mirrors planner.py's _apply_python_rules_to_plan)
-//   const assignmentRules = subjectRecords
-//     .slice(0, 50)
-//     .map(
-//       (r) =>
-//         `- match:\n  - '*${r.original_id}*'\n  original: ${
-//           r.original_id
-//         }\n  subject: '${idMapping[r.original_id] ?? r.numeric_id}'`
-//     )
-//     .join("\n");
-
-//   // ── Build subjects section
-//   const subjectLabels = subjectRecords
-//     .slice(0, 50)
-//     .map((r) => `  - '${idMapping[r.original_id] ?? r.numeric_id}'`)
-//     .join("\n");
-
-//   // ── Build participant_metadata section
-//   const participantMetadata = subjectRecords
-//     .slice(0, 50)
-//     .map(
-//       (r) =>
-//         `  '${idMapping[r.original_id] ?? r.numeric_id}':\n    original_id: ${
-//           r.original_id
-//         }`
-//     )
-//     .join("\n");
-
-//   // ── Build file extension counts
-//   const countsText = Object.entries(
-//     evidenceBundle.counts_by_ext as Record<string, number>
-//   )
-//     .map(([ext, count]) => `  ${ext}: ${count} files`)
-//     .join("\n");
-
-//   // ── Build sample files (mirrors optimized_bundle.sample_files)
-//   const sampleFiles =
-//     (evidenceBundle.sample as Array<{ relpath: string }>)
-//       ?.map((s) => `  - ${s.relpath}`)
-//       .join("\n") ?? "";
-
-//   // ── Build python_subject_analysis block (mirrors planner.py's optimized_bundle)
-//   const subjectExamples = subjectRecords.slice(0, 10).map((r) => ({
-//     original: r.original_id,
-//     bids_id: idMapping[r.original_id] ?? r.numeric_id,
-//   }));
-
-//   const pythonSubjectAnalysis = JSON.stringify(
-//     {
-//       success: subjectAnalysis?.success ?? false,
-//       method: subjectAnalysis?.method ?? "none",
-//       subject_count: subjectAnalysis?.subject_count ?? 0,
-//       subject_examples: subjectExamples,
-//       id_mapping: subjectAnalysis?.id_mapping ?? {},
-//     },
-//     null,
-//     2
-//   );
-
-//   return `You are a BIDS dataset architect with complete decision-making authority.
-
-// ═══════════════════════════════════════════════════════════════════════
-// SUPPORTED FORMATS AND CONVERSION RULES (v10 - CRITICAL)
-// ═══════════════════════════════════════════════════════════════════════
-
-// MRI FORMATS (modality: mri):
-//   Input formats:
-//     • DICOM (.dcm)           → Convert to NIfTI using dcm2niix
-//     • NIfTI (.nii, .nii.gz)  → Already BIDS-ready, copy directly
-//     • JNIfTI (.jnii, .bnii)  → Convert to NIfTI using jnifti_converter
-//   BIDS output: .nii.gz files only
-
-// fNIRS FORMATS (modality: nirs):
-//   Input formats:
-//     • SNIRF (.snirf)         → Already BIDS-ready, copy directly
-//     • Homer3 (.nirs)         → Convert to SNIRF
-//     • MATLAB (.mat)          → Convert to SNIRF
-//   BIDS output: .snirf files only
-
-// FORMAT_READY AND CONVERT_TO RULES:
-//   format_ready: true  → .nii/.nii.gz (MRI) or .snirf (fNIRS) — just copy
-//   format_ready: false → .dcm (convert_to: nifti), .jnii/.bnii (convert_to: nifti),
-//                         .mat (convert_to: snirf), .nirs (convert_to: snirf)
-
-// CRITICAL: assignment_rules subject values must be BARE IDs (no 'sub-' prefix).
-//   ✓ subject: '1'       ← correct
-//   ✗ subject: 'sub-1'   ← wrong, executor adds sub- automatically
-
-// YOUR ONLY JOB: Generate the mappings section based on the file types present.
-// Copy assignment_rules, participant_metadata, and subjects sections EXACTLY as shown below.
-
-// ═══════════════════════════════════════════════════════════════════════
-// PYTHON SUBJECT ANALYSIS (use this — do NOT re-detect subjects yourself)
-// ═══════════════════════════════════════════════════════════════════════
-// ${pythonSubjectAnalysis}
-
-// FILE EXTENSION COUNTS:
-// ${countsText}
-
-// SAMPLE FILE PATHS (use these for match patterns and bids_template):
-// ${sampleFiles}
-
-// ═══════════════════════════════════════════════════════════════════════
-// OUTPUT (Raw YAML only, no markdown, no explanation)
-// ═══════════════════════════════════════════════════════════════════════
-
-// assignment_rules:
-// ${assignmentRules}
-
-// mappings:
-//   - modality: mri             # example — generate based on file types present
-//     match: ['*.dcm', '**/*.dcm']
-//     format_ready: false
-//     convert_to: nifti
-//     filename_rules:
-//       - match_pattern: '.*'
-//         bids_template: 'sub-X_T1w.nii.gz'
-
-// participant_metadata:
-// ${participantMetadata}
-
-// subjects:
-//   count: ${subjectAnalysis?.subject_count ?? 0}
-//   id_strategy: ${subjectAnalysis?.id_mapping?.strategy_used ?? "numeric"}
-//   labels:
-// ${subjectLabels}
-//   source: python_extracted`;
-// };
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
index e69de29..5b203e8 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
@@ -0,0 +1,870 @@
+// src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
+//
+// Mirrors autobidsify/converters/planner.py
+// Owns Stage 5 of the pipeline: evidence bundle → BIDSPlan.yaml + participants.tsv
+//
+// Python equivalents:
+//   DATA_EXTENSIONS / TRIO_FILENAMES / SKIP_DIRS  → planner.py _DATA_EXTS / TRIO_NAMES
+//   extractNumericIdFromIdentifier()              → planner.py _sort_key lambda
+//   extractFromDirectoryStructure()               → planner.py _extract_subjects_from_directory_structure()
+//   extractFromFlatFilenames()                    → planner.py _extract_subjects_from_flat_filenames()
+//   generateIdMapping()  [commented out below]    → planner.py _write_participants_from_plan() logic
+//   extractSubjectAnalysis()  [commented out]     → planner.py build_bids_plan() Steps 1 + 4
+//   parseLLMJsonResponse()                        → planner.py _parse_llm_json_response()
+//   buildOptimizedBundle()                        → planner.py build_bids_plan() Step 2
+//   getBidsPlanPrompt()                           → planner.py PROMPT_BIDS_PLAN
+//   parsePlanYaml()                               → planner.py yaml.safe_load() block
+//   collectExtraColumns()                         → planner.py _collect_extra_columns()
+//   validateSubjectCount()                        → planner.py build_bids_plan() Step 4
+//   writeParticipantsFromPlan()                   → planner.py _write_participants_from_plan()
+//   mergeParticipantsFromPlan()                   → planner.py _merge_participants_from_llm_metadata()
+//   buildBidsPlan()                               → planner.py build_bids_plan() main entry point
+import { validatePlanCoverage } from "./executorHelpers";
+import { llmBidsPlan, LLMConfig } from "./llm";
+import { dump as yamlDump, load as yamlLoad } from "js-yaml";
+
+// ============================================================================
+// Types
+// ============================================================================
+export interface SubjectRecord {
+  original_id: string; // identifier as matched in a directory name or filename
+  numeric_id: string; // regex capture (directory mode) or 1-based rank (flat mode)
+  site: string | null; // site prefix captured by the "site_prefixed" pattern; else null
+  pattern_name: string; // name of the detection pattern that produced this record
+  file_count: number; // number of files attributed to the subject
+  group?: string; // optional label inferred from a parent directory or an ID prefix
+}
+
+export interface SubjectAnalysis {
+  success: boolean; // false only for the "none" placeholder (no subjects detected)
+  method: string; // "directory_structure" | "flat_filename_identifiers" | "none"
+  subject_records: SubjectRecord[]; // one entry per detected subject, sorted
+  subject_count: number; // set to subject_records.length by the extractors
+  has_site_info: boolean; // true when any record carries a non-null site
+  variants_by_subject: Record<string, any>; // always {} in this module
+  python_generated_filename_rules: any[]; // always [] in this module
+  //   id_mapping: {
+  //     id_mapping: Record<string, string>;
+  //     reverse_mapping: Record<string, string>;
+  //     strategy_used: string;
+  //     metadata_columns: string[];
+  //   };
+}
+
+export interface BuildBidsPlanOptions {
+  evidenceBundle: any; // fields read here: all_files, user_hints, counts_by_ext, root, structure_hint
+  llmConfig: LLMConfig; // passed to llmBidsPlan(); llmConfig.model is logged and stored in plan metadata
+  signal?: AbortSignal; // forwarded to llmBidsPlan()
+  onStatus?: (msg: string) => void; // receives each progress message that is also console.logged
+}
+
+export interface BuildBidsPlanResult {
+  planYaml: string; // the BIDS plan as YAML text
+  subjectAnalysis: SubjectAnalysis; // heuristic subject detection that was sent to the LLM as a hint
+  participantsTsv: string; // tab-separated participants table built from the plan
+  coverageWarnings: string[]; // warnings returned by validatePlanCoverage()
+}
+
+// ============================================================================
+// Constants
+// Mirrors planner.py _DATA_EXTS, evidence.py TRIO_NAMES
+// ============================================================================
+
+const DATA_EXTENSIONS =
+  //   /\.(snirf|nii|nii\.gz|dcm|mat|nirs|jnii|bnii|h5|hdf5|edf|bdf)$/i;
+  /\.(snirf|nii|nii\.gz|dcm|mat|nirs|jnii|bnii)$/i;
+
+const TRIO_FILENAMES = new Set([
+  "dataset_description.json",
+  "participants.tsv",
+  "readme.md",
+  "readme.txt",
+  "readme.rst",
+  "readme",
+]);
+
+const SKIP_DIRS = new Set([
+  "anat",
+  "func",
+  "dwi",
+  "fmap",
+  "nirs",
+  "meg",
+  "eeg",
+  "beh",
+  "perf",
+  "derivatives",
+  "sourcedata",
+  "stimuli",
+  "walking",
+  "resting",
+  "resting_state",
+  "run",
+  "ses",
+  "pd",
+  "control",
+  "hc",
+  "task",
+  "sub",
+  "dataset",
+  "data",
+  "raw",
+  "bids",
+  "output",
+  "outputs",
+  "staging",
+  "_staging",
+  "mri",
+  "fnirs",
+  "edf",
+  "dicom",
+]);
+
+// ============================================================================
+// Mirrors planner.py _parse_llm_json_response()
+// ============================================================================
+
+export const parseLLMJsonResponse = (
+  text: string,
+  stepName: string
+): any | null => {
+  // Decodes JSON from raw LLM text; warns and returns null when none is found.
+  const tryParse = (src: string): { ok: boolean; value?: any } => {
+    try {
+      return { ok: true, value: JSON.parse(src) };
+    } catch {
+      return { ok: false };
+    }
+  };
+  if (!text?.trim()) {
+    console.warn(`${stepName}: LLM returned empty response`);
+    return null;
+  }
+  // Strip fences, then try the whole payload and, failing that, the "{" … "}" span.
+  let body = text.trim();
+  if (body.startsWith("```json")) body = body.slice(7);
+  else if (body.startsWith("```")) body = body.split("\n").slice(1).join("\n");
+  if (body.endsWith("```")) body = body.slice(0, -3);
+  body = body.trim();
+  const braced = body.match(/\{[\s\S]*\}/);
+  for (const src of braced ? [body, braced[0]] : [body]) {
+    const attempt = tryParse(src);
+    if (attempt.ok) return attempt.value;
+  }
+  console.warn(`${stepName}: Failed to parse JSON. Preview: ${body.slice(0, 200)}`);
+  return null;
+};
+
+// ============================================================================
+// Subject extraction
+// Mirrors _extract_numeric_id_from_identifier() in planner.py
+// BZZ003 → "003", sub-01 → "01", patient021 → "021"
+// ============================================================================
+
+const extractNumericIdFromIdentifier = (identifier: string): string | null => {
+  // Yields the final run of digits in `identifier`, or null when it has none.
+  const digitRuns = identifier.match(/\d+/g) ?? [];
+  return digitRuns.length > 0 ? digitRuns[digitRuns.length - 1] : null;
+};
+
+// ── Step 1: Directory structure patterns
+// Mirrors _extract_subjects_from_directory_structure() in planner.py
+
+const extractFromDirectoryStructure = (
+  allFiles: string[]
+): Omit<SubjectAnalysis, "id_mapping"> | null => {
+  // Detects subjects from directory names in the first two levels of each path.
+  // @param allFiles  file paths using "/" as separator
+  // @returns analysis with method "directory_structure", or null when no
+  //          directory name matches a subject pattern
+  // Pattern tuple: [regex, hasSite, idGroup, siteGroup, patternName].
+  // Patterns are tried in order; the first match for a directory name wins.
+  const patterns: Array<[RegExp, boolean, number, number | null, string]> = [
+    [/^([A-Za-z]+)_sub(\d+)$/i, true, 2, 1, "site_prefixed"], // Beijing_sub82352
+    [/^sub-(\w+)$/, false, 1, null, "standard_bids"], // sub-01
+    [/^subject[_-]?(\d+)$/i, false, 1, null, "simple"], // subject_01
+    [/^(\d{3,})$/, false, 1, null, "numeric_only"], // 001 (capture group 1 now exists)
+    [/^([A-Za-z]+\d+)$/, false, 1, null, "alphanum_id"], // PD01, Control01, HC03
+  ];
+  // Keyed by the matched directory name; a Map keeps first-seen order.
+  const recordsById = new Map<string, SubjectRecord>();
+
+  for (const filepath of allFiles) {
+    const parts = filepath.split("/");
+    // Inspect at most the first two directory levels; the filename is excluded.
+    const dirsOnly = parts.slice(0, Math.min(2, parts.length - 1));
+    for (const part of dirsOnly) {
+      // Skip known non-subject directory names
+      if (SKIP_DIRS.has(part.toLowerCase())) continue;
+      for (const [regex, hasSite, idGroup, siteGroup, patternName] of patterns) {
+        const match = part.match(regex);
+        if (!match) continue;
+        const originalId = match[0];
+        let record = recordsById.get(originalId);
+        if (!record) {
+          record = {
+            original_id: originalId,
+            numeric_id: match[idGroup] || match[0],
+            site: hasSite && siteGroup !== null ? match[siteGroup] : null,
+            pattern_name: patternName,
+            file_count: 0,
+          };
+          recordsById.set(originalId, record);
+        }
+        // Fix: tally files per subject directory (previously stuck at 0).
+        record.file_count += 1;
+        break;
+      }
+    }
+  }
+
+  if (recordsById.size === 0) return null;
+  const subjectRecords = [...recordsById.values()];
+
+  subjectRecords.sort((a, b) => {
+    const aMatch = a.original_id.match(/^([A-Za-z]+)(\d+)$/);
+    const bMatch = b.original_id.match(/^([A-Za-z]+)(\d+)$/);
+    if (aMatch && bMatch) {
+      const cmp = aMatch[1].localeCompare(bMatch[1]);
+      if (cmp !== 0) return cmp;
+      return parseInt(aMatch[2]) - parseInt(bMatch[2]);
+    }
+    return (parseInt(a.numeric_id) || 0) - (parseInt(b.numeric_id) || 0);
+  });
+
+  // Detect group from parent directory — mirrors PROMPT_BIDS_PLAN Structure 4
+  // e.g. GroupA/S01/file.snirf → group: "GroupA" (SKIP_DIRS names never become groups)
+  const subjectToParent: Record<string, string> = {};
+  for (const filepath of allFiles) {
+    const parts = filepath.split("/");
+    if (parts.length >= 3) {
+      const potentialGroup = parts[0];
+      const potentialSubject = parts[1];
+      if (
+        recordsById.has(potentialSubject) &&
+        !SKIP_DIRS.has(potentialGroup.toLowerCase())
+      ) {
+        subjectToParent[potentialSubject] = potentialGroup;
+      }
+    }
+  }
+  for (const rec of subjectRecords) {
+    if (subjectToParent[rec.original_id]) {
+      rec.group = subjectToParent[rec.original_id];
+    }
+  }
+
+  return {
+    success: true,
+    method: "directory_structure",
+    subject_records: subjectRecords,
+    subject_count: subjectRecords.length,
+    has_site_info: subjectRecords.some((r) => r.site !== null),
+    variants_by_subject: {},
+    python_generated_filename_rules: [],
+  };
+};
+
+// ── Step 2: Flat filename identifier extraction
+// Mirrors _extract_subjects_from_flat_filenames() in planner.py
+
+const extractFromFlatFilenames = (
+  allFiles: string[]
+): Omit<SubjectAnalysis, "id_mapping"> | null => {
+  // Groups data files by the identifier at the start of their filename.
+  // @param allFiles  file paths using "/" as separator
+  // @returns analysis with method "flat_filename_identifiers", or null when
+  //          no data file yields an identifier
+  // Fix: buckets live in a Map, so identifiers such as "constructor" or
+  // "toString" no longer collide with Object.prototype members and throw.
+  const identifierToFiles = new Map<string, string[]>();
+  for (const filepath of allFiles) {
+    const filename = filepath.split("/").pop()!;
+    // Skip trio files
+    if (TRIO_FILENAMES.has(filename.toLowerCase())) continue;
+    // Skip non-data files (PDFs, docs, JSONs that aren't data)
+    if (!DATA_EXTENSIONS.test(filename)) continue;
+    // Remove extension(s): sub-01_task-x_nirs.snirf → sub-01_task-x_nirs
+    const nameNoExt = filename.replace(/(\.[^.]+)+$/, "");
+    // Base identifier = leading run of letters, digits and hyphens:
+    // sub-01_ses-left2s → sub-01, BZZ003_rest → BZZ003, VHMCT1mm-Hip → VHMCT1mm-Hip
+    const match = nameNoExt.match(/^([A-Za-z0-9\-]+)/);
+    if (!match) continue;
+    const bucket = identifierToFiles.get(match[1]);
+    if (bucket) bucket.push(filepath);
+    else identifierToFiles.set(match[1], [filepath]);
+  }
+
+  if (identifierToFiles.size === 0) return null;
+  // Sort by extracted numeric ID if possible (mirrors sort_key in planner.py)
+  const sortedIdentifiers = [...identifierToFiles.keys()].sort((a, b) => {
+    const na = extractNumericIdFromIdentifier(a);
+    const nb = extractNumericIdFromIdentifier(b);
+    if (na && nb) return parseInt(na) - parseInt(nb);
+    return a.localeCompare(b);
+  });
+
+  const subjectRecords: SubjectRecord[] = sortedIdentifiers.map(
+    (identifier, i) => ({
+      original_id: identifier,
+      numeric_id: String(i + 1),
+      site: null,
+      pattern_name: "filename_identifier",
+      file_count: identifierToFiles.get(identifier)?.length ?? 0,
+    })
+  );
+
+  // Detect group from a "GROUP-NN" identifier. Fix: the BIDS "sub"/"subject"
+  // prefix is not a cohort label, so "sub-01" no longer gets group "sub".
+  for (const rec of subjectRecords) {
+    const groupMatch = rec.original_id.match(/^([A-Za-z]+)[_\-](\d+)$/);
+    if (groupMatch && !/^sub(ject)?$/i.test(groupMatch[1])) rec.group = groupMatch[1];
+  }
+
+  return {
+    success: true,
+    method: "flat_filename_identifiers",
+    subject_records: subjectRecords,
+    subject_count: subjectRecords.length,
+    has_site_info: false,
+    variants_by_subject: {},
+    python_generated_filename_rules: [],
+  };
+};
+
+// ── ID mapping — mirrors _generate_subject_id_mapping() in planner.py
+// const generateIdMapping = (
+//     subjectInfo: Omit<SubjectAnalysis, "id_mapping">
+//   ): SubjectAnalysis["id_mapping"] => {
+//     const records = subjectInfo.subject_records;
+//     const idMapping: Record<string, string>     = {};
+//     const reverseMapping: Record<string, string> = {};
+
+//     const allAlreadyBids = records.every((r) => /^sub-\w+$/i.test(r.original_id));
+//     if (allAlreadyBids) {
+//       for (const rec of records) {
+//         const bidsId = rec.original_id.replace(/^sub-/i, "");
+//         idMapping[rec.original_id] = bidsId;
+//         reverseMapping[bidsId]     = rec.original_id;
+//       }
+//       return { id_mapping: idMapping, reverse_mapping: reverseMapping,
+//                strategy_used: "already_bids", metadata_columns: [] };
+//     }
+
+//     const extractedNumbers: Record<string, string> = {};
+//     for (const rec of records) {
+//       const nums = rec.original_id.match(/\d+/g);
+//       if (nums) extractedNumbers[rec.original_id] = nums[nums.length - 1];
+//     }
+//     const numericValues = Object.values(extractedNumbers);
+//     const allUnique = new Set(numericValues).size === numericValues.length;
+
+//     if (Object.keys(extractedNumbers).length === records.length && allUnique) {
+//       for (const rec of records) {
+//         const bidsId = extractedNumbers[rec.original_id];
+//         idMapping[rec.original_id] = bidsId;
+//         reverseMapping[bidsId]     = rec.original_id;
+//       }
+//     } else {
+//       for (let i = 0; i < records.length; i++) {
+//         const orig   = records[i].original_id;
+//         const bidsId = String(i + 1);
+//         idMapping[orig]      = bidsId;
+//         reverseMapping[bidsId] = orig;
+//       }
+//     }
+
+//     return { id_mapping: idMapping, reverse_mapping: reverseMapping,
+//              strategy_used: "numeric", metadata_columns: ["original_id"] };
+//   };
+
+// export const extractSubjectAnalysis = (
+//   allFiles: string[],
+//   userNSubjects?: number | null,
+//   dominantPrefixes?: { prefix: string; count: number; percentage: number }[]
+// ): SubjectAnalysis => {
+//   // Step 1: directory structure
+//   let subjectInfo = extractFromDirectoryStructure(allFiles);
+
+//   // Step 2: flat filename fallback
+//   if (!subjectInfo || subjectInfo.subject_records.length === 0) {
+//     subjectInfo = extractFromFlatFilenames(allFiles);
+//   }
+
+//   if (!subjectInfo || subjectInfo.subject_records.length === 0) {
+//     return {
+//       success: false,
+//       method: "none",
+//       subject_records: [],
+//       subject_count: 0,
+//       has_site_info: false,
+//       variants_by_subject: {},
+//       python_generated_filename_rules: [],
+//       id_mapping: {
+//         id_mapping: {},
+//         reverse_mapping: {},
+//         strategy_used: "none",
+//         metadata_columns: [],
+//       },
+//     };
+//   }
+
+//   // ── CRITICAL validation: mirrors planner.py lines 190-215
+//   // If extracted count doesn't match user hint but dominant prefixes do,
+//   // fall back to dominant prefixes (handles VHM/VHF body-part over-extraction)
+//   const pythonCount = subjectInfo.subject_count;
+//   if (
+//     userNSubjects &&
+//     pythonCount !== userNSubjects &&
+//     dominantPrefixes &&
+//     dominantPrefixes.length === userNSubjects
+//   ) {
+//     subjectInfo = {
+//       success: true,
+//       method: "dominant_prefix_fallback",
+//       subject_records: dominantPrefixes.map((p, i) => ({
+//         original_id: p.prefix,
+//         numeric_id: String(i + 1),
+//         site: null,
+//         pattern_name: "dominant_prefix",
+//         file_count: p.count,
+//       })),
+//       subject_count: dominantPrefixes.length,
+//       has_site_info: false,
+//       variants_by_subject: {},
+//       python_generated_filename_rules: [],
+//     };
+//   }
+//   // bug fix for subject mapping
+//   // === original
+//   // const idMapping = generateIdMapping(subjectInfo);
+//   // return { ...subjectInfo, id_mapping: idMapping };
+//   // ==== end
+//   // ==== updates
+//   // CRITICAL: n_subjects is authoritative (mirrors planner.py PROMPT_BIDS_PLAN)
+//   // If analysis count doesn't match user input, fall back to sequential numbering
+//   const expectedCount = userNSubjects;
+//   if (expectedCount && subjectInfo.subject_count !== expectedCount) {
+//     const idMap: Record<string, string> = {};
+//     const reverseMap: Record<string, string> = {};
+//     for (let i = 1; i <= expectedCount; i++) {
+//       const bidsId = String(i).padStart(2, "0");
+//       idMap[`sub-${bidsId}`] = bidsId;
+//       reverseMap[bidsId] = `sub-${bidsId}`;
+//     }
+//     return {
+//       ...subjectInfo,
+//       subject_count: expectedCount,
+//       id_mapping: {
+//         id_mapping: idMap,
+//         reverse_mapping: reverseMap,
+//         strategy_used: "numeric_fallback",
+//         metadata_columns: [],
+//       },
+//     };
+//   }
+
+//   const idMapping = generateIdMapping(subjectInfo);
+//   return { ...subjectInfo, id_mapping: idMapping };
+// };
+
+// ============================================================================
+// collectExtraColumns()
+// Mirrors _collect_extra_columns() in planner.py
+// ============================================================================
+
+const collectExtraColumns = (
+  metadata: Record<string, Record<string, any>>
+): string[] => {
+  // Distinct column names across all participants, first-seen order, without
+  // "participant_id". Non-object entries (e.g. YAML `'01': null`) are skipped.
+  if (!metadata || typeof metadata !== "object") return [];
+  const cols = new Set<string>();
+  for (const meta of Object.values(metadata)) {
+    if (!meta || typeof meta !== "object") continue;
+    for (const col of Object.keys(meta)) {
+      if (col !== "participant_id") cols.add(col);
+    }
+  }
+  return [...cols];
+};
+
+// ============================================================================
+// writeParticipantsFromPlan()
+// Mirrors _write_participants_from_plan() in planner.py
+// ============================================================================
+
+export const writeParticipantsFromPlan = (
+  planYaml: any,
+  userNSubjects: number | null
+): string => {
+  // Builds participants.tsv text from a parsed BIDS plan.
+  // @param planYaml       parsed plan; reads assignment_rules[].subject,
+  //                       subjects.labels and participant_metadata
+  // @param userNSubjects  user-declared subject count; only used to warn
+  //                       when the plan lists fewer subjects
+  // @returns header row plus one row per subject, "\n"-joined, no trailing newline
+  const rules: any[] = Array.isArray(planYaml?.assignment_rules) ? planYaml.assignment_rules : [];
+  const labels: any[] = Array.isArray(planYaml?.subjects?.labels) ? planYaml.subjects.labels : [];
+  const metadata: Record<string, any> = planYaml?.participant_metadata || {};
+
+  // Subject IDs come from assignment_rules; subjects.labels is the fallback
+  // used only when the rules yield no IDs. Null/undefined entries are ignored.
+  const seen = new Set<string>();
+  const ordered: string[] = [];
+  const remember = (value: unknown) => {
+    const sid = String(value ?? "");
+    if (sid && !seen.has(sid)) {
+      seen.add(sid);
+      ordered.push(sid);
+    }
+  };
+  for (const rule of rules) remember(rule?.subject);
+  if (ordered.length === 0) {
+    for (const lbl of labels) remember(lbl);
+  }
+
+  if (userNSubjects && ordered.length < userNSubjects) {
+    console.warn(
+      `writeParticipantsFromPlan: plan has ${ordered.length} subjects ` +
+        `but user specified ${userNSubjects}. LLM assignment_rules may be incomplete.`
+    );
+  }
+
+  // participant_id first, then metadata columns in first-seen order.
+  const columns = ["participant_id", ...collectExtraColumns(metadata)];
+
+  // Numeric-looking IDs first (ascending), then the rest alphabetically.
+  const sortedIds = [...ordered].sort((a, b) => {
+    const an = parseInt(a);
+    const bn = parseInt(b);
+    const aIsText = isNaN(an);
+    const bIsText = isNaN(bn);
+    if (aIsText !== bIsText) return aIsText ? 1 : -1;
+    if (!aIsText && an !== bn) return an - bn;
+    return a.localeCompare(b);
+  });
+
+  // Fix: tabs and line breaks inside a value would split the row, so they are
+  // collapsed to a single space; null/undefined/empty values become "n/a".
+  const toCell = (value: unknown): string => {
+    const text = String(value ?? "n/a").replace(/[\t\r\n]+/g, " ").trim();
+    return text === "" ? "n/a" : text;
+  };
+
+  const rows = sortedIds.map((sid) => {
+    const meta = metadata[sid] || {};
+    return columns
+      .map((col) => (col === "participant_id" ? `sub-${sid}` : toCell(meta[col])))
+      .join("\t");
+  });
+
+  return [columns.join("\t"), ...rows].join("\n");
+};
+
+// ============================================================================
+// mergeParticipantsFromPlan()
+// Mirrors _merge_participants_from_llm_metadata() in planner.py
+// Appends extra columns from BIDSPlan participant_metadata into existing TSV
+// ============================================================================
+
+export const mergeParticipantsFromPlan = (
+  existingTsv: string,
+  planYaml: any
+): string => {
+  // Appends participant_metadata columns that the existing TSV lacks.
+  // @param existingTsv  TSV text whose first cell per row is the participant ID
+  // @param planYaml     parsed plan; only participant_metadata is read
+  // @returns the widened TSV, or `existingTsv` itself when nothing is added
+  // Fix: CRLF line endings are accepted (a trailing "\r" used to make the last
+  // header cell look unknown, duplicating that column).
+  const metadata = planYaml?.participant_metadata || {};
+  const lines = existingTsv.split(/\r?\n/).filter((l) => l.trim());
+  if (lines.length === 0) return existingTsv;
+
+  const header = lines[0].split("\t");
+  const newCols = collectExtraColumns(metadata).filter((c) => !header.includes(c));
+  if (newCols.length === 0) return existingTsv;
+
+  const newRows = lines.slice(1).map((line) => {
+    const cells = line.split("\t");
+    // Fix: rows shorter than the header are padded so new cells stay aligned.
+    while (cells.length < header.length) cells.push("n/a");
+    const meta = metadata[cells[0].replace(/^sub-/, "")] || {};
+    return [...cells, ...newCols.map((col) => String(meta[col] ?? "n/a"))].join("\t");
+  });
+  return [[...header, ...newCols].join("\t"), ...newRows].join("\n");
+};
+
+// ============================================================================
+// sampleDataFiles()
+// Mirrors build_bids_plan() Step 2 sampling:
+//   ≤200 files → use all; >200 → sample beginning + middle + end
+// ============================================================================
+
+const sampleDataFiles = (allFiles: string[], maxFiles = 200): string[] => {
+  // Filters `allFiles` to data files and, when more than `maxFiles` remain,
+  // returns an order-preserving sample from the beginning, middle and end.
+  // Each slice holds min(50, floor(maxFiles / 3)) files (at least 1), so the
+  // default maxFiles = 200 still yields 50 + 50 + 50 while smaller limits are
+  // now honored (previously up to 150 files came back whatever the limit).
+  const dataExts = new Set([".snirf", ".nirs", ".mat", ".dcm", ".nii", ".jnii", ".bnii"]);
+  const dataFiles = allFiles.filter((f) => {
+    const low = f.toLowerCase();
+    if (low.endsWith(".nii.gz")) return true;
+    const dot = low.lastIndexOf(".");
+    return dot >= 0 && dataExts.has(low.slice(dot));
+  });
+  if (dataFiles.length <= maxFiles) return dataFiles;
+
+  const n = dataFiles.length;
+  const chunk = Math.max(1, Math.min(50, Math.floor(maxFiles / 3)));
+  const midStart = Math.floor(n / 2) - Math.floor(chunk / 2);
+  const picked = new Set<number>();
+  for (let i = 0; i < chunk; i++) {
+    picked.add(i); // beginning
+    picked.add(midStart + i); // middle
+    picked.add(n - chunk + i); // end
+  }
+  return [...picked]
+    .filter((i) => i >= 0 && i < n)
+    .sort((a, b) => a - b)
+    .slice(0, Math.max(0, maxFiles))
+    .map((i) => dataFiles[i]);
+};
+
+// ============================================================================
+// buildOptimizedBundle()
+// Mirrors build_bids_plan() Step 2 — strips evidence bundle to lean payload.
+// Python explicitly excludes documents[], participant_metadata_evidence,
+// full all_files[] to keep the prompt token count low.
+// ============================================================================
+
+const buildOptimizedBundle = (
+  evidenceBundle: any,
+  subjectAnalysis: SubjectAnalysis
+): object => {
+  // Reduces the evidence bundle to a lean object: data-file extension counts,
+  // a file sample, user hints and the heuristic subject hint. Property order
+  // below matches the original literal so serialized output is unchanged.
+  const files: string[] = evidenceBundle?.all_files || [];
+  const dataExts = [".snirf", ".nirs", ".mat", ".dcm", ".nii", ".jnii", ".bnii", ".nii.gz"];
+
+  // Keep only counts whose extension key (case-insensitive) is a data extension.
+  const dataCounts: Record<string, unknown> = {};
+  for (const [ext, count] of Object.entries(evidenceBundle?.counts_by_ext || {})) {
+    if (dataExts.includes(ext.toLowerCase())) dataCounts[ext] = count;
+  }
+
+  // At most the first 20 detected subjects are forwarded as examples.
+  const subjectExamples = subjectAnalysis.subject_records.slice(0, 20).map((rec) => {
+    //   group: rec.group ?? null,
+    return { original: rec.original_id, numeric_id: rec.numeric_id, site: rec.site ?? null };
+  });
+  const hintNote = [
+    "This is a HINT from heuristic detection. ",
+    "Trust user_hints.n_subjects over this count. ",
+    "Use your own analysis of sample_files to determine the true subject structure.",
+  ].join("");
+
+  // Number of paths that end in one of the DATA_EXTENSIONS suffixes.
+  let dataFileCount = 0;
+  for (const path of files) {
+    if (DATA_EXTENSIONS.test(path)) dataFileCount += 1;
+  }
+
+  return {
+    root: evidenceBundle?.root,
+    counts_by_ext: dataCounts,
+    user_hints: evidenceBundle?.user_hints,
+    total_files: files.length,
+    data_files: dataFileCount,
+    sample_files: sampleDataFiles(files, 200),
+    structure_hint: evidenceBundle?.structure_hint,
+    python_subject_analysis: {
+      success: subjectAnalysis.success,
+      method: subjectAnalysis.method,
+      subject_count: subjectAnalysis.subject_count,
+      subject_examples: subjectExamples,
+      note: hintNote,
+    },
+  };
+};
+
+// ============================================================================
+// parsePlanYaml()
+// Mirrors yaml.safe_load() + validation in build_bids_plan() Step 3
+// ============================================================================
+
+export const parsePlanYaml = (responseText: string): any | null => {
+  // Parses LLM output as YAML after removing an optional Markdown code fence;
+  // failures are reported as { _raw, _parseError } rather than thrown.
+  const failure = (text: string, reason: string) => ({ _raw: text, _parseError: reason });
+  let yamlText = responseText.trim();
+  if (yamlText.startsWith("```yaml")) yamlText = yamlText.slice(7);
+  else if (yamlText.startsWith("```")) yamlText = yamlText.split("\n").slice(1).join("\n");
+  yamlText = (yamlText.endsWith("```") ? yamlText.slice(0, -3) : yamlText).trim();
+  try {
+    const doc = yamlLoad(yamlText);
+    return doc && typeof doc === "object" ? doc : failure(yamlText, "parsed value is not an object");
+  } catch (e) {
+    console.warn("parsePlanYaml: YAML parse failed", e);
+    return failure(yamlText, String(e));
+  }
+};
+
+// ============================================================================
+// validateSubjectCount()
+// Mirrors build_bids_plan() Step 4
+// Trusts LLM assignment_rules; only patches the count field if needed
+// ============================================================================
+
+const validateSubjectCount = (
+  planYaml: any,
+  userNSubjects: number | null
+): any => {
+  // Returns the plan untouched when no user count is given or it already
+  // matches subjects.count; otherwise warns and returns a shallow copy whose
+  // subjects.count is the user's value (assignment_rules are left as-is).
+  const planCount = planYaml?.subjects?.count ?? 0;
+  const countsAgree = !userNSubjects || planCount === userNSubjects;
+  if (countsAgree) return planYaml;
+  console.warn(
+    `validateSubjectCount: LLM count (${planCount}) ≠ user count (${userNSubjects}). ` +
+      `Trusting LLM assignment_rules, updating count field only.`
+  );
+  const patchedSubjects = { ...(planYaml.subjects || {}), count: userNSubjects };
+  return { ...planYaml, subjects: patchedSubjects };
+};
+
+// ============================================================================
+// buildBidsPlan()
+// Main entry point — mirrors build_bids_plan() in planner.py
+// Called by handleGeneratePlan() in LLMPanel.tsx
+// ============================================================================
+
+export const buildBidsPlan = async (
+  opts: BuildBidsPlanOptions
+): Promise<BuildBidsPlanResult> => {
+  // Runs the planning stage: heuristic subject hints → lean LLM payload →
+  // LLM call → YAML parse → count/coverage validation → participants.tsv.
+  // @param opts  evidence bundle, LLM config, optional AbortSignal and status callback
+  // @returns plan YAML text, subject hints, participants.tsv text and
+  //          coverage warnings
+  // @throws Error when the LLM reply is empty or cannot be parsed into a
+  //         YAML object; errors from llmBidsPlan() propagate unchanged
+  const { evidenceBundle, llmConfig, signal, onStatus } = opts;
+  const log = (msg: string) => {
+    console.log(msg);
+    onStatus?.(msg);
+  };
+
+  const allFiles: string[] = evidenceBundle?.all_files || [];
+  const userHints = evidenceBundle?.user_hints || {};
+  const userNSubjects: number | null = userHints?.n_subjects ?? null;
+
+  // ── Step 1: Python structural hints (advisory) ────────────────────
+  log("Step 1: Extracting subject hints...");
+
+  let rawSubjectInfo = extractFromDirectoryStructure(allFiles);
+  if (!rawSubjectInfo || rawSubjectInfo.subject_records.length === 0) {
+    log("  Directory-level detection failed, trying flat filename analysis...");
+    rawSubjectInfo = extractFromFlatFilenames(allFiles);
+  }
+
+  // Placeholder analysis when neither heuristic finds a subject.
+  const subjectAnalysis: SubjectAnalysis = rawSubjectInfo ?? {
+    success: false,
+    method: "none",
+    subject_records: [],
+    subject_count: 0,
+    has_site_info: false,
+    variants_by_subject: {},
+    python_generated_filename_rules: [],
+  };
+  log(
+    `  ${subjectAnalysis.subject_count} subjects (method: ${subjectAnalysis.method})`
+  );
+
+  // ── Step 2: Build optimized LLM payload ───────────────────────────
+  log("Step 2: Building LLM payload...");
+  const optimizedBundle = buildOptimizedBundle(evidenceBundle, subjectAnalysis);
+  const payload = JSON.stringify(optimizedBundle, null, 2);
+  log(`  Sample files: ${(optimizedBundle as any).sample_files?.length ?? 0}`);
+
+  // ── Step 3: Call LLM ──────────────────────────────────────────────
+  log(`Step 3: Calling LLM (${llmConfig.model})...`);
+  const raw = await llmBidsPlan(payload, llmConfig, signal);
+  if (!raw) throw new Error("LLM returned empty response for BIDS plan");
+
+  // ── Step 3b: Parse YAML ───────────────────────────────────────────
+  let planYaml = parsePlanYaml(raw);
+  if (!planYaml || planYaml._parseError) {
+    throw new Error(
+      `BIDS plan YAML parsing failed: ${planYaml?._parseError ?? "unknown"}`
+    );
+  }
+
+  // ── Step 4: Validate subject count ───────────────────────────────
+  log("Step 4: Validating subject count...");
+  planYaml = validateSubjectCount(planYaml, userNSubjects);
+  log(`  Final count: ${planYaml?.subjects?.count ?? "unknown"}`);
+
+  // ── Step 4b: Validate plan coverage against sample files ─────────
+  // Uses executorHelpers.validatePlanCoverage() — surfaces LLM pattern errors early
+  const sampleFiles: string[] = (optimizedBundle as any).sample_files || [];
+  const coverage = validatePlanCoverage(sampleFiles, planYaml?.mappings || []);
+  if (coverage.warnings.length > 0) {
+    coverage.warnings.forEach((w) => log(`  ⚠ ${w}`));
+  } else {
+    log(`  ✓ Coverage: ${coverage.coveragePercent}% of sample files matched`);
+  }
+
+  // ── Step 5: Write participants.tsv ────────────────────────────────
+  log("Step 5: Generating participants.tsv...");
+  const participantsTsv = writeParticipantsFromPlan(planYaml, userNSubjects);
+
+  // ── Step 6: Merge extra metadata columns ──────────────────────────
+  log("Step 6: Merging participant metadata columns...");
+  const mergedTsv = mergeParticipantsFromPlan(participantsTsv, planYaml);
+
+  // ── Step 7: Inject plan metadata ─────────────────────────────────
+  // Mirrors plan_yaml["metadata"] = {...} in planner.py Step 7
+  planYaml.metadata = {
+    generated_at: new Date().toISOString(),
+    model: llmConfig.model,
+    id_strategy: "auto",
+  };
+
+  // ── Step MAT: inject mat_mapping_path into nirs mappings ─────────
+  log("Step MAT: .mat mapping deferred to local execute step");
+  const matFiles = allFiles.filter((f) => f.toLowerCase().endsWith(".mat"));
+  if (matFiles.length > 0) {
+    for (const mapping of Array.isArray(planYaml?.mappings) ? planYaml.mappings : []) {
+      if (mapping?.modality === "nirs") {
+        const patterns: string[] = [mapping?.match ?? []].flat().map(String);
+        const coversMat =
+          patterns.length === 0 ||
+          patterns.some(
+            (p: string) => p.toLowerCase().includes(".mat") || p === "**/*.mat"
+          );
+        if (coversMat) {
+          mapping.mat_mapping_path = "_staging/mat_mapping.json";
+        }
+      }
+    }
+  }
+
+  // Fix: serialize the validated plan so the count patch, metadata and
+  // mat_mapping_path set above reach the caller; the raw LLM text carried
+  // none of them and could still include Markdown fences.
+  const planYamlStr = yamlDump(planYaml, { lineWidth: -1, noRefs: true });
+
+  log("✓ BIDSPlan complete");
+  return {
+    planYaml: planYamlStr,
+    subjectAnalysis,
+    participantsTsv: mergedTsv,
+    coverageWarnings: coverage.warnings,
+  };
+};
diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/trioHelpers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/trioHelpers.ts
new file mode 100644
index 0000000..064cb1d
--- /dev/null
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/trioHelpers.ts
@@ -0,0 +1,762 @@
+// src/components/DatasetOrganizer/utils/trioHelpers.ts
+//
+// Mirrors autobidsify/stages/trio.py
+// Owns Stage 4 of the pipeline: evidence bundle → trio files
+// (dataset_description.json, README.md, participants.tsv)
+//
+// Python equivalents:
+//   normalizeLicenseLocally()       → normalize_license_locally()
+//   checkTrioStatus()               → check_trio_status()
+//   isMarkdownContent()             → _is_markdown_content()
+//   validateDatasetDescription()    → _validate_dataset_description()
+//   fixFieldTypes()                 → _fix_field_types()
+//   parseLLMJsonResponse()          → _parse_llm_json_response()
+//   generateDatasetDescription()    → generate_dataset_description()
+//   generateReadme()                → generate_readme()
+//   generateParticipants()          → generate_participants()
+//   generateTrioFiles()             → trio_generate_all() — main entry point
+import {
+  callLLM,
+  llmTrioDatasetDescription,
+  llmTrioReadme,
+  LLMConfig,
+} from "./llm";
+import { FileItem } from "redux/projects/types/projects.interface";
+import { OllamaService } from "services/ollama.service";
+
+export type TrioLLMConfig = LLMConfig;
+// ── License whitelist — mirrors LICENSE_WHITELIST in constants.py ─────────────
+export const LICENSE_WHITELIST = new Set([
+  "PDDL",
+  "CC0",
+  "PD",
+  "CC-BY-4.0",
+  "CC-BY-SA-4.0",
+  "BSD-3-Clause",
+  "BSD-2-Clause",
+  "CDDL-1.0",
+  "MPL",
+  "MIT",
+  "GPL-2.0",
+  "GPL-2.0+",
+  "GPL-3.0",
+  "GPL-3.0+",
+  "LGPL-3.0+",
+  "GFDL-1.3",
+  "CC-BY-NC-4.0",
+  "CC-BY-NC-SA-4.0",
+  "CC-BY-NC-ND-4.0",
+  "Non-Standard",
+]);
+
+// ============================================================================
+// checkTrioStatus()
+// Mirrors check_trio_status() in trio.py
+// Checks VFS FileItem[] instead of disk
+// ============================================================================
+
+export interface TrioStatus {
+  dataset_description: {
+    exists: boolean;
+    source: "user" | "ai" | null;
+    content: string | null;
+  };
+  readme: {
+    exists: boolean;
+    source: "user" | "ai" | null;
+    content: string | null;
+  };
+  participants: {
+    exists: boolean;
+    source: "user" | "ai" | null;
+    content: string | null;
+  };
+}
+
+export const checkTrioStatus = (files: FileItem[]): TrioStatus => {
+  const findFile = (predicate: (f: FileItem) => boolean) =>
+    files.find(predicate) ?? null;
+
+  const dd = findFile((f) => f.name === "dataset_description.json");
+  const readme = findFile((f) =>
+    ["README.md", "README.txt", "README.rst", "readme.md"].includes(f.name)
+  );
+  const participants = findFile((f) => f.name === "participants.tsv");
+
+  return {
+    dataset_description: {
+      exists: !!dd,
+      source: dd ? (dd.source as "user" | "ai") : null,
+      content: dd?.content ?? null,
+    },
+    readme: {
+      exists: !!readme,
+      source: readme ? (readme.source as "user" | "ai") : null,
+      content: readme?.content ?? null,
+    },
+    participants: {
+      exists: !!participants,
+      source: participants ? (participants.source as "user" | "ai") : null,
+      content: participants?.content ?? null,
+    },
+  };
+};
+
+// ============================================================================
+// normalizeLicenseLocally()
+// Mirrors normalize_license_locally() in trio.py
+// Full alias table — handles natural language, abbreviations, typos
+// ============================================================================
+
+export const normalizeLicenseLocally = (licenseStr: string): string | null => {
+  if (!licenseStr) return null;
+
+  // Normalize: strip separators, uppercase
+  const key = licenseStr.toUpperCase().replace(/[\s\-\._]+/g, "");
+
+  const ALIAS_TABLE: Record<string, string[]> = {
+    CC0: [
+      "CC0",
+      "CC010",
+      "CC01",
+      "CREATIVECOMMONSZERO",
+      "CREATIVECOMMONS0",
+      "CC0UNIVERSALPUBLICDOMAIN",
+      "CC010UNIVERSAL",
+      "CC0UNIVERSAL",
+      "ZERORIGHTSPUBLICDOMAIN",
+      "CC0LICENSE",
+    ],
+    PD: ["PD", "PUBLICDOMAIN", "PUBLIEDOMAIN"],
+    PDDL: ["PDDL", "PDDL10", "PUBLICDOMAINDEDICATIONLICENSE"],
+    "CC-BY-4.0": [
+      "CCBY40",
+      "CCBY4",
+      "CCBY",
+      "CREATIVECOMMONSATTRIBUTION40",
+      "CREATIVECOMMONSATTRIBUTION4",
+      "CREATIVECOMMONSATTRIBUTION40INTERNATIONAL",
+    ],
+    "CC-BY-SA-4.0": [
+      "CCBYSA40",
+      "CCBYSA4",
+      "CCBYSA",
+      "CREATIVECOMMONSATTRIBUTIONSHAREALIKE40",
+    ],
+    "CC-BY-NC-4.0": [
+      "CCBYNC40",
+      "CCBYNC4",
+      "CCBYNC",
+      "CREATIVECOMMONSATTRIBUTIONNONCOMMERCIAL40",
+    ],
+    "CC-BY-NC-SA-4.0": ["CCBYNCSA40", "CCBYNCSA4"],
+    "CC-BY-NC-ND-4.0": ["CCBYNCND40", "CCBYNCND4"],
+    MIT: ["MIT", "MITLICENSE", "MITOPENSOURCE"],
+    "BSD-3-Clause": ["BSD3CLAUSE", "BSD3", "BSDNEW", "BSDREVISED"],
+    "BSD-2-Clause": ["BSD2CLAUSE", "BSD2", "BSDORIGINAL", "BSDSIMPLIFIED"],
+    "GPL-2.0": ["GPL20", "GPL2", "GNUGPL2"],
+    "GPL-2.0+": ["GPL20+", "GPL2+", "GPL2ORLATER"],
+    "GPL-3.0": ["GPL30", "GPL3", "GNUGPL3"],
+    "GPL-3.0+": ["GPL30+", "GPL3+", "GPL3ORLATER"],
+    "LGPL-3.0+": ["LGPL30+", "LGPL3+", "LGPL3ORLATER"],
+    MPL: ["MPL", "MPL20", "MPL2", "MOZILLAPUBLICLICENSE"],
+    "CDDL-1.0": ["CDDL", "CDDL10"],
+    "GFDL-1.3": ["GFDL", "GFDL13"],
+    "Non-Standard": [
+      "NONSTANDARD",
+      "CUSTOM",
+      "OTHER",
+      "PROPRIETARY",
+      "RESTRICTED",
+    ],
+  };
+
+  for (const [canonical, variants] of Object.entries(ALIAS_TABLE)) {
+    if (variants.includes(key)) return canonical;
+  }
+
+  return "Non-Standard";
+};
+
+// ============================================================================
+// parseLLMJsonResponse()
+// Mirrors _parse_llm_json_response() in trio.py
+// Shared utility — also used in plannerHelpers.ts
+// ============================================================================
+
+export const parseLLMJsonResponse = (
+  text: string,
+  stepName: string
+): any | null => {
+  if (!text?.trim()) {
+    console.warn(`${stepName}: LLM returned empty response`);
+    return null;
+  }
+
+  let t = text.trim();
+  if (t.startsWith("```json")) t = t.slice(7);
+  else if (t.startsWith("```")) t = t.split("\n").slice(1).join("\n");
+  if (t.endsWith("```")) t = t.slice(0, -3);
+  t = t.trim();
+
+  // Direct parse
+  try {
+    return JSON.parse(t);
+  } catch {}
+
+  // raw_decode equivalent: find first complete JSON object
+  const match = t.match(/\{[\s\S]*\}/);
+  if (match) {
+    try {
+      return JSON.parse(match[0]);
+    } catch {}
+  }
+
+  console.warn(
+    `${stepName}: Failed to parse JSON. Preview: ${t.slice(0, 200)}`
+  );
+  return null;
+};
+
+// ============================================================================
+// isMarkdownContent()
+// Mirrors _is_markdown_content() in trio.py
+// ============================================================================
+
+export const isMarkdownContent = (text: string): boolean => {
+  const t = text.trim();
+  return (
+    t.startsWith("#") ||
+    t.startsWith("##") ||
+    t.includes("# ") ||
+    t.includes("\n## ") ||
+    t.startsWith("**") ||
+    t.slice(0, 100).includes("- ") ||
+    t.includes("\n- ")
+  );
+};
+
+// ============================================================================
+// validateDatasetDescription()
+// Mirrors _validate_dataset_description() in trio.py
+// ============================================================================
+
+export const validateDatasetDescription = (
+  dd: Record<string, any>
+): { isValid: boolean; issues: string[] } => {
+  const issues: string[] = [];
+
+  if (!dd.Name) issues.push("Missing required field: Name");
+  if (!dd.BIDSVersion) issues.push("Missing required field: BIDSVersion");
+  if (!dd.License) issues.push("Missing required field: License");
+  else if (!LICENSE_WHITELIST.has(dd.License))
+    issues.push(`License '${dd.License}' not in BIDS whitelist`);
+
+  for (const field of ["Authors", "Funding", "EthicsApprovals"]) {
+    if (dd[field] !== undefined && !Array.isArray(dd[field]))
+      issues.push(`${field} must be an array`);
+  }
+
+  if (dd.License === "Non-Standard" && !dd.DataLicense)
+    issues.push("License='Non-Standard' requires DataLicense field");
+
+  const empty = Object.entries(dd)
+    .filter(([, v]) => v === "" || (Array.isArray(v) && v.length === 0))
+    .map(([k]) => k);
+  if (empty.length > 0)
+    issues.push(`Empty fields (will be removed): ${empty.join(", ")}`);
+
+  const isValid = !issues.some(
+    (i) => i.includes("Missing required") || i.includes("must be an array")
+  );
+  return { isValid, issues };
+};
+
+// ============================================================================
+// fixFieldTypes()
+// Mirrors _fix_field_types() in trio.py
+// Converts string → array for Authors/Funding/EthicsApprovals,
+// removes empty strings
+// ============================================================================
+
+export const fixFieldTypes = (
+  dd: Record<string, any>
+): { fixed: Record<string, any>; fixes: string[] } => {
+  const fixed = { ...dd };
+  const fixes: string[] = [];
+
+  for (const field of ["Authors", "Funding", "EthicsApprovals"]) {
+    if (!(field in fixed)) continue;
+    const val = fixed[field];
+    if (typeof val === "string") {
+      if (val.trim()) {
+        fixed[field] = [val];
+        fixes.push(`Converted ${field} from string to array`);
+      } else {
+        delete fixed[field];
+      }
+    } else if (Array.isArray(val) && val.length === 0) {
+      delete fixed[field];
+    }
+  }
+
+  // Remove empty strings except required fields
+  const required = new Set(["Name", "BIDSVersion", "DatasetType", "License"]);
+  for (const [k, v] of Object.entries(fixed)) {
+    if (v === "" && !required.has(k)) delete fixed[k];
+  }
+
+  return { fixed, fixes };
+};
+
+// ============================================================================
+// LLM call config type
+// ============================================================================
+
+// export interface TrioLLMConfig {
+//   provider: string;
+//   model: string;
+//   apiKey: string;
+//   baseUrl: string;
+//   isAnthropic?: boolean;
+//   noApiKey?: boolean;
+// }
+
+export interface GenerateTrioOptions {
+  evidenceBundle: any;
+  files: FileItem[];
+  llmConfig: TrioLLMConfig;
+  signal?: AbortSignal;
+  onStatus?: (msg: string) => void;
+}
+
+export interface GenerateTrioResult {
+  datasetDesc: Record<string, any>;
+  readmeContent: string;
+  participantsTsv: string;
+  skipped: { datasetDesc: boolean; readme: boolean; participants: boolean };
+}
+
+// ============================================================================
+// callTrioLLM() — internal LLM dispatcher
+// ============================================================================
+
+const callTrioLLM = async (
+  prompt: string,
+  llmConfig: TrioLLMConfig,
+  maxTokens: number = 2048,
+  signal?: AbortSignal
+): Promise<string> => {
+  const { provider, model, apiKey, baseUrl, isAnthropic, noApiKey } = llmConfig;
+
+  if (provider === "ollama") {
+    const res = await OllamaService.chat(model, [
+      { role: "user", content: prompt },
+    ]);
+    return res?.choices?.[0]?.message?.content ?? "";
+  }
+
+  if (isAnthropic) {
+    const res = await fetch(baseUrl, {
+      method: "POST",
+      signal,
+      headers: {
+        "Content-Type": "application/json",
+        "x-api-key": apiKey,
+        "anthropic-version": "2023-06-01",
+      },
+      body: JSON.stringify({
+        model,
+        max_tokens: maxTokens,
+        messages: [{ role: "user", content: prompt }],
+      }),
+    });
+    const data = await res.json();
+    return data?.content?.[0]?.text ?? "";
+  }
+
+  const res = await fetch(baseUrl, {
+    method: "POST",
+    signal,
+    headers: {
+      "Content-Type": "application/json",
+      ...(noApiKey ? {} : { Authorization: `Bearer ${apiKey}` }),
+    },
+    body: JSON.stringify({
+      model,
+      messages: [{ role: "user", content: prompt }],
+      max_tokens: maxTokens,
+    }),
+  });
+  const data = await res.json();
+  return data?.choices?.[0]?.message?.content ?? "";
+};
+
+// ============================================================================
+// generateDatasetDescription()
+// Mirrors generate_dataset_description() in trio.py
+//
+// Key design (mirrors Python):
+//   LLM outputs 'raw_license' (natural language, no format constraints)
+//   Python/TS normalizes: raw_license → normalizeLicenseLocally() → BIDS canonical
+//   This is robust: user can write anything, LLM understands it, we map it.
+// ============================================================================
+
+const generateDatasetDescription = async (
+  evidenceBundle: any,
+  existingContent: string | null,
+  llmConfig: TrioLLMConfig,
+  signal?: AbortSignal
+): Promise<Record<string, any>> => {
+  let existingDD: Record<string, any> | null = null;
+  if (existingContent) {
+    try {
+      existingDD = JSON.parse(existingContent);
+    } catch {}
+  }
+
+  const raw = await llmTrioDatasetDescription(
+    JSON.stringify({
+      user_hints: evidenceBundle?.user_hints ?? {},
+      documents: (evidenceBundle?.documents ?? []).map((d: any) => ({
+        filename: d.filename,
+        content: (d.content || "").slice(0, 500),
+      })),
+      counts_by_ext: evidenceBundle?.counts_by_ext ?? {},
+      existing: existingDD,
+    }),
+    llmConfig,
+    signal
+  );
+  const result = parseLLMJsonResponse(raw, "dataset_description");
+
+  // Extract raw_license — mirrors Python's multi-location search
+  const rawLicense: string =
+    result?.raw_license ||
+    result?.dataset_description?.raw_license ||
+    result?.dataset_description?.License ||
+    existingDD?.License ||
+    "";
+
+  // Python-side normalization — mirrors normalize_license_locally() call
+  const normalizedLicense = rawLicense
+    ? normalizeLicenseLocally(rawLicense)
+    : null;
+
+  const llmDD = result?.dataset_description || {};
+
+  // Merge: existingDD < llmDD, then apply normalized license (highest priority)
+  const merged: Record<string, any> = {};
+  Object.assign(merged, llmDD);
+  if (existingDD) {
+    for (const [k, v] of Object.entries(existingDD)) {
+      if (v) merged[k] = v; // existing wins only if non-empty
+    }
+  }
+  delete merged.raw_license; // remove if LLM put it inside
+
+  if (normalizedLicense) {
+    merged.License = normalizedLicense;
+  }
+
+  // Build final structure — mirrors Python's required_structure assembly
+  const final: Record<string, any> = {
+    Name: merged.Name || "",
+    BIDSVersion: "1.10.0",
+    DatasetType: merged.DatasetType || "raw",
+    License: merged.License || "",
+  };
+
+  // Array fields — mirrors _fix_field_types()
+  for (const field of ["Authors", "Funding", "EthicsApprovals"]) {
+    const val = merged[field];
+    if (!val) continue;
+    if (typeof val === "string" && val.trim()) final[field] = [val];
+    else if (Array.isArray(val) && val.length > 0) final[field] = val;
+  }
+
+  // Optional scalar fields
+  for (const field of [
+    "Acknowledgements",
+    "HowToAcknowledge",
+    "DatasetDOI",
+    "HEDVersion",
+    "DataLicense",
+  ]) {
+    if (merged[field]) final[field] = merged[field];
+  }
+
+  // Optional array fields
+  for (const field of ["ReferencesAndLinks", "GeneratedBy", "SourceDatasets"]) {
+    if (Array.isArray(merged[field]) && merged[field].length > 0)
+      final[field] = merged[field];
+  }
+
+  const finalLic = final.License;
+  if (finalLic && !LICENSE_WHITELIST.has(finalLic)) {
+    const again = normalizeLicenseLocally(finalLic);
+    if (again) final.License = again;
+  }
+
+  // Remove empty strings
+  for (const [k, v] of Object.entries(final)) {
+    if (v === "" || (Array.isArray(v) && v.length === 0)) delete final[k];
+  }
+
+  return final;
+};
+
+// ============================================================================
+// generateReadme()
+// Mirrors generate_readme() in trio.py
+// ============================================================================
+
+const generateReadme = async (
+  evidenceBundle: any,
+  llmConfig: TrioLLMConfig,
+  signal?: AbortSignal
+): Promise<string> => {
+  const raw = await llmTrioReadme(
+    JSON.stringify({
+      documents: (evidenceBundle?.documents ?? []).map((d: any) => ({
+        filename: d.filename,
+        content: (d.content || "").slice(0, 500),
+      })),
+      user_hints: evidenceBundle?.user_hints ?? {},
+      existing_readme: null,
+    }),
+    llmConfig,
+    signal
+  );
+
+  if (isMarkdownContent(raw)) return raw.trim();
+
+  const result = parseLLMJsonResponse(raw, "README");
+  return result?.readme_content ?? "# Dataset\n\nNeuroimaging dataset.\n";
+};
+// ============================================================================
+// generateParticipants()
+// Mirrors generate_participants() in trio.py
+//
+// Critical design (mirrors Python):
+//   LLM decides ONLY extra demographic column schema
+//   TS always controls participant_id and original_id from subject analysis
+// ============================================================================
+
+const generateParticipants = (evidenceBundle: any): string | null => {
+  // null = deferred
+  const nSubjects: number = evidenceBundle?.user_hints?.n_subjects ?? 1;
+  const allFiles: string[] = evidenceBundle?.all_files || [];
+
+  // Mirror Python deferral logic exactly
+  if (nSubjects > 100 || allFiles.length > 500) {
+    return null; // deferred — plan stage handles it
+  }
+
+  // Simple placeholder — plan stage will overwrite with full columns
+  const rows = Array.from(
+    { length: nSubjects },
+    (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
+  );
+  return ["participant_id", ...rows].join("\n");
+};
+// const generateParticipants = async (
+//   evidenceBundle: any,
+//   files: FileItem[],
+//   llmConfig: TrioLLMConfig,
+//   signal?: AbortSignal
+// ): Promise<string> => {
+//   const userText = evidenceBundle?.user_hints?.user_text || "";
+//   const allFiles: string[] = evidenceBundle?.all_files || [];
+//   const userNSubjects: number | null =
+//     evidenceBundle?.user_hints?.n_subjects ?? null;
+//   const dominantPrefixes =
+//     evidenceBundle?.filename_analysis?.python_statistics?.dominant_prefixes;
+
+//   // Compute subject analysis — mirrors Python's authoritative subject detection
+//   const subjectAnalysis = extractSubjectAnalysis(
+//     allFiles,
+//     userNSubjects,
+//     dominantPrefixes
+//   );
+
+//   const idMap = subjectAnalysis.id_mapping.id_mapping;
+//   const reverseMap = subjectAnalysis.id_mapping.reverse_mapping;
+//   const subjectRecords = subjectAnalysis.subject_records;
+
+//   // Build subject labels list
+//   const expectedCount = userNSubjects || Object.keys(idMap).length || 1;
+//   const subjectLabels: string[] =
+//     Object.keys(idMap).length > 0 &&
+//     (!userNSubjects || Object.keys(idMap).length === userNSubjects)
+//       ? Object.values(idMap).map((id: string) => `sub-${id}`)
+//       : Array.from(
+//           { length: expectedCount },
+//           (_, i) => `sub-${String(i + 1).padStart(2, "0")}`
+//         );
+
+//   // Ask LLM ONLY for extra column schema — mirrors Python's design
+//   const prompt = `You are a BIDS participants.tsv column schema generator.
+
+// USER-PROVIDED CONTENT:
+// ${"─".repeat(60)}
+// ${userText || "(none provided)"}
+// ${"─".repeat(60)}
+
+// YOUR JOB: Decide which EXTRA columns belong in participants.tsv based ONLY
+// on what is explicitly stated in the user content above.
+
+// STRICT RULES:
+// - participant_id and original_id are ALWAYS added by code — do NOT include them
+// - ONLY add columns for demographics EXPLICITLY mentioned
+// - DO NOT invent age, sex, handedness unless directly stated
+// - If no demographic info is mentioned, return empty columns array
+
+// Output ONLY valid JSON (no markdown fences):
+// {
+//   "columns": [
+//     {"name": "sex", "levels": ["M", "F"]}
+//   ]
+// }
+
+// If no extra columns: {"columns": []}`;
+
+//   const raw = await callTrioLLM(prompt, llmConfig, 1024, signal);
+//   const schema = parseLLMJsonResponse(raw, "participants");
+
+//   // Extra columns decided by LLM (demographic columns only)
+//   const extraColumns: string[] = (schema?.columns || [])
+//     .map((c: any) => c.name)
+//     .filter((n: string) => n !== "participant_id" && n !== "original_id");
+
+//   // TypeScript always controls participant_id and original_id
+//   // mirrors Python: _generate_participants_tsv_from_python()
+//   const columns = ["participant_id", "original_id", ...extraColumns];
+//   const header = columns.join("\t");
+
+//   const rows = subjectLabels.map((subId) => {
+//     const bareId = subId.replace(/^sub-/, "");
+//     const originalId = reverseMap[bareId] || "n/a";
+//     const record = subjectRecords.find((r) => r.original_id === originalId);
+
+//     return columns
+//       .map((col) => {
+//         if (col === "participant_id") return subId;
+//         if (col === "original_id") return originalId;
+//         if (col === "group") return (record as any)?.group ?? "n/a";
+//         return "n/a";
+//       })
+//       .join("\t");
+//   });
+
+//   return [header, ...rows].join("\n");
+// };
+
+// ============================================================================
+// generateTrioFiles()
+// Main entry point — mirrors trio_generate_all() in trio.py
+// Called by handleGenerateTrio() in LLMPanel.tsx
+// ============================================================================
+
+export const generateTrioFiles = async (
+  opts: GenerateTrioOptions
+): Promise<GenerateTrioResult> => {
+  const { evidenceBundle, files, llmConfig, signal, onStatus } = opts;
+  const log = (msg: string) => {
+    console.log(msg);
+    onStatus?.(msg);
+  };
+
+  const status = checkTrioStatus(files);
+  log(
+    `Trio status: DD=${status.dataset_description.exists}, README=${status.readme.exists}, participants=${status.participants.exists}`
+  );
+
+  // Skip logic:
+  //   source === "user"  → user uploaded this file → ALWAYS skip (never overwrite)
+  //   source === "ai"    → AI generated previously → REGENERATE (replace)
+  //   null               → nothing exists          → GENERATE
+  const skipDD = status.dataset_description.source === "user";
+  const skipReadme = status.readme.source === "user";
+  const skipParticipants = status.participants.source === "user";
+  // ── dataset_description.json ─────────────────────────────────────
+  let datasetDesc: Record<string, any>;
+
+  if (skipDD) {
+    log("1/3 dataset_description.json user-uploaded, skipping...");
+    try {
+      datasetDesc = JSON.parse(status.dataset_description.content!);
+    } catch {
+      datasetDesc = {};
+    }
+  } else {
+    // Generates on first click AND regenerates on every subsequent click
+    log("1/3 Generating dataset_description.json...");
+    datasetDesc = await generateDatasetDescription(
+      evidenceBundle,
+      status.dataset_description.content ?? null,
+      llmConfig,
+      signal
+    );
+    log(`  License: ${datasetDesc.License || "MISSING"}`);
+  }
+
+  // ── README.md ────────────────────────────────────────────────────
+  let readmeContent: string;
+
+  if (skipReadme) {
+    log("2/3 README.md user-uploaded, skipping...");
+    readmeContent = status.readme.content!;
+  } else {
+    log("2/3 Generating README.md...");
+    readmeContent = await generateReadme(evidenceBundle, llmConfig, signal);
+  }
+
+  // ── participants.tsv ─────────────────────────────────────────────
+  let participantsTsv: string;
+
+  //   if (skipParticipants) {
+  //     log("3/3 participants.tsv user-uploaded, skipping...");
+  //     participantsTsv = status.participants.content!;
+  //   } else {
+  //     log("3/3 Generating participants.tsv...");
+  //     participantsTsv = await generateParticipants(
+  //       evidenceBundle,
+  //       files,
+  //       llmConfig,
+  //       signal
+  //     );
+  //   }
+  if (skipParticipants) {
+    log("3/3 participants.tsv user-uploaded, skipping...");
+    participantsTsv = status.participants.content!;
+  } else {
+    const simple = generateParticipants(evidenceBundle);
+    if (simple === null) {
+      log("3/3 participants.tsv deferred to plan stage...");
+      participantsTsv = ""; // empty — plan step will generate it
+    } else {
+      log("3/3 Generating basic participants.tsv...");
+      participantsTsv = simple;
+    }
+  }
+
+  log("✓ Trio generation complete");
+
+  return {
+    datasetDesc,
+    readmeContent: readmeContent
+      .replace(/^```markdown\n?/g, "")
+      .replace(/\n?```$/g, "")
+      .trim(),
+    participantsTsv: participantsTsv
+      .replace(/^```\n?/g, "")
+      .replace(/\n?```$/g, "")
+      .trim(),
+    skipped: {
+      datasetDesc: skipDD,
+      readme: skipReadme,
+      participants: skipParticipants,
+    },
+  };
+};
diff --git a/src/services/ollama.service.ts b/src/services/ollama.service.ts
index 9d8b368..3decc45 100644
--- a/src/services/ollama.service.ts
+++ b/src/services/ollama.service.ts
@@ -1,17 +1,18 @@
 const API_URL = process.env.REACT_APP_API_URL || "http://localhost:5000/api/v1";
 
-const getQwenTemperature = (modelName: string): number => {
-  if (modelName.includes("next") || modelName.includes("fast")) return 0.4;
-  if (modelName.includes("careful") || modelName.includes("think")) return 0.15;
-  return 0.3;
-};
+// const getQwenTemperature = (modelName: string): number => {
+//   if (modelName.includes("next") || modelName.includes("fast")) return 0.4;
+//   if (modelName.includes("careful") || modelName.includes("think")) return 0.15;
+//   return 0.3;
+// };
 
 export const OllamaService = {
   chat: async (
     model: string,
-    messages: { role: string; content: string }[]
+    messages: { role: string; content: string }[],
+    temperature?: number
   ): Promise<any> => {
-    const temperature = getQwenTemperature(model);
+    // const temperature = getQwenTemperature(model);
     const response = await fetch(`${API_URL}/ollama/chat`, {
       method: "POST",
       headers: { "Content-Type": "application/json" },
@@ -20,7 +21,7 @@ export const OllamaService = {
         messages,
         stream: false,
         options: {
-          temperature, // ← pass to Ollama
+          ...(temperature !== undefined ? { temperature } : {}),
         },
       }),
     });
diff --git a/yarn.lock b/yarn.lock
index b946d6d..8b8ba61 100644
--- a/yarn.lock
+++ b/yarn.lock
@@ -2962,6 +2962,11 @@
     jest-matcher-utils "^27.0.0"
     pretty-format "^27.0.0"
 
+"@types/js-yaml@^4.0.9":
+  version "4.0.9"
+  resolved "https://registry.yarnpkg.com/@types/js-yaml/-/js-yaml-4.0.9.tgz#cd82382c4f902fed9691a2ed79ec68c5898af4c2"
+  integrity sha512-k4MGaQl5TGo/iipqb2UDG2UwjXziSWkh0uysQelTlJpX1qGlpUZYm8PnO4DxG1qBomtJUdYJ6qR6xdIah10JLg==
+
 "@types/json-schema@*", "@types/json-schema@^7.0.15", "@types/json-schema@^7.0.4", "@types/json-schema@^7.0.5", "@types/json-schema@^7.0.8", "@types/json-schema@^7.0.9":
   version "7.0.15"
   resolved "https://registry.yarnpkg.com/@types/json-schema/-/json-schema-7.0.15.tgz#596a1747233694d50f6ad8a7869fcb6f56cf5841"

From d7176a3257aa3ccb4e8df54fc1a82776c74898ca Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 14 Apr 2026 10:18:16 -0400
Subject: [PATCH 07/61] fix: support double-click to reset uPlot series on Mac

---
 src/pages/UpdatedDatasetDetailPage.tsx |  2 +-
 src/utils/preview.js                   | 11 ++++++++++-
 2 files changed, 11 insertions(+), 2 deletions(-)

diff --git a/src/pages/UpdatedDatasetDetailPage.tsx b/src/pages/UpdatedDatasetDetailPage.tsx
index 52f87ca..67b3cb6 100644
--- a/src/pages/UpdatedDatasetDetailPage.tsx
+++ b/src/pages/UpdatedDatasetDetailPage.tsx
@@ -1568,7 +1568,7 @@ const UpdatedDatasetDetailPage: React.FC = () => {
           style={{
             display: "none",
             marginTop: "16px",
-            background: Colors.darkGray,
+            background: Colors.lightGray,
             color: Colors.black,
             padding: "12px",
             borderRadius: "8px",
diff --git a/src/utils/preview.js b/src/utils/preview.js
index 02f3908..dbb1c56 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -396,7 +396,7 @@ function dopreview(key, idx, isinternal, hastime) {
     $("#chartpanel").css("padding", "10px");
     $("#chartpanel").show();
     $("#chartpanel").html(
-      '<h4>Data preview</h4><a href="javascript:void(0)" class="closebtn" onclick="$(\'#chartpanel\').hide()" title="Close">&times;</a><div id="plotchart"></div>'
+      '<h4>Data preview</h4><a href="javascript:void(0)" class="closebtn" style="color: black;" onclick="$(\'#chartpanel\').hide()" title="Close">&times;</a><div id="plotchart"></div>'
     );
     if (dataroot instanceof nj.NdArray) {
       // console.log("dataroot", dataroot);
@@ -445,6 +445,15 @@ function dopreview(key, idx, isinternal, hastime) {
         plotdata,
         document.getElementById("plotchart")
       );
+      // Reset all series on double-click (works on both Mac and Windows)
+      uplotInstance.root.addEventListener("dblclick", (e) => {
+        e.preventDefault();
+        e.stopPropagation();
+        uplotInstance.series.forEach((s, i) => {
+          if (i === 0) return; // skip x-axis
+          uplotInstance.setSeries(i, { show: true });
+        });
+      });
     } else {
       // let u = new uPlot(
       //   opts,

From ad92d728277ff4f1ec4129b6656ce0ed51f46d71 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 16 Apr 2026 09:42:07 -0400
Subject: [PATCH 08/61] fix: strip markdown fences from BIDSPlan YAML string
 before saving

---
 .../DatasetOrganizer/utils/plannerHelpers.ts  |  9 ++++++-
 src/utils/preview.js                          | 27 +++++++++++++------
 2 files changed, 27 insertions(+), 9 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts b/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
index 5b203e8..820c61f 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
+++ b/src/components/User/Dashboard/DatasetOrganizer/utils/plannerHelpers.ts
@@ -858,7 +858,14 @@ export const buildBidsPlan = async (
   }
 
   // Preserve raw YAML string for saving
-  const planYamlStr = raw.startsWith("```") ? planYaml._raw ?? raw : raw;
+  //   const planYamlStr = raw.startsWith("```") ? planYaml._raw ?? raw : raw;
+  // Preserve raw YAML string for saving — strip markdown fences if present (mirrors planner.py Step 3)
+  let planYamlStr = raw.trim();
+  if (planYamlStr.startsWith("```yaml")) planYamlStr = planYamlStr.slice(7);
+  else if (planYamlStr.startsWith("```"))
+    planYamlStr = planYamlStr.split("\n").slice(1).join("\n");
+  if (planYamlStr.endsWith("```")) planYamlStr = planYamlStr.slice(0, -3);
+  planYamlStr = planYamlStr.trim();
 
   log("✓ BIDSPlan complete");
   return {
diff --git a/src/utils/preview.js b/src/utils/preview.js
index dbb1c56..3013967 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -398,6 +398,7 @@ function dopreview(key, idx, isinternal, hastime) {
     $("#chartpanel").html(
       '<h4>Data preview</h4><a href="javascript:void(0)" class="closebtn" style="color: black;" onclick="$(\'#chartpanel\').hide()" title="Close">&times;</a><div id="plotchart"></div>'
     );
+
     if (dataroot instanceof nj.NdArray) {
       // console.log("dataroot", dataroot);
       if (dataroot.shape[0] > dataroot.shape[1])
@@ -445,15 +446,16 @@ function dopreview(key, idx, isinternal, hastime) {
         plotdata,
         document.getElementById("plotchart")
       );
+
       // Reset all series on double-click (works on both Mac and Windows)
-      uplotInstance.root.addEventListener("dblclick", (e) => {
-        e.preventDefault();
-        e.stopPropagation();
-        uplotInstance.series.forEach((s, i) => {
-          if (i === 0) return; // skip x-axis
-          uplotInstance.setSeries(i, { show: true });
-        });
-      });
+      // uplotInstance.root.addEventListener("dblclick", (e) => {
+      //   e.preventDefault();
+      //   e.stopPropagation();
+      //   uplotInstance.series.forEach((s, i) => {
+      //     if (i === 0) return; // skip x-axis
+      //     uplotInstance.setSeries(i, { show: true });
+      //   });
+      // });
     } else {
       // let u = new uPlot(
       //   opts,
@@ -469,6 +471,15 @@ function dopreview(key, idx, isinternal, hastime) {
         [[...Array(dataroot.length).keys()], dataroot],
         document.getElementById("plotchart")
       );
+
+      // uplotInstance.root.addEventListener("dblclick", (e) => {
+      //   e.preventDefault();
+      //   e.stopPropagation();
+      //   uplotInstance.series.forEach((s, i) => {
+      //     if (i === 0) return;
+      //     uplotInstance.setSeries(i, { show: true });
+      //   });
+      // });
     }
 
     // for spinner

From 072db3dcfd57c566e245ce0d9b5115d1613c4f7d Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 16 Apr 2026 10:24:02 -0400
Subject: [PATCH 09/61] fix: expand external data path segments and add 2D plot
 interaction tips

---
 src/pages/UpdatedDatasetDetailPage.tsx |  2 +-
 src/utils/preview.js                   | 13 ++++++++++++-
 2 files changed, 13 insertions(+), 2 deletions(-)

diff --git a/src/pages/UpdatedDatasetDetailPage.tsx b/src/pages/UpdatedDatasetDetailPage.tsx
index 67b3cb6..db1236d 100644
--- a/src/pages/UpdatedDatasetDetailPage.tsx
+++ b/src/pages/UpdatedDatasetDetailPage.tsx
@@ -335,7 +335,7 @@ const UpdatedDatasetDetailPage: React.FC = () => {
               : "Unknown Size";
 
             const parts = currentPath.split("/");
-            const subpath = parts.slice(-3).join("/");
+            const subpath = parts.slice(-6).join("/");
             const label = parentKey || "ExternalData";
 
             links.push({
diff --git a/src/utils/preview.js b/src/utils/preview.js
index 3013967..d8721f8 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -396,7 +396,18 @@ function dopreview(key, idx, isinternal, hastime) {
     $("#chartpanel").css("padding", "10px");
     $("#chartpanel").show();
     $("#chartpanel").html(
-      '<h4>Data preview</h4><a href="javascript:void(0)" class="closebtn" style="color: black;" onclick="$(\'#chartpanel\').hide()" title="Close">&times;</a><div id="plotchart"></div>'
+      '<h4>Data preview</h4><a href="javascript:void(0)" class="closebtn" style="color: black;" onclick="$(\'#chartpanel\').hide()" title="Close">&times;</a>' +
+        '<div style="font-size:0.78rem; color:#555; margin:6px 0 4px 0; padding:6px 10px; background:#f0f0f0; border-radius:4px;">' +
+        "<b>Tips:</b> " +
+        "<b>Click</b> a item to toggle a signal &nbsp;|&nbsp;<br> " +
+        "<b>⌘+Click</b> (Mac) / <b>Ctrl+Click</b> (Windows) to isolate one signal &nbsp;|&nbsp; " +
+        "<b>Shift+Click</b> to add more signals to the selection &nbsp;|&nbsp; " +
+        "<b>Click and drag</b> on the plot to zoom into a region &nbsp;|&nbsp;" +
+        "<b>Double-click</b> to restore selected signals (Mac) &nbsp;|&nbsp; " +
+        "<b>Double-click</b> to restore all signals (Windows) &nbsp;|&nbsp; " +
+        "<b>⌘+Click</b> the same selected item to restore all signals (Mac)" +
+        "</div>" +
+        '<div id="plotchart"></div>'
     );
 
     if (dataroot instanceof nj.NdArray) {

From 2fffdb9ed74de7ecd42805e0596a1904abc14fb3 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 16 Apr 2026 13:07:32 -0400
Subject: [PATCH 10/61] feat: show source path and index above 2D chart panel

---
 src/pages/UpdatedDatasetDetailPage.tsx | 50 ++++++++++++++++++++++----
 src/utils/preview.js                   | 11 ++++--
 2 files changed, 51 insertions(+), 10 deletions(-)

diff --git a/src/pages/UpdatedDatasetDetailPage.tsx b/src/pages/UpdatedDatasetDetailPage.tsx
index db1236d..a5be12c 100644
--- a/src/pages/UpdatedDatasetDetailPage.tsx
+++ b/src/pages/UpdatedDatasetDetailPage.tsx
@@ -262,7 +262,7 @@ const UpdatedDatasetDetailPage: React.FC = () => {
   const [searchParams, setSearchParams] = useSearchParams();
   const focus = searchParams.get("focus") || undefined; // get highlight from url
   const rev = searchParams.get("rev") || undefined; // get revision from url
-
+  const [chart2DPreviewPath, setChart2DPreviewPath] = useState<string>("");
   const [externalLinks, setExternalLinks] = useState<ExternalDataLink[]>([]);
   const [internalLinks, setInternalLinks] = useState<InternalDataLink[]>([]);
   const [isInternalExpanded, setIsInternalExpanded] = useState(true);
@@ -284,6 +284,14 @@ const UpdatedDatasetDetailPage: React.FC = () => {
     ? rawSummary
     : Object.values(rawSummary).filter(Boolean).join("\n\n");
   const readme = datasetDocument?.["README"] ?? "";
+
+  useEffect(() => {
+    window.__clear2DPath = () => setChart2DPreviewPath("");
+    return () => {
+      delete window.__clear2DPath;
+    };
+  }, []);
+
   const handleSelectRevision = (newRev?: string | null) => {
     setSearchParams((prev) => {
       const p = new URLSearchParams(prev); // copy of the query url
@@ -625,7 +633,9 @@ const UpdatedDatasetDetailPage: React.FC = () => {
   const handlePreview = (
     dataOrUrl: string | any,
     idx: number,
-    isInternal: boolean = false
+    isInternal: boolean = false,
+    previewPath: string = "",
+    displayNumber?: number
   ) => {
     // console.log(
     //   "🟢 Preview button clicked for:",
@@ -635,6 +645,9 @@ const UpdatedDatasetDetailPage: React.FC = () => {
     //   "Is Internal:",
     //   isInternal
     // );
+    setChart2DPreviewPath(
+      displayNumber ? `[${displayNumber}] ${previewPath}` : previewPath
+    );
 
     // Clear any stale preview type from last run
     delete (window as any).__previewType;
@@ -783,14 +796,14 @@ const UpdatedDatasetDetailPage: React.FC = () => {
     // Try internal data first
     const internal = internalMap.get(previewPath);
     if (internal) {
-      handlePreview(internal.data, internal.index, true);
+      handlePreview(internal.data, internal.index, true, previewPath);
       return;
     }
 
     // Then try external data by JSON path
     const external = linkMap.get(previewPath);
     if (external) {
-      handlePreview(external.url, external.index, false);
+      handlePreview(external.url, external.index, false, previewPath);
     }
   }, [
     datasetDocument,
@@ -1324,7 +1337,12 @@ const UpdatedDatasetDetailPage: React.FC = () => {
                               },
                             }}
                             onClick={() =>
-                              handlePreview(link.data, link.index, true)
+                              handlePreview(
+                                link.data,
+                                link.index,
+                                true,
+                                link.path
+                              )
                             }
                           >
                             Preview
@@ -1463,7 +1481,7 @@ const UpdatedDatasetDetailPage: React.FC = () => {
                           }}
                           title={link.name}
                         >
-                          {link.name}
+                          {index + 1}. {link.name}
                         </Typography>
                         <Box sx={{ display: "flex", flexShrink: 0, gap: 1 }}>
                           <Button
@@ -1500,7 +1518,13 @@ const UpdatedDatasetDetailPage: React.FC = () => {
                                 },
                               }}
                               onClick={() =>
-                                handlePreview(link.url, link.index, false)
+                                handlePreview(
+                                  link.url,
+                                  link.index,
+                                  false,
+                                  link.path,
+                                  index + 1
+                                )
                               }
                             >
                               Preview
@@ -1563,6 +1587,18 @@ const UpdatedDatasetDetailPage: React.FC = () => {
           </Box>
         </Box>
 
+        {chart2DPreviewPath && (
+          <Typography
+            sx={{
+              mt: 2,
+              mb: 0.5,
+              fontSize: "0.85rem",
+              color: Colors.lightBlue,
+            }}
+          >
+            Previewing: {chart2DPreviewPath}
+          </Typography>
+        )}
         <div
           id="chartpanel"
           style={{
diff --git a/src/utils/preview.js b/src/utils/preview.js
index d8721f8..6f4a0fb 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -381,8 +381,9 @@ function dopreview(key, idx, isinternal, hastime) {
     const opts = {
       // title: "Preview for " + (isinternal ? intdata[idx][3] : extdata[idx][3]),
       title:
-        "Preview for " +
-        (isinternal ? intdata[idx][3] : window.extdata[idx][3]),
+        // "Preview for " +
+        // (isinternal ? intdata[idx][3] : window.extdata[idx][3]),
+        "Data Preview",
       width: 1100,
       height: 400,
       series: [{}, {}],
@@ -396,7 +397,11 @@ function dopreview(key, idx, isinternal, hastime) {
     $("#chartpanel").css("padding", "10px");
     $("#chartpanel").show();
     $("#chartpanel").html(
-      '<h4>Data preview</h4><a href="javascript:void(0)" class="closebtn" style="color: black;" onclick="$(\'#chartpanel\').hide()" title="Close">&times;</a>' +
+      // '<h4>Data preview</h4><a href="javascript:void(0)" class="closebtn" style="color: black;" onclick="$(\'#chartpanel\').hide()" title="Close">&times;</a>' +
+      "<h4></h4>" +
+        '<a href="javascript:void(0)" class="closebtn" style="color: black;" ' +
+        "onclick=\"$('#chartpanel').hide(); window.__clear2DPath && window.__clear2DPath();\" " +
+        'title="Close">&times;</a>' +
         '<div style="font-size:0.78rem; color:#555; margin:6px 0 4px 0; padding:6px 10px; background:#f0f0f0; border-radius:4px;">' +
         "<b>Tips:</b> " +
         "<b>Click</b> a item to toggle a signal &nbsp;|&nbsp;<br> " +

From badf503cd117f7b6210714eac90008d6a182e582 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 6 May 2026 10:32:46 -0400
Subject: [PATCH 11/61] feat: add axis labels to 2D plot (Sample / a.u.)

---
 src/utils/preview.js | 11 ++++++++++-
 1 file changed, 10 insertions(+), 1 deletion(-)

diff --git a/src/utils/preview.js b/src/utils/preview.js
index 6f4a0fb..7e4dd6d 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -387,7 +387,16 @@ function dopreview(key, idx, isinternal, hastime) {
       width: 1100,
       height: 400,
       series: [{}, {}],
-      axes: [{}, {}],
+      axes: [
+        {
+          label: "Sample", // ← x axis
+          labelSize: 20,
+        },
+        {
+          label: "a.u.", // ← y axis
+          labelSize: 20,
+        },
+      ],
       scales: {
         x: {
           time: false,

From 7a303ed61bc5e1658a08a5091e693a77acf4d6d5 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 6 May 2026 11:11:42 -0400
Subject: [PATCH 12/61] refactor: point baseURL to Express server and remove
 cors proxy logic; refs #125

---
 src/services/instance.ts | 21 +++++++++++----------
 1 file changed, 11 insertions(+), 10 deletions(-)

diff --git a/src/services/instance.ts b/src/services/instance.ts
index bd02b1a..13ebec2 100644
--- a/src/services/instance.ts
+++ b/src/services/instance.ts
@@ -1,18 +1,19 @@
 import axios, { AxiosInstance, AxiosRequestConfig, AxiosResponse } from "axios";
 
-// export const baseURL =
-// 	process.env.REACT_APP_BACK_URL ??
-// 	"https://cors.redoc.ly/https://neurojson.io:7777";
+// ==========not mapping neurojson.org and CouchDB requests to backend api yet==============
+// const needsCorsProxy =
+//   process.env.REACT_APP_USE_CORS === "true" ||
+//   process.env.NODE_ENV === "development";
 
-const needsCorsProxy =
-  process.env.REACT_APP_USE_CORS === "true" ||
-  process.env.NODE_ENV === "development";
+// const backendURL = "https://neurojson.io:7777";
 
-const backendURL = "https://neurojson.io:7777";
+// export const baseURL = needsCorsProxy
+//   ? `https://cors.redoc.ly/${backendURL}`
+//   : backendURL;
+//==========================================================================================
 
-export const baseURL = needsCorsProxy
-  ? `https://cors.redoc.ly/${backendURL}`
-  : backendURL;
+export const baseURL =
+  process.env.REACT_APP_API_URL || "http://localhost:5000/api/v1";
 
 export const api: AxiosInstance = axios.create({
   baseURL,

From 0f7fbffaae061c5d21e5d9ac799ba75f2520d40f Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 6 May 2026 12:19:39 -0400
Subject: [PATCH 13/61] feat: map all external API calls through Express to
 bypass firewall port restrictions; refs #125

---
 backend/src/controllers/couchdb.controller.js |   8 +-
 backend/src/routes/dbs.routes.js              |   2 +-
 src/redux/neurojson/neurojson.action.ts       |   2 +-
 src/services/neurojson.service.ts             | 241 ++++++++++--------
 4 files changed, 147 insertions(+), 106 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index ac75807..e913ee3 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -1,8 +1,8 @@
 const axios = require("axios");
-const COUCHDB_BASE_URL =
-  process.env.COUCHDB_BASE_URL ||
-  "https://cors.redoc.ly/https://neurojson.io:7777";
-
+// const COUCHDB_BASE_URL =
+//   process.env.COUCHDB_BASE_URL ||
+//   "https://cors.redoc.ly/https://neurojson.io:7777";
+const COUCHDB_BASE_URL = "https://neurojson.io:7777";
 // get all dbs list (registry)
 const getDbList = async (req, res) => {
   try {
diff --git a/backend/src/routes/dbs.routes.js b/backend/src/routes/dbs.routes.js
index d11f970..c8a57fa 100644
--- a/backend/src/routes/dbs.routes.js
+++ b/backend/src/routes/dbs.routes.js
@@ -16,7 +16,7 @@ router.get("/", getDbList);
 router.get("/stats", getDbStats);
 
 // cross-database search
-router.get("/search", searchAllDatabases);
+router.post("/search", searchAllDatabases);
 
 // Specific database routes
 router.get("/:dbName", getDbInfo);
diff --git a/src/redux/neurojson/neurojson.action.ts b/src/redux/neurojson/neurojson.action.ts
index c050ad8..35cf6c1 100644
--- a/src/redux/neurojson/neurojson.action.ts
+++ b/src/redux/neurojson/neurojson.action.ts
@@ -45,7 +45,7 @@ export const loadPaginatedData = createAsyncThunk(
         return rejectWithValue("No more data to load.");
       }
 
-      response.rows = response.rows.map((row) => ({
+      response.rows = response.rows.map((row: any) => ({
         ...row,
         dbName,
       }));
diff --git a/src/services/neurojson.service.ts b/src/services/neurojson.service.ts
index fe6859d..008e960 100644
--- a/src/services/neurojson.service.ts
+++ b/src/services/neurojson.service.ts
@@ -8,125 +8,166 @@ import { IApiResponse } from "types/responses/apiResponse.interface";
 import { Registry } from "types/responses/registry.interface";
 
 export const NeurojsonService = {
-  getRegistry: async (): Promise<Registry> => {
-    const response = await api.get<Registry>(`${baseURL}/sys/registry`);
+  // getRegistry: async (): Promise<Registry> => {
+  //   const response = await api.get<Registry>(`${baseURL}/sys/registry`);
 
+  //   return response.data;
+  // },
+  // GET /api/v1/dbs/  → getDbList
+  getRegistry: async () => {
+    const response = await api.get(`/dbs`);
     return response.data;
   },
-  getDbInfo: async (dbName: string): Promise<DBParticulars> => {
-    const response = await api.get(`${baseURL}/${dbName}`);
+
+  // getDbInfo: async (dbName: string): Promise<DBParticulars> => {
+  //   const response = await api.get(`${baseURL}/${dbName}`);
+  //   return response.data;
+  // },
+  // GET /api/v1/dbs/:dbName  → getDbInfo
+  getDbInfo: async (dbName: string) => {
+    const response = await api.get(`/dbs/${dbName}`);
     return response.data;
   },
-  getPaginatedData: async (
-    dbName: string,
-    offset: number,
-    limit: number
-  ): Promise<DBDatafields> => {
-    const response = await api.get(
-      `${baseURL}/${dbName}/_design/qq/_view/dbinfo?limit=${limit}&skip=${offset}`
-    );
 
+  // getPaginatedData: async (
+  //   dbName: string,
+  //   offset: number,
+  //   limit: number
+  // ): Promise<DBDatafields> => {
+  //   const response = await api.get(
+  //     `${baseURL}/${dbName}/_design/qq/_view/dbinfo?limit=${limit}&skip=${offset}`
+  //   );
+
+  //   return response.data;
+  // },
+  // GET /api/v1/dbs/:dbName/datasets?offset=0&limit=10  → getDbDatasets
+  getPaginatedData: async (dbName: string, offset: number, limit: number) => {
+    const response = await api.get(`/dbs/${dbName}/datasets`, {
+      params: { offset, limit },
+    });
     return response.data;
   },
-  getDocumentById: async (
-    dbName: string,
-    documentId: string,
-    rev?: string
-  ): Promise<any> => {
-    try {
-      const url = `${baseURL}/${dbName}/${documentId}`;
-      // const response = await api.get(
-      //   `${baseURL}/${dbName}/${documentId}?revs_info=true`
-      // );
-      const response = await api.get(url, {
-        params: {
-          revs_info: true,
-          ...(rev ? { rev } : {}), // add ?rev=... only when provided
-        },
-      });
-      return response.data;
-    } catch (error) {
-      console.error(
-        `Error fetching document with ID ${documentId} from ${dbName}:`,
-        error
-      );
-      throw error;
-    }
+
+  // getDocumentById: async (
+  //   dbName: string,
+  //   documentId: string,
+  //   rev?: string
+  // ): Promise<any> => {
+  //   try {
+  //     const url = `${baseURL}/${dbName}/${documentId}`;
+  //     const response = await api.get(url, {
+  //       params: {
+  //         revs_info: true,
+  //         ...(rev ? { rev } : {}), // add ?rev=... only when provided
+  //       },
+  //     });
+  //     return response.data;
+  //   } catch (error) {
+  //     console.error(
+  //       `Error fetching document with ID ${documentId} from ${dbName}:`,
+  //       error
+  //     );
+  //     throw error;
+  //   }
+  // },
+  // GET /api/v1/datasets/:dbName/:datasetId  → getDatasetDetail
+  getDocumentById: async (dbName: string, documentId: string, rev?: string) => {
+    const response = await api.get(`/datasets/${dbName}/${documentId}`, {
+      params: { revs_info: true, ...(rev ? { rev } : {}) },
+    });
+    return response.data;
   },
-  getDbStats: async (): Promise<any> => {
-    const response = await axios.get(
-      "https://cors.redoc.ly/https://neurojson.org/io/search.cgi?dbstats=1"
-    );
+
+  // getDbStats: async (): Promise<any> => {
+  //   const response = await axios.get(
+  //     "https://cors.redoc.ly/https://neurojson.org/io/search.cgi?dbstats=1"
+  //   );
+  //   return response.data;
+  // },
+  // GET /api/v1/dbs/stats  → getDbStats
+  getDbStats: async () => {
+    const response = await api.get(`/dbs/stats`);
     return response.data;
   },
-  getMetadataSearchResults: async (formData: any): Promise<any> => {
-    const map: Record<string, string> = {
-      keyword: "keyword",
-      age_min: "agemin",
-      age_max: "agemax",
-      task_min: "taskmin",
-      task_max: "taskmax",
-      run_min: "runmin",
-      run_max: "runmax",
-      sess_min: "sessmin",
-      sess_max: "sessmax",
-      modality: "modality",
-      run_name: "run",
-      type_name: "type",
-      session_name: "session",
-      task_name: "task",
-      limit: "limit",
-      skip: "skip",
-      count: "count",
-      unique: "unique",
-      gender: "gender",
-      database: "dbname",
-      dataset: "dsname",
-      subject: "subname",
-    };
 
-    const params = new URLSearchParams();
-    params.append("_get", "dbname, dsname, json");
-    Object.keys(formData).forEach((key) => {
-      let val = formData[key];
-      if (val === "" || val === "any" || val === undefined || val === null)
-        return;
+  // getMetadataSearchResults: async (formData: any): Promise<any> => {
+  //   const map: Record<string, string> = {
+  //     keyword: "keyword",
+  //     age_min: "agemin",
+  //     age_max: "agemax",
+  //     task_min: "taskmin",
+  //     task_max: "taskmax",
+  //     run_min: "runmin",
+  //     run_max: "runmax",
+  //     sess_min: "sessmin",
+  //     sess_max: "sessmax",
+  //     modality: "modality",
+  //     run_name: "run",
+  //     type_name: "type",
+  //     session_name: "session",
+  //     task_name: "task",
+  //     limit: "limit",
+  //     skip: "skip",
+  //     count: "count",
+  //     unique: "unique",
+  //     gender: "gender",
+  //     database: "dbname",
+  //     dataset: "dsname",
+  //     subject: "subname",
+  //   };
 
-      const queryKey = map[key];
-      if (!queryKey) return;
+  //   const params = new URLSearchParams();
+  //   params.append("_get", "dbname, dsname, json");
+  //   Object.keys(formData).forEach((key) => {
+  //     let val = formData[key];
+  //     if (val === "" || val === "any" || val === undefined || val === null)
+  //       return;
 
-      if (key.startsWith("age")) {
-        params.append(queryKey, String(Math.floor(val * 100)).padStart(5, "0"));
-      } else if (key === "gender") {
-        params.append(queryKey, val[0]);
-      } else if (key === "modality") {
-        params.append(queryKey, val.replace(/.*\(/, "").replace(/\).*/, ""));
-      } else {
-        params.append(queryKey, val.toString());
-      }
-    });
+  //     const queryKey = map[key];
+  //     if (!queryKey) return;
+
+  //     if (key.startsWith("age")) {
+  //       params.append(queryKey, String(Math.floor(val * 100)).padStart(5, "0"));
+  //     } else if (key === "gender") {
+  //       params.append(queryKey, val[0]);
+  //     } else if (key === "modality") {
+  //       params.append(queryKey, val.replace(/.*\(/, "").replace(/\).*/, ""));
+  //     } else {
+  //       params.append(queryKey, val.toString());
+  //     }
+  //   });
 
-    const queryString = `?${params.toString()}`;
-    const response = await axios.get(
-      `https://cors.redoc.ly/https://neurojson.org/io/search.cgi${queryString}`
-    );
+  //   const queryString = `?${params.toString()}`;
+  //   const response = await axios.get(
+  //     `https://cors.redoc.ly/https://neurojson.org/io/search.cgi${queryString}`
+  //   );
 
+  //   return response.data;
+  // },
+  // POST /api/v1/dbs/search  → searchAllDatabases
+  getMetadataSearchResults: async (formData: any) => {
+    const response = await api.post(`/dbs/search`, formData);
     return response.data;
   },
 
-  getDbInfoByDatasetId: async (dbName: string, dsId: string): Promise<any> => {
-    const response = await api.get(
-      `${baseURL}/${dbName}/_design/qq/_view/dbinfo`,
-      {
-        params: {
-          // CouchDB expects a JSON value; this produces %22ds000001%22
-          key: JSON.stringify(dsId),
-          // include_docs is optional; keep it if your view needs the full doc
-          include_docs: true,
-          // reduce: false, // uncomment if your view has a reduce function
-        },
-      }
-    );
+  // getDbInfoByDatasetId: async (dbName: string, dsId: string): Promise<any> => {
+  //   const response = await api.get(
+  //     `${baseURL}/${dbName}/_design/qq/_view/dbinfo`,
+  //     {
+  //       params: {
+  //         // CouchDB expects a JSON value; this produces %22ds000001%22
+  //         key: JSON.stringify(dsId),
+  //         // include_docs is optional; keep it if your view needs the full doc
+  //         include_docs: true,
+  //         // reduce: false, // uncomment if your view has a reduce function
+  //       },
+  //     }
+  //   );
+  //   return response.data;
+  // },
+  // GET /api/v1/datasets/:dbName/:datasetId/meta  → getDatasetMeta
+  getDbInfoByDatasetId: async (dbName: string, dsId: string) => {
+    const response = await api.get(`/datasets/${dbName}/${dsId}/meta`);
     return response.data;
   },
 };

From c450eb4108bf4a19f3b27d47bc256d6a958ff183 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 6 May 2026 12:44:16 -0400
Subject: [PATCH 14/61] fix: clear stale document and revision state when
 navigating between datasets

---
 src/pages/UpdatedDatasetDetailPage.tsx | 13 ++++++++++---
 src/redux/neurojson/neurojson.slice.ts |  6 +++++-
 2 files changed, 15 insertions(+), 4 deletions(-)

diff --git a/src/pages/UpdatedDatasetDetailPage.tsx b/src/pages/UpdatedDatasetDetailPage.tsx
index a5be12c..f94a751 100644
--- a/src/pages/UpdatedDatasetDetailPage.tsx
+++ b/src/pages/UpdatedDatasetDetailPage.tsx
@@ -68,6 +68,7 @@ import {
   fetchDbInfoByDatasetId,
 } from "redux/neurojson/neurojson.action";
 import { NeurojsonSelector } from "redux/neurojson/neurojson.selector";
+import { resetDocument } from "redux/neurojson/neurojson.slice";
 // import { NeurojsonService } from "services/neurojson.service";
 import RoutesEnum from "types/routes.enum";
 
@@ -486,6 +487,12 @@ const UpdatedDatasetDetailPage: React.FC = () => {
     };
   }, []);
 
+  // clean old dataset detail and metadata panel(include rev)
+  useEffect(() => {
+    dispatch(resetDocument()); // clear redux state
+    setRevsList([]); // clear local state
+  }, [dbName, docId, dispatch]);
+
   useEffect(() => {
     if (!dbName || !docId) return;
 
@@ -501,10 +508,10 @@ const UpdatedDatasetDetailPage: React.FC = () => {
     const fromDoc = Array.isArray(datasetDocument?._revs_info)
       ? (datasetDocument._revs_info as { rev: string }[])
       : [];
-    if (fromDoc.length && revsList.length === 0) {
-      setRevsList(fromDoc);
+    if (fromDoc.length > 0) {
+      setRevsList(fromDoc); // only update when we have revisions
     }
-  }, [datasetDocument, revsList.length]);
+  }, [datasetDocument]);
 
   useEffect(() => {
     if (datasetDocument) {
diff --git a/src/redux/neurojson/neurojson.slice.ts b/src/redux/neurojson/neurojson.slice.ts
index fdcd2ce..90722c7 100644
--- a/src/redux/neurojson/neurojson.slice.ts
+++ b/src/redux/neurojson/neurojson.slice.ts
@@ -43,6 +43,10 @@ const neurojsonSlice = createSlice({
     setLoading: (state, action: PayloadAction<boolean>) => {
       state.loading = action.payload;
     },
+    resetDocument: (state) => {
+      state.selectedDocument = null;
+      state.datasetViewInfo = null;
+    },
   },
   extraReducers: (builder) => {
     builder
@@ -169,6 +173,6 @@ const neurojsonSlice = createSlice({
   },
 });
 
-export const { resetData, setLoading } = neurojsonSlice.actions;
+export const { resetData, setLoading, resetDocument } = neurojsonSlice.actions;
 
 export default neurojsonSlice.reducer;

From 67cb50e3fb154b90ef22abb923613087faca78e3 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 7 May 2026 11:16:06 -0400
Subject: [PATCH 15/61] feat: add search tables migration and update db config
 for local postgres

---
 backend/config/config.js                      |  13 +-
 .../20260507145253-create-search-tables.js    | 130 ++++++++++++++++++
 2 files changed, 141 insertions(+), 2 deletions(-)
 create mode 100644 backend/migrations/20260507145253-create-search-tables.js

diff --git a/backend/config/config.js b/backend/config/config.js
index 7c15ed9..d117965 100644
--- a/backend/config/config.js
+++ b/backend/config/config.js
@@ -1,9 +1,18 @@
 require("dotenv").config();
 
 module.exports = {
+  // development: {
+  //   dialect: "sqlite",
+  //   storage: "./database.sqlite",
+  //   logging: console.log,
+  // },
   development: {
-    dialect: "sqlite",
-    storage: "./database.sqlite",
+    dialect: "postgres",
+    host: "localhost",
+    port: 5432,
+    database: "neurojson_dev",
+    username: process.env.DB_USER_LOCAL,
+    password: process.env.DB_PASSWORD_LOCAL,
     logging: console.log,
   },
   test: {
diff --git a/backend/migrations/20260507145253-create-search-tables.js b/backend/migrations/20260507145253-create-search-tables.js
new file mode 100644
index 0000000..d2c9deb
--- /dev/null
+++ b/backend/migrations/20260507145253-create-search-tables.js
@@ -0,0 +1,130 @@
+"use strict";
+
+/** @type {import('sequelize-cli').Migration} */
+module.exports = {
+  async up(queryInterface, Sequelize) {
+    // ioviews table
+    await queryInterface.createTable("ioviews", {
+      id: {
+        type: Sequelize.INTEGER,
+        autoIncrement: true,
+        primaryKey: true,
+        allowNull: false,
+      },
+      dbname: {
+        type: Sequelize.STRING(30),
+        allowNull: true,
+      },
+      dsname: {
+        type: Sequelize.STRING(30),
+        allowNull: true,
+      },
+      subj: {
+        type: Sequelize.STRING(12),
+        allowNull: true,
+      },
+      view: {
+        type: Sequelize.STRING(12),
+        allowNull: true,
+      },
+      json: {
+        type: Sequelize.JSONB,
+        allowNull: true,
+      },
+      search_vector: {
+        type: Sequelize.DataTypes.TSVECTOR,
+        allowNull: true,
+      },
+      updated_at: {
+        type: Sequelize.DATE,
+        allowNull: false,
+        defaultValue: Sequelize.literal("CURRENT_TIMESTAMP"),
+      },
+    });
+
+    // ioviews indexes
+    await queryInterface.addIndex("ioviews", ["view"], {
+      name: "idx_ioviews_view",
+    });
+    await queryInterface.addIndex("ioviews", ["dbname"], {
+      name: "idx_ioviews_dbname",
+    });
+    await queryInterface.addIndex("ioviews", ["updated_at"], {
+      name: "idx_ioviews_updated_at",
+    });
+
+    // GIN indexes need raw query (not supported by addIndex)
+    await queryInterface.sequelize.query(`
+    CREATE INDEX IF NOT EXISTS idx_ioviews_search 
+      ON ioviews USING GIN(search_vector);
+    CREATE INDEX IF NOT EXISTS idx_ioviews_json 
+      ON ioviews USING GIN(json);
+  `);
+
+    // iolinks table
+    await queryInterface.createTable("iolinks", {
+      id: {
+        type: Sequelize.INTEGER,
+        autoIncrement: true,
+        primaryKey: true,
+        allowNull: false,
+      },
+      dbname: {
+        type: Sequelize.STRING(30),
+        allowNull: true,
+      },
+      dsname: {
+        type: Sequelize.STRING(30),
+        allowNull: true,
+      },
+      subj: {
+        type: Sequelize.TEXT,
+        allowNull: true,
+      },
+      view: {
+        type: Sequelize.TEXT,
+        allowNull: true,
+      },
+      json: {
+        type: Sequelize.JSONB,
+        allowNull: true,
+      },
+    });
+
+    // iolinks indexes
+    await queryInterface.addIndex("iolinks", ["view"], {
+      name: "idx_iolinks_view",
+    });
+    await queryInterface.addIndex("iolinks", ["dbname"], {
+      name: "idx_iolinks_dbname",
+    });
+    await queryInterface.sequelize.query(`
+    CREATE INDEX IF NOT EXISTS idx_iolinks_json 
+      ON iolinks USING GIN(json);
+  `);
+
+    // sync_state table
+    await queryInterface.createTable("sync_state", {
+      dbname: {
+        type: Sequelize.STRING(30),
+        primaryKey: true,
+        allowNull: false,
+      },
+      last_seq: {
+        type: Sequelize.TEXT,
+        allowNull: true,
+      },
+      synced_at: {
+        type: Sequelize.DATE,
+        allowNull: false,
+        defaultValue: Sequelize.literal("CURRENT_TIMESTAMP"),
+      },
+    });
+  },
+
+  async down(queryInterface, Sequelize) {
+    await queryInterface.dropTable("ioviews");
+    await queryInterface.dropTable("iolinks");
+    await queryInterface.dropTable("sync_state");
+  },
+};

From 7432b3539892f99b174061815b80894c13605bcc Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 8 May 2026 10:54:52 -0400
Subject: [PATCH 16/61] feat: add incremental sync script to populate ioviews
 and iolinks from CouchDB

---
 backend/package.json            |   3 +-
 backend/sync/incrementalSync.js | 263 ++++++++++++++++++++++++++++++++
 2 files changed, 265 insertions(+), 1 deletion(-)
 create mode 100644 backend/sync/incrementalSync.js

diff --git a/backend/package.json b/backend/package.json
index 1dde6de..fa156b3 100644
--- a/backend/package.json
+++ b/backend/package.json
@@ -11,7 +11,8 @@
     "migrate:undo:all": "npx sequelize-cli db:migrate:undo:all",
     "seed": "npx sequelize-cli db:seed:all",
     "seed:undo": "npx sequelize-cli db:seed:undo:all",
-    "db:reset": "npx sequelize-cli db:migrate:undo:all && npx sequelize-cli db:migrate"
+    "db:reset": "npx sequelize-cli db:migrate:undo:all && npx sequelize-cli db:migrate",
+    "sync": "node sync/incrementalSync.js"
   },
   "keywords": [
     "express",
diff --git a/backend/sync/incrementalSync.js b/backend/sync/incrementalSync.js
new file mode 100644
index 0000000..b885fc7
--- /dev/null
+++ b/backend/sync/incrementalSync.js
@@ -0,0 +1,263 @@
+"use strict";
+
+require("dotenv").config();
+const axios = require("axios");
+const { sequelize } = require("../src/config/database");
+
+const COUCHDB_URL = process.env.COUCHDB_URL || "https://neurojson.io:7777";
+
+// fetch database list dynamically from registry
+async function getDatabases() {
+  try {
+    const response = await axios.get(`${COUCHDB_URL}/sys/registry`);
+    const databases = response.data
+      .map((db) => db.id)
+      .filter((id) => id && id !== "sys");
+    console.log(`Found ${databases.length} databases in registry`);
+    return databases;
+  } catch (err) {
+    console.error("Failed to fetch registry:", err.message);
+    // fallback to hardcoded list if registry fails
+    return [
+      "openneuro",
+      "abide",
+      "abide2",
+      "datalad-registry",
+      "adhd200",
+      "bfnirs",
+      "mcx",
+      "mmc",
+      "ucl-4d-neonatal-head-model",
+      "unc-012-infant-atlas",
+      "unc-infant-cortical-surface-atlas",
+      "cotilab",
+      "emnist",
+      "nemo-bids",
+      "openfnirs",
+    ];
+  }
+}
+
+// get last synced sequence number for a database
+async function getLastSeq(dbname) {
+  try {
+    const result = await sequelize.query(
+      "SELECT last_seq FROM sync_state WHERE dbname = :dbname",
+      {
+        replacements: { dbname },
+        type: sequelize.QueryTypes.SELECT,
+      }
+    );
+    return result[0]?.last_seq || "0";
+  } catch (err) {
+    console.error(`Error getting last_seq for ${dbname}:`, err.message);
+    return "0";
+  }
+}
+
+// save latest sequence number after sync
+async function saveLastSeq(dbname, seq) {
+  await sequelize.query(
+    `INSERT INTO sync_state (dbname, last_seq, synced_at)
+     VALUES (:dbname, :seq, NOW())
+     ON CONFLICT (dbname) DO UPDATE
+     SET last_seq = :seq, synced_at = NOW()`,
+    { replacements: { dbname, seq } }
+  );
+}
+
+// upsert a row into ioviews
+async function upsertIoview(dbname, dsname, subj, view, json) {
+  await sequelize.query(
+    `INSERT INTO ioviews (dbname, dsname, subj, view, json, search_vector, updated_at)
+     VALUES (:dbname, :dsname, :subj, :view, :json, to_tsvector('english', :text), NOW())
+     ON CONFLICT (dbname, dsname, subj, view) DO UPDATE
+     SET json = :json,
+         search_vector = to_tsvector('english', :text),
+         updated_at = NOW()`,
+    {
+      replacements: {
+        dbname,
+        dsname,
+        subj: String(subj),
+        view,
+        json: JSON.stringify(json),
+        text: JSON.stringify(json),
+      },
+    }
+  );
+}
+
+// insert a row into iolinks
+async function insertIolink(dbname, dsname, subj, view, json) {
+  await sequelize.query(
+    `INSERT INTO iolinks (dbname, dsname, subj, view, json)
+     VALUES (:dbname, :dsname, :subj, :view, :json)`,
+    {
+      replacements: {
+        dbname,
+        dsname,
+        subj: String(subj),
+        view,
+        json: JSON.stringify(json),
+      },
+    }
+  );
+}
+
+// delete all records for a dataset
+async function deleteDataset(dbname, dsname) {
+  await sequelize.query(
+    "DELETE FROM ioviews WHERE dbname = :dbname AND dsname = :dsname",
+    { replacements: { dbname, dsname } }
+  );
+  await sequelize.query(
+    "DELETE FROM iolinks WHERE dbname = :dbname AND dsname = :dsname",
+    { replacements: { dbname, dsname } }
+  );
+  console.log(`  Deleted ${dbname}/${dsname}`);
+}
+
+// first time sync - fetch from CouchDB views directly
+async function firstSync(dbname) {
+  console.log(`  ${dbname}: first sync, fetching all views...`);
+
+  // fetch dbinfo view
+  const dbinfoRes = await axios.get(
+    `${COUCHDB_URL}/${dbname}/_design/qq/_view/dbinfo`
+  );
+  const dbinfoRows = dbinfoRes.data.rows || [];
+  for (const row of dbinfoRows) {
+    const subj = String(row.value?.subj?.length || 0);
+    await upsertIoview(dbname, row.id, subj, "dbinfo", row.value);
+  }
+  console.log(`  ${dbname}: dbinfo synced (${dbinfoRows.length} rows)`);
+
+  // fetch subjects view
+  const subjectsRes = await axios.get(
+    `${COUCHDB_URL}/${dbname}/_design/qq/_view/subjects`
+  );
+  const subjectRows = subjectsRes.data.rows || [];
+  for (const row of subjectRows) {
+    const subj = String(row.key?.[6] || "");
+    await upsertIoview(dbname, row.id, subj, "subjects", {
+      key: row.key,
+      value: row.value,
+    });
+  }
+  console.log(`  ${dbname}: subjects synced (${subjectRows.length} rows)`);
+
+  // fetch links view
+  const linksRes = await axios.get(
+    `${COUCHDB_URL}/${dbname}/_design/qq/_view/links`
+  );
+  const linkRows = linksRes.data.rows || [];
+  for (const row of linkRows) {
+    const fileType = row.key?.[0];
+    const subjId = String(row.key?.[1] || "");
+    await insertIolink(dbname, row.id, subjId, fileType, {
+      key: row.key,
+      value: row.value,
+    });
+  }
+  console.log(`  ${dbname}: links synced (${linkRows.length} rows)`);
+}
+
+// incremental sync - only fetch changes since last sync
+async function incrementalSync(dbname, lastSeq) {
+  const { data } = await axios.get(
+    `${COUCHDB_URL}/${dbname}/_changes?since=${lastSeq}&include_docs=true`
+  );
+
+  if (data.results.length === 0) {
+    console.log(`  ${dbname}: no changes since last sync`);
+    return data.last_seq;
+  }
+
+  console.log(`  ${dbname}: ${data.results.length} changes found`);
+
+  for (const change of data.results) {
+    if (change.deleted) {
+      await deleteDataset(dbname, change.id);
+      continue;
+    }
+
+    const doc = change.doc;
+    if (!doc?.value) continue;
+
+    // upsert dbinfo
+    if (doc.value.subj && Array.isArray(doc.value.subj)) {
+      const subj = String(doc.value.subj.length);
+      await upsertIoview(dbname, change.id, subj, "dbinfo", doc.value);
+    }
+
+    // upsert subjects
+    if (doc.value.subjects) {
+      for (const [subjId, subjData] of Object.entries(doc.value.subjects)) {
+        await upsertIoview(dbname, change.id, subjId, "subjects", {
+          key: subjData.key,
+          value: subjData.value,
+        });
+      }
+    }
+
+    // upsert links
+    if (doc.value.links) {
+      for (const link of doc.value.links) {
+        const fileType = link.key?.[0];
+        const subjId = String(link.key?.[1] || "");
+        await insertIolink(dbname, change.id, subjId, fileType, link);
+      }
+    }
+  }
+
+  return data.last_seq;
+}
+
+// sync a single database
+async function syncDatabase(dbname) {
+  console.log(`\nSyncing ${dbname}...`);
+  const lastSeq = await getLastSeq(dbname);
+
+  try {
+    if (lastSeq === "0") {
+      await firstSync(dbname);
+    } else {
+      await incrementalSync(dbname, lastSeq);
+    }
+
+    // get and save the latest seq number
+    const { data: info } = await axios.get(`${COUCHDB_URL}/${dbname}`);
+    await saveLastSeq(dbname, String(info.update_seq));
+    console.log(`  ${dbname}: sync complete ✓`);
+  } catch (err) {
+    console.error(`  ${dbname}: sync failed - ${err.message}`);
+  }
+}
+
+// main function
+async function runSync() {
+  console.log("=== Starting NeuroJSON sync ===");
+  console.log(new Date().toISOString());
+  console.log(`CouchDB: ${COUCHDB_URL}`);
+  console.log(`Databases: ${DATABASES.length}`);
+
+  // change to getDatabases() when ready for full sync
+  // const databases = await getDatabases();
+  const databases = ["bfnirs"]; // testing with small database first
+
+  console.log(`Databases: ${databases.length}`);
+
+  for (const db of databases) {
+    await syncDatabase(db);
+  }
+
+  await sequelize.close();
+  console.log("\n=== Sync complete ===");
+  console.log(new Date().toISOString());
+}
+
+runSync().catch((err) => {
+  console.error("Sync failed:", err);
+  process.exit(1);
+});

From f686418b5b76d1adabde2e55419dd6dafd2ce11b Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 8 May 2026 15:47:06 -0400
Subject: [PATCH 17/61] feat: refactor incremental sync with transactions,
 concurrency, and edge case guards

---
 backend/sync/incrementalSync.js | 469 +++++++++++++++++++++++++++-----
 1 file changed, 402 insertions(+), 67 deletions(-)

diff --git a/backend/sync/incrementalSync.js b/backend/sync/incrementalSync.js
index b885fc7..5a73c42 100644
--- a/backend/sync/incrementalSync.js
+++ b/backend/sync/incrementalSync.js
@@ -5,6 +5,7 @@ const axios = require("axios");
 const { sequelize } = require("../src/config/database");
 
 const COUCHDB_URL = process.env.COUCHDB_URL || "https://neurojson.io:7777";
+const CONCURRENCY = 5;
 
 // fetch database list dynamically from registry
 async function getDatabases() {
@@ -17,7 +18,6 @@ async function getDatabases() {
     return databases;
   } catch (err) {
     console.error("Failed to fetch registry:", err.message);
-    // fallback to hardcoded list if registry fails
     return [
       "openneuro",
       "abide",
@@ -38,15 +38,275 @@ async function getDatabases() {
   }
 }
 
-// get last synced sequence number for a database
+// === Local ports of CouchDB _design/qq map functions ===
+// 1:1 ports of dbinfo / subjects / links views. If upstream views change,
+// these drift silently.
+
+/**
+ * Local port of the upstream `dbinfo` map function: summarises one dataset
+ * document (name, serialized size, README excerpt, subjects, modalities).
+ */
+function transformDbinfo(doc) {
+  const serialized = JSON.stringify(doc);
+  const description = doc["dataset_description.json"] || { Name: doc._id };
+  const readmeText = doc["README"] || doc["README.md"] || doc["README.rst"] || "";
+  const subjects = [];
+  const modalities = [];
+  // Record a name as a modality once; names containing "." are skipped.
+  const noteModality = (name) => {
+    if (!name.includes(".") && !modalities.includes(name)) modalities.push(name);
+  };
+
+  for (const [entry, content] of Object.entries(doc)) {
+    // Loose test kept from the original port: any key containing "ub-" is a subject.
+    if (!entry.includes("ub-")) continue;
+    subjects.push(entry);
+    for (const child of Object.keys(content || {})) {
+      if (child.startsWith("ses")) {
+        Object.keys(content[child] || {}).forEach((name) => noteModality(name));
+      } else {
+        noteModality(child);
+      }
+    }
+  }
+  if (subjects.length === 0) subjects.push("nonbids");
+
+  // No modality folders found: infer formats from marker keys in the raw JSON.
+  if (modalities.length === 0) {
+    if (serialized.includes('"MeshNode"')) modalities.push("JMesh");
+    if (serialized.includes('"NIFTIData"')) modalities.push("JNIFTI");
+    if (serialized.includes('"SNIRFData"')) modalities.push("JSNIRF");
+    if (serialized.includes('"_ArrayType_"')) modalities.push("JData");
+  }
+
+  return {
+    name: description.Name,
+    length: serialized.length,
+    readme: String(readmeText).slice(0, 256),
+    info: description,
+    subj: subjects,
+    modality: modalities,
+  };
+}
+
+function transformSubjects(doc) { // port of upstream `subjects` map: returns one { id, key, value } row per subject key
+  const results = [];
+  const skipIds = ["sidecards", "derivatives", "sourcedata", "code"];
+  if (skipIds.indexOf(doc._id) !== -1) return results;
+  // Only top-level keys starting with "sub-" or "Sub-" produce a row.
+  for (const subj of Object.keys(doc)) {
+    if (!/^[sS]ub-/.test(subj)) continue;
+    // Per-subject accumulators; age -0.01 and gender "N" are the "not found" defaults.
+    const sessionlist = [];
+    const modalitylist = [];
+    const tasklist = [];
+    const runlist = [];
+    const filetype = [];
+    let age = -0.01;
+    let gender = "N";
+    // Optional demographics: participants.tsv is read as column arrays indexed by row.
+    const p = doc["participants.tsv"];
+    if (p && Array.isArray(p.participant_id)) {
+      let idx = -1;
+      for (let i = 0; i < p.participant_id.length; i++) {
+        if (subj.indexOf(String(p.participant_id[i])) > -1) {
+          idx = i;
+          break;
+        }
+      }
+      // idx = first row whose participant_id is a substring of this subject key (-1 if none).
+      if (idx >= 0) {
+        for (const agekey of ["age", "age_scan", "age_at_scan"]) {
+          if (age >= 0) break;
+          if (p[agekey]) {
+            age = p[agekey][idx];
+            break;
+          } else if (p[agekey.toUpperCase()]) {
+            age = p[agekey.toUpperCase()][idx];
+            break;
+          } else {
+            const cap = agekey.charAt(0).toUpperCase() + agekey.slice(1);
+            if (p[cap]) {
+              age = p[cap]; // matches upstream view (drops [idx] here)
+              break;
+            }
+          }
+        }
+        if (age < 0) { // fallback: any column whose name contains "age"; the last match wins
+          for (const pfield of Object.keys(p)) {
+            if (pfield.toLowerCase().indexOf("age") >= 0) {
+              age = p[pfield][idx];
+            }
+          }
+        }
+        for (const sexkey of ["sex", "gender"]) {
+          if (gender !== "N") break;
+          if (p[sexkey]) {
+            gender = p[sexkey][idx];
+            break;
+          } else if (p[sexkey.toUpperCase()]) {
+            gender = p[sexkey.toUpperCase()][idx];
+            break;
+          } else {
+            const cap = sexkey.charAt(0).toUpperCase() + sexkey.slice(1);
+            if (p[cap]) {
+              gender = p[cap]; // matches upstream view (drops [idx] here)
+              break;
+            }
+          }
+        }
+        if (gender === "N") { // fallback 1: any column whose name contains "sex"
+          for (const pfield of Object.keys(p)) {
+            if (pfield.toLowerCase().indexOf("sex") >= 0) {
+              gender = p[pfield][idx];
+            }
+          }
+        }
+        if (gender === "N") { // fallback 2: any column whose name contains "gender"
+          for (const pfield of Object.keys(p)) {
+            if (pfield.toLowerCase().indexOf("gender") >= 0) {
+              gender = p[pfield][idx];
+            }
+          }
+        }
+      }
+    }
+    // parseFiles splits each file name on "_" and collects run-/task- values and file-type stems.
+    const subjDoc = doc[subj] || {};
+    const parseFiles = (container) => {
+      for (const filename of Object.keys(container || {})) {
+        for (const task of filename.split("_")) {
+          if (task.indexOf("run-") === 0) {
+            if (runlist.indexOf(task.substring(4)) === -1) {
+              runlist.push(task.substring(4));
+            }
+          } else if (task.indexOf("task-") === 0) {
+            if (tasklist.indexOf(task.substring(5)) === -1) {
+              tasklist.push(task.substring(5));
+            }
+          } else if (task.indexOf(".") > 0) {
+            const tmp = task.substring(0, task.indexOf(".")); // text before the first "."
+            if (filetype.indexOf(tmp) === -1) filetype.push(tmp);
+          }
+        }
+      }
+    };
+    // "ses-*" keys hold modality folders; any other dot-free key is itself a modality folder.
+    for (const modal of Object.keys(subjDoc)) {
+      if (modal.indexOf("ses-") === 0) {
+        if (sessionlist.indexOf(modal.substring(4)) === -1) {
+          sessionlist.push(modal.substring(4));
+        }
+        for (const modname of Object.keys(subjDoc[modal] || {})) {
+          if (
+            modname.indexOf(".") === -1 &&
+            modalitylist.indexOf(modname) === -1
+          ) {
+            modalitylist.push(modname);
+          }
+          parseFiles(subjDoc[modal][modname]);
+        }
+      } else if (
+        modal.indexOf(".") === -1 &&
+        modalitylist.indexOf(modal) === -1
+      ) {
+        modalitylist.push(modal);
+        parseFiles(subjDoc[modal]); // only reached when this modality name was not already recorded
+      }
+    }
+    // Normalise: gender -> first letter upper-cased; age -> integer hundredths (negative or non-numeric strings -> -1).
+    if (typeof gender === "string") {
+      gender = gender.substring(0, 1).toUpperCase();
+    } else {
+      gender = gender + "";
+    }
+    if (typeof age === "string" && isNaN(+age)) age = -0.001;
+    if (typeof age === "string") age = +age;
+    if (age < 0) age = -0.01;
+    age = Math.floor(age * 100);
+    // Key parts are left-padded with zeros; key[6] is the subject key without its first 4 characters.
+    results.push({
+      id: doc._id,
+      key: [
+        ("0000" + age).slice(-5),
+        ("000" + gender).slice(-4),
+        ("000" + sessionlist.length).slice(-4),
+        ("000" + modalitylist.length).slice(-4),
+        ("000" + tasklist.length).slice(-4),
+        ("000" + runlist.length).slice(-4),
+        subj.substring(4),
+      ],
+      value: {
+        sessions: sessionlist,
+        modalities: modalitylist,
+        tasks: tasklist,
+        runs: runlist,
+        types: filetype,
+      },
+    });
+  }
+
+  return results;
+}
+
+/**
+ * Local port of the upstream `links` map function: walks the document (at
+ * most 10 levels deep) and emits one row per distinct `_DataLink_` http URL.
+ */
+function transformLinks(doc) {
+  const filenameRe = /file=([^\/]*\/)*([^&\/\.]+)(\.[^.&%:]+(\.gz)*)([&:].*)*$/;
+  const filesizeRe = /size=(\d+)/;
+  const jsonpathRe = /:(\$[^&]+)/;
+  const seenUrls = new Set();
+  const rows = [];
+
+  // Emit a row for `link` unless its base URL (the text before ":$") was seen.
+  const recordLink = (link, path) => {
+    const baseUrl = link.split(":$")[0];
+    if (seenUrls.has(baseUrl)) return;
+    seenUrls.add(baseUrl);
+    const nameMatch = link.match(filenameRe);
+    const sizeMatch = link.match(filesizeRe);
+    const refMatch = link.match(jsonpathRe);
+    if (!nameMatch || !sizeMatch) return; // a row needs both file= and size=
+    rows.push({
+      id: doc._id,
+      key: [nameMatch[3], parseInt(sizeMatch[1], 10)],
+      value: {
+        path,
+        url: baseUrl,
+        file: nameMatch[2] + nameMatch[3],
+        suffix: nameMatch[3],
+        ref: refMatch === null ? null : refMatch[1],
+      },
+    });
+  };
+
+  // Depth-first walk in key order; `path` is the dotted location of `node` from "$".
+  const walk = (node, depth, path) => {
+    if (depth > 10 || node === null || typeof node !== "object") return;
+    for (const [key, child] of Object.entries(node)) {
+      const isLink =
+        key === "_DataLink_" && typeof child === "string" && child.includes("http");
+      if (isLink) {
+        recordLink(child, path);
+      } else if (typeof child === "object" && child !== null) {
+        walk(child, depth + 1, path + "." + key);
+      }
+    }
+  };
+
+  walk(doc, 1, "$");
+  return rows;
+}
+
+// === DB helpers (each accepts an optional transaction) ===
+
 async function getLastSeq(dbname) {
   try {
     const result = await sequelize.query(
       "SELECT last_seq FROM sync_state WHERE dbname = :dbname",
-      {
-        replacements: { dbname },
-        type: sequelize.QueryTypes.SELECT,
-      }
+      { replacements: { dbname }, type: sequelize.QueryTypes.SELECT }
     );
     return result[0]?.last_seq || "0";
   } catch (err) {
@@ -55,19 +315,17 @@ async function getLastSeq(dbname) {
   }
 }
 
-// save latest sequence number after sync
 async function saveLastSeq(dbname, seq) {
   await sequelize.query(
     `INSERT INTO sync_state (dbname, last_seq, synced_at)
      VALUES (:dbname, :seq, NOW())
      ON CONFLICT (dbname) DO UPDATE
      SET last_seq = :seq, synced_at = NOW()`,
-    { replacements: { dbname, seq } }
+    { replacements: { dbname, seq: String(seq) } }
   );
 }
 
-// upsert a row into ioviews
-async function upsertIoview(dbname, dsname, subj, view, json) {
+async function upsertIoview(dbname, dsname, subj, view, json, transaction) {
   await sequelize.query(
     `INSERT INTO ioviews (dbname, dsname, subj, view, json, search_vector, updated_at)
      VALUES (:dbname, :dsname, :subj, :view, :json, to_tsvector('english', :text), NOW())
@@ -84,12 +342,12 @@ async function upsertIoview(dbname, dsname, subj, view, json) {
         json: JSON.stringify(json),
         text: JSON.stringify(json),
       },
+      transaction,
     }
   );
 }
 
-// insert a row into iolinks
-async function insertIolink(dbname, dsname, subj, view, json) {
+async function insertIolink(dbname, dsname, subj, view, json, transaction) {
   await sequelize.query(
     `INSERT INTO iolinks (dbname, dsname, subj, view, json)
      VALUES (:dbname, :dsname, :subj, :view, :json)`,
@@ -101,28 +359,27 @@ async function insertIolink(dbname, dsname, subj, view, json) {
         view,
         json: JSON.stringify(json),
       },
+      transaction,
     }
   );
 }
 
-// delete all records for a dataset
-async function deleteDataset(dbname, dsname) {
+async function deleteDataset(dbname, dsname, transaction) {
   await sequelize.query(
     "DELETE FROM ioviews WHERE dbname = :dbname AND dsname = :dsname",
-    { replacements: { dbname, dsname } }
+    { replacements: { dbname, dsname }, transaction }
   );
   await sequelize.query(
     "DELETE FROM iolinks WHERE dbname = :dbname AND dsname = :dsname",
-    { replacements: { dbname, dsname } }
+    { replacements: { dbname, dsname }, transaction }
   );
-  console.log(`  Deleted ${dbname}/${dsname}`);
 }
 
-// first time sync - fetch from CouchDB views directly
+// === First-time sync (fetch all three views once) ===
+
 async function firstSync(dbname) {
   console.log(`  ${dbname}: first sync, fetching all views...`);
 
-  // fetch dbinfo view
   const dbinfoRes = await axios.get(
     `${COUCHDB_URL}/${dbname}/_design/qq/_view/dbinfo`
   );
@@ -133,7 +390,6 @@ async function firstSync(dbname) {
   }
   console.log(`  ${dbname}: dbinfo synced (${dbinfoRows.length} rows)`);
 
-  // fetch subjects view
   const subjectsRes = await axios.get(
     `${COUCHDB_URL}/${dbname}/_design/qq/_view/subjects`
   );
@@ -147,7 +403,6 @@ async function firstSync(dbname) {
   }
   console.log(`  ${dbname}: subjects synced (${subjectRows.length} rows)`);
 
-  // fetch links view
   const linksRes = await axios.get(
     `${COUCHDB_URL}/${dbname}/_design/qq/_view/links`
   );
@@ -163,89 +418,169 @@ async function firstSync(dbname) {
   console.log(`  ${dbname}: links synced (${linkRows.length} rows)`);
 }
 
-// incremental sync - only fetch changes since last sync
-async function incrementalSync(dbname, lastSeq) {
-  const { data } = await axios.get(
-    `${COUCHDB_URL}/${dbname}/_changes?since=${lastSeq}&include_docs=true`
-  );
+// === Process one changed dataset (Option A: 2 HTTP requests + local transforms) ===
 
-  if (data.results.length === 0) {
-    console.log(`  ${dbname}: no changes since last sync`);
-    return data.last_seq;
+async function processDatasetUpdate(dbname, dsname) {
+  // dbinfo view supports key filtering; raw doc carries everything else.
+  const keyParam = encodeURIComponent(JSON.stringify(dsname));
+  const [dbinfoRes, rawDocRes] = await Promise.all([
+    axios.get(
+      `${COUCHDB_URL}/${dbname}/_design/qq/_view/dbinfo?key=${keyParam}`
+    ),
+    axios.get(`${COUCHDB_URL}/${dbname}/${encodeURIComponent(dsname)}`),
+  ]);
+
+  const dbinfoRow = (dbinfoRes.data.rows || [])[0];
+  if (!dbinfoRow) {
+    console.warn(`  ${dbname}/${dsname}: no dbinfo row, skipping`);
+    return;
   }
+  const dbinfoValue = dbinfoRow.value;
+  const doc = rawDocRes.data;
 
-  console.log(`  ${dbname}: ${data.results.length} changes found`);
+  const subjectRows = transformSubjects(doc);
+  const linkRows = transformLinks(doc);
 
-  for (const change of data.results) {
-    if (change.deleted) {
-      await deleteDataset(dbname, change.id);
-      continue;
-    }
+  // Rule 1: wrap all writes for this dataset in one transaction.
+  await sequelize.transaction(async (t) => {
+    const subjCount = String(dbinfoValue?.subj?.length || 0);
+    await upsertIoview(dbname, dsname, subjCount, "dbinfo", dbinfoValue, t);
 
-    const doc = change.doc;
-    if (!doc?.value) continue;
-
-    // upsert dbinfo
-    if (doc.value.subj && Array.isArray(doc.value.subj)) {
-      const subj = String(doc.value.subj.length);
-      await upsertIoview(dbname, change.id, subj, "dbinfo", doc.value);
+    // Rule 2: empty-subjs guard. NOT IN (NULL) silently matches nothing.
+    const currentSubjs = Array.isArray(dbinfoValue?.subj)
+      ? dbinfoValue.subj
+      : [];
+    if (currentSubjs.length > 0) {
+      // subjects view stores subj without "sub-"/"Sub-" prefix
+      // (key[6] = subj.substring(4) in upstream map).
+      const currentSubjIds = currentSubjs.map((s) => s.substring(4));
+      await sequelize.query(
+        `DELETE FROM ioviews
+         WHERE dbname = :dbname AND dsname = :dsname AND view = 'subjects'
+           AND subj NOT IN (:subjs)`,
+        {
+          replacements: { dbname, dsname, subjs: currentSubjIds },
+          transaction: t,
+        }
+      );
     }
 
-    // upsert subjects
-    if (doc.value.subjects) {
-      for (const [subjId, subjData] of Object.entries(doc.value.subjects)) {
-        await upsertIoview(dbname, change.id, subjId, "subjects", {
-          key: subjData.key,
-          value: subjData.value,
-        });
-      }
+    for (const row of subjectRows) {
+      const subj = String(row.key?.[6] || "");
+      await upsertIoview(
+        dbname,
+        dsname,
+        subj,
+        "subjects",
+        { key: row.key, value: row.value },
+        t
+      );
     }
 
-    // upsert links
-    if (doc.value.links) {
-      for (const link of doc.value.links) {
-        const fileType = link.key?.[0];
-        const subjId = String(link.key?.[1] || "");
-        await insertIolink(dbname, change.id, subjId, fileType, link);
-      }
+    // iolinks: no usable upsert key, so delete + reinsert per dataset.
+    await sequelize.query(
+      "DELETE FROM iolinks WHERE dbname = :dbname AND dsname = :dsname",
+      { replacements: { dbname, dsname }, transaction: t }
+    );
+    for (const row of linkRows) {
+      const fileType = row.key?.[0];
+      const subjId = String(row.key?.[1] || "");
+      await insertIolink(
+        dbname,
+        dsname,
+        subjId,
+        fileType,
+        { key: row.key, value: row.value },
+        t
+      );
     }
+  });
+}
+
+// === Incremental sync ===
+
+/**
+ * Replays the CouchDB `_changes` feed of `dbname` since `lastSeq` and returns
+ * the feed's `last_seq`. Throws if any dataset failed, so the caller does not
+ * checkpoint past changes that were never applied (per-dataset writes are idempotent).
+ */
+async function incrementalSync(dbname, lastSeq) {
+  // No include_docs=true: docs are fetched per dataset, keeping this payload small.
+  const since = encodeURIComponent(lastSeq);
+  const { data } = await axios.get(`${COUCHDB_URL}/${dbname}/_changes?since=${since}`);
+  if (!data.results || data.results.length === 0) {
+    console.log(`  ${dbname}: no changes since last sync`);
+    return data.last_seq;
   }
 
+  const changes = data.results.filter(
+    (c) => c.id && !c.id.startsWith("_design/")
+  );
+  console.log(
+    `  ${dbname}: ${changes.length} dataset changes (raw=${data.results.length})`
+  );
+
+  // Rule 3: bounded concurrency + per-dataset try/catch so one bad dataset
+  // does not abort its siblings; failures are counted instead of dropped.
+  let failed = 0;
+  for (let i = 0; i < changes.length; i += CONCURRENCY) {
+    const chunk = changes.slice(i, i + CONCURRENCY);
+    await Promise.all(
+      chunk.map(async (change) => {
+        try {
+          if (change.deleted) {
+            await sequelize.transaction((t) => deleteDataset(dbname, change.id, t));
+            console.log(`  ${dbname}/${change.id}: deleted`);
+          } else {
+            await processDatasetUpdate(dbname, change.id);
+          }
+        } catch (err) {
+          failed += 1;
+          console.error(`  ${dbname}/${change.id}: failed - ${err.message}`);
+        }
+      })
+    );
+  }
+  if (failed > 0) throw new Error(`${failed} of ${changes.length} changes failed`);
+  // Rule 4: return last_seq from THIS response; re-fetching update_seq would skip concurrent writes.
   return data.last_seq;
 }
 
-// sync a single database
+// === Sync a single database ===
+
 async function syncDatabase(dbname) {
   console.log(`\nSyncing ${dbname}...`);
   const lastSeq = await getLastSeq(dbname);
 
   try {
+    let nextSeq;
     if (lastSeq === "0") {
+      // Rule 5: capture update_seq BEFORE firstSync. Writes during firstSync
+      // get picked up by the next incremental run.
+      const { data: info } = await axios.get(`${COUCHDB_URL}/${dbname}`);
+      const seqAtStart = String(info.update_seq);
       await firstSync(dbname);
+      nextSeq = seqAtStart;
     } else {
-      await incrementalSync(dbname, lastSeq);
+      nextSeq = await incrementalSync(dbname, lastSeq);
     }
 
-    // get and save the latest seq number
-    const { data: info } = await axios.get(`${COUCHDB_URL}/${dbname}`);
-    await saveLastSeq(dbname, String(info.update_seq));
+    await saveLastSeq(dbname, String(nextSeq));
     console.log(`  ${dbname}: sync complete ✓`);
   } catch (err) {
     console.error(`  ${dbname}: sync failed - ${err.message}`);
   }
 }
 
-// main function
+// === Main ===
+
 async function runSync() {
   console.log("=== Starting NeuroJSON sync ===");
   console.log(new Date().toISOString());
   console.log(`CouchDB: ${COUCHDB_URL}`);
-  console.log(`Databases: ${DATABASES.length}`);
 
-  // change to getDatabases() when ready for full sync
-  // const databases = await getDatabases();
+  // change to await getDatabases() when ready for full sync
   const databases = ["bfnirs"]; // testing with small database first
-
   console.log(`Databases: ${databases.length}`);
 
   for (const db of databases) {

From 9d69223b51c297bdde62abc409c6860e5601d258 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 8 May 2026 16:57:45 -0400
Subject: [PATCH 18/61] feat: add ioviews unique constraint migration and
 disable sequelize logging in dev

---
 backend/config/config.js                      |  2 +-
 ...508195500-add-ioviews-unique-constraint.js | 20 +++++++++++++++++++
 2 files changed, 21 insertions(+), 1 deletion(-)
 create mode 100644 backend/migrations/20260508195500-add-ioviews-unique-constraint.js

diff --git a/backend/config/config.js b/backend/config/config.js
index d117965..0e7d92a 100644
--- a/backend/config/config.js
+++ b/backend/config/config.js
@@ -13,7 +13,7 @@ module.exports = {
     database: "neurojson_dev",
     username: process.env.DB_USER_LOCAL,
     password: process.env.DB_PASSWORD_LOCAL,
-    logging: console.log,
+    logging: false,
   },
   test: {
     dialect: "sqlite",
diff --git a/backend/migrations/20260508195500-add-ioviews-unique-constraint.js b/backend/migrations/20260508195500-add-ioviews-unique-constraint.js
new file mode 100644
index 0000000..757397d
--- /dev/null
+++ b/backend/migrations/20260508195500-add-ioviews-unique-constraint.js
@@ -0,0 +1,20 @@
+"use strict";
+
+/** @type {import('sequelize-cli').Migration} */
+module.exports = {
+  async up(queryInterface, Sequelize) {
+    // Adds a UNIQUE constraint on (dbname, dsname, subj, view); upsertIoview's ON CONFLICT target on these columns requires it.
+    await queryInterface.addConstraint("ioviews", {
+      fields: ["dbname", "dsname", "subj", "view"],
+      type: "unique",
+      name: "ioviews_dbname_dsname_subj_view_unique",
+    });
+  },
+  // Reverts up(): removes the constraint by the same explicit name.
+  async down(queryInterface, Sequelize) {
+    await queryInterface.removeConstraint(
+      "ioviews",
+      "ioviews_dbname_dsname_subj_view_unique"
+    );
+  },
+};

From 627e59845b982d8fc2d9ea85df507ed410fdcd73 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 10:55:01 -0400
Subject: [PATCH 19/61] feat: replace CGI search with PostgreSQL query in
 searchAllDatabases controller

---
 backend/src/controllers/couchdb.controller.js | 269 ++++++++++++++----
 backend/sync/incrementalSync.js               |   7 +-
 2 files changed, 218 insertions(+), 58 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index e913ee3..f6c54c5 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -1,4 +1,5 @@
 const axios = require("axios");
+const { sequelize } = require("../config/database");
 // const COUCHDB_BASE_URL =
 //   process.env.COUCHDB_BASE_URL ||
 //   "https://cors.redoc.ly/https://neurojson.io:7777";
@@ -38,72 +39,226 @@ const getDbStats = async (req, res) => {
   }
 };
 
-// cross-database search
+// cross-database search — old version proxied to https://neurojson.org/io/search.cgi
+// kept for reference; replaced by the Postgres-backed version below.
+// const searchAllDatabases = async (req, res) => {
+//   try {
+//     const formData = req.body;
+//     const map = {
+//       keyword: "keyword",
+//       age_min: "agemin",
+//       age_max: "agemax",
+//       task_min: "taskmin",
+//       task_max: "taskmax",
+//       run_min: "runmin",
+//       run_max: "runmax",
+//       sess_min: "sessmin",
+//       sess_max: "sessmax",
+//       modality: "modality",
+//       run_name: "run",
+//       type_name: "type",
+//       session_name: "session",
+//       task_name: "task",
+//       limit: "limit",
+//       skip: "skip",
+//       count: "count",
+//       unique: "unique",
+//       gender: "gender",
+//       database: "dbname",
+//       dataset: "dsname",
+//       subject: "subname",
+//     };
+//
+//     const params = new URLSearchParams();
+//     params.append("_get", "dbname, dsname, json");
+//
+//     Object.keys(formData).forEach((key) => {
+//       let val = formData[key];
+//       if (val === "" || val === "any" || val === undefined || val === null) {
+//         return;
+//       }
+//
+//       const queryKey = map[key];
+//       if (!queryKey) return;
+//
+//       if (key.startsWith("age")) {
+//         params.append(queryKey, String(Math.floor(val * 100)).padStart(5, "0"));
+//       } else if (key === "gender") {
+//         params.append(queryKey, val[0]);
+//       } else if (key === "modality") {
+//         params.append(queryKey, val.replace(/.*\(/, "").replace(/\).*/, ""));
+//       } else {
+//         params.append(queryKey, val.toString());
+//       }
+//     });
+//
+//     const queryString = `?${params.toString()}`;
+//     const response = await axios.get(
+//       `https://cors.redoc.ly/https://neurojson.org/io/search.cgi${queryString}`,
+//       {
+//         headers: {
+//           Origin: "https://neurojson.io",
+//           "X-Requested-With": "XMLHttpRequest",
+//         },
+//       }
+//     );
+//     res.status(200).json(response.data);
+//   } catch (error) {
+//     console.error("Error searching all databases:", error.message);
+//     res.status(error.response?.status || 500).json({
+//       message: "Error searching databases",
+//       error: error.message,
+//     });
+//   }
+// };
+
+// helpers for the Postgres-backed search
+// True when a form value is an active filter (not blank, "any", or nullish).
+const isFilter = (v) => v !== "" && v !== "any" && v != null;
+// Zero-pad to a fixed width. Fractional, negative or non-numeric input is
+// coerced to a non-negative integer so string comparison orders numerically.
+function padInt(n, width) {
+  return String(Math.max(0, Math.trunc(Number(n)) || 0)).padStart(width, "0");
+}
+const pad4 = (n) => padInt(n, 4);
+const pad5 = (n) => padInt(n, 5);
+
+// cross-database search — Postgres-backed (queries ioviews)
 const searchAllDatabases = async (req, res) => {
   try {
-    const formData = req.body;
-    const map = {
-      keyword: "keyword",
-      age_min: "agemin",
-      age_max: "agemax",
-      task_min: "taskmin",
-      task_max: "taskmax",
-      run_min: "runmin",
-      run_max: "runmax",
-      sess_min: "sessmin",
-      sess_max: "sessmax",
-      modality: "modality",
-      run_name: "run",
-      type_name: "type",
-      session_name: "session",
-      task_name: "task",
-      limit: "limit",
-      skip: "skip",
-      count: "count",
-      unique: "unique",
-      gender: "gender",
-      database: "dbname",
-      dataset: "dsname",
-      subject: "subname",
-    };
+    const f = req.body || {};
+    const where = [];
+    const repl = {};
 
-    const params = new URLSearchParams();
-    params.append("_get", "dbname, dsname, json");
+    // Pick which view to search.
+    // Subject-level filters → subjects view; otherwise dbinfo.
+    const subjectFilterKeys = [
+      "age_min", "age_max", "gender",
+      "task_min", "task_max", "task_name",
+      "run_min", "run_max", "run_name",
+      "sess_min", "sess_max", "session_name",
+      "type_name", "modality", "subject",
+    ];
+    const isSubjectSearch = subjectFilterKeys.some((k) => isFilter(f[k]));
+    where.push(`view = :view`);
+    repl.view = isSubjectSearch ? "subjects" : "dbinfo";
 
-    Object.keys(formData).forEach((key) => {
-      let val = formData[key];
-      if (val === "" || val === "any" || val === undefined || val === null) {
-        return;
-      }
+    // Range filters compare against zero-padded key components.
+    // json->'key' = [age, gender, sess, mod, task, run, subjId]
+    if (isFilter(f.age_min)) {
+      where.push(`(json->'key'->>0) >= :ageMin`);
+      repl.ageMin = pad5(Math.floor(Number(f.age_min) * 100));
+    }
+    if (isFilter(f.age_max)) {
+      where.push(`(json->'key'->>0) <= :ageMax`);
+      repl.ageMax = pad5(Math.floor(Number(f.age_max) * 100));
+    }
+    if (isFilter(f.sess_min)) {
+      where.push(`(json->'key'->>2) >= :sessMin`);
+      repl.sessMin = pad4(f.sess_min);
+    }
+    if (isFilter(f.sess_max)) {
+      where.push(`(json->'key'->>2) <= :sessMax`);
+      repl.sessMax = pad4(f.sess_max);
+    }
+    if (isFilter(f.task_min)) {
+      where.push(`(json->'key'->>4) >= :taskMin`);
+      repl.taskMin = pad4(f.task_min);
+    }
+    if (isFilter(f.task_max)) {
+      where.push(`(json->'key'->>4) <= :taskMax`);
+      repl.taskMax = pad4(f.task_max);
+    }
+    if (isFilter(f.run_min)) {
+      where.push(`(json->'key'->>5) >= :runMin`);
+      repl.runMin = pad4(f.run_min);
+    }
+    if (isFilter(f.run_max)) {
+      where.push(`(json->'key'->>5) <= :runMax`);
+      repl.runMax = pad4(f.run_max);
+    }
+    if (isFilter(f.gender)) {
+      // stored as one upper-case char left-padded to 4 chars
+      where.push(`(json->'key'->>1) LIKE :gender`);
+      repl.gender = `%${String(f.gender)[0].toUpperCase()}`;
+    }
 
-      const queryKey = map[key];
-      if (!queryKey) return;
-
-      if (key.startsWith("age")) {
-        params.append(queryKey, String(Math.floor(val * 100)).padStart(5, "0"));
-      } else if (key === "gender") {
-        params.append(queryKey, val[0]);
-      } else if (key === "modality") {
-        params.append(queryKey, val.replace(/.*\(/, "").replace(/\).*/, ""));
-      } else {
-        params.append(queryKey, val.toString());
-      }
+    // Name filters — jsonb ? checks if a string is an element of the array.
+    if (isFilter(f.task_name)) {
+      where.push(`json->'value'->'tasks' ? :taskName`);
+      repl.taskName = String(f.task_name);
+    }
+    if (isFilter(f.run_name)) {
+      where.push(`json->'value'->'runs' ? :runName`);
+      repl.runName = String(f.run_name);
+    }
+    if (isFilter(f.session_name)) {
+      where.push(`json->'value'->'sessions' ? :sessName`);
+      repl.sessName = String(f.session_name);
+    }
+    if (isFilter(f.type_name)) {
+      where.push(`json->'value'->'types' ? :typeName`);
+      repl.typeName = String(f.type_name);
+    }
+    if (isFilter(f.modality)) {
+      // form sometimes wraps as "fNIRS (nirs)" — pull text inside parens
+      const mod = String(f.modality).replace(/.*\(/, "").replace(/\).*/, "");
+      where.push(`json->'value'->'modalities' ? :modality`);
+      repl.modality = mod;
+    }
+
+    // db / ds / subj filters
+    if (isFilter(f.database)) {
+      where.push(`dbname = :dbname`);
+      repl.dbname = String(f.database);
+    }
+    if (isFilter(f.dataset)) {
+      where.push(`dsname = :dsname`);
+      repl.dsname = String(f.dataset);
+    }
+    if (isFilter(f.subject)) {
+      where.push(`subj = :subj`);
+      repl.subj = String(f.subject);
+    }
+
+    // Keyword full-text search
+    if (isFilter(f.keyword)) {
+      where.push(`search_vector @@ websearch_to_tsquery('english', :keyword)`);
+      repl.keyword = String(f.keyword);
+    }
+
+    // Clamp paging to sane bounds — Postgres rejects a negative LIMIT/OFFSET.
+    const limit = Math.min(Math.max(parseInt(f.limit, 10) || 100, 1), 1000);
+    repl.limit = limit;
+    repl.offset = Math.max(parseInt(f.skip, 10) || 0, 0);
+
+    // dbinfo was stored flat ({name, subj, ...}); subjects was stored wrapped
+    // ({key, value}). Frontend expects parsed.value.subj for datasets, so we
+    // wrap dbinfo on the way out.
+    const sql = `
+      SELECT
+        dbname,
+        dsname,
+        subj,
+        CASE
+          WHEN view = 'dbinfo' THEN jsonb_build_object('value', json)::text
+          ELSE json::text
+        END AS json
+      FROM ioviews
+      WHERE ${where.join(" AND ")}
+      ORDER BY dbname, dsname, subj
+      LIMIT :limit OFFSET :offset
+    `;
+
+    const rows = await sequelize.query(sql, {
+      replacements: repl,
+      type: sequelize.QueryTypes.SELECT,
     });
 
-    const queryString = `?${params.toString()}`;
-    const response = await axios.get(
-      `https://cors.redoc.ly/https://neurojson.org/io/search.cgi${queryString}`,
-      {
-        headers: {
-          Origin: "https://neurojson.io",
-          "X-Requested-With": "XMLHttpRequest",
-        },
-      }
-    );
-    res.status(200).json(response.data);
+    res.status(200).json(rows);
   } catch (error) {
     console.error("Error searching all databases:", error.message);
-    res.status(error.response?.status || 500).json({
+    res.status(500).json({
       message: "Error searching databases",
       error: error.message,
     });
diff --git a/backend/sync/incrementalSync.js b/backend/sync/incrementalSync.js
index 5a73c42..c6ab7c7 100644
--- a/backend/sync/incrementalSync.js
+++ b/backend/sync/incrementalSync.js
@@ -580,7 +580,12 @@ async function runSync() {
   console.log(`CouchDB: ${COUCHDB_URL}`);
 
   // change to await getDatabases() when ready for full sync
-  const databases = ["bfnirs"]; // testing with small database first
+  const databases = [
+    "bfnirs",           // NIRS — .snirf, .jdb
+    "brainmeshlibrary", // mesh + atlas — .jmsh, .jnii (318 datasets)
+    "cotilab",          // JData — small (6 datasets)
+    "abide",            // BIDS MRI — .nii.gz, .tsv, .json (25 datasets)
+  ];
   console.log(`Databases: ${databases.length}`);
 
   for (const db of databases) {

From 207c6340728045f5853fc6ce457cc68473927c9c Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 11:25:31 -0400
Subject: [PATCH 20/61] fix: widen ioviews and iolinks text columns to handle
 longer values

---
 ...5900-widen-ioviews-iolinks-text-columns.js | 60 +++++++++++++++++++
 backend/sync/incrementalSync.js               | 32 ++++++----
 2 files changed, 80 insertions(+), 12 deletions(-)
 create mode 100644 backend/migrations/20260511145900-widen-ioviews-iolinks-text-columns.js

diff --git a/backend/migrations/20260511145900-widen-ioviews-iolinks-text-columns.js b/backend/migrations/20260511145900-widen-ioviews-iolinks-text-columns.js
new file mode 100644
index 0000000..c6cbe81
--- /dev/null
+++ b/backend/migrations/20260511145900-widen-ioviews-iolinks-text-columns.js
@@ -0,0 +1,35 @@
+"use strict";
+
+// [table, column, original VARCHAR width, allowNull] for every widened column.
+const COLUMNS = [
+  ["ioviews", "dbname", 30, true],
+  ["ioviews", "dsname", 30, true],
+  ["ioviews", "subj", 12, true],
+  ["iolinks", "dbname", 30, true],
+  ["iolinks", "dsname", 30, true],
+  ["sync_state", "dbname", 30, false],
+];
+
+// Runs changeColumn for each entry, in order, with the type chosen by typeFor.
+async function retype(queryInterface, typeFor) {
+  for (const [table, column, width, allowNull] of COLUMNS) {
+    await queryInterface.changeColumn(table, column, {
+      type: typeFor(width),
+      allowNull,
+    });
+  }
+}
+
+/** @type {import('sequelize-cli').Migration} */
+module.exports = {
+  // VARCHAR(n) → TEXT is a metadata-only change in Postgres (no table rewrite,
+  // no need to drop the unique constraint or indexes).
+  async up(queryInterface, Sequelize) {
+    await retype(queryInterface, () => Sequelize.TEXT);
+  },
+
+  // Puts each column back to its original VARCHAR width.
+  async down(queryInterface, Sequelize) {
+    await retype(queryInterface, (width) => Sequelize.STRING(width));
+  },
+};
diff --git a/backend/sync/incrementalSync.js b/backend/sync/incrementalSync.js
index c6ab7c7..b9e497a 100644
--- a/backend/sync/incrementalSync.js
+++ b/backend/sync/incrementalSync.js
@@ -377,23 +377,34 @@ async function deleteDataset(dbname, dsname, transaction) {
 
 // === First-time sync (fetch all three views once) ===
 
+// Returns the rows of one view under the `qq` design doc of `dbname`.
+// A 404 is read as "this DB has no such view" and yields [] — non-BIDS DBs
+// (e.g. brainmeshlibrary) only have the dbinfo view. Any other error is
+// rethrown to the caller.
+async function fetchView(dbname, viewName) {
+  const url = `${COUCHDB_URL}/${dbname}/_design/qq/_view/${viewName}`;
+  try {
+    const { data } = await axios.get(url);
+    return data.rows || [];
+  } catch (err) {
+    const viewMissing = err.response?.status === 404;
+    if (!viewMissing) throw err;
+    console.log(`  ${dbname}: view '${viewName}' not present, skipping`);
+    return [];
+  }
+}
+
 async function firstSync(dbname) {
   console.log(`  ${dbname}: first sync, fetching all views...`);
 
-  const dbinfoRes = await axios.get(
-    `${COUCHDB_URL}/${dbname}/_design/qq/_view/dbinfo`
-  );
-  const dbinfoRows = dbinfoRes.data.rows || [];
+  const dbinfoRows = await fetchView(dbname, "dbinfo");
   for (const row of dbinfoRows) {
     const subj = String(row.value?.subj?.length || 0);
     await upsertIoview(dbname, row.id, subj, "dbinfo", row.value);
   }
   console.log(`  ${dbname}: dbinfo synced (${dbinfoRows.length} rows)`);
 
-  const subjectsRes = await axios.get(
-    `${COUCHDB_URL}/${dbname}/_design/qq/_view/subjects`
-  );
-  const subjectRows = subjectsRes.data.rows || [];
+  const subjectRows = await fetchView(dbname, "subjects");
   for (const row of subjectRows) {
     const subj = String(row.key?.[6] || "");
     await upsertIoview(dbname, row.id, subj, "subjects", {
@@ -403,10 +414,7 @@ async function firstSync(dbname) {
   }
   console.log(`  ${dbname}: subjects synced (${subjectRows.length} rows)`);
 
-  const linksRes = await axios.get(
-    `${COUCHDB_URL}/${dbname}/_design/qq/_view/links`
-  );
-  const linkRows = linksRes.data.rows || [];
+  const linkRows = await fetchView(dbname, "links");
   for (const row of linkRows) {
     const fileType = row.key?.[0];
     const subjId = String(row.key?.[1] || "");

From 4490af6c2060d0b732cb8de106ae158cfbdde77e Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 11:44:02 -0400
Subject: [PATCH 21/61] fix: make suggested databases refresh on Search click

---
 src/pages/SearchPage.tsx | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index 8e35494..b0479af 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -91,9 +91,10 @@ const SearchPage: React.FC = () => {
 
   const placement = upMd ? "right" : "top";
 
-  // for database card
-  const keywordInput = String(formData?.keyword ?? "").trim();
-  const selectedDbId = String(formData?.database ?? "").trim();
+  // inputs for the "Suggested databases" memo — read from appliedFilters so
+  // the suggestion list refreshes only on Search click, matching the results.
+  const keywordInput = String(appliedFilters?.keyword ?? "").trim();
+  const selectedDbId = String(appliedFilters?.database ?? "").trim();
 
   const registryMatches: RegistryItem[] = React.useMemo(() => {
     if (!Array.isArray(registry)) return [];
@@ -635,10 +636,9 @@ const SearchPage: React.FC = () => {
                     }}
                     title={
                       <Typography variant="body2">
-                        Live preview based on your keyword or selected database.
-                        This list updates as you type or change the dropdown.
-                        It’s <strong>separate from the results</strong>—you’ll
-                        see datasets/subjects after you click <em>Search</em>.
+                        Databases that match your keyword or selected database
+                        filter. This list refreshes when you click{" "}
+                        <em>Search</em>, alongside the datasets/subjects below.
                       </Typography>
                     }
                   >
@@ -668,7 +668,7 @@ const SearchPage: React.FC = () => {
                       datasets={db.datasets}
                       modalities={db.datatype}
                       logo={db.logo}
-                      keyword={formData.keyword} // for keyword highlight
+                      keyword={appliedFilters.keyword} // highlight the searched keyword, not the live input
                       onChipClick={handleChipClick}
                     />
                   ))}

From 5966b0957e5e02fec0c83bcf1ff2e00514ea64ea Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 13:54:32 -0400
Subject: [PATCH 22/61] feat: modality-aware combobox for Data type filter

---
 .../widgets/TypeAutocompleteWidget.tsx        | 27 +++++++++++++++
 src/pages/SearchPage.tsx                      |  5 +++
 .../SearchPageFunctions/generateUiSchema.ts   | 15 +++++---
 .../SearchPageFunctions/searchformSchema.ts   |  2 +-
 .../SearchPageFunctions/typesByModality.ts    | 34 +++++++++++++++++++
 5 files changed, 78 insertions(+), 5 deletions(-)
 create mode 100644 src/components/SearchPage/widgets/TypeAutocompleteWidget.tsx
 create mode 100644 src/utils/SearchPageFunctions/typesByModality.ts

diff --git a/src/components/SearchPage/widgets/TypeAutocompleteWidget.tsx b/src/components/SearchPage/widgets/TypeAutocompleteWidget.tsx
new file mode 100644
index 0000000..b0573fc
--- /dev/null
+++ b/src/components/SearchPage/widgets/TypeAutocompleteWidget.tsx
@@ -0,0 +1,31 @@
+import { Autocomplete, TextField } from "@mui/material";
+import { WidgetProps } from "@rjsf/utils";
+
+// Free-solo combobox for the data-type filter: the user can type any text or
+// pick one of the modality-specific suggestions supplied through ui:options.
+export const TypeAutocompleteWidget = (props: WidgetProps) => {
+  const { value, onChange, options, label, placeholder } = props;
+  const choices = (options.suggestions as string[]) || [];
+  // Forward strings unchanged; a cleared (null) selection is reported as "".
+  const emit = (next: unknown) =>
+    onChange(typeof next === "string" ? next : "");
+
+  return (
+    <Autocomplete
+      freeSolo
+      options={choices}
+      value={value || ""}
+      onChange={(_, picked) => emit(picked)}
+      onInputChange={(_, typed) => emit(typed)}
+      renderInput={(inputParams) => (
+        <TextField
+          {...inputParams}
+          label={label}
+          placeholder={placeholder || "e.g. bold, T1w"}
+          size="small"
+          fullWidth
+        />
+      )}
+    />
+  );
+};
diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index b0479af..cfd7fd7 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -22,6 +22,7 @@ import ClickTooltip from "components/SearchPage/ClickTooltip";
 import DatabaseCard from "components/SearchPage/DatabaseCard";
 import DatasetCard from "components/SearchPage/DatasetCard";
 import SubjectCard from "components/SearchPage/SubjectCard";
+import { TypeAutocompleteWidget } from "components/SearchPage/widgets/TypeAutocompleteWidget";
 import { Colors } from "design/theme";
 import { useAppDispatch } from "hooks/useAppDispatch";
 import { useAppSelector } from "hooks/useAppSelector";
@@ -212,6 +213,9 @@ const SearchPage: React.FC = () => {
     [formData, showSubjectFilters, showDatasetFilters]
   );
 
+  // Custom RJSF widgets — combobox for the "Data type keywords" field.
+  const customWidgets = { typeAutocomplete: TypeAutocompleteWidget };
+
   // Create the "Subject-level Filters" button as a custom field
   const customFields = {
     subjectFiltersToggle: () => (
@@ -401,6 +405,7 @@ const SearchPage: React.FC = () => {
         onChange={({ formData }) => setFormData(formData)}
         uiSchema={uiSchema}
         fields={customFields}
+        widgets={customWidgets}
       />
     </>
   );
diff --git a/src/utils/SearchPageFunctions/generateUiSchema.ts b/src/utils/SearchPageFunctions/generateUiSchema.ts
index f352a23..7b54428 100644
--- a/src/utils/SearchPageFunctions/generateUiSchema.ts
+++ b/src/utils/SearchPageFunctions/generateUiSchema.ts
@@ -1,4 +1,5 @@
 import { Colors } from "design/theme";
+import { getTypeSuggestions } from "./typesByModality";
 
 // Controls the background highlight of selected fields
 // Controls the visibility of subject-level filters
@@ -52,6 +53,7 @@ export const generateUiSchema = (
       "keyword",
       "subject_filters_toggle",
       "modality",
+      "type_name", // sits right after modality — its options depend on it
       "gender",
       "age_min",
       "age_max",
@@ -62,7 +64,6 @@ export const generateUiSchema = (
       "run_min",
       "run_max",
       "task_name",
-      "type_name",
       "session_name",
       "run_name",
       "limit",
@@ -156,9 +157,15 @@ export const generateUiSchema = (
         : {}
       : hiddenStyle,
     type_name: showSubjectFilters
-      ? formData["type_name"]
-        ? activeStyle
-        : {}
+      ? {
+          "ui:widget": "typeAutocomplete",
+          "ui:options": {
+            suggestions: getTypeSuggestions(formData.modality),
+            ...(formData["type_name"]
+              ? { style: { backgroundColor: Colors.lightBlue } }
+              : {}),
+          },
+        }
       : hiddenStyle,
     session_name: showSubjectFilters
       ? formData["session_name"]
diff --git a/src/utils/SearchPageFunctions/searchformSchema.ts b/src/utils/SearchPageFunctions/searchformSchema.ts
index 7fc71b5..ead7855 100644
--- a/src/utils/SearchPageFunctions/searchformSchema.ts
+++ b/src/utils/SearchPageFunctions/searchformSchema.ts
@@ -118,7 +118,7 @@ export const baseSchema: JSONSchema7 = {
       type: "string",
     },
     type_name: {
-      title: "Data type keywords",
+      title: "Data type",
       type: "string",
     },
     session_name: {
diff --git a/src/utils/SearchPageFunctions/typesByModality.ts b/src/utils/SearchPageFunctions/typesByModality.ts
new file mode 100644
index 0000000..090475d
--- /dev/null
+++ b/src/utils/SearchPageFunctions/typesByModality.ts
@@ -0,0 +1,43 @@
+// Common BIDS suffixes grouped by modality.
+// Extend the lists as you find missing values in your data.
+export const TYPES_BY_MODALITY: Record<string, string[]> = {
+  anat: ["T1w", "T2w", "FLAIR", "T2star", "PD", "angio", "defacemask"],
+  func: ["bold", "sbref", "events", "physio", "stim"],
+  dwi: ["dwi", "sbref"],
+  fmap: ["phasediff", "magnitude1", "magnitude2", "fieldmap", "epi"],
+  meg: ["meg", "channels", "coordsystem", "headshape", "events"],
+  eeg: ["eeg", "channels", "electrodes", "coordsystem", "events"],
+  ieeg: ["ieeg", "channels", "electrodes", "coordsystem", "events"],
+  pet: ["pet", "blood", "events"],
+  nirs: ["nirs", "channels", "optodes", "coordsystem", "events"],
+  beh: ["beh", "events"],
+  motion: ["motion", "channels", "events"],
+  perf: ["asl", "m0scan"],
+  micr: ["TEM", "SEM", "MRM"],
+};
+
+// The modality form field stores values like "fMRI (func)" — extract the
+// suffix inside the parens so we can look it up in TYPES_BY_MODALITY.
+// Returns null for an empty value or "any"; a value without parentheses is
+// returned unchanged.
+export function getModalityKey(modalityValue?: string): string | null {
+  if (!modalityValue || modalityValue === "any") return null;
+  const m = modalityValue.match(/\(([^)]+)\)/);
+  return m ? m[1] : modalityValue;
+}
+
+// Suggestions for the data-type combobox. No modality (or "any") → every
+// known suffix, deduped and sorted; a known modality → its list (the array
+// stored in TYPES_BY_MODALITY, so treat it as read-only); anything else → [].
+export function getTypeSuggestions(modalityValue?: string): string[] {
+  const key = getModalityKey(modalityValue);
+  if (!key) {
+    // No modality picked → show all suffixes deduped and sorted.
+    return Array.from(new Set(Object.values(TYPES_BY_MODALITY).flat())).sort();
+  }
+  // Own-property lookup: keys like "constructor" or "toString" must not
+  // resolve to members inherited from Object.prototype.
+  return Object.prototype.hasOwnProperty.call(TYPES_BY_MODALITY, key)
+    ? TYPES_BY_MODALITY[key]
+    : [];
+}

From d101e5cd64b0f6c4ce582c4cf4eec1ae2cf340b7 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 14:54:30 -0400
Subject: [PATCH 23/61] feat(search): add draggable age-range slider at top of
 subject filters

---
 src/pages/SearchPage.tsx                      | 58 +++++++++++++++++++
 .../SearchPageFunctions/generateUiSchema.ts   | 19 +++---
 .../SearchPageFunctions/searchformSchema.ts   |  4 ++
 3 files changed, 71 insertions(+), 10 deletions(-)

diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index cfd7fd7..e9ac04d 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -13,6 +13,7 @@ import {
   Tooltip,
   IconButton,
   Alert,
+  Slider,
 } from "@mui/material";
 import { useTheme } from "@mui/material/styles";
 import useMediaQuery from "@mui/material/useMediaQuery";
@@ -46,6 +47,60 @@ type RegistryItem = {
   logo?: string;
 };
 
+// AgeRangeSliderField: RJSF custom field that edits age_min/age_max through
+// registry.formContext. Module-scope so its identity is stable across SearchPage
+// renders — an inline arrow in customFields made RJSF remount the slider mid-drag.
+const AGE_MIN_BOUND = 0;
+const AGE_MAX_BOUND = 100;
+
+const AgeRangeSliderField = (props: any) => {
+  const ctx = props?.registry?.formContext as
+    | {
+        formData: Record<string, any>;
+        setFormData: React.Dispatch<React.SetStateAction<Record<string, any>>>;
+      }
+    | undefined;
+  if (!ctx) return null; // no formContext supplied → render nothing
+  const { formData, setFormData } = ctx;
+  const lo =
+    typeof formData.age_min === "number" ? formData.age_min : AGE_MIN_BOUND;
+  const hi =
+    typeof formData.age_max === "number" ? formData.age_max : AGE_MAX_BOUND;
+  const isAny = lo === AGE_MIN_BOUND && hi === AGE_MAX_BOUND; // full range → label "Any"
+  return (
+    <Box sx={{ px: 2, mt: 2, mb: 1, width: "100%" }}>
+      <Typography variant="body2" sx={{ mb: 1 }}>
+        Age: {isAny ? "Any" : `${lo} – ${hi}`}
+      </Typography>
+      <Slider
+        value={[lo, hi]}
+        onChange={(_, v) => {
+          const [newLo, newHi] = v as number[];
+          setFormData((prev) => {
+            const atFull =
+              newLo === AGE_MIN_BOUND && newHi === AGE_MAX_BOUND;
+            const next = { ...prev }; // copy so the previous state is not mutated
+            if (atFull) {
+              delete next.age_min; // full range: drop both keys from formData
+              delete next.age_max;
+            } else {
+              next.age_min = newLo;
+              next.age_max = newHi;
+            }
+            return next;
+          });
+        }}
+        valueLabelDisplay="auto"
+        min={AGE_MIN_BOUND}
+        max={AGE_MAX_BOUND}
+        step={1}
+        disableSwap
+        sx={{ color: Colors.purple }}
+      />
+    </Box>
+  );
+};
+
 const matchesKeyword = (item: RegistryItem, keyword: string) => {
   if (!keyword) return false;
   const needle = keyword.toLowerCase();
@@ -252,6 +307,7 @@ const SearchPage: React.FC = () => {
         </Button>
       </Box>
     ),
+    ageRangeSlider: AgeRangeSliderField,
   };
 
   // determine the results are subject-level or dataset-level
@@ -406,6 +462,7 @@ const SearchPage: React.FC = () => {
         uiSchema={uiSchema}
         fields={customFields}
         widgets={customWidgets}
+        formContext={{ formData, setFormData }}
       />
     </>
   );
@@ -847,6 +904,7 @@ const SearchPage: React.FC = () => {
                                   {...item}
                                   parsedJson={parsedJson}
                                   onChipClick={handleChipClick}
+                                  age={parsedJson?.key?.[0]}
                                 />
                               );
                             } catch (e) {
diff --git a/src/utils/SearchPageFunctions/generateUiSchema.ts b/src/utils/SearchPageFunctions/generateUiSchema.ts
index 7b54428..d604b5f 100644
--- a/src/utils/SearchPageFunctions/generateUiSchema.ts
+++ b/src/utils/SearchPageFunctions/generateUiSchema.ts
@@ -52,10 +52,11 @@ export const generateUiSchema = (
       "database",
       "keyword",
       "subject_filters_toggle",
+      "age_range_slider", // top of subject filters — range slider for age
       "modality",
       "type_name", // sits right after modality — its options depend on it
       "gender",
-      "age_min",
+      "age_min", // hidden via invisibleStyle; written by the slider above
       "age_max",
       "sess_min",
       "sess_max",
@@ -101,16 +102,14 @@ export const generateUiSchema = (
         : {}
       : hiddenStyle,
 
-    age_min: showSubjectFilters
-      ? formData["age_min"]
-        ? activeStyle
-        : {}
-      : hiddenStyle,
-    age_max: showSubjectFilters
-      ? formData["age_max"]
-        ? activeStyle
-        : {}
+    // Age range — slider lives inside the form via the AgeRangeSliderField
+    // stable component. age_min/age_max stay in the schema (so the backend
+    // gets them on submit) but their default numeric inputs are hidden.
+    age_range_slider: showSubjectFilters
+      ? { "ui:field": "ageRangeSlider" }
       : hiddenStyle,
+    age_min: invisibleStyle,
+    age_max: invisibleStyle,
 
     gender: showSubjectFilters
       ? formData["gender"] && formData["gender"] !== "any"
diff --git a/src/utils/SearchPageFunctions/searchformSchema.ts b/src/utils/SearchPageFunctions/searchformSchema.ts
index ead7855..bcba6d7 100644
--- a/src/utils/SearchPageFunctions/searchformSchema.ts
+++ b/src/utils/SearchPageFunctions/searchformSchema.ts
@@ -64,6 +64,10 @@ export const baseSchema: JSONSchema7 = {
       enum: ["male", "female", "unknown", "any"],
       default: "any",
     },
+    age_range_slider: {
+      type: "null",
+      title: "Age range",
+    },
     age_min: {
       title: "Minimum age",
       type: "number",

From 88474cc4caf485da90a6a5ea366f69f208210ef3 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 15:05:54 -0400
Subject: [PATCH 24/61] feat(search): add placeholder hints to task/session/run
 keyword fields

---
 .../SearchPageFunctions/generateUiSchema.ts   | 21 +++++++++++--------
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/src/utils/SearchPageFunctions/generateUiSchema.ts b/src/utils/SearchPageFunctions/generateUiSchema.ts
index d604b5f..e27d02c 100644
--- a/src/utils/SearchPageFunctions/generateUiSchema.ts
+++ b/src/utils/SearchPageFunctions/generateUiSchema.ts
@@ -151,9 +151,10 @@ export const generateUiSchema = (
       : hiddenStyle,
 
     task_name: showSubjectFilters
-      ? formData["task_name"]
-        ? activeStyle
-        : {}
+      ? {
+          "ui:placeholder": "e.g. rest, motor",
+          ...(formData["task_name"] ? activeStyle : {}),
+        }
       : hiddenStyle,
     type_name: showSubjectFilters
       ? {
@@ -167,14 +168,16 @@ export const generateUiSchema = (
         }
       : hiddenStyle,
     session_name: showSubjectFilters
-      ? formData["session_name"]
-        ? activeStyle
-        : {}
+      ? {
+          "ui:placeholder": "e.g. 01, pre, baseline",
+          ...(formData["session_name"] ? activeStyle : {}),
+        }
       : hiddenStyle,
     run_name: showSubjectFilters
-      ? formData["run_name"]
-        ? activeStyle
-        : {}
+      ? {
+          "ui:placeholder": "e.g. 01, 02",
+          ...(formData["run_name"] ? activeStyle : {}),
+        }
       : hiddenStyle,
 
     "ui:submitButtonOptions": {

From b9be29f248103c4c44e743c7274cb501d5c1b407 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 15:18:23 -0400
Subject: [PATCH 25/61] feat(search): pair min/max count fields on one row and
 tighten gaps (sessions, tasks, and runs)

---
 src/pages/SearchPage.tsx                      | 60 +++++++++++++++
 .../SearchPageFunctions/generateUiSchema.ts   | 76 +++++++++++--------
 .../SearchPageFunctions/searchformSchema.ts   |  3 +
 3 files changed, 106 insertions(+), 33 deletions(-)

diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index e9ac04d..ca5d1c4 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -14,6 +14,8 @@ import {
   IconButton,
   Alert,
   Slider,
+  Stack,
+  TextField,
 } from "@mui/material";
 import { useTheme } from "@mui/material/styles";
 import useMediaQuery from "@mui/material/useMediaQuery";
@@ -101,6 +103,63 @@ const AgeRangeSliderField = (props: any) => {
   );
 };
 
+// Pairs a "<key>_min" + "<key>_max" into a single row of two number inputs.
+// Reads target field names + label from uiSchema's ui:options:
+//   { minKey: "sess_min", maxKey: "sess_max", label: "sessions" }
+const CountRangePairField = (props: any) => {
+  const ctx = props?.registry?.formContext as
+    | {
+        formData: Record<string, any>;
+        setFormData: React.Dispatch<React.SetStateAction<Record<string, any>>>;
+      }
+    | undefined;
+  const opts = props?.uiSchema?.["ui:options"] || {};
+  const minKey = opts.minKey as string;
+  const maxKey = opts.maxKey as string;
+  const label = (opts.label as string) || "";
+  if (!ctx || !minKey || !maxKey) return null;
+  const { formData, setFormData } = ctx;
+  const minVal = formData[minKey] ?? "";
+  const maxVal = formData[maxKey] ?? "";
+
+  const update = (key: string, raw: string) => {
+    setFormData((prev) => {
+      const next = { ...prev };
+      if (raw === "" || raw === undefined) {
+        delete next[key];
+      } else {
+        const n = Number(raw);
+        if (Number.isNaN(n)) delete next[key];
+        else next[key] = n;
+      }
+      return next;
+    });
+  };
+
+  return (
+    <Stack direction="row" spacing={2} sx={{ mt: 1, mb: 1 }}>
+      <TextField
+        label={`Min ${label}`}
+        type="number"
+        size="small"
+        value={minVal}
+        onChange={(e) => update(minKey, e.target.value)}
+        fullWidth
+        inputProps={{ min: 0 }}
+      />
+      <TextField
+        label={`Max ${label}`}
+        type="number"
+        size="small"
+        value={maxVal}
+        onChange={(e) => update(maxKey, e.target.value)}
+        fullWidth
+        inputProps={{ min: 0 }}
+      />
+    </Stack>
+  );
+};
+
 const matchesKeyword = (item: RegistryItem, keyword: string) => {
   if (!keyword) return false;
   const needle = keyword.toLowerCase();
@@ -308,6 +367,7 @@ const SearchPage: React.FC = () => {
       </Box>
     ),
     ageRangeSlider: AgeRangeSliderField,
+    countRangePair: CountRangePairField,
   };
 
   // determine the results are subject-level or dataset-level
diff --git a/src/utils/SearchPageFunctions/generateUiSchema.ts b/src/utils/SearchPageFunctions/generateUiSchema.ts
index e27d02c..872accb 100644
--- a/src/utils/SearchPageFunctions/generateUiSchema.ts
+++ b/src/utils/SearchPageFunctions/generateUiSchema.ts
@@ -16,13 +16,11 @@ export const generateUiSchema = (
     },
   };
 
-  // hide subject-level filter
+  // Fully remove a field from the rendered DOM (keeps its value in formData).
+  // Using ui:widget: "hidden" produces just an <input type="hidden">, so no
+  // empty Grid row + margin is left behind — fixes the big gap between rows.
   const invisibleStyle = {
-    "ui:options": {
-      style: {
-        display: "none",
-      },
-    },
+    "ui:widget": "hidden",
   };
 
   const hiddenStyle = {
@@ -58,10 +56,13 @@ export const generateUiSchema = (
       "gender",
       "age_min", // hidden via invisibleStyle; written by the slider above
       "age_max",
+      "sess_count_range", // sessions min/max on one row
       "sess_min",
       "sess_max",
+      "task_count_range", // tasks min/max on one row
       "task_min",
       "task_max",
+      "run_count_range", // runs min/max on one row
       "run_min",
       "run_max",
       "task_name",
@@ -117,38 +118,47 @@ export const generateUiSchema = (
         : {}
       : hiddenStyle,
 
-    sess_min: showSubjectFilters
-      ? formData["sess_min"]
-        ? activeStyle
-        : {}
-      : hiddenStyle,
-    sess_max: showSubjectFilters
-      ? formData["sess_max"]
-        ? activeStyle
-        : {}
+    // Session / task / run min+max pairs are rendered by a single
+    // CountRangePairField each. The raw integer inputs are hidden but stay in
+    // formData so the backend still receives them on submit.
+    sess_count_range: showSubjectFilters
+      ? {
+          "ui:field": "countRangePair",
+          "ui:options": {
+            minKey: "sess_min",
+            maxKey: "sess_max",
+            label: "sessions",
+          },
+        }
       : hiddenStyle,
+    sess_min: invisibleStyle,
+    sess_max: invisibleStyle,
 
-    task_min: showSubjectFilters
-      ? formData["task_min"]
-        ? activeStyle
-        : {}
-      : hiddenStyle,
-    task_max: showSubjectFilters
-      ? formData["task_max"]
-        ? activeStyle
-        : {}
+    task_count_range: showSubjectFilters
+      ? {
+          "ui:field": "countRangePair",
+          "ui:options": {
+            minKey: "task_min",
+            maxKey: "task_max",
+            label: "tasks",
+          },
+        }
       : hiddenStyle,
+    task_min: invisibleStyle,
+    task_max: invisibleStyle,
 
-    run_min: showSubjectFilters
-      ? formData["run_min"]
-        ? activeStyle
-        : {}
-      : hiddenStyle,
-    run_max: showSubjectFilters
-      ? formData["run_max"]
-        ? activeStyle
-        : {}
+    run_count_range: showSubjectFilters
+      ? {
+          "ui:field": "countRangePair",
+          "ui:options": {
+            minKey: "run_min",
+            maxKey: "run_max",
+            label: "runs",
+          },
+        }
       : hiddenStyle,
+    run_min: invisibleStyle,
+    run_max: invisibleStyle,
 
     task_name: showSubjectFilters
       ? {
diff --git a/src/utils/SearchPageFunctions/searchformSchema.ts b/src/utils/SearchPageFunctions/searchformSchema.ts
index bcba6d7..34abc4a 100644
--- a/src/utils/SearchPageFunctions/searchformSchema.ts
+++ b/src/utils/SearchPageFunctions/searchformSchema.ts
@@ -81,6 +81,7 @@ export const baseSchema: JSONSchema7 = {
       maximum: 1000,
     },
 
+    sess_count_range: { type: "null", title: "Sessions" },
     sess_min: {
       title: "Minimum session count",
       type: "integer",
@@ -93,6 +94,7 @@ export const baseSchema: JSONSchema7 = {
       minimum: 0,
       maximum: 1000,
     },
+    task_count_range: { type: "null", title: "Tasks" },
     task_min: {
       title: "Minimum task count",
       type: "integer",
@@ -105,6 +107,7 @@ export const baseSchema: JSONSchema7 = {
       minimum: 0,
       maximum: 1000,
     },
+    run_count_range: { type: "null", title: "Runs" },
     run_min: {
       title: "Minimum runs",
       type: "integer",

From df73e1cbc0e2f61fe1c41c006a6dd08088d1871c Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 11 May 2026 15:31:47 -0400
Subject: [PATCH 26/61] feat(search): show run count in subject card

Also removes the "unknown" option from the gender enum in the search form
schema.

---
 src/components/SearchPage/SubjectCard.tsx         | 9 ++++++++-
 src/utils/SearchPageFunctions/searchformSchema.ts | 2 +-
 2 files changed, 9 insertions(+), 2 deletions(-)

diff --git a/src/components/SearchPage/SubjectCard.tsx b/src/components/SearchPage/SubjectCard.tsx
index c66ebce..f805b48 100644
--- a/src/components/SearchPage/SubjectCard.tsx
+++ b/src/components/SearchPage/SubjectCard.tsx
@@ -16,6 +16,7 @@ interface SubjectCardProps {
       modalities?: string[];
       tasks?: string[];
       sessions?: string[];
+      runs?: string[];
       types?: string[];
     };
   };
@@ -32,7 +33,8 @@ const SubjectCard: React.FC<SubjectCardProps> = ({
   index,
   onChipClick,
 }) => {
-  const { modalities, tasks, sessions, types } = parsedJson.value;
+  const { modalities, tasks, sessions, runs, types } = parsedJson.value;
+  const runCount = Array.isArray(runs) ? runs.length : 0;
   const subjectLink = `${RoutesEnum.DATABASES}/${dbname}/${dsname}`;
   const formattedSubj = /^sub-/i.test(subj) ? subj : `sub-${String(subj)}`;
 
@@ -229,6 +231,11 @@ const SubjectCard: React.FC<SubjectCardProps> = ({
               {sessions?.length === 0 ? 1 : sessions?.length}
             </Typography>
           </Stack>
+          <Stack direction="row" spacing={1} flexWrap="wrap" gap={1}>
+            <Typography variant="body2" mt={1}>
+              <strong>Runs:</strong> {runCount}
+            </Typography>
+          </Stack>
         </Stack>
       </CardContent>
     </Card>
diff --git a/src/utils/SearchPageFunctions/searchformSchema.ts b/src/utils/SearchPageFunctions/searchformSchema.ts
index 34abc4a..4cb4ef6 100644
--- a/src/utils/SearchPageFunctions/searchformSchema.ts
+++ b/src/utils/SearchPageFunctions/searchformSchema.ts
@@ -61,7 +61,7 @@ export const baseSchema: JSONSchema7 = {
     gender: {
       title: "Subject gender",
       type: "string",
-      enum: ["male", "female", "unknown", "any"],
+      enum: ["male", "female", "any"],
       default: "any",
     },
     age_range_slider: {

From 44635bd8a4e67c909306c43d68a0c8743bf24d2c Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 12 May 2026 10:55:48 -0400
Subject: [PATCH 27/61] feat(backend): add file type filter to search using
 iolinks table

---
 backend/src/controllers/couchdb.controller.js | 36 +++++++++++++++++++
 backend/src/routes/dbs.routes.js              |  6 ++++
 2 files changed, 42 insertions(+)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index f6c54c5..edb9957 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -227,6 +227,20 @@ const searchAllDatabases = async (req, res) => {
       repl.keyword = String(f.keyword);
     }
 
+    // File-type filter — array of extensions like [".jdb", ".snirf"].
+    // Dataset-level: include rows whose (dbname, dsname) has at least one
+    // iolinks file with a matching view (extension). Per-subject filtering
+    // isn't possible here because iolinks.subj stores file size, not subj id.
+    if (Array.isArray(f.file_type) && f.file_type.length > 0) {
+      where.push(`EXISTS (
+        SELECT 1 FROM iolinks l
+        WHERE l.dbname = ioviews.dbname
+          AND l.dsname = ioviews.dsname
+          AND l.view = ANY(:fileTypes)
+      )`);
+      repl.fileTypes = f.file_type.map((t) => String(t));
+    }
+
     const limit = Math.min(parseInt(f.limit) || 100, 1000);
     const offset = parseInt(f.skip) || 0;
     repl.limit = limit;
@@ -392,6 +406,27 @@ const getDatasetMeta = async (req, res) => {
 
 // }
 
+// distinct file extensions present in iolinks across all synced DBs.
+// Drives the multi-select "File types" filter on the search page.
+const getFileTypes = async (req, res) => {
+  try {
+    const rows = await sequelize.query(
+      `SELECT DISTINCT view AS type
+       FROM iolinks
+       WHERE view IS NOT NULL AND view <> ''
+       ORDER BY view`,
+      { type: sequelize.QueryTypes.SELECT }
+    );
+    res.status(200).json(rows.map((r) => r.type));
+  } catch (error) {
+    console.error("Error fetching file types:", error.message);
+    res.status(500).json({
+      message: "Error fetching file types",
+      error: error.message,
+    });
+  }
+};
+
 module.exports = {
   getDbList,
   getDbStats,
@@ -400,4 +435,5 @@ module.exports = {
   searchAllDatabases,
   getDatasetDetail,
   getDatasetMeta,
+  getFileTypes,
 };
diff --git a/backend/src/routes/dbs.routes.js b/backend/src/routes/dbs.routes.js
index c8a57fa..621b32f 100644
--- a/backend/src/routes/dbs.routes.js
+++ b/backend/src/routes/dbs.routes.js
@@ -6,6 +6,7 @@ const {
   getDbInfo,
   getDbDatasets,
   searchAllDatabases,
+  getFileTypes,
   //   searchDatabase,
 } = require("../controllers/couchdb.controller");
 
@@ -15,6 +16,11 @@ const router = express.Router();
 router.get("/", getDbList);
 router.get("/stats", getDbStats);
 
+// distinct file extensions across all iolinks rows (drives the file-type
+// filter on the search page). Must come BEFORE the /:dbName route, otherwise
+// Express treats "file-types" as a dbName.
+router.get("/file-types", getFileTypes);
+
 // cross-database search
 router.post("/search", searchAllDatabases);
 

From 1b0aa6576ecddb1c225adb3d8b0c543ea8069bb9 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 12 May 2026 11:37:12 -0400
Subject: [PATCH 28/61] feat(search): add multi-select File types filter
 (dataset-level)

---
 backend/src/controllers/couchdb.controller.js |  4 +-
 .../widgets/FileTypeAutocompleteWidget.tsx    | 40 +++++++++++++++++++
 src/pages/SearchPage.tsx                      | 27 +++++++++++--
 src/redux/neurojson/neurojson.action.ts       | 13 ++++++
 src/redux/neurojson/neurojson.slice.ts        | 13 ++++++
 .../neurojson/types/neurojson.interface.ts    |  1 +
 src/services/neurojson.service.ts             |  7 ++++
 .../SearchPageFunctions/generateUiSchema.ts   | 18 ++++++++-
 .../SearchPageFunctions/searchformSchema.ts   |  6 +++
 9 files changed, 123 insertions(+), 6 deletions(-)
 create mode 100644 src/components/SearchPage/widgets/FileTypeAutocompleteWidget.tsx

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index edb9957..928a61b 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -231,12 +231,14 @@ const searchAllDatabases = async (req, res) => {
     // Dataset-level: include rows whose (dbname, dsname) has at least one
     // iolinks file with a matching view (extension). Per-subject filtering
     // isn't possible here because iolinks.subj stores file size, not subj id.
+    // Use IN (:array) — Sequelize replacements expand arrays as 'a','b','c',
+    // which fits IN(...) but NOT ANY(...).
     if (Array.isArray(f.file_type) && f.file_type.length > 0) {
       where.push(`EXISTS (
         SELECT 1 FROM iolinks l
         WHERE l.dbname = ioviews.dbname
           AND l.dsname = ioviews.dsname
-          AND l.view = ANY(:fileTypes)
+          AND l.view IN (:fileTypes)
       )`);
       repl.fileTypes = f.file_type.map((t) => String(t));
     }
diff --git a/src/components/SearchPage/widgets/FileTypeAutocompleteWidget.tsx b/src/components/SearchPage/widgets/FileTypeAutocompleteWidget.tsx
new file mode 100644
index 0000000..eb941ad
--- /dev/null
+++ b/src/components/SearchPage/widgets/FileTypeAutocompleteWidget.tsx
@@ -0,0 +1,40 @@
+import { Autocomplete, Chip, TextField } from "@mui/material";
+import { WidgetProps } from "@rjsf/utils";
+
+// Multi-select combobox for file extensions (e.g. ".jdb", ".snirf").
+// Options come from uiSchema's ui:options.fileTypes, fetched once by the
+// parent SearchPage from /api/v1/dbs/file-types.
+export const FileTypeAutocompleteWidget = (props: WidgetProps) => {
+  const { value, onChange, options, label } = props;
+  const fileTypes = (options.fileTypes as string[]) || [];
+  const current: string[] = Array.isArray(value) ? value : [];
+
+  return (
+    <Autocomplete
+      multiple
+      options={fileTypes}
+      value={current}
+      onChange={(_, v) => onChange(v as string[])}
+      renderTags={(items, getTagProps) =>
+        items.map((item, index) => (
+          <Chip
+            variant="outlined"
+            label={item}
+            size="small"
+            {...getTagProps({ index })}
+            key={item}
+          />
+        ))
+      }
+      renderInput={(params) => (
+        <TextField
+          {...params}
+          label={label || "File types"}
+          placeholder={current.length === 0 ? "e.g. .snirf, .jdb" : ""}
+          size="small"
+          fullWidth
+        />
+      )}
+    />
+  );
+};
diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index ca5d1c4..e8e8da0 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -25,6 +25,7 @@ import ClickTooltip from "components/SearchPage/ClickTooltip";
 import DatabaseCard from "components/SearchPage/DatabaseCard";
 import DatasetCard from "components/SearchPage/DatasetCard";
 import SubjectCard from "components/SearchPage/SubjectCard";
+import { FileTypeAutocompleteWidget } from "components/SearchPage/widgets/FileTypeAutocompleteWidget";
 import { TypeAutocompleteWidget } from "components/SearchPage/widgets/TypeAutocompleteWidget";
 import { Colors } from "design/theme";
 import { useAppDispatch } from "hooks/useAppDispatch";
@@ -33,6 +34,7 @@ import pako from "pako";
 import React from "react";
 import { useState, useEffect, useMemo } from "react";
 import {
+  fetchFileTypes,
   fetchMetadataSearchResults,
   fetchRegistry,
 } from "redux/neurojson/neurojson.action";
@@ -186,6 +188,9 @@ const SearchPage: React.FC = () => {
   const registry = useAppSelector(
     (state: RootState) => state.neurojson.registry
   );
+  const fileTypes = useAppSelector(
+    (state: RootState) => state.neurojson.fileTypes
+  );
   const loading = useAppSelector((state: RootState) => state.neurojson.loading);
 
   const [formData, setFormData] = useState<Record<string, any>>({});
@@ -323,12 +328,21 @@ const SearchPage: React.FC = () => {
 
   // form UI
   const uiSchema = useMemo(
-    () => generateUiSchema(formData, showSubjectFilters, showDatasetFilters),
-    [formData, showSubjectFilters, showDatasetFilters]
+    () =>
+      generateUiSchema(
+        formData,
+        showSubjectFilters,
+        showDatasetFilters,
+        fileTypes || []
+      ),
+    [formData, showSubjectFilters, showDatasetFilters, fileTypes]
   );
 
-  // Custom RJSF widgets — combobox for the "Data type keywords" field.
-  const customWidgets = { typeAutocomplete: TypeAutocompleteWidget };
+  // Custom RJSF widgets — comboboxes for the Data type and File types fields.
+  const customWidgets = {
+    typeAutocomplete: TypeAutocompleteWidget,
+    fileTypeAutocomplete: FileTypeAutocompleteWidget,
+  };
 
   // Create the "Subject-level Filters" button as a custom field
   const customFields = {
@@ -387,6 +401,11 @@ const SearchPage: React.FC = () => {
     dispatch(fetchRegistry());
   }, [dispatch]);
 
+  // get the distinct file extensions for the "File types" multi-select.
+  useEffect(() => {
+    dispatch(fetchFileTypes());
+  }, [dispatch]);
+
   // dynamically add database enum to schema
   const schema = useMemo(() => {
     const dbList = registry?.length
diff --git a/src/redux/neurojson/neurojson.action.ts b/src/redux/neurojson/neurojson.action.ts
index 35cf6c1..f8f08c2 100644
--- a/src/redux/neurojson/neurojson.action.ts
+++ b/src/redux/neurojson/neurojson.action.ts
@@ -109,6 +109,19 @@ export const fetchMetadataSearchResults = createAsyncThunk(
   }
 );
 
+// distinct iolinks file extensions — populates the "File types" multi-select
+export const fetchFileTypes = createAsyncThunk(
+  "neurojson/fetchFileTypes",
+  async (_, { rejectWithValue }) => {
+    try {
+      const data = await NeurojsonService.getFileTypes();
+      return data;
+    } catch (error: any) {
+      return rejectWithValue("Failed to fetch file types");
+    }
+  }
+);
+
 // fetch data for metadata panel in dataset detail page
 export const fetchDbInfoByDatasetId = createAsyncThunk(
   "neurojson/fetchDbInfoByDatasetId",
diff --git a/src/redux/neurojson/neurojson.slice.ts b/src/redux/neurojson/neurojson.slice.ts
index 90722c7..cfafc6a 100644
--- a/src/redux/neurojson/neurojson.slice.ts
+++ b/src/redux/neurojson/neurojson.slice.ts
@@ -7,6 +7,7 @@ import {
   fetchDbStats,
   fetchMetadataSearchResults,
   fetchDbInfoByDatasetId,
+  fetchFileTypes,
 } from "./neurojson.action";
 import { DBDatafields, INeuroJsonState } from "./types/neurojson.interface";
 import { createSlice, PayloadAction } from "@reduxjs/toolkit";
@@ -26,6 +27,7 @@ const initialState: INeuroJsonState = {
   dbStats: null,
   searchResults: null,
   datasetViewInfo: null,
+  fileTypes: null,
 };
 
 const neurojsonSlice = createSlice({
@@ -155,6 +157,17 @@ const neurojsonSlice = createSlice({
         state.loading = false;
         state.error = action.payload as string;
       })
+      // fetchFileTypes runs once on mount; no pending case so it doesn't
+      // clobber the shared `loading` spinner used by the search button.
+      .addCase(
+        fetchFileTypes.fulfilled,
+        (state, action: PayloadAction<string[]>) => {
+          state.fileTypes = action.payload;
+        }
+      )
+      .addCase(fetchFileTypes.rejected, (state, action) => {
+        state.error = action.payload as string;
+      })
       .addCase(fetchDbInfoByDatasetId.pending, (state) => {
         state.loading = true;
         state.error = null;
diff --git a/src/redux/neurojson/types/neurojson.interface.ts b/src/redux/neurojson/types/neurojson.interface.ts
index 365566d..01c8273 100644
--- a/src/redux/neurojson/types/neurojson.interface.ts
+++ b/src/redux/neurojson/types/neurojson.interface.ts
@@ -13,6 +13,7 @@ export interface INeuroJsonState {
   dbStats: DbStatsItem[] | null; // for dbStats on landing page
   searchResults: any[] | { status: string; msg: string } | null;
   datasetViewInfo: any | null;
+  fileTypes: string[] | null;
 }
 
 export interface DBParticulars {
diff --git a/src/services/neurojson.service.ts b/src/services/neurojson.service.ts
index 008e960..ed1f70d 100644
--- a/src/services/neurojson.service.ts
+++ b/src/services/neurojson.service.ts
@@ -150,6 +150,13 @@ export const NeurojsonService = {
     return response.data;
   },
 
+  // GET /api/v1/dbs/file-types  → distinct iolinks.view values
+  // Drives the multi-select "File types" filter on the search page.
+  getFileTypes: async (): Promise<string[]> => {
+    const response = await api.get(`/dbs/file-types`);
+    return response.data;
+  },
+
   // getDbInfoByDatasetId: async (dbName: string, dsId: string): Promise<any> => {
   //   const response = await api.get(
   //     `${baseURL}/${dbName}/_design/qq/_view/dbinfo`,
diff --git a/src/utils/SearchPageFunctions/generateUiSchema.ts b/src/utils/SearchPageFunctions/generateUiSchema.ts
index 872accb..152a056 100644
--- a/src/utils/SearchPageFunctions/generateUiSchema.ts
+++ b/src/utils/SearchPageFunctions/generateUiSchema.ts
@@ -6,7 +6,8 @@ import { getTypeSuggestions } from "./typesByModality";
 export const generateUiSchema = (
   formData: Record<string, any>,
   showSubjectFilters: boolean,
-  showDatasetFilters: boolean
+  showDatasetFilters: boolean,
+  fileTypeOptions: string[] = []
 ) => {
   const activeStyle = {
     "ui:options": {
@@ -49,6 +50,7 @@ export const generateUiSchema = (
       "dataset_filters_toggle", // button first
       "database",
       "keyword",
+      "file_type", // dataset-level: filters by file extensions in iolinks
       "subject_filters_toggle",
       "age_range_slider", // top of subject filters — range slider for age
       "modality",
@@ -90,6 +92,20 @@ export const generateUiSchema = (
     //   dataset: formData["dataset"] ? activeStyle : {},
     //   limit: formData["limit"] ? activeStyle : {},
     //   skip: formData["skip"] ? activeStyle : {},
+    // File-type filter — dataset-level. Multi-select of file extensions
+    // present in iolinks (fetched dynamically via /api/v1/dbs/file-types).
+    file_type: showDatasetFilters
+      ? {
+          "ui:widget": "fileTypeAutocomplete",
+          "ui:options": {
+            fileTypes: fileTypeOptions,
+            ...(Array.isArray(formData["file_type"]) &&
+            formData["file_type"].length > 0
+              ? { style: { backgroundColor: Colors.lightBlue } }
+              : {}),
+          },
+        }
+      : datasetHiddenStyle,
     limit: invisibleStyle,
     skip: invisibleStyle,
 
diff --git a/src/utils/SearchPageFunctions/searchformSchema.ts b/src/utils/SearchPageFunctions/searchformSchema.ts
index 4cb4ef6..e122725 100644
--- a/src/utils/SearchPageFunctions/searchformSchema.ts
+++ b/src/utils/SearchPageFunctions/searchformSchema.ts
@@ -128,6 +128,12 @@ export const baseSchema: JSONSchema7 = {
       title: "Data type",
       type: "string",
     },
+    file_type: {
+      title: "File types",
+      type: "array",
+      items: { type: "string" },
+      uniqueItems: true,
+    },
     session_name: {
       title: "Session keywords",
       type: "string",

From 9f826d4c4e959b9553c191ea8a52afd1585f4ea1 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 12 May 2026 12:12:11 -0400
Subject: [PATCH 29/61] fix(search): age slider per-handle clearing + non-BIDS
 file-type warning

---
 src/pages/SearchPage.tsx | 64 ++++++++++++++++++++++++++++++++--------
 1 file changed, 51 insertions(+), 13 deletions(-)

diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index e8e8da0..260931c 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -81,16 +81,15 @@ const AgeRangeSliderField = (props: any) => {
         onChange={(_, v) => {
           const [newLo, newHi] = v as number[];
           setFormData((prev) => {
-            const atFull =
-              newLo === AGE_MIN_BOUND && newHi === AGE_MAX_BOUND;
             const next = { ...prev };
-            if (atFull) {
-              delete next.age_min;
-              delete next.age_max;
-            } else {
-              next.age_min = newLo;
-              next.age_max = newHi;
-            }
+            // Each handle is its own filter. A handle at the bound means
+            // "no constraint on that side", so we leave it out of formData
+            // (otherwise age_min=0 silently excludes unknown-age subjects
+            // whose stored key is "000-1", lexicographically below "00000").
+            if (newLo === AGE_MIN_BOUND) delete next.age_min;
+            else next.age_min = newLo;
+            if (newHi === AGE_MAX_BOUND) delete next.age_max;
+            else next.age_max = newHi;
             return next;
           });
         }}
@@ -560,6 +559,35 @@ const SearchPage: React.FC = () => {
     !loading &&
     // !hasDbMatches &&
     (!hasDatasetMatches || backendEmpty);
+
+  // Tailored empty-state message: when the user combined a file_type filter
+  // with any subject-level filter and got nothing back, it's almost certainly
+  // because the file extension lives in non-BIDS datasets (which have no
+  // subject rows in ioviews). The generic "adjust filters" message hides this.
+  const SUBJECT_FILTER_KEYS = [
+    "age_min",
+    "age_max",
+    "gender",
+    "task_min",
+    "task_max",
+    "task_name",
+    "run_min",
+    "run_max",
+    "run_name",
+    "sess_min",
+    "sess_max",
+    "session_name",
+    "type_name",
+    "modality",
+    "subject",
+  ];
+  const isAppliedFilter = (v: any) =>
+    v !== "" && v !== "any" && v !== undefined && v !== null;
+  const showFileTypeNonBidsHint =
+    showNoResults &&
+    Array.isArray(appliedFilters.file_type) &&
+    appliedFilters.file_type.length > 0 &&
+    SUBJECT_FILTER_KEYS.some((k) => isAppliedFilter(appliedFilters[k]));
   return (
     <Container
       maxWidth={false}
@@ -1011,10 +1039,20 @@ const SearchPage: React.FC = () => {
                           Search Results
                         </Typography>
 
-                        <Typography sx={{ color: Colors.error }}>
-                          No datasets or subjects found. Please adjust the
-                          filters and try again.
-                        </Typography>
+                        {showFileTypeNonBidsHint ? (
+                          <Typography sx={{ color: Colors.error }}>
+                            No matching subjects found. The selected file type
+                            may only exist in non-BIDS datasets (e.g. mesh or
+                            atlas libraries), which have no subject-level
+                            records. Try removing subject-level filters
+                            (modality, age, gender, etc.) and search again.
+                          </Typography>
+                        ) : (
+                          <Typography sx={{ color: Colors.error }}>
+                            No datasets or subjects found. Please adjust the
+                            filters and try again.
+                          </Typography>
+                        )}
                       </Box>
                     )}
 

From 38fc1cbb83131613137d0386f55a4d6b2e993772 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 12 May 2026 14:26:36 -0400
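Subject: [PATCH 30/61] fix(search): highlight each word of multi-word keyword
 independently

Also extends the backend keyword filter with case-insensitive substring
matching (ILIKE) on dbname and dsname, in addition to the tsquery match.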

---
 backend/src/controllers/couchdb.controller.js | 13 +++-
 src/components/SearchPage/DatasetCard.tsx     | 75 +++++++++++++------
 2 files changed, 65 insertions(+), 23 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index 928a61b..df1532b 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -221,10 +221,19 @@ const searchAllDatabases = async (req, res) => {
       repl.subj = String(f.subject);
     }
 
-    // Keyword full-text search
+    // Keyword search — match anywhere relevant.
+    // tsquery covers stemmed tokens inside the JSON content (name, readme,
+    // info, modality, subj). ILIKE on dbname/dsname adds substring matching
+    // so "fnirs" finds "bfnirs", "openfnirs", and any dataset id containing it.
+    // The whole group is parenthesised so it ANDs cleanly with other filters.
     if (isFilter(f.keyword)) {
-      where.push(`search_vector @@ websearch_to_tsquery('english', :keyword)`);
+      where.push(`(
+        search_vector @@ websearch_to_tsquery('english', :keyword)
+        OR dbname ILIKE :keywordLike
+        OR dsname ILIKE :keywordLike
+      )`);
       repl.keyword = String(f.keyword);
+      repl.keywordLike = `%${String(f.keyword)}%`;
     }
 
     // File-type filter — array of extensions like [".jdb", ".snirf"].
diff --git a/src/components/SearchPage/DatasetCard.tsx b/src/components/SearchPage/DatasetCard.tsx
index 42f6646..5790ee5 100644
--- a/src/components/SearchPage/DatasetCard.tsx
+++ b/src/components/SearchPage/DatasetCard.tsx
@@ -35,11 +35,21 @@ const normalize = (s: string) =>
     ?.replace(/[\u201C\u201D\u2033]/g, '"') ?? // curly → straight
   "";
 
+// Multi-word keyword support: backend tsquery treats "head brain" as AND of
+// independent tokens. Highlighting should match the same logic — split on
+// whitespace and treat each word independently.
+const splitKeyword = (kw?: string): string[] => {
+  if (!kw) return [];
+  return normalize(kw).trim().split(/\s+/).filter(Boolean);
+};
+
+const escapeRegex = (s: string) => s.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
+
 const containsKeyword = (text?: string, kw?: string) => {
   if (!text || !kw) return false;
   const t = normalize(text).toLowerCase();
-  const k = normalize(kw).toLowerCase();
-  return t.includes(k);
+  const words = splitKeyword(kw.toLowerCase());
+  return words.some((w) => t.includes(w));
 };
 
 /** Find a short snippet in secondary fields if not already visible */
@@ -62,24 +72,41 @@ function findMatchSnippet(
     ["ReferencesAndLinks", (v) => v?.info?.ReferencesAndLinks],
   ];
 
-  const k = normalize(kw).toLowerCase();
+  const words = splitKeyword(kw.toLowerCase());
+  if (words.length === 0) return null;
 
   for (const [label, getter] of CANDIDATE_FIELDS) {
     const raw = getter(v); // v = parsedJson.value
     if (!raw) continue;
     const text = normalize(String(raw));
-    const i = text.toLowerCase().indexOf(k); // k is the lowercase version of keyword
-    if (i >= 0) {
-      const start = Math.max(0, i - 40);
-      const end = Math.min(text.length, i + k.length + 40);
-      const before = text.slice(start, i);
-      const hit = text.slice(i, i + k.length);
-      const after = text.slice(i + k.length, end);
-      const html = `${
-        start > 0 ? "…" : ""
-      }${before}<mark>${hit}</mark>${after}${end < text.length ? "…" : ""}`;
-      return { label, html };
+    const lower = text.toLowerCase();
+
+    // Find the earliest occurrence of ANY matching word — that's the snippet anchor.
+    let anchor = -1;
+    let anchorLen = 0;
+    for (const w of words) {
+      const i = lower.indexOf(w);
+      if (i >= 0 && (anchor < 0 || i < anchor)) {
+        anchor = i;
+        anchorLen = w.length;
+      }
     }
+    if (anchor < 0) continue;
+
+    const start = Math.max(0, anchor - 40);
+    const end = Math.min(text.length, anchor + anchorLen + 40);
+    const slice = text.slice(start, end);
+
+    // Highlight every matching word inside the snippet, not just the first.
+    const regex = new RegExp(
+      `(${words.map(escapeRegex).join("|")})`,
+      "gi"
+    );
+    const highlighted = slice.replace(regex, "<mark>$1</mark>");
+    const html = `${start > 0 ? "…" : ""}${highlighted}${
+      end < text.length ? "…" : ""
+    }`;
+    return { label, html };
   }
   return null;
 }
@@ -122,19 +149,25 @@ const DatasetCard: React.FC<DatasetCardProps> = ({
     [parsedJson.value, keyword, visibleHasKeyword]
   );
 
-  // keyword highlight functional component (only for visible fields)
+  // keyword highlight functional component (only for visible fields).
+  // Splits the keyword on whitespace and highlights each word independently
+  // so "head brain" highlights both words wherever they appear.
   const highlightKeyword = (text: string, keyword?: string) => {
-    if (!keyword || !text?.toLowerCase().includes(keyword.toLowerCase())) {
-      return text;
-    }
-
-    const regex = new RegExp(`(${keyword})`, "gi"); // for case-insensitive and global
+    const words = splitKeyword(keyword);
+    if (words.length === 0 || !text) return text;
+    const lowerWordSet = new Set(words.map((w) => w.toLowerCase()));
+    const regex = new RegExp(
+      `(${words.map(escapeRegex).join("|")})`,
+      "gi"
+    );
+    if (!regex.test(text)) return text;
+    // test() advances lastIndex on /g regexes, but split() below does not read it, so no reset is needed.
     const parts = text.split(regex);
 
     return (
       <>
         {parts.map((part, i) =>
-          part.toLowerCase() === keyword.toLowerCase() ? (
+          lowerWordSet.has(part.toLowerCase()) ? (
             <mark
               key={i}
               style={{ backgroundColor: "yellow", fontWeight: 600 }}

From bebd036f647b9dec78eec8e0045646aee7c5c76a Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 12 May 2026 16:31:53 -0400
Subject: [PATCH 31/61] fix(search): keyword highlight reads from
 appliedFilters, not formData

---
 src/pages/SearchPage.tsx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index 260931c..ca63bed 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -1002,7 +1002,7 @@ const SearchPage: React.FC = () => {
                                   dsname={item.dsname}
                                   parsedJson={parsedJson}
                                   onChipClick={handleChipClick}
-                                  keyword={formData.keyword} // for keyword highlight
+                                  keyword={appliedFilters.keyword} // highlight what was searched, not the live form
                                 />
                               ) : (
                                 <SubjectCard

From fba024032f900b5d5bda5c4d572eaa2187d20b42 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 13 May 2026 15:26:18 -0400
Subject: [PATCH 32/61] feat: add file download endpoints for dataset search
 results

---
 backend/src/controllers/couchdb.controller.js | 76 ++++++++++++++++++-
 backend/src/routes/dbs.routes.js              |  5 ++
 2 files changed, 80 insertions(+), 1 deletion(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index df1532b..db642da 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -257,6 +257,32 @@ const searchAllDatabases = async (req, res) => {
     repl.limit = limit;
     repl.offset = offset;
 
+    // When file_type filter is active, also return a sample of the actual
+    // matching iolinks rows (filename, url, path, suffix) per dataset, plus
+    // a total count. Frontend shows up to 20 as clickable filenames and a
+    // "Download manifest" button for the full list via a separate endpoint.
+    const matchingFilesActive =
+      Array.isArray(f.file_type) && f.file_type.length > 0;
+    const matchingFilesColumn = matchingFilesActive
+      ? `,
+        COALESCE((
+          SELECT jsonb_agg(t.json)
+          FROM (
+            SELECT l.json
+            FROM iolinks l
+            WHERE l.dbname = ioviews.dbname
+              AND l.dsname = ioviews.dsname
+              AND l.view IN (:fileTypes)
+            ORDER BY l.id
+            LIMIT 20
+          ) t
+        ), '[]'::jsonb)::text AS matching_files,
+        (SELECT COUNT(*) FROM iolinks l
+         WHERE l.dbname = ioviews.dbname
+           AND l.dsname = ioviews.dsname
+           AND l.view IN (:fileTypes))::int AS matching_files_total`
+      : "";
+
     // dbinfo was stored flat ({name, subj, ...}); subjects was stored wrapped
     // ({key, value}). Frontend expects parsed.value.subj for datasets, so we
     // wrap dbinfo on the way out.
@@ -268,7 +294,7 @@ const searchAllDatabases = async (req, res) => {
         CASE
           WHEN view = 'dbinfo' THEN jsonb_build_object('value', json)::text
           ELSE json::text
-        END AS json
+        END AS json${matchingFilesColumn}
       FROM ioviews
       WHERE ${where.join(" AND ")}
       ORDER BY dbname, dsname, subj
@@ -417,6 +443,53 @@ const getDatasetMeta = async (req, res) => {
 
 // }
 
+// Plain-text manifest of every matching iolinks URL for a dataset, served
+// as a downloadable .txt. The user pipes it into wget/aria2c to fetch
+// everything: `wget -i manifest.txt`. Avoids server-side zipping and gives
+// resumable, parallel downloads.
+const getDatasetFilesManifest = async (req, res) => {
+  try {
+    const { dbName, dsName } = req.params;
+    const rawExt = req.query.ext;
+    const exts = Array.isArray(rawExt)
+      ? rawExt
+      : typeof rawExt === "string" && rawExt.length > 0
+      ? rawExt.split(",")
+      : [];
+
+    if (exts.length === 0) {
+      res.status(400).send("ext query parameter required (e.g. ?ext=.jdb)");
+      return;
+    }
+
+    const rows = await sequelize.query(
+      `SELECT json->'value'->>'url' AS url
+       FROM iolinks
+       WHERE dbname = :dbname
+         AND dsname = :dsname
+         AND view IN (:exts)
+       ORDER BY id`,
+      {
+        replacements: { dbname: dbName, dsname: dsName, exts },
+        type: sequelize.QueryTypes.SELECT,
+      }
+    );
+
+    const urls = rows.map((r) => r.url).filter(Boolean);
+    const filename = `${dbName}_${dsName}_${exts.join("_")}_manifest.txt`;
+
+    res.setHeader("Content-Type", "text/plain; charset=utf-8");
+    res.setHeader(
+      "Content-Disposition",
+      `attachment; filename="${filename}"`
+    );
+    res.send(urls.join("\n") + "\n");
+  } catch (error) {
+    console.error("Error generating manifest:", error.message);
+    res.status(500).send(`Error generating manifest: ${error.message}`);
+  }
+};
+
 // distinct file extensions present in iolinks across all synced DBs.
 // Drives the multi-select "File types" filter on the search page.
 const getFileTypes = async (req, res) => {
@@ -447,4 +520,5 @@ module.exports = {
   getDatasetDetail,
   getDatasetMeta,
   getFileTypes,
+  getDatasetFilesManifest,
 };
diff --git a/backend/src/routes/dbs.routes.js b/backend/src/routes/dbs.routes.js
index 621b32f..45979ac 100644
--- a/backend/src/routes/dbs.routes.js
+++ b/backend/src/routes/dbs.routes.js
@@ -7,6 +7,7 @@ const {
   getDbDatasets,
   searchAllDatabases,
   getFileTypes,
+  getDatasetFilesManifest,
   //   searchDatabase,
 } = require("../controllers/couchdb.controller");
 
@@ -24,6 +25,10 @@ router.get("/file-types", getFileTypes);
 // cross-database search
 router.post("/search", searchAllDatabases);
 
+// downloadable manifest (plain text) of all iolinks URLs for a dataset
+// filtered by extension(s). e.g. /dbs/bfnirs/Motion-Yucel2014-I/files/manifest?ext=.jdb
+router.get("/:dbName/:dsName/files/manifest", getDatasetFilesManifest);
+
 // Specific database routes
 router.get("/:dbName", getDbInfo);
 router.get("/:dbName/datasets", getDbDatasets);

From 51960cf2274aacf95c4864da675809b74aadd925 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 13 May 2026 15:45:06 -0400
Subject: [PATCH 33/61] feat(search): show matching files in dataset card with
 selective and manifest download

---
 backend/src/controllers/couchdb.controller.js |   4 +-
 src/components/SearchPage/DatasetCard.tsx     | 145 +++++++++++++++++-
 src/pages/SearchPage.tsx                      |   7 +
 3 files changed, 153 insertions(+), 3 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index db642da..20a7cae 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -259,7 +259,7 @@ const searchAllDatabases = async (req, res) => {
 
     // When file_type filter is active, also return a sample of the actual
     // matching iolinks rows (filename, url, path, suffix) per dataset, plus
-    // a total count. Frontend shows up to 20 as clickable filenames and a
+    // a total count. Frontend shows up to 10 as clickable filenames and a
     // "Download manifest" button for the full list via a separate endpoint.
     const matchingFilesActive =
       Array.isArray(f.file_type) && f.file_type.length > 0;
@@ -274,7 +274,7 @@ const searchAllDatabases = async (req, res) => {
               AND l.dsname = ioviews.dsname
               AND l.view IN (:fileTypes)
             ORDER BY l.id
-            LIMIT 20
+            LIMIT 10
           ) t
         ), '[]'::jsonb)::text AS matching_files,
         (SELECT COUNT(*) FROM iolinks l
diff --git a/src/components/SearchPage/DatasetCard.tsx b/src/components/SearchPage/DatasetCard.tsx
index 5790ee5..da4e0c7 100644
--- a/src/components/SearchPage/DatasetCard.tsx
+++ b/src/components/SearchPage/DatasetCard.tsx
@@ -1,10 +1,31 @@
-import { Typography, Card, CardContent, Stack, Chip } from "@mui/material";
+import DownloadIcon from "@mui/icons-material/Download";
+import {
+  Typography,
+  Card,
+  CardContent,
+  Stack,
+  Chip,
+  Button,
+  Link as MuiLink,
+} from "@mui/material";
+import { baseURL } from "services/instance";
 import { Colors } from "design/theme";
 import React from "react";
 import { useMemo } from "react";
 import { Link } from "react-router-dom";
 import RoutesEnum from "types/routes.enum";
 
+interface MatchingFile {
+  key?: any;
+  value?: {
+    file?: string;
+    url?: string;
+    path?: string;
+    suffix?: string;
+    ref?: string;
+  };
+}
+
 interface DatasetCardProps {
   dbname: string;
   dsname: string;
@@ -26,6 +47,9 @@ interface DatasetCardProps {
   index: number;
   onChipClick: (key: string, value: string) => void;
   keyword?: string; // for keyword highlight
+  matchingFiles?: MatchingFile[]; // sample of iolinks rows matching file_type
+  matchingFilesTotal?: number; // total count across all matches
+  fileTypes?: string[]; // the active file_type filter, used to build manifest URL
 }
 
 /** ---------- utility helpers ---------- **/
@@ -119,10 +143,41 @@ const DatasetCard: React.FC<DatasetCardProps> = ({
   index,
   onChipClick,
   keyword,
+  matchingFiles,
+  matchingFilesTotal,
+  fileTypes,
 }) => {
   const { name, readme, modality, subj, info } = parsedJson.value;
   const datasetLink = `${RoutesEnum.DATABASES}/${dbname}/${dsname}`;
 
+  // Manifest URL — backend serves a plain-text list of all matching URLs.
+  const manifestUrl = useMemo(() => {
+    if (!fileTypes || fileTypes.length === 0) return null;
+    const ext = fileTypes
+      .map((e) => encodeURIComponent(e))
+      .join(",");
+    return `${baseURL}/dbs/${encodeURIComponent(
+      dbname
+    )}/${encodeURIComponent(dsname)}/files/manifest?ext=${ext}`;
+  }, [dbname, dsname, fileTypes]);
+
+  // Extract a short "sub-XXX" tag from a BIDS path like
+  // "$.sub-019.ses-1.nirs.sub-019_ses-1_task-MA_run-01_nirs.snirf.SNIRFData..."
+  const subjectFromPath = (p?: string): string => {
+    if (!p) return "";
+    const m = p.match(/sub-[^.]+/);
+    return m ? m[0] : "";
+  };
+
+  // File size stored in key[1] of each iolinks row (bytes). Format for humans.
+  const formatBytes = (n?: number): string => {
+    if (typeof n !== "number" || !Number.isFinite(n) || n < 0) return "";
+    if (n < 1024) return `${n} B`;
+    if (n < 1024 * 1024) return `${(n / 1024).toFixed(1)} KB`;
+    if (n < 1024 * 1024 * 1024) return `${(n / 1024 / 1024).toFixed(1)} MB`;
+    return `${(n / 1024 / 1024 / 1024).toFixed(2)} GB`;
+  };
+
   // prepare DOI URL
   const rawDOI = info?.DatasetDOI?.replace(/^doi:/, "");
   const doiLink = rawDOI ? `https://doi.org/${rawDOI}` : null;
@@ -338,6 +393,94 @@ const DatasetCard: React.FC<DatasetCardProps> = ({
               </Stack>
             )}
           </Stack>
+
+          {/* Matching files section — only shown when file_type filter is active */}
+          {Array.isArray(matchingFiles) && matchingFiles.length > 0 && (
+            <Stack
+              spacing={1}
+              sx={{
+                mt: 2,
+                pt: 1.5,
+                borderTop: "1px solid",
+                borderColor: "divider",
+              }}
+            >
+              <Stack
+                direction="row"
+                alignItems="center"
+                justifyContent="space-between"
+                flexWrap="wrap"
+                gap={1}
+              >
+                <Typography variant="subtitle2" sx={{ fontWeight: 600 }}>
+                  Matching files
+                  {typeof matchingFilesTotal === "number" &&
+                    ` (${
+                      matchingFiles.length < matchingFilesTotal
+                        ? `${matchingFiles.length} of ${matchingFilesTotal}`
+                        : matchingFilesTotal
+                    })`}
+                </Typography>
+                {manifestUrl && (
+                  <Button
+                    component="a"
+                    href={manifestUrl}
+                    size="small"
+                    variant="outlined"
+                    startIcon={<DownloadIcon />}
+                    sx={{
+                      color: Colors.purple,
+                      borderColor: Colors.purple,
+                      textTransform: "none",
+                    }}
+                  >
+                    Download manifest
+                    {typeof matchingFilesTotal === "number" &&
+                      ` (${matchingFilesTotal} files)`}
+                  </Button>
+                )}
+              </Stack>
+              <Stack spacing={0.5} component="ul" sx={{ pl: 2, m: 0 }}>
+                {matchingFiles.slice(0, 10).map((f, i) => {
+                  const v = f.value || {};
+                  const subjTag = subjectFromPath(v.path);
+                  const sizeBytes =
+                    Array.isArray(f.key) && typeof f.key[1] === "number"
+                      ? f.key[1]
+                      : undefined;
+                  const sizeTag = formatBytes(sizeBytes);
+                  const meta = [subjTag, sizeTag].filter(Boolean).join(" · ");
+                  return (
+                    <li key={i}>
+                      <MuiLink
+                        href={v.url}
+                        target="_blank"
+                        rel="noopener noreferrer"
+                        underline="hover"
+                        sx={{
+                          color: Colors.purple,
+                          fontFamily: "monospace",
+                          fontSize: "0.8rem",
+                          wordBreak: "break-all",
+                        }}
+                      >
+                        {v.file || v.url}
+                      </MuiLink>
+                      {meta && (
+                        <Typography
+                          component="span"
+                          variant="caption"
+                          sx={{ ml: 1, color: "text.secondary" }}
+                        >
+                          ({meta})
+                        </Typography>
+                      )}
+                    </li>
+                  );
+                })}
+              </Stack>
+            </Stack>
+          )}
         </Stack>
       </CardContent>
     </Card>
diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index ca63bed..397e63a 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -1003,6 +1003,13 @@ const SearchPage: React.FC = () => {
                                   parsedJson={parsedJson}
                                   onChipClick={handleChipClick}
                                   keyword={appliedFilters.keyword} // highlight what was searched, not the live form
+                                  matchingFiles={
+                                    item.matching_files
+                                      ? JSON.parse(item.matching_files)
+                                      : undefined
+                                  }
+                                  matchingFilesTotal={item.matching_files_total}
+                                  fileTypes={appliedFilters.file_type}
                                 />
                               ) : (
                                 <SubjectCard

From 5677c7428a921607fc93f03c36113077e1ab3846 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 13 May 2026 16:14:45 -0400
Subject: [PATCH 34/61] fix(search): use plainto_tsquery + normalize ILIKE
 separators for keyword

---
 backend/src/controllers/couchdb.controller.js | 15 ++++++++++-----
 1 file changed, 10 insertions(+), 5 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index 20a7cae..cdcedd3 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -222,18 +222,23 @@ const searchAllDatabases = async (req, res) => {
     }
 
     // Keyword search — match anywhere relevant.
-    // tsquery covers stemmed tokens inside the JSON content (name, readme,
-    // info, modality, subj). ILIKE on dbname/dsname adds substring matching
-    // so "fnirs" finds "bfnirs", "openfnirs", and any dataset id containing it.
+    // plainto_tsquery treats input as plain words AND'd together; ignores
+    // operator chars like "-" and "OR" so dataset names with hyphens
+    // (e.g. "ABIDE - CMU_a") don't get parsed as NOT clauses.
+    // ILIKE on dbname/dsname adds substring matching so "fnirs" finds
+    // "bfnirs", "openfnirs", and any dataset id containing it.
+    // ILIKE pattern normalizes whitespace/hyphens to % wildcards so the
+    // user's "ABIDE - CMU_a" matches stored names like "abide_cmu_a" or
+    // "ABIDE_-_CMU_a" regardless of separator style.
     // The whole group is parenthesised so it ANDs cleanly with other filters.
     if (isFilter(f.keyword)) {
       where.push(`(
-        search_vector @@ websearch_to_tsquery('english', :keyword)
+        search_vector @@ plainto_tsquery('english', :keyword)
         OR dbname ILIKE :keywordLike
         OR dsname ILIKE :keywordLike
       )`);
       repl.keyword = String(f.keyword);
-      repl.keywordLike = `%${String(f.keyword)}%`;
+      repl.keywordLike = `%${String(f.keyword).replace(/[\s-]+/g, "%")}%`;
     }
 
     // File-type filter — array of extensions like [".jdb", ".snirf"].

From bf1abe34995b9e28692165aa38b07718fdce90c6 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 13 May 2026 16:31:14 -0400
Subject: [PATCH 35/61] fix(search): match dataset display name via
 json->>'name' ILIKE

---
 backend/src/controllers/couchdb.controller.js | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index cdcedd3..88e96f1 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -227,15 +227,19 @@ const searchAllDatabases = async (req, res) => {
     // (e.g. "ABIDE - CMU_a") don't get parsed as NOT clauses.
     // ILIKE on dbname/dsname adds substring matching so "fnirs" finds
     // "bfnirs", "openfnirs", and any dataset id containing it.
-    // ILIKE pattern normalizes whitespace/hyphens to % wildcards so the
-    // user's "ABIDE - CMU_a" matches stored names like "abide_cmu_a" or
-    // "ABIDE_-_CMU_a" regardless of separator style.
+    // ILIKE on json->>'name' covers the human-readable name from
+    // dataset_description.json (e.g. "ABIDE - CMU_a"), which is where the
+    // user-visible dataset titles live — dsname column often stores just
+    // an opaque id like "CMU_a" without the prefix.
+    // ILIKE pattern normalizes whitespace/hyphens to % wildcards so
+    // "ABIDE - CMU_a" matches stored names regardless of separator style.
     // The whole group is parenthesised so it ANDs cleanly with other filters.
     if (isFilter(f.keyword)) {
       where.push(`(
         search_vector @@ plainto_tsquery('english', :keyword)
         OR dbname ILIKE :keywordLike
         OR dsname ILIKE :keywordLike
+        OR (json->>'name') ILIKE :keywordLike
       )`);
       repl.keyword = String(f.keyword);
       repl.keywordLike = `%${String(f.keyword).replace(/[\s-]+/g, "%")}%`;

From 6fce0633ef5b639c863302ff50c659386d0ce15b Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 14 May 2026 16:56:12 -0400
Subject: [PATCH 36/61] feat(search): add Mac/Linux and Windows script options
 to file download

---
 backend/src/controllers/couchdb.controller.js |  86 ++++++++-
 src/components/SearchPage/DatasetCard.tsx     | 177 +++++++++++++++---
 2 files changed, 229 insertions(+), 34 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index 88e96f1..c990fe7 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -452,14 +452,18 @@ const getDatasetMeta = async (req, res) => {
 
 // }
 
-// Plain-text manifest of every matching iolinks URL for a dataset, served
-// as a downloadable .txt. The user pipes it into wget/aria2c to fetch
-// everything: `wget -i manifest.txt`. Avoids server-side zipping and gives
-// resumable, parallel downloads.
+// Downloadable list of every matching iolinks URL for a dataset.
+// Three formats via ?format=:
+//   - txt (default) → plain URL list (use with `wget -i`)
+//   - sh             → bash script with curl commands (Mac/Linux)
+//   - bat            → Windows batch script with curl commands
+// All three avoid server-side zipping — the user's machine pulls files
+// directly from neurojson.org/io, so this Express server stays light.
 const getDatasetFilesManifest = async (req, res) => {
   try {
     const { dbName, dsName } = req.params;
     const rawExt = req.query.ext;
+    const format = String(req.query.format || "txt").toLowerCase();
     const exts = Array.isArray(rawExt)
       ? rawExt
       : typeof rawExt === "string" && rawExt.length > 0
@@ -472,7 +476,8 @@ const getDatasetFilesManifest = async (req, res) => {
     }
 
     const rows = await sequelize.query(
-      `SELECT json->'value'->>'url' AS url
+      `SELECT json->'value'->>'url'  AS url,
+              json->'value'->>'file' AS file
        FROM iolinks
        WHERE dbname = :dbname
          AND dsname = :dsname
@@ -484,15 +489,78 @@ const getDatasetFilesManifest = async (req, res) => {
       }
     );
 
-    const urls = rows.map((r) => r.url).filter(Boolean);
-    const filename = `${dbName}_${dsName}_${exts.join("_")}_manifest.txt`;
+    const files = rows.filter((r) => r.url);
+    const urls = files.map((r) => r.url);
+    const baseName = `${dbName}_${dsName}_${exts.join("_")}`;
+    const extLabel = exts.join(", ");
+
+    // Strip path separators, double quotes and CR/LF from the parsed filename
+    // before using it in shell commands — file names come from iolinks and are
+    // usually content hashes. NOTE(review): `$`, backticks and `%` are not stripped, and r.url is interpolated as-is.
+    const safeName = (s) =>
+      (s || "").replace(/["\\\/\r\n]/g, "").trim();
+
+    let body;
+    let contentType;
+    let filename;
+
+    if (format === "sh") {
+      // Bash script — curl is preinstalled on macOS and most Linux distros.
+      // -L follows redirects, -C - resumes interrupted downloads, -o saves
+      // with our parsed filename (the URL is a CGI query — using -O would
+      // save files as literal `stat.cgi?...`).
+      body =
+        `#!/bin/bash\n` +
+        `# Downloads ${extLabel} files from ${dbName}/${dsName}\n` +
+        `# Usage: bash ${baseName}_download.sh\n` +
+        `set -e\n` +
+        `mkdir -p "neurojson_downloads"\n` +
+        `cd "neurojson_downloads" || exit 1\n` +
+        files
+          .map((r) => {
+            const fn = safeName(r.file);
+            return fn
+              ? `curl -L -C - -o "${fn}" "${r.url}"`
+              : `curl -L -C - -O "${r.url}"`;
+          })
+          .join("\n") +
+        `\necho "Done. Files saved to $(pwd)"\n`;
+      contentType = "application/x-sh; charset=utf-8";
+      filename = `${baseName}_download.sh`;
+    } else if (format === "bat") {
+      // Windows batch — curl ships with Windows 10+. Uses CRLF line endings
+      // for proper rendering in CMD. /d on cd handles cross-drive paths.
+      body =
+        `@echo off\r\n` +
+        `REM Downloads ${extLabel} files from ${dbName}/${dsName}\r\n` +
+        `REM Usage: double-click or run ${baseName}_download.bat\r\n` +
+        `if not exist "neurojson_downloads" mkdir "neurojson_downloads"\r\n` +
+        `cd /d "neurojson_downloads"\r\n` +
+        files
+          .map((r) => {
+            const fn = safeName(r.file);
+            return fn
+              ? `curl -L -C - -o "${fn}" "${r.url}"`
+              : `curl -L -C - -O "${r.url}"`;
+          })
+          .join("\r\n") +
+        `\r\necho Done. Files saved to %cd%\r\n` +
+        `pause\r\n`;
+      contentType = "text/plain; charset=utf-8";
+      filename = `${baseName}_download.bat`;
+    } else {
+      // Default: plain URL list, one per line (advanced users with wget).
+      body = urls.join("\n") + "\n";
+      contentType = "text/plain; charset=utf-8";
+      filename = `${baseName}_manifest.txt`;
+    }
 
-    res.setHeader("Content-Type", "text/plain; charset=utf-8");
+    res.setHeader("Content-Type", contentType);
     res.setHeader(
       "Content-Disposition",
       `attachment; filename="${filename}"`
     );
-    res.send(urls.join("\n") + "\n");
+    res.send(body);
   } catch (error) {
     console.error("Error generating manifest:", error.message);
     res.status(500).send(`Error generating manifest: ${error.message}`);
diff --git a/src/components/SearchPage/DatasetCard.tsx b/src/components/SearchPage/DatasetCard.tsx
index da4e0c7..4243119 100644
--- a/src/components/SearchPage/DatasetCard.tsx
+++ b/src/components/SearchPage/DatasetCard.tsx
@@ -1,4 +1,5 @@
 import DownloadIcon from "@mui/icons-material/Download";
+import KeyboardArrowDownIcon from "@mui/icons-material/KeyboardArrowDown";
 import {
   Typography,
   Card,
@@ -7,11 +8,16 @@ import {
   Chip,
   Button,
   Link as MuiLink,
+  Menu,
+  MenuItem,
+  Box,
+  Snackbar,
+  Alert,
 } from "@mui/material";
 import { baseURL } from "services/instance";
 import { Colors } from "design/theme";
 import React from "react";
-import { useMemo } from "react";
+import { useMemo, useState } from "react";
 import { Link } from "react-router-dom";
 import RoutesEnum from "types/routes.enum";
 
@@ -150,16 +156,44 @@ const DatasetCard: React.FC<DatasetCardProps> = ({
   const { name, readme, modality, subj, info } = parsedJson.value;
   const datasetLink = `${RoutesEnum.DATABASES}/${dbname}/${dsname}`;
 
-  // Manifest URL — backend serves a plain-text list of all matching URLs.
-  const manifestUrl = useMemo(() => {
+  // Build manifest URL for any of the three formats. Backend serves
+  // text/plain for .txt, application/x-sh for .sh, text/plain for .bat —
+  // each with a Content-Disposition header so the browser saves them.
+  const buildManifestUrl = (format: "txt" | "sh" | "bat") => {
     if (!fileTypes || fileTypes.length === 0) return null;
-    const ext = fileTypes
-      .map((e) => encodeURIComponent(e))
-      .join(",");
+    const ext = fileTypes.map((e) => encodeURIComponent(e)).join(",");
     return `${baseURL}/dbs/${encodeURIComponent(
       dbname
-    )}/${encodeURIComponent(dsname)}/files/manifest?ext=${ext}`;
-  }, [dbname, dsname, fileTypes]);
+    )}/${encodeURIComponent(
+      dsname
+    )}/files/manifest?ext=${ext}&format=${format}`;
+  };
+
+  const hasManifest = Array.isArray(fileTypes) && fileTypes.length > 0;
+
+  // Dropdown state for the download format menu.
+  const [downloadMenuEl, setDownloadMenuEl] = useState<HTMLElement | null>(
+    null
+  );
+  // Post-download instruction snackbar. Stays open until user dismisses it
+  // (no autoHideDuration) so researchers have time to read multi-step
+  // instructions.
+  const [downloadHint, setDownloadHint] = useState<
+    "sh" | "bat" | "txt" | null
+  >(null);
+  const handleDownload = (format: "txt" | "sh" | "bat") => {
+    const url = buildManifestUrl(format);
+    setDownloadMenuEl(null);
+    if (!url) return;
+    // Programmatic anchor click triggers the browser's normal download flow
+    // without leaving the current page (window.location would navigate away).
+    const a = document.createElement("a");
+    a.href = url;
+    document.body.appendChild(a);
+    a.click();
+    document.body.removeChild(a);
+    setDownloadHint(format);
+  };
 
   // Extract a short "sub-XXX" tag from a BIDS path like
   // "$.sub-019.ses-1.nirs.sub-019_ses-1_task-MA_run-01_nirs.snirf.SNIRFData..."
@@ -421,23 +455,40 @@ const DatasetCard: React.FC<DatasetCardProps> = ({
                         : matchingFilesTotal
                     })`}
                 </Typography>
-                {manifestUrl && (
-                  <Button
-                    component="a"
-                    href={manifestUrl}
-                    size="small"
-                    variant="outlined"
-                    startIcon={<DownloadIcon />}
-                    sx={{
-                      color: Colors.purple,
-                      borderColor: Colors.purple,
-                      textTransform: "none",
-                    }}
-                  >
-                    Download manifest
-                    {typeof matchingFilesTotal === "number" &&
-                      ` (${matchingFilesTotal} files)`}
-                  </Button>
+                {hasManifest && (
+                  <>
+                    <Button
+                      onClick={(e) => setDownloadMenuEl(e.currentTarget)}
+                      size="small"
+                      variant="outlined"
+                      startIcon={<DownloadIcon />}
+                      endIcon={<KeyboardArrowDownIcon />}
+                      sx={{
+                        color: Colors.purple,
+                        borderColor: Colors.purple,
+                        textTransform: "none",
+                      }}
+                    >
+                      Download all
+                      {typeof matchingFilesTotal === "number" &&
+                        ` (${matchingFilesTotal})`}
+                    </Button>
+                    <Menu
+                      anchorEl={downloadMenuEl}
+                      open={Boolean(downloadMenuEl)}
+                      onClose={() => setDownloadMenuEl(null)}
+                    >
+                      <MenuItem onClick={() => handleDownload("sh")}>
+                        For Mac / Linux (.sh)
+                      </MenuItem>
+                      <MenuItem onClick={() => handleDownload("bat")}>
+                        For Windows (.bat)
+                      </MenuItem>
+                      <MenuItem onClick={() => handleDownload("txt")}>
+                        URL list (.txt, advanced)
+                      </MenuItem>
+                    </Menu>
+                  </>
                 )}
               </Stack>
               <Stack spacing={0.5} component="ul" sx={{ pl: 2, m: 0 }}>
@@ -483,6 +534,82 @@ const DatasetCard: React.FC<DatasetCardProps> = ({
           )}
         </Stack>
       </CardContent>
+
+      {/* Post-download instructions. No auto-hide so users can read at their
+       *  own pace; dismiss with the ✕ when finished. */}
+      <Snackbar
+        open={Boolean(downloadHint)}
+        onClose={() => setDownloadHint(null)}
+        anchorOrigin={{ vertical: "bottom", horizontal: "center" }}
+      >
+        <Alert
+          severity="success"
+          onClose={() => setDownloadHint(null)}
+          sx={{ maxWidth: 520 }}
+        >
+          {downloadHint === "sh" && (
+            <Box>
+              <Typography variant="body2" sx={{ fontWeight: 600, mb: 0.5 }}>
+                Downloaded the Mac / Linux script
+              </Typography>
+              <Typography variant="body2">
+                To fetch your data files:
+              </Typography>
+              <Box component="ol" sx={{ pl: 2.5, mt: 0.5, mb: 0 }}>
+                <li>Open Terminal</li>
+                <li>Go to the folder where the script was saved</li>
+                <li>
+                  Run:{" "}
+                  <Box
+                    component="code"
+                    sx={{
+                      fontFamily: "monospace",
+                      backgroundColor: "rgba(0,0,0,0.06)",
+                      px: 0.5,
+                      borderRadius: 0.5,
+                    }}
+                  >
+                    bash &lt;script-name&gt;.sh
+                  </Box>
+                </li>
+              </Box>
+            </Box>
+          )}
+          {downloadHint === "bat" && (
+            <Box>
+              <Typography variant="body2" sx={{ fontWeight: 600, mb: 0.5 }}>
+                Downloaded the Windows script
+              </Typography>
+              <Typography variant="body2">
+                Open the folder where the script was saved and{" "}
+                <strong>double-click the .bat file</strong>. A command window
+                opens and the files download next to it.
+              </Typography>
+            </Box>
+          )}
+          {downloadHint === "txt" && (
+            <Box>
+              <Typography variant="body2" sx={{ fontWeight: 600, mb: 0.5 }}>
+                Downloaded the URL list
+              </Typography>
+              <Typography variant="body2">
+                In a terminal with wget installed (in Windows PowerShell use wget.exe), run:{" "}
+                <Box
+                  component="code"
+                  sx={{
+                    fontFamily: "monospace",
+                    backgroundColor: "rgba(0,0,0,0.06)",
+                    px: 0.5,
+                    borderRadius: 0.5,
+                  }}
+                >
+                  wget -i &lt;file-name&gt;.txt
+                </Box>
+              </Typography>
+            </Box>
+          )}
+        </Alert>
+      </Snackbar>
     </Card>
   );
 };

From 8be3fa1af653de11aedc926130f7a054a2d09bf2 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 15 May 2026 14:15:49 -0400
Subject: [PATCH 37/61] fix(dataset-detail): keep all downloaded files in one
 visible folder

---
 src/pages/UpdatedDatasetDetailPage.tsx | 19 ++++++++++++++-----
 1 file changed, 14 insertions(+), 5 deletions(-)

diff --git a/src/pages/UpdatedDatasetDetailPage.tsx b/src/pages/UpdatedDatasetDetailPage.tsx
index f94a751..734c104 100644
--- a/src/pages/UpdatedDatasetDetailPage.tsx
+++ b/src/pages/UpdatedDatasetDetailPage.tsx
@@ -577,8 +577,17 @@ const UpdatedDatasetDetailPage: React.FC = () => {
       //   });
       //   setJsonSize(blob.size);
 
-      //  Construct download script dynamically
-      let script = `curl -L --create-dirs "https://neurojson.io:7777/${dbName}/${docId}" -o "${docId}.json"\n`;
+      //  Construct download script dynamically — everything lands in a
+      //  ./<docId>/ folder next to where the user runs the script, so the
+      //  JSON and the data files stay together (was split between cwd and
+      //  ~/.neurojson/io/... previously, hard to find).
+      let script = `#!/bin/bash\n`;
+      script += `# Downloads ${docId} from ${dbName}\n`;
+      script += `# Usage: bash ${docId}.sh\n`;
+      script += `set -e\n`;
+      script += `mkdir -p "${docId}"\n`;
+      script += `cd "${docId}" || exit 1\n`;
+      script += `curl -L -C - -o "${docId}.json" "https://neurojson.io:7777/${dbName}/${docId}"\n`;
 
       links.forEach((link) => {
         const url = link.url;
@@ -594,10 +603,10 @@ const UpdatedDatasetDetailPage: React.FC = () => {
             })()
           : `file-${link.index}`;
 
-        const outputPath = `$HOME/.neurojson/io/${dbName}/${docId}/${filename}`;
-
-        script += `curl -L --create-dirs "${url}" -o "${outputPath}"\n`;
+        script += `curl -L -C - -o "${filename}" "${url}"\n`;
       });
+
+      script += `echo "Done. Files saved to $(pwd)"\n`;
       setDownloadScript(script);
       // Calculate and set script size
       const scriptBlob = new Blob([script], { type: "text/plain" });

From e21c661760d3061f2b18540043c8952c60a259fa Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 15 May 2026 14:24:22 -0400
Subject: [PATCH 38/61] feat(dataset-detail): three script formats for download
 all files button

---
 src/pages/UpdatedDatasetDetailPage.tsx | 223 ++++++++++++++++++++-----
 1 file changed, 183 insertions(+), 40 deletions(-)

diff --git a/src/pages/UpdatedDatasetDetailPage.tsx b/src/pages/UpdatedDatasetDetailPage.tsx
index 734c104..835a6b5 100644
--- a/src/pages/UpdatedDatasetDetailPage.tsx
+++ b/src/pages/UpdatedDatasetDetailPage.tsx
@@ -7,6 +7,7 @@ import ExpandLess from "@mui/icons-material/ExpandLess";
 import ExpandMore from "@mui/icons-material/ExpandMore";
 import HomeIcon from "@mui/icons-material/Home";
 import InfoOutlinedIcon from "@mui/icons-material/InfoOutlined";
+import KeyboardArrowDownIcon from "@mui/icons-material/KeyboardArrowDown";
 import {
   Box,
   Typography,
@@ -17,6 +18,9 @@ import {
   Collapse,
   Tooltip,
   IconButton,
+  Menu,
+  MenuItem,
+  Snackbar,
 } from "@mui/material";
 import DatasetActions from "components/DatasetDetailPage/DatasetAction";
 import FileTree from "components/DatasetDetailPage/FileTree/FileTree";
@@ -267,8 +271,23 @@ const UpdatedDatasetDetailPage: React.FC = () => {
   const [externalLinks, setExternalLinks] = useState<ExternalDataLink[]>([]);
   const [internalLinks, setInternalLinks] = useState<InternalDataLink[]>([]);
   const [isInternalExpanded, setIsInternalExpanded] = useState(true);
-  const [downloadScript, setDownloadScript] = useState<string>("");
+  // Three script formats generated client-side: bash (Mac/Linux), batch
+  // (Windows), and a plain URL list. Same files in all three; only the
+  // wrapper syntax differs.
+  const [downloadScripts, setDownloadScripts] = useState<{
+    sh: string;
+    bat: string;
+    txt: string;
+  }>({ sh: "", bat: "", txt: "" });
   const [downloadScriptSize, setDownloadScriptSize] = useState<number>(0);
+  // Dropdown state for the download format menu.
+  const [downloadMenuEl, setDownloadMenuEl] = useState<HTMLElement | null>(
+    null
+  );
+  // Post-download instruction snackbar. Stays open until user dismisses.
+  const [downloadHint, setDownloadHint] = useState<
+    "sh" | "bat" | "txt" | null
+  >(null);
   const [totalFileSize, setTotalFileSize] = useState<number>(0);
   const [previewIsInternal, setPreviewIsInternal] = useState(false);
   const [isExternalExpanded, setIsExternalExpanded] = useState(true);
@@ -577,40 +596,62 @@ const UpdatedDatasetDetailPage: React.FC = () => {
       //   });
       //   setJsonSize(blob.size);
 
-      //  Construct download script dynamically — everything lands in a
-      //  ./<docId>/ folder next to where the user runs the script, so the
-      //  JSON and the data files stay together (was split between cwd and
-      //  ~/.neurojson/io/... previously, hard to find).
-      let script = `#!/bin/bash\n`;
-      script += `# Downloads ${docId} from ${dbName}\n`;
-      script += `# Usage: bash ${docId}.sh\n`;
-      script += `set -e\n`;
-      script += `mkdir -p "${docId}"\n`;
-      script += `cd "${docId}" || exit 1\n`;
-      script += `curl -L -C - -o "${docId}.json" "https://neurojson.io:7777/${dbName}/${docId}"\n`;
-
-      links.forEach((link) => {
-        const url = link.url;
-        const match = url.match(/file=([^&]+)/);
-
-        const filename = match
-          ? (() => {
-              try {
-                return decodeURIComponent(match[1]);
-              } catch {
-                return match[1]; // fallback if decode fails
-              }
-            })()
-          : `file-${link.index}`;
-
-        script += `curl -L -C - -o "${filename}" "${url}"\n`;
-      });
-
-      script += `echo "Done. Files saved to $(pwd)"\n`;
-      setDownloadScript(script);
-      // Calculate and set script size
-      const scriptBlob = new Blob([script], { type: "text/plain" });
-      setDownloadScriptSize(scriptBlob.size);
+      //  Construct download scripts (three formats) dynamically — everything
+      //  lands in a ./<docId>/ folder next to where the user runs the script.
+      //  JSON metadata and data files stay together (was split between cwd
+      //  and ~/.neurojson/io/... previously, hard to find).
+      const docUrl = `https://neurojson.io:7777/${dbName}/${docId}`;
+      type DlItem = { url: string; filename: string };
+      const items: DlItem[] = [
+        { url: docUrl, filename: `${docId}.json` },
+        ...links.map((link) => {
+          const match = link.url.match(/file=([^&]+)/);
+          const filename = match
+            ? (() => {
+                try {
+                  return decodeURIComponent(match[1]);
+                } catch {
+                  return match[1];
+                }
+              })()
+            : `file-${link.index}`;
+          return { url: link.url, filename };
+        }),
+      ];
+
+      // Bash script (Mac/Linux)
+      const sh =
+        `#!/bin/bash\n` +
+        `# Downloads ${docId} from ${dbName}\n` +
+        `# Usage: bash ${docId}.sh\n` +
+        `set -e\n` +
+        `mkdir -p "${docId}"\n` +
+        `cd "${docId}" || exit 1\n` +
+        items
+          .map((it) => `curl -L -C - -o "${it.filename}" "${it.url}"`)
+          .join("\n") +
+        `\necho "Done. Files saved to $(pwd)"\n`;
+
+      // Batch script (Windows 10+ ships curl). CRLF endings; cmd needs "%" as "%%".
+      const bat =
+        `@echo off\r\n` +
+        `REM Downloads ${docId} from ${dbName}\r\n` +
+        `REM Usage: double-click or run ${docId}.bat\r\n` +
+        `if not exist "${docId}" mkdir "${docId}"\r\n` +
+        `cd /d "${docId}"\r\n` +
+        items
+          .map((it) => `curl -L -C - -o "${it.filename}" "${it.url}"`.replace(/%/g, "%%"))
+          .join("\r\n") +
+        `\r\necho Done. Files saved to %cd%\r\n` +
+        `pause\r\n`;
+
+      // Plain URL list — for advanced users with wget.
+      const txt = items.map((it) => it.url).join("\n") + "\n";
+
+      setDownloadScripts({ sh, bat, txt });
+      // Size shown on the button is the .sh script size (representative).
+      const shBlob = new Blob([sh], { type: "text/plain" });
+      setDownloadScriptSize(shBlob.size);
     }
   }, [datasetDocument, docId]);
 
@@ -636,14 +677,25 @@ const UpdatedDatasetDetailPage: React.FC = () => {
     document.body.removeChild(link);
   };
 
-  const handleDownloadScript = () => {
-    const blob = new Blob([downloadScript], { type: "text/plain" });
+  // Trigger download of the selected script format via a programmatic anchor
+  // click (no navigation). The menu is closed first, even when nothing is sent.
+  const handleDownloadScript = (format: "sh" | "bat" | "txt") => {
+    setDownloadMenuEl(null);
+    const content = downloadScripts[format];
+    if (!content) return;
+    const mime =
+      format === "sh" ? "application/x-sh" : "text/plain";
+    const filename =
+      format === "txt" ? `${docId}_manifest.txt` : `${docId}.${format}`;
+    const blob = new Blob([content], { type: `${mime}; charset=utf-8` });
     const link = document.createElement("a");
     link.href = URL.createObjectURL(blob);
-    link.download = `${docId}.sh`;
+    link.download = filename;
     document.body.appendChild(link);
     link.click();
     document.body.removeChild(link);
+    URL.revokeObjectURL(link.href);
+    setDownloadHint(format);
   };
 
   const handlePreview = (
@@ -1127,20 +1179,35 @@ const UpdatedDatasetDetailPage: React.FC = () => {
             <Button
               variant="contained"
               startIcon={<DescriptionIcon />}
-              onClick={handleDownloadScript}
+              endIcon={<KeyboardArrowDownIcon />}
+              onClick={(e) => setDownloadMenuEl(e.currentTarget)}
               sx={{
                 backgroundColor: Colors.purple,
                 color: Colors.lightGray,
                 "&:hover": { backgroundColor: Colors.secondaryPurple },
               }}
             >
-              {/* Script to Download All Files ({downloadScript.length} Bytes) */}
               Script to Download All Files ({formatSize(downloadScriptSize)})
               {externalLinks.length > 0 &&
                 ` (links: ${externalLinks.length}, total: ${formatSize(
                   totalFileSize
                 )})`}
             </Button>
+            <Menu
+              anchorEl={downloadMenuEl}
+              open={Boolean(downloadMenuEl)}
+              onClose={() => setDownloadMenuEl(null)}
+            >
+              <MenuItem onClick={() => handleDownloadScript("sh")}>
+                For Mac / Linux (.sh)
+              </MenuItem>
+              <MenuItem onClick={() => handleDownloadScript("bat")}>
+                For Windows (.bat)
+              </MenuItem>
+              <MenuItem onClick={() => handleDownloadScript("txt")}>
+                URL list (.txt, advanced)
+              </MenuItem>
+            </Menu>
           </Box>
         </Box>
 
@@ -1667,6 +1734,82 @@ const UpdatedDatasetDetailPage: React.FC = () => {
           key={`${previewIndex}-${previewOpen}`} // react will destroy the existing component and create a new one for mount
         />
       </Box>
+
+      {/* Post-download instructions. No auto-hide so users can read at
+       *  their own pace; dismiss with the ✕ when finished. */}
+      <Snackbar
+        open={Boolean(downloadHint)}
+        onClose={() => setDownloadHint(null)}
+        anchorOrigin={{ vertical: "bottom", horizontal: "center" }}
+      >
+        <Alert
+          severity="success"
+          onClose={() => setDownloadHint(null)}
+          sx={{ maxWidth: 520 }}
+        >
+          {downloadHint === "sh" && (
+            <Box>
+              <Typography variant="body2" sx={{ fontWeight: 600, mb: 0.5 }}>
+                Downloaded the Mac / Linux script
+              </Typography>
+              <Typography variant="body2">
+                To fetch your data files:
+              </Typography>
+              <Box component="ol" sx={{ pl: 2.5, mt: 0.5, mb: 0 }}>
+                <li>Open Terminal</li>
+                <li>Go to the folder where the script was saved</li>
+                <li>
+                  Run:{" "}
+                  <Box
+                    component="code"
+                    sx={{
+                      fontFamily: "monospace",
+                      backgroundColor: "rgba(0,0,0,0.06)",
+                      px: 0.5,
+                      borderRadius: 0.5,
+                    }}
+                  >
+                    bash &lt;script-name&gt;.sh
+                  </Box>
+                </li>
+              </Box>
+            </Box>
+          )}
+          {downloadHint === "bat" && (
+            <Box>
+              <Typography variant="body2" sx={{ fontWeight: 600, mb: 0.5 }}>
+                Downloaded the Windows script
+              </Typography>
+              <Typography variant="body2">
+                Open the folder where the script was saved and{" "}
+                <strong>double-click the .bat file</strong>. A command
+                window opens and the files download next to it.
+              </Typography>
+            </Box>
+          )}
+          {downloadHint === "txt" && (
+            <Box>
+              <Typography variant="body2" sx={{ fontWeight: 600, mb: 0.5 }}>
+                Downloaded the URL list
+              </Typography>
+              <Typography variant="body2">
+                In a terminal with wget installed (in Windows PowerShell use wget.exe), run:{" "}
+                <Box
+                  component="code"
+                  sx={{
+                    fontFamily: "monospace",
+                    backgroundColor: "rgba(0,0,0,0.06)",
+                    px: 0.5,
+                    borderRadius: 0.5,
+                  }}
+                >
+                  wget -i &lt;file-name&gt;.txt
+                </Box>
+              </Typography>
+            </Box>
+          )}
+        </Alert>
+      </Snackbar>
     </>
   );
 };

From 909cd36172343cf1b86492bae3c5d70174ce2558 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 20 May 2026 16:39:16 -0400
Subject: [PATCH 39/61] feat(sync): pull database list from registry

---
 backend/sync/incrementalSync.js | 48 +++++++--------------------------
 1 file changed, 9 insertions(+), 39 deletions(-)

diff --git a/backend/sync/incrementalSync.js b/backend/sync/incrementalSync.js
index b9e497a..55c5e90 100644
--- a/backend/sync/incrementalSync.js
+++ b/backend/sync/incrementalSync.js
@@ -8,34 +8,13 @@ const COUCHDB_URL = process.env.COUCHDB_URL || "https://neurojson.io:7777";
 const CONCURRENCY = 5;
 
 // fetch database list dynamically from registry
+// registry doc shape: { database: [{ id, name, ... }, ...] }
 async function getDatabases() {
-  try {
-    const response = await axios.get(`${COUCHDB_URL}/sys/registry`);
-    const databases = response.data
-      .map((db) => db.id)
-      .filter((id) => id && id !== "sys");
-    console.log(`Found ${databases.length} databases in registry`);
-    return databases;
-  } catch (err) {
-    console.error("Failed to fetch registry:", err.message);
-    return [
-      "openneuro",
-      "abide",
-      "abide2",
-      "datalad-registry",
-      "adhd200",
-      "bfnirs",
-      "mcx",
-      "mmc",
-      "ucl-4d-neonatal-head-model",
-      "unc-012-infant-atlas",
-      "unc-infant-cortical-surface-atlas",
-      "cotilab",
-      "emnist",
-      "nemo-bids",
-      "openfnirs",
-    ];
-  }
+  const response = await axios.get(`${COUCHDB_URL}/sys/registry`);
+  const entries = response.data?.database || [];
+  const databases = entries.map((db) => db.id).filter(Boolean);
+  console.log(`Found ${databases.length} databases in registry`);
+  return databases;
 }
 
 // === Local ports of CouchDB _design/qq map functions ===
@@ -43,8 +22,7 @@ async function getDatabases() {
 // these drift silently.
 
 function transformDbinfo(doc) {
-  const txt =
-    doc["README"] || doc["README.md"] || doc["README.rst"] || "";
+  const txt = doc["README"] || doc["README.md"] || doc["README.rst"] || "";
   const rawtext = JSON.stringify(doc);
   const datainfo = doc["dataset_description.json"] || { Name: doc._id };
   const subjlist = [];
@@ -541,9 +519,7 @@ async function incrementalSync(dbname, lastSeq) {
             await processDatasetUpdate(dbname, change.id);
           }
         } catch (err) {
-          console.error(
-            `  ${dbname}/${change.id}: failed - ${err.message}`
-          );
+          console.error(`  ${dbname}/${change.id}: failed - ${err.message}`);
         }
       })
     );
@@ -587,13 +563,7 @@ async function runSync() {
   console.log(new Date().toISOString());
   console.log(`CouchDB: ${COUCHDB_URL}`);
 
-  // change to await getDatabases() when ready for full sync
-  const databases = [
-    "bfnirs",           // NIRS — .snirf, .jdb
-    "brainmeshlibrary", // mesh + atlas — .jmsh, .jnii (318 datasets)
-    "cotilab",          // JData — small (6 datasets)
-    "abide",            // BIDS MRI — .nii.gz, .tsv, .json (25 datasets)
-  ];
+  const databases = await getDatabases();
   console.log(`Databases: ${databases.length}`);
 
   for (const db of databases) {

From 0cee8b6c221002d6d49c3f7748f0159d62906585 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Thu, 21 May 2026 11:43:56 -0400
Subject: [PATCH 40/61] feat(search): add dataset-level modality filter with
 AND/OR mode

---
 backend/src/controllers/couchdb.controller.js | 24 +++++
 backend/sync/incrementalSync.js               | 14 ++-
 src/pages/SearchPage.tsx                      | 97 ++++++++++++++++++-
 .../SearchPageFunctions/generateUiSchema.ts   |  8 ++
 .../SearchPageFunctions/searchformSchema.ts   | 15 +++
 5 files changed, 151 insertions(+), 7 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index c990fe7..3700fc8 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -207,6 +207,30 @@ const searchAllDatabases = async (req, res) => {
       repl.modality = mod;
     }
 
+    // Dataset-level modality filter (multi-select + AND/OR).
+    // Queries json->'modality' on dbinfo rows, not subjects rows.
+    if (Array.isArray(f.modalities) && f.modalities.length > 0) {
+      const op = f.modality_mode === "and" ? " AND " : " OR ";
+      const parts = f.modalities.map((m, i) => {
+        repl[`dmod${i}`] = String(m);
+        return isSubjectSearch
+          ? `dsi.json->'modality' ? :dmod${i}`
+          : `json->'modality' ? :dmod${i}`;
+      });
+      const condition = `(${parts.join(op)})`;
+      if (isSubjectSearch) {
+        where.push(`EXISTS (
+          SELECT 1 FROM ioviews dsi
+          WHERE dsi.dbname = ioviews.dbname
+            AND dsi.dsname = ioviews.dsname
+            AND dsi.view = 'dbinfo'
+            AND ${condition}
+        )`);
+      } else {
+        where.push(condition);
+      }
+    }
+
     // db / ds / subj filters
     if (isFilter(f.database)) {
       where.push(`dbname = :dbname`);
diff --git a/backend/sync/incrementalSync.js b/backend/sync/incrementalSync.js
index 55c5e90..50fbad5 100644
--- a/backend/sync/incrementalSync.js
+++ b/backend/sync/incrementalSync.js
@@ -303,7 +303,15 @@ async function saveLastSeq(dbname, seq) {
   );
 }
 
+// Postgres jsonb rejects the \u0000 escape (seen in openneuro README/TSV
+// fields), so drop it from the serialized JSON. Escaped backslashes match
+// first so literal backslash + "u0000" text is not mistaken for a NUL escape.
+function safeStringify(obj) {
+  return JSON.stringify(obj).replace(/\\\\|\\u0000/g, (m) => (m === "\\\\" ? m : ""));
+}
+
 async function upsertIoview(dbname, dsname, subj, view, json, transaction) {
+  const payload = safeStringify(json);
   await sequelize.query(
     `INSERT INTO ioviews (dbname, dsname, subj, view, json, search_vector, updated_at)
      VALUES (:dbname, :dsname, :subj, :view, :json, to_tsvector('english', :text), NOW())
@@ -317,8 +325,8 @@ async function upsertIoview(dbname, dsname, subj, view, json, transaction) {
         dsname,
         subj: String(subj),
         view,
-        json: JSON.stringify(json),
-        text: JSON.stringify(json),
+        json: payload,
+        text: payload,
       },
       transaction,
     }
@@ -335,7 +343,7 @@ async function insertIolink(dbname, dsname, subj, view, json, transaction) {
         dsname,
         subj: String(subj),
         view,
-        json: JSON.stringify(json),
+        json: safeStringify(json),
       },
       transaction,
     }
diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index 397e63a..ddd5137 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -16,6 +16,11 @@ import {
   Slider,
   Stack,
   TextField,
+  ToggleButton,
+  ToggleButtonGroup,
+  FormGroup,
+  FormControlLabel,
+  Checkbox,
 } from "@mui/material";
 import { useTheme } from "@mui/material/styles";
 import useMediaQuery from "@mui/material/useMediaQuery";
@@ -57,6 +62,80 @@ type RegistryItem = {
 const AGE_MIN_BOUND = 0;
 const AGE_MAX_BOUND = 100;
 
+const DATASET_MODALITIES = [
+  "anat", "func", "dwi", "fmap", "perf",
+  "meg", "eeg", "ieeg", "beh", "pet",
+  "micr", "nirs", "motion", "ephys", "atlas",
+  "JMesh", "JNIFTI", "JSNIRF", "JData",
+];
+
+const DatasetModalityFilterField = (props: any) => {
+  const ctx = props?.registry?.formContext as
+    | { formData: Record<string, any>; setFormData: React.Dispatch<React.SetStateAction<Record<string, any>>> }
+    | undefined;
+  if (!ctx) return null;
+  const { formData, setFormData } = ctx;
+  const selected: string[] = Array.isArray(formData.modalities) ? formData.modalities : [];
+  const mode: string = formData.modality_mode || "or";
+
+  const toggle = (code: string) => {
+    setFormData((prev) => {
+      const cur: string[] = Array.isArray(prev.modalities) ? prev.modalities : [];
+      const next = cur.includes(code) ? cur.filter((m) => m !== code) : [...cur, code];
+      const updated = { ...prev };
+      if (next.length === 0) {
+        delete updated.modalities;
+        delete updated.modality_mode;
+      } else {
+        updated.modalities = next;
+        if (!updated.modality_mode) updated.modality_mode = "or";
+      }
+      return updated;
+    });
+  };
+
+  const handleModeChange = (_: any, val: string | null) => {
+    if (!val) return;
+    setFormData((prev) => ({ ...prev, modality_mode: val }));
+  };
+
+  return (
+    <Box sx={{ mt: 1, mb: 1, p: 1, borderRadius: 1, backgroundColor: selected.length > 0 ? "#e8f4fd" : "transparent" }}>
+      <Typography variant="body2" sx={{ fontWeight: 500, mb: 0.5 }}>
+        Dataset modalities
+      </Typography>
+      <FormGroup row>
+        {DATASET_MODALITIES.map((code) => (
+          <FormControlLabel
+            key={code}
+            control={
+              <Checkbox
+                size="small"
+                checked={selected.includes(code)}
+                onChange={() => toggle(code)}
+                sx={{ py: 0.25 }}
+              />
+            }
+            label={<Typography variant="body2">{code}</Typography>}
+            sx={{ mr: 1 }}
+          />
+        ))}
+      </FormGroup>
+      {selected.length > 1 && (
+        <Box sx={{ mt: 1, display: "flex", alignItems: "center", gap: 1 }}>
+          <ToggleButtonGroup size="small" value={mode} exclusive onChange={handleModeChange}>
+            <ToggleButton value="or" sx={{ px: 2, py: 0.25 }}>OR</ToggleButton>
+            <ToggleButton value="and" sx={{ px: 2, py: 0.25 }}>AND</ToggleButton>
+          </ToggleButtonGroup>
+          <Typography variant="caption" sx={{ color: "text.secondary" }}>
+            {mode === "and" ? "must have all selected" : "must have any selected"}
+          </Typography>
+        </Box>
+      )}
+    </Box>
+  );
+};
+
 const AgeRangeSliderField = (props: any) => {
   const ctx = props?.registry?.formContext as
     | {
@@ -239,10 +318,12 @@ const SearchPage: React.FC = () => {
     ([key, value]) =>
       key !== "skip" &&
       key !== "limit" &&
+      key !== "modality_mode" &&
       value !== undefined &&
       value !== null &&
       value !== "" &&
-      value !== "any"
+      value !== "any" &&
+      !(Array.isArray(value) && value.length === 0)
   );
 
   useEffect(() => {
@@ -381,6 +462,7 @@ const SearchPage: React.FC = () => {
     ),
     ageRangeSlider: AgeRangeSliderField,
     countRangePair: CountRangePairField,
+    datasetModalityFilter: DatasetModalityFilterField,
   };
 
   // determine the results are subject-level or dataset-level
@@ -685,10 +767,16 @@ const SearchPage: React.FC = () => {
                 mt: 1,
               }}
             >
-              {activeFilters.map(([key, value]) => (
+              {activeFilters.map(([key, value]) => {
+                let label = `${String(key)}: ${String(value)}`;
+                if (key === "modalities" && Array.isArray(value)) {
+                  const mode = appliedFilters.modality_mode || "or";
+                  label = `modalities (${mode}): ${value.join(", ")}`;
+                }
+                return (
                 <Chip
                   key={key}
-                  label={`${String(key)}: ${String(value)}`}
+                  label={label}
                   variant="outlined"
                   sx={{
                     color: Colors.darkPurple,
@@ -736,7 +824,8 @@ const SearchPage: React.FC = () => {
                     }
                   }}
                 />
-              ))}
+                );
+              })}
             </Box>
           )}
 
diff --git a/src/utils/SearchPageFunctions/generateUiSchema.ts b/src/utils/SearchPageFunctions/generateUiSchema.ts
index 152a056..46dc215 100644
--- a/src/utils/SearchPageFunctions/generateUiSchema.ts
+++ b/src/utils/SearchPageFunctions/generateUiSchema.ts
@@ -51,6 +51,9 @@ export const generateUiSchema = (
       "database",
       "keyword",
       "file_type", // dataset-level: filters by file extensions in iolinks
+      "dataset_modality_filter", // dataset-level: modality multi-select + AND/OR
+      "modalities",
+      "modality_mode",
       "subject_filters_toggle",
       "age_range_slider", // top of subject filters — range slider for age
       "modality",
@@ -106,6 +109,11 @@ export const generateUiSchema = (
           },
         }
       : datasetHiddenStyle,
+    dataset_modality_filter: showDatasetFilters
+      ? { "ui:field": "datasetModalityFilter" }
+      : datasetHiddenStyle,
+    modalities: invisibleStyle,
+    modality_mode: invisibleStyle,
     limit: invisibleStyle,
     skip: invisibleStyle,
 
diff --git a/src/utils/SearchPageFunctions/searchformSchema.ts b/src/utils/SearchPageFunctions/searchformSchema.ts
index e122725..3674cdd 100644
--- a/src/utils/SearchPageFunctions/searchformSchema.ts
+++ b/src/utils/SearchPageFunctions/searchformSchema.ts
@@ -134,6 +134,21 @@ export const baseSchema: JSONSchema7 = {
       items: { type: "string" },
       uniqueItems: true,
     },
+    dataset_modality_filter: {
+      type: "null",
+      title: "",
+    },
+    modalities: {
+      type: "array",
+      title: "Dataset modalities",
+      items: { type: "string" },
+      uniqueItems: true,
+    },
+    modality_mode: {
+      type: "string",
+      title: "Modality match mode",
+      default: "or",
+    },
     session_name: {
       title: "Session keywords",
       type: "string",

From 601d90be7e248ed6e1b977883a6f456f715ab8e3 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 22 May 2026 10:10:44 -0400
Subject: [PATCH 41/61] feat(search): add tooltip to Subject-Level Filters
 explaining result type

---
 src/pages/SearchPage.tsx | 18 +++++++++++++++++-
 1 file changed, 17 insertions(+), 1 deletion(-)

diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index ddd5137..765e308 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -427,7 +427,7 @@ const SearchPage: React.FC = () => {
   // Create the "Subject-level Filters" button as a custom field
   const customFields = {
     subjectFiltersToggle: () => (
-      <Box sx={{ mt: 2, mb: 1 }}>
+      <Box sx={{ mt: 2, mb: 1, display: "flex", alignItems: "center", gap: 1 }}>
         <Button
           variant="outlined"
           onClick={() => setShowSubjectFilters((prev) => !prev)}
@@ -442,6 +442,22 @@ const SearchPage: React.FC = () => {
         >
           Subject-Level Filters
         </Button>
+        <Tooltip
+          title="Applying any filter here returns subject-level results."
+          componentsProps={{
+            tooltip: {
+              sx: {
+                backgroundColor: "white",
+                color: Colors.darkPurple,
+                boxShadow: 1,
+              },
+            },
+          }}
+        >
+          <IconButton size="small" sx={{ color: Colors.purple }}>
+            <InfoOutlinedIcon fontSize="small" />
+          </IconButton>
+        </Tooltip>
       </Box>
     ),
     datasetFiltersToggle: () => (

From 5aab8089f330c52d3ce592af07ba8f2152f04815 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 22 May 2026 10:24:34 -0400
Subject: [PATCH 42/61] fix(sync): reject malformed file extensions from
 CouchDB links view

---
 backend/sync/incrementalSync.js | 18 +++++++++++++++++-
 1 file changed, 17 insertions(+), 1 deletion(-)

diff --git a/backend/sync/incrementalSync.js b/backend/sync/incrementalSync.js
index 50fbad5..766f1a5 100644
--- a/backend/sync/incrementalSync.js
+++ b/backend/sync/incrementalSync.js
@@ -310,6 +310,19 @@ function safeStringify(obj) {
   return JSON.stringify(obj).replace(/\\u0000/g, "");
 }
 
+// A valid file type is a dot-prefixed extension with no slashes and
+// a reasonable length. Some CouchDB links view rows (e.g. openneuro)
+// emit paths like ".0/libraries/FID-A/..." where the version number
+// gets parsed as a fake extension — reject those.
+function isValidFileType(ext) {
+  return (
+    typeof ext === "string" &&
+    ext.startsWith(".") &&
+    !ext.includes("/") &&
+    ext.length <= 20
+  );
+}
+
 async function upsertIoview(dbname, dsname, subj, view, json, transaction) {
   const payload = safeStringify(json);
   await sequelize.query(
@@ -401,15 +414,18 @@ async function firstSync(dbname) {
   console.log(`  ${dbname}: subjects synced (${subjectRows.length} rows)`);
 
   const linkRows = await fetchView(dbname, "links");
+  let linkCount = 0;
   for (const row of linkRows) {
     const fileType = row.key?.[0];
+    if (!isValidFileType(fileType)) continue;
     const subjId = String(row.key?.[1] || "");
     await insertIolink(dbname, row.id, subjId, fileType, {
       key: row.key,
       value: row.value,
     });
+    linkCount++;
   }
-  console.log(`  ${dbname}: links synced (${linkRows.length} rows)`);
+  console.log(`  ${dbname}: links synced (${linkCount}/${linkRows.length} rows)`);
 }
 
 // === Process one changed dataset (Option A: 2 HTTP requests + local transforms) ===

From f834a4740a5d912203d3b8ebe791049de23f3abe Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 25 May 2026 07:34:16 -0400
Subject: [PATCH 43/61] style(search): match dataset modality filter UI to file
 types field

---
 src/pages/SearchPage.tsx | 54 +++++++++++++++++++++-------------------
 1 file changed, 28 insertions(+), 26 deletions(-)

diff --git a/src/pages/SearchPage.tsx b/src/pages/SearchPage.tsx
index 765e308..df49761 100644
--- a/src/pages/SearchPage.tsx
+++ b/src/pages/SearchPage.tsx
@@ -18,9 +18,7 @@ import {
   TextField,
   ToggleButton,
   ToggleButtonGroup,
-  FormGroup,
-  FormControlLabel,
-  Checkbox,
+  Autocomplete,
 } from "@mui/material";
 import { useTheme } from "@mui/material/styles";
 import useMediaQuery from "@mui/material/useMediaQuery";
@@ -78,10 +76,8 @@ const DatasetModalityFilterField = (props: any) => {
   const selected: string[] = Array.isArray(formData.modalities) ? formData.modalities : [];
   const mode: string = formData.modality_mode || "or";
 
-  const toggle = (code: string) => {
+  const handleChange = (_: any, next: string[]) => {
     setFormData((prev) => {
-      const cur: string[] = Array.isArray(prev.modalities) ? prev.modalities : [];
-      const next = cur.includes(code) ? cur.filter((m) => m !== code) : [...cur, code];
       const updated = { ...prev };
       if (next.length === 0) {
         delete updated.modalities;
@@ -100,27 +96,33 @@ const DatasetModalityFilterField = (props: any) => {
   };
 
   return (
-    <Box sx={{ mt: 1, mb: 1, p: 1, borderRadius: 1, backgroundColor: selected.length > 0 ? "#e8f4fd" : "transparent" }}>
-      <Typography variant="body2" sx={{ fontWeight: 500, mb: 0.5 }}>
-        Dataset modalities
-      </Typography>
-      <FormGroup row>
-        {DATASET_MODALITIES.map((code) => (
-          <FormControlLabel
-            key={code}
-            control={
-              <Checkbox
-                size="small"
-                checked={selected.includes(code)}
-                onChange={() => toggle(code)}
-                sx={{ py: 0.25 }}
-              />
-            }
-            label={<Typography variant="body2">{code}</Typography>}
-            sx={{ mr: 1 }}
+    <Box sx={{ mt: 1, mb: 1 }}>
+      <Autocomplete
+        multiple
+        options={DATASET_MODALITIES}
+        value={selected}
+        onChange={handleChange}
+        renderTags={(items, getTagProps) =>
+          items.map((item, index) => (
+            <Chip
+              variant="outlined"
+              label={item}
+              size="small"
+              {...getTagProps({ index })}
+              key={item}
+            />
+          ))
+        }
+        renderInput={(params) => (
+          <TextField
+            {...params}
+            label="Dataset modalities"
+            placeholder={selected.length === 0 ? "e.g. eeg, nirs" : ""}
+            size="small"
+            fullWidth
           />
-        ))}
-      </FormGroup>
+        )}
+      />
       {selected.length > 1 && (
         <Box sx={{ mt: 1, display: "flex", alignItems: "center", gap: 1 }}>
           <ToggleButtonGroup size="small" value={mode} exclusive onChange={handleModeChange}>

From faf548ff118a7126fe8fa496bf83c11788cbe20a Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 26 May 2026 14:53:39 -0400
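Subject: [PATCH 44/61] fix(search): resolve relative-path iolinks URLs for
 openneuro file links

Also refreshes yarn.lock: axios 1.9.0 -> 1.16.1 and react-router /
react-router-dom 6.30.1 -> 6.30.3, together with their transitive
dependencies (@remix-run/router, follow-redirects, form-data,
proxy-from-env, es-object-atoms, hasown).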

---
 backend/src/controllers/couchdb.controller.js |  6 +-
 src/components/SearchPage/DatasetCard.tsx     | 14 +++-
 yarn.lock                                     | 78 ++++++++++---------
 3 files changed, 60 insertions(+), 38 deletions(-)

diff --git a/backend/src/controllers/couchdb.controller.js b/backend/src/controllers/couchdb.controller.js
index 3700fc8..ab12d0f 100644
--- a/backend/src/controllers/couchdb.controller.js
+++ b/backend/src/controllers/couchdb.controller.js
@@ -513,7 +513,11 @@ const getDatasetFilesManifest = async (req, res) => {
       }
     );
 
-    const files = rows.filter((r) => r.url);
+    const resolveUrl = (url) => {
+      if (!url || url.startsWith("http")) return url;
+      return `https://neurojson.org/io/stat.cgi?action=get&db=${dbName}&doc=${dsName}&${url}`;
+    };
+    const files = rows.filter((r) => r.url).map((r) => ({ ...r, url: resolveUrl(r.url) }));
     const urls = files.map((r) => r.url);
     const baseName = `${dbName}_${dsName}_${exts.join("_")}`;
     const extLabel = exts.join(", ");
diff --git a/src/components/SearchPage/DatasetCard.tsx b/src/components/SearchPage/DatasetCard.tsx
index 4243119..7ecefae 100644
--- a/src/components/SearchPage/DatasetCard.tsx
+++ b/src/components/SearchPage/DatasetCard.tsx
@@ -59,6 +59,18 @@ interface DatasetCardProps {
 }
 
 /** ---------- utility helpers ---------- **/
+// Some iolinks records (older openneuro links view) store a relative path like
+// "file=sub-01/anat/sub-01_T1w.nii&size=1" instead of a full stat.cgi URL.
+// Reconstruct the full URL so the browser can follow it.
+const resolveFileUrl = (
+  dbname: string,
+  dsname: string,
+  url?: string
+): string => {
+  if (!url) return "";
+  if (url.startsWith("http")) return url;
+  return `https://neurojson.org/io/stat.cgi?action=get&db=${dbname}&doc=${dsname}&${url}`;
+};
 const normalize = (s: string) =>
   s
     ?.replace(/[\u2018\u2019\u2032]/g, "'") // curly → straight
@@ -504,7 +516,7 @@ const DatasetCard: React.FC<DatasetCardProps> = ({
                   return (
                     <li key={i}>
                       <MuiLink
-                        href={v.url}
+                        href={resolveFileUrl(dbname, dsname, v.url)}
                         target="_blank"
                         rel="noopener noreferrer"
                         underline="hover"
diff --git a/yarn.lock b/yarn.lock
index 8b8ba61..e881a21 100644
--- a/yarn.lock
+++ b/yarn.lock
@@ -2424,10 +2424,10 @@
     redux-thunk "^2.4.2"
     reselect "^4.1.8"
 
-"@remix-run/router@1.23.0":
-  version "1.23.0"
-  resolved "https://registry.yarnpkg.com/@remix-run/router/-/router-1.23.0.tgz#35390d0e7779626c026b11376da6789eb8389242"
-  integrity sha512-O3rHJzAQKamUz1fvE0Qaw0xSFqsA/yafi2iqeE0pvdFtCO1viYx8QL6f3Ln/aCCTLxs68SLf0KPM9eSeM8yBnA==
+"@remix-run/router@1.23.2":
+  version "1.23.2"
+  resolved "https://registry.yarnpkg.com/@remix-run/router/-/router-1.23.2.tgz#156c4b481c0bee22a19f7924728a67120de06971"
+  integrity sha512-Ic6m2U/rMjTkhERIa/0ZtXJP17QUi2CbWE7cqx4J58M8aA3QTfW+2UlQ4psvTX9IO1RfNVhK3pcpdjej7L+t2w==
 
 "@rjsf/core@^5.24.8":
   version "5.24.11"
@@ -3926,13 +3926,14 @@ axe-core@^4.10.0:
   integrity sha512-Xm7bpRXnDSX2YE2YFfBk2FnF0ep6tmG7xPh8iHee8MIcrgq762Nkce856dYtJYLkuIoYZvGfTs/PbZhideTcEg==
 
 axios@^1.4.0:
-  version "1.9.0"
-  resolved "https://registry.yarnpkg.com/axios/-/axios-1.9.0.tgz#25534e3b72b54540077d33046f77e3b8d7081901"
-  integrity sha512-re4CqKTJaURpzbLHtIi6XpDv20/CnpXOtjRY5/CU32L8gU8ek9UIivcfvSWvmKEngmVbrUtPpdDwWDWL7DNHvg==
+  version "1.16.1"
+  resolved "https://registry.yarnpkg.com/axios/-/axios-1.16.1.tgz#517e29291d19d6e8cf919ff264f4fe157261ba12"
+  integrity sha512-caYkukvroVPO8KrzuJEb50Hm07KwfBZPEC3VeFHTsqWHvKTsy54hjJz9BS/cdaypROE2rH6xvm9mHX4fgWkr3A==
   dependencies:
-    follow-redirects "^1.15.6"
-    form-data "^4.0.0"
-    proxy-from-env "^1.1.0"
+    follow-redirects "^1.16.0"
+    form-data "^4.0.5"
+    https-proxy-agent "^5.0.1"
+    proxy-from-env "^2.1.0"
 
 axobject-query@^4.1.0:
   version "4.1.0"
@@ -5973,9 +5974,9 @@ es-module-lexer@^1.2.1:
   integrity sha512-jEQoCwk8hyb2AZziIOLhDqpm5+2ww5uIE6lkO/6jcOCusfk6LhMHpXXfBLXTZ7Ydyt0j4VoUQv6uGNYbdW+kBA==
 
 es-object-atoms@^1.0.0, es-object-atoms@^1.1.1:
-  version "1.1.1"
-  resolved "https://registry.yarnpkg.com/es-object-atoms/-/es-object-atoms-1.1.1.tgz#1c4f2c4837327597ce69d2ca190a7fdd172338c1"
-  integrity sha512-FGgH2h8zKNim9ljj7dankFPcICIK9Cp5bm+c2gQSYePhpaG5+esrLODihIorn+Pe6FGJzWhXQotPv73jTaldXA==
+  version "1.1.2"
+  resolved "https://registry.yarnpkg.com/es-object-atoms/-/es-object-atoms-1.1.2.tgz#a2d0b373205724dfa525d23b0c3e1b1ca582c99b"
+  integrity sha512-HWcBoN6NileqtSydK2FqHbS/LoDd2pqrnQHLyJzBj4kOp/ky2MWMN694xOfkK8/SnUsW2DH7EfyVlydKCsm1Zw==
   dependencies:
     es-errors "^1.3.0"
 
@@ -6756,11 +6757,16 @@ flux@^4.0.1:
     fbemitter "^3.0.0"
     fbjs "^3.0.1"
 
-follow-redirects@^1.0.0, follow-redirects@^1.15.6:
+follow-redirects@^1.0.0:
   version "1.15.9"
   resolved "https://registry.yarnpkg.com/follow-redirects/-/follow-redirects-1.15.9.tgz#a604fa10e443bf98ca94228d9eebcc2e8a2c8ee1"
   integrity sha512-gew4GsXizNgdoRyqmyfMHyAmXsZDk6mHkSxZFCzW9gwlbtOW44CDtYavM+y+72qD/Vq2l550kMF52DT8fOLJqQ==
 
+follow-redirects@^1.16.0:
+  version "1.16.0"
+  resolved "https://registry.yarnpkg.com/follow-redirects/-/follow-redirects-1.16.0.tgz#28474a159d3b9d11ef62050a14ed60e4df6d61bc"
+  integrity sha512-y5rN/uOsadFT/JfYwhxRS5R7Qce+g3zG97+JrtFZlC9klX/W5hD7iiLzScI4nZqUS7DNUdhPgw4xI8W2LuXlUw==
+
 for-each@^0.3.3, for-each@^0.3.5:
   version "0.3.5"
   resolved "https://registry.yarnpkg.com/for-each/-/for-each-0.3.5.tgz#d650688027826920feeb0af747ee7b9421a41d47"
@@ -6805,10 +6811,10 @@ form-data@^3.0.0:
     es-set-tostringtag "^2.1.0"
     mime-types "^2.1.35"
 
-form-data@^4.0.0:
-  version "4.0.3"
-  resolved "https://registry.yarnpkg.com/form-data/-/form-data-4.0.3.tgz#608b1b3f3e28be0fccf5901fc85fb3641e5cf0ae"
-  integrity sha512-qsITQPfmvMOSAdeyZ+12I1c+CKSstAFAwu+97zrnWAbIr5u8wfsExUzCesVLC8NgHuRUqNN4Zy6UPWUTRGslcA==
+form-data@^4.0.5:
+  version "4.0.5"
+  resolved "https://registry.yarnpkg.com/form-data/-/form-data-4.0.5.tgz#b49e48858045ff4cbf6b03e1805cebcad3679053"
+  integrity sha512-8RipRLol37bNs2bhoV67fiTEvdTrbMUYcFTiy3+wuuOnUog2QBHCZWXDRijWQfAkhBj2Uf5UnVaiWwA5vdd82w==
   dependencies:
     asynckit "^0.4.0"
     combined-stream "^1.0.8"
@@ -7193,9 +7199,9 @@ has@^1.0.0:
   integrity sha512-qdSAmqLF6209RFj4VVItywPMbm3vWylknmB3nvNiUIs72xAimcM8nVYxYr7ncvZq5qzk9MKIZR8ijqD/1QuYjQ==
 
 hasown@^2.0.2:
-  version "2.0.2"
-  resolved "https://registry.yarnpkg.com/hasown/-/hasown-2.0.2.tgz#003eaf91be7adc372e84ec59dc37252cedb80003"
-  integrity sha512-0hJU9SCPvmMzIBdZFqNPXWa6dqh7WdH0cII9y+CyS8rG3nL48Bclra9HmKhVVUHyPWNH5Y7xDwAB7bfgSjkUMQ==
+  version "2.0.3"
+  resolved "https://registry.yarnpkg.com/hasown/-/hasown-2.0.3.tgz#5e5c2b15b60370a4c7930c383dfb76bf17bc403c"
+  integrity sha512-ej4AhfhfL2Q2zpMmLo7U1Uv9+PyhIZpgQLGT1F9miIGmiCJIoCgSmczFdrc97mWT4kVY72KA+WnnhJ5pghSvSg==
   dependencies:
     function-bind "^1.1.2"
 
@@ -7363,7 +7369,7 @@ http-proxy@^1.18.1:
     follow-redirects "^1.0.0"
     requires-port "^1.0.0"
 
-https-proxy-agent@^5.0.0:
+https-proxy-agent@^5.0.0, https-proxy-agent@^5.0.1:
   version "5.0.1"
   resolved "https://registry.yarnpkg.com/https-proxy-agent/-/https-proxy-agent-5.0.1.tgz#c59ef224a04fe8b754f3db0063a25ea30d0005d6"
   integrity sha512-dFcAjpTQFgoLMzC2VwU+C/CbS7uRL0lWmxDITmqm7C+7F0Odmj6s9l6alZc6AELXhrnggM2CeWSXHGOdX2YtwA==
@@ -10573,10 +10579,10 @@ proxy-addr@~2.0.7:
     forwarded "0.2.0"
     ipaddr.js "1.9.1"
 
-proxy-from-env@^1.1.0:
-  version "1.1.0"
-  resolved "https://registry.yarnpkg.com/proxy-from-env/-/proxy-from-env-1.1.0.tgz#e102f16ca355424865755d2c9e8ea4f24d58c3e2"
-  integrity sha512-D+zkORCbA9f1tdWRK0RaCR3GPv50cMxcrz4X8k5LTSUD1Dkw47mKJEZQNunItRTkWwgtaUSo1RVFRIG9ZXiFYg==
+proxy-from-env@^2.1.0:
+  version "2.1.0"
+  resolved "https://registry.yarnpkg.com/proxy-from-env/-/proxy-from-env-2.1.0.tgz#a7487568adad577cfaaa7e88c49cab3ab3081aba"
+  integrity sha512-cJ+oHTW1VAEa8cJslgmUZrc+sjRKgAKl3Zyse6+PV38hZe/V6Z14TbCuXcan9F9ghlz4QrFr2c92TNF82UkYHA==
 
 psl@^1.1.33:
   version "1.15.0"
@@ -10799,19 +10805,19 @@ react-refresh@^0.11.0:
   integrity sha512-F27qZr8uUqwhWZboondsPx8tnC3Ct3SxZA3V5WyEvujRyyNv0VYPhoBg1gZ8/MV5tubQp76Trw8lTv9hzRBa+A==
 
 react-router-dom@^6.15.0:
-  version "6.30.1"
-  resolved "https://registry.yarnpkg.com/react-router-dom/-/react-router-dom-6.30.1.tgz#da2580c272ddb61325e435478566be9563a4a237"
-  integrity sha512-llKsgOkZdbPU1Eg3zK8lCn+sjD9wMRZZPuzmdWWX5SUs8OFkN5HnFVC0u5KMeMaC9aoancFI/KoLuKPqN+hxHw==
+  version "6.30.3"
+  resolved "https://registry.yarnpkg.com/react-router-dom/-/react-router-dom-6.30.3.tgz#42ae6dc4c7158bfb0b935f162b9621b29dddf740"
+  integrity sha512-pxPcv1AczD4vso7G4Z3TKcvlxK7g7TNt3/FNGMhfqyntocvYKj+GCatfigGDjbLozC4baguJ0ReCigoDJXb0ag==
   dependencies:
-    "@remix-run/router" "1.23.0"
-    react-router "6.30.1"
+    "@remix-run/router" "1.23.2"
+    react-router "6.30.3"
 
-react-router@6.30.1:
-  version "6.30.1"
-  resolved "https://registry.yarnpkg.com/react-router/-/react-router-6.30.1.tgz#ecb3b883c9ba6dbf5d319ddbc996747f4ab9f4c3"
-  integrity sha512-X1m21aEmxGXqENEPG3T6u0Th7g0aS4ZmoNynhbs+Cn+q+QGTLt+d5IQ2bHAXKzKcxGJjxACpVbnYQSCRcfxHlQ==
+react-router@6.30.3:
+  version "6.30.3"
+  resolved "https://registry.yarnpkg.com/react-router/-/react-router-6.30.3.tgz#994b3ccdbe0e81fe84d4f998100f62584dfbf1cf"
+  integrity sha512-XRnlbKMTmktBkjCLE8/XcZFlnHvr2Ltdr1eJX4idL55/9BbORzyZEaIkBFDhFGCEWBBItsVrDxwx3gnisMitdw==
   dependencies:
-    "@remix-run/router" "1.23.0"
+    "@remix-run/router" "1.23.2"
 
 react-scripts@^5.0.1:
   version "5.0.1"

From 3761e82099f5a7f0fb9230fcb2d1352a7519eba5 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 26 May 2026 17:32:27 -0400
Subject: [PATCH 45/61] feat(bids-converter): add public BIDS Converter page
 and navbar link

---
 src/components/NavBar/NavItems.tsx |   1 +
 src/components/Routes.tsx          |   2 +
 src/pages/BidsConverterPage.tsx    | 198 +++++++++++++++++++++++++++++
 src/types/routes.enum.ts           |   1 +
 4 files changed, 202 insertions(+)
 create mode 100644 src/pages/BidsConverterPage.tsx

diff --git a/src/components/NavBar/NavItems.tsx b/src/components/NavBar/NavItems.tsx
index d2882e6..c102bcf 100644
--- a/src/components/NavBar/NavItems.tsx
+++ b/src/components/NavBar/NavItems.tsx
@@ -319,6 +319,7 @@ const NavItems: React.FC = () => {
             { text: "Wiki", url: "https://neurojson.org/Wiki" },
             { text: "Search", url: RoutesEnum.SEARCH },
             { text: "Databases", url: RoutesEnum.DATABASES },
+            { text: "BIDS Converter", url: RoutesEnum.BIDS_CONVERTER },
           ].map(({ text, url }) => (
             <Grid item key={text}>
               {url?.startsWith("https") ? (
diff --git a/src/components/Routes.tsx b/src/components/Routes.tsx
index 5983701..10b15e9 100644
--- a/src/components/Routes.tsx
+++ b/src/components/Routes.tsx
@@ -1,3 +1,4 @@
+import BidsConverterPage from "pages/BidsConverterPage";
 import ScrollToTop from "./ScrollToTop";
 import CompleteProfile from "./User/CompleteProfile";
 import CollectionDetailPage from "./User/Dashboard/CollectionDetailPage";
@@ -68,6 +69,7 @@ const Routes = () => (
           element={<CollectionDetailPage />}
         />
         <Route path="/projects/:projectId" element={<DatasetOrganizer />} />
+        <Route path={RoutesEnum.BIDS_CONVERTER} element={<BidsConverterPage />} />
       </Route>
     </RouterRoutes>
   </>
diff --git a/src/pages/BidsConverterPage.tsx b/src/pages/BidsConverterPage.tsx
new file mode 100644
index 0000000..76de114
--- /dev/null
+++ b/src/pages/BidsConverterPage.tsx
@@ -0,0 +1,198 @@
+import DropZone from "components/User/Dashboard/DatasetOrganizer/DropZone";
+import FileTree from "components/User/Dashboard/DatasetOrganizer/FileTree";
+import LLMPanel from "components/User/Dashboard/DatasetOrganizer/LLMPanel";
+import { ArrowBack, GetApp, Psychology } from "@mui/icons-material";
+import { Box, Button, Typography, Alert } from "@mui/material";
+import { Colors } from "design/theme";
+import React, { useState } from "react";
+import { useNavigate } from "react-router-dom";
+import { FileItem } from "redux/projects/types/projects.interface";
+
+const BidsConverterPage: React.FC = () => {
+  const navigate = useNavigate();
+
+  const [files, setFiles] = useState<FileItem[]>([]);
+  const [selectedIds, setSelectedIds] = useState<Set<string>>(new Set());
+  const [expandedIds, setExpandedIds] = useState<Set<string>>(new Set());
+  const [showLLMPanel, setShowLLMPanel] = useState(false);
+  const [error, setError] = useState<string | null>(null);
+  const [baseDirectoryPath, setBaseDirectoryPath] = useState<string>("");
+  const [evidenceBundle, setEvidenceBundle] = useState<any>(null);
+  const [trioGenerated, setTrioGenerated] = useState(false);
+
+  const updateFiles = (updater: React.SetStateAction<FileItem[]>) =>
+    setFiles(updater);
+
+  const updateSelectedIds = (updater: React.SetStateAction<Set<string>>) =>
+    setSelectedIds(updater);
+
+  const updateExpandedIds = (updater: React.SetStateAction<Set<string>>) =>
+    setExpandedIds(updater);
+
+  const updateBaseDirectoryPath = (path: string) => setBaseDirectoryPath(path);
+
+  const handleExportJSON = () => {
+    const buildTree = (parentId: string | null): any => {
+      const children = files.filter((f) => f.parentId === parentId);
+      const result: any = {};
+      children.forEach((child) => {
+        if (child.type === "folder" || child.type === "zip") {
+          result[child.name] = {
+            _type: child.type,
+            _sourcePath: baseDirectoryPath
+              ? `${baseDirectoryPath}/${child.sourcePath || child.name}`.replace(/\/+/g, "/")
+              : child.sourcePath || "",
+            _children: buildTree(child.id),
+          };
+        } else {
+          const fileData: any = {
+            _type: "file",
+            _fileType: child.fileType || "other",
+          };
+          if (child.sourcePath || baseDirectoryPath) {
+            fileData._sourcePath = baseDirectoryPath
+              ? `${baseDirectoryPath}/${child.sourcePath || child.name}`.replace(/\/+/g, "/")
+              : child.sourcePath;
+          }
+          if (child.isUserMeta) fileData._isUserMeta = true;
+          if (child.content) fileData._content = child.content;
+          if (child.contentType) fileData._contentType = child.contentType;
+          if (child.note) fileData._note = child.note;
+          result[child.name] = fileData;
+        }
+      });
+      return result;
+    };
+
+    const exportData = {
+      _exportDate: new Date().toISOString(),
+      _totalFiles: files.length,
+      files: buildTree(null),
+    };
+
+    const blob = new Blob([JSON.stringify(exportData, null, 2)], {
+      type: "application/json",
+    });
+    const url = URL.createObjectURL(blob);
+    const a = document.createElement("a");
+    a.href = url;
+    a.download = "bids_converter_export.json";
+    a.click();
+    URL.revokeObjectURL(url);
+  };
+
+  return (
+    <Box
+      sx={{
+        display: "flex",
+        flexDirection: "column",
+        height: "100vh",
+        background: "linear-gradient(180deg,#f6f7fb 0%, #aeb6e8 100%)",
+      }}
+    >
+      {/* Header */}
+      <Box
+        sx={{
+          p: 2,
+          borderBottom: 1,
+          borderColor: "divider",
+          display: "flex",
+          justifyContent: "space-between",
+          alignItems: "center",
+          gap: 2,
+        }}
+      >
+        <Box display="flex" alignItems="center" gap={2}>
+          <Button
+            startIcon={<ArrowBack />}
+            onClick={() => navigate("/")}
+            sx={{ color: Colors.purple }}
+          >
+            Back
+          </Button>
+          <Box>
+            <Typography variant="h5">BIDS Converter</Typography>
+            <Typography variant="body2" color="text.secondary">
+              Organize and rename your dataset files into BIDS format
+            </Typography>
+          </Box>
+        </Box>
+
+        <Box display="flex" gap={1}>
+          <Button
+            variant="contained"
+            startIcon={<Psychology />}
+            onClick={() => setShowLLMPanel(!showLLMPanel)}
+            disabled={files.length === 0}
+            sx={{
+              backgroundColor: Colors.purple,
+              color: Colors.lightGray,
+              "&:hover": { backgroundColor: Colors.purple, border: "none" },
+            }}
+          >
+            Generate BIDS Plan
+          </Button>
+          <Button
+            variant="contained"
+            startIcon={<GetApp />}
+            onClick={handleExportJSON}
+            disabled={files.length === 0}
+            sx={{
+              backgroundColor: Colors.darkGreen,
+              color: Colors.lightGray,
+              "&:hover": { backgroundColor: Colors.darkGreen, border: "none" },
+            }}
+          >
+            Export JSON
+          </Button>
+        </Box>
+      </Box>
+
+      {error && (
+        <Alert severity="error" onClose={() => setError(null)} sx={{ m: 2 }}>
+          {error}
+        </Alert>
+      )}
+
+      {/* Main Content */}
+      <Box sx={{ display: "flex", flex: 1, minHeight: 0 }}>
+        <Box sx={{ flex: 1, overflow: "auto", p: 3, position: "relative" }}>
+          <DropZone
+            files={files}
+            setFiles={updateFiles}
+            baseDirectoryPath={baseDirectoryPath}
+            setBaseDirectoryPath={updateBaseDirectoryPath}
+            selectedIds={selectedIds}
+            setSelectedIds={setSelectedIds}
+            expandedIds={expandedIds}
+            setExpandedIds={setExpandedIds}
+          />
+          {showLLMPanel && (
+            <LLMPanel
+              files={files}
+              baseDirectoryPath={baseDirectoryPath}
+              setBaseDirectoryPath={updateBaseDirectoryPath}
+              evidenceBundle={evidenceBundle}
+              setEvidenceBundle={setEvidenceBundle}
+              trioGenerated={trioGenerated}
+              setTrioGenerated={setTrioGenerated}
+              updateFiles={updateFiles}
+              onClose={() => setShowLLMPanel(false)}
+            />
+          )}
+        </Box>
+
+        <FileTree
+          files={files}
+          selectedIds={selectedIds}
+          expandedIds={expandedIds}
+          setFiles={updateFiles}
+          setSelectedIds={updateSelectedIds}
+          setExpandedIds={updateExpandedIds}
+        />
+      </Box>
+    </Box>
+  );
+};
+
+export default BidsConverterPage;
diff --git a/src/types/routes.enum.ts b/src/types/routes.enum.ts
index b37a84d..a774051 100644
--- a/src/types/routes.enum.ts
+++ b/src/types/routes.enum.ts
@@ -4,5 +4,6 @@ enum RoutesEnum {
   SEARCH = "/search", // New route for the search page
   ABOUT = "/about", // New route for the about page
   DASHBOARD = "/dashboard",
+  BIDS_CONVERTER = "/bids-converter",
 }
 export default RoutesEnum;

From 11b77bde4464355bfd13077968679dadcb56a542 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Tue, 26 May 2026 18:00:15 -0400
Subject: [PATCH 46/61] feat(bids-converter): add mode selection dialog and
 private/save toggle bar

---
 src/pages/BidsConverterPage.tsx | 234 +++++++++++++++++++++++++++++++-
 1 file changed, 228 insertions(+), 6 deletions(-)

diff --git a/src/pages/BidsConverterPage.tsx b/src/pages/BidsConverterPage.tsx
index 76de114..2bbb3f0 100644
--- a/src/pages/BidsConverterPage.tsx
+++ b/src/pages/BidsConverterPage.tsx
@@ -1,15 +1,43 @@
 import DropZone from "components/User/Dashboard/DatasetOrganizer/DropZone";
 import FileTree from "components/User/Dashboard/DatasetOrganizer/FileTree";
 import LLMPanel from "components/User/Dashboard/DatasetOrganizer/LLMPanel";
-import { ArrowBack, GetApp, Psychology } from "@mui/icons-material";
-import { Box, Button, Typography, Alert } from "@mui/material";
+import UserLogin from "components/User/UserLogin";
+import UserSignup from "components/User/UserSignup";
+import {
+  ArrowBack,
+  GetApp,
+  Psychology,
+  LockOutlined,
+  CloudUpload,
+} from "@mui/icons-material";
+import {
+  Box,
+  Button,
+  Typography,
+  Alert,
+  Dialog,
+  DialogContent,
+  DialogTitle,
+  ToggleButton,
+  ToggleButtonGroup,
+} from "@mui/material";
 import { Colors } from "design/theme";
-import React, { useState } from "react";
+import { useAppSelector } from "hooks/useAppSelector";
+import React, { useState, useEffect } from "react";
 import { useNavigate } from "react-router-dom";
+import { AuthSelector } from "redux/auth/auth.selector";
 import { FileItem } from "redux/projects/types/projects.interface";
 
+type Mode = "private" | "save";
+
 const BidsConverterPage: React.FC = () => {
   const navigate = useNavigate();
+  const { isLoggedIn } = useAppSelector(AuthSelector);
+
+  const [modeChosen, setModeChosen] = useState(false);
+  const [mode, setMode] = useState<Mode>("private");
+  const [loginOpen, setLoginOpen] = useState(false);
+  const [signupOpen, setSignupOpen] = useState(false);
 
   const [files, setFiles] = useState<FileItem[]>([]);
   const [selectedIds, setSelectedIds] = useState<Set<string>>(new Set());
@@ -20,15 +48,42 @@ const BidsConverterPage: React.FC = () => {
   const [evidenceBundle, setEvidenceBundle] = useState<any>(null);
   const [trioGenerated, setTrioGenerated] = useState(false);
 
+  // After login succeeds in save mode, redirect to dashboard to create a project
+  useEffect(() => {
+    if (isLoggedIn && mode === "save") {
+      navigate("/dashboard");
+    }
+  }, [isLoggedIn, mode, navigate]);
+
+  const handleChoosePrivate = () => {
+    setMode("private");
+    setModeChosen(true);
+  };
+
+  const handleChooseSave = () => {
+    setMode("save");
+    if (isLoggedIn) {
+      navigate("/dashboard");
+    } else {
+      setLoginOpen(true);
+    }
+  };
+
+  const handleModeBarChange = (_: React.MouseEvent, next: Mode | null) => {
+    if (!next || next === mode) return;
+    if (next === "save") {
+      handleChooseSave();
+    } else {
+      setMode("private");
+    }
+  };
+
   const updateFiles = (updater: React.SetStateAction<FileItem[]>) =>
     setFiles(updater);
-
   const updateSelectedIds = (updater: React.SetStateAction<Set<string>>) =>
     setSelectedIds(updater);
-
   const updateExpandedIds = (updater: React.SetStateAction<Set<string>>) =>
     setExpandedIds(updater);
-
   const updateBaseDirectoryPath = (path: string) => setBaseDirectoryPath(path);
 
   const handleExportJSON = () => {
@@ -148,6 +203,63 @@ const BidsConverterPage: React.FC = () => {
         </Box>
       </Box>
 
+      {/* Mode indicator bar */}
+      <Box
+        sx={{
+          px: 3,
+          py: 1,
+          borderBottom: 1,
+          borderColor: "divider",
+          display: "flex",
+          alignItems: "center",
+          gap: 2,
+          backgroundColor: "white",
+        }}
+      >
+        <ToggleButtonGroup
+          value={mode}
+          exclusive
+          onChange={handleModeBarChange}
+          size="small"
+        >
+          <ToggleButton
+            value="private"
+            sx={{
+              gap: 0.5,
+              textTransform: "none",
+              "&.Mui-selected": {
+                backgroundColor: Colors.purple,
+                color: Colors.white,
+                "&:hover": { backgroundColor: Colors.secondaryPurple },
+              },
+            }}
+          >
+            <LockOutlined fontSize="small" />
+            Private Mode
+          </ToggleButton>
+          <ToggleButton
+            value="save"
+            sx={{
+              gap: 0.5,
+              textTransform: "none",
+              "&.Mui-selected": {
+                backgroundColor: Colors.lightBlue,
+                color: Colors.darkPurple,
+              },
+            }}
+          >
+            <CloudUpload fontSize="small" />
+            Save to Account
+          </ToggleButton>
+        </ToggleButtonGroup>
+
+        <Typography variant="caption" color="text.secondary">
+          {mode === "private"
+            ? "Files are processed locally. Nothing is uploaded. All data is lost when you close this page."
+            : "Log in to save your work to a project on your account."}
+        </Typography>
+      </Box>
+
       {error && (
         <Alert severity="error" onClose={() => setError(null)} sx={{ m: 2 }}>
           {error}
@@ -191,6 +303,116 @@ const BidsConverterPage: React.FC = () => {
           setExpandedIds={updateExpandedIds}
         />
       </Box>
+
+      {/* Welcome dialog — shown on first load before user starts working */}
+      <Dialog open={!modeChosen} maxWidth="sm" fullWidth>
+        <DialogTitle sx={{ textAlign: "center", pt: 4 }}>
+          How would you like to use BIDS Converter?
+        </DialogTitle>
+        <DialogContent>
+          <Box
+            sx={{
+              display: "flex",
+              gap: 2,
+              mt: 1,
+              mb: 2,
+              flexDirection: { xs: "column", sm: "row" },
+            }}
+          >
+            {/* Private Mode card */}
+            <Box
+              onClick={handleChoosePrivate}
+              sx={{
+                flex: 1,
+                border: `2px solid ${Colors.purple}`,
+                borderRadius: 2,
+                p: 3,
+                cursor: "pointer",
+                display: "flex",
+                flexDirection: "column",
+                alignItems: "center",
+                gap: 1.5,
+                transition: "background 0.2s",
+                "&:hover": { backgroundColor: Colors.lightBlue },
+              }}
+            >
+              <LockOutlined sx={{ fontSize: 40, color: Colors.purple }} />
+              <Typography variant="h6" fontWeight={600}>
+                Private Mode
+              </Typography>
+              <Typography
+                variant="body2"
+                color="text.secondary"
+                textAlign="center"
+              >
+                Work entirely in your browser. No files are uploaded to any
+                server. All data will be lost when you close the page.
+              </Typography>
+            </Box>
+
+            {/* Save to Account card */}
+            <Box
+              onClick={handleChooseSave}
+              sx={{
+                flex: 1,
+                border: `2px solid ${Colors.darkGreen}`,
+                borderRadius: 2,
+                p: 3,
+                cursor: "pointer",
+                display: "flex",
+                flexDirection: "column",
+                alignItems: "center",
+                gap: 1.5,
+                transition: "background 0.2s",
+                "&:hover": { backgroundColor: "#e8f5e9" },
+              }}
+            >
+              <CloudUpload sx={{ fontSize: 40, color: Colors.darkGreen }} />
+              <Typography variant="h6" fontWeight={600}>
+                Save to Account
+              </Typography>
+              <Typography
+                variant="body2"
+                color="text.secondary"
+                textAlign="center"
+              >
+                Log in to save your work to a project. You can resume it any
+                time from your dashboard.
+              </Typography>
+            </Box>
+          </Box>
+        </DialogContent>
+      </Dialog>
+
+      <UserLogin
+        open={loginOpen}
+        onClose={() => {
+          setLoginOpen(false);
+          // If user closes login without logging in, fall back to private mode
+          if (!isLoggedIn) {
+            setMode("private");
+            setModeChosen(true);
+          }
+        }}
+        onSwitchToSignup={() => {
+          setLoginOpen(false);
+          setSignupOpen(true);
+        }}
+      />
+      <UserSignup
+        open={signupOpen}
+        onClose={() => {
+          setSignupOpen(false);
+          if (!isLoggedIn) {
+            setMode("private");
+            setModeChosen(true);
+          }
+        }}
+        onSwitchToLogin={() => {
+          setSignupOpen(false);
+          setLoginOpen(true);
+        }}
+      />
     </Box>
   );
 };

From 7dbb33555d39d2d0f7819ce8b0e5c80d3a236f44 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 11:47:49 -0400
Subject: [PATCH 47/61] feat(dashboard): open Projects tab directly from BIDS
 Converter redirect

---
 src/components/User/UserDashboard.tsx | 20 +++++++++++++++++++-
 src/pages/BidsConverterPage.tsx       |  4 ++--
 2 files changed, 21 insertions(+), 3 deletions(-)

diff --git a/src/components/User/UserDashboard.tsx b/src/components/User/UserDashboard.tsx
index 21d4e53..42eab48 100644
--- a/src/components/User/UserDashboard.tsx
+++ b/src/components/User/UserDashboard.tsx
@@ -24,6 +24,7 @@ import {
 import { Colors } from "design/theme";
 import { useAppSelector } from "hooks/useAppSelector";
 import React, { useState } from "react";
+import { useLocation, useNavigate } from "react-router-dom";
 import { AuthSelector } from "redux/auth/auth.selector";
 
 interface TabPanelProps {
@@ -48,12 +49,29 @@ function TabPanel(props: TabPanelProps) {
   );
 }
 
+// Null-prototype map: ?tab=constructor or ?tab=__proto__ must miss, not hit Object.prototype.
+const TAB_INDEX: Record<string, number> = Object.assign(Object.create(null), {
+  profile: 0,
+  security: 1,
+  collections: 2,
+  liked: 3,
+  projects: 4,
+  settings: 5,
+});
+
+// Reverse lookup (tab index -> query-string name), used when writing the active tab to the URL.
+const TAB_NAME = Object.fromEntries(Object.entries(TAB_INDEX).map(([k, v]) => [v, k])) as Record<number, string>;
+
 const UserDashboard: React.FC = () => {
-  const [tabValue, setTabValue] = useState(0);
+  const location = useLocation();
+  const navigate = useNavigate();
+  const tabParam = new URLSearchParams(location.search).get("tab") ?? "";
+  const [tabValue, setTabValue] = useState(TAB_INDEX[tabParam] ?? 0);
   const { user } = useAppSelector(AuthSelector);
 
   const handleTabChange = (event: React.SyntheticEvent, newValue: number) => {
     setTabValue(newValue);
+    navigate(`/dashboard?tab=${TAB_NAME[newValue]}`, { replace: true });
   };
 
   if (!user) {
diff --git a/src/pages/BidsConverterPage.tsx b/src/pages/BidsConverterPage.tsx
index 2bbb3f0..1c57d16 100644
--- a/src/pages/BidsConverterPage.tsx
+++ b/src/pages/BidsConverterPage.tsx
@@ -51,7 +51,7 @@ const BidsConverterPage: React.FC = () => {
   // After login succeeds in save mode, redirect to dashboard to create a project
   useEffect(() => {
     if (isLoggedIn && mode === "save") {
-      navigate("/dashboard");
+      navigate("/dashboard?tab=projects");
     }
   }, [isLoggedIn, mode, navigate]);
 
@@ -63,7 +63,7 @@ const BidsConverterPage: React.FC = () => {
   const handleChooseSave = () => {
     setMode("save");
     if (isLoggedIn) {
-      navigate("/dashboard");
+      navigate("/dashboard?tab=projects");
     } else {
       setLoginOpen(true);
     }

From 71e5ffb0eba4571ba65ee1bf6244679a874a80ec Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 12:00:44 -0400
Subject: [PATCH 48/61] feat(bids-converter): add private mode visual indicator
 with slate grey background

---
 src/pages/BidsConverterPage.tsx | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/src/pages/BidsConverterPage.tsx b/src/pages/BidsConverterPage.tsx
index 1c57d16..1f27008 100644
--- a/src/pages/BidsConverterPage.tsx
+++ b/src/pages/BidsConverterPage.tsx
@@ -142,7 +142,9 @@ const BidsConverterPage: React.FC = () => {
         display: "flex",
         flexDirection: "column",
         height: "100vh",
-        background: "linear-gradient(180deg,#f6f7fb 0%, #aeb6e8 100%)",
+        background: mode === "private"
+          ? "linear-gradient(180deg, #eceff1 0%, #90a4ae 100%)"
+          : "linear-gradient(180deg,#f6f7fb 0%, #aeb6e8 100%)",
       }}
     >
       {/* Header */}
@@ -213,7 +215,7 @@ const BidsConverterPage: React.FC = () => {
           display: "flex",
           alignItems: "center",
           gap: 2,
-          backgroundColor: "white",
+          backgroundColor: mode === "private" ? "#eceff1" : "white",
         }}
       >
         <ToggleButtonGroup

From d0537a48eec51c7b4811676a91936c3453927c1d Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 15:11:48 -0400
Subject: [PATCH 49/61] feat(bids-converter): improve UI labels, tooltips, and
 private mode UX

---
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 83 ++++++++++++++-----
 .../User/Dashboard/DatasetOrganizer/index.tsx |  3 +-
 src/pages/BidsConverterPage.tsx               | 50 ++++++++++-
 3 files changed, 109 insertions(+), 27 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index 9658ec6..1e49428 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -13,6 +13,7 @@ import {
   Download,
   AutoAwesome,
   DriveFileMove,
+  InfoOutlined,
 } from "@mui/icons-material";
 import {
   Box,
@@ -27,6 +28,7 @@ import {
   CircularProgress,
   IconButton,
   Alert,
+  Tooltip,
 } from "@mui/material";
 import { Colors } from "design/theme";
 import { dump as yamlDump } from "js-yaml";
@@ -46,6 +48,7 @@ interface LLMPanelProps {
   setTrioGenerated: (value: boolean) => void; // ✅ Add
   updateFiles: (updater: React.SetStateAction<FileItem[]>) => void; // ✅ Add
   onClose: () => void;
+  isPrivateMode?: boolean;
 }
 
 interface LLMProvider {
@@ -77,28 +80,27 @@ const llmProviders: Record<string, LLMProvider> = {
     baseUrl: "https://api.groq.com/openai/v1/chat/completions",
     models: [
       { id: "llama-3.3-70b-versatile", name: "Llama 3.3 70B" },
+      { id: "llama-3.1-70b-versatile", name: "Llama 3.1 70B" },
       { id: "llama-3.1-8b-instant", name: "Llama 3.1 8B (Fast)" },
-      { id: "mixtral-8x7b-32768", name: "Mixtral 8x7B" },
+      { id: "gemma2-9b-it", name: "Gemma 2 9B" },
     ],
   },
   openrouter: {
     name: "OpenRouter (Free models available)",
     baseUrl: "https://openrouter.ai/api/v1/chat/completions",
     models: [
-      {
-        id: "meta-llama/llama-3.1-8b-instruct:free",
-        name: "Llama 3.1 8B (Free)",
-      },
-      { id: "google/gemma-2-9b-it:free", name: "Gemma 2 9B (Free)" },
-      { id: "mistralai/mistral-7b-instruct:free", name: "Mistral 7B (Free)" },
+      { id: "meta-llama/llama-3.3-70b-instruct:free", name: "Llama 3.3 70B (Free)" },
+      { id: "google/gemma-3n-e4b-it:free", name: "Gemma 3n 4B (Free)" },
+      { id: "mistralai/mistral-small-3.2-24b-instruct:free", name: "Mistral Small 3.2 24B (Free)" },
     ],
   },
   anthropic: {
     name: "Anthropic Claude (Paid)",
     baseUrl: "https://api.anthropic.com/v1/messages",
     models: [
-      { id: "claude-sonnet-4-20250514", name: "Claude Sonnet 4" },
-      { id: "claude-3-5-haiku-20241022", name: "Claude 3.5 Haiku" },
+      { id: "claude-opus-4-7", name: "Claude Opus 4.7" },
+      { id: "claude-sonnet-4-6", name: "Claude Sonnet 4.6" },
+      { id: "claude-haiku-4-5-20251001", name: "Claude Haiku 4.5" },
     ],
     isAnthropic: true,
   },
@@ -106,8 +108,11 @@ const llmProviders: Record<string, LLMProvider> = {
     name: "OpenAI (Paid)",
     baseUrl: "https://api.openai.com/v1/chat/completions",
     models: [
-      { id: "gpt-4o-mini", name: "GPT-4o Mini" },
+      { id: "gpt-5.5", name: "GPT-5.5" },
+      { id: "gpt-5.4", name: "GPT-5.4" },
+      { id: "gpt-5.4-mini", name: "GPT-5.4 Mini" },
       { id: "gpt-4o", name: "GPT-4o" },
+      { id: "gpt-4o-mini", name: "GPT-4o Mini" },
     ],
   },
 };
@@ -122,9 +127,10 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
   setTrioGenerated, // ✅ Add
   updateFiles, // ✅ Add
   onClose,
+  isPrivateMode = false,
 }) => {
-  const [provider, setProvider] = useState<string>("ollama");
-  const [model, setModel] = useState<string>("qwen3-coder-next:latest");
+  const [provider, setProvider] = useState<string>(isPrivateMode ? "groq" : "ollama");
+  const [model, setModel] = useState<string>(isPrivateMode ? "llama-3.3-70b-versatile" : "qwen3-coder-next:latest");
   // const [ollamaUrl, setOllamaUrl] = useState<string>(
   //   "http://jin.neu.edu:11434"
   // );
@@ -1208,7 +1214,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
     });
 
     updateFiles((prev) => [...prev, ...outputFiles]);
-    setStatus("✓ Saved to VFS. Click 'Save Changes' to persist to database.");
+    setStatus(isPrivateMode ? "✓ Saved to VFS." : "✓ Saved to VFS. Click 'Save Changes' to persist to database.");
   };
   // const handleSaveZip = async () => {
   //   const zip = new JSZip();
@@ -1350,7 +1356,38 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
           sx={{ display: "flex", alignItems: "center", gap: 1 }}
         >
           <AutoAwesome sx={{ color: Colors.purple }} />
-          AI-Generated BIDS Conversion Script
+          AI Assistant
+          <Tooltip
+            title="Fill in the required fields and follow the steps to get a downloadable BIDS conversion plan."
+            placement="bottom-start"
+            arrow
+            componentsProps={{
+              tooltip: {
+                sx: {
+                  backgroundColor: "white",
+                  color: Colors.darkPurple,
+                  border: `1px solid ${Colors.lightGray}`,
+                  boxShadow: 3,
+                  fontSize: "0.875rem",
+                  lineHeight: 1.5,
+                  p: 1.5,
+                  maxWidth: 320,
+                },
+              },
+              arrow: {
+                sx: {
+                  color: "white",
+                  "&::before": {
+                    border: `1px solid ${Colors.lightGray}`,
+                  },
+                },
+              },
+            }}
+          >
+            <IconButton size="small" sx={{ color: Colors.purple, p: 0 }}>
+              <InfoOutlined fontSize="small" />
+            </IconButton>
+          </Tooltip>
         </Typography>
         <IconButton onClick={onClose} size="small">
           <Close />
@@ -1379,11 +1416,13 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
                 setModel(llmProviders[e.target.value].models[0].id);
               }}
             >
-              {Object.entries(llmProviders).map(([key, p]) => (
-                <MenuItem key={key} value={key}>
-                  {p.name}
-                </MenuItem>
-              ))}
+              {Object.entries(llmProviders)
+                .filter(([key]) => !(isPrivateMode && key === "ollama"))
+                .map(([key, p]) => (
+                  <MenuItem key={key} value={key}>
+                    {p.name}
+                  </MenuItem>
+                ))}
             </Select>
           </FormControl>
 
@@ -1567,8 +1606,8 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
                 {generatingTrio
                   ? "Generating..."
                   : trioGenerated
-                  ? "✓  2. Generate BIDS Trio"
-                  : "2. Generate BIDS Trio"}
+                  ? "✓  2. Generate BIDS Metadata Files"
+                  : "2. Generate BIDS Metadata Files"}
               </Button>
               {/* <Typography
                 variant="body2"
@@ -1599,7 +1638,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               "&.Mui-disabled": { background: "#e0e0e0", color: "#9e9e9e" },
             }}
           >
-            {loading ? "Generating..." : "3. Generate BIDSPlan.yaml"}
+            {loading ? "Generating..." : "3. Generate Conversion Package"}
           </Button>
 
           {/* <Button
diff --git a/src/components/User/Dashboard/DatasetOrganizer/index.tsx b/src/components/User/Dashboard/DatasetOrganizer/index.tsx
index ec8d97f..39c2f45 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/index.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/index.tsx
@@ -271,7 +271,6 @@ const DatasetOrganizer: React.FC = () => {
             variant="contained"
             startIcon={<Psychology />}
             onClick={() => setShowLLMPanel(!showLLMPanel)}
-            disabled={files.length === 0}
             sx={{
               backgroundColor: Colors.purple,
               color: Colors.lightGray,
@@ -281,7 +280,7 @@ const DatasetOrganizer: React.FC = () => {
               },
             }}
           >
-            Generate BIDS Plan
+            AI Assistant
           </Button>
           {/* <Button
             variant="contained"
diff --git a/src/pages/BidsConverterPage.tsx b/src/pages/BidsConverterPage.tsx
index 1f27008..70b4a46 100644
--- a/src/pages/BidsConverterPage.tsx
+++ b/src/pages/BidsConverterPage.tsx
@@ -9,6 +9,7 @@ import {
   Psychology,
   LockOutlined,
   CloudUpload,
+  InfoOutlined,
 } from "@mui/icons-material";
 import {
   Box,
@@ -20,6 +21,8 @@ import {
   DialogTitle,
   ToggleButton,
   ToggleButtonGroup,
+  Tooltip,
+  IconButton,
 } from "@mui/material";
 import { Colors } from "design/theme";
 import { useAppSelector } from "hooks/useAppSelector";
@@ -168,7 +171,48 @@ const BidsConverterPage: React.FC = () => {
             Back
           </Button>
           <Box>
-            <Typography variant="h5">BIDS Converter</Typography>
+            <Box display="flex" alignItems="center" gap={0.5}>
+              <Typography variant="h5">BIDS Converter</Typography>
+              <Tooltip
+                title={
+                  <Box>
+                    <Typography variant="body2" fontWeight={600} mb={0.5}>How to use:</Typography>
+                    <Typography variant="body2" component="ol" sx={{ pl: 2, m: 0 }}>
+                      <li>Drop your dataset files into the workspace.</li>
+                      <li>Enter the number of subjects, modality, and base directory path.</li>
+                      <li>The AI will analyze your files and generate a BIDS conversion plan.</li>
+                      <li>Download and run the script locally to reorganize your data into BIDS format.</li>
+                    </Typography>
+                  </Box>
+                }
+                placement="bottom-start"
+                arrow
+                componentsProps={{
+                  tooltip: {
+                    sx: {
+                      backgroundColor: "white",
+                      color: Colors.darkPurple,
+                      border: `1px solid ${Colors.lightGray}`,
+                      boxShadow: 3,
+                      fontSize: "0.875rem",
+                      lineHeight: 1.5,
+                      p: 1.5,
+                      maxWidth: 320,
+                    },
+                  },
+                  arrow: {
+                    sx: {
+                      color: "white",
+                      "&::before": { border: `1px solid ${Colors.lightGray}` },
+                    },
+                  },
+                }}
+              >
+                <IconButton size="small" sx={{ color: Colors.purple, p: 0 }}>
+                  <InfoOutlined fontSize="small" />
+                </IconButton>
+              </Tooltip>
+            </Box>
             <Typography variant="body2" color="text.secondary">
               Organize and rename your dataset files into BIDS format
             </Typography>
@@ -180,14 +224,13 @@ const BidsConverterPage: React.FC = () => {
             variant="contained"
             startIcon={<Psychology />}
             onClick={() => setShowLLMPanel(!showLLMPanel)}
-            disabled={files.length === 0}
             sx={{
               backgroundColor: Colors.purple,
               color: Colors.lightGray,
               "&:hover": { backgroundColor: Colors.purple, border: "none" },
             }}
           >
-            Generate BIDS Plan
+            AI Assistant
           </Button>
           <Button
             variant="contained"
@@ -292,6 +335,7 @@ const BidsConverterPage: React.FC = () => {
               setTrioGenerated={setTrioGenerated}
               updateFiles={updateFiles}
               onClose={() => setShowLLMPanel(false)}
+              isPrivateMode={mode === "private"}
             />
           )}
         </Box>

From b0237116778ddae4c2442de28e5a1614d8db1acd Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 15:36:25 -0400
Subject: [PATCH 50/61] feat(llm-panel): improve AI Assistant UI labels and UX

---
 .../Dashboard/DatasetOrganizer/FileTree.tsx   |  2 +-
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 34 +++++++------------
 2 files changed, 14 insertions(+), 22 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx b/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx
index 29c0bd5..c4e3db9 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx
@@ -636,7 +636,7 @@ const FileTree: React.FC<FileTreeProps> = ({
                   variant="caption"
                   sx={{ color: Colors.darkGreen, fontWeight: 600 }}
                 >
-                  Saved Outputs
+                  BIDS Conversion Package Preview
                 </Typography>
               </Box>
               {outputFiles
diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index 1e49428..bb8d69a 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -1106,7 +1106,10 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
   const handleSaveZip = async () => {
     // Add output files to VFS
     const timestamp = new Date().toLocaleString();
-    const zipLabel = `bids_output_${new Date().toISOString().slice(0, 10)}`;
+    const now = new Date();
+    const isoNow = now.toISOString(); // UTC for both parts; toTimeString() is local and could contradict the UTC date
+    const [dateStr, timeStr] = [isoNow.slice(0, 10), isoNow.slice(11, 19).replace(/:/g, "-")];
+    const zipLabel = `bids_output_${dateStr}_${timeStr}`;
     const outputFiles: FileItem[] = [];
 
     const folderId = generateId();
@@ -1214,7 +1217,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
     });
 
     updateFiles((prev) => [...prev, ...outputFiles]);
-    setStatus(isPrivateMode ? "✓ Saved to VFS." : "✓ Saved to VFS. Click 'Save Changes' to persist to database.");
+    setStatus(isPrivateMode ? "✓ Added to file tree." : "✓ Added to file tree. Click 'Save Changes' to persist to database.");
   };
   // const handleSaveZip = async () => {
   //   const zip = new JSZip();
@@ -1704,8 +1707,6 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
             <Button
               size="small"
               startIcon={<ContentCopy />}
-              // onClick={handleCopy}
-              // disabled={!generatedScript}
               onClick={() =>
                 navigator.clipboard.writeText(bidsPlan || generatedScript)
               }
@@ -1713,23 +1714,12 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
             >
               Copy
             </Button>
-            {/* <Button
-              size="small"
-              startIcon={<Download />}
-              // onClick={handleDownload}
-              // disabled={!generatedScript}
-              onClick={bidsPlan ? handleDownloadPlan : handleDownload}
-              disabled={!bidsPlan && !generatedScript}
-            >
-              {bidsPlan ? "Download BIDSPlan.yaml" : "Download Script"}
-            </Button> */}
             <Button
               size="small"
               startIcon={<Download />}
               onClick={handleDownloadPackage}
               disabled={!bidsPlan && !generatingTrio}
             >
-              {/* Download */}
               Download zip file for convert
             </Button>
             <Button
@@ -1739,7 +1729,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               disabled={!bidsPlan || !trioGenerated}
               sx={{ color: Colors.darkGreen, borderColor: Colors.darkGreen }}
             >
-              Save to Virtual File System
+              Preview in File Tree
             </Button>
           </Box>
 
@@ -1755,11 +1745,13 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               color: "#d4d4d4",
             }}
           >
-            {/* {generatedScript ||
-              'Configure your LLM provider and click "Generate Script"...'} */}
-            {bidsPlan ||
-              generatedScript ||
-              'Configure your LLM provider and click "Generate BIDSPlan.yaml"...'}
+            {bidsPlan || generatedScript || (
+              <span style={{ color: status && !error ? "#9cdcfe" : "#aaaaaa" }}>
+                {status && !error
+                  ? status
+                  : 'Fill in the fields on the left and follow the steps to generate your conversion package...'}
+              </span>
+            )}
           </Paper>
         </Box>
       </Box>

From cf2e445020ad22e35524d506a43976fb4c666694 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 16:11:17 -0400
Subject: [PATCH 51/61] fix(llm-panel): clear bidsPlan on step 2 re-run so
 progress shows in output panel

---
 src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx | 1 +
 src/components/User/Dashboard/DatasetOrganizer/index.tsx    | 4 ++--
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index bb8d69a..6b3c007 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -218,6 +218,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
     setAbortController(controller);
     setGeneratingTrio(true);
     setError(null);
+    setBidsPlan("");
     setStatus("Generating BIDS trio files...");
 
     try {
diff --git a/src/components/User/Dashboard/DatasetOrganizer/index.tsx b/src/components/User/Dashboard/DatasetOrganizer/index.tsx
index 39c2f45..5a361a9 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/index.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/index.tsx
@@ -282,7 +282,7 @@ const DatasetOrganizer: React.FC = () => {
           >
             AI Assistant
           </Button>
-          {/* <Button
+          <Button
             variant="contained"
             startIcon={<GetApp />}
             onClick={handleExportJSON}
@@ -297,7 +297,7 @@ const DatasetOrganizer: React.FC = () => {
             }}
           >
             Export JSON
-          </Button> */}
+          </Button>
           <Button
             variant="contained"
             startIcon={<Save />}

From 028ee237f54516e6f68607b418dcc254bab39f0f Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 17:48:34 -0400
Subject: [PATCH 52/61] feat(llm-panel): UI polish for file tree and output
 panel

---
 .../Dashboard/DatasetOrganizer/FileTree.tsx   |  7 +++----
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 19 ++++++++++++++-----
 2 files changed, 17 insertions(+), 9 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx b/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx
index c4e3db9..0dbcf90 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/FileTree.tsx
@@ -522,7 +522,7 @@ const FileTree: React.FC<FileTreeProps> = ({
           }}
         >
           <Box>
-            <Typography variant="subtitle2" fontWeight="600">
+            <Typography variant="subtitle2" fontWeight={800}>
               Virtual File System
             </Typography>
             <Typography variant="caption" color="text.secondary">
@@ -631,10 +631,9 @@ const FileTree: React.FC<FileTreeProps> = ({
                   borderColor: "divider",
                 }}
               >
-                <FolderSpecial sx={{ color: Colors.darkGreen, fontSize: 16 }} />
                 <Typography
-                  variant="caption"
-                  sx={{ color: Colors.darkGreen, fontWeight: 600 }}
+                  variant="body2"
+                  sx={{ color: Colors.darkPurple, fontWeight: 400 }}
                 >
                   BIDS Conversion Package Preview
                 </Typography>
diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index 6b3c007..a37ba9e 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -293,7 +293,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
 
       setTrioGenerated(true);
       setStatus(
-        "✓ BIDS trio files generated and added to Virtual File System!"
+        "✓ BIDS metadata files generated and added to file tree!"
       );
     } catch (err: any) {
       if (err.name === "AbortError") {
@@ -1705,7 +1705,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
         {/* Right: Generated Script */}
         <Box sx={{ flex: 1, display: "flex", flexDirection: "column", p: 2 }}>
           <Box sx={{ display: "flex", gap: 1, mb: 2 }}>
-            <Button
+            {/* <Button
               size="small"
               startIcon={<ContentCopy />}
               onClick={() =>
@@ -1714,12 +1714,17 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               disabled={!bidsPlan && !generatedScript}
             >
               Copy
-            </Button>
+            </Button> */}
             <Button
               size="small"
               startIcon={<Download />}
               onClick={handleDownloadPackage}
               disabled={!bidsPlan && !generatingTrio}
+              sx={{
+                color: Colors.purple,
+                borderColor: Colors.purple,
+                "&:hover": { borderColor: Colors.purple },
+              }}
             >
               Download zip file for convert
             </Button>
@@ -1728,9 +1733,13 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               startIcon={<DriveFileMove />}
               onClick={handleSaveZip}
               disabled={!bidsPlan || !trioGenerated}
-              sx={{ color: Colors.darkGreen, borderColor: Colors.darkGreen }}
+              sx={{
+                color: Colors.purple,
+                borderColor: Colors.purple,
+                "&:hover": { borderColor: Colors.purple },
+              }}
             >
-              Preview in File Tree
+              Preview Conversion Package in File Tree
             </Button>
           </Box>
 

From 60f51ade5d684d0c1eafcd5c647ac7a5f1d7aded Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 17:56:39 -0400
Subject: [PATCH 53/61] feat(ollama): require authentication on Ollama proxy
 endpoints

---
 backend/src/routes/ollama.routes.js | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/backend/src/routes/ollama.routes.js b/backend/src/routes/ollama.routes.js
index ff1fd94..38bdcb4 100644
--- a/backend/src/routes/ollama.routes.js
+++ b/backend/src/routes/ollama.routes.js
@@ -1,8 +1,9 @@
 const express = require("express");
 const router = express.Router();
 const { proxyChat, getTags } = require("../controllers/ollama.controller");
+const { requireAuth } = require("../middleware/auth.middleware");
 
-router.post("/chat", proxyChat);
-router.get("/tags", getTags);
+router.post("/chat", requireAuth, proxyChat);
+router.get("/tags", requireAuth, getTags);
 
 module.exports = router;

From 68218d5b000149565f7f86f05aaf775235376ef9 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Wed, 27 May 2026 18:11:41 -0400
Subject: [PATCH 54/61] feat(ollama): add public endpoint with 10 requests/day
 IP rate limit

---
 backend/package-lock.json                  | 26 ++++++++++++++++++----
 backend/package.json                       |  1 +
 backend/src/routes/ollama.public.routes.js | 17 ++++++++++++++
 backend/src/server.js                      |  2 ++
 4 files changed, 42 insertions(+), 4 deletions(-)
 create mode 100644 backend/src/routes/ollama.public.routes.js

diff --git a/backend/package-lock.json b/backend/package-lock.json
index 70f2f74..9bb2c58 100644
--- a/backend/package-lock.json
+++ b/backend/package-lock.json
@@ -15,6 +15,7 @@
         "cors": "^2.8.5",
         "dotenv": "^17.2.3",
         "express": "^5.1.0",
+        "express-rate-limit": "^8.5.2",
         "jsonwebtoken": "^9.0.2",
         "nanoid": "^3.3.11",
         "nodemailer": "^7.0.11",
@@ -1181,6 +1182,24 @@
         "url": "https://opencollective.com/express"
       }
     },
+    "node_modules/express-rate-limit": {
+      "version": "8.5.2",
+      "resolved": "https://registry.npmjs.org/express-rate-limit/-/express-rate-limit-8.5.2.tgz",
+      "integrity": "sha512-5Kb34ipNX694DH48vN9irak1Qx30nb0PLYHXfJgw4YEjiC3ZEmZJhwOp+VfiCYwFzvFTdB9QkArYS5kXa2cx2A==",
+      "license": "MIT",
+      "dependencies": {
+        "ip-address": "^10.2.0"
+      },
+      "engines": {
+        "node": ">= 16"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/express-rate-limit"
+      },
+      "peerDependencies": {
+        "express": ">= 4.11"
+      }
+    },
     "node_modules/file-uri-to-path": {
       "version": "1.0.0",
       "resolved": "https://registry.npmjs.org/file-uri-to-path/-/file-uri-to-path-1.0.0.tgz",
@@ -1742,11 +1761,10 @@
       "license": "ISC"
     },
     "node_modules/ip-address": {
-      "version": "10.0.1",
-      "resolved": "https://registry.npmjs.org/ip-address/-/ip-address-10.0.1.tgz",
-      "integrity": "sha512-NWv9YLW4PoW2B7xtzaS3NCot75m6nK7Icdv0o3lfMceJVRfSoQwqD4wEH5rLwoKJwUiZ/rfpiVBhnaF0FK4HoA==",
+      "version": "10.2.0",
+      "resolved": "https://registry.npmjs.org/ip-address/-/ip-address-10.2.0.tgz",
+      "integrity": "sha512-/+S6j4E9AHvW9SWMSEY9Xfy66O5PWvVEJ08O0y5JGyEKQpojb0K0GKpz/v5HJ/G0vi3D2sjGK78119oXZeE0qA==",
       "license": "MIT",
-      "optional": true,
       "engines": {
         "node": ">= 12"
       }
diff --git a/backend/package.json b/backend/package.json
index fa156b3..45f386a 100644
--- a/backend/package.json
+++ b/backend/package.json
@@ -29,6 +29,7 @@
     "cors": "^2.8.5",
     "dotenv": "^17.2.3",
     "express": "^5.1.0",
+    "express-rate-limit": "^8.5.2",
     "jsonwebtoken": "^9.0.2",
     "nanoid": "^3.3.11",
     "nodemailer": "^7.0.11",
diff --git a/backend/src/routes/ollama.public.routes.js b/backend/src/routes/ollama.public.routes.js
new file mode 100644
index 0000000..e9fc0f1
--- /dev/null
+++ b/backend/src/routes/ollama.public.routes.js
@@ -0,0 +1,17 @@
+const express = require("express");
+const router = express.Router();
+const rateLimit = require("express-rate-limit");
+const { proxyChat, getTags } = require("../controllers/ollama.controller");
+
+const dailyLimit = rateLimit({
+  windowMs: 24 * 60 * 60 * 1000, // 24 hours
+  max: 10,
+  standardHeaders: true,
+  legacyHeaders: false,
+  message: { error: "Daily request limit reached. You can send up to 10 requests per day from this IP." },
+});
+
+router.post("/chat", dailyLimit, proxyChat);
+router.get("/tags", dailyLimit, getTags);
+
+module.exports = router;
diff --git a/backend/src/server.js b/backend/src/server.js
index 5e6cb6c..d0d043d 100644
--- a/backend/src/server.js
+++ b/backend/src/server.js
@@ -14,6 +14,7 @@ const datasetsRoutes = require("./routes/datasets.routes");
 const collectionRoutes = require("./routes/collection.route");
 const projectRoutes = require("./routes/projects.routes");
 const ollamaRoutes = require("./routes/ollama.routes");
+const ollamaPublicRoutes = require("./routes/ollama.public.routes");
 
 const app = express();
 const PORT = process.env.PORT || 5000;
@@ -51,6 +52,7 @@ app.use("/api/v1/datasets", datasetsRoutes);
 app.use("/api/v1/collections", collectionRoutes);
 app.use("/api/v1/projects", projectRoutes);
 app.use("/api/v1/ollama", ollamaRoutes);
+app.use("/api/v1/ollama-public", ollamaPublicRoutes);
 
 // health check endpoint
 app.get("/api/health", async (req, res) => {

From 1aa509af696ef0b92f28489b31b5f08276a7f014 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 29 May 2026 11:31:07 -0400
Subject: [PATCH 55/61] feat(llm-panel): add local Ollama provider for private
 mode with configurable URL

---
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 36 +++++++++++++------
 1 file changed, 25 insertions(+), 11 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index a37ba9e..d858c35 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -73,7 +73,18 @@ const llmProviders: Record<string, LLMProvider> = {
       { id: "qwen2.5-coder:7b", name: "Qwen 2.5 Coder 7B" },
     ],
     noApiKey: true,
-    // customUrl: true,
+  },
+  "local-ollama": {
+    name: "Ollama (Your Local Machine)",
+    baseUrl: "http://localhost:11434/v1/chat/completions",
+    models: [
+      { id: "llama3.2:latest", name: "Llama 3.2" },
+      { id: "llama3.1:latest", name: "Llama 3.1" },
+      { id: "qwen2.5-coder:latest", name: "Qwen 2.5 Coder" },
+      { id: "mistral:latest", name: "Mistral" },
+      { id: "gemma3:latest", name: "Gemma 3" },
+    ],
+    noApiKey: true,
   },
   groq: {
     name: "Groq (Free API Key - 14,400 req/day)",
@@ -129,8 +140,9 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
   onClose,
   isPrivateMode = false,
 }) => {
-  const [provider, setProvider] = useState<string>(isPrivateMode ? "groq" : "ollama");
-  const [model, setModel] = useState<string>(isPrivateMode ? "llama-3.3-70b-versatile" : "qwen3-coder-next:latest");
+  const [provider, setProvider] = useState<string>(isPrivateMode ? "local-ollama" : "ollama");
+  const [model, setModel] = useState<string>(isPrivateMode ? "llama3.2:latest" : "qwen3-coder-next:latest");
+  const [localOllamaUrl, setLocalOllamaUrl] = useState<string>("http://localhost:11434");
   // const [ollamaUrl, setOllamaUrl] = useState<string>(
   //   "http://jin.neu.edu:11434"
   // );
@@ -160,7 +172,9 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
     provider,
     model,
     apiKey,
-    baseUrl: currentProvider.baseUrl,
+    baseUrl: provider === "local-ollama"
+      ? `${localOllamaUrl.trim().replace(/\/+$/, "")}/v1/chat/completions` // tolerate trailing slash/whitespace in the user-entered URL
+      : currentProvider.baseUrl,
     isAnthropic: currentProvider.isAnthropic,
     noApiKey: currentProvider.noApiKey,
   });
@@ -1421,7 +1435,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               }}
             >
               {Object.entries(llmProviders)
-                .filter(([key]) => !(isPrivateMode && key === "ollama"))
+                .filter(([key]) => isPrivateMode ? key !== "ollama" : key !== "local-ollama")
                 .map(([key, p]) => (
                   <MenuItem key={key} value={key}>
                     {p.name}
@@ -1445,17 +1459,17 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
             </Select>
           </FormControl>
 
-          {/* Ollama Server URL field */}
-          {/* {provider === "ollama" && (
+          {provider === "local-ollama" && (
             <TextField
               fullWidth
-              label="Ollama Server URL"
-              value={ollamaUrl}
-              onChange={(e) => setOllamaUrl(e.target.value)}
+              label="Ollama URL"
+              value={localOllamaUrl}
+              onChange={(e) => setLocalOllamaUrl(e.target.value)}
               placeholder="http://localhost:11434"
+              helperText="Default port is 11434. Change if your Ollama runs on a different port."
               sx={{ mb: 2 }}
             />
-          )} */}
+          )}
           {/* Base Directory Path field (shows for ALL providers) */}
           <TextField
             fullWidth

From 72b6b973cec1b27cc0db725619bdc336b988395f Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 29 May 2026 11:42:20 -0400
Subject: [PATCH 56/61] feat(navbar): add AutoBIDSify dropdown with GitHub link
 and web app; update dialog title and description

---
 src/components/NavBar/NavItems.tsx | 92 ++++++++++++++++++++++++++++--
 src/pages/BidsConverterPage.tsx    |  5 +-
 2 files changed, 92 insertions(+), 5 deletions(-)

diff --git a/src/components/NavBar/NavItems.tsx b/src/components/NavBar/NavItems.tsx
index c102bcf..bfbb9b3 100644
--- a/src/components/NavBar/NavItems.tsx
+++ b/src/components/NavBar/NavItems.tsx
@@ -35,11 +35,13 @@ const NavItems: React.FC = () => {
   const [signupOpen, setSignupOpen] = useState(false);
 
   // Resources dropdown state
-  const [resourcesAnchor, setResourcesAnchor] = useState<null | HTMLElement>(
-    null
-  );
+  const [resourcesAnchor, setResourcesAnchor] = useState<null | HTMLElement>(null);
   const resourcesOpen = Boolean(resourcesAnchor);
 
+  // AutoBIDSify dropdown state
+  const [autobidsifyAnchor, setAutobidsifyAnchor] = useState<null | HTMLElement>(null);
+  const autobidsifyOpen = Boolean(autobidsifyAnchor);
+
   const handleLogout = () => {
     dispatch(logoutUser());
     navigate("/");
@@ -53,6 +55,14 @@ const NavItems: React.FC = () => {
     setResourcesAnchor(null);
   };
 
+  const handleAutobidsifyClick = (event: React.MouseEvent<HTMLElement>) => {
+    setAutobidsifyAnchor(event.currentTarget);
+  };
+
+  const handleAutobidsifyClose = () => {
+    setAutobidsifyAnchor(null);
+  };
+
   const resourcesMenu = [
     {
       category: "Converter",
@@ -319,7 +329,6 @@ const NavItems: React.FC = () => {
             { text: "Wiki", url: "https://neurojson.org/Wiki" },
             { text: "Search", url: RoutesEnum.SEARCH },
             { text: "Databases", url: RoutesEnum.DATABASES },
-            { text: "BIDS Converter", url: RoutesEnum.BIDS_CONVERTER },
           ].map(({ text, url }) => (
             <Grid item key={text}>
               {url?.startsWith("https") ? (
@@ -379,6 +388,38 @@ const NavItems: React.FC = () => {
             </Grid>
           ))}
 
+          {/* AutoBIDSify Dropdown */}
+          <Grid item>
+            <Box
+              onClick={handleAutobidsifyClick}
+              sx={{ display: "flex", alignItems: "center", gap: 0.5, cursor: "pointer" }}
+            >
+              <Typography
+                align="center"
+                fontWeight={600}
+                lineHeight={"1.5rem"}
+                letterSpacing={"0.05rem"}
+                sx={{
+                  fontSize: { xs: "0.8rem", sm: "1rem" },
+                  color: Colors.white,
+                  transition: "color 0.3s ease, transform 0.3s ease",
+                  textTransform: "uppercase",
+                  "&:hover": { transform: "scale(1.2)" },
+                }}
+              >
+                AutoBIDSify
+              </Typography>
+              <KeyboardArrowDownIcon
+                sx={{
+                  color: Colors.white,
+                  fontSize: "1.2rem",
+                  transition: "transform 0.3s ease",
+                  transform: autobidsifyOpen ? "rotate(180deg)" : "rotate(0deg)",
+                }}
+              />
+            </Box>
+          </Grid>
+
           {/* Resources Dropdown */}
           <Grid item>
             <Box
@@ -512,6 +553,49 @@ const NavItems: React.FC = () => {
           </Box>
         ))}
       </Menu>
+
+      {/* AutoBIDSify Dropdown Menu */}
+      <Menu
+        anchorEl={autobidsifyAnchor}
+        open={autobidsifyOpen}
+        onClose={handleAutobidsifyClose}
+        PaperProps={{
+          sx: {
+            bgcolor: Colors.darkPurple,
+            color: Colors.white,
+            minWidth: "220px",
+            mt: 1,
+          },
+        }}
+      >
+        <MenuItem
+          onClick={() => {
+            window.open("https://github.com/COTILab/autobidsify", "_blank", "noopener,noreferrer"); // external tab gets no window.opener handle
+            handleAutobidsifyClose();
+          }}
+          sx={{
+            fontSize: "0.9rem",
+            color: Colors.white,
+            "&:hover": { bgcolor: Colors.purpleGrey, color: Colors.darkPurple },
+          }}
+        >
+          AutoBIDSify (GitHub)
+        </MenuItem>
+        <MenuItem
+          onClick={() => {
+            navigate(RoutesEnum.BIDS_CONVERTER);
+            handleAutobidsifyClose();
+          }}
+          sx={{
+            fontSize: "0.9rem",
+            color: Colors.white,
+            "&:hover": { bgcolor: Colors.purpleGrey, color: Colors.darkPurple },
+          }}
+        >
+          AutoBIDSify Web
+        </MenuItem>
+      </Menu>
+
       <UserLogin
         open={loginOpen}
         onClose={() => setLoginOpen(false)}
diff --git a/src/pages/BidsConverterPage.tsx b/src/pages/BidsConverterPage.tsx
index 70b4a46..b528567 100644
--- a/src/pages/BidsConverterPage.tsx
+++ b/src/pages/BidsConverterPage.tsx
@@ -353,9 +353,12 @@ const BidsConverterPage: React.FC = () => {
       {/* Welcome dialog — shown on first load before user starts working */}
       <Dialog open={!modeChosen} maxWidth="sm" fullWidth>
         <DialogTitle sx={{ textAlign: "center", pt: 4 }}>
-          How would you like to use BIDS Converter?
+          How would you like to use AutoBIDSify?
         </DialogTitle>
         <DialogContent>
+          <Typography variant="body2" color="text.secondary" textAlign="center" sx={{ mb: 2 }}>
+            An LLM-powered tool for automatically converting neuroimaging datasets into BIDS-compliant format.
+          </Typography>
           <Box
             sx={{
               display: "flex",

From f344482b7f478bb498f87da67bd60ea6774d8ee2 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 29 May 2026 11:59:49 -0400
Subject: [PATCH 57/61] feat(autobidsify): rebrand BIDS Converter to
 AutoBIDSify with navbar dropdown, updated labels, and GitHub links

---
 .../User/Dashboard/DatasetOrganizer/index.tsx | 51 +++++++++++++++++++
 src/components/User/Dashboard/ProjectsTab.tsx |  4 +-
 src/pages/BidsConverterPage.tsx               | 22 ++++++--
 src/types/routes.enum.ts                      |  2 +-
 4 files changed, 73 insertions(+), 6 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/index.tsx b/src/components/User/Dashboard/DatasetOrganizer/index.tsx
index 5a361a9..796fbaa 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/index.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/index.tsx
@@ -14,6 +14,8 @@ import {
   DialogContent,
   DialogActions,
   DialogContentText,
+  Chip,
+  Tooltip,
 } from "@mui/material";
 import { Colors } from "design/theme";
 import { useAppDispatch } from "hooks/useAppDispatch";
@@ -263,6 +265,55 @@ const DatasetOrganizer: React.FC = () => {
                 {currentProject.description}
               </Typography>
             )}
+            <Tooltip
+              title={
+                <Box>
+                  <Typography variant="body2">An LLM-powered tool for automatically converting neuroimaging datasets into BIDS-compliant format.</Typography>
+                  <Typography
+                    variant="body2"
+                    sx={{ color: Colors.purple, cursor: "pointer", mt: 0.5, textDecoration: "underline" }}
+                    onClick={() => window.open("https://github.com/COTILab/autobidsify", "_blank", "noopener,noreferrer")} // external tab gets no window.opener handle
+                  >
+                    Learn more
+                  </Typography>
+                </Box>
+              }
+              placement="bottom-start"
+              arrow
+              componentsProps={{
+                tooltip: {
+                  sx: {
+                    backgroundColor: "white",
+                    color: Colors.darkPurple,
+                    border: `1px solid ${Colors.lightGray}`,
+                    boxShadow: 3,
+                    fontSize: "0.875rem",
+                    p: 1.5,
+                    maxWidth: 320,
+                  },
+                },
+                arrow: {
+                  sx: {
+                    color: "white",
+                    "&::before": { border: `1px solid ${Colors.lightGray}` },
+                  },
+                },
+              }}
+            >
+              <Chip
+                label="Powered by AutoBIDSify"
+                size="small"
+                onClick={() => window.open("https://github.com/COTILab/autobidsify", "_blank", "noopener,noreferrer")} // external tab gets no window.opener handle
+                sx={{
+                  mt: 0.5,
+                  backgroundColor: Colors.purple,
+                  color: Colors.white,
+                  fontSize: "0.7rem",
+                  cursor: "pointer",
+                  "&:hover": { backgroundColor: Colors.secondaryPurple },
+                }}
+              />
+            </Tooltip>
           </Box>
         </Box>
 
diff --git a/src/components/User/Dashboard/ProjectsTab.tsx b/src/components/User/Dashboard/ProjectsTab.tsx
index 6095c9b..ceaa91b 100644
--- a/src/components/User/Dashboard/ProjectsTab.tsx
+++ b/src/components/User/Dashboard/ProjectsTab.tsx
@@ -199,10 +199,10 @@ const ProjectsTab: React.FC<ProjectsTabProps> = ({ userId }) => {
       >
         <Box>
           <Typography variant="h6" gutterBottom>
-            Dataset Organizer Projects
+            AutoBIDSify Projects
           </Typography>
           <Typography variant="body2" color="text.secondary">
-            Organize and convert your neuroimaging datasets to BIDS format
+            Organize and convert your neuroimaging datasets to BIDS format using AutoBIDSify
           </Typography>
         </Box>
         <Button
diff --git a/src/pages/BidsConverterPage.tsx b/src/pages/BidsConverterPage.tsx
index b528567..54bc8aa 100644
--- a/src/pages/BidsConverterPage.tsx
+++ b/src/pages/BidsConverterPage.tsx
@@ -172,7 +172,7 @@ const BidsConverterPage: React.FC = () => {
           </Button>
           <Box>
             <Box display="flex" alignItems="center" gap={0.5}>
-              <Typography variant="h5">BIDS Converter</Typography>
+              <Typography variant="h5">AutoBIDSify</Typography>
               <Tooltip
                 title={
                   <Box>
@@ -214,7 +214,15 @@ const BidsConverterPage: React.FC = () => {
               </Tooltip>
             </Box>
             <Typography variant="body2" color="text.secondary">
-              Organize and rename your dataset files into BIDS format
+              An LLM-powered tool for automatically converting neuroimaging datasets into BIDS-compliant format.{" "}
+              <Typography
+                component="span"
+                variant="body2"
+                onClick={() => window.open("https://github.com/COTILab/autobidsify", "_blank", "noopener,noreferrer")} // external tab gets no window.opener handle
+                sx={{ color: Colors.purple, cursor: "pointer", textDecoration: "underline" }}
+              >
+                Learn more
+              </Typography>
             </Typography>
           </Box>
         </Box>
@@ -357,7 +365,15 @@ const BidsConverterPage: React.FC = () => {
         </DialogTitle>
         <DialogContent>
           <Typography variant="body2" color="text.secondary" textAlign="center" sx={{ mb: 2 }}>
-            An LLM-powered tool for automatically converting neuroimaging datasets into BIDS-compliant format.
+            An LLM-powered tool for automatically converting neuroimaging datasets into BIDS-compliant format.{" "}
+            <Typography
+              component="span"
+              variant="body2"
+              onClick={() => window.open("https://github.com/COTILab/autobidsify", "_blank", "noopener,noreferrer")} // external tab gets no window.opener handle
+              sx={{ color: Colors.purple, cursor: "pointer", textDecoration: "underline" }}
+            >
+              Learn more
+            </Typography>
           </Typography>
           <Box
             sx={{
diff --git a/src/types/routes.enum.ts b/src/types/routes.enum.ts
index a774051..e8c2658 100644
--- a/src/types/routes.enum.ts
+++ b/src/types/routes.enum.ts
@@ -4,6 +4,6 @@ enum RoutesEnum {
   SEARCH = "/search", // New route for the search page
   ABOUT = "/about", // New route for the about page
   DASHBOARD = "/dashboard",
-  BIDS_CONVERTER = "/bids-converter",
+  BIDS_CONVERTER = "/autobidsify",
 }
 export default RoutesEnum;

From a69ff4a592707cc20151ccdf1c2aec2dccea607a Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 29 May 2026 12:14:11 -0400
Subject: [PATCH 58/61] feat(llm-panel): add local AI support for Ollama, LM
 Studio, and Jan with custom model input

---
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 38 +++++++++++++++----
 1 file changed, 31 insertions(+), 7 deletions(-)

diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index d858c35..84e1a7a 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -75,14 +75,19 @@ const llmProviders: Record<string, LLMProvider> = {
     noApiKey: true,
   },
   "local-ollama": {
-    name: "Ollama (Your Local Machine)",
+    name: "Local AI (Ollama / LM Studio / Jan)",
     baseUrl: "http://localhost:11434/v1/chat/completions",
     models: [
-      { id: "llama3.2:latest", name: "Llama 3.2" },
-      { id: "llama3.1:latest", name: "Llama 3.1" },
-      { id: "qwen2.5-coder:latest", name: "Qwen 2.5 Coder" },
-      { id: "mistral:latest", name: "Mistral" },
-      { id: "gemma3:latest", name: "Gemma 3" },
+      { id: "llama3.2:latest", name: "Llama 3.2 (Ollama)" },
+      { id: "llama3.1:latest", name: "Llama 3.1 (Ollama)" },
+      { id: "qwen2.5-coder:latest", name: "Qwen 2.5 Coder (Ollama)" },
+      { id: "mistral:latest", name: "Mistral (Ollama)" },
+      { id: "gemma3:latest", name: "Gemma 3 (Ollama)" },
+      { id: "llama-3.2-3b-instruct", name: "Llama 3.2 3B (LM Studio)" },
+      { id: "llama-3.1-8b-instruct", name: "Llama 3.1 8B (LM Studio)" },
+      { id: "mistral-7b-instruct-v0.3", name: "Mistral 7B (LM Studio)" },
+      { id: "llama3.2:3b", name: "Llama 3.2 3B (Jan)" },
+      { id: "mistral:7b", name: "Mistral 7B (Jan)" },
     ],
     noApiKey: true,
   },
@@ -1459,6 +1464,25 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
             </Select>
           </FormControl>
 
+          {provider === "local-ollama" && (
+            <TextField
+              fullWidth
+              label="Custom Model Name (optional)"
+              placeholder="e.g. llama3:8b, phi3:mini, qwen2.5:7b"
+              helperText="Overrides the model selected above."
+              sx={{ mb: 2 }}
+              onChange={(e) => { // a cleared field falls back to the provider's first preset instead of keeping a stale partial name
+                setModel(e.target.value.trim() || (currentProvider.models[0]?.id ?? model));
+              }}
+            />
+          )}
+
+          {isPrivateMode && provider !== "local-ollama" && (
+            <Alert severity="warning" sx={{ mb: 2, fontSize: "0.8rem" }}>
+              Your file information will be sent to <strong>{currentProvider.name}</strong>, an external AI service. Switch to <strong>Local AI (Ollama / LM Studio / Jan)</strong> to keep everything local.
+            </Alert>
+          )}
+
           {provider === "local-ollama" && (
             <TextField
               fullWidth
@@ -1466,7 +1490,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               value={localOllamaUrl}
               onChange={(e) => setLocalOllamaUrl(e.target.value)}
               placeholder="http://localhost:11434"
-              helperText="Default port is 11434. Change if your Ollama runs on a different port."
+              helperText="Ollama: port 11434 · LM Studio: port 1234 · Jan: port 1337"
               sx={{ mb: 2 }}
             />
           )}

From 1dfc255dbdef999b7db756ad0d737149a21f0e22 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 29 May 2026 12:46:13 -0400
Subject: [PATCH 59/61] feat(ollama): use qwen3.6:27b on server for LLM, hide
 model selector

---
 backend/src/controllers/ollama.controller.js  |  5 +++--
 backend/src/routes/ollama.public.routes.js    |  2 +-
 backend/src/routes/ollama.routes.js           |  2 +-
 .../Dashboard/DatasetOrganizer/LLMPanel.tsx   | 22 +++++++++++++------
 4 files changed, 20 insertions(+), 11 deletions(-)

diff --git a/backend/src/controllers/ollama.controller.js b/backend/src/controllers/ollama.controller.js
index 84bb3bb..fe0c4e8 100644
--- a/backend/src/controllers/ollama.controller.js
+++ b/backend/src/controllers/ollama.controller.js
@@ -1,12 +1,13 @@
 const OLLAMA_BASE_URL = "http://jin.neu.edu:11434";
+const OLLAMA_MODEL = "qwen3.6:27b";
 
 const proxyChat = async (req, res) => {
-  console.log("🟣 [Ollama] proxyChat hit — model:", req.body.model);
+  console.log("🟣 [Ollama] proxyChat hit — model:", OLLAMA_MODEL);
   try {
     const response = await fetch(`${OLLAMA_BASE_URL}/v1/chat/completions`, {
       method: "POST",
       headers: { "Content-Type": "application/json" },
-      body: JSON.stringify(req.body),
+      body: JSON.stringify({ ...req.body, model: OLLAMA_MODEL }),
     });
 
     const data = await response.json();
diff --git a/backend/src/routes/ollama.public.routes.js b/backend/src/routes/ollama.public.routes.js
index e9fc0f1..b8981a0 100644
--- a/backend/src/routes/ollama.public.routes.js
+++ b/backend/src/routes/ollama.public.routes.js
@@ -12,6 +12,6 @@ const dailyLimit = rateLimit({
 });
 
 router.post("/chat", dailyLimit, proxyChat);
-router.get("/tags", dailyLimit, getTags);
+// router.get("/tags", dailyLimit, getTags);
 
 module.exports = router;
diff --git a/backend/src/routes/ollama.routes.js b/backend/src/routes/ollama.routes.js
index 38bdcb4..be86d75 100644
--- a/backend/src/routes/ollama.routes.js
+++ b/backend/src/routes/ollama.routes.js
@@ -4,6 +4,6 @@ const { proxyChat, getTags } = require("../controllers/ollama.controller");
 const { requireAuth } = require("../middleware/auth.middleware");
 
 router.post("/chat", requireAuth, proxyChat);
-router.get("/tags", requireAuth, getTags);
+// router.get("/tags", requireAuth, getTags);
 
 module.exports = router;
diff --git a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
index 84e1a7a..c574bf5 100644
--- a/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
+++ b/src/components/User/Dashboard/DatasetOrganizer/LLMPanel.tsx
@@ -62,15 +62,15 @@ interface LLMProvider {
 
 const llmProviders: Record<string, LLMProvider> = {
   ollama: {
-    name: "Ollama (Local Server)",
-    // baseUrl: "http://localhost:11434/v1/chat/completions",
+    name: "Ollama (NeuroJSON Server)",
     baseUrl: "",
     models: [
-      { id: "qwen3-coder-next:latest", name: "Qwen 3 Coder Next" },
-      { id: "qwen3-coder-careful:latest", name: "Qwen 3 Coder Careful" },
-      { id: "qwen3.5:9b", name: "Qwen 3.5 9B" },
-      { id: "qwen2.5-coder:latest", name: "Qwen 2.5 Coder (7.6B)" },
-      { id: "qwen2.5-coder:7b", name: "Qwen 2.5 Coder 7B" },
+      { id: "qwen3.6:27b", name: "Qwen 3.6 27B" },
+      // { id: "qwen3-coder-next:latest", name: "Qwen 3 Coder Next" },
+      // { id: "qwen3-coder-careful:latest", name: "Qwen 3 Coder Careful" },
+      // { id: "qwen3.5:9b", name: "Qwen 3.5 9B" },
+      // { id: "qwen2.5-coder:latest", name: "Qwen 2.5 Coder (7.6B)" },
+      // { id: "qwen2.5-coder:7b", name: "Qwen 2.5 Coder 7B" },
     ],
     noApiKey: true,
   },
@@ -1449,6 +1449,13 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
             </Select>
           </FormControl>
 
+          {provider === "ollama" && (
+            <Typography variant="caption" color="text.secondary" sx={{ mt: -1, mb: 2, display: "block" }}>
+              Using qwen3.6:27b on NeuroJSON server
+            </Typography>
+          )}
+
+          {provider !== "ollama" && (
           <FormControl fullWidth sx={{ mb: 2 }}>
             <InputLabel>Model</InputLabel>
             <Select
@@ -1463,6 +1470,7 @@ const LLMPanel: React.FC<LLMPanelProps> = ({
               ))}
             </Select>
           </FormControl>
+          )}
 
           {provider === "local-ollama" && (
             <TextField

From 34d0260181d896af7a31213824f3282ea8770d89 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Fri, 29 May 2026 12:47:30 -0400
Subject: [PATCH 60/61] fix(ollama): increase public endpoint rate limit to 20
 requests/day

---
 backend/src/routes/ollama.public.routes.js | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/backend/src/routes/ollama.public.routes.js b/backend/src/routes/ollama.public.routes.js
index b8981a0..c395e51 100644
--- a/backend/src/routes/ollama.public.routes.js
+++ b/backend/src/routes/ollama.public.routes.js
@@ -5,10 +5,10 @@ const { proxyChat, getTags } = require("../controllers/ollama.controller");
 
 const dailyLimit = rateLimit({
   windowMs: 24 * 60 * 60 * 1000, // 24 hours
-  max: 10,
+  max: 20,
   standardHeaders: true,
   legacyHeaders: false,
-  message: { error: "Daily request limit reached. You can send up to 10 requests per day from this IP." },
+  message: { error: "Daily request limit reached. You can send up to 20 requests per day from this IP." },
 });
 
 router.post("/chat", dailyLimit, proxyChat);

From 60cfdb0e5050fe33aa20d0ab43de8ddc724884c9 Mon Sep 17 00:00:00 2001
From: elainefan331 <elainefan331@gmail.com>
Date: Mon, 1 Jun 2026 10:42:02 -0400
Subject: [PATCH 61/61] fix(preview): make 2D chart responsive to container
 width

---
 package.json         |   4 +-
 src/utils/preview.js |  22 ++++-
 yarn.lock            | 215 ++++++++++++++++++++++---------------------
 3 files changed, 135 insertions(+), 106 deletions(-)

diff --git a/package.json b/package.json
index 6f414ef..aac37d2 100644
--- a/package.json
+++ b/package.json
@@ -50,13 +50,13 @@
     "react-redux": "^8.1.2",
     "react-router-dom": "^6.15.0",
     "react-scripts": "^5.0.1",
-    "react-syntax-highlighter": "^15.6.1",
+    "react-syntax-highlighter": "16.1.1",
     "sharp": "^0.33.5",
     "stats-js": "^1.0.1",
     "stats.js": "0.17.0",
     "three": "0.145.0",
     "typescript": "^5.1.6",
-    "uplot": "1.6.17",
+    "uplot": "1.6.32",
     "web-vitals": "^2.1.0",
     "xlsx": "^0.18.5"
   },
diff --git a/src/utils/preview.js b/src/utils/preview.js
index 7e4dd6d..231a85e 100644
--- a/src/utils/preview.js
+++ b/src/utils/preview.js
@@ -34,6 +34,7 @@ var lastvolumedata = null;
 var lastvolumedim = [];
 var lastclim = 0;
 var uplotInstance = null;
+var uplotResizeObserver = null;
 var reqid = undefined;
 
 var canvas = null;
@@ -135,6 +136,10 @@ function destroyPreview() {
   lastvolumedata = null;
   texture = undefined;
 
+  if (uplotResizeObserver !== null) {
+    uplotResizeObserver.disconnect();
+    uplotResizeObserver = null;
+  }
   if (uplotInstance !== null) {
     uplotInstance.destroy();
     uplotInstance = null;
@@ -384,7 +389,7 @@ function dopreview(key, idx, isinternal, hastime) {
         // "Preview for " +
         // (isinternal ? intdata[idx][3] : window.extdata[idx][3]),
         "Data Preview",
-      width: 1100,
+      width: Math.max(300, $("#chartpanel").width() - 24),
       height: 400,
       series: [{}, {}],
       axes: [
@@ -507,6 +512,21 @@ function dopreview(key, idx, isinternal, hastime) {
       // });
     }
 
+    // Drop any observer left over from a previous preview before re-attaching.
+    if (uplotResizeObserver !== null) uplotResizeObserver.disconnect();
+    uplotResizeObserver = null;
+    // observe() throws a TypeError on a null target, so only attach when the panel exists.
+    var chartPanelEl = document.getElementById("chartpanel");
+    if (chartPanelEl !== null) {
+      uplotResizeObserver = new ResizeObserver(() => {
+        requestAnimationFrame(() => {
+          if (!uplotInstance) return; // chart may have been destroyed before this frame runs
+          uplotInstance.setSize({ width: Math.max(300, $("#chartpanel").width() - 24), height: 400 });
+        });
+      });
+      uplotResizeObserver.observe(chartPanelEl);
+    }
+
     // for spinner
     // --- Signal React that 2D preview is ready ---
     window.__previewType = "2d";
diff --git a/yarn.lock b/yarn.lock
index e881a21..ec84ee7 100644
--- a/yarn.lock
+++ b/yarn.lock
@@ -1122,7 +1122,7 @@
     "@babel/plugin-transform-modules-commonjs" "^7.27.1"
     "@babel/plugin-transform-typescript" "^7.27.1"
 
-"@babel/runtime@7.26.10", "@babel/runtime@^7.11.2", "@babel/runtime@^7.12.1", "@babel/runtime@^7.12.5", "@babel/runtime@^7.16.3", "@babel/runtime@^7.17.8", "@babel/runtime@^7.18.3", "@babel/runtime@^7.20.13", "@babel/runtime@^7.23.9", "@babel/runtime@^7.3.1", "@babel/runtime@^7.5.5", "@babel/runtime@^7.8.7", "@babel/runtime@^7.9.2":
+"@babel/runtime@7.26.10", "@babel/runtime@^7.11.2", "@babel/runtime@^7.12.1", "@babel/runtime@^7.12.5", "@babel/runtime@^7.16.3", "@babel/runtime@^7.17.8", "@babel/runtime@^7.18.3", "@babel/runtime@^7.20.13", "@babel/runtime@^7.23.9", "@babel/runtime@^7.28.4", "@babel/runtime@^7.5.5", "@babel/runtime@^7.8.7", "@babel/runtime@^7.9.2":
   version "7.26.10"
   resolved "https://registry.yarnpkg.com/@babel/runtime/-/runtime-7.26.10.tgz#a07b4d8fa27af131a633d7b3524db803eb4764c2"
   integrity sha512-2WJMeRQPHKSPemqk/awGrAiuFfzBmOIPXKizAsVhWH9YJqLZ0H+HS4c8loHGgW6utJ3E/ejXQUsiGaQy2NZ9Fw==
@@ -2895,12 +2895,12 @@
   dependencies:
     "@types/node" "*"
 
-"@types/hast@^2.0.0":
-  version "2.3.10"
-  resolved "https://registry.yarnpkg.com/@types/hast/-/hast-2.3.10.tgz#5c9d9e0b304bbb8879b857225c5ebab2d81d7643"
-  integrity sha512-McWspRw8xx8J9HurkVBfYj0xKoE25tOFlHGdx4MJ5xORQrMGZNqJhVQWaIbm6Oyla5kYOXtDiopzKRJzEOkwJw==
+"@types/hast@^3.0.0":
+  version "3.0.4"
+  resolved "https://registry.yarnpkg.com/@types/hast/-/hast-3.0.4.tgz#1d6b39993b82cea6ad783945b0508c25903e15aa"
+  integrity sha512-WPs+bbQw5aCj+x6laNGWLH3wviHtoCv/P3+otBhbOhJgG8qtpdAMlTCxLtsTWA7LH1Oh/bFCHsBn0TPS5m30EQ==
   dependencies:
-    "@types/unist" "^2"
+    "@types/unist" "*"
 
 "@types/hoist-non-react-statics@^3.3.1":
   version "3.3.6"
@@ -3030,6 +3030,11 @@
   resolved "https://registry.yarnpkg.com/@types/prettier/-/prettier-2.7.3.tgz#3e51a17e291d01d17d3fc61422015a933af7a08f"
   integrity sha512-+68kP9yzs4LMp7VNh8gdzMSPZFL44MLGqiHWvttYJe+6qnuVr4Ek9wSBQoveqY/r+LwjCcU29kNVkidwim+kYA==
 
+"@types/prismjs@^1.0.0":
+  version "1.26.6"
+  resolved "https://registry.yarnpkg.com/@types/prismjs/-/prismjs-1.26.6.tgz#6ea27c126d645319ae4f7055eda63a9e835c0187"
+  integrity sha512-vqlvI7qlMvcCBbVe0AKAb4f97//Hy0EBTaiW8AalRnG/xAN5zOiWWyrNqNXeq8+KAuvRewjCVY1+IPxk4RdNYw==
+
 "@types/prop-types@*", "@types/prop-types@^15.7.12":
   version "15.7.15"
   resolved "https://registry.yarnpkg.com/@types/prop-types/-/prop-types-15.7.15.tgz#e6e5a86d602beaca71ce5163fadf5f95d70931c7"
@@ -3158,7 +3163,12 @@
   resolved "https://registry.yarnpkg.com/@types/trusted-types/-/trusted-types-2.0.7.tgz#baccb07a970b91707df3a3e8ba6896c57ead2d11"
   integrity sha512-ScaPdn1dQczgbl0QFTeTOmVHFULt394XJgOQNoyVhZ6r2vLnMLJfBPd53SB52T/3G36VI1/g2MZaX0cwDuXsfw==
 
-"@types/unist@^2":
+"@types/unist@*":
+  version "3.0.3"
+  resolved "https://registry.yarnpkg.com/@types/unist/-/unist-3.0.3.tgz#acaab0f919ce69cce629c2d4ed2eb4adc1b6c20c"
+  integrity sha512-ko/gIFJRv177XgZsZcBwnqJN5x/Gien8qNOn0D5bQU/zAzVf9Zt3BlcUiLqhV9y4ARk0GbT3tnUiPNgnTXzc/Q==
+
+"@types/unist@^2.0.0":
   version "2.0.11"
   resolved "https://registry.yarnpkg.com/@types/unist/-/unist-2.0.11.tgz#11af57b127e32487774841f7a4e54eab166d03c4"
   integrity sha512-CmBKiL6NNo/OqgmMn95Fk9Whlp2mtvIv+KNpQKN2F4SjvrEesubTRWGYSg+BnWZOnlCaSTU1sMpsBOzgbYhnsA==
@@ -4435,20 +4445,20 @@ char-regex@^2.0.0:
   resolved "https://registry.yarnpkg.com/char-regex/-/char-regex-2.0.2.tgz#81385bb071af4df774bff8721d0ca15ef29ea0bb"
   integrity sha512-cbGOjAptfM2LVmWhwRFHEKTPkLwNddVmuqYZQt895yXwAsWsXObCG+YN4DGQ/JBtT4GP1a1lPPdio2z413LmTg==
 
-character-entities-legacy@^1.0.0:
-  version "1.1.4"
-  resolved "https://registry.yarnpkg.com/character-entities-legacy/-/character-entities-legacy-1.1.4.tgz#94bc1845dce70a5bb9d2ecc748725661293d8fc1"
-  integrity sha512-3Xnr+7ZFS1uxeiUDvV02wQ+QDbc55o97tIV5zHScSPJpcLm/r0DFPcoY3tYRp+VZukxuMeKgXYmsXQHO05zQeA==
+character-entities-legacy@^3.0.0:
+  version "3.0.0"
+  resolved "https://registry.yarnpkg.com/character-entities-legacy/-/character-entities-legacy-3.0.0.tgz#76bc83a90738901d7bc223a9e93759fdd560125b"
+  integrity sha512-RpPp0asT/6ufRm//AJVwpViZbGM/MkjQFxJccQRHmISF/22NBtsHqAWmL+/pmkPWoIUJdWyeVleTl1wydHATVQ==
 
-character-entities@^1.0.0:
-  version "1.2.4"
-  resolved "https://registry.yarnpkg.com/character-entities/-/character-entities-1.2.4.tgz#e12c3939b7eaf4e5b15e7ad4c5e28e1d48c5b16b"
-  integrity sha512-iBMyeEHxfVnIakwOuDXpVkc54HijNgCyQB2w0VfGQThle6NXn50zU6V/u+LDhxHcDUPojn6Kpga3PTAD8W1bQw==
+character-entities@^2.0.0:
+  version "2.0.2"
+  resolved "https://registry.yarnpkg.com/character-entities/-/character-entities-2.0.2.tgz#2d09c2e72cd9523076ccb21157dff66ad43fcc22"
+  integrity sha512-shx7oQ0Awen/BRIdkjkvz54PnEEI/EjwXDSIZp86/KKdbafHh1Df/RYGBhn4hbe2+uKC9FnT5UCEdyPz3ai9hQ==
 
-character-reference-invalid@^1.0.0:
-  version "1.1.4"
-  resolved "https://registry.yarnpkg.com/character-reference-invalid/-/character-reference-invalid-1.1.4.tgz#083329cda0eae272ab3dbbf37e9a382c13af1560"
-  integrity sha512-mKKUkUbhPpQlCOfIuZkvSEgktjPFIsZKRRbC6KWVEMvlzblj3i3asQv5ODsrwt0N3pHAEvjP8KTQPHkp0+6jOg==
+character-reference-invalid@^2.0.0:
+  version "2.0.1"
+  resolved "https://registry.yarnpkg.com/character-reference-invalid/-/character-reference-invalid-2.0.1.tgz#85c66b041e43b47210faf401278abf808ac45cb9"
+  integrity sha512-iBZ4F4wRbyORVsu0jPV7gXkOsGYjGHPmAyv+HiHG8gi5PtC9KI2j1+v8/tlibRvjoWX027ypmG/n0HtO5t7unw==
 
 check-types@^11.2.3:
   version "11.2.3"
@@ -4641,10 +4651,10 @@ combined-stream@^1.0.8:
   dependencies:
     delayed-stream "~1.0.0"
 
-comma-separated-tokens@^1.0.0:
-  version "1.0.8"
-  resolved "https://registry.yarnpkg.com/comma-separated-tokens/-/comma-separated-tokens-1.0.8.tgz#632b80b6117867a158f1080ad498b2fbe7e3f5ea"
-  integrity sha512-GHuDRO12Sypu2cV70d1dkA2EUmXHgntrzbpvOB+Qy+49ypNfGgFQIC2fhhXbnyrJRynDCAARsT7Ou0M6hirpfw==
+comma-separated-tokens@^2.0.0:
+  version "2.0.3"
+  resolved "https://registry.yarnpkg.com/comma-separated-tokens/-/comma-separated-tokens-2.0.3.tgz#4e89c9458acb61bc8fef19f4529973b2392839ee"
+  integrity sha512-Fu4hJdvzeylCfQPp9SGWidpzrMs7tTrlu6Vb8XGaRGck8QSNZJJp538Wrb60Lax4fPwR64ViY468OIUTbRlGZg==
 
 commander@^11.1.0:
   version "11.1.0"
@@ -5415,6 +5425,13 @@ decimal.js@^10.2.1:
   resolved "https://registry.yarnpkg.com/decimal.js/-/decimal.js-10.5.0.tgz#0f371c7cf6c4898ce0afb09836db73cd82010f22"
   integrity sha512-8vDa8Qxvr/+d94hSh5P3IJwI5t8/c0KsMp+g8bNw9cY2icONa5aPfvKeieW1WlG0WQYwwhJ7mjui2xtiePQSXw==
 
+decode-named-character-reference@^1.0.0:
+  version "1.3.0"
+  resolved "https://registry.yarnpkg.com/decode-named-character-reference/-/decode-named-character-reference-1.3.0.tgz#3e40603760874c2e5867691b599d73a7da25b53f"
+  integrity sha512-GtpQYB283KrPp6nRw50q3U9/VfOutZOe103qlN7BPP6Ad27xYnOIWv4lPzo8HCAL+mMZofJ9KEy30fq6MfaK6Q==
+  dependencies:
+    character-entities "^2.0.0"
+
 decode-uri-component@^0.4.1:
   version "0.4.1"
   resolved "https://registry.yarnpkg.com/decode-uri-component/-/decode-uri-component-0.4.1.tgz#2ac4859663c704be22bf7db760a1494a49ab2cc5"
@@ -7205,21 +7222,23 @@ hasown@^2.0.2:
   dependencies:
     function-bind "^1.1.2"
 
-hast-util-parse-selector@^2.0.0:
-  version "2.2.5"
-  resolved "https://registry.yarnpkg.com/hast-util-parse-selector/-/hast-util-parse-selector-2.2.5.tgz#d57c23f4da16ae3c63b3b6ca4616683313499c3a"
-  integrity sha512-7j6mrk/qqkSehsM92wQjdIgWM2/BW61u/53G6xmC8i1OmEdKLHbk419QKQUjz6LglWsfqoiHmyMRkP1BGjecNQ==
+hast-util-parse-selector@^4.0.0:
+  version "4.0.0"
+  resolved "https://registry.yarnpkg.com/hast-util-parse-selector/-/hast-util-parse-selector-4.0.0.tgz#352879fa86e25616036037dd8931fb5f34cb4a27"
+  integrity sha512-wkQCkSYoOGCRKERFWcxMVMOcYE2K1AaNLU8DXS9arxnLOUEWbOXKXiJUNzEpqZ3JOKpnha3jkFrumEjVliDe7A==
+  dependencies:
+    "@types/hast" "^3.0.0"
 
-hastscript@^6.0.0:
-  version "6.0.0"
-  resolved "https://registry.yarnpkg.com/hastscript/-/hastscript-6.0.0.tgz#e8768d7eac56c3fdeac8a92830d58e811e5bf640"
-  integrity sha512-nDM6bvd7lIqDUiYEiu5Sl/+6ReP0BMk/2f4U/Rooccxkj0P5nm+acM5PrGJ/t5I8qPGiqZSE6hVAwZEdZIvP4w==
+hastscript@^9.0.0:
+  version "9.0.1"
+  resolved "https://registry.yarnpkg.com/hastscript/-/hastscript-9.0.1.tgz#dbc84bef6051d40084342c229c451cd9dc567dff"
+  integrity sha512-g7df9rMFX/SPi34tyGCyUBREQoKkapwdY/T04Qn9TDWfHhAYt4/I0gMVirzK5wEzeUqIjEB+LXC/ypb7Aqno5w==
   dependencies:
-    "@types/hast" "^2.0.0"
-    comma-separated-tokens "^1.0.0"
-    hast-util-parse-selector "^2.0.0"
-    property-information "^5.0.0"
-    space-separated-tokens "^1.0.0"
+    "@types/hast" "^3.0.0"
+    comma-separated-tokens "^2.0.0"
+    hast-util-parse-selector "^4.0.0"
+    property-information "^7.0.0"
+    space-separated-tokens "^2.0.0"
 
 he@^1.2.0:
   version "1.2.0"
@@ -7521,18 +7540,18 @@ ipaddr.js@^2.0.1:
   resolved "https://registry.yarnpkg.com/ipaddr.js/-/ipaddr.js-2.2.0.tgz#d33fa7bac284f4de7af949638c9d68157c6b92e8"
   integrity sha512-Ag3wB2o37wslZS19hZqorUnrnzSkpOVy+IiiDEiTqNubEYpYuHWIf6K4psgN2ZWKExS4xhVCrRVfb/wfW8fWJA==
 
-is-alphabetical@^1.0.0:
-  version "1.0.4"
-  resolved "https://registry.yarnpkg.com/is-alphabetical/-/is-alphabetical-1.0.4.tgz#9e7d6b94916be22153745d184c298cbf986a686d"
-  integrity sha512-DwzsA04LQ10FHTZuL0/grVDk4rFoVH1pjAToYwBrHSxcrBIGQuXrQMtD5U1b0U2XVgKZCTLLP8u2Qxqhy3l2Vg==
+is-alphabetical@^2.0.0:
+  version "2.0.1"
+  resolved "https://registry.yarnpkg.com/is-alphabetical/-/is-alphabetical-2.0.1.tgz#01072053ea7c1036df3c7d19a6daaec7f19e789b"
+  integrity sha512-FWyyY60MeTNyeSRpkM2Iry0G9hpr7/9kD40mD/cGQEuilcZYS4okz8SN2Q6rLCJ8gbCt6fN+rC+6tMGS99LaxQ==
 
-is-alphanumerical@^1.0.0:
-  version "1.0.4"
-  resolved "https://registry.yarnpkg.com/is-alphanumerical/-/is-alphanumerical-1.0.4.tgz#7eb9a2431f855f6b1ef1a78e326df515696c4dbf"
-  integrity sha512-UzoZUr+XfVz3t3v4KyGEniVL9BDRoQtY7tOyrRybkVNjDFWyo1yhXNGrrBTQxp3ib9BLAWs7k2YKBQsFRkZG9A==
+is-alphanumerical@^2.0.0:
+  version "2.0.1"
+  resolved "https://registry.yarnpkg.com/is-alphanumerical/-/is-alphanumerical-2.0.1.tgz#7c03fbe96e3e931113e57f964b0a368cc2dfd875"
+  integrity sha512-hmbYhX/9MUMF5uh7tOXyK/n0ZvWpad5caBA17GsC6vyuCqaWliRG5K1qS9inmUhEMaOBIW7/whAnSwveW/LtZw==
   dependencies:
-    is-alphabetical "^1.0.0"
-    is-decimal "^1.0.0"
+    is-alphabetical "^2.0.0"
+    is-decimal "^2.0.0"
 
 is-arguments@^1.1.1:
   version "1.2.0"
@@ -7633,10 +7652,10 @@ is-date-object@^1.0.5, is-date-object@^1.1.0:
     call-bound "^1.0.2"
     has-tostringtag "^1.0.2"
 
-is-decimal@^1.0.0:
-  version "1.0.4"
-  resolved "https://registry.yarnpkg.com/is-decimal/-/is-decimal-1.0.4.tgz#65a3a5958a1c5b63a706e1b333d7cd9f630d3fa5"
-  integrity sha512-RGdriMmQQvZ2aqaQq3awNA6dCGtKpiDFcOzrTWrDAT2MiWrKQVPmxLGHl7Y2nNu6led0kEyoX0enY0qXYsv9zw==
+is-decimal@^2.0.0:
+  version "2.0.1"
+  resolved "https://registry.yarnpkg.com/is-decimal/-/is-decimal-2.0.1.tgz#9469d2dc190d0214fd87d78b78caecc0cc14eef7"
+  integrity sha512-AAB9hiomQs5DXWcRB1rqsxGUstbRroFOPPVAomNk/3XHR5JyEZChOyTWe2oayKnsSsr/kcGqF+z6yuH6HHpN0A==
 
 is-docker@^2.0.0, is-docker@^2.1.1:
   version "2.2.1"
@@ -7689,10 +7708,10 @@ is-glob@^4.0.0, is-glob@^4.0.1, is-glob@^4.0.3, is-glob@~4.0.1:
   dependencies:
     is-extglob "^2.1.1"
 
-is-hexadecimal@^1.0.0:
-  version "1.0.4"
-  resolved "https://registry.yarnpkg.com/is-hexadecimal/-/is-hexadecimal-1.0.4.tgz#cc35c97588da4bd49a8eedd6bc4082d44dcb23a7"
-  integrity sha512-gyPJuv83bHMpocVYoqof5VDiZveEoGoFL8m3BXNb2VW8Xs+rz9kqO8LOQ5DH6EsuvilT1ApazU0pyl+ytbPtlw==
+is-hexadecimal@^2.0.0:
+  version "2.0.1"
+  resolved "https://registry.yarnpkg.com/is-hexadecimal/-/is-hexadecimal-2.0.1.tgz#86b5bf668fca307498d319dfc03289d781a90027"
+  integrity sha512-DgZQp241c8oO6cA1SbTEWiXeoxV42vlcJxgH+B3hi1AiqqKruZR3ZGF8In3fj4+/y/7rHvlOZLZtgJ/4ttYGZg==
 
 is-map@^2.0.2, is-map@^2.0.3:
   version "2.0.3"
@@ -9713,17 +9732,18 @@ parent-module@^2.0.0:
   dependencies:
     callsites "^3.1.0"
 
-parse-entities@^2.0.0:
-  version "2.0.0"
-  resolved "https://registry.yarnpkg.com/parse-entities/-/parse-entities-2.0.0.tgz#53c6eb5b9314a1f4ec99fa0fdf7ce01ecda0cbe8"
-  integrity sha512-kkywGpCcRYhqQIchaWqZ875wzpS/bMKhz5HnN3p7wveJTkTtyAB/AlnS0f8DFSqYW1T82t6yEAkEcB+A1I3MbQ==
+parse-entities@^4.0.0:
+  version "4.0.2"
+  resolved "https://registry.yarnpkg.com/parse-entities/-/parse-entities-4.0.2.tgz#61d46f5ed28e4ee62e9ddc43d6b010188443f159"
+  integrity sha512-GG2AQYWoLgL877gQIKeRPGO1xF9+eG1ujIb5soS5gPvLQ1y2o8FL90w2QWNdf9I361Mpp7726c+lj3U0qK1uGw==
   dependencies:
-    character-entities "^1.0.0"
-    character-entities-legacy "^1.0.0"
-    character-reference-invalid "^1.0.0"
-    is-alphanumerical "^1.0.0"
-    is-decimal "^1.0.0"
-    is-hexadecimal "^1.0.0"
+    "@types/unist" "^2.0.0"
+    character-entities-legacy "^3.0.0"
+    character-reference-invalid "^2.0.0"
+    decode-named-character-reference "^1.0.0"
+    is-alphanumerical "^2.0.0"
+    is-decimal "^2.0.0"
+    is-hexadecimal "^2.0.0"
 
 parse-json@^5.0.0, parse-json@^5.2.0:
   version "5.2.0"
@@ -10518,16 +10538,11 @@ pretty-format@^29.0.0, pretty-format@^29.7.0:
     ansi-styles "^5.0.0"
     react-is "^18.0.0"
 
-prismjs@^1.27.0:
+prismjs@^1.30.0:
   version "1.30.0"
   resolved "https://registry.yarnpkg.com/prismjs/-/prismjs-1.30.0.tgz#d9709969d9d4e16403f6f348c63553b19f0975a9"
   integrity sha512-DEvV2ZF2r2/63V+tK8hQvrR2ZGn10srHbXviTlcv7Kpzw8jWiNTqbVgjO3IY8RxrrOUF8VPMQQFysYYYv0YZxw==
 
-prismjs@~1.27.0:
-  version "1.27.0"
-  resolved "https://registry.yarnpkg.com/prismjs/-/prismjs-1.27.0.tgz#bb6ee3138a0b438a3653dd4d6ce0cc6510a45057"
-  integrity sha512-t13BGPUlFDR7wRB5kQDG4jjl7XeuH6jbJGt11JHPL96qwsEHNX2+68tFXqc1/k+/jALsbSWJKUOT/hcYAZ5LkA==
-
 process-nextick-args@~2.0.0:
   version "2.0.1"
   resolved "https://registry.yarnpkg.com/process-nextick-args/-/process-nextick-args-2.0.1.tgz#7820d9b16120cc55ca9ae7792680ae7dba6d7fe2"
@@ -10564,12 +10579,10 @@ prop-types@^15.6.2, prop-types@^15.8.1:
     object-assign "^4.1.1"
     react-is "^16.13.1"
 
-property-information@^5.0.0:
-  version "5.6.0"
-  resolved "https://registry.yarnpkg.com/property-information/-/property-information-5.6.0.tgz#61675545fb23002f245c6540ec46077d4da3ed69"
-  integrity sha512-YUHSPk+A30YPv+0Qf8i9Mbfe/C0hdPXk1s1jPVToV8pk8BQtpw10ct89Eo7OWkutrwqvT0eicAxlOg3dOAu8JA==
-  dependencies:
-    xtend "^4.0.0"
+property-information@^7.0.0:
+  version "7.1.0"
+  resolved "https://registry.yarnpkg.com/property-information/-/property-information-7.1.0.tgz#b622e8646e02b580205415586b40804d3e8bfd5d"
+  integrity sha512-TwEZ+X+yCJmYfL7TPUOcvBZ4QfoT5YenQiJuX//0th53DE6w0xxLEtfK3iyryQFddXuvkIk51EEgrJQ0WJkOmQ==
 
 proxy-addr@~2.0.7:
   version "2.0.7"
@@ -10874,17 +10887,17 @@ react-scripts@^5.0.1:
   optionalDependencies:
     fsevents "^2.3.2"
 
-react-syntax-highlighter@^15.6.1:
-  version "15.6.1"
-  resolved "https://registry.yarnpkg.com/react-syntax-highlighter/-/react-syntax-highlighter-15.6.1.tgz#fa567cb0a9f96be7bbccf2c13a3c4b5657d9543e"
-  integrity sha512-OqJ2/vL7lEeV5zTJyG7kmARppUjiB9h9udl4qHQjjgEos66z00Ia0OckwYfRxCSFrW8RJIBnsBwQsHZbVPspqg==
+react-syntax-highlighter@16.1.1:
+  version "16.1.1"
+  resolved "https://registry.yarnpkg.com/react-syntax-highlighter/-/react-syntax-highlighter-16.1.1.tgz#928459855d375f5cfc8e646071e20d541cebcb52"
+  integrity sha512-PjVawBGy80C6YbC5DDZJeUjBmC7skaoEUdvfFQediQHgCL7aKyVHe57SaJGfQsloGDac+gCpTfRdtxzWWKmCXA==
   dependencies:
-    "@babel/runtime" "^7.3.1"
+    "@babel/runtime" "^7.28.4"
     highlight.js "^10.4.1"
     highlightjs-vue "^1.0.0"
     lowlight "^1.17.0"
-    prismjs "^1.27.0"
-    refractor "^3.6.0"
+    prismjs "^1.30.0"
+    refractor "^5.0.0"
 
 react-textarea-autosize@^8.3.2:
   version "8.5.9"
@@ -11009,14 +11022,15 @@ reflect.getprototypeof@^1.0.6, reflect.getprototypeof@^1.0.9:
     get-proto "^1.0.1"
     which-builtin-type "^1.2.1"
 
-refractor@^3.6.0:
-  version "3.6.0"
-  resolved "https://registry.yarnpkg.com/refractor/-/refractor-3.6.0.tgz#ac318f5a0715ead790fcfb0c71f4dd83d977935a"
-  integrity sha512-MY9W41IOWxxk31o+YvFCNyNzdkc9M20NoZK5vq6jkv4I/uh2zkWcfudj0Q1fovjUQJrNewS9NMzeTtqPf+n5EA==
+refractor@^5.0.0:
+  version "5.0.0"
+  resolved "https://registry.yarnpkg.com/refractor/-/refractor-5.0.0.tgz#85daf0448a6d947f5361796eb22c31733d61d904"
+  integrity sha512-QXOrHQF5jOpjjLfiNk5GFnWhRXvxjUVnlFxkeDmewR5sXkr3iM46Zo+CnRR8B+MDVqkULW4EcLVcRBNOPXHosw==
   dependencies:
-    hastscript "^6.0.0"
-    parse-entities "^2.0.0"
-    prismjs "~1.27.0"
+    "@types/hast" "^3.0.0"
+    "@types/prismjs" "^1.0.0"
+    hastscript "^9.0.0"
+    parse-entities "^4.0.0"
 
 regenerate-unicode-properties@^10.2.0:
   version "10.2.0"
@@ -11707,10 +11721,10 @@ sourcemap-codec@^1.4.8:
   resolved "https://registry.yarnpkg.com/sourcemap-codec/-/sourcemap-codec-1.4.8.tgz#ea804bd94857402e6992d05a38ef1ae35a9ab4c4"
   integrity sha512-9NykojV5Uih4lgo5So5dtw+f0JgJX30KCNI8gwhz2J9A15wD0Ml6tjHKwf6fTSa6fAdVBdZeNOs9eJ71qCk8vA==
 
-space-separated-tokens@^1.0.0:
-  version "1.1.5"
-  resolved "https://registry.yarnpkg.com/space-separated-tokens/-/space-separated-tokens-1.1.5.tgz#85f32c3d10d9682007e917414ddc5c26d1aa6899"
-  integrity sha512-q/JSVd1Lptzhf5bkYm4ob4iWPjx0KiRe3sRFBNrVqbJkFaBm5vbbowy1mymoPNLRa52+oadOhJ+K49wsSeSjTA==
+space-separated-tokens@^2.0.0:
+  version "2.0.2"
+  resolved "https://registry.yarnpkg.com/space-separated-tokens/-/space-separated-tokens-2.0.2.tgz#1ecd9d2350a3844572c3f4a312bceb018348859f"
+  integrity sha512-PEGlAwrG8yXGXRjW32fGbg66JAlOAwbObuqVoJpv/mRgoWDQfgH1wDPvtzWyUSNAXBGSk8h755YDbbcEy3SH2Q==
 
 spdy-transport@^3.0.0:
   version "3.0.0"
@@ -12724,10 +12738,10 @@ update-browserslist-db@^1.1.3:
     escalade "^3.2.0"
     picocolors "^1.1.1"
 
-uplot@1.6.17:
-  version "1.6.17"
-  resolved "https://registry.yarnpkg.com/uplot/-/uplot-1.6.17.tgz#1f8fc07a0e48008798beca463523621ad66dcc46"
-  integrity sha512-WHNHvDCXURn+Qwb3QUUzP6rOxx+3kUZUspREyhkqmXCxFIND99l5z9intTh+uPEt+/EEu7lCaMjSd1uTfuTXfg==
+uplot@1.6.32:
+  version "1.6.32"
+  resolved "https://registry.yarnpkg.com/uplot/-/uplot-1.6.32.tgz#c800a63b432bad692d6d746f44f0882aa73a49ae"
+  integrity sha512-KIMVnG68zvu5XXUbC4LQEPnhwOxBuLyW1AHtpm6IKTXImkbLgkMy+jabjLgSLMasNuGGzQm/ep3tOkyTxpiQIw==
 
 uri-js@^4.2.2:
   version "4.4.1"
@@ -13451,11 +13465,6 @@ xmlchars@^2.2.0:
   resolved "https://registry.yarnpkg.com/xmlchars/-/xmlchars-2.2.0.tgz#060fe1bcb7f9c76fe2a17db86a9bc3ab894210cb"
   integrity sha512-JZnDKK8B0RCDw84FNdDAIpZK+JuJw+s7Lz8nksI7SIuU3UXJJslUthsi+uWBUYOwPFwW7W7PRLRfUKpxjtjFCw==
 
-xtend@^4.0.0:
-  version "4.0.2"
-  resolved "https://registry.yarnpkg.com/xtend/-/xtend-4.0.2.tgz#bb72779f5fa465186b1f438f674fa347fdb5db54"
-  integrity sha512-LKYU1iAXJXUgAXn9URjiu+MWhyUXHsvfp7mcuYm9dSUKK0/CjtrUwFAxD82/mCWbtLsGjFIad0wIsod4zrTAEQ==
-
 xtend@~2.1.1:
   version "2.1.2"
   resolved "https://registry.yarnpkg.com/xtend/-/xtend-2.1.2.tgz#6efecc2a4dad8e6962c4901b337ce7ba87b5d28b"