From 25982932c565413cba4ce408d96f448a63f2d5e9 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Wed, 22 Oct 2025 14:41:29 +0800 Subject: [PATCH 01/12] add dashboard link to documentation --- .github/workflows/main.yml | 2 +- .github/workflows/pr_code_changes.yaml | 2 +- README.md | 46 +- changelog_entry.yaml | 4 + docs/index.md | 16 + .../app/api/github/artifacts/route.ts | 117 +++++ .../app/api/github/branches/route.ts | 77 ++++ .../app/api/github/commits/route.ts | 55 +++ .../app/api/github/download/route.ts | 59 +++ microimputation-dashboard/app/page.tsx | 1 + .../components/FileUpload.tsx | 430 +++++------------- microimputation-dashboard/package.json | 2 +- 12 files changed, 478 insertions(+), 333 deletions(-) create mode 100644 microimputation-dashboard/app/api/github/artifacts/route.ts create mode 100644 microimputation-dashboard/app/api/github/branches/route.ts create mode 100644 microimputation-dashboard/app/api/github/commits/route.ts create mode 100644 microimputation-dashboard/app/api/github/download/route.ts diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 6f5b968..6a82c25 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -51,7 +51,7 @@ jobs: run: | python examples/pipeline.py - name: Upload microimputation results - if: always() + if: always() && matrix.python-version == '3.13' uses: actions/upload-artifact@v4 with: name: microimputation-results-${{ github.sha }} diff --git a/.github/workflows/pr_code_changes.yaml b/.github/workflows/pr_code_changes.yaml index a2118b2..c8e2ce8 100644 --- a/.github/workflows/pr_code_changes.yaml +++ b/.github/workflows/pr_code_changes.yaml @@ -70,7 +70,7 @@ jobs: run: | python examples/pipeline.py - name: Upload microimputation results - if: always() + if: always() && matrix.python-version == '3.13' uses: actions/upload-artifact@v4 with: name: microimputation-results-${{ github.sha }} diff --git a/README.md b/README.md index 63cf263..e9b83bb 100644 --- a/README.md +++ 
b/README.md @@ -1,7 +1,47 @@ # Microimpute -Microimpute enables variable imputation through different statistical methods. It facilitates comparison and benchmarking across methods through quantile loss calculations. +Microimpute enables variable imputation through a variety of statistical methods. By providing a consistent interface across different imputation techniques, it allows researchers and data scientists to easily compare and benchmark different approaches using quantile loss and log loss calculations to determine the method providing the most accurate results. -To install, run pip install microimpute. +## Features -For image export functionality (PNG/JPG), install with: pip install microimpute[images] +### Multiple imputation methods +- **Statistical Matching**: Distance-based matching for finding similar observations +- **Ordinary Least Squares (OLS)**: Linear regression-based imputation +- **Quantile Regression**: Distribution-aware regression imputation +- **Quantile Random Forests (QRF)**: Non-parametric forest-based approach + +### Automated method selection +- **AutoImpute**: Automatically compares and selects the best imputation method for your data +- **Cross-validation**: Built-in evaluation using quantile loss (numerical) and log loss (categorical) +- **Variable type support**: Handles numerical, categorical, and boolean variables + +### Developer-friendly design +- **Consistent API**: Standardized `fit()` and `predict()` interface across all models +- **Extensible architecture**: Easy to implement custom imputation methods +- **Weighted data handling**: Preserve data distributions with sample weights +- **Input validation**: Automatic parameter and data validation + +### Interactive dashboard +- **Visual exploration**: Analyze imputation results through interactive charts at https://microimpute-dashboard.vercel.app/ +- **GitHub integration**: Load artifacts directly from CI/CD workflows +- **Multiple data sources**: File upload, URL loading and 
sample data + +## Installation + +```bash +pip install microimpute +``` + +For image export functionality (PNG/JPG), install with: + +```bash +pip install microimpute[images] +``` + +## Examples and documentation + +For detailed examples and interactive notebooks, see the [documentation](https://policyengine.github.io/microimpute/). + +## Contributing + +Contributions to the project are welcome. Please feel free to submit a Pull Request with your improvements. diff --git a/changelog_entry.yaml b/changelog_entry.yaml index e69de29..9670cc6 100644 --- a/changelog_entry.yaml +++ b/changelog_entry.yaml @@ -0,0 +1,4 @@ +- bump: minor + changes: + added: + - Links to dashboard in README.md and documentation. diff --git a/docs/index.md b/docs/index.md index dfa8a83..391c20c 100644 --- a/docs/index.md +++ b/docs/index.md @@ -9,3 +9,19 @@ The framework currently supports the following imputation methods: - Quantile Regression This is a work in progress that may evolve over time, including new statistical imputation methods and features. + +## Microimputation dashboard + +Users can visualize imputation and benchmarking results at https://microimpute-dashboard.vercel.app/. 
+ +To use the dashboard for visualization, CSV files must contain the following columns in this exact order: +- `type`: Type of metric (e.g., "benchmark_loss", "distribution_distance", "predictor_correlation") +- `method`: Imputation method name (e.g., "QRF", "OLS", "QuantReg", "Matching") +- `variable`: Variable being imputed or analyzed +- `quantile`: Quantile level (numeric value, "mean", or "N/A") +- `metric_name`: Name of the metric (e.g., "quantile_loss", "log_loss") +- `metric_value`: Numeric value of the metric +- `split`: Data split indicator (e.g., "train", "test", "full") +- `additional_info`: JSON-formatted string with additional metadata + +Users can use the `format_csv()` function from `microimpute.utils` to automatically format imputation and benchmarking results into the correct structure for dashboard visualization. This function accepts outputs from various analysis functions (autoimpute results, comparison metrics, distribution comparisons, etc.) and returns a properly formatted DataFrame. 
\ No newline at end of file diff --git a/microimputation-dashboard/app/api/github/artifacts/route.ts b/microimputation-dashboard/app/api/github/artifacts/route.ts new file mode 100644 index 0000000..d071169 --- /dev/null +++ b/microimputation-dashboard/app/api/github/artifacts/route.ts @@ -0,0 +1,117 @@ +import { NextRequest, NextResponse } from 'next/server'; + +export async function GET(request: NextRequest) { + const searchParams = request.nextUrl.searchParams; + const repo = searchParams.get('repo'); + const commitSha = searchParams.get('commit'); + + if (!repo || !commitSha) { + return NextResponse.json( + { error: 'Missing repo or commit parameter' }, + { status: 400 } + ); + } + + const githubToken = process.env.GITHUB_TOKEN; + if (!githubToken) { + return NextResponse.json( + { error: 'GitHub token not configured on server' }, + { status: 500 } + ); + } + + try { + const [owner, repoName] = repo.split('/'); + + // Get workflow runs for the commit + const runsResponse = await fetch( + `https://api.github.com/repos/${owner}/${repoName}/actions/runs?head_sha=${commitSha}`, + { + headers: { + Authorization: `Bearer ${githubToken}`, + Accept: 'application/vnd.github.v3+json', + 'User-Agent': 'PolicyEngine-Dashboard/1.0', + }, + } + ); + + if (!runsResponse.ok) { + return NextResponse.json( + { error: `GitHub API error: ${runsResponse.status}` }, + { status: runsResponse.status } + ); + } + + const runsData = await runsResponse.json(); + const runs = runsData.workflow_runs; + + if (!runs || runs.length === 0) { + return NextResponse.json([]); + } + + // Collect all imputation artifacts from completed runs + const allArtifacts = []; + + for (const run of runs) { + if (run.status !== 'completed') continue; + + try { + const artifactsResponse = await fetch( + `https://api.github.com/repos/${owner}/${repoName}/actions/runs/${run.id}/artifacts`, + { + headers: { + Authorization: `Bearer ${githubToken}`, + Accept: 'application/vnd.github.v3+json', + 'User-Agent': 
'PolicyEngine-Dashboard/1.0', + }, + } + ); + + if (!artifactsResponse.ok) continue; + + const artifactsData = await artifactsResponse.json(); + const artifacts = artifactsData.artifacts; + + // Filter for imputation artifacts + const imputationArtifacts = artifacts.filter( + (artifact: { name: string }) => + artifact.name.toLowerCase().includes('impute') || + artifact.name + .toLowerCase() + .includes('imputation') || + artifact.name.toLowerCase().includes('result') || + artifact.name.toLowerCase().includes('.csv') + ); + + allArtifacts.push(...imputationArtifacts); + } catch { + continue; + } + } + + // Remove duplicates and sort by creation date (newest first) + const uniqueArtifacts = allArtifacts + .filter( + (artifact: { name: string }, index: number, self: any[]) => + index === + self.findIndex((a: { name: string }) => a.name === artifact.name) + ) + .sort( + (a: { created_at: string }, b: { created_at: string }) => + new Date(b.created_at).getTime() - + new Date(a.created_at).getTime() + ); + + return NextResponse.json(uniqueArtifacts); + } catch (error) { + return NextResponse.json( + { + error: + error instanceof Error + ? 
error.message + : 'Unknown error', + }, + { status: 500 } + ); + } +} diff --git a/microimputation-dashboard/app/api/github/branches/route.ts b/microimputation-dashboard/app/api/github/branches/route.ts new file mode 100644 index 0000000..02a6bbd --- /dev/null +++ b/microimputation-dashboard/app/api/github/branches/route.ts @@ -0,0 +1,77 @@ +import { NextRequest, NextResponse } from 'next/server'; + +export async function GET(request: NextRequest) { + const searchParams = request.nextUrl.searchParams; + const repo = searchParams.get('repo'); + + if (!repo) { + return NextResponse.json( + { error: 'Missing repo parameter' }, + { status: 400 } + ); + } + + const githubToken = process.env.GITHUB_TOKEN; + if (!githubToken) { + return NextResponse.json( + { error: 'GitHub token not configured on server' }, + { status: 500 } + ); + } + + try { + const allBranches = []; + let page = 1; + const perPage = 100; + + while (true) { + const response = await fetch( + `https://api.github.com/repos/${repo}/branches?per_page=${perPage}&page=${page}`, + { + headers: { + Authorization: `Bearer ${githubToken}`, + Accept: 'application/vnd.github.v3+json', + 'User-Agent': 'PolicyEngine-Dashboard/1.0', + }, + } + ); + + if (!response.ok) { + return NextResponse.json( + { error: `GitHub API error: ${response.status}` }, + { status: response.status } + ); + } + + const branches = await response.json(); + + if (branches.length === 0) { + break; + } + + allBranches.push(...branches); + + if (branches.length < perPage) { + break; + } + + page++; + + if (page > 10) { + break; + } + } + + return NextResponse.json(allBranches); + } catch (error) { + return NextResponse.json( + { + error: + error instanceof Error + ? 
error.message + : 'Unknown error', + }, + { status: 500 } + ); + } +} diff --git a/microimputation-dashboard/app/api/github/commits/route.ts b/microimputation-dashboard/app/api/github/commits/route.ts new file mode 100644 index 0000000..9847aee --- /dev/null +++ b/microimputation-dashboard/app/api/github/commits/route.ts @@ -0,0 +1,55 @@ +import { NextRequest, NextResponse } from 'next/server'; + +export async function GET(request: NextRequest) { + const searchParams = request.nextUrl.searchParams; + const repo = searchParams.get('repo'); + const branch = searchParams.get('branch'); + + if (!repo || !branch) { + return NextResponse.json( + { error: 'Missing repo or branch parameter' }, + { status: 400 } + ); + } + + const githubToken = process.env.GITHUB_TOKEN; + if (!githubToken) { + return NextResponse.json( + { error: 'GitHub token not configured on server' }, + { status: 500 } + ); + } + + try { + const response = await fetch( + `https://api.github.com/repos/${repo}/commits?sha=${branch}&per_page=20`, + { + headers: { + Authorization: `Bearer ${githubToken}`, + Accept: 'application/vnd.github.v3+json', + 'User-Agent': 'PolicyEngine-Dashboard/1.0', + }, + } + ); + + if (!response.ok) { + return NextResponse.json( + { error: `GitHub API error: ${response.status}` }, + { status: response.status } + ); + } + + const commits = await response.json(); + return NextResponse.json(commits); + } catch (error) { + return NextResponse.json( + { + error: + error instanceof Error + ? 
error.message + : 'Unknown error', + }, + { status: 500 } + ); + } +} diff --git a/microimputation-dashboard/app/api/github/download/route.ts b/microimputation-dashboard/app/api/github/download/route.ts new file mode 100644 index 0000000..4938bab --- /dev/null +++ b/microimputation-dashboard/app/api/github/download/route.ts @@ -0,0 +1,59 @@ +import { NextRequest, NextResponse } from 'next/server'; + +export async function GET(request: NextRequest) { + const searchParams = request.nextUrl.searchParams; + const url = searchParams.get('url'); + + if (!url) { + return NextResponse.json( + { error: 'Missing url parameter' }, + { status: 400 } + ); + } + + const githubToken = process.env.GITHUB_TOKEN; + if (!githubToken) { + return NextResponse.json( + { error: 'GitHub token not configured on server' }, + { status: 500 } + ); + } + + try { + const downloadResponse = await fetch(url, { + headers: { + Authorization: `Bearer ${githubToken}`, + Accept: 'application/vnd.github.v3+json', + 'User-Agent': 'PolicyEngine-Dashboard/1.0', + }, + }); + + if (!downloadResponse.ok) { + return NextResponse.json( + { error: `GitHub API error: ${downloadResponse.status}` }, + { status: downloadResponse.status } + ); + } + + // Get the artifact ZIP as an ArrayBuffer + const zipBuffer = await downloadResponse.arrayBuffer(); + + // Return the ZIP file as a response + return new NextResponse(zipBuffer, { + headers: { + 'Content-Type': 'application/zip', + 'Content-Length': zipBuffer.byteLength.toString(), + }, + }); + } catch (error) { + return NextResponse.json( + { + error: + error instanceof Error + ? error.message + : 'Unknown error', + }, + { status: 500 } + ); + } +} diff --git a/microimputation-dashboard/app/page.tsx b/microimputation-dashboard/app/page.tsx index 2b31bbf..c24753a 100644 --- a/microimputation-dashboard/app/page.tsx +++ b/microimputation-dashboard/app/page.tsx @@ -92,6 +92,7 @@ function HomeContent() { } }; + return (
{/* Header */} diff --git a/microimputation-dashboard/components/FileUpload.tsx b/microimputation-dashboard/components/FileUpload.tsx index 581a2f3..24e8bd2 100644 --- a/microimputation-dashboard/components/FileUpload.tsx +++ b/microimputation-dashboard/components/FileUpload.tsx @@ -75,61 +75,32 @@ export default function FileUpload({ const [selectedSecondArtifact, setSelectedSecondArtifact] = useState(''); // Helper function to load a single artifact from deeplink parameters - const loadArtifactFromDeeplink = useCallback(async (artifactInfo: GitHubArtifactInfo, githubToken: string): Promise => { - // First, get the artifacts for the specific commit - const [owner, repo] = artifactInfo.repo.split('/'); - const runsResponse = await fetch(`https://api.github.com/repos/${owner}/${repo}/actions/runs?head_sha=${artifactInfo.commit}`, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }); - - if (!runsResponse.ok) { - throw new Error(`Failed to fetch workflow runs: ${runsResponse.status} ${runsResponse.statusText}`); + const loadArtifactFromDeeplink = useCallback(async (artifactInfo: GitHubArtifactInfo): Promise => { + // Get artifacts for the specific commit using API route + const artifactsResponse = await fetch( + `/api/github/artifacts?repo=${encodeURIComponent(artifactInfo.repo)}&commit=${encodeURIComponent(artifactInfo.commit)}` + ); + + if (!artifactsResponse.ok) { + throw new Error(`Failed to fetch artifacts: ${artifactsResponse.status}`); } - const runsData = await runsResponse.json(); - const completedRuns = runsData.workflow_runs.filter((run: { status: string }) => run.status === 'completed'); - - if (completedRuns.length === 0) { - throw new Error('No completed workflow runs found for this commit'); - } + const artifacts = await artifactsResponse.json(); // Find the artifact by name - let targetArtifact = null; - for (const run of completedRuns) { - const 
artifactsResponse = await fetch(`https://api.github.com/repos/${owner}/${repo}/actions/runs/${run.id}/artifacts`, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }); - - if (artifactsResponse.ok) { - const artifactsData = await artifactsResponse.json(); - targetArtifact = artifactsData.artifacts.find((artifact: { name: string }) => artifact.name === artifactInfo.artifact); - if (targetArtifact) break; - } - } + const targetArtifact = artifacts.find((artifact: { name: string }) => artifact.name === artifactInfo.artifact); if (!targetArtifact) { throw new Error(`Artifact "${artifactInfo.artifact}" not found for commit ${artifactInfo.commit}`); } - // Download and extract the artifact - const downloadResponse = await fetch(targetArtifact.archive_download_url, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }); + // Download and extract the artifact using API route + const downloadResponse = await fetch( + `/api/github/download?url=${encodeURIComponent(targetArtifact.archive_download_url)}` + ); if (!downloadResponse.ok) { - throw new Error(`Failed to download artifact: ${downloadResponse.status} ${downloadResponse.statusText}`); + throw new Error(`Failed to download artifact: ${downloadResponse.status}`); } const zipBuffer = await downloadResponse.arrayBuffer(); @@ -155,12 +126,6 @@ export default function FileUpload({ // Load GitHub artifacts directly from deeplink parameters const loadDeeplinkArtifacts = useCallback(async (primary: GitHubArtifactInfo, secondary?: GitHubArtifactInfo) => { - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. 
Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoading(true); setError(''); @@ -168,11 +133,11 @@ export default function FileUpload({ setError('🔄 Loading data from GitHub artifacts...'); // Load primary artifact - const primaryData = await loadArtifactFromDeeplink(primary, githubToken); + const primaryData = await loadArtifactFromDeeplink(primary); if (secondary && onCompareLoad) { // Load secondary artifact for comparison - const secondaryData = await loadArtifactFromDeeplink(secondary, githubToken); + const secondaryData = await loadArtifactFromDeeplink(secondary); // Generate display names with commit info const primaryDisplayName = `${primary.repo}@${primary.branch} (${primary.commit.substring(0, 7)}) - ${primary.artifact}`; @@ -436,14 +401,24 @@ export default function FileUpload({ } let url: URL; + let finalUrl = urlInput.trim(); + try { - url = new URL(urlInput.trim()); + url = new URL(finalUrl); } catch { setError('Invalid URL format. Please enter a valid URL (e.g., https://example.com/data.csv).'); return; } - if (!url.pathname.toLowerCase().endsWith('.csv') && !urlInput.toLowerCase().includes('csv')) { + // Handle Google Drive URLs + if (url.hostname === 'drive.google.com') { + setError( + 'Google Drive links are not supported due to CORS restrictions. Please download the file and use the "Drop file" tab instead or host the file on a different public server.' + ); + return; + } + + if (!url.pathname.toLowerCase().endsWith('.csv') && !finalUrl.toLowerCase().includes('csv')) { setError('URL should point to a CSV file. 
Please ensure the URL ends with .csv or contains CSV data.'); return; } @@ -460,7 +435,7 @@ export default function FileUpload({ const controller = new AbortController(); const timeoutId = setTimeout(() => controller.abort(), 30_000); // 30 s timeout - const response = await fetch(urlInput.trim(), { + const response = await fetch(finalUrl, { signal: controller.signal, headers: { Accept: 'text/csv, text/plain, */*' } }); @@ -557,62 +532,23 @@ export default function FileUpload({ return; } - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoadingGithubData(true); setError(''); try { - // Fetch all branches with pagination support - const allBranches: GitHubBranch[] = []; - let page = 1; - const perPage = 100; // Maximum allowed by GitHub API - - while (true) { - const response = await fetch(`https://api.github.com/repos/${githubRepo}/branches?per_page=${perPage}&page=${page}`, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }); - - if (!response.ok) { - if (response.status === 404) { - throw new Error('Repository not found. Please check the repository name and ensure it is accessible.'); - } else if (response.status === 403) { - throw new Error('Access forbidden. 
Please check your GitHub token permissions or repository access.'); - } - throw new Error(`Failed to fetch branches: ${response.status} ${response.statusText}`); - } - - const branches: GitHubBranch[] = await response.json(); - - if (branches.length === 0) { - // No more branches to fetch - break; - } + const response = await fetch(`/api/github/branches?repo=${encodeURIComponent(githubRepo)}`); - allBranches.push(...branches); - - // If we got fewer branches than requested, we've reached the end - if (branches.length < perPage) { - break; - } - - page++; - - // Safety check to prevent infinite loops (GitHub repos rarely have more than 1000 branches) - if (page > 10) { - console.warn('Stopped fetching branches after 10 pages (1000 branches) to prevent excessive API calls'); - break; + if (!response.ok) { + if (response.status === 404) { + throw new Error('Repository not found. Please check the repository name and ensure it is accessible.'); + } else if (response.status === 403) { + throw new Error('Access forbidden. Please check your GitHub token permissions or repository access.'); } + const errorData = await response.json(); + throw new Error(errorData.error || `Failed to fetch branches: ${response.status}`); } + const allBranches: GitHubBranch[] = await response.json(); setGithubBranches(allBranches); // Auto-select main/master branch if available @@ -631,28 +567,20 @@ export default function FileUpload({ async function fetchGithubCommits(branch: string) { if (!githubRepo.trim() || !branch) return; - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. 
Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoadingGithubData(true); try { - const response = await fetch(`https://api.github.com/repos/${githubRepo}/commits?sha=${branch}&per_page=20`, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }); + const response = await fetch( + `/api/github/commits?repo=${encodeURIComponent(githubRepo)}&branch=${encodeURIComponent(branch)}` + ); + if (!response.ok) { if (response.status === 404) { throw new Error('Branch not found or repository is private.'); } else if (response.status === 403) { throw new Error('Access forbidden. Please check your GitHub token permissions or repository access.'); } - throw new Error(`Failed to fetch commits: ${response.status} ${response.statusText}`); + const errorData = await response.json(); + throw new Error(errorData.error || `Failed to fetch commits: ${response.status}`); } const commits: GitHubCommit[] = await response.json(); @@ -673,98 +601,32 @@ export default function FileUpload({ async function fetchGithubArtifacts(commitSha: string) { if (!githubRepo.trim() || !commitSha) return; - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. 
Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoadingGithubData(true); setAvailableArtifacts([]); setSelectedArtifact(''); try { - const [owner, repo] = githubRepo.split('/'); - - // Get workflow runs for the commit - const runsResponse = await fetch( - `https://api.github.com/repos/${owner}/${repo}/actions/runs?head_sha=${commitSha}`, - { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - } + const response = await fetch( + `/api/github/artifacts?repo=${encodeURIComponent(githubRepo)}&commit=${encodeURIComponent(commitSha)}` ); - if (!runsResponse.ok) { - if (runsResponse.status === 403) { + if (!response.ok) { + if (response.status === 403) { throw new Error(`GitHub API rate limit exceeded or token permissions insufficient (403). Please try again later or check your token permissions.`); - } else if (runsResponse.status === 404) { + } else if (response.status === 404) { throw new Error(`Repository or commit not found (404). 
Please check the repository name and commit SHA.`); - } else { - throw new Error(`Failed to fetch workflow runs: ${runsResponse.status} ${runsResponse.statusText}`); } + const errorData = await response.json(); + throw new Error(errorData.error || `Failed to fetch artifacts: ${response.status}`); } - const runsData = await runsResponse.json(); - const runs = runsData.workflow_runs; - - if (!runs || runs.length === 0) { - setError('No workflow runs found for this commit.'); - return; - } - - // Collect all imputation artifacts from completed runs - const allArtifacts: GitHubArtifact[] = []; - - for (const run of runs) { - if (run.status !== 'completed') continue; + const uniqueArtifacts: GitHubArtifact[] = await response.json(); - try { - const artifactsResponse = await fetch( - `https://api.github.com/repos/${owner}/${repo}/actions/runs/${run.id}/artifacts`, - { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - } - ); - - if (!artifactsResponse.ok) continue; - - const artifactsData = await artifactsResponse.json(); - const artifacts = artifactsData.artifacts; - - // Filter for imputation artifacts - const imputationArtifacts = artifacts.filter((artifact: GitHubArtifact) => - artifact.name.toLowerCase().includes('impute') || - artifact.name.toLowerCase().includes('imputation') || - artifact.name.toLowerCase().includes('result') || - artifact.name.toLowerCase().includes('.csv') - ); - - allArtifacts.push(...imputationArtifacts); - } catch { - continue; - } - } - - if (allArtifacts.length === 0) { + if (uniqueArtifacts.length === 0) { setError('No imputation artifacts found for this commit.'); return; } - // Remove duplicates and sort by creation date (newest first) - const uniqueArtifacts = allArtifacts - .filter((artifact, index, self) => - index === self.findIndex(a => a.name === artifact.name) - ) - .sort((a, b) => new Date(b.created_at).getTime() - new 
Date(a.created_at).getTime()); - setAvailableArtifacts(uniqueArtifacts); // Auto-select the first artifact @@ -791,25 +653,15 @@ export default function FileUpload({ return; } - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoading(true); setError(''); try { setError('🔄 Downloading and extracting CSV from artifact...'); - const downloadResponse = await fetch(artifact.archive_download_url, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }); + const downloadResponse = await fetch( + `/api/github/download?url=${encodeURIComponent(artifact.archive_download_url)}` + ); if (!downloadResponse.ok) { throw new Error(`Failed to download artifact: ${downloadResponse.status}`); @@ -887,28 +739,20 @@ export default function FileUpload({ async function fetchSecondBranchCommits(branch: string) { if (!githubRepo.trim() || !branch) return; - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoadingGithubData(true); try { - const response = await fetch(`https://api.github.com/repos/${githubRepo}/commits?sha=${branch}&per_page=20`, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }); + const response = await fetch( + `/api/github/commits?repo=${encodeURIComponent(githubRepo)}&branch=${encodeURIComponent(branch)}` + ); + if (!response.ok) { if (response.status === 404) { throw new Error('Branch not found or repository is private.'); } else if (response.status === 403) { throw new Error('Access forbidden. 
Please check your GitHub token permissions or repository access.'); } - throw new Error(`Failed to fetch commits: ${response.status} ${response.statusText}`); + const errorData = await response.json(); + throw new Error(errorData.error || `Failed to fetch commits: ${response.status}`); } const commits: GitHubCommit[] = await response.json(); @@ -929,98 +773,32 @@ export default function FileUpload({ async function fetchSecondArtifacts(commitSha: string) { if (!githubRepo.trim() || !commitSha) return; - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoadingGithubData(true); setSecondArtifacts([]); setSelectedSecondArtifact(''); try { - const [owner, repo] = githubRepo.split('/'); - - // Get workflow runs for the commit - const runsResponse = await fetch( - `https://api.github.com/repos/${owner}/${repo}/actions/runs?head_sha=${commitSha}`, - { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - } + const response = await fetch( + `/api/github/artifacts?repo=${encodeURIComponent(githubRepo)}&commit=${encodeURIComponent(commitSha)}` ); - if (!runsResponse.ok) { - if (runsResponse.status === 403) { + if (!response.ok) { + if (response.status === 403) { throw new Error(`GitHub API rate limit exceeded or token permissions insufficient (403). Please try again later or check your token permissions.`); - } else if (runsResponse.status === 404) { + } else if (response.status === 404) { throw new Error(`Repository or commit not found (404). 
Please check the repository name and commit SHA.`); - } else { - throw new Error(`Failed to fetch workflow runs: ${runsResponse.status} ${runsResponse.statusText}`); } + const errorData = await response.json(); + throw new Error(errorData.error || `Failed to fetch artifacts: ${response.status}`); } - const runsData = await runsResponse.json(); - const runs = runsData.workflow_runs; - - if (!runs || runs.length === 0) { - setError('No workflow runs found for this commit.'); - return; - } - - // Collect all imputation artifacts from completed runs - const allArtifacts: GitHubArtifact[] = []; - - for (const run of runs) { - if (run.status !== 'completed') continue; - - try { - const artifactsResponse = await fetch( - `https://api.github.com/repos/${owner}/${repo}/actions/runs/${run.id}/artifacts`, - { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - } - ); + const uniqueArtifacts: GitHubArtifact[] = await response.json(); - if (!artifactsResponse.ok) continue; - - const artifactsData = await artifactsResponse.json(); - const artifacts = artifactsData.artifacts; - - // Filter for imputation artifacts - const imputationArtifacts = artifacts.filter((artifact: GitHubArtifact) => - artifact.name.toLowerCase().includes('impute') || - artifact.name.toLowerCase().includes('imputation') || - artifact.name.toLowerCase().includes('result') || - artifact.name.toLowerCase().includes('.csv') - ); - - allArtifacts.push(...imputationArtifacts); - } catch { - continue; - } - } - - if (allArtifacts.length === 0) { + if (uniqueArtifacts.length === 0) { setError('No imputation artifacts found for this commit.'); return; } - // Remove duplicates and sort by creation date (newest first) - const uniqueArtifacts = allArtifacts - .filter((artifact, index, self) => - index === self.findIndex(a => a.name === artifact.name) - ) - .sort((a, b) => new Date(b.created_at).getTime() - new 
Date(a.created_at).getTime()); - setSecondArtifacts(uniqueArtifacts); // Auto-select the first artifact @@ -1049,12 +827,6 @@ export default function FileUpload({ return; } - const githubToken = process.env.NEXT_PUBLIC_GITHUB_TOKEN; - if (!githubToken) { - setError('GitHub token not configured. Please set NEXT_PUBLIC_GITHUB_TOKEN environment variable.'); - return; - } - setIsLoading(true); setError(''); @@ -1063,20 +835,8 @@ export default function FileUpload({ // Download both artifacts const [firstDownload, secondDownload] = await Promise.all([ - fetch(firstArtifact.archive_download_url, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }), - fetch(secondArtifact.archive_download_url, { - headers: { - 'Authorization': `Bearer ${githubToken}`, - 'Accept': 'application/vnd.github.v3+json', - 'User-Agent': 'PolicyEngine-Dashboard/1.0' - } - }) + fetch(`/api/github/download?url=${encodeURIComponent(firstArtifact.archive_download_url)}`), + fetch(`/api/github/download?url=${encodeURIComponent(secondArtifact.archive_download_url)}`) ]); if (!firstDownload.ok || !secondDownload.ok) { @@ -1176,7 +936,11 @@ export default function FileUpload({ {/* Tab navigation */}
+ ))} + +
+ ); +} diff --git a/microimputation-dashboard/types/imputation.ts b/microimputation-dashboard/types/imputation.ts index c6163bc..799862d 100644 --- a/microimputation-dashboard/types/imputation.ts +++ b/microimputation-dashboard/types/imputation.ts @@ -1,13 +1,13 @@ // Type definitions for microimputation data export interface ImputationDataPoint { - // Add fields based on what microimpute outputs - // These are placeholder fields that will be updated based on actual CSV structure - id?: string; - variable?: string; - original_value?: number; - imputed_value?: number; - method?: string; - confidence?: number; + type: string; // e.g., "benchmark_loss", "distribution_distance", "predictor_correlation" + method: string; // e.g., "QRF", "OLS", "QuantReg", "Matching" + variable: string; // e.g., "quantile_loss_mean_all", "log_loss_mean_all", or actual variable names + quantile: string | number; // numeric (0.05, 0.1, etc.), "mean", or "N/A" + metric_name: string; // e.g., "quantile_loss", "log_loss" + metric_value: number | null; // numeric value of the metric + split: string; // e.g., "train", "test", "full" + additional_info: string; // JSON-formatted string with metadata [key: string]: any; // Allow additional fields } diff --git a/microimputation-dashboard/utils/colors.ts b/microimputation-dashboard/utils/colors.ts new file mode 100644 index 0000000..9e7e870 --- /dev/null +++ b/microimputation-dashboard/utils/colors.ts @@ -0,0 +1,29 @@ +// Consistent color mapping for imputation methods across all charts +// Using Plotly color palette for consistency with Python visualizations + +export const METHOD_COLORS: Record = { + QRF: '#636EFA', // Plotly blue + OLS: '#EF553B', // Plotly red + QuantReg: '#00CC96', // Plotly teal + Matching: '#AB63FA', // Plotly purple + // Add more methods as needed +}; + +export const FALLBACK_COLORS = [ + '#FFA15A', // Plotly orange + '#19D3F3', // Plotly cyan + '#FF6692', // Plotly pink + '#B6E880', // Plotly lime + '#FF97FF', // Plotly 
magenta + '#FECB52', // Plotly yellow +]; + +/** + * Get color for a method, using predefined colors or fallback palette + */ +export function getMethodColor(method: string, index: number = 0): string { + if (method in METHOD_COLORS) { + return METHOD_COLORS[method]; + } + return FALLBACK_COLORS[index % FALLBACK_COLORS.length]; +} From ff998d361bf28893a18093e92d2505f00ef92c9f Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Wed, 22 Oct 2025 15:24:37 +0800 Subject: [PATCH 03/12] fix linting --- changelog_entry.yaml | 1 + .../app/api/github/artifacts/route.ts | 2 +- .../components/BenchmarkLossCharts.tsx | 5 ++--- microimputation-dashboard/components/FileUpload.tsx | 2 +- .../components/PerVariableCharts.tsx | 8 ++++---- .../components/VisualizationTabs.tsx | 2 -- 6 files changed, 9 insertions(+), 11 deletions(-) diff --git a/changelog_entry.yaml b/changelog_entry.yaml index 9670cc6..39bbe07 100644 --- a/changelog_entry.yaml +++ b/changelog_entry.yaml @@ -2,3 +2,4 @@ changes: added: - Links to dashboard in README.md and documentation. + - First dashboard visualizations. 
diff --git a/microimputation-dashboard/app/api/github/artifacts/route.ts b/microimputation-dashboard/app/api/github/artifacts/route.ts index d071169..1ab5163 100644 --- a/microimputation-dashboard/app/api/github/artifacts/route.ts +++ b/microimputation-dashboard/app/api/github/artifacts/route.ts @@ -92,7 +92,7 @@ export async function GET(request: NextRequest) { // Remove duplicates and sort by creation date (newest first) const uniqueArtifacts = allArtifacts .filter( - (artifact: { name: string }, index: number, self: any[]) => + (artifact: { name: string }, index: number, self: Array<{ name: string }>) => index === self.findIndex((a: { name: string }) => a.name === artifact.name) ) diff --git a/microimputation-dashboard/components/BenchmarkLossCharts.tsx b/microimputation-dashboard/components/BenchmarkLossCharts.tsx index c057e93..70a00c3 100644 --- a/microimputation-dashboard/components/BenchmarkLossCharts.tsx +++ b/microimputation-dashboard/components/BenchmarkLossCharts.tsx @@ -11,7 +11,6 @@ import { Tooltip, Legend, ResponsiveContainer, - ReferenceLine, } from 'recharts'; import { ImputationDataPoint } from '@/types/imputation'; import { getMethodColor } from '@/utils/colors'; @@ -60,7 +59,7 @@ export default function BenchmarkLossCharts({ data }: BenchmarkLossChartsProps) if (quantileLossData.length === 0) return []; // Group by quantile - const quantileMap = new Map>(); + const quantileMap = new Map>(); quantileLossData.forEach(d => { const quantile = Number(d.quantile); @@ -72,7 +71,7 @@ export default function BenchmarkLossCharts({ data }: BenchmarkLossChartsProps) }); return Array.from(quantileMap.values()).sort( - (a, b) => parseFloat(a.quantile) - parseFloat(b.quantile) + (a, b) => parseFloat(a.quantile as string) - parseFloat(b.quantile as string) ); }, [quantileLossData]); diff --git a/microimputation-dashboard/components/FileUpload.tsx b/microimputation-dashboard/components/FileUpload.tsx index 52eb223..6ac9f63 100644 --- 
a/microimputation-dashboard/components/FileUpload.tsx +++ b/microimputation-dashboard/components/FileUpload.tsx @@ -401,7 +401,7 @@ export default function FileUpload({ } let url: URL; - let finalUrl = urlInput.trim(); + const finalUrl = urlInput.trim(); try { url = new URL(finalUrl); diff --git a/microimputation-dashboard/components/PerVariableCharts.tsx b/microimputation-dashboard/components/PerVariableCharts.tsx index 7f7302e..01f5933 100644 --- a/microimputation-dashboard/components/PerVariableCharts.tsx +++ b/microimputation-dashboard/components/PerVariableCharts.tsx @@ -50,7 +50,7 @@ export default function PerVariableCharts({ typeof d.quantile === 'number' && d.quantile >= 0 && d.quantile <= 1 ); - const quantileMap = new Map>(); + const quantileMap = new Map>(); numericData.forEach((d) => { const quantile = Number(d.quantile); @@ -62,7 +62,7 @@ export default function PerVariableCharts({ }); return Array.from(quantileMap.values()).sort( - (a, b) => parseFloat(a.quantile) - parseFloat(b.quantile) + (a, b) => parseFloat(a.quantile as string) - parseFloat(b.quantile as string) ); }, [variableData, metricType]); @@ -104,7 +104,7 @@ export default function PerVariableCharts({ {metricType === 'quantile_loss' && quantileChartData.length > 0 && (

- Quantile Loss by Method for "{variable}" + Quantile Loss by Method for "{variable}"

@@ -153,7 +153,7 @@ export default function PerVariableCharts({ {metricType === 'log_loss' && logLossChartData.length > 0 && (

- Log Loss by Method for "{variable}" + Log Loss by Method for "{variable}"

diff --git a/microimputation-dashboard/components/VisualizationTabs.tsx b/microimputation-dashboard/components/VisualizationTabs.tsx index 5dfbef1..25c9736 100644 --- a/microimputation-dashboard/components/VisualizationTabs.tsx +++ b/microimputation-dashboard/components/VisualizationTabs.tsx @@ -1,7 +1,5 @@ 'use client'; -import { useState } from 'react'; - interface Tab { id: string; label: string; From 90f43023250a7f586ef239de1664e15d01e2dc77 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 12:14:48 +0800 Subject: [PATCH 04/12] fix all loading pages --- .gitignore | 1 + microimputation-dashboard/app/page.tsx | 51 +-- .../components/FileUpload.tsx | 390 ++---------------- .../components/VisualizationDashboard.tsx | 15 +- .../public/microimputation_results.csv | 294 +++++++++++++ microimputation-dashboard/utils/deeplinks.ts | 97 +---- 6 files changed, 348 insertions(+), 500 deletions(-) create mode 100644 microimputation-dashboard/public/microimputation_results.csv diff --git a/.gitignore b/.gitignore index 555168e..a790fe1 100644 --- a/.gitignore +++ b/.gitignore @@ -76,6 +76,7 @@ celerybeat.pid # Ignore Data Files *.csv +!microimputation-dashboard/**/*.csv *.jpg *.html *.h5 diff --git a/microimputation-dashboard/app/page.tsx b/microimputation-dashboard/app/page.tsx index c24753a..8905f4e 100644 --- a/microimputation-dashboard/app/page.tsx +++ b/microimputation-dashboard/app/page.tsx @@ -13,18 +13,7 @@ function HomeContent() { const [fileName, setFileName] = useState(''); const [showDashboard, setShowDashboard] = useState(false); const [isLoadingFromDeeplink, setIsLoadingFromDeeplink] = useState(false); - const [githubArtifactInfo, setGithubArtifactInfo] = useState<{ - primary: GitHubArtifactInfo | null; - secondary?: GitHubArtifactInfo | null; - } | null>(null); - - // Comparison mode state - const [comparisonData, setComparisonData] = useState<{ - data1: ImputationDataPoint[]; - filename1: string; - data2: ImputationDataPoint[]; - filename2: 
string; - } | null>(null); + const [githubArtifactInfo, setGithubArtifactInfo] = useState(null); const searchParams = useSearchParams(); const deeplinkParams = parseDeeplinkParams(searchParams); @@ -40,32 +29,14 @@ function HomeContent() { const parsedData = parseImputationCSV(csvContent); setData(parsedData); setFileName(filename); - setComparisonData(null); // Clear comparison data when loading single file } catch (error) { console.error('Error parsing CSV:', error); alert('Failed to parse CSV file. Please check the file format.'); } }; - const handleCompareLoad = (content1: string, filename1: string, content2: string, filename2: string) => { - try { - const data1 = parseImputationCSV(content1); - const data2 = parseImputationCSV(content2); - setComparisonData({ - data1, - filename1, - data2, - filename2 - }); - setData([]); // Clear single data when loading comparison - } catch (error) { - console.error('Error parsing comparison CSVs:', error); - alert('Failed to parse one or both CSV files. 
Please check the file formats.'); - } - }; - const handleViewDashboard = () => { - if (data.length > 0 || comparisonData) { + if (data.length > 0) { setShowDashboard(true); } }; @@ -74,21 +45,20 @@ function HomeContent() { setShowDashboard(false); setData([]); setFileName(''); - setComparisonData(null); setGithubArtifactInfo(null); }; - const handleDeeplinkLoadComplete = (primary: GitHubArtifactInfo | null, secondary?: GitHubArtifactInfo | null) => { + const handleDeeplinkLoadComplete = (primary: GitHubArtifactInfo | null) => { setIsLoadingFromDeeplink(false); if (primary) { - setGithubArtifactInfo({ primary, secondary: secondary || undefined }); + setGithubArtifactInfo(primary); setShowDashboard(true); } }; - const handleGithubLoad = (primary: GitHubArtifactInfo | null, secondary?: GitHubArtifactInfo | null) => { + const handleGithubLoad = (primary: GitHubArtifactInfo | null) => { if (primary) { - setGithubArtifactInfo({ primary, secondary: secondary || undefined }); + setGithubArtifactInfo(primary); } }; @@ -125,7 +95,6 @@ function HomeContent() { ) : ( )} diff --git a/microimputation-dashboard/components/FileUpload.tsx b/microimputation-dashboard/components/FileUpload.tsx index 6ac9f63..a9bf564 100644 --- a/microimputation-dashboard/components/FileUpload.tsx +++ b/microimputation-dashboard/components/FileUpload.tsx @@ -8,11 +8,10 @@ import { DeeplinkParams, GitHubArtifactInfo } from '@/utils/deeplinks'; interface FileUploadProps { onFileLoad: (content: string, filename: string) => void; onViewDashboard: () => void; - onCompareLoad?: (content1: string, filename1: string, content2: string, filename2: string) => void; deeplinkParams?: DeeplinkParams | null; isLoadingFromDeeplink?: boolean; - onDeeplinkLoadComplete?: (primary: GitHubArtifactInfo | null, secondary?: GitHubArtifactInfo | null | undefined) => void; - onGithubLoad?: (primary: GitHubArtifactInfo | null, secondary?: GitHubArtifactInfo | null) => void; + onDeeplinkLoadComplete?: (primary: 
GitHubArtifactInfo | null) => void; + onGithubLoad?: (primary: GitHubArtifactInfo | null) => void; } interface GitHubCommit { @@ -43,7 +42,6 @@ interface GitHubArtifact { export default function FileUpload({ onFileLoad, onViewDashboard, - onCompareLoad, deeplinkParams, isLoadingFromDeeplink, onDeeplinkLoadComplete, @@ -66,14 +64,6 @@ export default function FileUpload({ const [selectedArtifact, setSelectedArtifact] = useState(''); const [isLoadingGithubData, setIsLoadingGithubData] = useState(false); - // Comparison mode state - const [comparisonMode, setComparisonMode] = useState(false); - const [selectedSecondBranch, setSelectedSecondBranch] = useState(''); - const [secondCommits, setSecondCommits] = useState([]); - const [selectedSecondCommit, setSelectedSecondCommit] = useState(''); - const [secondArtifacts, setSecondArtifacts] = useState([]); - const [selectedSecondArtifact, setSelectedSecondArtifact] = useState(''); - // Helper function to load a single artifact from deeplink parameters const loadArtifactFromDeeplink = useCallback(async (artifactInfo: GitHubArtifactInfo): Promise => { // Get artifacts for the specific commit using API route @@ -125,7 +115,7 @@ export default function FileUpload({ }, []); // Load GitHub artifacts directly from deeplink parameters - const loadDeeplinkArtifacts = useCallback(async (primary: GitHubArtifactInfo, secondary?: GitHubArtifactInfo) => { + const loadDeeplinkArtifacts = useCallback(async (primary: GitHubArtifactInfo) => { setIsLoading(true); setError(''); @@ -135,26 +125,14 @@ export default function FileUpload({ // Load primary artifact const primaryData = await loadArtifactFromDeeplink(primary); - if (secondary && onCompareLoad) { - // Load secondary artifact for comparison - const secondaryData = await loadArtifactFromDeeplink(secondary); - - // Generate display names with commit info - const primaryDisplayName = `${primary.repo}@${primary.branch} (${primary.commit.substring(0, 7)}) - ${primary.artifact}`; - const 
secondaryDisplayName = `${secondary.repo}@${secondary.branch} (${secondary.commit.substring(0, 7)}) - ${secondary.artifact}`; - - onCompareLoad(primaryData, primaryDisplayName, secondaryData, secondaryDisplayName); - setLoadedFile(`Comparison: ${primaryDisplayName} vs ${secondaryDisplayName}`); - } else { - // Single artifact load - const displayName = `${primary.repo}@${primary.branch} (${primary.commit.substring(0, 7)}) - ${primary.artifact}`; - onFileLoad(primaryData, displayName); - setLoadedFile(displayName); - } + // Single artifact load + const displayName = `${primary.repo}@${primary.branch} (${primary.commit.substring(0, 7)}) - ${primary.artifact}`; + onFileLoad(primaryData, displayName); + setLoadedFile(displayName); // Notify parent component that deeplink loading is complete if (onDeeplinkLoadComplete) { - onDeeplinkLoadComplete(primary, secondary); + onDeeplinkLoadComplete(primary); } setError(''); @@ -166,35 +144,19 @@ export default function FileUpload({ } finally { setIsLoading(false); } - }, [onFileLoad, onCompareLoad, onDeeplinkLoadComplete, loadArtifactFromDeeplink]); + }, [onFileLoad, onDeeplinkLoadComplete, loadArtifactFromDeeplink]); // Handle deeplink loading on mount useEffect(() => { - if (deeplinkParams && isLoadingFromDeeplink) { + if (deeplinkParams && isLoadingFromDeeplink && deeplinkParams.primary) { setActiveTab('github'); + setGithubRepo(deeplinkParams.primary.repo); + setSelectedBranch(deeplinkParams.primary.branch); + setSelectedCommit(deeplinkParams.primary.commit); + setSelectedArtifact(deeplinkParams.primary.artifact); - if (deeplinkParams.mode === 'comparison' && deeplinkParams.primary && deeplinkParams.secondary) { - setComparisonMode(true); - setGithubRepo(deeplinkParams.primary.repo); - setSelectedBranch(deeplinkParams.primary.branch); - setSelectedCommit(deeplinkParams.primary.commit); - setSelectedArtifact(deeplinkParams.primary.artifact); - setSelectedSecondBranch(deeplinkParams.secondary.branch); - 
setSelectedSecondCommit(deeplinkParams.secondary.commit); - setSelectedSecondArtifact(deeplinkParams.secondary.artifact); - - // Auto-load comparison data - loadDeeplinkArtifacts(deeplinkParams.primary, deeplinkParams.secondary); - } else if (deeplinkParams.primary) { - setComparisonMode(false); - setGithubRepo(deeplinkParams.primary.repo); - setSelectedBranch(deeplinkParams.primary.branch); - setSelectedCommit(deeplinkParams.primary.commit); - setSelectedArtifact(deeplinkParams.primary.artifact); - - // Auto-load single artifact data - loadDeeplinkArtifacts(deeplinkParams.primary); - } + // Auto-load artifact data + loadDeeplinkArtifacts(deeplinkParams.primary); } }, [deeplinkParams, isLoadingFromDeeplink, loadDeeplinkArtifacts]); @@ -540,7 +502,7 @@ export default function FileUpload({ if (!response.ok) { if (response.status === 404) { - throw new Error('Repository not found. Please check the repository name and ensure it is accessible.'); + throw new Error('Repository not found. Please check the repository name and ensure it is publicly accessible.'); } else if (response.status === 403) { throw new Error('Access forbidden. Please check your GitHub token permissions or repository access.'); } @@ -716,7 +678,7 @@ export default function FileUpload({ commit: selectedCommit, artifact: artifact.name }; - onGithubLoad(artifactInfo, null); + onGithubLoad(artifactInfo); } // Clear the GitHub state since we successfully loaded the file @@ -736,183 +698,6 @@ export default function FileUpload({ } } - async function fetchSecondBranchCommits(branch: string) { - if (!githubRepo.trim() || !branch) return; - - setIsLoadingGithubData(true); - try { - const response = await fetch( - `/api/github/commits?repo=${encodeURIComponent(githubRepo)}&branch=${encodeURIComponent(branch)}` - ); - - if (!response.ok) { - if (response.status === 404) { - throw new Error('Branch not found or repository is private.'); - } else if (response.status === 403) { - throw new Error('Access forbidden. 
Please check your GitHub token permissions or repository access.'); - } - const errorData = await response.json(); - throw new Error(errorData.error || `Failed to fetch commits: ${response.status}`); - } - - const commits: GitHubCommit[] = await response.json(); - setSecondCommits(commits); - - // Auto-select latest commit and fetch its artifacts - if (commits.length > 0) { - setSelectedSecondCommit(commits[0].sha); - await fetchSecondArtifacts(commits[0].sha); - } - } catch (err) { - setError(`GitHub API error: ${err instanceof Error ? err.message : 'Unknown error'}`); - } finally { - setIsLoadingGithubData(false); - } - } - - async function fetchSecondArtifacts(commitSha: string) { - if (!githubRepo.trim() || !commitSha) return; - - setIsLoadingGithubData(true); - setSecondArtifacts([]); - setSelectedSecondArtifact(''); - - try { - const response = await fetch( - `/api/github/artifacts?repo=${encodeURIComponent(githubRepo)}&commit=${encodeURIComponent(commitSha)}` - ); - - if (!response.ok) { - if (response.status === 403) { - throw new Error(`GitHub API rate limit exceeded or token permissions insufficient (403). Please try again later or check your token permissions.`); - } else if (response.status === 404) { - throw new Error(`Repository or commit not found (404). Please check the repository name and commit SHA.`); - } - const errorData = await response.json(); - throw new Error(errorData.error || `Failed to fetch artifacts: ${response.status}`); - } - - const uniqueArtifacts: GitHubArtifact[] = await response.json(); - - if (uniqueArtifacts.length === 0) { - setError('No imputation artifacts found for this commit.'); - return; - } - - setSecondArtifacts(uniqueArtifacts); - - // Auto-select the first artifact - if (uniqueArtifacts.length > 0) { - setSelectedSecondArtifact(uniqueArtifacts[0].id.toString()); - } - - } catch (err) { - setError(`Failed to fetch artifacts: ${err instanceof Error ? 
err.message : 'Unknown error'}`); - } finally { - setIsLoadingGithubData(false); - } - } - - async function loadComparisonData() { - if (!selectedArtifact || !selectedSecondArtifact || !onCompareLoad) { - setError('Please select artifacts from both commits to compare'); - return; - } - - const firstArtifact = availableArtifacts.find(a => a.id.toString() === selectedArtifact); - const secondArtifact = secondArtifacts.find(a => a.id.toString() === selectedSecondArtifact); - - if (!firstArtifact || !secondArtifact) { - setError('Selected artifacts not found'); - return; - } - - setIsLoading(true); - setError(''); - - try { - setError('🔄 Downloading and extracting CSV files for comparison...'); - - // Download both artifacts - const [firstDownload, secondDownload] = await Promise.all([ - fetch(`/api/github/download?url=${encodeURIComponent(firstArtifact.archive_download_url)}`), - fetch(`/api/github/download?url=${encodeURIComponent(secondArtifact.archive_download_url)}`) - ]); - - if (!firstDownload.ok || !secondDownload.ok) { - throw new Error('Failed to download one or both artifacts'); - } - - // Extract CSVs from both artifacts - const [firstZipBuffer, secondZipBuffer] = await Promise.all([ - firstDownload.arrayBuffer(), - secondDownload.arrayBuffer() - ]); - - const firstZip = new JSZip(); - const secondZip = new JSZip(); - const [firstZipContent, secondZipContent] = await Promise.all([ - firstZip.loadAsync(firstZipBuffer), - secondZip.loadAsync(secondZipBuffer) - ]); - - // Find CSV files in both ZIPs - const firstCsvFiles = Object.keys(firstZipContent.files).filter(filename => - filename.toLowerCase().endsWith('.csv') && !firstZipContent.files[filename].dir - ); - const secondCsvFiles = Object.keys(secondZipContent.files).filter(filename => - filename.toLowerCase().endsWith('.csv') && !secondZipContent.files[filename].dir - ); - - if (firstCsvFiles.length === 0 || secondCsvFiles.length === 0) { - throw new Error('No CSV files found in one or both artifacts'); - 
} - - // Extract CSV content - const [firstCsvContent, secondCsvContent] = await Promise.all([ - firstZipContent.files[firstCsvFiles[0]].async('text'), - secondZipContent.files[secondCsvFiles[0]].async('text') - ]); - - // Create display names with commit info - const firstCommitShort = selectedCommit.slice(0, 8); - const secondCommitShort = selectedSecondCommit.slice(0, 8); - - const firstBranchInfo = selectedBranch !== selectedSecondBranch ? ` (${selectedBranch})` : ''; - const secondBranchInfo = selectedBranch !== selectedSecondBranch ? ` (${selectedSecondBranch})` : ''; - - const firstName = `${firstCsvFiles[0]} @ ${firstCommitShort}${firstBranchInfo}`; - const secondName = `${secondCsvFiles[0]} @ ${secondCommitShort}${secondBranchInfo}`; - - // Load into comparison mode - onCompareLoad(firstCsvContent, firstName, secondCsvContent, secondName); - - // Notify parent component about GitHub artifact info for sharing - if (onGithubLoad) { - const primaryArtifactInfo: GitHubArtifactInfo = { - repo: githubRepo, - branch: selectedBranch, - commit: selectedCommit, - artifact: firstArtifact.name - }; - const secondaryArtifactInfo: GitHubArtifactInfo = { - repo: githubRepo, - branch: selectedSecondBranch, - commit: selectedSecondCommit, - artifact: secondArtifact.name - }; - onGithubLoad(primaryArtifactInfo, secondaryArtifactInfo); - } - - setError(''); - - } catch (extractError) { - console.error('Comparison extraction error:', extractError); - setError(`❌ Failed to extract comparison data: ${extractError instanceof Error ? extractError.message : 'Unknown error'}`); - } finally { - setIsLoading(false); - } - } return (
@@ -922,8 +707,14 @@ export default function FileUpload({
{error && ( -
-

{error}

+
+

{error}

)} @@ -1121,34 +912,6 @@ export default function FileUpload({
- {/* Comparison Mode Toggle */} -
- -

- Enable this to compare imputation results between different branches or commits -

-
- {/* Branch Selection */} {githubBranches.length > 0 && (
@@ -1236,109 +999,14 @@ export default function FileUpload({
)} - {/* Second Selection for Comparison */} - {comparisonMode && githubBranches.length > 0 && ( -
-

Second Imputation Run (for comparison)

- - {/* Second Branch Selection */} -
- - -
- - {/* Second Commit Selection */} - {secondCommits.length > 0 && ( -
- - - {selectedSecondCommit && ( -

- {secondCommits.find(c => c.sha === selectedSecondCommit)?.commit.author.date && - new Date(secondCommits.find(c => c.sha === selectedSecondCommit)!.commit.author.date).toLocaleString() - } -

- )} -
- )} - - {/* Second Artifact Selection */} - {secondArtifacts.length > 0 && ( -
- - - {selectedSecondArtifact && ( -

- {secondArtifacts.find(a => a.id.toString() === selectedSecondArtifact)?.created_at && - `Created: ${new Date(secondArtifacts.find(a => a.id.toString() === selectedSecondArtifact)!.created_at).toLocaleString()}` - } -

- )} -
- )} -
- )} - {/* Load Button */} - {selectedArtifact && (!comparisonMode || selectedSecondArtifact) && ( + {selectedArtifact && ( )} diff --git a/microimputation-dashboard/components/VisualizationDashboard.tsx b/microimputation-dashboard/components/VisualizationDashboard.tsx index ffdf3cd..6e046dd 100644 --- a/microimputation-dashboard/components/VisualizationDashboard.tsx +++ b/microimputation-dashboard/components/VisualizationDashboard.tsx @@ -10,20 +10,12 @@ import VisualizationTabs from './VisualizationTabs'; interface VisualizationDashboardProps { data: ImputationDataPoint[]; fileName: string; - comparisonData?: { - data: ImputationDataPoint[]; - filename: string; - }; - githubArtifactInfo?: { - primary: GitHubArtifactInfo | null; - secondary?: GitHubArtifactInfo | null; - } | null; + githubArtifactInfo?: GitHubArtifactInfo | null; } export default function VisualizationDashboard({ data, fileName, - comparisonData, }: VisualizationDashboardProps) { const [activeTab, setActiveTab] = useState('overview'); @@ -145,11 +137,6 @@ export default function VisualizationDashboard({ Categorical variables: {dataAnalysis.categoricalVars.length}

)} - {comparisonData && ( -

- Comparison file: {comparisonData.filename} ({comparisonData.data.length} records) -

- )}
diff --git a/microimputation-dashboard/public/microimputation_results.csv b/microimputation-dashboard/public/microimputation_results.csv new file mode 100644 index 0000000..9ef58a5 --- /dev/null +++ b/microimputation-dashboard/public/microimputation_results.csv @@ -0,0 +1,294 @@ +type,method,variable,quantile,metric_name,metric_value,split,additional_info +benchmark_loss,QRF,quantile_loss_mean_all,0.05,quantile_loss,0.0019931334519540313,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.1,quantile_loss,0.003676832529510976,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.15,quantile_loss,0.005051964323131603,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.2,quantile_loss,0.007150055272652542,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.25,quantile_loss,0.007272266767142256,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.3,quantile_loss,0.008540254219041532,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.35,quantile_loss,0.007621934560531267,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.4,quantile_loss,0.00916139860523047,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.45,quantile_loss,0.008137742361262587,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.5,quantile_loss,0.008501949409742712,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.55,quantile_loss,0.006943288815511526,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.6,quantile_loss,0.006674970777747578,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.65,quantile_loss,0.006300488362370938,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.7,quantile_loss,0.005762547086974565,train,"{""n_variables"": 2}" 
+benchmark_loss,QRF,quantile_loss_mean_all,0.75,quantile_loss,0.005910973227513356,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.8,quantile_loss,0.005674293245652812,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.85,quantile_loss,0.0045532698330881145,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.9,quantile_loss,0.003777490459909232,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.95,quantile_loss,0.0022857221356438738,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.05,quantile_loss,0.004976762851613436,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.1,quantile_loss,0.007958901707037789,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.15,quantile_loss,0.011348256884255009,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.2,quantile_loss,0.014479045607066829,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.25,quantile_loss,0.01804729212868635,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.3,quantile_loss,0.020713966247658862,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.35,quantile_loss,0.022742931417508282,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.4,quantile_loss,0.02258721277917371,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.45,quantile_loss,0.023351581275292608,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.5,quantile_loss,0.023625607730980425,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.55,quantile_loss,0.023186470004863385,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.6,quantile_loss,0.022905432991342744,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.65,quantile_loss,0.022230731438156376,test,"{""n_variables"": 2}" 
+benchmark_loss,QRF,quantile_loss_mean_all,0.7,quantile_loss,0.02057637886132135,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.75,quantile_loss,0.01912773338390523,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.8,quantile_loss,0.01739101077609373,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.85,quantile_loss,0.013723503511700213,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.9,quantile_loss,0.010967503180152355,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,0.95,quantile_loss,0.0071899999204732045,test,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,mean,quantile_loss,0.006052135549716419,train,"{""n_variables"": 2}" +benchmark_loss,QRF,quantile_loss_mean_all,mean,quantile_loss,0.017217385405120095,test,"{""n_variables"": 2}" +benchmark_loss,QRF,log_loss_mean_all,0.05,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.1,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.15,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.2,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.25,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.3,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.35,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.4,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.45,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.5,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.55,log_loss,2.614446654065684,train,"{""n_variables"": 1}" 
+benchmark_loss,QRF,log_loss_mean_all,0.6,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.65,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.7,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.75,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.8,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.85,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.9,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.95,log_loss,2.614446654065684,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.05,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.1,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.15,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.2,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.25,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.3,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.35,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.4,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.45,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.5,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.55,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.6,log_loss,6.156691078407442,test,"{""n_variables"": 1}" 
+benchmark_loss,QRF,log_loss_mean_all,0.65,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.7,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.75,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.8,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.85,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.9,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,0.95,log_loss,6.156691078407442,test,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,mean,log_loss,2.6144466540656834,train,"{""n_variables"": 1}" +benchmark_loss,QRF,log_loss_mean_all,mean,log_loss,6.156691078407443,test,"{""n_variables"": 1}" +benchmark_loss,OLS,quantile_loss_mean_all,0.05,quantile_loss,0.003793097970980961,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.1,quantile_loss,0.0064813273535348865,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.15,quantile_loss,0.008718559399878228,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.2,quantile_loss,0.010655610008580571,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.25,quantile_loss,0.012256033388805257,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.3,quantile_loss,0.013565140770903024,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.35,quantile_loss,0.014611889242340062,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.4,quantile_loss,0.015425975031196375,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.45,quantile_loss,0.01605944525518228,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.5,quantile_loss,0.01647854556609527,train,"{""n_variables"": 2}" 
+benchmark_loss,OLS,quantile_loss_mean_all,0.55,quantile_loss,0.01661220911122457,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.6,quantile_loss,0.01645760847896342,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.65,quantile_loss,0.016061546015992825,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.7,quantile_loss,0.015395729893732578,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.75,quantile_loss,0.014398366337920352,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.8,quantile_loss,0.012997538438059541,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.85,quantile_loss,0.011142832423357984,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.9,quantile_loss,0.008676966523108521,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.95,quantile_loss,0.0053039200554893294,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.05,quantile_loss,0.003875743024333408,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.1,quantile_loss,0.006636892853346667,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.15,quantile_loss,0.008964045456920146,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.2,quantile_loss,0.010925268697485854,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.25,quantile_loss,0.012586171018988979,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.3,quantile_loss,0.013971078532560128,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.35,quantile_loss,0.015078371048174203,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.4,quantile_loss,0.015960673093506517,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.45,quantile_loss,0.016611314804344936,test,"{""n_variables"": 2}" 
+benchmark_loss,OLS,quantile_loss_mean_all,0.5,quantile_loss,0.017023427694261576,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.55,quantile_loss,0.017162262823655853,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.6,quantile_loss,0.016994331164241493,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.65,quantile_loss,0.016563877768320707,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.7,quantile_loss,0.01584349745574873,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.75,quantile_loss,0.014830479499612956,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.8,quantile_loss,0.013414418494530157,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.85,quantile_loss,0.011604173888267462,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.9,quantile_loss,0.009116693282835488,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,0.95,quantile_loss,0.005653910575626517,test,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,mean,quantile_loss,0.012373281119228738,train,"{""n_variables"": 2}" +benchmark_loss,OLS,quantile_loss_mean_all,mean,quantile_loss,0.012779822693513777,test,"{""n_variables"": 2}" +benchmark_loss,OLS,log_loss_mean_all,0.05,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.1,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.15,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.2,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.25,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.3,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" 
+benchmark_loss,OLS,log_loss_mean_all,0.35,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.4,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.45,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.5,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.55,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.6,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.65,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.7,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.75,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.8,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.85,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.9,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.95,log_loss,0.9858032860627665,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.05,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.1,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.15,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.2,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.25,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.3,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.35,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" 
+benchmark_loss,OLS,log_loss_mean_all,0.4,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.45,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.5,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.55,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.6,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.65,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.7,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.75,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.8,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.85,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.9,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,0.95,log_loss,1.0101334442421657,test,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,mean,log_loss,0.9858032860627663,train,"{""n_variables"": 1}" +benchmark_loss,OLS,log_loss_mean_all,mean,log_loss,1.0101334442421654,test,"{""n_variables"": 1}" +benchmark_loss,QuantReg,quantile_loss_mean_all,mean,quantile_loss,,train,"{""n_variables"": 0}" +benchmark_loss,QuantReg,quantile_loss_mean_all,mean,quantile_loss,,test,"{""n_variables"": 0}" +benchmark_loss,QuantReg,log_loss_mean_all,mean,log_loss,,train,"{""n_variables"": 0}" +benchmark_loss,QuantReg,log_loss_mean_all,mean,log_loss,,test,"{""n_variables"": 0}" +benchmark_loss,Matching,quantile_loss_mean_all,0.05,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.1,quantile_loss,0.0,train,"{""n_variables"": 2}" 
+benchmark_loss,Matching,quantile_loss_mean_all,0.15,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.2,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.25,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.3,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.35,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.4,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.45,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.5,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.55,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.6,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.65,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.7,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.75,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.8,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.85,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.9,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.95,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.05,quantile_loss,0.022039382576829306,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.1,quantile_loss,0.022147598558993443,test,"{""n_variables"": 2}" 
+benchmark_loss,Matching,quantile_loss_mean_all,0.15,quantile_loss,0.022255814541157576,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.2,quantile_loss,0.022364030523321716,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.25,quantile_loss,0.022472246505485852,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.3,quantile_loss,0.02258046248764999,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.35,quantile_loss,0.022688678469814125,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.4,quantile_loss,0.02279689445197826,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.45,quantile_loss,0.0229051104341424,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.5,quantile_loss,0.02301332641630653,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.55,quantile_loss,0.02312154239847067,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.6,quantile_loss,0.023229758380634808,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.65,quantile_loss,0.023337974362798945,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.7,quantile_loss,0.023446190344963078,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.75,quantile_loss,0.023554406327127214,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.8,quantile_loss,0.02366262230929135,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.85,quantile_loss,0.023770838291455487,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.9,quantile_loss,0.023879054273619627,test,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,0.95,quantile_loss,0.02398727025578376,test,"{""n_variables"": 2}" 
+benchmark_loss,Matching,quantile_loss_mean_all,mean,quantile_loss,0.0,train,"{""n_variables"": 2}" +benchmark_loss,Matching,quantile_loss_mean_all,mean,quantile_loss,0.02301332641630653,test,"{""n_variables"": 2}" +benchmark_loss,Matching,log_loss_mean_all,0.05,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.1,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.15,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.2,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.25,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.3,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.35,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.4,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.45,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.5,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.55,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.6,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.65,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.7,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.75,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.8,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" 
+benchmark_loss,Matching,log_loss_mean_all,0.85,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.9,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.95,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.05,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.1,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.15,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.2,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.25,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.3,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.35,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.4,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.45,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.5,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.55,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.6,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.65,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.7,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.75,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.8,log_loss,19.713195542915205,test,"{""n_variables"": 1}" 
+benchmark_loss,Matching,log_loss_mean_all,0.85,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.9,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,0.95,log_loss,19.713195542915205,test,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,mean,log_loss,2.2204460492503136e-16,train,"{""n_variables"": 1}" +benchmark_loss,Matching,log_loss_mean_all,mean,log_loss,19.71319554291521,test,"{""n_variables"": 1}" +distribution_distance,OLSResults,s1,N/A,wasserstein_distance,0.024660387596042915,full,{} +distribution_distance,OLSResults,s4,N/A,wasserstein_distance,0.020422408337066628,full,{} +distribution_distance,OLSResults,risk_factor,N/A,kl_divergence,6.033154649748202,full,{} +predictor_correlation,N/A,age,N/A,pearson,0.22798247938962524,full,"{""predictor2"": ""sex""}" +predictor_correlation,N/A,age,N/A,pearson,0.2501624011317938,full,"{""predictor2"": ""bmi""}" +predictor_correlation,N/A,age,N/A,pearson,0.3534419190240634,full,"{""predictor2"": ""bp""}" +predictor_correlation,N/A,sex,N/A,pearson,0.08064137058331985,full,"{""predictor2"": ""bmi""}" +predictor_correlation,N/A,sex,N/A,pearson,0.26905206635937173,full,"{""predictor2"": ""bp""}" +predictor_correlation,N/A,bmi,N/A,pearson,0.43643800885198847,full,"{""predictor2"": ""bp""}" +predictor_correlation,N/A,age,N/A,spearman,0.2309511404045441,full,"{""predictor2"": ""sex""}" +predictor_correlation,N/A,age,N/A,spearman,0.2559475199483165,full,"{""predictor2"": ""bmi""}" +predictor_correlation,N/A,age,N/A,spearman,0.3697134718827012,full,"{""predictor2"": ""bp""}" +predictor_correlation,N/A,sex,N/A,spearman,0.10617808669020486,full,"{""predictor2"": ""bmi""}" +predictor_correlation,N/A,sex,N/A,spearman,0.3010250570740961,full,"{""predictor2"": ""bp""}" +predictor_correlation,N/A,bmi,N/A,spearman,0.4472525722966459,full,"{""predictor2"": ""bp""}" 
+predictor_correlation,N/A,age,N/A,mutual_info,0.0,full,"{""predictor2"": ""sex""}" +predictor_correlation,N/A,age,N/A,mutual_info,0.01992537029466096,full,"{""predictor2"": ""bmi""}" +predictor_correlation,N/A,age,N/A,mutual_info,0.02051274401878463,full,"{""predictor2"": ""bp""}" +predictor_correlation,N/A,sex,N/A,mutual_info,0.024974606868113543,full,"{""predictor2"": ""bmi""}" +predictor_correlation,N/A,sex,N/A,mutual_info,0.06825522582483731,full,"{""predictor2"": ""bp""}" +predictor_correlation,N/A,bmi,N/A,mutual_info,0.012362825726377452,full,"{""predictor2"": ""bp""}" +predictor_target_mi,N/A,age,N/A,mutual_info,0.007275692599840133,full,"{""target"": ""s1""}" +predictor_target_mi,N/A,age,N/A,mutual_info,0.017843189636206607,full,"{""target"": ""s4""}" +predictor_target_mi,N/A,age,N/A,mutual_info,0.0527351415960489,full,"{""target"": ""risk_factor""}" +predictor_target_mi,N/A,sex,N/A,mutual_info,0.002833409209270051,full,"{""target"": ""s1""}" +predictor_target_mi,N/A,sex,N/A,mutual_info,0.022502563145111076,full,"{""target"": ""s4""}" +predictor_target_mi,N/A,sex,N/A,mutual_info,0.03936347909918465,full,"{""target"": ""risk_factor""}" +predictor_target_mi,N/A,bmi,N/A,mutual_info,0.00712501381273246,full,"{""target"": ""s1""}" +predictor_target_mi,N/A,bmi,N/A,mutual_info,0.042828982564792506,full,"{""target"": ""s4""}" +predictor_target_mi,N/A,bmi,N/A,mutual_info,0.09273531468209292,full,"{""target"": ""risk_factor""}" +predictor_target_mi,N/A,bp,N/A,mutual_info,0.007630872443873875,full,"{""target"": ""s1""}" +predictor_target_mi,N/A,bp,N/A,mutual_info,0.009030290161605078,full,"{""target"": ""s4""}" +predictor_target_mi,N/A,bp,N/A,mutual_info,0.012933835727825435,full,"{""target"": ""risk_factor""}" +predictor_importance,OLSResults,sex,N/A,relative_impact,30.680328353256453,test,"{""removed_predictor"": ""sex""}" +predictor_importance,OLSResults,sex,N/A,loss_increase,0.7393423418942775,test,"{""removed_predictor"": ""sex""}" 
+predictor_importance,OLSResults,bmi,N/A,relative_impact,0.03247893420537184,test,"{""removed_predictor"": ""bmi""}" +predictor_importance,OLSResults,bmi,N/A,loss_increase,0.000782685602355393,test,"{""removed_predictor"": ""bmi""}" +predictor_importance,OLSResults,age,N/A,relative_impact,0.00454596377561416,test,"{""removed_predictor"": ""age""}" +predictor_importance,OLSResults,age,N/A,loss_increase,0.00010954978921118297,test,"{""removed_predictor"": ""age""}" +predictor_importance,OLSResults,bp,N/A,relative_impact,-0.004826970371974454,test,"{""removed_predictor"": ""bp""}" +predictor_importance,OLSResults,bp,N/A,loss_increase,-0.0001163215575132881,test,"{""removed_predictor"": ""bp""}" +progressive_inclusion,OLSResults,N/A,N/A,cumulative_improvement,0.0,test,"{""step"": 1, ""predictor_added"": ""sex"", ""predictors"": [""sex""]}" +progressive_inclusion,OLSResults,N/A,N/A,marginal_improvement,0.0,test,"{""step"": 1, ""predictor_added"": ""sex""}" +progressive_inclusion,OLSResults,N/A,N/A,cumulative_improvement,0.0010940165047195194,test,"{""step"": 2, ""predictor_added"": ""bmi"", ""predictors"": [""sex"", ""bmi""]}" +progressive_inclusion,OLSResults,N/A,N/A,marginal_improvement,0.0010940165047195194,test,"{""step"": 2, ""predictor_added"": ""bmi""}" +progressive_inclusion,OLSResults,N/A,N/A,cumulative_improvement,0.0012175858369123382,test,"{""step"": 3, ""predictor_added"": ""age"", ""predictors"": [""sex"", ""bmi"", ""age""]}" +progressive_inclusion,OLSResults,N/A,N/A,marginal_improvement,0.00012356933219281885,test,"{""step"": 3, ""predictor_added"": ""age""}" +progressive_inclusion,OLSResults,N/A,N/A,cumulative_improvement,0.0011012642793990501,test,"{""step"": 4, ""predictor_added"": ""bp"", ""predictors"": [""sex"", ""bmi"", ""age"", ""bp""]}" +progressive_inclusion,OLSResults,N/A,N/A,marginal_improvement,-0.0001163215575132881,test,"{""step"": 4, ""predictor_added"": ""bp""}" diff --git a/microimputation-dashboard/utils/deeplinks.ts 
b/microimputation-dashboard/utils/deeplinks.ts index 55b7af3..31d48bf 100644 --- a/microimputation-dashboard/utils/deeplinks.ts +++ b/microimputation-dashboard/utils/deeplinks.ts @@ -8,103 +8,36 @@ export interface GitHubArtifactInfo { } export interface DeeplinkParams { - mode?: 'single' | 'comparison'; primary?: GitHubArtifactInfo; - secondary?: GitHubArtifactInfo; } export function parseDeeplinkParams(searchParams: URLSearchParams): DeeplinkParams | null { - const mode = searchParams.get('mode') || 'single'; - - const primaryRepo = searchParams.get('repo'); - const primaryBranch = searchParams.get('branch'); - const primaryCommit = searchParams.get('commit'); - const primaryArtifact = searchParams.get('artifact'); - - if (!primaryRepo || !primaryBranch || !primaryCommit || !primaryArtifact) { - // Check for comparison mode parameters - const repo1 = searchParams.get('repo1'); - const branch1 = searchParams.get('branch1'); - const commit1 = searchParams.get('commit1'); - const artifact1 = searchParams.get('artifact1'); - - const repo2 = searchParams.get('repo2'); - const branch2 = searchParams.get('branch2'); - const commit2 = searchParams.get('commit2'); - const artifact2 = searchParams.get('artifact2'); - - if (repo1 && branch1 && commit1 && artifact1 && repo2 && branch2 && commit2 && artifact2) { - return { - mode: 'comparison', - primary: { - repo: repo1, - branch: branch1, - commit: commit1, - artifact: artifact1, - }, - secondary: { - repo: repo2, - branch: branch2, - commit: commit2, - artifact: artifact2, - }, - }; - } + const repo = searchParams.get('repo'); + const branch = searchParams.get('branch'); + const commit = searchParams.get('commit'); + const artifact = searchParams.get('artifact'); + if (!repo || !branch || !commit || !artifact) { return null; } - const params: DeeplinkParams = { - mode: mode as 'single' | 'comparison', + return { primary: { - repo: primaryRepo, - branch: primaryBranch, - commit: primaryCommit, - artifact: primaryArtifact, + 
repo, + branch, + commit, + artifact, }, }; - - // Check for secondary parameters for comparison mode - const secondaryRepo = searchParams.get('repo2') || primaryRepo; - const secondaryBranch = searchParams.get('branch2'); - const secondaryCommit = searchParams.get('commit2'); - const secondaryArtifact = searchParams.get('artifact2'); - - if (secondaryBranch && secondaryCommit && secondaryArtifact) { - params.mode = 'comparison'; - params.secondary = { - repo: secondaryRepo, - branch: secondaryBranch, - commit: secondaryCommit, - artifact: secondaryArtifact, - }; - } - - return params; } -export function createShareableUrl(baseUrl: string, artifactInfo: GitHubArtifactInfo, secondaryInfo?: GitHubArtifactInfo): string { +export function createShareableUrl(baseUrl: string, artifactInfo: GitHubArtifactInfo): string { const url = new URL(baseUrl); - if (secondaryInfo) { - // Comparison mode - url.searchParams.set('mode', 'comparison'); - url.searchParams.set('repo1', artifactInfo.repo); - url.searchParams.set('branch1', artifactInfo.branch); - url.searchParams.set('commit1', artifactInfo.commit); - url.searchParams.set('artifact1', artifactInfo.artifact); - url.searchParams.set('repo2', secondaryInfo.repo); - url.searchParams.set('branch2', secondaryInfo.branch); - url.searchParams.set('commit2', secondaryInfo.commit); - url.searchParams.set('artifact2', secondaryInfo.artifact); - } else { - // Single mode - url.searchParams.set('mode', 'single'); - url.searchParams.set('repo', artifactInfo.repo); - url.searchParams.set('branch', artifactInfo.branch); - url.searchParams.set('commit', artifactInfo.commit); - url.searchParams.set('artifact', artifactInfo.artifact); - } + url.searchParams.set('repo', artifactInfo.repo); + url.searchParams.set('branch', artifactInfo.branch); + url.searchParams.set('commit', artifactInfo.commit); + url.searchParams.set('artifact', artifactInfo.artifact); return url.toString(); } \ No newline at end of file From 
d3637644b98795091468da38a66b61e02506d97a Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 13:07:05 +0800 Subject: [PATCH 05/12] add share dashboard button for deeplinks --- microimputation-dashboard/app/page.tsx | 25 +--- .../components/FileUpload.tsx | 35 +++--- .../components/VisualizationDashboard.tsx | 109 ++++++++++++++---- microimputation-dashboard/utils/deeplinks.ts | 21 ++-- 4 files changed, 123 insertions(+), 67 deletions(-) diff --git a/microimputation-dashboard/app/page.tsx b/microimputation-dashboard/app/page.tsx index 8905f4e..a8bc1b6 100644 --- a/microimputation-dashboard/app/page.tsx +++ b/microimputation-dashboard/app/page.tsx @@ -65,30 +65,6 @@ function HomeContent() { return (
- {/* Header */} -
-
-
-
-

- Microimpute Dashboard -

- - Beta - -
- {showDashboard && ( - - )} -
-
-
- {/* Main content */}
{!showDashboard ? ( @@ -105,6 +81,7 @@ function HomeContent() { data={data} fileName={fileName} githubArtifactInfo={githubArtifactInfo} + onBackToUpload={handleBackToUpload} /> )}
diff --git a/microimputation-dashboard/components/FileUpload.tsx b/microimputation-dashboard/components/FileUpload.tsx index a9bf564..fad0ec7 100644 --- a/microimputation-dashboard/components/FileUpload.tsx +++ b/microimputation-dashboard/components/FileUpload.tsx @@ -700,12 +700,20 @@ export default function FileUpload({ return ( -
-
-

Load imputation data

-

Choose how you would like to load your CSV file

+
+ {/* Page Title */} +
+

Microimpute Dashboard

+

Microimputation quality and model benchmarking assessment

+ {/* Upload Card */} +
+
+

Load imputation data

+

Choose how you would like to load your CSV file

+
+ {error && (
)} - {/* Global loading indicator */} - {(isLoading || isLoadingGithubData) && ( -
-
-

- {isLoadingGithubData ? 'Loading GitHub data...' : 'Loading file...'} -

-
- )} + {/* Global loading indicator */} + {(isLoading || isLoadingGithubData) && ( +
+
+

+ {isLoadingGithubData ? 'Loading GitHub data...' : 'Loading file...'} +

+
+ )} +
); } \ No newline at end of file diff --git a/microimputation-dashboard/components/VisualizationDashboard.tsx b/microimputation-dashboard/components/VisualizationDashboard.tsx index 6e046dd..16ce893 100644 --- a/microimputation-dashboard/components/VisualizationDashboard.tsx +++ b/microimputation-dashboard/components/VisualizationDashboard.tsx @@ -2,23 +2,41 @@ import { useMemo, useState } from 'react'; import { ImputationDataPoint } from '@/types/imputation'; -import { GitHubArtifactInfo } from '@/utils/deeplinks'; +import { GitHubArtifactInfo, createShareableUrl } from '@/utils/deeplinks'; import BenchmarkLossCharts from './BenchmarkLossCharts'; import PerVariableCharts from './PerVariableCharts'; import VisualizationTabs from './VisualizationTabs'; +import { Share } from 'lucide-react'; interface VisualizationDashboardProps { data: ImputationDataPoint[]; fileName: string; githubArtifactInfo?: GitHubArtifactInfo | null; + onBackToUpload: () => void; } export default function VisualizationDashboard({ data, fileName, + githubArtifactInfo, + onBackToUpload, }: VisualizationDashboardProps) { const [activeTab, setActiveTab] = useState('overview'); + // Handle sharing the dashboard via deeplink + const handleShare = async () => { + if (!githubArtifactInfo) return; + + try { + const shareUrl = createShareableUrl(githubArtifactInfo); + await navigator.clipboard.writeText(shareUrl); + alert('Shareable URL copied to clipboard!'); + } catch (err) { + console.error('Failed to copy URL:', err); + alert('Failed to copy URL to clipboard'); + } + }; + // Analyze data structure and available visualizations const dataAnalysis = useMemo(() => { const types = new Set(data.map(d => d.type)); @@ -95,12 +113,32 @@ export default function VisualizationDashboard({ if (!dataAnalysis.hasBenchmarkLoss) { return (
-
-

Visualization Dashboard

-
-

- Successfully loaded: {fileName} ({data.length} records) -

+ {/* Header */} +
+
+
+

Microimpute Dashboard

+

+ Loaded: {fileName} +

+
+
+ {githubArtifactInfo && ( + + )} + +
@@ -118,24 +156,53 @@ export default function VisualizationDashboard({ return (
{/* Header */} +
+
+
+

Microimpute Dashboard

+

+ Loaded: {fileName} +

+
+
+ {githubArtifactInfo && ( + + )} + +
+
+
+ + {/* Data Info */}
-

Visualization Dashboard

-
-

- Successfully loaded: {fileName} -

-

- Records: {data.length} -

+

Dataset Overview

+
+
+

Total Records

+

{data.length}

+
{dataAnalysis.numericalVars.length > 0 && ( -

- Numerical variables: {dataAnalysis.numericalVars.length} -

+
+

Numerical Variables

+

{dataAnalysis.numericalVars.length}

+
)} {dataAnalysis.categoricalVars.length > 0 && ( -

- Categorical variables: {dataAnalysis.categoricalVars.length} -

+
+

Categorical Variables

+

{dataAnalysis.categoricalVars.length}

+
)}
diff --git a/microimputation-dashboard/utils/deeplinks.ts b/microimputation-dashboard/utils/deeplinks.ts index 31d48bf..5ce99b9 100644 --- a/microimputation-dashboard/utils/deeplinks.ts +++ b/microimputation-dashboard/utils/deeplinks.ts @@ -31,13 +31,16 @@ export function parseDeeplinkParams(searchParams: URLSearchParams): DeeplinkPara }; } -export function createShareableUrl(baseUrl: string, artifactInfo: GitHubArtifactInfo): string { - const url = new URL(baseUrl); - - url.searchParams.set('repo', artifactInfo.repo); - url.searchParams.set('branch', artifactInfo.branch); - url.searchParams.set('commit', artifactInfo.commit); - url.searchParams.set('artifact', artifactInfo.artifact); - - return url.toString(); +export function createShareableUrl(artifactInfo: GitHubArtifactInfo): string { + const baseUrl = typeof window !== 'undefined' + ? `${window.location.protocol}//${window.location.host}${window.location.pathname}` + : ''; + + const urlParams = new URLSearchParams(); + urlParams.set('repo', artifactInfo.repo); + urlParams.set('branch', artifactInfo.branch); + urlParams.set('commit', artifactInfo.commit); + urlParams.set('artifact', artifactInfo.artifact); + + return `${baseUrl}?${urlParams.toString()}`; } \ No newline at end of file From a7f756a1e1d733c7ec678bbb992f0a689117e4d1 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 14:57:37 +0800 Subject: [PATCH 06/12] add train/test split viz --- microimputation-dashboard/app/globals.css | 6 +- microimputation-dashboard/app/layout.tsx | 18 +- .../components/BenchmarkLossCharts.tsx | 573 +++++++++++++++--- 3 files changed, 511 insertions(+), 86 deletions(-) diff --git a/microimputation-dashboard/app/globals.css b/microimputation-dashboard/app/globals.css index a2dc41e..86b4953 100644 --- a/microimputation-dashboard/app/globals.css +++ b/microimputation-dashboard/app/globals.css @@ -8,8 +8,8 @@ @theme inline { --color-background: var(--background); --color-foreground: var(--foreground); - 
--font-sans: var(--font-geist-sans); - --font-mono: var(--font-geist-mono); + --font-sans: var(--font-roboto-serif); + --font-mono: var(--font-roboto-mono); } @media (prefers-color-scheme: dark) { @@ -22,5 +22,5 @@ body { background: var(--background); color: var(--foreground); - font-family: Arial, Helvetica, sans-serif; + font-family: var(--font-roboto-serif), ui-serif, Georgia, Cambria, "Times New Roman", Times, serif; } diff --git a/microimputation-dashboard/app/layout.tsx b/microimputation-dashboard/app/layout.tsx index f7fa87e..a1be77b 100644 --- a/microimputation-dashboard/app/layout.tsx +++ b/microimputation-dashboard/app/layout.tsx @@ -1,20 +1,22 @@ import type { Metadata } from "next"; -import { Geist, Geist_Mono } from "next/font/google"; +import { Roboto_Serif, Roboto_Mono } from "next/font/google"; import "./globals.css"; -const geistSans = Geist({ - variable: "--font-geist-sans", +const robotoSerif = Roboto_Serif({ + variable: "--font-roboto-serif", subsets: ["latin"], + weight: ["300", "400", "500", "600", "700"], }); -const geistMono = Geist_Mono({ - variable: "--font-geist-mono", +const robotoMono = Roboto_Mono({ + variable: "--font-roboto-mono", subsets: ["latin"], + weight: ["300", "400", "500", "600", "700"], }); export const metadata: Metadata = { - title: "Create Next App", - description: "Generated by create next app", + title: "Microimpute Dashboard", + description: "Microimputation quality and model benchmarking assessment", }; export default function RootLayout({ @@ -25,7 +27,7 @@ export default function RootLayout({ return ( {children} diff --git a/microimputation-dashboard/components/BenchmarkLossCharts.tsx b/microimputation-dashboard/components/BenchmarkLossCharts.tsx index 70a00c3..88b579d 100644 --- a/microimputation-dashboard/components/BenchmarkLossCharts.tsx +++ b/microimputation-dashboard/components/BenchmarkLossCharts.tsx @@ -1,6 +1,6 @@ 'use client'; -import { useMemo } from 'react'; +import { useMemo, useState } from 'react'; 
import { BarChart, Bar, @@ -25,6 +25,9 @@ export default function BenchmarkLossCharts({ data }: BenchmarkLossChartsProps) return data.filter(d => d.type === 'benchmark_loss'); }, [data]); + // State for selected method in train/test comparison + const [selectedMethod, setSelectedMethod] = useState(''); + // Check if we have benchmark loss data const hasBenchmarkData = benchmarkData.length > 0; @@ -99,90 +102,510 @@ export default function BenchmarkLossCharts({ data }: BenchmarkLossChartsProps) })); }, [logLossData]); + // Determine best performing model + const bestModel = useMemo(() => { + if (methods.length === 0) return null; + + // Calculate average quantile loss per method (test only) + const quantileLossAvg = new Map(); + // Count unique variables per method for quantile loss + const quantileVarCounts = new Map>(); + + if (quantileLossData.length > 0) { + const methodSums = new Map(); + quantileLossData.forEach(d => { + if (d.metric_value !== null) { + if (!methodSums.has(d.method)) { + methodSums.set(d.method, { sum: 0, count: 0 }); + } + const entry = methodSums.get(d.method)!; + entry.sum += d.metric_value; + entry.count += 1; + + // Track unique variables + if (!quantileVarCounts.has(d.method)) { + quantileVarCounts.set(d.method, new Set()); + } + quantileVarCounts.get(d.method)!.add(d.variable); + } + }); + methodSums.forEach((value, method) => { + quantileLossAvg.set(method, value.sum / value.count); + }); + } + + // Calculate average log loss per method (test only, already have this in logLossChartData) + const logLossAvg = new Map(); + // Count unique variables per method for log loss + const logLossVarCounts = new Map>(); + + logLossData.forEach(d => { + if (d.metric_value !== null) { + if (!logLossVarCounts.has(d.method)) { + logLossVarCounts.set(d.method, new Set()); + } + logLossVarCounts.get(d.method)!.add(d.variable); + } + }); + + logLossChartData.forEach(({ method, value }) => { + logLossAvg.set(method, value); + }); + + // Rank methods by 
each metric (lower is better, so rank 1 is best) + const rankMethods = (avgMap: Map): Map => { + const sorted = Array.from(avgMap.entries()).sort((a, b) => a[1] - b[1]); + const ranks = new Map(); + sorted.forEach(([method], index) => { + ranks.set(method, index + 1); + }); + return ranks; + }; + + const quantileRanks = rankMethods(quantileLossAvg); + const logLossRanks = rankMethods(logLossAvg); + + // Calculate weighted combined rank (weighted by number of variables of each type) + // This matches autoimpute's select_best_model_dual_metrics approach + const combinedRanks = new Map(); + methods.forEach(method => { + const qRank = quantileRanks.get(method); + const lRank = logLossRanks.get(method); + const nQuantileVars = quantileVarCounts.get(method)?.size || 0; + const nLogLossVars = logLossVarCounts.get(method)?.size || 0; + const totalVars = nQuantileVars + nLogLossVars; + + if (totalVars > 0) { + let weightedRank = 0; + if (qRank !== undefined) { + weightedRank += nQuantileVars * qRank; + } + if (lRank !== undefined) { + weightedRank += nLogLossVars * lRank; + } + combinedRanks.set(method, weightedRank / totalVars); + } else { + combinedRanks.set(method, Infinity); + } + }); + + // Find best method (lowest combined rank) + let bestMethod = ''; + let bestRank = Infinity; + combinedRanks.forEach((rank, method) => { + if (rank < bestRank) { + bestRank = rank; + bestMethod = method; + } + }); + + // Calculate train/test ratios for the best method + let quantileTrainTestRatio: number | undefined; + let logLossTrainTestRatio: number | undefined; + + // Quantile loss train/test ratio + const bestQuantileTrain = benchmarkData.filter( + d => d.method === bestMethod && d.metric_name === 'quantile_loss' && d.split === 'train' && d.metric_value !== null + ); + const bestQuantileTest = benchmarkData.filter( + d => d.method === bestMethod && d.metric_name === 'quantile_loss' && d.split === 'test' && d.metric_value !== null + ); + + if (bestQuantileTrain.length > 0 && 
bestQuantileTest.length > 0) { + const trainAvg = bestQuantileTrain.reduce((sum, d) => sum + d.metric_value!, 0) / bestQuantileTrain.length; + const testAvg = bestQuantileTest.reduce((sum, d) => sum + d.metric_value!, 0) / bestQuantileTest.length; + quantileTrainTestRatio = testAvg / trainAvg; + } + + // Log loss train/test ratio + const bestLogLossTrain = benchmarkData.filter( + d => d.method === bestMethod && d.metric_name === 'log_loss' && d.split === 'train' && d.metric_value !== null + ); + const bestLogLossTest = benchmarkData.filter( + d => d.method === bestMethod && d.metric_name === 'log_loss' && d.split === 'test' && d.metric_value !== null + ); + + if (bestLogLossTrain.length > 0 && bestLogLossTest.length > 0) { + const trainAvg = bestLogLossTrain.reduce((sum, d) => sum + d.metric_value!, 0) / bestLogLossTrain.length; + const testAvg = bestLogLossTest.reduce((sum, d) => sum + d.metric_value!, 0) / bestLogLossTest.length; + logLossTrainTestRatio = testAvg / trainAvg; + } + + return { + method: bestMethod, + quantileLoss: quantileLossAvg.get(bestMethod), + logLoss: logLossAvg.get(bestMethod), + quantileTrainTestRatio, + logLossTrainTestRatio, + }; + }, [methods, quantileLossData, logLossChartData, benchmarkData]); + + // Set default selected method to best model + useMemo(() => { + if (bestModel && bestModel.method && !selectedMethod) { + setSelectedMethod(bestModel.method); + } + }, [bestModel, selectedMethod]); + + // Prepare train/test comparison data for selected method + const trainTestData = useMemo(() => { + if (!selectedMethod) return { quantile: [], logLoss: [] }; + + // Quantile loss train vs test + const quantileTrainTest: Array<{ quantile: string; train: number | null; test: number | null }> = []; + const quantileData = benchmarkData.filter( + d => d.method === selectedMethod && d.metric_name === 'quantile_loss' + ); + + if (quantileData.length > 0) { + const quantileMap = new Map(); + + quantileData.forEach(d => { + const q = typeof d.quantile 
=== 'number' ? d.quantile.toFixed(2) : String(d.quantile || ''); + // Skip 'mean' quantiles + if (q.toLowerCase().includes('mean')) return; + + if (!quantileMap.has(q)) { + quantileMap.set(q, { train: null, test: null }); + } + const entry = quantileMap.get(q)!; + if (d.split === 'train') entry.train = d.metric_value; + if (d.split === 'test') entry.test = d.metric_value; + }); + + quantileMap.forEach((value, quantile) => { + quantileTrainTest.push({ quantile, ...value }); + }); + + quantileTrainTest.sort((a, b) => parseFloat(a.quantile) - parseFloat(b.quantile)); + } + + // Log loss train vs test (average across variables) + const logLossTrainTest: Array<{ category: string; train: number; test: number }> = []; + const logData = benchmarkData.filter( + d => d.method === selectedMethod && d.metric_name === 'log_loss' && d.metric_value !== null + ); + + if (logData.length > 0) { + const trainVals: number[] = []; + const testVals: number[] = []; + + logData.forEach(d => { + if (d.split === 'train') trainVals.push(d.metric_value!); + if (d.split === 'test') testVals.push(d.metric_value!); + }); + + if (trainVals.length > 0 || testVals.length > 0) { + const trainAvg = trainVals.length > 0 ? trainVals.reduce((a, b) => a + b, 0) / trainVals.length : 0; + const testAvg = testVals.length > 0 ? 
testVals.reduce((a, b) => a + b, 0) / testVals.length : 0; + + logLossTrainTest.push({ + category: 'Average', + train: trainAvg, + test: testAvg, + }); + } + } + + return { + quantile: quantileTrainTest, + logLoss: logLossTrainTest, + }; + }, [selectedMethod, benchmarkData]); + + const hasQuantileTrainTest = trainTestData.quantile.length > 0; + const hasLogLossTrainTest = trainTestData.logLoss.length > 0; + + // Filter methods that have train/test data + const methodsWithData = useMemo(() => { + const validMethods = new Set(); + + methods.forEach(method => { + const methodQuantileData = benchmarkData.filter( + d => d.method === method && d.metric_name === 'quantile_loss' && d.metric_value !== null + ); + const methodLogLossData = benchmarkData.filter( + d => d.method === method && d.metric_name === 'log_loss' && d.metric_value !== null + ); + + if (methodQuantileData.length > 0 || methodLogLossData.length > 0) { + validMethods.add(method); + } + }); + + return Array.from(validMethods); + }, [methods, benchmarkData]); + + const methodsWithoutData = methods.filter(m => !methodsWithData.includes(m)); + if (!hasBenchmarkData) { return null; } return ( -
- {/* Quantile Loss Comparison */} - {quantileChartData.length > 0 && ( -
-

- Test Quantile Loss Across Quantiles for Different Imputation Methods -

- - - - - - value.toFixed(6)} - /> - - {methods.map((method, index) => ( - - ))} - - +
+

+ Benchmarking imputation methods +

+ + {/* Best Model Highlight */} + {bestModel && bestModel.method && ( +
+
+
+ + + +
+
+

+ Best performing model: {bestModel.method} +

+

Based on combined performance across all metrics

+
+
+
+ {bestModel.quantileLoss !== undefined && ( +
+
+ Avg. quantile loss (test): + {bestModel.quantileLoss.toFixed(6)} +
+ {bestModel.quantileTrainTestRatio !== undefined && ( + 1.1 ? 'text-amber-600' : 'text-gray-700'}`}> + Train/test ratio: {bestModel.quantileTrainTestRatio.toFixed(3)} + + )} +
+ )} + {bestModel.logLoss !== undefined && ( +
+
+ Avg. log loss (test): + {bestModel.logLoss.toFixed(6)} +
+ {bestModel.logLossTrainTestRatio !== undefined && ( + 1.1 ? 'text-amber-600' : 'text-gray-700'}`}> + Train/test ratio: {bestModel.logLossTrainTestRatio.toFixed(3)} + + )} +
+ )} +
)} - {/* Log Loss Comparison */} - {logLossChartData.length > 0 && ( -
-

- Log Loss Comparison Across Methods -

- - - - - - [value.toFixed(6), 'Log Loss']} - /> - - {logLossChartData.map((entry, index) => ( - - ))} - - - + {/* Note about methods without data */} + {methodsWithoutData.length > 0 && ( +
+

+ Note: {methodsWithoutData.length === 1 ? 'The following method does' : 'The following methods do'} not appear in visualizations because {methodsWithoutData.length === 1 ? 'it does' : 'they do'} not support imputation of the selected variables due to variable types: {methodsWithoutData.join(', ')} +

)} + +
+ {/* Quantile Loss Comparison */} + {quantileChartData.length > 0 && ( +
+

+ Test quantile loss across quantiles for different imputation methods +

+ + + + + + value.toFixed(6)} + /> + + {methods.map((method, index) => ( + + ))} + + +
+

+ Quantile loss measures how well the imputation method predicts different quantiles of the distribution for numerical variables, creating an asymmetric loss function that penalizes under-prediction more heavily for higher quantiles and over-prediction more heavily for lower quantiles. +
+ Lower values indicate better performance. +

+
+
+ )} + + {/* Log Loss Comparison */} + {logLossChartData.length > 0 && ( +
+

+ Test log loss across different imputation methods +

+ + + + + + [value.toFixed(6), 'Log loss']} + /> + + {logLossChartData.map((entry, index) => ( + + ))} + + + +
+

+ Log loss measures how well the imputation method predicts categorical and boolean variables by evaluating the accuracy of predicted probabilities. It heavily penalizes confident misclassifications, such that a perfect classifier would have a log loss of 0, while worse predictions yield increasingly higher values. +

+
+
+ )} + + {/* Train/Test Overfitting Assessment */} + {(hasQuantileTrainTest || hasLogLossTrainTest) && methods.length > 0 && ( +
+
+

+ Train vs test performance +

+

+ Compare training and test set performance to assess potential overfitting or underfitting. +

+ + {/* Method Selector */} +
+ + +
+
+ +
+ {/* Quantile Loss Train/Test */} + {hasQuantileTrainTest && ( +
+

Quantile loss: train vs test

+ + + + + + value.toFixed(6)} + /> + + + + + +
+ )} + + {/* Log Loss Train/Test */} + {hasLogLossTrainTest && ( +
+

Log loss: train vs test

+ + + + + + value.toFixed(6)} + /> + + + + + +
+ )} +
+ +
+

+ Overfitting assessment: When test performance (green bars) is significantly worse than train performance (cyan bars), it suggests the model may be overfitting to the training data and not generalizing well to unseen data. If both train and test performances are poor, the model may be underfitting and failing to capture underlying patterns. +
+ Healthy performance is indicated by similar train and test metrics, with both being reasonably low. +

+
+
+ )} +
); } From ba77ba69fd64a0f597f0047f015a3aefda18fd51 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 21:26:04 +0800 Subject: [PATCH 07/12] adding predictor correlation to dashboard --- .../components/PredictorCorrelationMatrix.tsx | 466 ++++++++++++++++++ .../components/VisualizationDashboard.tsx | 15 +- 2 files changed, 480 insertions(+), 1 deletion(-) create mode 100644 microimputation-dashboard/components/PredictorCorrelationMatrix.tsx diff --git a/microimputation-dashboard/components/PredictorCorrelationMatrix.tsx b/microimputation-dashboard/components/PredictorCorrelationMatrix.tsx new file mode 100644 index 0000000..331a5cc --- /dev/null +++ b/microimputation-dashboard/components/PredictorCorrelationMatrix.tsx @@ -0,0 +1,466 @@ +'use client'; + +import { useMemo, useState } from 'react'; +import { ImputationDataPoint } from '@/types/imputation'; + +interface PredictorCorrelationMatrixProps { + data: ImputationDataPoint[]; +} + +interface CorrelationData { + predictor1: string; + predictor2: string; + value: number; +} + +export default function PredictorCorrelationMatrix({ data }: PredictorCorrelationMatrixProps) { + // Filter for predictor_correlation data + const correlationData = useMemo(() => { + return data.filter(d => d.type === 'predictor_correlation'); + }, [data]); + + // Filter for predictor-target mutual information data + const predictorTargetMIData = useMemo(() => { + return data.filter(d => d.type === 'predictor_target_mi'); + }, [data]); + + // Check available correlation metrics + const availableMetrics = useMemo(() => { + const metrics = new Set(correlationData.map(d => d.metric_name)); + return Array.from(metrics); + }, [correlationData]); + + // State for selected correlation metric + const [selectedMetric, setSelectedMetric] = useState(''); + + // Set default metric to pearson if available, otherwise first available + useMemo(() => { + if (!selectedMetric && availableMetrics.length > 0) { + 
setSelectedMetric(availableMetrics.includes('pearson') ? 'pearson' : availableMetrics[0]); + } + }, [availableMetrics, selectedMetric]); + + // Build correlation matrix data + const { predictors, matrixData } = useMemo(() => { + if (!selectedMetric) return { predictors: [], matrixData: new Map>() }; + + // Filter data for selected metric + const metricData = correlationData.filter(d => d.metric_name === selectedMetric); + + // Extract all unique predictors + const predSet = new Set(); + const correlations: CorrelationData[] = []; + + metricData.forEach(d => { + const pred1 = d.variable; + let pred2: string | undefined; + + try { + const additionalInfo = typeof d.additional_info === 'string' + ? JSON.parse(d.additional_info) + : d.additional_info; + pred2 = additionalInfo?.predictor2; + } catch (e) { + console.error('Failed to parse additional_info:', e); + } + + if (pred1 && pred2) { + predSet.add(pred1); + predSet.add(pred2); + correlations.push({ + predictor1: pred1, + predictor2: pred2, + value: d.metric_value ?? 
0, + }); + } + }); + + const predictorList = Array.from(predSet).sort(); + + // Build symmetric matrix + const matrix = new Map>(); + + predictorList.forEach(p => { + matrix.set(p, new Map()); + }); + + // Add diagonal (1.0 for self-correlation) + predictorList.forEach(p => { + matrix.get(p)!.set(p, 1.0); + }); + + // Add correlations (symmetric) + correlations.forEach(({ predictor1, predictor2, value }) => { + matrix.get(predictor1)!.set(predictor2, value); + matrix.get(predictor2)!.set(predictor1, value); + }); + + return { predictors: predictorList, matrixData: matrix }; + }, [correlationData, selectedMetric]); + + // Build predictor-target mutual information matrix + const { predictorsList, targetsList, miMatrixData } = useMemo(() => { + if (predictorTargetMIData.length === 0) { + return { predictorsList: [], targetsList: [], miMatrixData: new Map>() }; + } + + const predSet = new Set(); + const targSet = new Set(); + const miValues: Array<{ predictor: string; target: string; value: number }> = []; + + predictorTargetMIData.forEach(d => { + const predictor = d.variable; + let target: string | undefined; + + try { + const additionalInfo = typeof d.additional_info === 'string' + ? 
JSON.parse(d.additional_info) + : d.additional_info; + target = additionalInfo?.target; + } catch (e) { + console.error('Failed to parse additional_info:', e); + } + + if (predictor && target && d.metric_value !== null) { + predSet.add(predictor); + targSet.add(target); + miValues.push({ + predictor, + target, + value: d.metric_value, + }); + } + }); + + const predList = Array.from(predSet).sort(); + const targList = Array.from(targSet).sort(); + + // Build matrix + const matrix = new Map>(); + predList.forEach(p => { + matrix.set(p, new Map()); + }); + + miValues.forEach(({ predictor, target, value }) => { + matrix.get(predictor)!.set(target, value); + }); + + return { predictorsList: predList, targetsList: targList, miMatrixData: matrix }; + }, [predictorTargetMIData]); + + const hasPredictorTargetMI = predictorsList.length > 0 && targetsList.length > 0; + + if (correlationData.length === 0 || predictors.length === 0) { + return null; + } + + // Helper function to get color based on correlation value + const getColor = (value: number): string => { + // Scale from -1 to 1 + // Negative: red shades, Positive: blue shades, Zero: white + if (value === 1.0) return '#1e40af'; // Dark blue for diagonal + if (value >= 0.7) return '#3b82f6'; // Blue + if (value >= 0.4) return '#60a5fa'; // Light blue + if (value >= 0.2) return '#93c5fd'; // Very light blue + if (value >= -0.2) return '#f3f4f6'; // Nearly white + if (value >= -0.4) return '#fca5a5'; // Light red + if (value >= -0.7) return '#f87171'; // Red + return '#ef4444'; // Dark red + }; + + // Helper function to get color based on mutual information value (0 to ~1) + const getMIColor = (value: number): string => { + // Scale from 0 (white) to high values (dark purple) + if (value >= 0.15) return '#581c87'; // Dark purple + if (value >= 0.10) return '#7c3aed'; // Purple + if (value >= 0.07) return '#a78bfa'; // Light purple + if (value >= 0.04) return '#c4b5fd'; // Very light purple + if (value >= 0.02) return 
'#ddd6fe'; // Almost white purple + return '#f3f4f6'; // Nearly white + }; + + const cellSize = 80; // Size of each cell in pixels + + return ( +
+
+

+ Predictor correlation analysis +

+

+ Correlation matrix showing relationships between predictor variables +

+ + {/* Metric Selector */} + {availableMetrics.length > 1 && ( +
+ + +
+ )} +
+ + {/* Correlation Matrix */} +
+
+
+ {/* Top-left empty cell */} +
+ + {/* Column headers */} + {predictors.map((pred, idx) => ( +
+
+ {pred} +
+
+ ))} + + {/* Rows */} + {predictors.map((pred1, rowIdx) => ( + <> + {/* Row header */} +
+ {pred1} +
+ + {/* Correlation cells */} + {predictors.map((pred2, colIdx) => { + const value = matrixData.get(pred1)?.get(pred2) ?? 0; + // Use purple scale for mutual_info, blue/red scale for correlations + const bgColor = selectedMetric === 'mutual_info' ? getMIColor(value) : getColor(value); + const textColor = selectedMetric === 'mutual_info' + ? (value > 0.07 ? '#ffffff' : '#000000') + : (Math.abs(value) > 0.5 ? '#ffffff' : '#000000'); + + return ( +
+ {selectedMetric === 'mutual_info' ? value.toFixed(3) : value.toFixed(2)} +
+ ); + })} + + ))} +
+
+
+ + {/* Legend - only for correlation metrics (not mutual_info) */} + {selectedMetric !== 'mutual_info' && ( +
+

+ Interpretation: Correlation values range from -1 to 1. Positive values (blue) indicate variables that increase together, negative values (red) indicate variables that move in opposite directions, and values near 0 (white) indicate little to no linear relationship. +

+
+ Color scale: +
+
+
+
+
+
+
+
+
+ + ◄ Negative + | + Positive ► + +
+
+

+ Pearson vs Spearman: Pearson correlation measures linear relationships between variables and is sensitive to outliers. Spearman correlation measures monotonic relationships (whether variables consistently increase or decrease together) by ranking the data first, making it more robust to outliers and non-linear but monotonic relationships. Use Pearson for linear relationships and Spearman when the relationship may be non-linear or when data contains outliers. +

+
+
+ )} + + {/* Predictor-Target Mutual Information Section */} +
+

+ Predictor-imputed variable mutual information +

+ + {hasPredictorTargetMI ? ( + <> +

+ Mutual information between predictor variables and imputed target variables +

+ + {/* MI Matrix */} +
+
+
+ {/* Top-left empty cell */} +
+ + {/* Column headers (targets) */} + {targetsList.map((target, idx) => ( +
+
+ {target} +
+
+ ))} + + {/* Rows */} + {predictorsList.map((predictor, rowIdx) => ( + <> + {/* Row header */} +
+ {predictor} +
+ + {/* MI cells */} + {targetsList.map((target, colIdx) => { + const value = miMatrixData.get(predictor)?.get(target) ?? 0; + const bgColor = getMIColor(value); + const textColor = value > 0.07 ? '#ffffff' : '#000000'; + + return ( +
+ {value.toFixed(3)} +
+ ); + })} + + ))} +
+
+
+ + ) : null} + + {/* Explanation box - always shown */} +
+

+ What is mutual information? Mutual information measures how much information one variable provides about another. Unlike correlation, it captures both linear and non-linear relationships between variables. Values range from 0 (independent variables) to higher positive values (strong dependency). +

+

+ Why measure it for imputed variables? Mutual information between predictors and imputed variables reveals which predictors are most informative for imputation. High mutual information indicates that a predictor strongly influences the imputed variable's distribution, making it crucial for accurate imputation. This helps validate that your imputation models are using the most relevant predictors and can identify when key predictive relationships exist in your data. +

+ + {/* Color scale within explanation box */} +
+
+ Color scale: +
+
+
+
+
+
+
+
+ + Weak + + Strong ► + +
+
+
+ + {/* Message when no predictor-target data is available */} + {!hasPredictorTargetMI && ( +
+

+ Note: No predictor-imputed variable mutual information data was found in this CSV file. It is recommended to include this data in your analysis to understand which predictors are most informative for imputing each variable. This helps validate that your imputation models are leveraging the most relevant predictive relationships in your data. +

+
+ )} +
+
+ ); +} diff --git a/microimputation-dashboard/components/VisualizationDashboard.tsx b/microimputation-dashboard/components/VisualizationDashboard.tsx index 16ce893..d98be55 100644 --- a/microimputation-dashboard/components/VisualizationDashboard.tsx +++ b/microimputation-dashboard/components/VisualizationDashboard.tsx @@ -6,6 +6,7 @@ import { GitHubArtifactInfo, createShareableUrl } from '@/utils/deeplinks'; import BenchmarkLossCharts from './BenchmarkLossCharts'; import PerVariableCharts from './PerVariableCharts'; import VisualizationTabs from './VisualizationTabs'; +import PredictorCorrelationMatrix from './PredictorCorrelationMatrix'; import { Share } from 'lucide-react'; interface VisualizationDashboardProps { @@ -88,7 +89,7 @@ export default function VisualizationDashboard({ const tabsList = []; if (dataAnalysis.hasBenchmarkLoss) { - tabsList.push({ id: 'overview', label: 'Overview' }); + tabsList.push({ id: 'overview', label: 'Model benchmarking' }); } if (dataAnalysis.numericalVars.length > 0) { @@ -107,6 +108,13 @@ export default function VisualizationDashboard({ }); } + if (dataAnalysis.hasPredictorCorrelation) { + tabsList.push({ + id: 'correlation', + label: 'Predictor correlation', + }); + } + return tabsList; }, [dataAnalysis]); @@ -254,6 +262,11 @@ export default function VisualizationDashboard({ ))}
)} + + {/* Predictor Correlation Tab */} + {activeTab === 'correlation' && ( + + )}
); From 961ab5a335c1747281cc5ec654a8e5140a53183b Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 21:50:29 +0800 Subject: [PATCH 08/12] adding predictor selection to dashboard --- .../PredictorOrderingRobustness.tsx | 387 ++++++++++++++++++ .../components/VisualizationDashboard.tsx | 14 + 2 files changed, 401 insertions(+) create mode 100644 microimputation-dashboard/components/PredictorOrderingRobustness.tsx diff --git a/microimputation-dashboard/components/PredictorOrderingRobustness.tsx b/microimputation-dashboard/components/PredictorOrderingRobustness.tsx new file mode 100644 index 0000000..e784a24 --- /dev/null +++ b/microimputation-dashboard/components/PredictorOrderingRobustness.tsx @@ -0,0 +1,387 @@ +'use client'; + +import { useMemo } from 'react'; +import { ImputationDataPoint } from '@/types/imputation'; +import { BarChart, Bar, XAxis, YAxis, CartesianGrid, Tooltip, Legend, ResponsiveContainer, Cell } from 'recharts'; + +interface PredictorOrderingRobustnessProps { + data: ImputationDataPoint[]; +} + +interface ProgressiveStep { + step: number; + predictorAdded: string; + predictors: string[]; + cumulativeImprovement: number; + marginalImprovement: number; +} + +interface PredictorImportance { + predictor: string; + relativeImpact: number; + lossIncrease: number; +} + +export default function PredictorOrderingRobustness({ data }: PredictorOrderingRobustnessProps) { + // Filter for progressive inclusion data + const progressiveInclusionData = useMemo(() => { + return data.filter(d => d.type === 'progressive_inclusion'); + }, [data]); + + // Filter for predictor importance data + const predictorImportanceData = useMemo(() => { + return data.filter(d => d.type === 'predictor_importance'); + }, [data]); + + // Parse progressive inclusion steps + const progressiveSteps = useMemo(() => { + const stepData: ProgressiveStep[] = []; + const cumulativeData = progressiveInclusionData.filter( + d => d.metric_name === 'cumulative_improvement' + ); + + 
cumulativeData.forEach(d => { + try { + const additionalInfo = typeof d.additional_info === 'string' + ? JSON.parse(d.additional_info) + : d.additional_info; + + const step = additionalInfo?.step; + const predictorAdded = additionalInfo?.predictor_added; + const predictors = additionalInfo?.predictors || []; + + if (step !== undefined && predictorAdded) { + // Find corresponding marginal improvement + const marginalData = progressiveInclusionData.find( + m => m.metric_name === 'marginal_improvement' && + JSON.parse(typeof m.additional_info === 'string' ? m.additional_info : JSON.stringify(m.additional_info))?.step === step + ); + + stepData.push({ + step, + predictorAdded, + predictors, + cumulativeImprovement: d.metric_value ?? 0, + marginalImprovement: marginalData?.metric_value ?? 0, + }); + } + } catch (e) { + console.error('Failed to parse progressive inclusion data:', e); + } + }); + + return stepData.sort((a, b) => a.step - b.step); + }, [progressiveInclusionData]); + + // Parse predictor importance + const importanceData = useMemo(() => { + const importanceMap = new Map(); + + predictorImportanceData.forEach(d => { + try { + const additionalInfo = typeof d.additional_info === 'string' + ? JSON.parse(d.additional_info) + : d.additional_info; + + const predictor = additionalInfo?.removed_predictor || d.variable; + + if (predictor) { + if (!importanceMap.has(predictor)) { + importanceMap.set(predictor, { + predictor, + relativeImpact: 0, + lossIncrease: 0, + }); + } + + const entry = importanceMap.get(predictor)!; + if (d.metric_name === 'relative_impact') { + entry.relativeImpact = d.metric_value ?? 0; + } else if (d.metric_name === 'loss_increase') { + entry.lossIncrease = d.metric_value ?? 
0; + } + } + } catch (e) { + console.error('Failed to parse predictor importance data:', e); + } + }); + + return Array.from(importanceMap.values()).sort( + (a, b) => Math.abs(b.relativeImpact) - Math.abs(a.relativeImpact) + ); + }, [predictorImportanceData]); + + const hasProgressiveData = progressiveSteps.length > 0; + const hasImportanceData = importanceData.length > 0; + + if (!hasProgressiveData && !hasImportanceData) { + return null; + } + + // Find best combination (highest cumulative improvement) + const bestCombination = progressiveSteps.reduce((best, current) => + current.cumulativeImprovement > best.cumulativeImprovement ? current : best, + progressiveSteps[0] + ); + + return ( +
+
+

+ Predictor selection and robustness +

+

+ Analysis of predictor combinations and their impact on model performance +

+
+ + {/* Progressive Inclusion Section */} + {hasProgressiveData && ( +
+

+ Predictor addition order +

+ + {/* Explanation */} +
+

+ How this works: This analysis adds predictors one at a time, + choosing the predictor that improves performance the most at each step. This + step-by-step approach is efficient but doesn't test + every possible combination of predictors. +

+

+ Reading the chart: The bars show cumulative improvement from + baseline as predictors are added. Larger improvements indicate more valuable + predictor combinations. +

+
+ + {/* Best Combination Highlight */} + {bestCombination && ( +
+

+ Best predictor combination +

+
+
+

+ Predictors:{' '} + + {bestCombination.predictors.join(' → ')} + +

+

+ Cumulative improvement:{' '} + + {(bestCombination.cumulativeImprovement * 100).toFixed(3)}% + +

+
+
+
+ )} + + {/* Step-by-step visualization */} +
+ {progressiveSteps.map((step) => { + const isPositive = step.marginalImprovement >= 0; + const isBest = step.step === bestCombination?.step; + + return ( +
+
+
+
+ {step.step} +
+
+ +
+
+ Add: + + {step.predictorAdded} + +
+ +
+
+ Marginal improvement: +
+
+
+
+ + {isPositive ? '+' : ''}{(step.marginalImprovement * 100).toFixed(3)}% + +
+
+ +
+ Cumulative improvement: +
+
+
+
+ + {(step.cumulativeImprovement * 100).toFixed(3)}% + +
+
+
+ +
+ Current predictors: {step.predictors.join(' → ')} +
+
+
+
+ ); + })} +
+
+ )} + + {/* Predictor Importance Section */} + {hasImportanceData && ( +
+

+ Predictor robustness check +

+ + {/* Explanation */} +
+

+ What this shows: This analysis measures how much performance + degrades when each predictor is removed. Predictors that cause large performance + drops when removed are critical to the model's accuracy. +

+

+ Reading the chart: Positive values (bars pointing right) indicate + performance worsens when the predictor is removed, meaning the predictor is helpful. + Negative values suggest removing the predictor might actually improve performance. +

+
+ + {/* Bar chart */} +
+ + + + `${val.toFixed(1)}%`} tick={{ fill: '#000000' }} /> + + { + if (name === 'relativeImpact') { + return [`${value.toFixed(3)}%`, 'Relative Impact']; + } + return [value.toFixed(6), 'Loss Increase']; + }} + /> + + + {importanceData.map((entry, index) => ( + = 0 ? '#ef4444' : '#22c55e'} + /> + ))} + + + +
+ + {/* Detailed table */} +
+ + + + + + + + + + + {importanceData.map((item) => { + const isHelpful = item.relativeImpact > 1; + const isCritical = item.relativeImpact > 10; + const isHarmful = item.relativeImpact < -1; + + let assessment = 'Minimal impact'; + let assessmentColor = 'text-gray-600'; + + if (isCritical) { + assessment = 'Critical predictor'; + assessmentColor = 'text-red-700 font-semibold'; + } else if (isHelpful) { + assessment = 'Helpful predictor'; + assessmentColor = 'text-orange-600'; + } else if (isHarmful) { + assessment = 'Consider removing'; + assessmentColor = 'text-green-600'; + } + + return ( + + + + + + + ); + })} + +
+ Predictor + + Impact when removed + + Loss increase + + Assessment +
+ {item.predictor} + + = 0 ? 'text-red-600' : 'text-green-600'}> + {item.relativeImpact >= 0 ? '+' : ''}{item.relativeImpact.toFixed(3)}% + + + {item.lossIncrease >= 0 ? '+' : ''}{item.lossIncrease.toFixed(6)} + + {assessment} +
+
+
+ )} +
+ ); +} diff --git a/microimputation-dashboard/components/VisualizationDashboard.tsx b/microimputation-dashboard/components/VisualizationDashboard.tsx index d98be55..23ba060 100644 --- a/microimputation-dashboard/components/VisualizationDashboard.tsx +++ b/microimputation-dashboard/components/VisualizationDashboard.tsx @@ -7,6 +7,7 @@ import BenchmarkLossCharts from './BenchmarkLossCharts'; import PerVariableCharts from './PerVariableCharts'; import VisualizationTabs from './VisualizationTabs'; import PredictorCorrelationMatrix from './PredictorCorrelationMatrix'; +import PredictorOrderingRobustness from './PredictorOrderingRobustness'; import { Share } from 'lucide-react'; interface VisualizationDashboardProps { @@ -78,6 +79,7 @@ export default function VisualizationDashboard({ hasBenchmarkLoss, hasDistributionDistance: types.has('distribution_distance'), hasPredictorCorrelation: types.has('predictor_correlation'), + hasPredictorOrdering: types.has('progressive_inclusion') || types.has('predictor_importance'), numericalVars, categoricalVars, hasPerVariableData: numericalVars.length > 0 || categoricalVars.length > 0, @@ -115,6 +117,13 @@ export default function VisualizationDashboard({ }); } + if (dataAnalysis.hasPredictorOrdering) { + tabsList.push({ + id: 'ordering', + label: 'Predictor selection', + }); + } + return tabsList; }, [dataAnalysis]); @@ -267,6 +276,11 @@ export default function VisualizationDashboard({ {activeTab === 'correlation' && ( )} + + {/* Predictor Ordering and Robustness Tab */} + {activeTab === 'ordering' && ( + + )}
); From 8f942879277c64bdab277ae0e31845e946aedad9 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 22:41:40 +0800 Subject: [PATCH 09/12] adding distribution metrics to dashboard --- .../components/ImputationResults.tsx | 315 ++++++++++++++++++ .../PredictorOrderingRobustness.tsx | 6 +- .../components/VisualizationDashboard.tsx | 245 ++++++++++++-- 3 files changed, 542 insertions(+), 24 deletions(-) create mode 100644 microimputation-dashboard/components/ImputationResults.tsx diff --git a/microimputation-dashboard/components/ImputationResults.tsx b/microimputation-dashboard/components/ImputationResults.tsx new file mode 100644 index 0000000..ce3ab42 --- /dev/null +++ b/microimputation-dashboard/components/ImputationResults.tsx @@ -0,0 +1,315 @@ +'use client'; + +import { useMemo } from 'react'; +import { ImputationDataPoint } from '@/types/imputation'; +import { BarChart, Bar, XAxis, YAxis, CartesianGrid, Tooltip, Legend, ResponsiveContainer, Cell } from 'recharts'; + +interface ImputationResultsProps { + data: ImputationDataPoint[]; +} + +interface DistributionMetric { + variable: string; + method: string; + metricName: string; + value: number; +} + +export default function ImputationResults({ data }: ImputationResultsProps) { + // Filter for distribution distance data + const distributionData = useMemo(() => { + return data.filter(d => d.type === 'distribution_distance'); + }, [data]); + + // Group by metric type + const { wassersteinData, klDivergenceData } = useMemo(() => { + const wasserstein: DistributionMetric[] = []; + const klDiv: DistributionMetric[] = []; + + distributionData.forEach(d => { + const metric: DistributionMetric = { + variable: d.variable, + method: d.method, + metricName: d.metric_name, + value: d.metric_value ?? 
0, + }; + + if (d.metric_name === 'wasserstein_distance') { + wasserstein.push(metric); + } else if (d.metric_name === 'kl_divergence') { + klDiv.push(metric); + } + }); + + // Sort by value (ascending - lower is better) + wasserstein.sort((a, b) => a.value - b.value); + klDiv.sort((a, b) => a.value - b.value); + + return { + wassersteinData: wasserstein, + klDivergenceData: klDiv + }; + }, [distributionData]); + + const hasWasserstein = wassersteinData.length > 0; + const hasKLDivergence = klDivergenceData.length > 0; + + if (!hasWasserstein && !hasKLDivergence) { + return null; + } + + // Color function based on value quality (lower is better) + const getWassersteinColor = (value: number): string => { + if (value < 0.01) return '#16a34a'; // Dark green - excellent + if (value < 0.05) return '#22c55e'; // Green - good + if (value < 0.1) return '#eab308'; // Yellow - moderate + if (value < 0.2) return '#f97316'; // Orange - fair + return '#ef4444'; // Red - poor + }; + + const getKLColor = (value: number): string => { + if (value < 0.1) return '#16a34a'; // Dark green - excellent + if (value < 0.5) return '#22c55e'; // Green - good + if (value < 1.0) return '#eab308'; // Yellow - moderate + if (value < 5.0) return '#f97316'; // Orange - fair + return '#ef4444'; // Red - poor + }; + + return ( +
+
+

+ Imputation results +

+

+ Distributional quality metrics comparing imputed values to true values +

+
+ + {/* Wasserstein Distance Section */} + {hasWasserstein && ( +
+

+ Numerical variables (Wasserstein distance) +

+ + {/* Explanation */} +
+

+ What is Wasserstein distance? Also known as "Earth Mover's Distance," + this metric measures how much "work" is needed to transform one probability distribution + into another. Think of it as the minimum cost to rearrange one pile of dirt to match + another pile's shape. +

+

+ Why use it for imputation? Wasserstein distance is ideal for numerical + variables because it considers the actual distances between values, not just whether + they match exactly. A value of 0 means perfect imputation, and larger values indicate + greater differences between imputed and true distributions. +

+

+ Interpretation: Values closer to 0 are better. Generally, values below + 0.05 indicate good imputation quality, while values above 0.2 suggest significant + distributional differences. +

+
+ + {/* Bar chart */} +
+ + + + + + [value.toFixed(6), 'Wasserstein Distance']} + /> + + + {wassersteinData.map((entry, index) => ( + + ))} + + + +
+ + {/* Detailed table */} +
+ + + + + + + + + + {wassersteinData.map((item) => { + let assessment = ''; + let assessmentColor = ''; + + if (item.value < 0.01) { + assessment = 'Excellent'; + assessmentColor = 'text-green-700 font-semibold'; + } else if (item.value < 0.05) { + assessment = 'Good'; + assessmentColor = 'text-green-600'; + } else if (item.value < 0.1) { + assessment = 'Moderate'; + assessmentColor = 'text-yellow-600'; + } else if (item.value < 0.2) { + assessment = 'Fair'; + assessmentColor = 'text-orange-600'; + } else { + assessment = 'Poor'; + assessmentColor = 'text-red-600 font-semibold'; + } + + return ( + + + + + + ); + })} + +
+ Variable + + Wasserstein Distance + + Quality Assessment +
+ {item.variable} + + {item.value.toFixed(6)} + + {assessment} +
+
+
+ )} + + {/* KL Divergence Section */} + {hasKLDivergence && ( +
+

+ Categorical variables (KL-divergence) +

+ + {/* Explanation */} +
+

+ What is KL-divergence? Kullback-Leibler divergence measures how much + one probability distribution differs from another. It quantifies the "information lost" + when using the imputed distribution to approximate the true distribution. +

+

+ Why use it for categorical variables? KL-divergence is particularly + useful for categorical data because it compares probability distributions across + categories. It's sensitive to differences in how probabilities are distributed across + all possible categories. +

+

+ Interpretation: A value of 0 means perfect match. Values below 0.5 + indicate good imputation, while values above 5.0 suggest substantial distributional + differences. Note that KL-divergence is not symmetric and can range from 0 to infinity. +

+
+ + {/* Bar chart */} +
+ + + + + + [value.toFixed(6), 'KL-Divergence']} + /> + + + {klDivergenceData.map((entry, index) => ( + + ))} + + + +
+ + {/* Detailed table */} +
+ + + + + + + + + + {klDivergenceData.map((item) => { + let assessment = ''; + let assessmentColor = ''; + + if (item.value < 0.1) { + assessment = 'Excellent'; + assessmentColor = 'text-green-700 font-semibold'; + } else if (item.value < 0.5) { + assessment = 'Good'; + assessmentColor = 'text-green-600'; + } else if (item.value < 1.0) { + assessment = 'Moderate'; + assessmentColor = 'text-yellow-600'; + } else if (item.value < 5.0) { + assessment = 'Fair'; + assessmentColor = 'text-orange-600'; + } else { + assessment = 'Poor'; + assessmentColor = 'text-red-600 font-semibold'; + } + + return ( + + + + + + ); + })} + +
+ Variable + + KL-Divergence + + Quality Assessment +
+ {item.variable} + + {item.value.toFixed(6)} + + {assessment} +
+
+
+ )} +
+ ); +} diff --git a/microimputation-dashboard/components/PredictorOrderingRobustness.tsx b/microimputation-dashboard/components/PredictorOrderingRobustness.tsx index e784a24..65ceee0 100644 --- a/microimputation-dashboard/components/PredictorOrderingRobustness.tsx +++ b/microimputation-dashboard/components/PredictorOrderingRobustness.tsx @@ -148,7 +148,7 @@ export default function PredictorOrderingRobustness({ data }: PredictorOrderingR How this works: This analysis adds predictors one at a time, choosing the predictor that improves performance the most at each step. This step-by-step approach is efficient but doesn't test - every possible combination of predictors. + every possible combination of predictors. Note that this analysis may differ depending on the model type passed when using the `progressive_predictor_inclusion` function that produced these results.

Reading the chart: The bars show cumulative improvement from @@ -176,6 +176,10 @@ export default function PredictorOrderingRobustness({ data }: PredictorOrderingR {(bestCombination.cumulativeImprovement * 100).toFixed(3)}% + {' '} + + (relative to the first predictor added, which was the best single predictor) +

diff --git a/microimputation-dashboard/components/VisualizationDashboard.tsx b/microimputation-dashboard/components/VisualizationDashboard.tsx index 23ba060..2071999 100644 --- a/microimputation-dashboard/components/VisualizationDashboard.tsx +++ b/microimputation-dashboard/components/VisualizationDashboard.tsx @@ -8,6 +8,7 @@ import PerVariableCharts from './PerVariableCharts'; import VisualizationTabs from './VisualizationTabs'; import PredictorCorrelationMatrix from './PredictorCorrelationMatrix'; import PredictorOrderingRobustness from './PredictorOrderingRobustness'; +import ImputationResults from './ImputationResults'; import { Share } from 'lucide-react'; interface VisualizationDashboardProps { @@ -75,14 +76,215 @@ export default function VisualizationDashboard({ categoricalVars.push(...Array.from(llVars)); } + // Check for actual distribution distance data (wasserstein or kl_divergence) + const distributionData = data.filter(d => d.type === 'distribution_distance'); + const hasWasserstein = distributionData.some(d => d.metric_name === 'wasserstein_distance' && d.metric_value !== null); + const hasKLDivergence = distributionData.some(d => d.metric_name === 'kl_divergence' && d.metric_value !== null); + const hasDistributionDistance = hasWasserstein || hasKLDivergence; + + // Check for predictor correlation data + const correlationData = data.filter(d => d.type === 'predictor_correlation'); + const hasPredictorCorrelation = correlationData.length > 0 && correlationData.some(d => d.metric_value !== null); + + // Check for predictor ordering/importance data + const progressiveData = data.filter(d => d.type === 'progressive_inclusion'); + const importanceData = data.filter(d => d.type === 'predictor_importance'); + const hasPredictorOrdering = (progressiveData.length > 0 && progressiveData.some(d => d.metric_value !== null)) || + (importanceData.length > 0 && importanceData.some(d => d.metric_value !== null)); + + // Find imputed variables (from 
distribution_distance data) + const imputedVars = new Set(); + distributionData.forEach(d => { + if (d.variable && d.metric_value !== null) { + imputedVars.add(d.variable); + } + }); + + // Calculate best performing model + let bestModel = ''; + let avgLoss = 0; + + if (hasBenchmarkLoss) { + const benchmarkData = data.filter(d => d.type === 'benchmark_loss'); + const methods = Array.from(new Set(benchmarkData.map(d => d.method))); + + // Calculate weighted combined rank for each method (same logic as BenchmarkLossCharts) + const quantileRanks = new Map(); + const logLossRanks = new Map(); + const quantileVarCounts = new Map>(); + const logLossVarCounts = new Map>(); + + methods.forEach(method => { + const quantileData = benchmarkData.filter( + d => d.method === method && d.metric_name === 'quantile_loss' && d.split === 'test' && + d.quantile === 'mean' && !d.variable.includes('_mean_all') && d.metric_value !== null + ); + const logLossData = benchmarkData.filter( + d => d.method === method && d.metric_name === 'log_loss' && d.split === 'test' && + d.quantile === 'mean' && !d.variable.includes('_mean_all') && d.metric_value !== null + ); + + if (quantileData.length > 0) { + const avgQuantile = quantileData.reduce((sum, d) => sum + (d.metric_value ?? 0), 0) / quantileData.length; + quantileRanks.set(method, avgQuantile); + quantileVarCounts.set(method, new Set(quantileData.map(d => d.variable))); + } + + if (logLossData.length > 0) { + const avgLogLoss = logLossData.reduce((sum, d) => sum + (d.metric_value ?? 
0), 0) / logLossData.length; + logLossRanks.set(method, avgLogLoss); + logLossVarCounts.set(method, new Set(logLossData.map(d => d.variable))); + } + }); + + // Rank methods by their average losses + const rankedQuantile = Array.from(quantileRanks.entries()).sort((a, b) => a[1] - b[1]); + const rankedLogLoss = Array.from(logLossRanks.entries()).sort((a, b) => a[1] - b[1]); + + const combinedRanks = new Map(); + methods.forEach(method => { + const qRank = rankedQuantile.findIndex(([m]) => m === method) + 1; + const lRank = rankedLogLoss.findIndex(([m]) => m === method) + 1; + const nQuantileVars = quantileVarCounts.get(method)?.size || 0; + const nLogLossVars = logLossVarCounts.get(method)?.size || 0; + const totalVars = nQuantileVars + nLogLossVars; + + if (totalVars > 0) { + let weightedRank = 0; + if (qRank > 0) { + weightedRank += nQuantileVars * qRank; + } + if (lRank > 0) { + weightedRank += nLogLossVars * lRank; + } + combinedRanks.set(method, weightedRank / totalVars); + } + }); + + const sortedMethods = Array.from(combinedRanks.entries()).sort((a, b) => a[1] - b[1]); + if (sortedMethods.length > 0) { + bestModel = sortedMethods[0][0]; + + // Calculate average loss for best model + const bestMethodData = benchmarkData.filter( + d => d.method === bestModel && d.split === 'test' && + d.quantile === 'mean' && !d.variable.includes('_mean_all') && d.metric_value !== null + ); + if (bestMethodData.length > 0) { + avgLoss = bestMethodData.reduce((sum, d) => sum + (d.metric_value ?? 
0), 0) / bestMethodData.length; + } + } + } + + // Calculate quality scores by variable for model performance + let modelExcellent = 0; + let modelGood = 0; + let modelPoor = 0; + let modelScore = 0; + let modelQuality = ''; + + if (hasBenchmarkLoss && bestModel) { + const benchmarkData = data.filter(d => d.type === 'benchmark_loss'); + const bestModelVars = benchmarkData.filter( + d => d.method === bestModel && d.split === 'test' && + d.quantile === 'mean' && !d.variable.includes('_mean_all') && d.metric_value !== null + ); + + bestModelVars.forEach(d => { + const loss = d.metric_value ?? 0; + if (loss < 0.02) modelExcellent++; + else if (loss < 0.05) modelGood++; + else modelPoor++; + }); + + const totalModelVars = modelExcellent + modelGood + modelPoor; + if (totalModelVars > 0) { + modelScore = ((modelExcellent * 100) + (modelGood * 75)) / totalModelVars; + if (modelScore >= 90) modelQuality = 'Excellent'; + else if (modelScore >= 70) modelQuality = 'Good'; + else modelQuality = 'Needs improvement'; + } + } + + // Calculate quality scores by variable for distributional accuracy + let distExcellent = 0; + let distGood = 0; + let distPoor = 0; + let distScore = 0; + let distQuality = ''; + + distributionData.forEach(d => { + const value = d.metric_value ?? 
0; + // Different thresholds for Wasserstein vs KL-divergence + if (d.metric_name === 'wasserstein_distance') { + if (value < 0.01) distExcellent++; + else if (value < 0.05) distGood++; + else distPoor++; + } else if (d.metric_name === 'kl_divergence') { + if (value < 0.1) distExcellent++; + else if (value < 0.5) distGood++; + else distPoor++; + } + }); + + const totalDistVars = distExcellent + distGood + distPoor; + if (totalDistVars > 0) { + distScore = ((distExcellent * 100) + (distGood * 75)) / totalDistVars; + if (distScore >= 90) distQuality = 'Excellent'; + else if (distScore >= 70) distQuality = 'Good'; + else distQuality = 'Needs improvement'; + } + + // Calculate overall quality (weighted average) + let overallScore = 0; + let overallQuality = ''; + let overallColor = ''; + const hasModelScore = modelScore > 0; + const hasDistScore = distScore > 0; + + if (hasModelScore && hasDistScore) { + overallScore = (modelScore + distScore) / 2; + } else if (hasModelScore) { + overallScore = modelScore; + } else if (hasDistScore) { + overallScore = distScore; + } + + if (overallScore >= 90) { + overallQuality = 'Excellent quality'; + overallColor = 'text-green-700 bg-green-50 border-green-500'; + } else if (overallScore >= 70) { + overallQuality = 'Good quality'; + overallColor = 'text-yellow-700 bg-yellow-50 border-yellow-500'; + } else if (overallScore > 0) { + overallQuality = 'Needs improvement'; + overallColor = 'text-red-700 bg-red-50 border-red-500'; + } + return { hasBenchmarkLoss, - hasDistributionDistance: types.has('distribution_distance'), - hasPredictorCorrelation: types.has('predictor_correlation'), - hasPredictorOrdering: types.has('progressive_inclusion') || types.has('predictor_importance'), + hasDistributionDistance, + hasPredictorCorrelation, + hasPredictorOrdering, numericalVars, categoricalVars, hasPerVariableData: numericalVars.length > 0 || categoricalVars.length > 0, + imputedVars: Array.from(imputedVars).sort(), + bestModel, + avgLoss, + 
overallScore, + overallQuality, + overallColor, + modelScore, + modelQuality, + modelExcellent, + modelGood, + modelPoor, + distScore, + distQuality, + distExcellent, + distGood, + distPoor, }; }, [data]); @@ -94,6 +296,13 @@ export default function VisualizationDashboard({ tabsList.push({ id: 'overview', label: 'Model benchmarking' }); } + if (dataAnalysis.hasDistributionDistance) { + tabsList.push({ + id: 'imputation', + label: 'Imputation results', + }); + } + if (dataAnalysis.numericalVars.length > 0) { tabsList.push({ id: 'numerical', @@ -201,27 +410,12 @@ export default function VisualizationDashboard({
- {/* Data Info */} + {/* Imputation Summary */}
-

Dataset Overview

-
-
-

Total Records

-

{data.length}

-
- {dataAnalysis.numericalVars.length > 0 && ( -
-

Numerical Variables

-

{dataAnalysis.numericalVars.length}

-
- )} - {dataAnalysis.categoricalVars.length > 0 && ( -
-

Categorical Variables

-

{dataAnalysis.categoricalVars.length}

-
- )} -
+

Imputation summary

+

+ Assessment of the quality of the imputations produced by the best-performing (or the only selected) model +

{/* Tabs Navigation */} @@ -281,6 +475,11 @@ export default function VisualizationDashboard({ {activeTab === 'ordering' && ( )} + + {/* Imputation Results Tab */} + {activeTab === 'imputation' && ( + + )}
); From e93bfa375a452d56eda5944f1a5b1b49f72eec58 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 23:43:18 +0800 Subject: [PATCH 10/12] add summary and fix deployment --- .../components/BenchmarkLossCharts.tsx | 2 +- .../components/ImputationResults.tsx | 6 +- .../components/VisualizationDashboard.tsx | 201 ++++++++++++++---- 3 files changed, 161 insertions(+), 48 deletions(-) diff --git a/microimputation-dashboard/components/BenchmarkLossCharts.tsx b/microimputation-dashboard/components/BenchmarkLossCharts.tsx index 88b579d..8cf9e5c 100644 --- a/microimputation-dashboard/components/BenchmarkLossCharts.tsx +++ b/microimputation-dashboard/components/BenchmarkLossCharts.tsx @@ -238,7 +238,7 @@ export default function BenchmarkLossCharts({ data }: BenchmarkLossChartsProps) quantileTrainTestRatio, logLossTrainTestRatio, }; - }, [methods, quantileLossData, logLossChartData, benchmarkData]); + }, [methods, quantileLossData, logLossData, logLossChartData, benchmarkData]); // Set default selected method to best model useMemo(() => { diff --git a/microimputation-dashboard/components/ImputationResults.tsx b/microimputation-dashboard/components/ImputationResults.tsx index ce3ab42..6eceeca 100644 --- a/microimputation-dashboard/components/ImputationResults.tsx +++ b/microimputation-dashboard/components/ImputationResults.tsx @@ -96,10 +96,10 @@ export default function ImputationResults({ data }: ImputationResultsProps) { {/* Explanation */}

- What is Wasserstein distance? Also known as "Earth Mover's Distance," - this metric measures how much "work" is needed to transform one probability distribution + What is Wasserstein distance? Also known as "Earth Mover's Distance", + this metric measures how much "work" is needed to transform one probability distribution into another. Think of it as the minimum cost to rearrange one pile of dirt to match - another pile's shape. + another pile's shape.

Why use it for imputation? Wasserstein distance is ideal for numerical diff --git a/microimputation-dashboard/components/VisualizationDashboard.tsx b/microimputation-dashboard/components/VisualizationDashboard.tsx index 2071999..f620925 100644 --- a/microimputation-dashboard/components/VisualizationDashboard.tsx +++ b/microimputation-dashboard/components/VisualizationDashboard.tsx @@ -49,6 +49,11 @@ export default function VisualizationDashboard({ const numericalVars: string[] = []; const categoricalVars: string[] = []; + // Get all unique methods from benchmark data + const allMethods = hasBenchmarkLoss + ? Array.from(new Set(data.filter(d => d.type === 'benchmark_loss').map(d => d.method))) + : []; + if (hasBenchmarkLoss) { const benchmarkData = data.filter(d => d.type === 'benchmark_loss'); @@ -100,7 +105,7 @@ export default function VisualizationDashboard({ } }); - // Calculate best performing model + // Calculate best performing model (same logic as BenchmarkLossCharts) let bestModel = ''; let avgLoss = 0; @@ -108,72 +113,117 @@ export default function VisualizationDashboard({ const benchmarkData = data.filter(d => d.type === 'benchmark_loss'); const methods = Array.from(new Set(benchmarkData.map(d => d.method))); - // Calculate weighted combined rank for each method (same logic as BenchmarkLossCharts) - const quantileRanks = new Map(); - const logLossRanks = new Map(); + // Filter quantile and log loss data (matching BenchmarkLossCharts logic) + const quantileLossData = benchmarkData.filter( + d => d.metric_name === 'quantile_loss' && + d.split === 'test' && + typeof d.quantile === 'number' && + d.quantile >= 0 && + d.quantile <= 1 + ); + + const logLossData = benchmarkData.filter( + d => d.metric_name === 'log_loss' && + d.split === 'test' && + d.metric_value !== null + ); + + // Calculate average quantile loss per method + const quantileLossAvg = new Map(); const quantileVarCounts = new Map>(); + + if (quantileLossData.length > 0) { + const methodSums = new 
Map(); + quantileLossData.forEach(d => { + if (d.metric_value !== null) { + if (!methodSums.has(d.method)) { + methodSums.set(d.method, { sum: 0, count: 0 }); + } + const entry = methodSums.get(d.method)!; + entry.sum += d.metric_value; + entry.count += 1; + + if (!quantileVarCounts.has(d.method)) { + quantileVarCounts.set(d.method, new Set()); + } + quantileVarCounts.get(d.method)!.add(d.variable); + } + }); + methodSums.forEach((value, method) => { + quantileLossAvg.set(method, value.sum / value.count); + }); + } + + // Calculate average log loss per method + const logLossAvg = new Map(); const logLossVarCounts = new Map>(); - methods.forEach(method => { - const quantileData = benchmarkData.filter( - d => d.method === method && d.metric_name === 'quantile_loss' && d.split === 'test' && - d.quantile === 'mean' && !d.variable.includes('_mean_all') && d.metric_value !== null - ); - const logLossData = benchmarkData.filter( - d => d.method === method && d.metric_name === 'log_loss' && d.split === 'test' && - d.quantile === 'mean' && !d.variable.includes('_mean_all') && d.metric_value !== null - ); - - if (quantileData.length > 0) { - const avgQuantile = quantileData.reduce((sum, d) => sum + (d.metric_value ?? 
0), 0) / quantileData.length; - quantileRanks.set(method, avgQuantile); - quantileVarCounts.set(method, new Set(quantileData.map(d => d.variable))); - } + if (logLossData.length > 0) { + const methodSums = new Map(); + logLossData.forEach(d => { + if (d.metric_value !== null) { + if (!methodSums.has(d.method)) { + methodSums.set(d.method, { sum: 0, count: 0 }); + } + const entry = methodSums.get(d.method)!; + entry.sum += d.metric_value; + entry.count += 1; + + if (!logLossVarCounts.has(d.method)) { + logLossVarCounts.set(d.method, new Set()); + } + logLossVarCounts.get(d.method)!.add(d.variable); + } + }); + methodSums.forEach((value, method) => { + logLossAvg.set(method, value.sum / value.count); + }); + } - if (logLossData.length > 0) { - const avgLogLoss = logLossData.reduce((sum, d) => sum + (d.metric_value ?? 0), 0) / logLossData.length; - logLossRanks.set(method, avgLogLoss); - logLossVarCounts.set(method, new Set(logLossData.map(d => d.variable))); - } - }); + // Rank methods by each metric (lower is better) + const rankMethods = (avgMap: Map): Map => { + const sorted = Array.from(avgMap.entries()).sort((a, b) => a[1] - b[1]); + const ranks = new Map(); + sorted.forEach(([method], index) => { + ranks.set(method, index + 1); + }); + return ranks; + }; - // Rank methods by their average losses - const rankedQuantile = Array.from(quantileRanks.entries()).sort((a, b) => a[1] - b[1]); - const rankedLogLoss = Array.from(logLossRanks.entries()).sort((a, b) => a[1] - b[1]); + const quantileRanks = rankMethods(quantileLossAvg); + const logLossRanks = rankMethods(logLossAvg); + // Calculate weighted combined rank const combinedRanks = new Map(); methods.forEach(method => { - const qRank = rankedQuantile.findIndex(([m]) => m === method) + 1; - const lRank = rankedLogLoss.findIndex(([m]) => m === method) + 1; + const qRank = quantileRanks.get(method); + const lRank = logLossRanks.get(method); const nQuantileVars = quantileVarCounts.get(method)?.size || 0; const 
nLogLossVars = logLossVarCounts.get(method)?.size || 0; const totalVars = nQuantileVars + nLogLossVars; if (totalVars > 0) { let weightedRank = 0; - if (qRank > 0) { + if (qRank !== undefined) { weightedRank += nQuantileVars * qRank; } - if (lRank > 0) { + if (lRank !== undefined) { weightedRank += nLogLossVars * lRank; } combinedRanks.set(method, weightedRank / totalVars); + } else { + combinedRanks.set(method, Infinity); } }); - const sortedMethods = Array.from(combinedRanks.entries()).sort((a, b) => a[1] - b[1]); - if (sortedMethods.length > 0) { - bestModel = sortedMethods[0][0]; - - // Calculate average loss for best model - const bestMethodData = benchmarkData.filter( - d => d.method === bestModel && d.split === 'test' && - d.quantile === 'mean' && !d.variable.includes('_mean_all') && d.metric_value !== null - ); - if (bestMethodData.length > 0) { - avgLoss = bestMethodData.reduce((sum, d) => sum + (d.metric_value ?? 0), 0) / bestMethodData.length; + // Find best method (lowest combined rank) + let bestRank = Infinity; + combinedRanks.forEach((rank, method) => { + if (rank < bestRank) { + bestRank = rank; + bestModel = method; } - } + }); } // Calculate quality scores by variable for model performance @@ -285,6 +335,7 @@ export default function VisualizationDashboard({ distExcellent, distGood, distPoor, + allMethods, }; }, [data]); @@ -416,6 +467,68 @@ export default function VisualizationDashboard({

Assessment of the quality of the imputations produced by the best-performing (or the only selected) model

+ +
+ {/* Imputed Variables Section */} +
+

+ Imputed Variables +

+ {dataAnalysis.imputedVars.length > 0 ? ( +
+

+ {dataAnalysis.imputedVars.length} variable{dataAnalysis.imputedVars.length !== 1 ? 's' : ''} imputed +

+
    + {dataAnalysis.imputedVars.map((variable) => ( +
  • + {variable} +
  • + ))} +
+
+ ) : ( +

+ No imputed variable information available in the CSV +

+ )} +
+ + {/* Best Model Section */} +
+

+ {dataAnalysis.allMethods.length === 1 ? 'Imputation Model' : 'Best Performing Model'} +

+ {dataAnalysis.bestModel ? ( +
+
+ + {dataAnalysis.bestModel} + + {dataAnalysis.allMethods.length === 1 && ( + + Only model + + )} + {dataAnalysis.allMethods.length > 1 && ( + + Best of {dataAnalysis.allMethods.length} + + )} +
+ {dataAnalysis.allMethods.length > 1 && ( +

+ Selected based on combined performance across all cross-validation loss metrics +

+ )} +
+ ) : ( +

+ No model information available in the CSV +

+ )} +
+
{/* Tabs Navigation */} From 4e6ab42fb885e23cd7dded6db1081506fa9eeb31 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 23:46:41 +0800 Subject: [PATCH 11/12] replace quotes to fix deployment --- microimputation-dashboard/components/ImputationResults.tsx | 4 ++-- .../components/PredictorCorrelationMatrix.tsx | 2 +- .../components/PredictorOrderingRobustness.tsx | 4 ++-- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/microimputation-dashboard/components/ImputationResults.tsx b/microimputation-dashboard/components/ImputationResults.tsx index 6eceeca..598b507 100644 --- a/microimputation-dashboard/components/ImputationResults.tsx +++ b/microimputation-dashboard/components/ImputationResults.tsx @@ -210,13 +210,13 @@ export default function ImputationResults({ data }: ImputationResultsProps) {

What is KL-divergence? Kullback-Leibler divergence measures how much - one probability distribution differs from another. It quantifies the "information lost" + one probability distribution differs from another. It quantifies the "information lost" when using the imputed distribution to approximate the true distribution.

Why use it for categorical variables? KL-divergence is particularly useful for categorical data because it compares probability distributions across - categories. It's sensitive to differences in how probabilities are distributed across + categories. It's sensitive to differences in how probabilities are distributed across all possible categories.

diff --git a/microimputation-dashboard/components/PredictorCorrelationMatrix.tsx b/microimputation-dashboard/components/PredictorCorrelationMatrix.tsx index 331a5cc..6a47799 100644 --- a/microimputation-dashboard/components/PredictorCorrelationMatrix.tsx +++ b/microimputation-dashboard/components/PredictorCorrelationMatrix.tsx @@ -428,7 +428,7 @@ export default function PredictorCorrelationMatrix({ data }: PredictorCorrelatio What is mutual information? Mutual information measures how much information one variable provides about another. Unlike correlation, it captures both linear and non-linear relationships between variables. Values range from 0 (independent variables) to higher positive values (strong dependency).

- Why measure it for imputed variables? Mutual information between predictors and imputed variables reveals which predictors are most informative for imputation. High mutual information indicates that a predictor strongly influences the imputed variable's distribution, making it crucial for accurate imputation. This helps validate that your imputation models are using the most relevant predictors and can identify when key predictive relationships exist in your data. + Why measure it for imputed variables? Mutual information between predictors and imputed variables reveals which predictors are most informative for imputation. High mutual information indicates that a predictor strongly influences the imputed variable's distribution, making it crucial for accurate imputation. This helps validate that your imputation models are using the most relevant predictors and can identify when key predictive relationships exist in your data.

{/* Color scale within explanation box */} diff --git a/microimputation-dashboard/components/PredictorOrderingRobustness.tsx b/microimputation-dashboard/components/PredictorOrderingRobustness.tsx index 65ceee0..fea48da 100644 --- a/microimputation-dashboard/components/PredictorOrderingRobustness.tsx +++ b/microimputation-dashboard/components/PredictorOrderingRobustness.tsx @@ -147,7 +147,7 @@ export default function PredictorOrderingRobustness({ data }: PredictorOrderingR

How this works: This analysis adds predictors one at a time, choosing the predictor that improves performance the most at each step. This - step-by-step approach is efficient but doesn't test + step-by-step approach is efficient but doesn't test every possible combination of predictors. Note that this analysis may differ depending on the model type passed when using the `progressive_predictor_inclusion` function that produced these results.

@@ -282,7 +282,7 @@ export default function PredictorOrderingRobustness({ data }: PredictorOrderingR

What this shows: This analysis measures how much performance degrades when each predictor is removed. Predictors that cause large performance - drops when removed are critical to the model's accuracy. + drops when removed are critical to the model's accuracy.

Reading the chart: Positive values (bars pointing right) indicate From 70fed2baf6645c102f721c4110d77db005e5a798 Mon Sep 17 00:00:00 2001 From: juaristi22 Date: Fri, 24 Oct 2025 23:49:06 +0800 Subject: [PATCH 12/12] remove unused variable --- microimputation-dashboard/components/VisualizationDashboard.tsx | 2 -- 1 file changed, 2 deletions(-) diff --git a/microimputation-dashboard/components/VisualizationDashboard.tsx b/microimputation-dashboard/components/VisualizationDashboard.tsx index f620925..67a1d88 100644 --- a/microimputation-dashboard/components/VisualizationDashboard.tsx +++ b/microimputation-dashboard/components/VisualizationDashboard.tsx @@ -107,7 +107,6 @@ export default function VisualizationDashboard({ // Calculate best performing model (same logic as BenchmarkLossCharts) let bestModel = ''; - let avgLoss = 0; if (hasBenchmarkLoss) { const benchmarkData = data.filter(d => d.type === 'benchmark_loss'); @@ -321,7 +320,6 @@ export default function VisualizationDashboard({ hasPerVariableData: numericalVars.length > 0 || categoricalVars.length > 0, imputedVars: Array.from(imputedVars).sort(), bestModel, - avgLoss, overallScore, overallQuality, overallColor,