From 017cc581fc212fcac659d24e3b5d3af6769bfb80 Mon Sep 17 00:00:00 2001
From: Prashant Vasudevan <71649489+vprashrex@users.noreply.github.com>
Date: Sat, 9 May 2026 09:51:59 +0530
Subject: [PATCH 1/5] feat: Integrate Google Gemini model configurations and update assessment model types

---
 app/lib/data/assessmentModels.ts | 116 ++++++++++++++++++++++++++++++-
 app/lib/types/assessment.ts | 2 +-
 2 files changed, 114 insertions(+), 4 deletions(-)

diff --git a/app/lib/data/assessmentModels.ts b/app/lib/data/assessmentModels.ts
index 4f82229..daf8f7c 100644
--- a/app/lib/data/assessmentModels.ts
+++ b/app/lib/data/assessmentModels.ts
@@ -1,6 +1,7 @@
 import type {
   AssessmentModelConfig,
   ConfigParamDefinition,
+  ModelOption,
 } from "@/app/lib/types/assessment";
 import type { ConfigBlob } from "@/app/lib/types/configs";
 
@@ -21,7 +22,42 @@ export const GPT4_STYLE_CONFIG = {
   },
 } as const satisfies Record<string, ConfigParamDefinition>;
 
+// ── Gemini param configs ─────────────────────────────────────────
+
+const GEMINI_TEMPERATURE_CONFIG = {
+  temperature: {
+    max: 2.0,
+    min: 0.0,
+    type: "float",
+    default: 0.4,
+    description: "Controls randomness. Lower = more deterministic.",
+  },
+} as const satisfies Record<string, ConfigParamDefinition>;
+
+const GEMINI_THINKING_CONFIG = {
+  ...GEMINI_TEMPERATURE_CONFIG,
+  thinking_level: {
+    type: "enum",
+    default: "LOW",
+    options: ["MINIMAL", "LOW", "MEDIUM", "HIGH"],
+    description: "Controls how much the model thinks before responding.",
+  },
+} as const satisfies Record<string, ConfigParamDefinition>;
+
+const GEMINI_THINKING_NO_MINIMAL_CONFIG = {
+  ...GEMINI_TEMPERATURE_CONFIG,
+  thinking_level: {
+    type: "enum",
+    default: "LOW",
+    options: ["LOW", "MEDIUM", "HIGH"],
+    description: "Controls how much the model thinks before responding.",
+  },
+} as const satisfies Record<string, ConfigParamDefinition>;
+
+// ── All model configs ────────────────────────────────────────────
+
 export const ASSESSMENT_MODEL_CONFIGS: AssessmentModelConfig[] = [
+  // OpenAI
   { provider: "openai", model_name: "gpt-4o-mini", config: GPT4_STYLE_CONFIG },
   { provider: "openai", model_name: "gpt-4o", config: GPT4_STYLE_CONFIG },
   { provider: "openai", model_name: "gpt-4.1", config: GPT4_STYLE_CONFIG },
@@ -215,9 +251,84 @@ export const ASSESSMENT_MODEL_CONFIGS: AssessmentModelConfig[] = [
       },
     },
   },
+  // Google (Gemini)
+  {
+    provider: "google",
+    model_name: "gemini-2.0-flash-lite",
+    config: GEMINI_TEMPERATURE_CONFIG,
+  },
+  {
+    provider: "google",
+    model_name: "gemini-2.0-flash",
+    config: GEMINI_TEMPERATURE_CONFIG,
+  },
+  {
+    provider: "google",
+    model_name: "gemini-2.5-flash-lite",
+    config: GEMINI_TEMPERATURE_CONFIG,
+  },
+  {
+    provider: "google",
+    model_name: "gemini-2.5-flash",
+    config: GEMINI_TEMPERATURE_CONFIG,
+  },
+  {
+    provider: "google",
+    model_name: "gemini-2.5-pro",
+    config: GEMINI_TEMPERATURE_CONFIG,
+  },
+  {
+    provider: "google",
+    model_name: "gemini-3.1-flash-lite-preview",
+    config: GEMINI_THINKING_CONFIG,
+  },
+  {
+    provider: "google",
+    model_name: "gemini-3.1-pro-preview",
+    config: GEMINI_THINKING_NO_MINIMAL_CONFIG,
+  },
+  {
+    provider: "google",
+    model_name: "gemini-3-flash-preview",
+    config: GEMINI_THINKING_CONFIG,
+  },
 ];
 
-export const PROVIDER_OPTIONS = [{ value: "openai", label: "OpenAI" }] as const;
+export const PROVIDER_OPTIONS = [
+  { value: "openai", label: "OpenAI" },
+  { value: "google", label: "Google (Gemini)" },
+] as const;
+
+export function getModelsByProvider(provider: string): ModelOption[] {
+  return ASSESSMENT_MODEL_CONFIGS.filter((m) => m.provider === provider).map(
+    ({ model_name }) => ({ value: model_name, label: model_name }),
+  );
+}
+
+export function getDefaultModelForProvider(provider: string): string {
+  return (
+    ASSESSMENT_MODEL_CONFIGS.find((m) => m.provider === provider)?.model_name ??
+    "gpt-4o-mini"
+  );
+}
+
+export function getModelConfigDefinition(
+  modelName: string,
+): Record<string, ConfigParamDefinition> {
+  return (
+    ASSESSMENT_MODEL_CONFIGS.find((item) => item.model_name === modelName)
+      ?.config ?? GPT4_STYLE_CONFIG
+  );
+}
+
+export function buildDefaultParams(
+  modelName: string,
+): Record<string, number | string> {
+  const definition = getModelConfigDefinition(modelName);
+  return Object.fromEntries(
+    Object.entries(definition).map(([key, value]) => [key, value.default]),
+  );
+}
 
 export const ASSESSMENT_DEFAULT_CONFIG: ConfigBlob = {
   completion: {
@@ -226,8 +337,7 @@ export const ASSESSMENT_DEFAULT_CONFIG: ConfigBlob = {
     params: {
       model: "gpt-4o-mini",
       instructions: "",
-      top_p: GPT4_STYLE_CONFIG.top_p.default,
-      temperature: GPT4_STYLE_CONFIG.temperature.default,
+      ...buildDefaultParams("gpt-4o-mini"),
     },
   },
 };
diff --git a/app/lib/types/assessment.ts b/app/lib/types/assessment.ts
index 5edf69b..f9c0adf 100644
--- a/app/lib/types/assessment.ts
+++ b/app/lib/types/assessment.ts
@@ -105,7 +105,7 @@ export interface ConfigParamDefinition {
 }
 
 export interface AssessmentModelConfig {
-  provider: "openai";
+  provider: "openai" | "google";
   model_name: string;
   config: Record<string, ConfigParamDefinition>;
 }

From 01f625a46d116b593276f1bd23de49ef7e5c31e7 Mon Sep 17 00:00:00 2001
From: Prashant Vasudevan <71649489+vprashrex@users.noreply.github.com>
Date: Mon, 11 May 2026 10:21:17 +0530
Subject: [PATCH 2/5] chore: Clean up comments in assessmentModels.ts for clarity

---
 app/lib/data/assessmentModels.ts | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/app/lib/data/assessmentModels.ts b/app/lib/data/assessmentModels.ts
index daf8f7c..41ee16a 100644
--- a/app/lib/data/assessmentModels.ts
+++ b/app/lib/data/assessmentModels.ts
@@ -22,7 +22,7 @@ export const GPT4_STYLE_CONFIG = {
   },
 } as const satisfies Record<string, ConfigParamDefinition>;
 
-// ── Gemini param configs ─────────────────────────────────────────
+// Gemini param configs
 
 const GEMINI_TEMPERATURE_CONFIG = {
   temperature: {
@@ -54,8 +54,6 @@ const GEMINI_THINKING_NO_MINIMAL_CONFIG = {
   },
 } as const satisfies Record<string, ConfigParamDefinition>;
 
-// ── All model configs ────────────────────────────────────────────
-
 export const ASSESSMENT_MODEL_CONFIGS: AssessmentModelConfig[] = [
   // OpenAI
   { provider: "openai", model_name: "gpt-4o-mini", config: GPT4_STYLE_CONFIG },

From 2689da2a9ac455f9d296279aee5d8027660882c2 Mon Sep 17 00:00:00 2001
From: Ayush <80516839+Ayush8923@users.noreply.github.com>
Date: Mon, 11 May 2026 11:09:24 +0530
Subject: [PATCH 3/5] Apply suggestions from code review

Co-authored-by: Ayush <80516839+Ayush8923@users.noreply.github.com>
---
 app/lib/data/assessmentModels.ts | 2 --
 1 file changed, 2 deletions(-)

diff --git a/app/lib/data/assessmentModels.ts b/app/lib/data/assessmentModels.ts
index 41ee16a..b8c2266 100644
--- a/app/lib/data/assessmentModels.ts
+++ b/app/lib/data/assessmentModels.ts
@@ -22,8 +22,6 @@ export const GPT4_STYLE_CONFIG = {
   },
 } as const satisfies Record<string, ConfigParamDefinition>;
 
-// Gemini param configs
-
 const GEMINI_TEMPERATURE_CONFIG = {
   temperature: {
     max: 2.0,

From 806c908cb1522e2e69e96400499b072bb0d2226e Mon Sep 17 00:00:00 2001
From: Prashant Vasudevan <71649489+vprashrex@users.noreply.github.com>
Date: Tue, 12 May 2026 10:48:59 +0530
Subject: [PATCH 4/5] feat: Integrate dataset preview functionality and enhance file handling in assessment components

---
 .../assessment/datasets/[dataset_id]/route.ts | 97 +------------------
 .../assessment/ColumnMapperStep.tsx | 12 +-
 app/components/assessment/DataViewModal.tsx | 13 ++-
 app/components/assessment/DatasetsTab.tsx | 52 +++++++++-
 .../assessment/datasets/CreatePanel.tsx | 2 +-
 .../output-schema/OutputSchemaModal.tsx | 8 +-
 app/hooks/useAssessmentResults.ts | 5 +-
 app/lib/assessment/constants.ts | 3 +
 app/lib/assessment/results.ts | 9 +-
 app/lib/types/assessment.ts | 23 ++++-
 app/lib/utils/assessment.ts | 61 ++++--------
 11 files changed, 129 insertions(+), 156 deletions(-)

diff --git a/app/api/assessment/datasets/[dataset_id]/route.ts b/app/api/assessment/datasets/[dataset_id]/route.ts
index 7296408..a4f035b 100644
--- a/app/api/assessment/datasets/[dataset_id]/route.ts
+++ b/app/api/assessment/datasets/[dataset_id]/route.ts
@@ -1,58 +1,19 @@
-// BFF proxy — GET (with optional S3 file fetch, max 10 MB) + DELETE /api/v1/assessment/datasets/:id
+// BFF proxy — GET (optional preview via limit_rows) + DELETE /api/v1/assessment/datasets/:id
 
 import { NextRequest, NextResponse } from "next/server";
 import { apiClient } from "@/app/lib/apiClient";
 import { proxyErrorResponse, withQueryParams } from "@/app/api/_routeProxy";
 
-const MAX_DATASET_PROXY_BYTES = 10 * 1024 * 1024;
-
-async function readFileAsBase64WithLimit(response: Response): Promise<string> {
-  const contentLength = response.headers.get("content-length");
-  if (contentLength) {
-    const size = Number.parseInt(contentLength, 10);
-    if (Number.isFinite(size) && size > MAX_DATASET_PROXY_BYTES) {
-      throw new Error("FILE_TOO_LARGE");
-    }
-  }
-
-  const reader = response.body?.getReader();
-  if (!reader) {
-    throw new Error("FILE_STREAM_UNAVAILABLE");
-  }
-
-  const chunks: Uint8Array[] = [];
-  let totalBytes = 0;
-
-  while (true) {
-    const { done, value } = await reader.read();
-    if (done) break;
-    if (!value) continue;
-
-    totalBytes += value.byteLength;
-    if (totalBytes > MAX_DATASET_PROXY_BYTES) {
-      throw new Error("FILE_TOO_LARGE");
-    }
-    chunks.push(value);
-  }
-
-  return Buffer.concat(chunks).toString("base64");
-}
-
 export async function GET(
   request: NextRequest,
   { params }: { params: Promise<{ dataset_id: string }> },
 ) {
   try {
     const { dataset_id } = await params;
-    const fetchContent =
-      request.nextUrl.searchParams.get("fetch_content") === "true";
+    const limitRows = request.nextUrl.searchParams.get("limit_rows");
 
-    // Always request signed URL when fetch_content is needed
     const backendParams = new URLSearchParams();
-    if (fetchContent) {
-      backendParams.set("fetch_content", "true");
-    }
-    if (fetchContent) {
-      backendParams.set("include_signed_url", "true");
+    if (limitRows) {
+      backendParams.set("limit_rows", limitRows);
     }
     const endpoint = withQueryParams(
       `/api/v1/assessment/datasets/${dataset_id}`,
       backendParams,
     );
 
     const { data, status } = await apiClient(endpoint, {
       method: "GET",
     });
 
-    if (status >= 400) {
-      return NextResponse.json(data, { status });
-    }
-
-    // Download file from S3 server-side and return as base64
-    if (fetchContent) {
-      const signedUrl =
-        (data as { data?: { signed_url?: string }; signed_url?: string })?.data
-          ?.signed_url ||
-        (data as { data?: { signed_url?: string }; signed_url?: string })
-          ?.signed_url;
-
-      if (!signedUrl) {
-        return NextResponse.json(
-          { error: "No signed URL available" },
-          { status: 404 },
-        );
-      }
-
-      const fileResponse = await fetch(signedUrl);
-      if (!fileResponse.ok) {
-        return NextResponse.json(
-          { error: "Failed to fetch file from storage" },
-          { status: 502 },
-        );
-      }
-
-      let base64: string;
-      try {
-        base64 = await readFileAsBase64WithLimit(fileResponse);
-      } catch (error) {
-        if (error instanceof Error && error.message === "FILE_TOO_LARGE") {
-          return NextResponse.json(
-            { error: "File too large" },
-            { status: 413 },
-          );
-        }
-
-        return NextResponse.json(
-          { error: "Failed to read file from storage" },
-          { status: 502 },
-        );
-      }
-
-      return NextResponse.json(
-        { ...(data as Record<string, unknown>), file_content: base64 },
-        { status: 200 },
-      );
-    }
-
     return NextResponse.json(data, { status });
   } catch (error: unknown) {
     return proxyErrorResponse("Assessment dataset details proxy error:", error);
diff --git a/app/components/assessment/ColumnMapperStep.tsx b/app/components/assessment/ColumnMapperStep.tsx
index 41a09a1..0fa075d 100644
--- a/app/components/assessment/ColumnMapperStep.tsx
+++ b/app/components/assessment/ColumnMapperStep.tsx
@@ -158,19 +158,19 @@ export default function ColumnMapperStep({
 [hunk body garbled in extraction: the JSX tags were stripped and the original markup is unrecoverable; the change restyles the wrapper around the `{column}` header cell ahead of the role-option list below]
{ASSESSMENT_ROLE_OPTIONS.map((option) => { const isGroundTruth = option.value === "ground_truth"; const isActive = config.role === option.value; diff --git a/app/components/assessment/DataViewModal.tsx b/app/components/assessment/DataViewModal.tsx index 6e2fd19..a960eb2 100644 --- a/app/components/assessment/DataViewModal.tsx +++ b/app/components/assessment/DataViewModal.tsx @@ -45,14 +45,14 @@ export default function DataViewModal({
 [hunk body garbled in extraction: table JSX stripped; the change restyles the header row built from `{headers.map((header, i) => (` / `{header}`]
@@ -66,8 +66,11 @@ export default function DataViewModal({
 [hunk body garbled in extraction: table JSX stripped; the change adjusts the body-row cells around `{rowIdx + 1}`, `{row.map((cell, cellIdx) => (`, and `{cell || ...}`]
diff --git a/app/components/assessment/DatasetsTab.tsx b/app/components/assessment/DatasetsTab.tsx
index 246ef75..5c05d59 100644
--- a/app/components/assessment/DatasetsTab.tsx
+++ b/app/components/assessment/DatasetsTab.tsx
@@ -7,12 +7,18 @@ import { useToast } from "@/app/components/Toast";
 import { useAuth } from "@/app/lib/context/AuthContext";
 import {
   extractCreatedDataset,
-  fetchAndParseDatasetFile,
+  fetchDatasetPreview,
   handleForbiddenError,
   isAllowedDatasetFile,
 } from "@/app/lib/utils/assessment";
+import { PREVIEW_ROW_LIMIT } from "@/app/lib/assessment/results";
+import {
+  DATASET_SAMPLE_ROW_LIMIT,
+  MAX_DATASET_FILE_BYTES,
+} from "@/app/lib/assessment/constants";
 import type {
   CreateDatasetResponse,
+  DatasetPreview,
   DatasetResponse,
   DatasetsTabProps,
   DatasetViewModalData,
@@ -49,6 +55,9 @@ export default function DatasetsTab({
     useState<DatasetViewModalData | null>(null);
   const [confirmDeleteId, setConfirmDeleteId] = useState<number | null>(null);
   const [deletingId, setDeletingId] = useState<number | null>(null);
+  const [previewCache, setPreviewCache] = useState<
+    Record<string, DatasetPreview>
+  >({});
 
   const loadDatasets = useCallback(async () => {
     if (!isAuthenticated) return;
@@ -91,6 +100,14 @@ export default function DatasetsTab({
       return;
     }
 
+    if (file.size > MAX_DATASET_FILE_BYTES) {
+      toast.error(
+        `File too large. Max ${MAX_DATASET_FILE_BYTES / (1024 * 1024)}MB allowed.`,
+      );
+      event.target.value = "";
+      return;
+    }
+
     setUploadedFile(file);
     if (!datasetName) {
       setDatasetName(file.name.replace(/\.(csv|xlsx|xls)$/i, ""));
@@ -163,7 +180,13 @@ export default function DatasetsTab({
 
     setIsLoadingColumns(true);
     try {
-      const parsed = await fetchAndParseDatasetFile(id, apiKey);
+      const cached = previewCache[id];
+      const parsed =
+        cached ??
+        (await fetchDatasetPreview(id, apiKey, DATASET_SAMPLE_ROW_LIMIT));
+      if (!cached) {
+        setPreviewCache((prev) => ({ ...prev, [id]: parsed }));
+      }
       const firstRow = parsed.rows[0] || [];
       const sampleRow = Object.fromEntries(
         parsed.headers.map((header, index) => [
@@ -188,9 +211,25 @@ export default function DatasetsTab({
   };
 
   const handleViewDataset = async (selectedDatasetId: number, name: string) => {
+    const cacheKey = String(selectedDatasetId);
+    const cached = previewCache[cacheKey];
+    if (cached) {
+      setViewModalData({
+        name,
+        headers: cached.headers,
+        rows: cached.rows,
+      });
+      return;
+    }
+
     setViewingId(selectedDatasetId);
     try {
-      const parsed = await fetchAndParseDatasetFile(selectedDatasetId, apiKey);
+      const parsed = await fetchDatasetPreview(
+        selectedDatasetId,
+        apiKey,
+        PREVIEW_ROW_LIMIT,
+      );
+      setPreviewCache((prev) => ({ ...prev, [cacheKey]: parsed }));
       setViewModalData({
         name,
         headers: parsed.headers,
@@ -235,6 +274,13 @@ export default function DatasetsTab({
     const file = event.dataTransfer.files?.[0];
     if (!file || !isAllowedDatasetFile(file.name)) return;
 
+    if (file.size > MAX_DATASET_FILE_BYTES) {
+      toast.error(
+        `File too large. Max ${MAX_DATASET_FILE_BYTES / (1024 * 1024)}MB allowed.`,
+      );
+      return;
+    }
+
     const dataTransfer = new DataTransfer();
     dataTransfer.items.add(file);
     if (!fileInputRef.current) return;
diff --git a/app/components/assessment/datasets/CreatePanel.tsx b/app/components/assessment/datasets/CreatePanel.tsx
index 976705f..d238b96 100644
--- a/app/components/assessment/datasets/CreatePanel.tsx
+++ b/app/components/assessment/datasets/CreatePanel.tsx
@@ -72,7 +72,7 @@ export default function CreatePanel({
 [hunk body garbled in extraction: JSX tags stripped; a one-line attribute change on a self-closing element]
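
A hedged sketch to accompany the DatasetsTab changes above: the component now calls fetchDatasetPreview instead of fetchAndParseDatasetFile, but the updated helper in app/lib/utils/assessment.ts falls outside this excerpt. Assuming the `{ headers, rows }` shape that DatasetsTab consumes, and that the client hits the rewritten BFF route with `limit_rows`, the helper could look roughly like this (the auth-header name is a guess, not from the patch):

    // Hypothetical sketch: not the patch's actual implementation.
    type DatasetPreview = { headers: string[]; rows: string[][] };

    export async function fetchDatasetPreview(
      datasetId: number | string,
      apiKey: string,
      limitRows: number,
    ): Promise<DatasetPreview> {
      // The rewritten BFF route forwards limit_rows to the backend instead
      // of proxying the whole file back as base64.
      const res = await fetch(
        `/api/assessment/datasets/${datasetId}?limit_rows=${limitRows}`,
        { headers: { "x-api-key": apiKey } }, // header name assumed
      );
      if (!res.ok) throw new Error(`Preview request failed (${res.status})`);
      const body = await res.json();
      // DatasetsTab reads parsed.headers and parsed.rows.
      return { headers: body.headers ?? [], rows: body.rows ?? [] };
    }
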
diff --git a/app/components/assessment/output-schema/OutputSchemaModal.tsx b/app/components/assessment/output-schema/OutputSchemaModal.tsx
 [index line and first hunk header lost in extraction]
+    setSchema(draftSchema);
+    onClose();
+  };
   const handleReset = () => {
     setDraftSchema([createProperty()]);
   };
@@ -52,7 +56,7 @@ export default function OutputSchemaModal({
   return createPortal(
 [remainder garbled in extraction: JSX tags stripped; the stray `{header}` and `{cell || ...}` fragments that followed belong to the DataViewModal hunks above. The excerpt ends here; the diffs for useAssessmentResults.ts, constants.ts, results.ts, types/assessment.ts, and utils/assessment.ts listed in the diffstat, and PATCH 5/5, are not included.]
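
Taken together, the PATCH 1/5 helpers let a settings form derive its provider and model dropdowns, plus default params, entirely from ASSESSMENT_MODEL_CONFIGS. A short usage sketch (the surrounding wiring is illustrative; the four imports are the patch's real exports):

    import {
      PROVIDER_OPTIONS,
      buildDefaultParams,
      getDefaultModelForProvider,
      getModelsByProvider,
    } from "@/app/lib/data/assessmentModels";

    // Pick a provider, then derive its model list.
    const provider = PROVIDER_OPTIONS[1].value; // "google"
    const models = getModelsByProvider(provider);
    // -> [{ value: "gemini-2.0-flash-lite", label: "gemini-2.0-flash-lite" }, ...]

    // The first matching entry doubles as the default selection.
    const model = getDefaultModelForProvider(provider); // "gemini-2.0-flash-lite"

    // Seed editable params from the model's config definition.
    const params = buildDefaultParams("gemini-3.1-pro-preview");
    // -> { temperature: 0.4, thinking_level: "LOW" }
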