agentset-ai · ahmedriad1 · Dec 22, 2025 · Dec 23, 2025 · Dec 23, 2025 · coderabbitai
diff --git a/apps/web/src/app/[hostingId]/(defaultLayout)/search/page.tsx b/apps/web/src/app/[hostingId]/(defaultLayout)/search/page.tsx
@@ -25,8 +25,6 @@ export default function SearchPage() {
     handleExampleClick,
   } = useSearch();
 
-  const allData = data ? data.chunks : null;
-
   if (!searchEnabled) {
     notFound();
   }
@@ -93,31 +91,15 @@ export default function SearchPage() {
           </div>
         ) : (
           <div>
-            <motion.div
-              initial={{ opacity: 0, y: 20 }}
-              animate={{ opacity: 1, y: 0 }}
-              exit={{ opacity: 0, y: 20 }}
-            >
-              <p className="text-sm font-medium">Queries performed:</p>
-              <p className="text-muted-foreground mt-1 text-xs">
-                {data.queries.map((q, idx) => (
-                  <i key={idx}>
-                    {q.query}
-                    {idx !== data.queries.length - 1 ? ", " : ""}
-                  </i>
-                ))}
-              </p>
-            </motion.div>
-
             <motion.div
               className="mt-6 flex w-full flex-col gap-6"
               initial={{ opacity: 0, y: 20 }}
               animate={{ opacity: 1, y: 0 }}
               exit={{ opacity: 0, y: 20 }}
               transition={{ delay: 0.05 * 1 }}
             >
-              {allData!.length > 0 ? (
-                allData!.map((result) => (
+              {data.length > 0 ? (
+                data.map((result) => (
                   <SearchChunk
                     key={result.id}
                     chunk={result}

diff --git a/apps/web/src/app/[hostingId]/(defaultLayout)/search/use-search.ts b/apps/web/src/app/[hostingId]/(defaultLayout)/search/use-search.ts
@@ -31,11 +31,7 @@ export const useSearch = () => {
         | { success: false }
         | {
             success: true;
-            data: {
-              totalQueries: number;
-              queries: { type: "keyword" | "semantic"; query: string }[];
-              chunks: QueryVectorStoreResult["results"];
-            };
+            data: QueryVectorStoreResult["results"];
           };
 
       if (!data.success) {

diff --git a/apps/web/src/app/api/(internal-api)/benchmark/prompts.ts b/apps/web/src/app/api/(internal-api)/benchmark/prompts.ts
@@ -39,25 +39,6 @@ but it is not as concise."
 }
 `;
 
-// export const FAITHFULNESS_REFINE_SYSTEM_PROMPT = prmpt`
-// We want to understand if the following information is present
-// in the context information: ${"query"}
-// We have provided an existing answer: ${"existingAnswer"}
-// We have the opportunity to refine the existing answer
-// (only if needed) with some more context below.
-// ------------
-// ${"context"}
-// ------------
-// If the existing answer was already true, still answer true.
-// If the information is present in the new context, answer true.
-// Otherwise answer false.
-
-// Example Response:
-// {
-// "faithful": true
-// }
-// `;
-
 export const FAITHFULNESS_SYSTEM_PROMPT = prmpt`
 Please tell if a given piece of information is supported by the context.
 
@@ -94,27 +75,6 @@ ${"context"}
 ------------
 `;
 
-// export const RELEVANCY_REFINE_SYSTEM_PROMPT = prmpt`
-// We want to understand if the following query and response is
-// in line with the context information:
-// ${"query"}
-// We have provided an existing answer:
-// ${"existingAnswer"}
-// We have the opportunity to refine the existing answer
-// (only if needed) with some more context below.
-// ------------
-// ${"context"}
-// ------------
-// If the existing answer was already true, still answer true.
-// If the information is present in the new context, answer true.
-// Otherwise answer false.
-
-// Example Response:
-// {
-// "relevant": true
-// }
-// `;
-
 export const RELEVANCY_SYSTEM_PROMPT = prmpt`
 Your task is to evaluate if the response for the query is in line with the context information provided.
 Answer with a JSON object with a single boolean field "relevant".

diff --git a/apps/web/src/app/api/(internal-api)/benchmark/route.ts b/apps/web/src/app/api/(internal-api)/benchmark/route.ts
@@ -4,7 +4,7 @@ import { AgentsetApiError } from "@/lib/api/errors";
 import { withAuthApiHandler } from "@/lib/api/handler";
 import { makeApiSuccessResponse } from "@/lib/api/response";
 import { parseRequestBody } from "@/lib/api/utils";
-import { NEW_MESSAGE_PROMPT } from "@/lib/prompts";
+import { DEFAULT_SYSTEM_PROMPT, NEW_MESSAGE_PROMPT } from "@/lib/prompts";
 import { waitUntil } from "@vercel/functions";
 import { generateText } from "ai";
 
@@ -16,6 +16,7 @@ import {
   getNamespaceVectorStore,
   queryVectorStore,
 } from "@agentset/engine";
+import { DEFAULT_RERANKER } from "@agentset/validation";
 
 import { chatSchema } from "./schema";
 import { correctnessEval, faithfulnessEval, relevanceEval } from "./utils";
@@ -69,41 +70,35 @@ export const POST = withAuthApiHandler(
     };
 
     if (body.mode === "agentic") {
-      result = await generateAgenticResponse({
+      const response = await generateAgenticResponse({
         model: languageModel,
-        systemPrompt: body.systemPrompt,
-        temperature: body.temperature,
-        queryOptions: {
-          embeddingModel,
-          vectorStore,
-          topK: body.topK,
-          minScore: body.minScore,
-          filter: body.filter,
-          includeMetadata: body.includeMetadata,
-          includeRelationships: body.includeRelationships,
-          rerank: body.rerank
-            ? { model: "cohere:rerank-v3.5", limit: body.rerankLimit }
-            : false,
-        },
-        messagesWithoutQuery: [],
-        lastMessage: message,
+        systemPrompt: DEFAULT_SYSTEM_PROMPT.compile(),
+        temperature: 0,
+        embeddingModel,
+        vectorStore,
+        messages: [
+          {
+            role: "user",
+            content: message,
+          },
+        ],
         afterQueries: (totalQueries) => {
           incrementUsage(namespace.id, totalQueries);
         },
       });
+
+      result = {
+        answer: response.text,
+        sources: response.searchResults as QueryVectorStoreResult["results"],
+      };
     } else {
       const data = await queryVectorStore({
         embeddingModel,
         vectorStore,
         query: message,
-        topK: body.topK,
-        minScore: body.minScore,
-        filter: body.filter,
-        includeMetadata: body.includeMetadata,
-        includeRelationships: body.includeRelationships,
-        rerank: body.rerank
-          ? { model: "cohere:rerank-v3.5", limit: body.rerankLimit }
-          : false,
+        topK: 50,
+        includeMetadata: true,
+        rerank: { model: DEFAULT_RERANKER, limit: 15 },
       });
 
       const newMessages: ModelMessage[] = [

diff --git a/apps/web/src/app/api/(internal-api)/benchmark/utils.ts b/apps/web/src/app/api/(internal-api)/benchmark/utils.ts
@@ -1,5 +1,5 @@
 import type { LanguageModel } from "ai";
-import { formatSources } from "@/lib/agentic/utils";
+import { formatSources } from "@/lib/prompts";
 import { generateText } from "ai";
 import { z } from "zod/v4";
 

diff --git a/apps/web/src/app/api/(internal-api)/chat/route.ts b/apps/web/src/app/api/(internal-api)/chat/route.ts
@@ -1,5 +1,5 @@
 import type { ModelMessage } from "ai";
-import agenticPipeline from "@/lib/agentic";
+import { streamAgenticResponse } from "@/lib/agentic";
 import { AgentsetApiError } from "@/lib/api/errors";
 import { withAuthApiHandler } from "@/lib/api/handler";
 import { parseRequestBody } from "@/lib/api/utils";
@@ -145,37 +145,29 @@ export const POST = withAuthApiHandler(
         ? new KeywordStore(namespace.id, tenantId)
         : undefined;
 
-      const result = agenticPipeline({
+      const result = streamAgenticResponse({
         model: languageModel,
         keywordStore,
-        queryOptions: {
-          embeddingModel,
-          vectorStore,
-          topK: body.topK,
-          minScore: body.minScore,
-          filter: body.filter,
-          includeMetadata: body.includeMetadata,
-          includeRelationships: body.includeRelationships,
-          rerank: body.rerank
-            ? {
-                model: body.rerankModel,
-                limit: body.rerankLimit,
-              }
-            : false,
-        },
+        embeddingModel,
+        vectorStore,
+        topK: body.topK,
+        rerank: body.rerank
+          ? {
+              model: body.rerankModel,
+              limit: body.rerankLimit,
+            }
+          : undefined,
         systemPrompt: body.systemPrompt,
         temperature: body.temperature,
-        messagesWithoutQuery,
-        lastMessage,
+        messages,
         afterQueries: (totalQueries) => {
           incrementUsage(namespace.id, totalQueries);
         },
       });
 
-      return result;
+      return result.toUIMessageStreamResponse({ headers });
     }
 
-    // TODO: track the usage
     const data = await queryVectorStore({
       embeddingModel,
       vectorStore,

diff --git a/apps/web/src/app/api/(internal-api)/hosting-chat/route.ts b/apps/web/src/app/api/(internal-api)/hosting-chat/route.ts
@@ -1,10 +1,9 @@
-import agenticPipeline from "@/lib/agentic";
+import { streamAgenticResponse } from "@/lib/agentic";
 import { AgentsetApiError } from "@/lib/api/errors";
 import { withPublicApiHandler } from "@/lib/api/handler/public";
 import { hostingAuth } from "@/lib/api/hosting-auth";
 import { parseRequestBody } from "@/lib/api/utils";
 import { DEFAULT_SYSTEM_PROMPT } from "@/lib/prompts";
-import { extractTextFromParts } from "@/lib/string-utils";
 import { waitUntil } from "@vercel/functions";
 import { convertToModelMessages } from "ai";
 
@@ -75,13 +74,8 @@ export const POST = withPublicApiHandler(
     );
 
     const messages = convertToModelMessages(body.messages);
-    const messagesWithoutQuery = messages.slice(0, -1);
-    const lastMessage =
-      messages.length > 0
-        ? extractTextFromParts(messages[messages.length - 1]!.content)
-        : null;
 
-    if (!lastMessage) {
+    if (messages.length === 0) {
       throw new AgentsetApiError({
         code: "bad_request",
         message: "Messages must contain at least one message",
@@ -116,29 +110,24 @@ export const POST = withPublicApiHandler(
       ? new KeywordStore(hosting.namespace.id)
       : undefined;
 
-    const result = agenticPipeline({
+    const result = streamAgenticResponse({
       model: languageModel,
       keywordStore,
-      queryOptions: {
-        embeddingModel,
-        vectorStore,
-        topK: hosting.topK,
-        rerank: {
-          model: hosting.rerankConfig?.model,
-          limit: hosting.rerankConfig?.limit ?? 15,
-        },
-        includeMetadata: true,
+      embeddingModel,
+      vectorStore,
+      topK: hosting.topK,
+      rerank: {
+        model: hosting.rerankConfig?.model,
+        limit: hosting.rerankConfig?.limit,
       },
-      rerank: {
-        model: hosting.rerankConfig?.model,
-        limit: hosting.rerankConfig?.limit,
-      },
+      rerank: hosting.rerankConfig
+        ? {
+            model: hosting.rerankConfig.model,
+            limit: hosting.rerankConfig.limit,
+          }
+        : undefined,
       systemPrompt: hosting.systemPrompt ?? DEFAULT_SYSTEM_PROMPT.compile(),
       temperature: 0,
-      messagesWithoutQuery,
-      lastMessage,
+      messages,
       afterQueries: (totalQueries) => {
         incrementUsage(hosting.namespace.id, totalQueries);
       },
-      headers,
     });
 
-    return result;
+    return result.toUIMessageStreamResponse({ headers });
   },
 );
diff --git a/apps/web/src/app/api/(internal-api)/hosting-search/route.ts b/apps/web/src/app/api/(internal-api)/hosting-search/route.ts
@@ -1,4 +1,3 @@
-import { agenticSearch } from "@/lib/agentic/search";
 import { AgentsetApiError } from "@/lib/api/errors";
 import { withPublicApiHandler } from "@/lib/api/handler/public";
 import { hostingAuth } from "@/lib/api/hosting-auth";
@@ -9,9 +8,8 @@ import { parseRequestBody } from "@/lib/api/utils";
 import { db } from "@agentset/db/client";
 import {
   getNamespaceEmbeddingModel,
-  getNamespaceLanguageModel,
   getNamespaceVectorStore,
-  KeywordStore,
+  queryVectorStore,
 } from "@agentset/engine";
 
 import { hostingSearchSchema } from "./schema";
@@ -74,44 +72,28 @@ export const POST = withPublicApiHandler(
       });
     }
 
-    const [languageModel, vectorStore, embeddingModel] = await Promise.all([
-      getNamespaceLanguageModel(hosting.llmConfig?.model),
+    const [vectorStore, embeddingModel] = await Promise.all([
       getNamespaceVectorStore(hosting.namespace),
       getNamespaceEmbeddingModel(hosting.namespace, "query"),
     ]);
 
-    const keywordStore = hosting.namespace.keywordEnabled
-      ? new KeywordStore(hosting.namespace.id)
-      : undefined;
-
-    const result = await agenticSearch({
-      model: languageModel,
-      queryOptions: {
-        embeddingModel,
-        vectorStore,
-        topK: hosting.topK,
-        rerank: {
-          model: hosting.rerankConfig?.model,
-          limit: hosting.rerankConfig?.limit ?? 15,
-        },
-        includeMetadata: true,
+    const result = await queryVectorStore({
+      embeddingModel,
+      vectorStore,
+      query: body.query,
+      mode: "semantic",
+      topK: hosting.topK,
+      rerank: {
+        model: hosting.rerankConfig?.model,
+        limit: hosting.rerankConfig?.limit ?? 15,
       },
-      messages: [
-        {
-          role: "user",
-          content: body.query,
-        },
-      ],
+      includeMetadata: true,
     });
 
-    incrementSearchUsage(hosting.namespace.id, result.totalQueries);
+    incrementSearchUsage(hosting.namespace.id, 1);
 
     return makeApiSuccessResponse({
-      data: {
-        totalQueries: result.totalQueries,
-        queries: result.queries,
-        chunks: Object.values(result.chunks),
-      },
+      data: result.results,
       headers,
     });
   },