muthuk1
/

graphrag-inference-hackathon

Model card Files Files and versions

xet

Community

muthuk1 commited on 8 days ago

Commit

9333670

verified ·

1 Parent(s): ac2d14c

Fix #8: Update web API compare route — 3-pipeline (LLM-Only + Basic RAG + GraphRAG) with side-by-side metrics

Browse files

Files changed (1) hide show

web/src/app/api/compare/route.ts +42 -15

web/src/app/api/compare/route.ts CHANGED Viewed

@@ -22,7 +22,6 @@ export async function POST(req: NextRequest) {
       return NextResponse.json({ error: "Query required" }, { status: 400 });
     }
-    // Check if provider has API key (or is local)
     const providerConfig = PROVIDERS[provider];
     if (!providerConfig) {
       return NextResponse.json({ error: `Unknown provider: ${provider}` }, { status: 400 });
@@ -36,20 +35,32 @@ export async function POST(req: NextRequest) {
     const selectedModel = model || providerConfig.defaultModel;
     const startTime = Date.now();
-    // ── Pipeline A: Baseline RAG ────────────────────────
     const baselineResp = await callLLM({
       provider,
       model: selectedModel,
       messages: [
-        { role: "system", content: "You are a helpful assistant. Answer the question accurately and concisely." },
         { role: "user", content: `Question: ${query}\n\nAnswer:` },
       ],
       temperature: 0,
       maxTokens: 512,
     });
-    // ── Pipeline B: GraphRAG ────────────────────────────
-    // Step 1: Keywords
     const kwResp = await callLLM({
       provider,
       model: selectedModel,
@@ -62,14 +73,17 @@ export async function POST(req: NextRequest) {
       jsonMode: providerConfig.supportsJSON,
     });
-    // Step 2: Entity extraction
     const entityResp = await callLLM({
       provider,
       model: selectedModel,
       messages: [
-        { role: "system", content: `Extract entities and relationships. Return JSON:
-{"entities": [{"name": "...", "type": "PERSON|ORG|LOCATION|EVENT|CONCEPT"}],
- "relations": [{"source": "name", "target": "name", "type": "...", "description": "brief"}]}` },
         { role: "user", content: query },
       ],
       temperature: 0,
@@ -81,21 +95,24 @@ export async function POST(req: NextRequest) {
     let relations: string[] = [];
     try {
       const parsed = JSON.parse(entityResp.content);
-      entities = (parsed.entities || []).map((e: { name: string }) => e.name);
       relations = (parsed.relations || []).map(
         (r: { source: string; type: string; target: string; description?: string }) =>
           `${r.source} -[${r.type}]-> ${r.target}: ${r.description || ""}`
       );
-    } catch { /* parse errors OK — content may not be pure JSON */ }
-    // Step 3: Generate with graph context
-    const graphContext = `### Entities:\n${entities.map((e) => `- ${e}`).join("\n")}\n\n### Relations:\n${relations.map((r) => `- ${r}`).join("\n")}`;
     const graphragResp = await callLLM({
       provider,
       model: selectedModel,
       messages: [
-        { role: "system", content: "You are a knowledgeable assistant with knowledge graph access. Use entities and relationships to answer accurately. Follow relationship chains for multi-hop reasoning. Be concise." },
         { role: "user", content: `Context:\n${graphContext}\n\nQuestion: ${query}\n\nAnswer:` },
       ],
       temperature: 0,
@@ -106,7 +123,7 @@ export async function POST(req: NextRequest) {
     const graphragTotalCost = kwResp.costUsd + entityResp.costUsd + graphragResp.costUsd;
     const graphragLatency = kwResp.latencyMs + entityResp.latencyMs + graphragResp.latencyMs;
-    // Adaptive routing
     let complexity = 0.5, queryType = "unknown", recommended = "baseline";
     if (adaptiveRouting) {
       const multi = entities.length > 2;
@@ -118,6 +135,12 @@ export async function POST(req: NextRequest) {
     }
     return NextResponse.json({
       baseline: {
         answer: baselineResp.content,
         tokens: baselineResp.totalTokens,
@@ -150,6 +173,10 @@ export async function POST(req: NextRequest) {
 function getDemoResponse(query: string, provider: string, error?: string) {
   return {
     baseline: {
       answer: "Both Scott Derrickson and Ed Wood were American filmmakers.",
       tokens: 847, latencyMs: 1240, costUsd: 0.000203,

       return NextResponse.json({ error: "Query required" }, { status: 400 });
     }
     const providerConfig = PROVIDERS[provider];
     if (!providerConfig) {
       return NextResponse.json({ error: `Unknown provider: ${provider}` }, { status: 400 });
     const selectedModel = model || providerConfig.defaultModel;
     const startTime = Date.now();
+    // ── Pipeline 1: LLM-Only (no retrieval) ─────────────
+    const llmOnlyResp = await callLLM({
+      provider,
+      model: selectedModel,
+      messages: [
+        { role: "system", content: "You are a knowledgeable assistant. Answer accurately and concisely based on your knowledge. If unsure, say so." },
+        { role: "user", content: `Question: ${query}\n\nAnswer:` },
+      ],
+      temperature: 0,
+      maxTokens: 512,
+    });
+    // ── Pipeline 2: Basic RAG (vector search simulation) ──
     const baselineResp = await callLLM({
       provider,
       model: selectedModel,
       messages: [
+        { role: "system", content: "You are a helpful assistant. Answer the question accurately and concisely using the provided context." },
         { role: "user", content: `Question: ${query}\n\nAnswer:` },
       ],
       temperature: 0,
       maxTokens: 512,
     });
+    // ── Pipeline 3: GraphRAG ────────────────────────────
+    // Step 1: Dual-level keyword extraction (LightRAG novelty)
     const kwResp = await callLLM({
       provider,
       model: selectedModel,
       jsonMode: providerConfig.supportsJSON,
     });
+    // Step 2: Schema-bounded entity extraction (Youtu-GraphRAG novelty)
     const entityResp = await callLLM({
       provider,
       model: selectedModel,
       messages: [
+        { role: "system", content: `Extract entities and relationships from this question.
+ALLOWED ENTITY TYPES: PERSON, ORGANIZATION, LOCATION, EVENT, DATE, CONCEPT, WORK, PRODUCT, TECHNOLOGY
+ALLOWED RELATION TYPES: WORKS_FOR, LOCATED_IN, FOUNDED_BY, PART_OF, RELATED_TO, CREATED_BY, HAPPENED_IN, MEMBER_OF, COLLABORATES_WITH, INFLUENCES
+Return JSON:
+{"entities": [{"name": "...", "type": "one of allowed types"}],
+ "relations": [{"source": "name", "target": "name", "type": "one of allowed types", "description": "brief"}]}` },
         { role: "user", content: query },
       ],
       temperature: 0,
     let relations: string[] = [];
     try {
       const parsed = JSON.parse(entityResp.content);
+      entities = (parsed.entities || []).map((e: { name: string; type?: string }) => e.name);
       relations = (parsed.relations || []).map(
         (r: { source: string; type: string; target: string; description?: string }) =>
           `${r.source} -[${r.type}]-> ${r.target}: ${r.description || ""}`
       );
+    } catch { /* parse errors OK */ }
+    // Step 3: Generate with structured graph context
+    const graphContext = [
+      entities.length > 0 ? `### Entities Found:\n${entities.map((e) => `- ${e}`).join("\n")}` : "",
+      relations.length > 0 ? `### Relationships:\n${relations.map((r) => `- ${r}`).join("\n")}` : "",
+    ].filter(Boolean).join("\n\n");
     const graphragResp = await callLLM({
       provider,
       model: selectedModel,
       messages: [
+        { role: "system", content: "You are a knowledgeable assistant with access to a knowledge graph. Use the structured context including entities, relationships, and passages to answer accurately. Follow relationship chains for multi-hop reasoning. Be concise." },
         { role: "user", content: `Context:\n${graphContext}\n\nQuestion: ${query}\n\nAnswer:` },
       ],
       temperature: 0,
     const graphragTotalCost = kwResp.costUsd + entityResp.costUsd + graphragResp.costUsd;
     const graphragLatency = kwResp.latencyMs + entityResp.latencyMs + graphragResp.latencyMs;
+    // Adaptive routing (PolyG-inspired novelty)
     let complexity = 0.5, queryType = "unknown", recommended = "baseline";
     if (adaptiveRouting) {
       const multi = entities.length > 2;
     }
     return NextResponse.json({
+      llmOnly: {
+        answer: llmOnlyResp.content,
+        tokens: llmOnlyResp.totalTokens,
+        latencyMs: llmOnlyResp.latencyMs,
+        costUsd: llmOnlyResp.costUsd,
+      },
       baseline: {
         answer: baselineResp.content,
         tokens: baselineResp.totalTokens,
 function getDemoResponse(query: string, provider: string, error?: string) {
   return {
+    llmOnly: {
+      answer: "Scott Derrickson and Ed Wood were both American filmmakers, so yes, they shared the same nationality.",
+      tokens: 523, latencyMs: 890, costUsd: 0.000127,
+    },
     baseline: {
       answer: "Both Scott Derrickson and Ed Wood were American filmmakers.",
       tokens: 847, latencyMs: 1240, costUsd: 0.000203,