first commit

2026-06-05 10:25:09 +05:30
commit 0b5715f4b0
10 changed files with 4276 additions and 0 deletions
@@ -0,0 +1 @@
 AZURE_OPENAI_KEY=o20WLCQfubbGTo0SnkS70lefG0tHvdZlzcUGHOPDmww0igy94Up0JQQJ99CEAC77bzfXJ3w3AAAAACOGIUYb
@@ -0,0 +1 @@
 /node_modules
@@ -0,0 +1,723 @@
 require("dotenv").config();
 const crypto = require("crypto");
 const fs = require("fs");
 const path = require("path");
 // ======================
 // SUPPRESS PDF WARNINGS
 // ======================
 // Keep a handle on the real console.warn so every non-filtered warning is
 // still forwarded unchanged.
 const originalWarn = console.warn;
 // Replace console.warn with a filter: string messages containing
 // "UnknownErrorException" or "TT:" are dropped (presumably pdf.js font
 // noise, per the section banner); everything else is passed through.
 console.warn = (message, ...args) => {
   const isSuppressed =
     typeof message === "string" &&
     ["UnknownErrorException", "TT:"].some((marker) =>
       message.includes(marker)
     );
   if (!isSuppressed) {
     originalWarn(message, ...args);
   }
 };
 // ======================
 // PDF.js
 // ======================
 const pdfjsLib = require(
  "pdfjs-dist/legacy/build/pdf.mjs"
 );
 // ======================
 // Transformers
 // ======================
 const {
  pipeline,
 } = require("@xenova/transformers");
 // ======================
 // Qdrant
 // ======================
 const {
  QdrantClient,
 } = require("@qdrant/js-client-rest");
 // ======================
 // QDRANT CONFIG
 // ======================
 // Qdrant connection. The URL and collection name can be overridden with the
 // QDRANT_URL / QDRANT_COLLECTION environment variables (the same names the
 // API server's CONFIG object reads), so the indexer and the server can be
 // pointed at the same store. The fallbacks are the previous hard-coded values.
 const qdrant = new QdrantClient({
   url: process.env.QDRANT_URL || "http://20.40.61.65:6333",
   checkCompatibility: false,
   timeout: 30000,
 });
 const COLLECTION_NAME =
   process.env.QDRANT_COLLECTION || "pdf_rag";
 // Embedding pipeline instance; assigned by loadModel() and read by
 // createEmbedding().
 let embedder;
 // ======================
 // LOAD MODEL
 // ======================
 /**
  * Load the "Xenova/all-MiniLM-L6-v2" feature-extraction pipeline and store
  * it in the module-level `embedder` variable, logging before and after.
  *
  * @returns {Promise<void>} Resolves once `embedder` has been assigned.
  */
 async function loadModel() {
   console.log("⏳ Loading embedding model...");
   const extractor = await pipeline(
     "feature-extraction",
     "Xenova/all-MiniLM-L6-v2"
   );
   embedder = extractor;
   console.log("✅ Embedding model loaded");
 }
 // ======================
 // SMART CHUNKING
 // ======================
 /**
  * Split text into overlapping chunks, preferring to end a chunk right after
  * a period when one is available inside the window.
  *
  * Whitespace runs are collapsed to single spaces first. Chunks of 50
  * characters or fewer (after trimming) are discarded.
  *
  * @param {string} text - Text to split; null/undefined is treated as "".
  * @param {number} [chunkSize=800] - Maximum window size in characters (a
  *   sentence cut may extend it by one character to include the period).
  * @param {number} [overlap=150] - Characters shared between consecutive chunks.
  * @returns {string[]} The chunks, in document order.
  */
 function chunkText(text, chunkSize = 800, overlap = 150) {
   const chunks = [];
   const normalized = String(text ?? "")
     .replace(/\s+/g, " ")
     .trim();
   let start = 0;
   while (start < normalized.length) {
     let end = Math.min(start + chunkSize, normalized.length);
     if (end < normalized.length) {
       const lastPeriod = normalized.lastIndexOf(".", end);
       // Only cut at the period when the resulting chunk is longer than the
       // overlap. Otherwise the next window would start at or before the
       // current one and find the same period again, looping forever.
       if (lastPeriod > start && lastPeriod + 1 - start > overlap) {
         end = lastPeriod + 1;
       }
     }
     const chunk = normalized.slice(start, end).trim();
     if (chunk.length > 50) {
       chunks.push(chunk);
     }
     // Once a chunk reaches the end of the text there is nothing new left;
     // stepping back by `overlap` would only re-emit a suffix of this chunk.
     if (end >= normalized.length) {
       break;
     }
     // Guarantee forward progress even if overlap >= chunkSize.
     start = Math.max(end - overlap, start + 1);
   }
   return chunks;
 }
 // ======================
 // CREATE EMBEDDING
 // ======================
 /**
  * Run the module-level `embedder` on the given text with mean pooling and
  * normalization enabled, and return the result's `data` as a plain array.
  *
  * @param {string} text - Text to embed.
  * @returns {Promise<number[]>} Copy of `output.data` as a regular Array.
  */
 async function createEmbedding(text) {
   const options = {
     pooling: "mean",
     normalize: true,
   };
   const { data } = await embedder(text, options);
   return Array.from(data);
 }
 // ======================
 // CREATE COLLECTION
 // ======================
 /**
  * Ensure the Qdrant collection named by COLLECTION_NAME exists, creating it
  * with 384-dimensional cosine-distance vectors when it does not.
  *
  * Uses an explicit existence check instead of treating any getCollection()
  * failure as "missing": a timeout or connection error now propagates to the
  * caller rather than triggering a misleading create attempt.
  *
  * @returns {Promise<void>}
  * @throws Whatever the Qdrant client throws when the existence check or the
  *   creation request fails.
  */
 async function createCollection() {
   const { exists } = await qdrant.collectionExists(
     COLLECTION_NAME
   );
   if (exists) {
     console.log(
       "ℹ️ Collection already exists"
     );
     return;
   }
   console.log(
     "⏳ Creating collection..."
   );
   await qdrant.createCollection(
     COLLECTION_NAME,
     {
       vectors: {
         // 384 must match the dimensionality of the vectors that are upserted.
         size: 384,
         distance: "Cosine",
       },
     }
   );
   console.log(
     "✅ Collection created"
   );
 }
 // ======================
 // EXTRACT TEXT FROM PDF
 // ======================
 /**
  * Read a PDF from disk and return its text, one line per page.
  *
  * Each page's text items are joined with single spaces and followed by a
  * newline. Any failure is logged and turned into an empty string.
  *
  * @param {string} filePath - Path of the PDF file to read.
  * @returns {Promise<string>} Concatenated page text, or "" on error.
  */
 async function extractTextFromPDF(filePath) {
   try {
     const bytes = new Uint8Array(fs.readFileSync(filePath));
     const pdf = await pdfjsLib.getDocument({ data: bytes }).promise;
     console.log(`📄 Pages: ${pdf.numPages}`);
     const pageTexts = [];
     let pageNumber = 1;
     // Pages are fetched one at a time, in order.
     while (pageNumber <= pdf.numPages) {
       const page = await pdf.getPage(pageNumber);
       const { items } = await page.getTextContent();
       pageTexts.push(items.map(({ str }) => str).join(" "));
       pageNumber += 1;
     }
     return pageTexts.map((pageText) => `${pageText}\n`).join("");
   } catch (error) {
     console.log("❌ PDF extraction error:", error);
     return "";
   }
 }
 // ======================
 // PROCESS PDF
 // ======================
 /**
  * Build a deterministic, UUID-shaped point id from a chunk's coordinates.
  *
  * The id is derived from a SHA-256 hash of file name, page and chunk index,
  * so the same chunk always maps to the same id.
  *
  * @param {string} fileName - Name of the source PDF.
  * @param {number} pageNum - 1-based page number.
  * @param {number} chunkIndex - Chunk counter within the file.
  * @returns {string} 8-4-4-4-12 lowercase hex string.
  */
 function makePointId(fileName, pageNum, chunkIndex) {
   const hex = crypto
     .createHash("sha256")
     .update(`${fileName}::${pageNum}::${chunkIndex}`)
     .digest("hex");
   return [
     hex.slice(0, 8),
     hex.slice(8, 12),
     hex.slice(12, 16),
     hex.slice(16, 20),
     hex.slice(20, 32),
   ].join("-");
 }
 /**
  * Index one PDF: extract each page's text, chunk it, embed every chunk and
  * upsert the resulting points into COLLECTION_NAME in batches of 50.
  *
  * Point ids come from makePointId() instead of
  * Number(`${Date.now()}${index}`). The old numeric id exceeded
  * Number.MAX_SAFE_INTEGER once the index reached four digits and could
  * collide; it also changed on every run, so re-indexing duplicated points.
  * With deterministic ids, re-running on the same file overwrites its points.
  *
  * Errors are logged and swallowed so one bad file does not abort the run.
  *
  * @param {string} filePath - Path of the PDF on disk.
  * @param {string} fileName - Name stored in each point's payload.
  * @returns {Promise<void>}
  */
 async function processPDF(filePath, fileName) {
   try {
     const dataBuffer = fs.readFileSync(filePath);
     const pdf = await pdfjsLib
       .getDocument({
         data: new Uint8Array(dataBuffer),
       })
       .promise;
     console.log(
       `📄 ${fileName} - ${pdf.numPages} pages`
     );
     const batchSize = 50;
     let batchPoints = [];
     // Counts chunks across all pages of this file.
     let globalChunkIndex = 0;
     for (
       let pageNum = 1;
       pageNum <= pdf.numPages;
       pageNum++
     ) {
       console.log(
         `📖 Processing page ${pageNum}/${pdf.numPages}`
       );
       const page =
         await pdf.getPage(pageNum);
       const content =
         await page.getTextContent();
       const pageText =
         content.items
           .map((item) => item.str)
           .join(" ");
       // Skip pages with no extractable text.
       if (
         !pageText ||
         pageText.trim().length === 0
       ) {
         continue;
       }
       const chunks = chunkText(
         pageText,
         1200,
         250
       );
       for (const chunk of chunks) {
         const embedding =
           await createEmbedding(chunk);
         batchPoints.push({
           id: makePointId(
             fileName,
             pageNum,
             globalChunkIndex
           ),
           vector: embedding,
           payload: {
             file: fileName,
             page: pageNum,
             chunk: globalChunkIndex,
             text: chunk,
             created_at:
               new Date().toISOString(),
           },
         });
         globalChunkIndex++;
         // Flush a full batch before accumulating more points.
         if (
           batchPoints.length >= batchSize
         ) {
           console.log(
             `⬆️ Uploading ${batchPoints.length} vectors`
           );
           await qdrant.upsert(
             COLLECTION_NAME,
             {
               wait: true,
               points: batchPoints,
             }
           );
           batchPoints = [];
         }
       }
     }
     // Upload whatever is left over after the last full batch.
     if (batchPoints.length > 0) {
       console.log(
         `⬆️ Uploading final ${batchPoints.length} vectors`
       );
       await qdrant.upsert(
         COLLECTION_NAME,
         {
           wait: true,
           points: batchPoints,
         }
       );
     }
     console.log(
       `✅ ${fileName} indexed successfully`
     );
   } catch (error) {
     console.log(
       `❌ Error processing ${fileName}:`,
       error
     );
   }
 }
 // ======================
 // MAIN
 // ======================
 /**
  * Entry point: load the embedding model, ensure the collection exists, then
  * index every PDF found in the "uploads" folder next to this script, one
  * file at a time.
  *
  * The extension check is case-insensitive, so files such as "REPORT.PDF"
  * are no longer silently skipped. Any error is logged rather than rethrown.
  *
  * @returns {Promise<void>}
  */
 async function main() {
   try {
     await loadModel();
     await createCollection();
     const folder = path.join(__dirname, "uploads");
     if (!fs.existsSync(folder)) {
       console.log(
         "❌ uploads folder not found"
       );
       return;
     }
     const files = fs
       .readdirSync(folder)
       .filter((file) =>
         file.toLowerCase().endsWith(".pdf")
       );
     if (files.length === 0) {
       console.log(
         "⚠️ No PDFs found"
       );
       return;
     }
     console.log(
       `📚 Found ${files.length} PDFs`
     );
     // Files are processed sequentially, not in parallel.
     for (const file of files) {
       const filePath = path.join(folder, file);
       console.log(
         `\n📄 Processing ${file}`
       );
       await processPDF(filePath, file);
     }
     console.log(
       "\n🎉 All PDFs indexed successfully"
     );
   } catch (err) {
     console.error(
       "❌ MAIN ERROR:",
       err
     );
   }
 }
 main();
 // require("dotenv").config();
 // const fs = require("fs");
 // const path = require("path");
 // const crypto = require("crypto");
 // // ─── Suppress PDF warnings ────────────────────────────────────────────────────
 // const _warn = console.warn;
 // console.warn = (msg, ...a) => {
 //   if (typeof msg === "string" && (msg.includes("UnknownErrorException") || msg.includes("TT:"))) return;
 //   _warn(msg, ...a);
 // };
 // const pdfjsLib = require("pdfjs-dist/legacy/build/pdf.mjs");
 // const { pipeline } = require("@xenova/transformers");
 // const { QdrantClient } = require("@qdrant/js-client-rest");
 // // ─── Config ───────────────────────────────────────────────────────────────────
 // const QDRANT_URL       = process.env.QDRANT_URL || "http://20.40.61.65:6333";
 // const COLLECTION_NAME  = "pdf_rag";
 // const VECTOR_SIZE      = 384;
 // const CHUNK_SIZE       = 1200;
 // const CHUNK_OVERLAP    = 250;
 // const BATCH_SIZE       = 100;       // points per upsert call
 // const EMBED_CONCURRENCY = 8;        // parallel embeddings at once
 // const MAX_RETRIES      = 3;
 // const qdrant = new QdrantClient({ url: QDRANT_URL, checkCompatibility: false, timeout: 60000 });
 // let embedder;
 // // ─── Semaphore ─────────────────────────────────────────────────────────────────
 // class Semaphore {
 //   constructor(n) { this.n = n; this.queue = []; }
 //   acquire() {
 //     return new Promise(res => {
 //       if (this.n > 0) { this.n--; res(); }
 //       else this.queue.push(res);
 //     });
 //   }
 //   release() {
 //     if (this.queue.length) this.queue.shift()();
 //     else this.n++;
 //   }
 // }
 // // ─── Retry helper ─────────────────────────────────────────────────────────────
 // async function withRetry(fn, retries = MAX_RETRIES, delay = 500) {
 //   for (let i = 0; i <= retries; i++) {
 //     try { return await fn(); }
 //     catch (err) {
 //       if (i === retries) throw err;
 //       console.warn(`  ⚠️  Retry ${i + 1}/${retries} after error: ${err.message}`);
 //       await new Promise(r => setTimeout(r, delay * 2 ** i));
 //     }
 //   }
 // }
 // // ─── Deterministic UUID from content hash ────────────────────────────────────
 // // Prevents duplicates if you re-run indexing on the same file
 // function makePointId(fileName, page, chunkIndex) {
 //   const hash = crypto
 //     .createHash("sha256")
 //     .update(`${fileName}::${page}::${chunkIndex}`)
 //     .digest("hex");
 //   // Qdrant supports UUID strings or unsigned ints; use hex slice as UUID-like string
 //   return `${hash.slice(0,8)}-${hash.slice(8,12)}-${hash.slice(12,16)}-${hash.slice(16,20)}-${hash.slice(20,32)}`;
 // }
 // // ─── Chunking ─────────────────────────────────────────────────────────────────
 // function chunkText(text, size = CHUNK_SIZE, overlap = CHUNK_OVERLAP) {
 //   const chunks = [];
 //   text = text.replace(/\s+/g, " ").trim();
 //   let start = 0;
 //   while (start < text.length) {
 //     let end = start + size;
 //     if (end < text.length) {
 //       const last = text.lastIndexOf(".", end);
 //       if (last > start) end = last + 1;
 //     }
 //     const chunk = text.slice(start, end).trim();
 //     if (chunk.length > 50) chunks.push(chunk);
 //     start = end - overlap;
 //   }
 //   return chunks;
 // }
 // // ─── Embedding ────────────────────────────────────────────────────────────────
 // async function embed(text) {
 //   const out = await embedder(text, { pooling: "mean", normalize: true });
 //   return Array.from(out.data);
 // }
 // // Embed multiple texts with bounded parallelism
 // async function embedBatch(texts) {
 //   const sem = new Semaphore(EMBED_CONCURRENCY);
 //   return Promise.all(
 //     texts.map(async (text) => {
 //       await sem.acquire();
 //       try { return await embed(text); }
 //       finally { sem.release(); }
 //     })
 //   );
 // }
 // // ─── Qdrant helpers ───────────────────────────────────────────────────────────
 // async function ensureCollection() {
 //   try {
 //     await qdrant.getCollection(COLLECTION_NAME);
 //     console.log("ℹ️  Collection already exists");
 //   } catch {
 //     console.log("⏳ Creating collection...");
 //     await qdrant.createCollection(COLLECTION_NAME, {
 //       vectors: { size: VECTOR_SIZE, distance: "Cosine" },
 //       // Optimizers: tune for bulk ingest speed, re-enable indexing after
 //       optimizers_config: { indexing_threshold: 0 },
 //     });
 //     console.log("✅ Collection created");
 //   }
 // }
 // // Upload a batch with retry
 // async function upsertBatch(points) {
 //   await withRetry(() =>
 //     qdrant.upsert(COLLECTION_NAME, { wait: true, points })
 //   );
 // }
 // // After bulk ingest, re-enable HNSW indexing
 // async function enableIndexing() {
 //   await qdrant.updateCollection(COLLECTION_NAME, {
 //     optimizers_config: { indexing_threshold: 20000 },
 //   });
 //   console.log("🔧 HNSW indexing re-enabled");
 // }
 // // ─── Check if file already indexed ───────────────────────────────────────────
 // async function isFileIndexed(fileName) {
 //   try {
 //     const result = await qdrant.scroll(COLLECTION_NAME, {
 //       filter: { must: [{ key: "file", match: { value: fileName } }] },
 //       limit: 1,
 //       with_payload: false,
 //       with_vector: false,
 //     });
 //     return result.points.length > 0;
 //   } catch { return false; }
 // }
 // // ─── Process a single PDF ─────────────────────────────────────────────────────
 // async function processPDF(filePath, fileName) {
 //   console.log(`\n📄 ${fileName}`);
 //   if (await isFileIndexed(fileName)) {
 //     console.log(`  ⏭️  Already indexed — skipping`);
 //     return;
 //   }
 //   const pdf = await pdfjsLib
 //     .getDocument({ data: new Uint8Array(fs.readFileSync(filePath)) })
 //     .promise;
 //   console.log(`  📖 ${pdf.numPages} pages`);
 //   const allChunks = []; // { text, page, chunkIndex }
 //   // 1️⃣  Extract all text first (fast, sequential is fine for I/O)
 //   for (let p = 1; p <= pdf.numPages; p++) {
 //     const page    = await pdf.getPage(p);
 //     const content = await page.getTextContent();
 //     const text    = content.items.map(i => i.str).join(" ");
 //     if (!text.trim()) continue;
 //     const chunks = chunkText(text);
 //     chunks.forEach((chunk, ci) => allChunks.push({ text: chunk, page: p, chunkIndex: allChunks.length }));
 //   }
 //   console.log(`  🧩 ${allChunks.length} chunks — embedding with concurrency=${EMBED_CONCURRENCY}`);
 //   // 2️⃣  Embed all chunks in parallel (bounded by semaphore)
 //   const start = Date.now();
 //   const vectors = await embedBatch(allChunks.map(c => c.text));
 //   const elapsed = ((Date.now() - start) / 1000).toFixed(1);
 //   console.log(`  ⚡ Embedding done in ${elapsed}s`);
 //   // 3️⃣  Build points
 //   const points = allChunks.map((c, i) => ({
 //     id:      makePointId(fileName, c.page, c.chunkIndex),
 //     vector:  vectors[i],
 //     payload: {
 //       file:       fileName,
 //       page:       c.page,
 //       chunk:      c.chunkIndex,
 //       text:       c.text,
 //       created_at: new Date().toISOString(),
 //     },
 //   }));
 //   // 4️⃣  Batch upsert with progress
 //   let uploaded = 0;
 //   for (let i = 0; i < points.length; i += BATCH_SIZE) {
 //     const batch = points.slice(i, i + BATCH_SIZE);
 //     await upsertBatch(batch);
 //     uploaded += batch.length;
 //     process.stdout.write(`\r  ⬆️  ${uploaded}/${points.length} vectors uploaded`);
 //   }
 //   console.log(`\n  ✅ ${fileName} indexed`);
 // }
 // // ─── Main ─────────────────────────────────────────────────────────────────────
 // async function main() {
 //   console.log("⏳ Loading embedding model...");
 //   embedder = await pipeline("feature-extraction", "Xenova/all-MiniLM-L6-v2");
 //   console.log("✅ Model loaded\n");
 //   await ensureCollection();
 //   const folder = path.join(__dirname, "uploads");
 //   if (!fs.existsSync(folder)) return console.log("❌ uploads/ folder not found");
 //   const pdfs = fs.readdirSync(folder).filter(f => f.endsWith(".pdf"));
 //   if (!pdfs.length) return console.log("⚠️  No PDFs found");
 //   console.log(`📚 Found ${pdfs.length} PDF(s)\n`);
 //   const t0 = Date.now();
 //   for (const file of pdfs) {
 //     await processPDF(path.join(folder, file), file);
 //   }
 //   await enableIndexing(); // re-enable HNSW after bulk load
 //   console.log(`\n🎉 Done in ${((Date.now() - t0) / 1000).toFixed(1)}s`);
 // }
 // main().catch(err => { console.error("❌ Fatal:", err); process.exit(1); });
@@ -0,0 +1,28 @@
 {
  "name": "server",
  "version": "1.0.0",
  "description": "",
  "main": "index.js",
  "scripts": {
    "test": "echo \"Error: no test specified\" && exit 1",
    "start": "nodemon server.js"
  },
  "keywords": [],
  "author": "",
  "license": "ISC",
  "type": "commonjs",
  "dependencies": {
    "@qdrant/js-client-rest": "^1.18.0",
    "@xenova/transformers": "^2.17.2",
    "axios": "^1.16.0",
    "cors": "^2.8.6",
    "dotenv": "^17.4.2",
    "express": "^5.2.1",
    "multer": "^2.1.1",
    "ollama": "^0.6.3",
    "openai": "^6.42.0",
    "pdf2pic": "^3.2.0",
    "pdfjs-dist": "^5.7.284",
    "tesseract.js": "^7.0.0"
  }
 }
@@ -0,0 +1,958 @@
 // // 
 // require("dotenv").config();
 // const express = require("express");
 // const cors = require("cors");
 // const OpenAI = require("openai");
 // const {
 //   pipeline,
 // } = require("@xenova/transformers");
 // const {
 //   QdrantClient,
 // } = require("@qdrant/js-client-rest");
 // const app = express();
 // app.use(cors());
 // app.use(express.json());
 // // ======================
 // // AZURE OPENAI
 // // ======================
 // const azureEndpoint =
 //   "https://cpmindiayoda-resource.services.ai.azure.com";
 // const deploymentName = "gpt-4o-mini";
 // const apiVersion =
 //   "2024-08-01-preview";
 // const llm = new OpenAI({
 //   baseURL:
 //     `${azureEndpoint}/openai/deployments/${deploymentName}`,
 //   apiKey:
 //     process.env.AZURE_OPENAI_KEY,
 //   defaultHeaders: {
 //     "api-key":
 //       process.env.AZURE_OPENAI_KEY,
 //   },
 //   defaultQuery: {
 //     "api-version":
 //       apiVersion,
 //   },
 // });
 // // ======================
 // // QDRANT
 // // ======================
 // const qdrant = new QdrantClient({
 //   url: "http://20.40.61.65:6333",
 //   checkCompatibility: false,
 //   timeout: 30000,
 // });
 // const COLLECTION_NAME =
 //   "pdf_rag";
 // let embedder;
 // // ======================
 // // LOAD EMBEDDING MODEL
 // // ======================
 // async function loadModel() {
 //   console.log(
 //     "Loading MiniLM model..."
 //   );
 //   embedder = await pipeline(
 //     "feature-extraction",
 //     "Xenova/all-MiniLM-L6-v2"
 //   );
 //   console.log(
 //     "Embedding model loaded"
 //   );
 // }
 // // ======================
 // // EMBEDDING
 // // ======================
 // async function createEmbedding(
 //   text
 // ) {
 //   const output =
 //     await embedder(text, {
 //       pooling: "mean",
 //       normalize: true,
 //     });
 //   return Array.from(output.data);
 // }
 // // ======================
 // // HEALTH
 // // ======================
 // app.get("/", (req, res) => {
 //   res.json({
 //     success: true,
 //     message:
 //       "Qdrant + Azure GPT RAG Running",
 //   });
 // });
 // // ======================
 // // ASK API
 // // ======================
 // app.post(
 //   "/ask",
 //   async (req, res) => {
 //     try {
 //       const { question } =
 //         req.body;
 //       if (!question) {
 //         return res
 //           .status(400)
 //           .json({
 //             success: false,
 //             error:
 //               "Question is required",
 //           });
 //       }
 //       console.log(
 //         "Question:",
 //         question
 //       );
 //       // ======================
 //       // CREATE EMBEDDING
 //       // ======================
 //       const embedding =
 //         await createEmbedding(
 //           question
 //         );
 //       // ======================
 //       // SEARCH QDRANT
 //       // ======================
 //       const searchResult =
 //         await qdrant.search(
 //           COLLECTION_NAME,
 //           {
 //             vector: embedding,
 //             limit: 20,
 //           }
 //         );
 //       const filteredResults = searchResult.filter(
 //         item => item.score >= 0.10
 //       );
 //       console.log(
 //         "Results:",
 //         filteredResults.length,
 //       );
 //       if (
 //         !filteredResults.length
 //       ) {
 //         return res.json({
 //           success: true,
 //           answer:
 //             "No relevant information found.",
 //           sources: [],
 //         });
 //       }
 //       // ======================
 //       // CONTEXT
 //       // ======================
 //       const context =
 //         filteredResults 
 //           .map(
 //             (item, index) => `
 // Result ${index + 1}
 // File:
 // ${item.payload?.file || ""}
 // Content:
 // ${item.payload?.text || ""}
 // `
 //           )
 //           .join("\n\n");
 //       // ======================
 //       // GPT CALL
 //       // ======================
 //       const completion =
 //         await llm.chat.completions.create(
 //           {
 //             model:
 //               deploymentName,
 //             temperature: 0,
 //             messages: [
 //               {
 //                 role: "system",
 //                 content: `
 // You are CPM AI Assistant.
 // Rules:
 // - Answer ONLY from the provided context.
 // - If information is not found, say:
 //   "❌ I could not find this information in the uploaded documents."
 // Response Style:
 // - Use emojis where appropriate.
 // - Use markdown formatting.
 // - Use headings.
 // - Use bullet points.
 // - Make answers professional and easy to read.
 // - Highlight important information using **bold** text.
 // - Never mention the context or document chunks.
 // Example Format:
 // # 📋 Dress Code Policy
 // ## 🎯 Overview
 // Brief summary here.
 // ## ✅ Key Points
 // • Point 1
 // • Point 2
 // • Point 3
 // ## ⚠️ Important Notes
 // • Note 1
 // • Note 2
 // ## 📝 Conclusion
 // Short conclusion.
 // `,
 //               },
 //               {
 //                 role: "user",
 //                 content: `
 // Context:
 // ${context}
 // Question:
 // ${question}
 // `,
 //               },
 //             ]
 //           }
 //         );
 //       const answer =
 //         completion.choices[0]
 //           .message.content;
 //       return res.json({
 //         success: true,
 //         question,
 //         answer,
 //         sources:
 //           filteredResults.map(
 //             (item) => ({
 //               score:
 //                 item.score,
 //               file:
 //                 item.payload
 //                   ?.file,
 //               chunk:
 //                 item.payload
 //                   ?.chunk,
 //             })
 //           ),
 //       });
 //     } catch (error) {
 //       console.error(
 //         "ERROR:",
 //         error
 //       );
 //       return res
 //         .status(500)
 //         .json({
 //           success: false,
 //           error:
 //             error.message,
 //         });
 //     }
 //   }
 // );
 // // ======================
 // // START SERVER
 // // ======================
 // async function startServer() {
 //   try {
 //     await loadModel();
 //     app.listen(
 //       process.env.PORT ||
 //       5000,
 //       () => {
 //         console.log(
 //           "Server running on port",
 //           process.env.PORT ||
 //           5000
 //         );
 //       }
 //     );
 //   } catch (error) {
 //     console.error(
 //       "Startup Error:",
 //       error
 //     );
 //   }
 // }
 // startServer();
 // require("dotenv").config();
 // const express = require("express");
 // const cors = require("cors");
 // const OpenAI = require("openai");
 // const { pipeline } = require("@xenova/transformers");
 // const { QdrantClient } = require("@qdrant/js-client-rest");
 // // ─── Config ───────────────────────────────────────────────────────────────────
 // const CONFIG = {
 //   azure: {
 //     endpoint:   process.env.AZURE_OPENAI_ENDPOINT || "https://cpmindiayoda-resource.services.ai.azure.com",
 //     deployment: process.env.AZURE_DEPLOYMENT       || "gpt-4o-mini",
 //     apiVersion: process.env.AZURE_API_VERSION      || "2024-08-01-preview",
 //     apiKey:     process.env.AZURE_OPENAI_KEY,
 //   },
 //   qdrant: {
 //     url:        process.env.QDRANT_URL             || "http://20.40.61.65:6333",
 //     collection: process.env.QDRANT_COLLECTION      || "pdf_rag",
 //   },
 //   search: {
 //     topK:           20,
 //     minScore:       0.10,
 //     maxContextDocs: 10,
 //   },
 //   port: process.env.PORT || 5000,
 // };
 // // ─── Clients ──────────────────────────────────────────────────────────────────
 // const llm = new OpenAI({
 //   baseURL: `${CONFIG.azure.endpoint}/openai/deployments/${CONFIG.azure.deployment}`,
 //   apiKey:  CONFIG.azure.apiKey,
 //   defaultHeaders: { "api-key": CONFIG.azure.apiKey },
 //   defaultQuery:   { "api-version": CONFIG.azure.apiVersion },
 // });
 // const qdrant = new QdrantClient({
 //   url:                CONFIG.qdrant.url,
 //   checkCompatibility: false,
 //   timeout:            30000,
 // });
 // // ─── Embedding model (singleton, lazy-init) ───────────────────────────────────
 // let _embedder = null;
 // async function getEmbedder() {
 //   if (!_embedder) {
 //     console.log("⏳ Loading MiniLM model...");
 //     _embedder = await pipeline("feature-extraction", "Xenova/all-MiniLM-L6-v2");
 //     console.log("✅ Embedding model ready");
 //   }
 //   return _embedder;
 // }
 // async function createEmbedding(text) {
 //   const model = await getEmbedder();
 //   const out = await model(text, { pooling: "mean", normalize: true });
 //   return Array.from(out.data);
 // }
 // // ─── Qdrant search ────────────────────────────────────────────────────────────
 // async function searchQdrant(embedding, { topK, minScore, maxContextDocs } = CONFIG.search) {
 //   const results = await qdrant.search(CONFIG.qdrant.collection, {
 //     vector:      embedding,
 //     limit:       topK,
 //     with_payload: true,
 //     score_threshold: minScore, // let Qdrant filter — faster than client-side
 //   });
 //   // Re-rank by score, cap to maxContextDocs
 //   return results
 //     .sort((a, b) => b.score - a.score)
 //     .slice(0, maxContextDocs);
 // }
 // // ─── Build LLM context string ─────────────────────────────────────────────────
 // function buildContext(results) {
 //   return results
 //     .map((item, i) =>
 //       `[${i + 1}] File: ${item.payload?.file ?? "unknown"} | Page: ${item.payload?.page ?? "?"}\n${item.payload?.text ?? ""}`
 //     )
 //     .join("\n\n---\n\n");
 // }
 // // ─── LLM call ─────────────────────────────────────────────────────────────────
 // const SYSTEM_PROMPT = `
 // You are CPM AI Assistant.
 // Rules:
 // - Answer only from the provided information.
 // - If the answer is not available, reply exactly:
 //   "❌ I could not find this information in the uploaded documents."
 // - Do not make up information.
 // - Do not mention documents, context, or chunks.
 // Response Style:
 // - Use simple English.
 // - Keep answers short and clear.
 // - Use headings and bullet points.
 // - Highlight important words in **bold**.
 // - Use emojis in headings.
 // Format:
 // # 📋 Topic
 // ## 🎯 Summary
 // Short answer in 1-2 sentences.
 // ## ✅ Details
 // - Point 1
 // - Point 2
 // - Point 3
 // ## ⚠️ Notes
 // - Extra information (if available).
 // `.trim();
 // async function askLLM(question, context) {
 //   const completion = await llm.chat.completions.create({
 //     model:       CONFIG.azure.deployment,
 //     temperature: 0,
 //     max_tokens:  1500,
 //     messages: [
 //       { role: "system", content: SYSTEM_PROMPT },
 //       { role: "user",   content: `Context:\n${context}\n\nQuestion:\n${question}` },
 //     ],
 //   });
 //   return completion.choices[0].message.content;
 // }
 // // ─── Express app ──────────────────────────────────────────────────────────────
 // const app = express();
 // app.use(cors());
 // app.use(express.json({ limit: "1mb" }));
 // // Request logger middleware
 // app.use((req, _res, next) => {
 //   console.log(`→ ${req.method} ${req.path}`);
 //   next();
 // });
 // // ─── Routes ───────────────────────────────────────────────────────────────────
 // app.get("/health", (_req, res) => {
 //   res.json({ status: "ok", model: CONFIG.azure.deployment, collection: CONFIG.qdrant.collection });
 // });
 // app.post("/ask", async (req, res) => {
 //   const { question } = req.body ?? {};
 //   if (!question?.trim()) {
 //     return res.status(400).json({ success: false, error: "question is required" });
 //   }
 //   const t0 = Date.now();
 //   try {
 //     // 1. Embed question
 //     const embedding = await createEmbedding(question.trim());
 //     // 2. Semantic search
 //     const results = await searchQdrant(embedding);
 //     if (!results.length) {
 //       return res.json({
 //         success: true,
 //         question,
 //         answer:  "❌ I could not find this information in the uploaded documents.",
 //         sources: [],
 //         ms:      Date.now() - t0,
 //       });
 //     }
 //     // 3. Build context + call LLM
 //     const context = buildContext(results);
 //     const answer  = await askLLM(question, context);
 //     return res.json({
 //       success: true,
 //       question,
 //       answer,
 //       sources: results.map(r => ({
 //         score: +r.score.toFixed(4),
 //         file:  r.payload?.file,
 //         page:  r.payload?.page,
 //         chunk: r.payload?.chunk,
 //       })),
 //       ms: Date.now() - t0,
 //     });
 //   } catch (err) {
 //     console.error("❌ /ask error:", err);
 //     return res.status(500).json({ success: false, error: err.message });
 //   }
 // });
 // app.post("/ask/stream", async (req, res) => {
 //   const { question } = req.body ?? {};
 //   if (!question?.trim()) {
 //     return res.status(400).json({ success: false, error: "question is required" });
 //   }
 //   // ── SSE headers ────────────────────────────────────────────────────────────
 //   res.setHeader("Content-Type",  "text/event-stream");
 //   res.setHeader("Cache-Control", "no-cache");
 //   res.setHeader("Connection",    "keep-alive");
 //   res.flushHeaders(); // send headers immediately
 //   const send = (event, data) => res.write(`event: ${event}\ndata: ${JSON.stringify(data)}\n\n`);
 //   try {
 //     // 1. Embed
 //     send("status", { message: "🔍 Searching documents..." });
 //     const embedding = await createEmbedding(question.trim());
 //     // 2. Search Qdrant
 //     const results = await searchQdrant(embedding);
 //     if (!results.length) {
 //       send("token",  { token: "❌ I could not find this information in the uploaded documents." });
 //       send("done",   { sources: [] });
 //       return res.end();
 //     }
 //     // 3. Send sources early so UI can show them while streaming answer
 //     const sources = results.map(r => ({
 //       score: +r.score.toFixed(4),
 //       file:  r.payload?.file,
 //       page:  r.payload?.page,
 //       chunk: r.payload?.chunk,
 //     }));
 //     send("sources", { sources });
 //     // 4. Stream LLM tokens
 //     send("status", { message: "💬 Generating answer..." });
 //     const context = buildContext(results);
 //     const stream  = await llm.chat.completions.create({
 //       model:       CONFIG.azure.deployment,
 //       temperature: 0,
 //       max_tokens:  1500,
 //       stream:      true,   // ← key change
 //       messages: [
 //         { role: "system", content: SYSTEM_PROMPT },
 //         { role: "user",   content: `Context:\n${context}\n\nQuestion:\n${question}` },
 //       ],
 //     });
 //     for await (const chunk of stream) {
 //       const token = chunk.choices[0]?.delta?.content ?? "";
 //       if (token) send("token", { token });
 //     }
 //     send("done", { sources });
 //   } catch (err) {
 //     console.error("❌ /ask/stream error:", err);
 //     send("error", { error: err.message });
 //   }
 //   res.end();
 // });
 // app.use((_req, res) => res.status(404).json({ success: false, error: "Not found" }));
 // // ─── Start ────────────────────────────────────────────────────────────────────
 // async function start() {
 //   await getEmbedder();
 //   app.listen(CONFIG.port, () => {
 //     console.log(`Server running on port ${CONFIG.port}`);
 //   });
 // }
 // start().catch(err => {
 //   console.error("Fatal startup error:", err);
 //   process.exit(1);
 // });
 require("dotenv").config();
 const express = require("express");
 const cors = require("cors");
 const OpenAI = require("openai");
 const { pipeline } = require("@xenova/transformers");
 const { QdrantClient } = require("@qdrant/js-client-rest");
 // ─── Config ───────────────────────────────────────────────────────────────────
 // Central runtime configuration, resolved once when the module loads.
 // Every environment-backed value falls back to its literal default when the
 // variable is unset or empty; the API key deliberately has no fallback.
 const CONFIG = (() => {
  const env = process.env;

  // Azure OpenAI connection settings.
  const azure = {
    endpoint:   env.AZURE_OPENAI_ENDPOINT || "https://cpmindiayoda-resource.services.ai.azure.com",
    deployment: env.AZURE_DEPLOYMENT || "gpt-4o-mini",
    apiVersion: env.AZURE_API_VERSION || "2024-08-01-preview",
    apiKey:     env.AZURE_OPENAI_KEY,
  };

  // Qdrant server location and the collection that is searched.
  const vectorStore = {
    url:        env.QDRANT_URL || "http://20.40.61.65:6333",
    collection: env.QDRANT_COLLECTION || "pdf_rag",
  };

  // Retrieval tuning: hits requested, score threshold, hits kept for the prompt.
  const search = {
    topK:           20,
    minScore:       0.10,
    maxContextDocs: 10,
  };

  return {
    azure,
    qdrant: vectorStore,
    search,
    port: env.PORT || 5000,
  };
 })();
 // ─── Clients ──────────────────────────────────────────────────────────────────
 // Chat-completion client built on the generic OpenAI SDK. The base URL points
 // at the configured deployment path, and every request carries the key in an
 // `api-key` header plus the API version as an `api-version` query parameter.
 const llm = (() => {
  const { endpoint, deployment, apiVersion, apiKey } = CONFIG.azure;
  return new OpenAI({
    apiKey,
    baseURL:        `${endpoint}/openai/deployments/${deployment}`,
    defaultQuery:   { "api-version": apiVersion },
    defaultHeaders: { "api-key": apiKey },
  });
 })();
 // Vector-store client used by searchQdrant().
 // NOTE(review): timeout is presumably in milliseconds (30 s), and
 // checkCompatibility: false presumably skips the client/server version
 // check on connect; confirm both against the client docs.
 const qdrant = new QdrantClient({
  timeout:            30_000,
  checkCompatibility: false,
  url:                CONFIG.qdrant.url,
 });
 // ─── Embedding model (singleton, lazy-init) ───────────────────────────────────
 // Loaded embedding pipeline; null until the first successful load.
 let _embedder = null;
 // In-flight load shared by concurrent callers; null when no load is running.
 let _embedderLoading = null;
 /**
  * Returns the MiniLM feature-extraction pipeline, loading it on first use.
  *
  * Callers that arrive while the model is still loading share the same
  * in-flight promise, so the model is loaded only once. A failed load is
  * forgotten so that the next call retries instead of replaying the error.
  *
  * @returns {Promise<Function>} the pipeline returned by `pipeline(...)`.
  * @throws whatever `pipeline(...)` rejects with when the load fails.
  */
 async function getEmbedder() {
  if (_embedder) {
    return _embedder;
  }
  if (!_embedderLoading) {
    console.log("⏳ Loading MiniLM model...");
    _embedderLoading = (async () => {
      const model = await pipeline("feature-extraction", "Xenova/all-MiniLM-L6-v2");
      _embedder = model;
      console.log("✅ Embedding model ready");
      return model;
    })();
    // Clear the shared promise on failure; awaiting callers still see the rejection.
    _embedderLoading.catch(() => {
      _embedderLoading = null;
    });
  }
  return _embedderLoading;
 }
 /**
  * Embeds a piece of text with the shared embedding pipeline.
  *
  * The pipeline is invoked with mean pooling and normalization enabled, and
  * the `data` of its output is copied into a plain array.
  *
  * @param {string} text - text to embed.
  * @returns {Promise<number[]>} the embedding as a plain array of numbers.
  */
 async function createEmbedding(text) {
  const embed = await getEmbedder();
  const { data } = await embed(text, { normalize: true, pooling: "mean" });
  return Array.from(data);
 }
 // ─── Qdrant search ────────────────────────────────────────────────────────────
 /**
  * Runs a vector search against the configured Qdrant collection.
  *
  * Each option falls back to its own CONFIG.search value, so callers may
  * override any subset (e.g. `{ topK: 5 }`) without losing the others.
  *
  * @param {number[]} embedding - query vector.
  * @param {object} [options]
  * @param {number} [options.topK] - number of hits requested from Qdrant.
  * @param {number} [options.minScore] - score threshold passed to Qdrant.
  * @param {number} [options.maxContextDocs] - maximum number of hits returned.
  * @returns {Promise<object[]>} hits ordered by descending score, at most
  *   `maxContextDocs` of them.
  */
 async function searchQdrant(
  embedding,
  {
    topK = CONFIG.search.topK,
    minScore = CONFIG.search.minScore,
    maxContextDocs = CONFIG.search.maxContextDocs,
  } = {}
 ) {
  const hits = await qdrant.search(CONFIG.qdrant.collection, {
    vector:          embedding,
    limit:           topK,
    with_payload:    true,
    score_threshold: minScore,
  });
  // Sort a copy so the array handed back by the client is not mutated.
  return [...hits]
    .sort((a, b) => b.score - a.score)
    .slice(0, maxContextDocs);
 }
 // ─── Build LLM context string ─────────────────────────────────────────────────
 /**
  * Formats search hits into the context string placed in the LLM prompt.
  *
  * Each hit becomes a numbered section with its file, page and text, and the
  * sections are separated by a `---` rule. Missing payload fields fall back to
  * "unknown" (file), "?" (page) and an empty string (text).
  *
  * @param {object[]} results - hits, each optionally carrying a `payload`.
  * @returns {string} the joined context; empty string for no hits.
  */
 function buildContext(results) {
  const SECTION_SEPARATOR = "\n\n---\n\n";
  const sections = results.map((hit, index) => {
    const file = hit.payload?.file ?? "unknown";
    const page = hit.payload?.page ?? "?";
    const text = hit.payload?.text ?? "";
    return `[${index + 1}] File: ${file} | Page: ${page}\n${text}`;
  });
  return sections.join(SECTION_SEPARATOR);
 }
 // ─── LLM call ─────────────────────────────────────────────────────────────────
 // System prompt sent as the `system` message of every chat completion
 // (both the JSON and the streaming endpoint use it). It restricts answers to
 // the supplied context, fixes the exact "not found" sentence, and prescribes
 // the markdown layout of the reply. `.trim()` strips the leading and trailing
 // newline introduced by the template literal.
 const SYSTEM_PROMPT = `
 You are CPM AI Assistant.
 Rules:
 - Answer only from the provided information.
 - If the answer is not available, reply exactly:
  "❌ I could not find this information in the uploaded documents."
 - Do not make up information.
 - Do not mention documents, context, or chunks.
 Response Style:
 - Use simple English.
 - Keep answers short and clear.
 - Use headings and bullet points.
 - Highlight important words in **bold**.
 - Use emojis in headings.
 Format:
 # 📋 Topic
 ## 🎯 Summary
 Short answer in 1-2 sentences.
 ## ✅ Details
 - Point 1
 - Point 2
 - Point 3
 ## ⚠️ Notes
 - Extra information (if available).
 `.trim();
 /**
  * Asks the chat model to answer a question from the supplied context.
  *
  * Sends SYSTEM_PROMPT as the system message and the context plus question as
  * the user message, with temperature 0 and a 1500-token completion limit.
  *
  * @param {string} question - the user's question.
  * @param {string} context - context text (see buildContext).
  * @returns {Promise<string|null>} the content of the first completion choice,
  *   passed through unchanged.
  * @throws {Error} when the response contains no completion choice; request
  *   failures from the client propagate unchanged.
  */
 async function askLLM(question, context) {
  const completion = await llm.chat.completions.create({
    model:       CONFIG.azure.deployment,
    temperature: 0,
    max_tokens:  1500,
    messages: [
      { role: "system", content: SYSTEM_PROMPT },
      { role: "user",   content: `Context:\n${context}\n\nQuestion:\n${question}` },
    ],
  });
  const [firstChoice] = completion?.choices ?? [];
  // Fail with a readable message instead of a TypeError on an empty response.
  if (!firstChoice?.message) {
    throw new Error("LLM response did not contain a completion choice");
  }
  return firstChoice.message.content;
 }
 // ─── Express app ──────────────────────────────────────────────────────────────
 // Express application and its global middleware, registered in order:
 // CORS, JSON bodies (capped at 1mb), URL-encoded bodies, then a one-line
 // request log of method and path.
 const app = express();
 for (const middleware of [
  cors(),
  express.json({ limit: "1mb" }),
  express.urlencoded({ extended: true }),
  (req, _res, next) => {
    console.log(`→ ${req.method} ${req.path}`);
    next();
  },
 ]) {
  app.use(middleware);
 }
 // ─── Routes ───────────────────────────────────────────────────────────────────
 // GET /health: reports that the server is up, plus the configured model
 // deployment and vector collection. No downstream service is contacted.
 app.get("/health", (_req, res) => {
  const { azure, qdrant: vectorStore } = CONFIG;
  const report = {
    status:     "ok",
    model:      azure.deployment,
    collection: vectorStore.collection,
  };
  res.json(report);
 });
 // POST /ask: answers a question from the indexed documents in one JSON reply.
 //
 // Request body: { question: string }
 // 200: { success: true, question, answer, sources: [{ score, file, page, chunk }], ms }
 // 400: question missing, not a string, or blank
 // 500: { success: false, error } when embedding, search or the LLM call fails
 app.post("/ask", async (req, res) => {
  const { question } = req.body ?? {};
  // The type check must come first: calling .trim() on a non-string JSON value
  // (e.g. {"question": 1}) throws, and that throw would happen outside the
  // try/catch below, rejecting this async handler without sending a response.
  if (typeof question !== "string" || !question.trim()) {
    return res.status(400).json({ success: false, error: "question is required" });
  }
  const t0 = Date.now();
  try {
    const embedding = await createEmbedding(question.trim());
    const results = await searchQdrant(embedding);
    // Nothing relevant retrieved: answer with the fixed sentence, skip the LLM.
    if (!results.length) {
      return res.json({
        success: true,
        question,
        answer:  "❌ I could not find this information in the uploaded documents.",
        sources: [],
        ms:      Date.now() - t0,
      });
    }
    const context = buildContext(results);
    const answer  = await askLLM(question, context);
    return res.json({
      success: true,
      question,
      answer,
      sources: results.map(r => ({
        score: +r.score.toFixed(4),
        file:  r.payload?.file,
        page:  r.payload?.page,
        chunk: r.payload?.chunk,
      })),
      ms: Date.now() - t0,
    });
  } catch (err) {
    console.error("❌ /ask error:", err);
    return res.status(500).json({ success: false, error: err.message });
  }
 });
 // ─── /ask/stream — word-by-word SSE ──────────────────────────────────────────
 // The LLM streams tokens (which may be partial words or multi-word chunks).
 // We split every incoming token on whitespace and emit each word as a separate
 // SSE "token" event so the frontend can animate them one-by-one.
 // POST /ask/stream: same pipeline as /ask, delivered as server-sent events.
 //
 // Request body: { question: string }
 // Events, in order: "status" (progress), "sources" (retrieved hits),
 // "token" ({ token, isWord }: one word or one whitespace run each),
 // then "done" ({ sources }) or "error" ({ error }).
 // Clients rebuild the answer by concatenating `token` values verbatim.
 app.post("/ask/stream", async (req, res) => {
  const { question } = req.body ?? {};
  // The type check must come first: calling .trim() on a non-string JSON value
  // throws, and that throw would happen outside the try/catch below.
  if (typeof question !== "string" || !question.trim()) {
    return res.status(400).json({ success: false, error: "question is required" });
  }
  res.setHeader("Content-Type",  "text/event-stream");
  res.setHeader("Cache-Control", "no-cache");
  res.setHeader("Connection",    "keep-alive");
  res.flushHeaders(); // send headers immediately, before any event is written
  const send = (event, data) => res.write(`event: ${event}\ndata: ${JSON.stringify(data)}\n\n`);
  // Emits every complete word / whitespace run in `text` as a "token" event and
  // returns the trailing piece, which may be an unfinished word (or "").
  const emitCompleteParts = (text) => {
    const parts = text.split(/(\s+)/);
    const remainder = parts.pop() ?? "";
    for (const part of parts) {
      if (part) {
        send("token", { token: part, isWord: /\S/.test(part) });
      }
    }
    return remainder;
  };
  try {
    send("status", { message: "🔍 Searching documents..." });
    const embedding = await createEmbedding(question.trim());
    const results = await searchQdrant(embedding);
    if (!results.length) {
      // Tokenize the fallback exactly like a streamed answer, so the spaces
      // between words reach the client as whitespace tokens too.
      const lastWord = emitCompleteParts(
        "❌ I could not find this information in the uploaded documents."
      );
      if (lastWord) {
        send("token", { token: lastWord, isWord: true });
      }
      send("done", { sources: [] });
      return res.end();
    }
    // Sources are sent before the answer so the UI can show them early.
    const sources = results.map(r => ({
      score: +r.score.toFixed(4),
      file:  r.payload?.file,
      page:  r.payload?.page,
      chunk: r.payload?.chunk,
    }));
    send("sources", { sources });
    send("status", { message: "💬 Generating answer..." });
    const context = buildContext(results);
    const stream  = await llm.chat.completions.create({
      model:       CONFIG.azure.deployment,
      temperature: 0,
      max_tokens:  1500,
      stream:      true,
      messages: [
        { role: "system", content: SYSTEM_PROMPT },
        { role: "user",   content: `Context:\n${context}\n\nQuestion:\n${question}` },
      ],
    });
    // Holds the tail of the text received so far that may still be mid-word.
    let wordBuffer = "";
    for await (const chunk of stream) {
      // Chunks without choices or without delta content carry no text.
      const rawToken = chunk.choices?.[0]?.delta?.content ?? "";
      if (!rawToken) continue;
      wordBuffer = emitCompleteParts(wordBuffer + rawToken);
    }
    // Flush the final word once the stream has ended.
    if (wordBuffer) {
      send("token", { token: wordBuffer, isWord: true });
    }
    send("done", { sources });
  } catch (err) {
    console.error("❌ /ask/stream error:", err);
    // Headers are already sent, so failures are reported as an SSE event.
    send("error", { error: err.message });
  }
  res.end();
 });
 // Catch-all registered after every route: any request that reaches it gets a
 // JSON 404.
 app.use((_req, res) => {
  const body = { success: false, error: "Not found" };
  return res.status(404).json(body);
 });
 // ─── Start ────────────────────────────────────────────────────────────────────
 /**
  * Boots the server: loads the embedding model first, then starts listening
  * on CONFIG.port and logs the port once the listener is up.
  *
  * @returns {Promise<void>} resolves after `app.listen` has been called;
  *   rejects if loading the embedding model fails.
  */
 async function start() {
  await getEmbedder();
  const announce = () => {
    console.log(`Server running on port ${CONFIG.port}`);
  };
  app.listen(CONFIG.port, announce);
 }
 // Entry point: a startup failure is logged and the process exits with a
 // non-zero status.
 start().catch((startupError) => {
  console.error("Fatal startup error:", startupError);
  process.exit(1);
 });
		`@@ -0,0 +1 @@`
							`AZURE_OPENAI_KEY=o20WLCQfubbGTo0SnkS70lefG0tHvdZlzcUGHOPDmww0igy94Up0JQQJ99CEAC77bzfXJ3w3AAAAACOGIUYb`