feat(app): remove backend

2026-07-12 14:13:28 +00:00 · 2025-03-19 16:23:27 +05:30
parent 8a24572cd2
commit 217736d05a
145 changed files with 3546 additions and 10516 deletions
--- a/src/lib/utils/computeSimilarity.ts
+++ b/src/lib/utils/computeSimilarity.ts
@@ -0,0 +1,17 @@
+import dot from 'compute-dot';
+import cosineSimilarity from 'compute-cosine-similarity';
+import { getSimilarityMeasure } from '../config';
+
+/**
+ * Scores two numeric vectors with the similarity measure reported by
+ * `getSimilarityMeasure()`.
+ *
+ * @param x - First vector.
+ * @param y - Second vector.
+ * @returns The cosine similarity when the measure is `'cosine'`, or the dot
+ *   product when it is `'dot'`.
+ * @throws Error if the configured measure is neither `'cosine'` nor `'dot'`.
+ */
+const computeSimilarity = (x: number[], y: number[]): number => {
+  const measure = getSimilarityMeasure();
+
+  switch (measure) {
+    case 'cosine':
+      // NOTE(review): the cast suggests the library's declared return type is
+      // wider than `number` — confirm it cannot yield a non-number here.
+      return cosineSimilarity(x, y) as number;
+    case 'dot':
+      return dot(x, y);
+    default:
+      throw new Error('Invalid similarity measure');
+  }
+};
+
+export default computeSimilarity;
--- a/src/lib/utils/documents.ts
+++ b/src/lib/utils/documents.ts
@@ -0,0 +1,99 @@
+import axios from 'axios';
+import { htmlToText } from 'html-to-text';
+import { RecursiveCharacterTextSplitter } from 'langchain/text_splitter';
+import { Document } from '@langchain/core/documents';
+import pdfParse from 'pdf-parse';
+
+/**
+ * Downloads every link and turns its content into chunked `Document`s.
+ *
+ * Links without an `http://` or `https://` prefix are requested over
+ * `https://`. A response whose `content-type` media type is
+ * `application/pdf` (case-insensitive, parameters such as `; charset=...`
+ * allowed) is parsed with `pdf-parse`; every other response is decoded as
+ * UTF-8 and converted with `htmlToText`. The extracted text is
+ * whitespace-normalized, split with `RecursiveCharacterTextSplitter`, and
+ * each chunk becomes one `Document` carrying `title` and `url` metadata.
+ *
+ * Failures never reject the returned promise: a link that cannot be fetched
+ * or parsed is logged and contributes a single placeholder `Document`
+ * describing the error.
+ *
+ * @param links - URLs (with or without a scheme) to fetch.
+ * @returns All chunks, grouped per link in the same order as `links`.
+ */
+export const getDocumentsFromLinks = async ({
+  links,
+}: {
+  links: string[];
+}): Promise<Document[]> => {
+  const splitter = new RecursiveCharacterTextSplitter();
+
+  // Turns line breaks and whitespace runs into single spaces.
+  const collapseWhitespace = (text: string): string =>
+    text
+      .replace(/(\r\n|\n|\r)/gm, ' ')
+      .replace(/\s+/g, ' ')
+      .trim();
+
+  // Splits `text` into chunks and wraps each one with the shared metadata.
+  const toDocuments = async (
+    text: string,
+    title: string,
+    url: string,
+  ): Promise<Document[]> => {
+    const chunks = await splitter.splitText(text);
+
+    return chunks.map(
+      (chunk) =>
+        new Document({
+          pageContent: chunk,
+          metadata: { title, url },
+        }),
+    );
+  };
+
+  // Each link resolves to its own array, so the flattened result follows the
+  // order of `links` rather than the order in which requests happen to finish.
+  const docsPerLink = await Promise.all(
+    links.map(async (rawLink): Promise<Document[]> => {
+      const link =
+        rawLink.startsWith('http://') || rawLink.startsWith('https://')
+          ? rawLink
+          : `https://${rawLink}`;
+
+      try {
+        const res = await axios.get(link, {
+          responseType: 'arraybuffer',
+        });
+
+        // Compare only the media type: servers commonly append parameters
+        // (e.g. `application/pdf; charset=binary`) or vary the casing.
+        const contentType = String(res.headers['content-type'] ?? '');
+        const isPdf = /^\s*application\/pdf\s*(;|$)/i.test(contentType);
+
+        if (isPdf) {
+          const pdf = await pdfParse(res.data);
+
+          // `return await` keeps a splitter failure inside this try/catch.
+          return await toDocuments(
+            collapseWhitespace(pdf.text),
+            'PDF Document',
+            link,
+          );
+        }
+
+        // Decode once and reuse for both text extraction and title lookup.
+        // NOTE(review): assumes `res.data` is a Node Buffer — confirm for
+        // non-Node runtimes.
+        const html: string = res.data.toString('utf8');
+
+        const parsedText = collapseWhitespace(
+          htmlToText(html, {
+            selectors: [
+              {
+                selector: 'a',
+                options: {
+                  ignoreHref: true,
+                },
+              },
+            ],
+          }),
+        );
+
+        // Accept any casing, attributes on the tag, and titles that span
+        // several lines; fall back to the link when no usable title exists.
+        const rawTitle = html.match(/<title[^>]*>([\s\S]*?)<\/title>/i)?.[1];
+        const title = rawTitle ? collapseWhitespace(rawTitle) : '';
+
+        return await toDocuments(parsedText, title || link, link);
+      } catch (err) {
+        console.error(
+          'An error occurred while getting documents from links: ',
+          err,
+        );
+
+        return [
+          new Document({
+            pageContent: `Failed to retrieve content from the link: ${err}`,
+            metadata: {
+              title: 'Failed to retrieve content',
+              url: link,
+            },
+          }),
+        ];
+      }
+    }),
+  );
+
+  return docsPerLink.flat();
+};
--- a/src/lib/utils/files.ts
+++ b/src/lib/utils/files.ts
@@ -0,0 +1,17 @@
+import path from 'path';
+import fs from 'fs';
+
+/**
+ * Reads the extracted-content record stored for an uploaded file and reports
+ * its display name.
+ *
+ * The record is read synchronously from
+ * `<process.cwd()>/uploads/<fileId>-extracted.json` and parsed as JSON.
+ *
+ * @param fileId - Identifier used to build the record's file name.
+ * @returns An object whose `name` is the record's `title` property and whose
+ *   `fileId` echoes the argument.
+ * @throws Propagates any error raised by `fs.readFileSync` or `JSON.parse`.
+ */
+export const getFileDetails = (fileId: string) => {
+  const recordName = fileId + '-extracted.json';
+  const recordPath = path.join(process.cwd(), './uploads', recordName);
+
+  const rawRecord = fs.readFileSync(recordPath, 'utf8');
+  const { title } = JSON.parse(rawRecord);
+
+  return { name: title, fileId };
+};
--- a/src/lib/utils/formatHistory.ts
+++ b/src/lib/utils/formatHistory.ts
@@ -0,0 +1,9 @@
+import { BaseMessage } from '@langchain/core/messages';
+
+/**
+ * Renders a chat history as plain text, one message per line.
+ *
+ * Each line has the form `<type>: <content>`, where `<type>` is the value
+ * returned by the message's `_getType()` and `<content>` is the message's
+ * `content` interpolated into the string.
+ *
+ * @param history - Messages to render, in the order they should appear.
+ * @returns The rendered lines joined with `\n`; an empty string for an empty
+ *   history.
+ */
+const formatChatHistoryAsString = (history: BaseMessage[]) => {
+  const renderLine = (entry: BaseMessage) =>
+    `${entry._getType()}: ${entry.content}`;
+
+  const lines = history.map((entry) => renderLine(entry));
+
+  return lines.join('\n');
+};
+
+export default formatChatHistoryAsString;