feat(providers): implement custom classes
src/lib/models/providers/ollama/ollamaLLM.ts · new file · 149 lines
@@ -0,0 +1,149 @@
import z from 'zod';
import BaseLLM from '../../base/llm';
import {
  GenerateObjectInput,
  GenerateOptions,
  GenerateTextInput,
  GenerateTextOutput,
  StreamTextOutput,
} from '../../types';
import { Ollama } from 'ollama';
import { parse } from 'partial-json';

type OllamaConfig = {
  baseURL: string;
  model: string;
  options?: GenerateOptions;
};

class OllamaLLM extends BaseLLM<OllamaConfig> {
  ollamaClient: Ollama;

  constructor(protected config: OllamaConfig) {
    super(config);

    // Fall back to the default local Ollama endpoint when no baseURL is given.
    this.ollamaClient = new Ollama({
      host: this.config.baseURL || 'http://localhost:11434',
    });
  }

  // Merge per-call options into the instance config; later values win.
  withOptions(options: GenerateOptions) {
    this.config.options = {
      ...this.config.options,
      ...options,
    };
    return this;
  }

  async generateText(input: GenerateTextInput): Promise<GenerateTextOutput> {
    this.withOptions(input.options || {});

    const res = await this.ollamaClient.chat({
      model: this.config.model,
      messages: input.messages,
      // Map the provider-agnostic option names onto Ollama's native ones.
      options: {
        top_p: this.config.options?.topP,
        temperature: this.config.options?.temperature,
        num_predict: this.config.options?.maxTokens,
        frequency_penalty: this.config.options?.frequencyPenalty,
        presence_penalty: this.config.options?.presencePenalty,
        stop: this.config.options?.stopSequences,
      },
    });

    return {
      content: res.message.content,
      additionalInfo: {
        reasoning: res.message.thinking,
      },
    };
  }

  async *streamText(
    input: GenerateTextInput,
  ): AsyncGenerator<StreamTextOutput> {
    this.withOptions(input.options || {});

    const stream = await this.ollamaClient.chat({
      model: this.config.model,
      messages: input.messages,
      stream: true,
      options: {
        top_p: this.config.options?.topP,
        temperature: this.config.options?.temperature,
        num_predict: this.config.options?.maxTokens,
        frequency_penalty: this.config.options?.frequencyPenalty,
        presence_penalty: this.config.options?.presencePenalty,
        stop: this.config.options?.stopSequences,
      },
    });

    for await (const chunk of stream) {
      yield {
        contentChunk: chunk.message.content,
        done: chunk.done,
        additionalInfo: {
          reasoning: chunk.message.thinking,
        },
      };
    }
  }

  async generateObject<T>(input: GenerateObjectInput): Promise<T> {
    this.withOptions(input.options || {});

    const response = await this.ollamaClient.chat({
      model: this.config.model,
      messages: input.messages,
      // Constrain the model's output to the JSON schema derived from the Zod schema.
      format: z.toJSONSchema(input.schema),
      options: {
        top_p: this.config.options?.topP,
        temperature: this.config.options?.temperature,
        num_predict: this.config.options?.maxTokens,
        frequency_penalty: this.config.options?.frequencyPenalty,
        presence_penalty: this.config.options?.presencePenalty,
        stop: this.config.options?.stopSequences,
      },
    });

    try {
      return input.schema.parse(JSON.parse(response.message.content)) as T;
    } catch (err) {
      throw new Error(`Error parsing response from Ollama: ${err}`);
    }
  }

  async *streamObject<T>(input: GenerateObjectInput): AsyncGenerator<T> {
    let receivedObj: string = '';

    this.withOptions(input.options || {});

    const stream = await this.ollamaClient.chat({
      model: this.config.model,
      messages: input.messages,
      format: z.toJSONSchema(input.schema),
      stream: true,
      options: {
        top_p: this.config.options?.topP,
        temperature: this.config.options?.temperature,
        num_predict: this.config.options?.maxTokens,
        frequency_penalty: this.config.options?.frequencyPenalty,
        presence_penalty: this.config.options?.presencePenalty,
        stop: this.config.options?.stopSequences,
      },
    });

    for await (const chunk of stream) {
      receivedObj += chunk.message.content;

      // partial-json can parse an incomplete JSON prefix, so each chunk
      // yields the best-effort object accumulated so far.
      try {
        yield parse(receivedObj) as T;
      } catch (err) {
        console.log('Error parsing partial object from Ollama:', err);
        yield {} as T;
      }
    }
  }
}

export default OllamaLLM;
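A minimal usage sketch (not part of the commit): it assumes GenerateTextInput.messages follows Ollama's chat message shape and that the named model has been pulled locally; the model name and option values are illustrative.

// Hypothetical example; model name and option values are placeholders.
import OllamaLLM from './src/lib/models/providers/ollama/ollamaLLM';

const llm = new OllamaLLM({
  baseURL: 'http://localhost:11434',
  model: 'llama3.1',
});

// withOptions merges into the instance config and returns `this`, so it chains.
const res = await llm
  .withOptions({ temperature: 0.7, maxTokens: 256 })
  .generateText({
    messages: [{ role: 'user', content: 'Say hello in one sentence.' }],
  });

console.log(res.content);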