Add the ability to configure Ollama chat options and embeddings params via the config.toml file

Owyn Richen 2025-02-05 13:33:17 -08:00
parent 46541e6c0c
commit ad0826111b
8 changed files with 1052 additions and 1388 deletions

README.md

@@ -2,7 +2,6 @@
[![Discord](https://dcbadge.vercel.app/api/server/26aArMy8tT?style=flat&compact=true)](https://discord.gg/26aArMy8tT)
![preview](.assets/perplexica-screenshot.png?)
## Table of Contents <!-- omit in toc -->

package.json

@@ -34,7 +34,7 @@
"@langchain/google-genai": "^0.0.23",
"@xenova/transformers": "^2.17.1",
"axios": "^1.6.8",
"better-sqlite3": "^11.0.0",
"better-sqlite3": "^11.8.1",
"compute-cosine-similarity": "^1.1.0",
"compute-dot": "^1.1.0",
"cors": "^2.8.5",

sample.config.toml

@@ -11,4 +11,11 @@ GEMINI = "" # Gemini API key - sk-1234567890abcdef1234567890abcdef
[API_ENDPOINTS]
SEARXNG = "http://localhost:32768" # SearxNG API URL
OLLAMA = "" # Ollama API URL - http://host.docker.internal:11434
OLLAMA = "" # Ollama API URL - http://host.docker.internal:11434
[OLLAMA_CHAT_OPTIONS]
# maps to parameters found here: https://v03.api.js.langchain.com/interfaces/_langchain_ollama.ChatOllamaInput.html
numCtx = 2048 # the default; some models need more
[OLLAMA_EMBEDDINGS_PARAMS]
# maps to parameters found here: https://v03.api.js.langchain.com/interfaces/_langchain_ollama.OllamaEmbeddingsParams.html
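These two tables are parsed and spread directly into the LangChain constructors (see src/lib/providers/ollama.ts below), so keys must use the camelCase option names from the linked interfaces. A minimal sketch of the mapping, assuming @iarna/toml as the parser (the parser and the values here are illustrative, not shown in this diff):

```ts
import toml from '@iarna/toml'; // assumed parser; the actual import in config.ts is not shown in this diff

// A TOML table parses to a plain object:
const parsed = toml.parse(`
[OLLAMA_CHAT_OPTIONS]
numCtx = 8192
numPredict = 512
`);

// parsed.OLLAMA_CHAT_OPTIONS is { numCtx: 8192, numPredict: 512 }, and it is
// spread verbatim into `new ChatOllama({ ... })` by the provider code below.
// Keys must match ChatOllamaInput's camelCase names; nothing translates them.
console.log(parsed.OLLAMA_CHAT_OPTIONS);
```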

src/config.ts

@@ -20,6 +20,8 @@ interface Config {
SEARXNG: string;
OLLAMA: string;
};
OLLAMA_CHAT_OPTIONS: {};
OLLAMA_EMBEDDINGS_PARAMS: {};
}
type RecursivePartial<T> = {
@@ -51,6 +53,10 @@ export const getSearxngApiEndpoint = () =>
export const getOllamaApiEndpoint = () => loadConfig().API_ENDPOINTS.OLLAMA;
export const getOllamaChatOptions = () => loadConfig().OLLAMA_CHAT_OPTIONS;
export const getOllamaEmbeddingsParams = () =>
loadConfig().OLLAMA_EMBEDDINGS_PARAMS;
export const updateConfig = (config: RecursivePartial<Config>) => {
const currentConfig = loadConfig();
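One caveat in the interface above: `{}` in TypeScript means "any non-nullish value", not "empty object", so the two new fields accept numbers or strings without complaint. A tighter shape (a suggestion, not part of this commit) would be:

```ts
// `{}` is nearly unconstrained:
const a: {} = 42;    // compiles
const b: {} = 'hi';  // compiles

// Record<string, unknown> still allows arbitrary option keys while
// rejecting non-object values at the top level:
interface Config {
  OLLAMA_CHAT_OPTIONS: Record<string, unknown>;
  OLLAMA_EMBEDDINGS_PARAMS: Record<string, unknown>;
  // ...remaining fields as in the diff above
}
```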

src/lib/providers/ollama.ts

@@ -1,11 +1,17 @@
import { OllamaEmbeddings } from '@langchain/community/embeddings/ollama';
import { getKeepAlive, getOllamaApiEndpoint } from '../../config';
import {
getKeepAlive,
getOllamaApiEndpoint,
getOllamaChatOptions,
getOllamaEmbeddingsParams,
} from '../../config';
import logger from '../../utils/logger';
import { ChatOllama } from '@langchain/community/chat_models/ollama';
import axios from 'axios';
export const loadOllamaChatModels = async () => {
const ollamaEndpoint = getOllamaApiEndpoint();
const ollamaChatOptions = getOllamaChatOptions();
const keepAlive = getKeepAlive();
if (!ollamaEndpoint) return {};
@@ -23,10 +29,14 @@ export const loadOllamaChatModels = async () => {
acc[model.model] = {
displayName: model.name,
model: new ChatOllama({
baseUrl: ollamaEndpoint,
model: model.model,
temperature: 0.7,
keepAlive: keepAlive,
...ollamaChatOptions, // merge the options specified via config
...{
// properties defined in this object take precedence
baseUrl: ollamaEndpoint,
model: model.model,
temperature: 0.7,
keepAlive: keepAlive,
},
}),
};
@@ -42,6 +52,7 @@ export const loadOllamaChatModels = async () => {
export const loadOllamaEmbeddingsModels = async () => {
const ollamaEndpoint = getOllamaApiEndpoint();
const ollamaEmbeddingParams = getOllamaEmbeddingsParams();
if (!ollamaEndpoint) return {};
@@ -58,8 +69,12 @@ export const loadOllamaEmbeddingsModels = async () => {
acc[model.model] = {
displayName: model.name,
model: new OllamaEmbeddings({
baseUrl: ollamaEndpoint,
model: model.model,
...ollamaEmbeddingParams, // merge the options specified via config
...{
// properties defined in this object take precedence
baseUrl: ollamaEndpoint,
model: model.model,
},
}),
};
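Both constructors rely on object-spread ordering for the merge: when keys collide, the property that appears later wins. Spreading the config-supplied options first and the hard-coded fields second guarantees that baseUrl and model cannot be overridden from config.toml. A standalone illustration with hypothetical values:

```ts
const fromConfig = { model: 'mistral', numCtx: 4096 }; // hypothetical user options

const merged = {
  ...fromConfig,
  model: 'llama3', // collides with fromConfig.model; the later key wins
};

console.log(merged); // { model: 'llama3', numCtx: 4096 }
```

The inner `...{ ... }` wrapper in the diff is equivalent to writing those properties inline; it only groups the precedence-taking fields visually.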

src/routes/config.ts

@@ -9,6 +9,8 @@ import {
getAnthropicApiKey,
getGeminiApiKey,
getOpenaiApiKey,
getOllamaChatOptions,
getOllamaEmbeddingsParams,
updateConfig,
} from '../config';
import logger from '../utils/logger';
@@ -54,6 +56,8 @@ router.get('/', async (_, res) => {
config['anthropicApiKey'] = getAnthropicApiKey();
config['groqApiKey'] = getGroqApiKey();
config['geminiApiKey'] = getGeminiApiKey();
config['ollamaChatOptions'] = getOllamaChatOptions();
config['ollamaEmbeddingsParams'] = getOllamaEmbeddingsParams();
res.status(200).json(config);
} catch (err: any) {
@@ -75,6 +79,8 @@ router.post('/', async (req, res) => {
API_ENDPOINTS: {
OLLAMA: config.ollamaApiUrl,
},
OLLAMA_CHAT_OPTIONS: config.ollamaChatOptions,
OLLAMA_EMBEDDINGS_PARAMS: config.ollamaEmbeddingsParams,
};
updateConfig(updatedConfig);
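With the route above, the new options round-trip through the settings API. A hypothetical client call follows; the port and the /api/config mount point are assumptions, since neither appears in this diff:

```ts
// Field names mirror the keys the GET handler returns above.
await fetch('http://localhost:3001/api/config', {
  method: 'POST',
  headers: { 'Content-Type': 'application/json' },
  body: JSON.stringify({
    ollamaApiUrl: 'http://localhost:11434',
    ollamaChatOptions: { numCtx: 4096 },  // persisted to [OLLAMA_CHAT_OPTIONS]
    ollamaEmbeddingsParams: {},           // persisted to [OLLAMA_EMBEDDINGS_PARAMS]
  }),
});
```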

File diff suppressed because it is too large

yarn.lock (1298 lines changed)
File diff suppressed because it is too large