adding the ability to configure ollama chat options and embeddings params via the config.toml file
parent 46541e6c0c
commit ad0826111b

8 changed files with 1052 additions and 1388 deletions
README.md
@@ -2,7 +2,6 @@
 [](https://discord.gg/26aArMy8tT)
 
 
 
 ## Table of Contents <!-- omit in toc -->
package.json
@@ -34,7 +34,7 @@
     "@langchain/google-genai": "^0.0.23",
     "@xenova/transformers": "^2.17.1",
     "axios": "^1.6.8",
-    "better-sqlite3": "^11.0.0",
+    "better-sqlite3": "^11.8.1",
     "compute-cosine-similarity": "^1.1.0",
     "compute-dot": "^1.1.0",
     "cors": "^2.8.5",
sample.config.toml
@@ -12,3 +12,10 @@ GEMINI = "" # Gemini API key - sk-1234567890abcdef1234567890abcdef
 [API_ENDPOINTS]
 SEARXNG = "http://localhost:32768" # SearxNG API URL
 OLLAMA = "" # Ollama API URL - http://host.docker.internal:11434
+
+[OLLAMA_CHAT_OPTIONS]
+# maps to parameters found here: https://v03.api.js.langchain.com/interfaces/_langchain_ollama.ChatOllamaInput.html
+numCtx = 2048 # the default, some models demand more
+
+[OLLAMA_EMBEDDINGS_PARAMS]
+# maps to parameters found here: https://v03.api.js.langchain.com/interfaces/_langchain_ollama.OllamaEmbeddingsParams.html
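The keys inside these new tables use the camelCase parameter names from the LangChain interfaces linked in the comments, and they are passed straight through to the model constructors (see the provider changes below). A minimal sketch of that mapping, with an illustrative endpoint and model name that are not part of this commit:

import { ChatOllama } from '@langchain/community/chat_models/ollama';

// What `[OLLAMA_CHAT_OPTIONS]` with `numCtx = 2048` parses to: a plain object
// whose keys mirror the ChatOllamaInput fields.
const ollamaChatOptions = { numCtx: 2048 };

// The provider code spreads this object into the constructor, so TOML keys
// must match the camelCase option names that ChatOllama accepts.
const chat = new ChatOllama({
  ...ollamaChatOptions,
  baseUrl: 'http://localhost:11434', // illustrative, not from the commit
  model: 'llama3',                   // illustrative, not from the commit
});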
src/config.ts
@@ -20,6 +20,8 @@ interface Config {
     SEARXNG: string;
     OLLAMA: string;
   };
+  OLLAMA_CHAT_OPTIONS: {};
+  OLLAMA_EMBEDDINGS_PARAMS: {};
 }
 
 type RecursivePartial<T> = {
@@ -51,6 +53,10 @@ export const getSearxngApiEndpoint = () =>
 
 export const getOllamaApiEndpoint = () => loadConfig().API_ENDPOINTS.OLLAMA;
 
+export const getOllamaChatOptions = () => loadConfig().OLLAMA_CHAT_OPTIONS;
+
+export const getOllamaEmbeddingsParams = () =>
+  loadConfig().OLLAMA_EMBEDDINGS_PARAMS;
+
 export const updateConfig = (config: RecursivePartial<Config>) => {
   const currentConfig = loadConfig();
 
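Both new sections are typed as empty objects and returned as-is. If a user's config.toml omits [OLLAMA_CHAT_OPTIONS] or [OLLAMA_EMBEDDINGS_PARAMS], the getters simply return undefined, which is still safe to spread. A small standalone sketch of that behavior (not part of the commit):

// Spreading `undefined` contributes nothing, so callers of getOllamaChatOptions()
// and getOllamaEmbeddingsParams() need no null checks before merging.
const missingSection = undefined; // what a getter yields when the TOML table is absent
const merged = { ...missingSection, baseUrl: 'http://localhost:11434' };
console.log(merged); // { baseUrl: 'http://localhost:11434' }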
src/lib/providers/ollama.ts
@@ -1,11 +1,17 @@
 import { OllamaEmbeddings } from '@langchain/community/embeddings/ollama';
-import { getKeepAlive, getOllamaApiEndpoint } from '../../config';
+import {
+  getKeepAlive,
+  getOllamaApiEndpoint,
+  getOllamaChatOptions,
+  getOllamaEmbeddingsParams,
+} from '../../config';
 import logger from '../../utils/logger';
 import { ChatOllama } from '@langchain/community/chat_models/ollama';
 import axios from 'axios';
 
 export const loadOllamaChatModels = async () => {
   const ollamaEndpoint = getOllamaApiEndpoint();
+  const ollamaChatOptions = getOllamaChatOptions();
   const keepAlive = getKeepAlive();
 
   if (!ollamaEndpoint) return {};
@@ -23,10 +29,14 @@ export const loadOllamaChatModels = async () => {
       acc[model.model] = {
         displayName: model.name,
         model: new ChatOllama({
+          ...ollamaChatOptions, // merge the options specified via config
+          ...{
+            // things defined in this dictionary will take precedence
           baseUrl: ollamaEndpoint,
           model: model.model,
           temperature: 0.7,
           keepAlive: keepAlive,
+          },
         }),
       };
 
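The double spread is the whole merge strategy: options read from config.toml go first and the inline object second, so the loader's own baseUrl, model, temperature and keepAlive always win over conflicting keys in [OLLAMA_CHAT_OPTIONS]. A minimal sketch of that precedence rule with illustrative values:

const ollamaChatOptions = { numCtx: 4096, temperature: 0.1 }; // as read from config.toml
const merged = {
  ...ollamaChatOptions,
  ...{
    temperature: 0.7, // the later spread wins on conflicting keys
    keepAlive: '5m',
  },
};
console.log(merged); // { numCtx: 4096, temperature: 0.7, keepAlive: '5m' }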
@@ -42,6 +52,7 @@ export const loadOllamaChatModels = async () => {
 
 export const loadOllamaEmbeddingsModels = async () => {
   const ollamaEndpoint = getOllamaApiEndpoint();
+  const ollamaEmbeddingParams = getOllamaEmbeddingsParams();
 
   if (!ollamaEndpoint) return {};
 
@@ -58,8 +69,12 @@ export const loadOllamaEmbeddingsModels = async () => {
       acc[model.model] = {
         displayName: model.name,
         model: new OllamaEmbeddings({
+          ...ollamaEmbeddingParams, // merge the options specified via config
+          ...{
+            // things defined in this dictionary will take precedence
           baseUrl: ollamaEndpoint,
           model: model.model,
+          },
         }),
       };
 
src/routes/config.ts
@@ -9,6 +9,8 @@ import {
   getAnthropicApiKey,
   getGeminiApiKey,
   getOpenaiApiKey,
+  getOllamaChatOptions,
+  getOllamaEmbeddingsParams,
   updateConfig,
 } from '../config';
 import logger from '../utils/logger';
@@ -54,6 +56,8 @@ router.get('/', async (_, res) => {
     config['anthropicApiKey'] = getAnthropicApiKey();
     config['groqApiKey'] = getGroqApiKey();
     config['geminiApiKey'] = getGeminiApiKey();
+    config['ollamaChatOptions'] = getOllamaChatOptions();
+    config['ollamaEmbeddingsParams'] = getOllamaEmbeddingsParams();
 
     res.status(200).json(config);
   } catch (err: any) {
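These two lines expose the configured options to clients of the existing GET config route alongside the API keys. A hedged usage sketch; the URL below is an assumption about how the router is mounted and is not part of this diff:

(async () => {
  // Assumed endpoint; only the response field names come from the diff above.
  const res = await fetch('http://localhost:3001/api/config');
  const config = await res.json();
  console.log(config.ollamaChatOptions);      // e.g. { numCtx: 2048 }
  console.log(config.ollamaEmbeddingsParams); // e.g. {}
})();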
@@ -75,6 +79,7 @@ router.post('/', async (req, res) => {
       API_ENDPOINTS: {
         OLLAMA: config.ollamaApiUrl,
       },
+      OLLAMA_OPTIONS: config.ollamaOptions,
     };
 
     updateConfig(updatedConfig);
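On the write side, the POST handler now also copies an ollamaOptions field from the request body into the object handed to updateConfig, stored under an OLLAMA_OPTIONS key. A hedged sketch of a matching request; the URL is assumed, and only the body field names are taken from the handler above:

(async () => {
  await fetch('http://localhost:3001/api/config', {
    method: 'POST',
    headers: { 'Content-Type': 'application/json' },
    body: JSON.stringify({
      ollamaApiUrl: 'http://host.docker.internal:11434',
      ollamaOptions: { numCtx: 2048 }, // ends up under OLLAMA_OPTIONS via updateConfig
    }),
  });
})();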
ui/yarn.lock (1090 changes)
File diff suppressed because it is too large