From bd8043cf827c76f015881035d85098eae41738ff Mon Sep 17 00:00:00 2001
From: timothycarambat <rambat1010@gmail.com>
Date: Wed, 1 May 2024 12:47:50 -0700
Subject: [PATCH 1/5] add generic LMStudio agent support that works with
 non-tool-callable LLMs; results are highly dependent on system specs

---
 .vscode/settings.json                         |   1 +
 .../AgentConfig/AgentLLMSelection/index.jsx   |   2 +-
 server/endpoints/agentWebsocket.js            |   2 +-
 server/package.json                           |   1 +
 server/utils/agents/aibitat/index.js          |   2 +
 .../agents/aibitat/plugins/chat-history.js    |   1 +
 .../agents/aibitat/providers/ai-provider.js   |  20 +-
 .../utils/agents/aibitat/providers/classes.js |  16 ++
 .../utils/agents/aibitat/providers/index.js   |   2 +
 .../agents/aibitat/providers/lmstudio.js      |  89 ++++++++
 .../agents/aibitat/providers/untooled.js      | 212 ++++++++++++++++++
 server/utils/agents/defaults.js               |   5 +-
 server/utils/agents/index.js                  |  22 +-
 server/utils/http/index.js                    |  11 +
 server/yarn.lock                              |   5 +
 15 files changed, 384 insertions(+), 7 deletions(-)
 create mode 100644 server/utils/agents/aibitat/providers/classes.js
 create mode 100644 server/utils/agents/aibitat/providers/lmstudio.js
 create mode 100644 server/utils/agents/aibitat/providers/untooled.js

diff --git a/.vscode/settings.json b/.vscode/settings.json
index b0fccedf04f..f850bbb003f 100644
--- a/.vscode/settings.json
+++ b/.vscode/settings.json
@@ -17,6 +17,7 @@
     "hljs",
     "inferencing",
     "Langchain",
+    "lmstudio",
     "mbox",
     "Milvus",
     "Mintplex",
diff --git a/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx b/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
index f1b99747090..51b384642d6 100644
--- a/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
+++ b/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
@@ -5,7 +5,7 @@ import { AVAILABLE_LLM_PROVIDERS } from "@/pages/GeneralSettings/LLMPreference";
 import { CaretUpDown, MagnifyingGlass, X } from "@phosphor-icons/react";
 import AgentModelSelection from "../AgentModelSelection";
 
-const ENABLED_PROVIDERS = ["openai", "anthropic"];
+const ENABLED_PROVIDERS = ["openai", "anthropic", "lmstudio"];
 
 const LLM_DEFAULT = {
   name: "Please make a selection",
diff --git a/server/endpoints/agentWebsocket.js b/server/endpoints/agentWebsocket.js
index 9809c60737a..c5fc1475fb7 100644
--- a/server/endpoints/agentWebsocket.js
+++ b/server/endpoints/agentWebsocket.js
@@ -51,7 +51,7 @@ function agentWebsocket(app) {
       await agentHandler.createAIbitat({ socket });
       await agentHandler.startAgentCluster();
     } catch (e) {
-      console.error(e.message);
+      console.error(e.message, e);
       socket?.send(JSON.stringify({ type: "wssFailure", content: e.message }));
       socket?.close();
     }
diff --git a/server/package.json b/server/package.json
index 5549ba713df..c673d80c214 100644
--- a/server/package.json
+++ b/server/package.json
@@ -50,6 +50,7 @@
     "joi": "^17.11.0",
     "joi-password-complexity": "^5.2.0",
     "js-tiktoken": "^1.0.7",
+    "jsonrepair": "^3.7.0",
     "jsonwebtoken": "^8.5.1",
     "langchain": "0.1.36",
     "mime": "^3.0.0",
diff --git a/server/utils/agents/aibitat/index.js b/server/utils/agents/aibitat/index.js
index d1e9ae9c8a9..7fa09969a58 100644
--- a/server/utils/agents/aibitat/index.js
+++ b/server/utils/agents/aibitat/index.js
@@ -727,6 +727,8 @@ ${this.getHistory({ to: route.to })
         return new Providers.OpenAIProvider({ model: config.model });
       case "anthropic":
         return new Providers.AnthropicProvider({ model: config.model });
+      case "lmstudio":
+        return new Providers.LMStudioProvider({});
 
       default:
         throw new Error(
diff --git a/server/utils/agents/aibitat/plugins/chat-history.js b/server/utils/agents/aibitat/plugins/chat-history.js
index e3123a83bea..4d3f8fd1efe 100644
--- a/server/utils/agents/aibitat/plugins/chat-history.js
+++ b/server/utils/agents/aibitat/plugins/chat-history.js
@@ -13,6 +13,7 @@ const chatHistory = {
       name: this.name,
       setup: function (aibitat) {
         aibitat.onMessage(async () => {
+          return;
           try {
             const lastResponses = aibitat.chats.slice(-2);
             if (lastResponses.length !== 2) return;
diff --git a/server/utils/agents/aibitat/providers/ai-provider.js b/server/utils/agents/aibitat/providers/ai-provider.js
index 5c56cb62c74..0e871b36e1d 100644
--- a/server/utils/agents/aibitat/providers/ai-provider.js
+++ b/server/utils/agents/aibitat/providers/ai-provider.js
@@ -4,16 +4,25 @@
 
 const { ChatOpenAI } = require("@langchain/openai");
 const { ChatAnthropic } = require("@langchain/anthropic");
+const DEFAULT_WORKSPACE_PROMPT =
+  "You are a helpful ai assistant who can assist the user and use tools available to help answer the users prompts and questions.";
 
 class Provider {
   _client;
   constructor(client) {
     if (this.constructor == Provider) {
-      throw new Error("Class is of abstract type and can't be instantiated");
+      return;
     }
     this._client = client;
   }
 
+  providerLog(text, ...args) {
+    console.log(
+      `\x1b[36m[AgentLLM${this?.model ? ` - ${this.model}` : ""}]\x1b[0m ${text}`,
+      ...args
+    );
+  }
+
   get client() {
     return this._client;
   }
@@ -48,6 +57,15 @@ class Provider {
         return 8_000;
     }
   }
+
+  static systemPrompt(provider = null) {
+    switch (provider) {
+      case "lmstudio":
+        return "You are a helpful ai assistant who can assist the user and use tools available to help answer the users prompts and questions. Tools will be handled by another assistant and you will simply receive their responses to help answer the user prompt - always try to answer the user's prompt the best you can with the context available to you and your general knowledge.";
+      default:
+        return DEFAULT_WORKSPACE_PROMPT;
+    }
+  }
 }
 
 module.exports = Provider;
diff --git a/server/utils/agents/aibitat/providers/classes.js b/server/utils/agents/aibitat/providers/classes.js
new file mode 100644
index 00000000000..3a6e959b1b7
--- /dev/null
+++ b/server/utils/agents/aibitat/providers/classes.js
@@ -0,0 +1,16 @@
+function InheritMultiple(bases = []) {
+  class Bases {
+    constructor() {
+      bases.forEach((base) => Object.assign(this, new base()));
+    }
+  }
+
+  bases.forEach((base) => {
+    Object.getOwnPropertyNames(base.prototype)
+      .filter((prop) => prop != "constructor")
+      .forEach((prop) => (Bases.prototype[prop] = base.prototype[prop]));
+  });
+  return Bases;
+}
+
+module.exports = InheritMultiple;
diff --git a/server/utils/agents/aibitat/providers/index.js b/server/utils/agents/aibitat/providers/index.js
index b163b4cd0e7..ebe4de33f06 100644
--- a/server/utils/agents/aibitat/providers/index.js
+++ b/server/utils/agents/aibitat/providers/index.js
@@ -1,7 +1,9 @@
 const OpenAIProvider = require("./openai.js");
 const AnthropicProvider = require("./anthropic.js");
+const LMStudioProvider = require("./lmstudio.js");
 
 module.exports = {
   OpenAIProvider,
   AnthropicProvider,
+  LMStudioProvider,
 };
diff --git a/server/utils/agents/aibitat/providers/lmstudio.js b/server/utils/agents/aibitat/providers/lmstudio.js
new file mode 100644
index 00000000000..6fc73d5adb1
--- /dev/null
+++ b/server/utils/agents/aibitat/providers/lmstudio.js
@@ -0,0 +1,89 @@
+const OpenAI = require("openai");
+const InheritMultiple = require("./classes.js");
+const Provider = require("./ai-provider.js");
+const UnTooled = require("./untooled.js");
+
+/**
+ * The provider for the LMStudio provider.
+ */
+class LMStudioProvider extends InheritMultiple([Provider, UnTooled]) {
+  model;
+
+  constructor(_config = {}) {
+    super();
+    const model = process.env.LMSTUDIO_MODEL_PREF || "Loaded from Chat UI";
+    const client = new OpenAI({
+      baseURL: process.env.LMSTUDIO_BASE_PATH?.replace(/\/+$/, ""), // here is the URL to your LMStudio instance
+      apiKey: null,
+      maxRetries: 3,
+      model,
+    });
+    this._client = client;
+    this.model = model;
+  }
+
+  get client() {
+    return this._client;
+  }
+
+  /**
+   * Create a completion based on the received messages.
+   *
+   * @param messages A list of messages to send to the API.
+   * @param functions
+   * @returns The completion.
+   */
+  async complete(messages, functions = null) {
+    try {
+      let completion;
+      if (functions?.length > 0) {
+        const { toolCall, text } = await this.functionCall(messages, functions);
+
+        if (toolCall !== null) {
+          this.providerLog(`Valid tool call found - running ${toolCall.name}.`);
+          this.deduplicator.trackRun(toolCall.name, toolCall.arguments);
+          return {
+            result: null,
+            functionCall: {
+              name: toolCall.name,
+              arguments: toolCall.arguments,
+            },
+            cost: 0,
+          };
+        }
+        completion = { content: text };
+      }
+
+      if (!completion?.content) {
+        this.providerLog(
+          "Will assume chat completion without tool call inputs."
+        );
+        const response = await this.client.chat.completions.create({
+          model: this.model,
+          messages: this.cleanMsgs(messages),
+        });
+        completion = response.choices[0].message;
+      }
+
+      return {
+        result: completion.content,
+        cost: 0,
+      };
+    } catch (error) {
+      throw error;
+    }
+  }
+
+  /**
+   * Get the cost of the completion.
+   *
+   * @param _usage The completion to get the cost for.
+   * @returns The cost of the completion.
+   * Stubbed since LMStudio has no cost basis.
+   */
+  getCost(_usage) {
+    return 0;
+  }
+}
+
+module.exports = LMStudioProvider;
diff --git a/server/utils/agents/aibitat/providers/untooled.js b/server/utils/agents/aibitat/providers/untooled.js
new file mode 100644
index 00000000000..91a515182e4
--- /dev/null
+++ b/server/utils/agents/aibitat/providers/untooled.js
@@ -0,0 +1,212 @@
+const { safeJsonParse } = require("../../../http");
+const { Deduplicator } = require("../utils/dedupe");
+
+class UnTooled {
+  constructor() {
+    this.deduplicator = new Deduplicator();
+  }
+
+  cleanMsgs(messages) {
+    const modifiedMessages = [];
+    messages.forEach((msg) => {
+      if (msg.role === "function") {
+        const prevMsg = modifiedMessages[modifiedMessages.length - 1].content;
+        modifiedMessages[modifiedMessages.length - 1].content =
+          `${prevMsg}\n${msg.content}`;
+        return;
+      }
+      modifiedMessages.push(msg);
+    });
+    return modifiedMessages;
+  }
+
+  formatFuncs(functions = []) {
+    const funcs = [];
+    functions.forEach((def) => {
+      funcs.push({
+        name: def.name,
+        description: def.description,
+        properties: def.properties,
+      });
+    });
+
+    return JSON.stringify(funcs, null, 2);
+  }
+
+  /**
+   * Check if two arrays of strings or numbers have the same values
+   * @param {string[]|number[]} arr1
+   * @param {string[]|number[]} arr2
+   * @param {Object} [opts]
+   * @param {boolean} [opts.enforceOrder] - By default (false), the order of the values in the arrays doesn't matter.
+   * @return {boolean}
+   */
+  compareArrays(arr1, arr2, opts) {
+    function vKey(i, v) {
+      return (opts?.enforceOrder ? `${i}-` : "") + `${typeof v}-${v}`;
+    }
+
+    if (arr1.length !== arr2.length) return false;
+
+    const d1 = {};
+    const d2 = {};
+    for (let i = arr1.length - 1; i >= 0; i--) {
+      d1[vKey(i, arr1[i])] = true;
+      d2[vKey(i, arr2[i])] = true;
+    }
+
+    for (let i = arr1.length - 1; i >= 0; i--) {
+      const v = vKey(i, arr1[i]);
+      if (d1[v] !== d2[v]) return false;
+    }
+
+    for (let i = arr2.length - 1; i >= 0; i--) {
+      const v = vKey(i, arr2[i]);
+      if (d1[v] !== d2[v]) return false;
+    }
+
+    return true;
+  }
+
+  validFuncCall(functionCall = {}, functions = []) {
+    if (
+      !functionCall ||
+      !functionCall?.hasOwnProperty("name") ||
+      !functionCall?.hasOwnProperty("arguments")
+    ) {
+      return {
+        valid: false,
+        reason: "Missing name or arguments in function call.",
+      };
+    }
+
+    const foundFunc = functions.find((def) => def.name === functionCall.name);
+    if (!foundFunc) {
+      return { valid: false, reason: "Function name does not exist." };
+    }
+
+    const props = Object.keys(foundFunc.parameters.properties);
+    const fProps = Object.keys(functionCall.arguments);
+    if (!this.compareArrays(props, fProps)) {
+      return { valid: false, reason: "Invalid argument schema match." };
+    }
+
+    return { valid: true, reason: null };
+  }
+
+  async functionCall(messages, functions) {
+    const history = [...messages].filter((msg) =>
+      ["user", "assistant"].includes(msg.role)
+    );
+    if (history.at(-1)?.role !== "user") return { toolCall: null, text: null };
+
+    const response = await this.client.chat.completions
+      .create({
+        model: this.model,
+        temperature: 0,
+        messages: [
+          {
+            content: `You are a program which picks the most optimal function and parameters to call. 
+DO NOT HAVE TO PICK A FUNCTION IF IT WILL NOT HELP ANSWER OR FULFILL THE USER'S QUERY.
+When a function is selection, respond in JSON with no additional text.
+When there is no relevant function to call - return with a regular chat text response.
+Your task is to pick a **single** function that we will use to call, if any seem useful or relevant for the user query.
+
+Example of Tool definitions:
+[
+  {
+    name: 'rag-memory',
+    description: 'Search against local documents for context that is relevant to the query or store a snippet of text into memory for retrieval later. Storing information should only be done when the user specifically requests for information to be remembered or saved to long-term memory. You should use this tool before search the internet for information.',
+    parameters: {
+      '$schema': 'http://json-schema.org/draft-07/schema#',
+      type: 'object',
+      properties: [
+        action: {
+          type: "string",
+          enum: ["search", "store"],
+          description:
+            "The action we want to take to search for existing similar context or storage of new context.",
+        },
+        content: {
+          type: "string",
+          description:
+            "The plain text to search our local documents with or to store in our vector database.",
+        },
+      ],
+      additionalProperties: false
+    }
+  },
+  {
+    name: 'web-scraping',
+    description: 'Scrapes the content of a webpage or online resource from a URL.',
+    parameters: {
+      '$schema': 'http://json-schema.org/draft-07/schema#',
+      type: 'object',
+      properties: [
+        url: {
+          type: "string",
+          format: "uri",
+          description: "A web URL.",
+        },
+      ],
+      additionalProperties: false
+    },
+  }
+]
+
+Example Query:
+User: Scrape https://example.com
+Your response (JSON ONLY): 
+{
+  name: 'web-scraping'.
+  arguments: {
+    url: 'https://example.com'
+  }
+}
+
+Example Query where tool cannot be used:
+User: Hello!
+Your response (Text Only): Hello, how are you today?
+
+The available function and their definitions are listed below - respond only with JSON or a regular chat response.
+${this.formatFuncs(functions)}
+
+Now, assess the next function to call:
+`,
+            role: "system",
+          },
+          ...history,
+        ],
+      })
+      .then((result) => {
+        if (!result.hasOwnProperty("choices"))
+          throw new Error("LMStudio chat: No results!");
+        if (result.choices.length === 0)
+          throw new Error("LMStudio chat: No results length!");
+        return result.choices[0].message.content;
+      })
+      .catch((_) => {
+        return null;
+      });
+
+    const call = safeJsonParse(response, null);
+    if (call === null) return { toolCall: null, text: response }; // failed to parse, so must be text.
+
+    const { valid, reason } = this.validFuncCall(call, functions);
+    if (!valid) {
+      this.providerLog(`Invalid function tool call: ${reason}.`);
+      return { toolCall: null, text: null };
+    }
+
+    if (this.deduplicator.isDuplicate(call.name, call.arguments)) {
+      this.providerLog(
+        `Function tool with exact arguments has already been called this stack.`
+      );
+      return { toolCall: null, text: null };
+    }
+
+    return { toolCall: call, text: null };
+  }
+}
+
+module.exports = UnTooled;
diff --git a/server/utils/agents/defaults.js b/server/utils/agents/defaults.js
index a030778f4ba..4e12b90621c 100644
--- a/server/utils/agents/defaults.js
+++ b/server/utils/agents/defaults.js
@@ -1,6 +1,7 @@
 const AgentPlugins = require("./aibitat/plugins");
 const { SystemSettings } = require("../../models/systemSettings");
 const { safeJsonParse } = require("../http");
+const Provider = require("./aibitat/providers/ai-provider");
 
 const USER_AGENT = {
   name: "USER",
@@ -14,7 +15,7 @@ const USER_AGENT = {
 
 const WORKSPACE_AGENT = {
   name: "@agent",
-  getDefinition: async () => {
+  getDefinition: async (provider = null) => {
     const defaultFunctions = [
       AgentPlugins.memory.name, // RAG
       AgentPlugins.docSummarizer.name, // Doc Summary
@@ -30,7 +31,7 @@ const WORKSPACE_AGENT = {
     });
 
     return {
-      role: "You are a helpful ai assistant who can assist the user and use tools available to help answer the users prompts and questions.",
+      role: Provider.systemPrompt(provider),
       functions: defaultFunctions,
     };
   },
diff --git a/server/utils/agents/index.js b/server/utils/agents/index.js
index ce80fff4489..5e54c0b3f67 100644
--- a/server/utils/agents/index.js
+++ b/server/utils/agents/index.js
@@ -77,14 +77,32 @@ class AgentHandler {
         if (!process.env.ANTHROPIC_API_KEY)
           throw new Error("Anthropic API key must be provided to use agents.");
         break;
+      case "lmstudio":
+        if (!process.env.LMSTUDIO_BASE_PATH)
+          throw new Error("LMStudio base path must be provided to use agents.");
+        break;
       default:
         throw new Error("No provider found to power agent cluster.");
     }
   }
 
+  #providerDefault() {
+    switch (this.provider) {
+      case "openai":
+        return "gpt-3.5-turbo";
+      case "anthropic":
+        return "claude-3-sonnet-20240229";
+      case "lmstudio":
+        return "server-default";
+      default:
+        return "unknown";
+    }
+  }
+
   #providerSetupAndCheck() {
     this.provider = this.invocation.workspace.agentProvider || "openai";
-    this.model = this.invocation.workspace.agentModel || "gpt-3.5-turbo";
+    this.model =
+      this.invocation.workspace.agentModel || this.#providerDefault();
     this.log(`Start ${this.#invocationUUID}::${this.provider}:${this.model}`);
     this.#checkSetup();
   }
@@ -137,7 +155,7 @@ class AgentHandler {
     this.aibitat.agent(USER_AGENT.name, await USER_AGENT.getDefinition());
     this.aibitat.agent(
       WORKSPACE_AGENT.name,
-      await WORKSPACE_AGENT.getDefinition()
+      await WORKSPACE_AGENT.getDefinition(this.provider)
     );
 
     this.#funcsToLoad = [
diff --git a/server/utils/http/index.js b/server/utils/http/index.js
index eedc3315408..1fc8c5b961c 100644
--- a/server/utils/http/index.js
+++ b/server/utils/http/index.js
@@ -3,6 +3,7 @@ process.env.NODE_ENV === "development"
   : require("dotenv").config();
 const JWT = require("jsonwebtoken");
 const { User } = require("../../models/user");
+const { jsonrepair } = require("jsonrepair");
 
 function reqBody(request) {
   return typeof request.body === "string"
@@ -65,6 +66,16 @@ function safeJsonParse(jsonString, fallback = null) {
   try {
     return JSON.parse(jsonString);
   } catch {}
+
+  // If the jsonString does not look like an Obj or Array, dont attempt
+  // to repair it.
+  if (jsonString?.startsWith("[") || jsonString?.startsWith("{")) {
+    try {
+      const repairedJson = jsonrepair(jsonString);
+      return JSON.parse(repairedJson);
+    } catch {}
+  }
+
   return fallback;
 }
 
diff --git a/server/yarn.lock b/server/yarn.lock
index 49c202af657..34b9faa474c 100644
--- a/server/yarn.lock
+++ b/server/yarn.lock
@@ -3727,6 +3727,11 @@ jsonpointer@^5.0.1:
   resolved "https://registry.yarnpkg.com/jsonpointer/-/jsonpointer-5.0.1.tgz#2110e0af0900fd37467b5907ecd13a7884a1b559"
   integrity sha512-p/nXbhSEcu3pZRdkW1OfJhpsVtW1gd4Wa1fnQc9YLiTfAjn0312eMKimbdIQzuZl9aa9xUGaRlP9T/CJE/ditQ==
 
+jsonrepair@^3.7.0:
+  version "3.7.0"
+  resolved "https://registry.yarnpkg.com/jsonrepair/-/jsonrepair-3.7.0.tgz#b4fddb9c8d29dd62263f4f037334099e28feac21"
+  integrity sha512-TwE50n4P4gdVfMQF2q+X+IGy4ntFfcuHHE8zjRyBcdtrRK0ORZsjOZD6zmdylk4p277nQBAlHgsEPWtMIQk4LQ==
+
 jsonwebtoken@^8.5.1:
   version "8.5.1"
   resolved "https://registry.yarnpkg.com/jsonwebtoken/-/jsonwebtoken-8.5.1.tgz#00e71e0b8df54c2121a1f26137df2280673bcc0d"

From 0976266b428889e03eff9af83619a287180563b3 Mon Sep 17 00:00:00 2001
From: timothycarambat <rambat1010@gmail.com>
Date: Wed, 1 May 2024 13:03:12 -0700
Subject: [PATCH 2/5] add comments

---
 server/utils/agents/aibitat/plugins/chat-history.js | 1 -
 server/utils/agents/aibitat/providers/untooled.js   | 2 ++
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/server/utils/agents/aibitat/plugins/chat-history.js b/server/utils/agents/aibitat/plugins/chat-history.js
index 4d3f8fd1efe..e3123a83bea 100644
--- a/server/utils/agents/aibitat/plugins/chat-history.js
+++ b/server/utils/agents/aibitat/plugins/chat-history.js
@@ -13,7 +13,6 @@ const chatHistory = {
       name: this.name,
       setup: function (aibitat) {
         aibitat.onMessage(async () => {
-          return;
           try {
             const lastResponses = aibitat.chats.slice(-2);
             if (lastResponses.length !== 2) return;
diff --git a/server/utils/agents/aibitat/providers/untooled.js b/server/utils/agents/aibitat/providers/untooled.js
index 91a515182e4..acf71d28317 100644
--- a/server/utils/agents/aibitat/providers/untooled.js
+++ b/server/utils/agents/aibitat/providers/untooled.js
@@ -1,6 +1,8 @@
 const { safeJsonParse } = require("../../../http");
 const { Deduplicator } = require("../utils/dedupe");
 
+// Useful inheritance class for a model which supports OpenAi schema for API requests
+// but does not have tool-calling or JSON output support.
 class UnTooled {
   constructor() {
     this.deduplicator = new Deduplicator();

From 7238f1b07f5ca1ace3aca155ca0eac0298257857 Mon Sep 17 00:00:00 2001
From: timothycarambat <rambat1010@gmail.com>
Date: Thu, 2 May 2024 17:13:59 -0700
Subject: [PATCH 3/5] enable few-shot prompting per function for OSS models

---
 .../AgentConfig/AgentLLMSelection/index.jsx   | 16 +++-
 server/utils/agents/aibitat/index.js          | 12 +++
 server/utils/agents/aibitat/plugins/memory.js | 32 ++++++-
 .../aibitat/plugins/save-file-browser.js      | 26 +++++
 .../utils/agents/aibitat/plugins/summarize.js | 20 ++++
 .../agents/aibitat/plugins/web-browsing.js    | 16 +++-
 .../agents/aibitat/plugins/web-scraping.js    | 15 ++-
 .../providers/{ => helpers}/classes.js        |  0
 .../providers/{ => helpers}/untooled.js       | 94 +++++--------------
 .../agents/aibitat/providers/lmstudio.js      |  5 +-
 10 files changed, 159 insertions(+), 77 deletions(-)
 rename server/utils/agents/aibitat/providers/{ => helpers}/classes.js (100%)
 rename server/utils/agents/aibitat/providers/{ => helpers}/untooled.js (66%)

diff --git a/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx b/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
index 51b384642d6..408d60a026f 100644
--- a/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
+++ b/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
@@ -2,10 +2,11 @@ import React, { useEffect, useRef, useState } from "react";
 import AnythingLLMIcon from "@/media/logo/anything-llm-icon.png";
 import AgentLLMItem from "./AgentLLMItem";
 import { AVAILABLE_LLM_PROVIDERS } from "@/pages/GeneralSettings/LLMPreference";
-import { CaretUpDown, MagnifyingGlass, X } from "@phosphor-icons/react";
+import { CaretUpDown, Gauge, MagnifyingGlass, X } from "@phosphor-icons/react";
 import AgentModelSelection from "../AgentModelSelection";
 
 const ENABLED_PROVIDERS = ["openai", "anthropic", "lmstudio"];
+const WARN_PERFORMANCE = ["lmstudio"];
 
 const LLM_DEFAULT = {
   name: "Please make a selection",
@@ -62,6 +63,19 @@ export default function AgentLLMSelection({
   const selectedLLMObject = LLMS.find((llm) => llm.value === selectedLLM);
   return (
     <div className="border-b border-white/40 pb-8">
+      {WARN_PERFORMANCE.includes(selectedLLM) && (
+        <div className="flex flex-col md:flex-row md:items-center gap-x-2 text-white mb-4 bg-blue-800/30 w-fit rounded-lg px-4 py-2">
+          <div className="gap-x-2 flex items-center">
+            <Gauge className="shrink-0" size={25} />
+            <p className="text-sm">
+              Performance of LLMs that do not explicitly support tool-calling is
+              highly dependent on the model's capabilities and accuracy. Some
+              abilities may be limited or non-functional.
+            </p>
+          </div>
+        </div>
+      )}
+
       <div className="flex flex-col">
         <label htmlFor="name" className="block input-label">
           Workspace Agent LLM Provider
diff --git a/server/utils/agents/aibitat/index.js b/server/utils/agents/aibitat/index.js
index 7fa09969a58..c3ad5428f57 100644
--- a/server/utils/agents/aibitat/index.js
+++ b/server/utils/agents/aibitat/index.js
@@ -603,6 +603,18 @@ ${this.getHistory({ to: route.to })
 
       // Execute the function and return the result to the provider
       fn.caller = byAgent || "agent";
+
+      // For OSS LLMs we really need to keep tabs on what they are calling
+      // so we can log it here.
+      if (provider?.verbose) {
+        this?.introspect?.(
+          `[debug]: ${fn.caller} is attempting to call \`${name}\` tool`
+        );
+        this.handlerProps.log(
+          `[debug]: ${fn.caller} is attempting to call \`${name}\` tool`
+        );
+      }
+
       const result = await fn.handler(args);
       Telemetry.sendTelemetry("agent_tool_call", { tool: name }, null, true);
       return await this.handleExecution(
diff --git a/server/utils/agents/aibitat/plugins/memory.js b/server/utils/agents/aibitat/plugins/memory.js
index c76b687b1b6..d31a264d18d 100644
--- a/server/utils/agents/aibitat/plugins/memory.js
+++ b/server/utils/agents/aibitat/plugins/memory.js
@@ -16,7 +16,37 @@ const memory = {
           tracker: new Deduplicator(),
           name: this.name,
           description:
-            "Search against local documents for context that is relevant to the query or store a snippet of text into memory for retrieval later. Storing information should only be done when the user specifically requests for information to be remembered or saved to long-term memory. You should use this tool before search the internet for information.",
+            "Search against local documents for context that is relevant to the query or store a snippet of text into memory for retrieval later. Storing information should only be done when the user specifically requests for information to be remembered or saved to long-term memory. You should use this tool before search the internet for information. Do not use this tool unless you are explicity told to 'remember' or 'store' information.",
+          examples: [
+            {
+              prompt: "What is AnythingLLM?",
+              call: JSON.stringify({
+                action: "search",
+                content: "What is AnythingLLM?",
+              }),
+            },
+            {
+              prompt: "What do you know about Plato's motives?",
+              call: JSON.stringify({
+                action: "search",
+                content: "What are the facts about Plato's motives?",
+              }),
+            },
+            {
+              prompt: "Remember that you are a robot",
+              call: JSON.stringify({
+                action: "store",
+                content: "I am a robot, the user told me that i am.",
+              }),
+            },
+            {
+              prompt: "Save that to memory please.",
+              call: JSON.stringify({
+                action: "store",
+                content: "<insert summary of conversation until now>",
+              }),
+            },
+          ],
           parameters: {
             $schema: "http://json-schema.org/draft-07/schema#",
             type: "object",
diff --git a/server/utils/agents/aibitat/plugins/save-file-browser.js b/server/utils/agents/aibitat/plugins/save-file-browser.js
index 0e509209618..716f37c38ed 100644
--- a/server/utils/agents/aibitat/plugins/save-file-browser.js
+++ b/server/utils/agents/aibitat/plugins/save-file-browser.js
@@ -16,6 +16,32 @@ const saveFileInBrowser = {
           name: this.name,
           description:
             "Save content to a file when the user explicity asks for a download of the file.",
+          examples: [
+            {
+              prompt: "Save me that to a file named 'output'",
+              call: JSON.stringify({
+                file_content:
+                  "<content of the file we will write previous conversation>",
+                filename: "output.txt",
+              }),
+            },
+            {
+              prompt: "Save me that to my desktop",
+              call: JSON.stringify({
+                file_content:
+                  "<content of the file we will write previous conversation>",
+                filename: "<relevant filename>.txt",
+              }),
+            },
+            {
+              prompt: "Save me that to a file",
+              call: JSON.stringify({
+                file_content:
+                  "<content of the file we will write from previous conversation>",
+                filename: "<descriptive filename>.txt",
+              }),
+            },
+          ],
           parameters: {
             $schema: "http://json-schema.org/draft-07/schema#",
             type: "object",
diff --git a/server/utils/agents/aibitat/plugins/summarize.js b/server/utils/agents/aibitat/plugins/summarize.js
index d0cfc6c1b2a..526de116ab0 100644
--- a/server/utils/agents/aibitat/plugins/summarize.js
+++ b/server/utils/agents/aibitat/plugins/summarize.js
@@ -19,6 +19,26 @@ const docSummarizer = {
           controller: new AbortController(),
           description:
             "Can get the list of files available to search with descriptions and can select a single file to open and summarize.",
+          examples: [
+            {
+              prompt: "Summarize example.txt",
+              call: JSON.stringify({
+                action: "summarize",
+                document_filename: "example.txt",
+              }),
+            },
+            {
+              prompt: "What files can you see?",
+              call: JSON.stringify({ action: "list", document_filename: null }),
+            },
+            {
+              prompt: "Tell me about readme.md",
+              call: JSON.stringify({
+                action: "summarize",
+                document_filename: "readme.md",
+              }),
+            },
+          ],
           parameters: {
             $schema: "http://json-schema.org/draft-07/schema#",
             type: "object",
diff --git a/server/utils/agents/aibitat/plugins/web-browsing.js b/server/utils/agents/aibitat/plugins/web-browsing.js
index 889de840f39..198b3ec5547 100644
--- a/server/utils/agents/aibitat/plugins/web-browsing.js
+++ b/server/utils/agents/aibitat/plugins/web-browsing.js
@@ -13,7 +13,21 @@ const webBrowsing = {
           super: aibitat,
           name: this.name,
           description:
-            "Searches for a given query online using a search engine.",
+            "Searches for a given query using a search engine to get better results for the user query.",
+          examples: [
+            {
+              prompt: "Who won the world series today?",
+              call: JSON.stringify({ query: "Winner of today's world series" }),
+            },
+            {
+              prompt: "What is AnythingLLM?",
+              call: JSON.stringify({ query: "AnythingLLM" }),
+            },
+            {
+              prompt: "Current AAPL stock price",
+              call: JSON.stringify({ query: "AAPL stock price today" }),
+            },
+          ],
           parameters: {
             $schema: "http://json-schema.org/draft-07/schema#",
             type: "object",
diff --git a/server/utils/agents/aibitat/plugins/web-scraping.js b/server/utils/agents/aibitat/plugins/web-scraping.js
index 1e614b6bac2..2888445b56a 100644
--- a/server/utils/agents/aibitat/plugins/web-scraping.js
+++ b/server/utils/agents/aibitat/plugins/web-scraping.js
@@ -16,7 +16,17 @@ const webScraping = {
           name: this.name,
           controller: new AbortController(),
           description:
-            "Scrapes the content of a webpage or online resource from a URL.",
+            "Scrapes the content of a webpage or online resource from a provided URL.",
+          examples: [
+            {
+              prompt: "What is useanything.com about?",
+              call: JSON.stringify({ url: "https://useanything.com" }),
+            },
+            {
+              prompt: "Scrape https://example.com",
+              call: JSON.stringify({ url: "https://example.com" }),
+            },
+          ],
           parameters: {
             $schema: "http://json-schema.org/draft-07/schema#",
             type: "object",
@@ -24,7 +34,8 @@ const webScraping = {
               url: {
                 type: "string",
                 format: "uri",
-                description: "A web URL.",
+                description:
+                  "A complete web address URL including protocol. Assumes https if not provided.",
               },
             },
             additionalProperties: false,
diff --git a/server/utils/agents/aibitat/providers/classes.js b/server/utils/agents/aibitat/providers/helpers/classes.js
similarity index 100%
rename from server/utils/agents/aibitat/providers/classes.js
rename to server/utils/agents/aibitat/providers/helpers/classes.js
diff --git a/server/utils/agents/aibitat/providers/untooled.js b/server/utils/agents/aibitat/providers/helpers/untooled.js
similarity index 66%
rename from server/utils/agents/aibitat/providers/untooled.js
rename to server/utils/agents/aibitat/providers/helpers/untooled.js
index acf71d28317..a84aad77c92 100644
--- a/server/utils/agents/aibitat/providers/untooled.js
+++ b/server/utils/agents/aibitat/providers/helpers/untooled.js
@@ -1,5 +1,5 @@
-const { safeJsonParse } = require("../../../http");
-const { Deduplicator } = require("../utils/dedupe");
+const { safeJsonParse } = require("../../../../http");
+const { Deduplicator } = require("../../utils/dedupe");
 
 // Useful inheritance class for a model which supports OpenAi schema for API requests
 // but does not have tool-calling or JSON output support.
@@ -22,17 +22,23 @@ class UnTooled {
     return modifiedMessages;
   }
 
-  formatFuncs(functions = []) {
-    const funcs = [];
+  showcaseFunctions(functions = []) {
+    let output = "";
     functions.forEach((def) => {
-      funcs.push({
-        name: def.name,
-        description: def.description,
-        properties: def.properties,
-      });
+      let shotExample = `-----------
+Function name: ${def.name}
+Function Description: ${def.description}
+Function parameters in JSON format:
+${JSON.stringify(def.parameters.properties, null, 4)}\n`;
+
+      if (Array.isArray(def.examples)) {
+        def.examples.forEach(({ prompt, call }) => {
+          shotExample += `Query: "${prompt}"\nJSON: ${call}\n`;
+        });
+      }
+      output += `${shotExample}-----------\n`;
     });
-
-    return JSON.stringify(funcs, null, 2);
+    return output;
   }
 
   /**
@@ -114,67 +120,15 @@ When a function is selection, respond in JSON with no additional text.
 When there is no relevant function to call - return with a regular chat text response.
 Your task is to pick a **single** function that we will use to call, if any seem useful or relevant for the user query.
 
-Example of Tool definitions:
-[
-  {
-    name: 'rag-memory',
-    description: 'Search against local documents for context that is relevant to the query or store a snippet of text into memory for retrieval later. Storing information should only be done when the user specifically requests for information to be remembered or saved to long-term memory. You should use this tool before search the internet for information.',
-    parameters: {
-      '$schema': 'http://json-schema.org/draft-07/schema#',
-      type: 'object',
-      properties: [
-        action: {
-          type: "string",
-          enum: ["search", "store"],
-          description:
-            "The action we want to take to search for existing similar context or storage of new context.",
-        },
-        content: {
-          type: "string",
-          description:
-            "The plain text to search our local documents with or to store in our vector database.",
-        },
-      ],
-      additionalProperties: false
-    }
-  },
-  {
-    name: 'web-scraping',
-    description: 'Scrapes the content of a webpage or online resource from a URL.',
-    parameters: {
-      '$schema': 'http://json-schema.org/draft-07/schema#',
-      type: 'object',
-      properties: [
-        url: {
-          type: "string",
-          format: "uri",
-          description: "A web URL.",
-        },
-      ],
-      additionalProperties: false
-    },
-  }
-]
-
-Example Query:
-User: Scrape https://example.com
-Your response (JSON ONLY): 
-{
-  name: 'web-scraping'.
-  arguments: {
-    url: 'https://example.com'
-  }
-}
-
-Example Query where tool cannot be used:
-User: Hello!
-Your response (Text Only): Hello, how are you today?
+All JSON responses should have two keys.
+'name': this is the name of the function name to call. eg: 'web-scraper', 'rag-memory', etc..
+'arguments': this is an object with the function properties to invoke the function.
+DO NOT INCLUDE ANY OTHER KEYS IN JSON RESPONSES.
 
-The available function and their definitions are listed below - respond only with JSON or a regular chat response.
-${this.formatFuncs(functions)}
+Here are the available tools you can use an examples of a query and response so you can understand how each one works.
+${this.showcaseFunctions(functions)}
 
-Now, assess the next function to call:
-`,
+Now pick a function if there is an appropriate one to use given the last user message and the given conversation so far.`,
             role: "system",
           },
           ...history,
diff --git a/server/utils/agents/aibitat/providers/lmstudio.js b/server/utils/agents/aibitat/providers/lmstudio.js
index 6fc73d5adb1..49387e43b41 100644
--- a/server/utils/agents/aibitat/providers/lmstudio.js
+++ b/server/utils/agents/aibitat/providers/lmstudio.js
@@ -1,7 +1,7 @@
 const OpenAI = require("openai");
-const InheritMultiple = require("./classes.js");
 const Provider = require("./ai-provider.js");
-const UnTooled = require("./untooled.js");
+const InheritMultiple = require("./helpers/classes.js");
+const UnTooled = require("./helpers/untooled.js");
 
 /**
  * The provider for the LMStudio provider.
@@ -20,6 +20,7 @@ class LMStudioProvider extends InheritMultiple([Provider, UnTooled]) {
     });
     this._client = client;
     this.model = model;
+    this.verbose = true;
   }
 
   get client() {

From 9e97cb320d0f2e205335d68c2825fc5f91d32ccf Mon Sep 17 00:00:00 2001
From: timothycarambat <rambat1010@gmail.com>
Date: Thu, 2 May 2024 18:22:45 -0700
Subject: [PATCH 4/5] Add Agent support for Ollama models

---
 .../AgentConfig/AgentLLMSelection/index.jsx   |   4 +-
 server/package.json                           |   1 +
 server/utils/agents/aibitat/index.js          |   2 +
 .../aibitat/providers/helpers/untooled.js     |  62 ++++------
 .../utils/agents/aibitat/providers/index.js   |   2 +
 .../agents/aibitat/providers/lmstudio.js      |  25 +++-
 .../utils/agents/aibitat/providers/ollama.js  | 107 ++++++++++++++++++
 server/utils/agents/index.js                  |   8 +-
 server/yarn.lock                              |   9 +-
 9 files changed, 177 insertions(+), 43 deletions(-)
 create mode 100644 server/utils/agents/aibitat/providers/ollama.js

diff --git a/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx b/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
index 408d60a026f..fcb12d94d5d 100644
--- a/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
+++ b/frontend/src/pages/WorkspaceSettings/AgentConfig/AgentLLMSelection/index.jsx
@@ -5,8 +5,8 @@ import { AVAILABLE_LLM_PROVIDERS } from "@/pages/GeneralSettings/LLMPreference";
 import { CaretUpDown, Gauge, MagnifyingGlass, X } from "@phosphor-icons/react";
 import AgentModelSelection from "../AgentModelSelection";
 
-const ENABLED_PROVIDERS = ["openai", "anthropic", "lmstudio"];
-const WARN_PERFORMANCE = ["lmstudio"];
+const ENABLED_PROVIDERS = ["openai", "anthropic", "lmstudio", "ollama"];
+const WARN_PERFORMANCE = ["lmstudio", "ollama"];
 
 const LLM_DEFAULT = {
   name: "Please make a selection",
diff --git a/server/package.json b/server/package.json
index afe6926de03..ca9e21fa3b0 100644
--- a/server/package.json
+++ b/server/package.json
@@ -59,6 +59,7 @@
     "multer": "^1.4.5-lts.1",
     "node-html-markdown": "^1.3.0",
     "node-llama-cpp": "^2.8.0",
+    "ollama": "^0.5.0",
     "openai": "4.38.5",
     "pinecone-client": "^1.1.0",
     "pluralize": "^8.0.0",
diff --git a/server/utils/agents/aibitat/index.js b/server/utils/agents/aibitat/index.js
index c3ad5428f57..9cf2170b7cf 100644
--- a/server/utils/agents/aibitat/index.js
+++ b/server/utils/agents/aibitat/index.js
@@ -741,6 +741,8 @@ ${this.getHistory({ to: route.to })
         return new Providers.AnthropicProvider({ model: config.model });
       case "lmstudio":
         return new Providers.LMStudioProvider({});
+      case "ollama":
+        return new Providers.OllamaProvider({ model: config.model });
 
       default:
         throw new Error(
diff --git a/server/utils/agents/aibitat/providers/helpers/untooled.js b/server/utils/agents/aibitat/providers/helpers/untooled.js
index a84aad77c92..37ecb5599f5 100644
--- a/server/utils/agents/aibitat/providers/helpers/untooled.js
+++ b/server/utils/agents/aibitat/providers/helpers/untooled.js
@@ -102,48 +102,34 @@ ${JSON.stringify(def.parameters.properties, null, 4)}\n`;
     return { valid: true, reason: null };
   }
 
-  async functionCall(messages, functions) {
+  async functionCall(messages, functions, chatCb = null) {
     const history = [...messages].filter((msg) =>
       ["user", "assistant"].includes(msg.role)
     );
     if (history[history.length - 1].role !== "user") return null;
-
-    const response = await this.client.chat.completions
-      .create({
-        model: this.model,
-        temperature: 0,
-        messages: [
-          {
-            content: `You are a program which picks the most optimal function and parameters to call. 
-DO NOT HAVE TO PICK A FUNCTION IF IT WILL NOT HELP ANSWER OR FULFILL THE USER'S QUERY.
-When a function is selection, respond in JSON with no additional text.
-When there is no relevant function to call - return with a regular chat text response.
-Your task is to pick a **single** function that we will use to call, if any seem useful or relevant for the user query.
-
-All JSON responses should have two keys.
-'name': this is the name of the function name to call. eg: 'web-scraper', 'rag-memory', etc..
-'arguments': this is an object with the function properties to invoke the function.
-DO NOT INCLUDE ANY OTHER KEYS IN JSON RESPONSES.
-
-Here are the available tools you can use an examples of a query and response so you can understand how each one works.
-${this.showcaseFunctions(functions)}
-
-Now pick a function if there is an appropriate one to use given the last user message and the given conversation so far.`,
-            role: "system",
-          },
-          ...history,
-        ],
-      })
-      .then((result) => {
-        if (!result.hasOwnProperty("choices"))
-          throw new Error("LMStudio chat: No results!");
-        if (result.choices.length === 0)
-          throw new Error("LMStudio chat: No results length!");
-        return result.choices[0].message.content;
-      })
-      .catch((_) => {
-        return null;
-      });
+    const response = await chatCb({
+      messages: [
+        {
+          content: `You are a program which picks the most optimal function and parameters to call. 
+      DO NOT HAVE TO PICK A FUNCTION IF IT WILL NOT HELP ANSWER OR FULFILL THE USER'S QUERY.
+      When a function is selection, respond in JSON with no additional text.
+      When there is no relevant function to call - return with a regular chat text response.
+      Your task is to pick a **single** function that we will use to call, if any seem useful or relevant for the user query.
+
+      All JSON responses should have two keys.
+      'name': this is the name of the function name to call. eg: 'web-scraper', 'rag-memory', etc..
+      'arguments': this is an object with the function properties to invoke the function.
+      DO NOT INCLUDE ANY OTHER KEYS IN JSON RESPONSES.
+
+      Here are the available tools you can use an examples of a query and response so you can understand how each one works.
+      ${this.showcaseFunctions(functions)}
+
+      Now pick a function if there is an appropriate one to use given the last user message and the given conversation so far.`,
+          role: "system",
+        },
+        ...history,
+      ],
+    });
 
     const call = safeJsonParse(response, null);
     if (call === null) return { toolCall: null, text: response }; // failed to parse, so must be text.
diff --git a/server/utils/agents/aibitat/providers/index.js b/server/utils/agents/aibitat/providers/index.js
index ebe4de33f06..fda8b51360f 100644
--- a/server/utils/agents/aibitat/providers/index.js
+++ b/server/utils/agents/aibitat/providers/index.js
@@ -1,9 +1,11 @@
 const OpenAIProvider = require("./openai.js");
 const AnthropicProvider = require("./anthropic.js");
 const LMStudioProvider = require("./lmstudio.js");
+const OllamaProvider = require("./ollama.js");
 
 module.exports = {
   OpenAIProvider,
   AnthropicProvider,
   LMStudioProvider,
+  OllamaProvider,
 };
diff --git a/server/utils/agents/aibitat/providers/lmstudio.js b/server/utils/agents/aibitat/providers/lmstudio.js
index 49387e43b41..d3aa4346a71 100644
--- a/server/utils/agents/aibitat/providers/lmstudio.js
+++ b/server/utils/agents/aibitat/providers/lmstudio.js
@@ -27,6 +27,25 @@ class LMStudioProvider extends InheritMultiple([Provider, UnTooled]) {
     return this._client;
   }
 
+  async #handleFunctionCallChat({ messages = [] }) {
+    // Request is created outside the try: only a rejected request or a bad payload maps to null.
+    const pending = this.client.chat.completions.create({
+      model: this.model,
+      temperature: 0,
+      messages,
+    });
+    try {
+      const result = await pending;
+      if (!result.hasOwnProperty("choices"))
+        throw new Error("LMStudio chat: No results!");
+      if (result.choices.length === 0)
+        throw new Error("LMStudio chat: No results length!");
+      return result.choices[0].message.content;
+    } catch (_) {
+      return null;
+    }
+  }
+
   /**
    * Create a completion based on the received messages.
    *
@@ -38,7 +57,11 @@ class LMStudioProvider extends InheritMultiple([Provider, UnTooled]) {
     try {
       let completion;
       if (functions.length > 0) {
-        const { toolCall, text } = await this.functionCall(messages, functions);
+        const { toolCall, text } = await this.functionCall(
+          messages,
+          functions,
+          this.#handleFunctionCallChat.bind(this)
+        );
 
         if (toolCall !== null) {
           this.providerLog(`Valid tool call found - running ${toolCall.name}.`);
diff --git a/server/utils/agents/aibitat/providers/ollama.js b/server/utils/agents/aibitat/providers/ollama.js
new file mode 100644
index 00000000000..d52d80caa08
--- /dev/null
+++ b/server/utils/agents/aibitat/providers/ollama.js
@@ -0,0 +1,107 @@
+const Provider = require("./ai-provider.js");
+const InheritMultiple = require("./helpers/classes.js");
+const UnTooled = require("./helpers/untooled.js");
+const { Ollama } = require("ollama");
+
+/**
+ * Agent provider backed by an Ollama server (host read from OLLAMA_BASE_PATH).
+ * Tool calling is emulated through the prompt-based UnTooled helper class.
+ */
+class OllamaProvider extends InheritMultiple([Provider, UnTooled]) {
+  model;
+
+  /** @param config Optional settings; `model` is the model name sent to Ollama. */
+  constructor(config = {}) {
+    const { model = null } = config;
+
+    super();
+    this._client = new Ollama({ host: process.env.OLLAMA_BASE_PATH });
+    this.model = model;
+    this.verbose = true;
+  }
+
+  get client() {
+    return this._client;
+  }
+
+  // Chat callback given to `functionCall`: returns the reply text, or null if empty.
+  async #handleFunctionCallChat({ messages = [] }) {
+    const response = await this.client.chat({
+      model: this.model,
+      messages,
+      options: {
+        temperature: 0,
+      },
+    });
+    return response?.message?.content || null;
+  }
+
+  /**
+   * Create a completion based on the received messages.
+   *
+   * @param messages A list of messages to send to the API.
+   * @param functions Tool definitions to pick from; null or empty skips tool selection.
+   * @returns `{ result, cost }` for a text reply, or `{ result: null, functionCall, cost }`
+   * when a tool call was selected. Errors from the client propagate to the caller.
+   */
+  async complete(messages, functions = null) {
+    let completion;
+    // `functions` defaults to null, so guard before reading `.length`.
+    if (Array.isArray(functions) && functions.length > 0) {
+      // `functionCall` may resolve to null (last chat message not from the user).
+      const selection = await this.functionCall(
+        messages,
+        functions,
+        this.#handleFunctionCallChat.bind(this)
+      );
+      const { toolCall = null, text = null } = selection ?? {};
+
+      if (toolCall !== null) {
+        this.providerLog(`Valid tool call found - running ${toolCall.name}.`);
+        this.deduplicator.trackRun(toolCall.name, toolCall.arguments);
+        return {
+          result: null,
+          functionCall: {
+            name: toolCall.name,
+            arguments: toolCall.arguments,
+          },
+          cost: 0,
+        };
+      }
+      completion = { content: text };
+    }
+
+    if (!completion?.content) {
+      this.providerLog(
+        "Will assume chat completion without tool call inputs."
+      );
+      const response = await this.client.chat({
+        model: this.model,
+        messages: this.cleanMsgs(messages),
+        options: {
+          use_mlock: true,
+          temperature: 0.5,
+        },
+      });
+      completion = response.message;
+    }
+
+    return {
+      result: completion.content,
+      cost: 0,
+    };
+  }
+
+  /**
+   * Get the cost of the completion.
+   *
+   * @param _usage The completion to get the cost for.
+   * @returns The cost of the completion.
+   * Stubbed since Ollama has no cost basis.
+   */
+  getCost(_usage) {
+    return 0;
+  }
+}
+
+module.exports = OllamaProvider;
diff --git a/server/utils/agents/index.js b/server/utils/agents/index.js
index 5e54c0b3f67..e18b8b7bb94 100644
--- a/server/utils/agents/index.js
+++ b/server/utils/agents/index.js
@@ -79,7 +79,11 @@ class AgentHandler {
         break;
       case "lmstudio":
         if (!process.env.LMSTUDIO_BASE_PATH)
-          throw new Error("LMStudio bash path must be provided to use agents.");
+          throw new Error("LMStudio base path must be provided to use agents.");
+        break;
+      case "ollama":
+        if (!process.env.OLLAMA_BASE_PATH)
+          throw new Error("Ollama base path must be provided to use agents.");
         break;
       default:
         throw new Error("No provider found to power agent cluster.");
@@ -94,6 +98,8 @@ class AgentHandler {
         return "claude-3-sonnet-20240229";
       case "lmstudio":
         return "server-default";
+      case "ollama":
+        return "llama3:latest";
       default:
         return "unknown";
     }
diff --git a/server/yarn.lock b/server/yarn.lock
index 1911849d453..c5954570952 100644
--- a/server/yarn.lock
+++ b/server/yarn.lock
@@ -4560,6 +4560,13 @@ octokit@^3.1.0:
     "@octokit/request-error" "^5.0.0"
     "@octokit/types" "^12.0.0"
 
+ollama@^0.5.0:
+  version "0.5.0"
+  resolved "https://registry.yarnpkg.com/ollama/-/ollama-0.5.0.tgz#cb9bc709d4d3278c9f484f751b0d9b98b06f4859"
+  integrity sha512-CRtRzsho210EGdK52GrUMohA2pU+7NbgEaBG3DcYeRmvQthDO7E2LHOkLlUUeaYUlNmEd8icbjC02ug9meSYnw==
+  dependencies:
+    whatwg-fetch "^3.6.20"
+
 on-finished@2.4.1:
   version "2.4.1"
   resolved "https://registry.yarnpkg.com/on-finished/-/on-finished-2.4.1.tgz#58c8c44116e54845ad57f14ab10b03533184ac3f"
@@ -5980,7 +5987,7 @@ webidl-conversions@^3.0.0:
   resolved "https://registry.yarnpkg.com/webidl-conversions/-/webidl-conversions-3.0.1.tgz#24534275e2a7bc6be7bc86611cc16ae0a5654871"
   integrity sha512-2JAn3z8AR6rjK8Sm8orRC0h/bcl/DqL7tRPdGZ4I1CjdF+EaMLmYxBHyXuKL849eucPFhvBoxMsflfOb8kxaeQ==
 
-whatwg-fetch@^3.4.1:
+whatwg-fetch@^3.4.1, whatwg-fetch@^3.6.20:
   version "3.6.20"
   resolved "https://registry.yarnpkg.com/whatwg-fetch/-/whatwg-fetch-3.6.20.tgz#580ce6d791facec91d37c72890995a0b48d31c70"
   integrity sha512-EqhiFU6daOA8kpjOWTL0olhVOF3i7OrFzSYiGsEMB8GcXS+RrzauAERX65xMeNWVqxA6HXH2m69Z9LaKKdisfg==

From af1acc4c3e51d1c5ad7645114ddf10e11804102b Mon Sep 17 00:00:00 2001
From: timothycarambat <rambat1010@gmail.com>
Date: Tue, 7 May 2024 18:05:39 -0700
Subject: [PATCH 5/5] improve json parsing for ollama text responses

---
 server/package.json        | 1 +
 server/utils/http/index.js | 7 +++++--
 server/yarn.lock           | 5 +++++
 3 files changed, 11 insertions(+), 2 deletions(-)

diff --git a/server/package.json b/server/package.json
index ca9e21fa3b0..edee71b023c 100644
--- a/server/package.json
+++ b/server/package.json
@@ -46,6 +46,7 @@
     "dotenv": "^16.0.3",
     "express": "^4.18.2",
     "express-ws": "^5.0.2",
+    "extract-json-from-string": "^1.0.1",
     "extract-zip": "^2.0.1",
     "graphql": "^16.7.1",
     "joi": "^17.11.0",
diff --git a/server/utils/http/index.js b/server/utils/http/index.js
index 1fc8c5b961c..6400c36bcf7 100644
--- a/server/utils/http/index.js
+++ b/server/utils/http/index.js
@@ -4,6 +4,7 @@ process.env.NODE_ENV === "development"
 const JWT = require("jsonwebtoken");
 const { User } = require("../../models/user");
 const { jsonrepair } = require("jsonrepair");
+const extract = require("extract-json-from-string");
 
 function reqBody(request) {
   return typeof request.body === "string"
@@ -67,8 +68,6 @@ function safeJsonParse(jsonString, fallback = null) {
     return JSON.parse(jsonString);
   } catch {}
 
-  // If the jsonString does not look like an Obj or Array, dont attempt
-  // to repair it.
   if (jsonString?.startsWith("[") || jsonString?.startsWith("{")) {
     try {
       const repairedJson = jsonrepair(jsonString);
@@ -76,6 +75,10 @@ function safeJsonParse(jsonString, fallback = null) {
     } catch {}
   }
 
+  try {
+    return extract(jsonString)[0] ?? fallback; // no JSON found => fallback, not undefined
+  } catch {}
+
   return fallback;
 }
 
diff --git a/server/yarn.lock b/server/yarn.lock
index c5954570952..5edd09a351f 100644
--- a/server/yarn.lock
+++ b/server/yarn.lock
@@ -2678,6 +2678,11 @@ extract-files@^9.0.0:
   resolved "https://registry.yarnpkg.com/extract-files/-/extract-files-9.0.0.tgz#8a7744f2437f81f5ed3250ed9f1550de902fe54a"
   integrity sha512-CvdFfHkC95B4bBBk36hcEmvdR2awOdhhVUYH6S/zrVj3477zven/fJMYg7121h4T1xHZC+tetUpubpAhxwI7hQ==
 
+extract-json-from-string@^1.0.1:
+  version "1.0.1"
+  resolved "https://registry.yarnpkg.com/extract-json-from-string/-/extract-json-from-string-1.0.1.tgz#5001f17e6c905826dcd5989564e130959de60c96"
+  integrity sha512-xfQOSFYbELVs9QVkKsV9FZAjlAmXQ2SLR6FpfFX1kpn4QAvaGBJlrnVOblMLwrLPYc26H+q9qxo6JTd4E7AwgQ==
+
 extract-zip@^2.0.1:
   version "2.0.1"
   resolved "https://registry.yarnpkg.com/extract-zip/-/extract-zip-2.0.1.tgz#663dca56fe46df890d5f131ef4a06d22bb8ba13a"