Skip to content

Commit

Permalink
feat: add ollama support
Browse files Browse the repository at this point in the history
  • Loading branch information
kkoch986 committed Mar 21, 2024
1 parent 5eb826e commit dfb8acf
Show file tree
Hide file tree
Showing 5 changed files with 111 additions and 4 deletions.
2 changes: 1 addition & 1 deletion Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ FROM node:18-alpine AS build
WORKDIR /srv
COPY package*.json /srv/
RUN npm ci
# COPY tsconfig.json /srv/

COPY index.ts /srv/index.ts
RUN npx tsc index.ts
RUN npm ci --production
Expand Down
5 changes: 4 additions & 1 deletion Makefile
Original file line number Diff line number Diff line change
@@ -1,6 +1,9 @@
GIT_SHA=$(shell git rev-parse --short=8 HEAD)

all: index.js
pull-models:
curl http://localhost:11434/api/pull -d '{"name": "neural-chat"}'

all: index.js pull-models
node index.js

index.js: index.ts
Expand Down
3 changes: 2 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -2,9 +2,10 @@

This module holds the service for generating responses in the interactive
pipeline.
It currently offers 2 backends:
It currently offers 3 backends:

* [Character.AI](https://beta.character.ai/) (using [the Node Unofficial API](https://github.com/realcoloride/node_characterai))
* [Ollama](https://ollama.com/)
* An "Echo" backend which just replies with exactly what you send it

## Interface
Expand Down
13 changes: 12 additions & 1 deletion docker-compose.yml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,18 @@ services:
ports:
- "3000:3000"
environment:
BACKEND_TYPE: "characterai"
BACKEND_TYPE: "ollama"
SERVER_PORT: 3000
CHARACTER_AI_TOKEN: "${CHARACTER_AI_TOKEN}"
CHARACTER_AI_CHARACTER_ID: "1AYQkwEQ83I3JKxMeNvctG4m7kQL1zTPJuGugAVsT_k"
ollama:
image: ollama/ollama:latest
ports:
- "11434:11434"
# deploy:
# resources:
# reservations:
# devices:
# - driver: nvidia
# count: 1
# capabilities: [gpu]
92 changes: 92 additions & 0 deletions index.ts
Original file line number Diff line number Diff line change
Expand Up @@ -13,11 +13,88 @@ type Response = {
text: string,
};

// One chat message in the Ollama /api/chat wire format.
// Role is kept as a plain string (not a literal union) because assistant
// replies are pushed into the history straight off the wire response.
type Message = {
role: string,
content: string,
};

// Contract shared by all chat backends (echo, Character.AI, Ollama).
interface Backend {
// Open a conversation and return the backend's opening reply.
start(): Promise<Response>,
// Deliver one user message and return the backend's reply.
receive(message:string): Promise<Response>,
};

// OLlama backend is backed by ollama
// the assumption is that relevant models have already been pulled
class OLlamaBackend implements Backend {
private baseURL:string;
private model:string;
private systemPrompts:string[];
private initialPrompt: string;
private messages: Message[];

async initialize(baseURL: string, model: string, systemPrompts: string[], initialPrompt: string) {
this.model = model;
this.baseURL = baseURL;
this.systemPrompts = systemPrompts;
this.initialPrompt = initialPrompt;
// LATER: we could pull the model at this point, but that seems like not necessary at this point
}

async sendPrompt(message:string): Promise<Response> {
if (message != "") {
this.messages.push({
role: 'user',
content: message,
});
}
const p = await fetch(this.baseURL + "api/chat", {
method: "POST",
body: JSON.stringify({
"model": this.model,
// LATER: support streaming calls?
"stream": false,
"options": {
"temperature": 1
},
"messages": this.messages,
}),
})
.then((response) => response.json())
.then((resp: any) => {
// TODO: error handling
this.messages.push(resp.message);
const i = resp.created_at;
return {
id: i,
characterId: this.model,
chatId: i,
imageRelativePath: "",
srcName: "ollama-" + this.model,
text: resp.message.content,
};
});
return p;
}

async start(): Promise<Response> {
// send the basic system prompts and return the response
const messages = this.systemPrompts.map((m) => ({
"role": "system",
"content": m,
}));
messages.push({
"role": "user",
"content": this.initialPrompt,
});
this.messages = messages;
return this.sendPrompt("");
}

async receive(message: string): Promise<Response> {
return this.sendPrompt(message);
}
}

// Echo backend is just a testing backend that replies with exactly
// the message it was sent
class EchoBackend implements Backend {
Expand Down Expand Up @@ -141,6 +218,21 @@ class CharacterAIBackend implements Backend {
case "echo":
backend = new EchoBackend();
break ;
case "ollama":
const ol = new OLlamaBackend();
// TODO: better parameterize all of this...
await ol.initialize(
"http://ollama:11434/",
"neural-chat",
[
"you are a zoltar inspired fortune teller with a tiki / bayou flair",
"your name is Makani",
"you should always respond to prompts with a whimsical style",
],
"please introduce yourself",
);
backend = ol;
break ;
case "characterai":
const cai = new CharacterAIBackend();
await cai.initialize(token, characterId)
Expand Down

0 comments on commit dfb8acf

Please sign in to comment.