Fix: add local model host for docker deployment (#156)
saimanoj authored Jul 26, 2024
1 parent d93cf7c commit cd75d91
Showing 3 changed files with 16 additions and 10 deletions.
2 changes: 1 addition & 1 deletion .env.example
@@ -99,7 +99,7 @@ COHERE_API_KEY=
OPENAI_API_KEY=

LOCAL_MODEL=llama3

OLLAMA_HOST=http://localhost:11434



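The new OLLAMA_HOST variable is what makes Docker deployments work: inside the server container, localhost refers to the container itself, so the default http://localhost:11434 only reaches Ollama when it runs alongside the server process. A hypothetical override for a Compose setup where Ollama runs as a sibling service named ollama (the service name is illustrative, not from this repository):

# Illustrative only — point OLLAMA_HOST at wherever Ollama is actually reachable
LOCAL_MODEL=llama3
OLLAMA_HOST=http://ollama:11434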
13 changes: 9 additions & 4 deletions apps/server/src/modules/ai-requests/ai-requests.services.ts
@@ -1,6 +1,6 @@
import { Injectable, Logger } from '@nestjs/common';
import { PrismaService } from 'nestjs-prisma';
import ollama from 'ollama';
import { Ollama } from 'ollama';
import OpenAI from 'openai';
import { ChatCompletionMessageParam } from 'openai/resources';

@@ -10,13 +10,15 @@ import { requestInputBody } from './ai-requests.interface';
export default class AIRequestsService {
private readonly logger: Logger = new Logger('RequestsService');
private readonly openaiClient;
private readonly ollama;
constructor(private prisma: PrismaService) {
if (process.env['OPENAI_API_KEY']) {
this.openaiClient = new OpenAI({
apiKey: process.env['OPENAI_API_KEY'],
});
} else {
ollama.pull({ model: process.env['LOCAL_MODEL'] });
this.ollama = new Ollama({ host: process.env['OLLAMA_HOST'] });
this.ollama.pull({ model: process.env['LOCAL_MODEL'] });
}
}

@@ -25,6 +27,10 @@ export default class AIRequestsService {
const messages = reqBody.messages;
let model = reqBody.llmModel;
this.logger.log(`Received request with model: ${model}`);
if (!process.env['OPENAI_API_KEY']) {
this.logger.log('OPENAI_API_KEY not found, using local model');
model = process.env['LOCAL_MODEL'];
}
switch (model) {
case 'gpt-3.5-turbo':
case 'gpt-4-turbo':
@@ -39,9 +45,8 @@
break;
default:
// Send request to ollama as fallback
model = process.env.LOCAL_MODEL;
this.logger.log(`Sending request to ollama with model: ${model}`);
const response = await ollama.chat({
const response = await this.ollama.chat({
model,
messages,
});
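
Taken together, the service now prefers OpenAI whenever OPENAI_API_KEY is set and otherwise sends requests to an Ollama instance at OLLAMA_HOST. A minimal, self-contained sketch of that selection pattern, assuming the ollama and openai packages are installed; names such as chat and ChatMessage are illustrative, not taken from the repository:

import { Ollama } from 'ollama';
import OpenAI from 'openai';

type ChatMessage = { role: 'system' | 'user' | 'assistant'; content: string };

// Prefer OpenAI when a key is configured; otherwise talk to Ollama at OLLAMA_HOST.
const openaiKey = process.env['OPENAI_API_KEY'];
const openai = openaiKey ? new OpenAI({ apiKey: openaiKey }) : undefined;
const ollama = new Ollama({ host: process.env['OLLAMA_HOST'] ?? 'http://localhost:11434' });

async function chat(messages: ChatMessage[], model: string): Promise<string> {
  if (openai) {
    // Cloud path: forward the request with the caller's requested model.
    const completion = await openai.chat.completions.create({ model, messages });
    return completion.choices[0].message.content ?? '';
  }
  // Local path: the requested model is replaced by the locally served one.
  const response = await ollama.chat({
    model: process.env['LOCAL_MODEL'] ?? 'llama3',
    messages,
  });
  return response.message.content;
}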
11 changes: 6 additions & 5 deletions turbo.json
@@ -57,6 +57,7 @@
"COHERE_API_KEY",
"OPENAI_API_KEY",
"LOCAL_MODEL",
"OLLAMA_HOST",

"TRIGGER_DB",
"TRIGGER_DATABASE_URL",
@@ -75,18 +76,18 @@
"ui": "tui",
"tasks": {
"start-prod": {
"dependsOn": [ "db:generate" ],
"dependsOn": ["db:generate"],
"cache": false
},
"dev": {
"dependsOn": [ "db:generate" ],
"dependsOn": ["db:generate"],
"cache": false
},
"build": {
"dependsOn": [ "db:generate" ],
"outputs": [ "dist/**", ".next/**" ]
"dependsOn": ["db:generate"],
"outputs": ["dist/**", ".next/**"]
},
"lint": { },
"lint": {},
"create-resources": {
"interactive": true,
"cache": false
