Add linux-gpu profile to enable GPU (#64)

Matthieu Mérigot-Lombard
2023-11-03 17:16:35 +01:00
committed by GitHub
parent 4071ae1b69
commit 611bf84da2
2 changed files with 14 additions and 1 deletion


@@ -1,11 +1,22 @@
 services:
-  llm:
+  llm: &llm
     image: ollama/ollama:latest
     profiles: ["linux"]
     networks:
       - net
+  llm-gpu:
+    <<: *llm
+    profiles: ["linux-gpu"]
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: all
+              capabilities: [gpu]
   pull-model:
     image: genai-stack/pull-model:latest
     build:
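
The `&llm` anchor together with the `<<: *llm` merge key lets `llm-gpu` reuse the CPU service definition and override only what it declares itself. As a rough sketch (assuming Compose's standard YAML merge-key handling; the inline comments are added here for illustration and are not part of the file), the `llm-gpu` service resolves to:

  llm-gpu:
    image: ollama/ollama:latest     # inherited from the llm anchor
    networks:
      - net                         # inherited from the llm anchor
    profiles: ["linux-gpu"]         # overrides the inherited ["linux"]
    deploy:                         # declared only on the GPU variant
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: all
              capabilities: [gpu]

Keys set directly on `llm-gpu` (here `profiles` and `deploy`) take precedence over the ones copied from the anchor, so only the profile name and the NVIDIA device reservation differ from `llm`.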


@@ -38,6 +38,8 @@
 No need to install Ollama manually, it will run in a container as part of the stack when running with the Linux profile: run `docker compose --profile linux up`.
 Make sure to set the `OLLAMA_BASE_URL=http://llm:11434` in the `.env` file when using the Ollama docker container.
+To use the Linux-GPU profile: run `docker compose --profile linux-gpu up`. Also change `OLLAMA_BASE_URL=http://llm-gpu:11434` in the `.env` file.
 **Windows**
 Not supported by Ollama, so Windows users need to generate an OpenAI API key and configure the stack to use `gpt-3.5` or `gpt-4` in the `.env` file.
 # Develop