From 6464a33912c62f087f81352ecf71aefcb4b1148f Mon Sep 17 00:00:00 2001
From: Richard Palethorpe <io@richiejp.com>
Date: Mon, 7 Apr 2025 11:25:35 +0100
Subject: [PATCH] fix(docker): Use localrecall main tag instead of master

Signed-off-by: Richard Palethorpe <io@richiejp.com>
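---
Note: besides the localrecall tag change named in the subject, the
docker-compose.yaml hunks below also switch an image from
localai/localai:latest-cpu to local-ai, enable the previously
commented-out rombo-org_rombo-llm-v3.0-qwen-32b model, change the
healthcheck (interval 10s -> 60s, timeout 20m -> 10m, retries 20 -> 120)
and add a /dev/dri device mapping. Please confirm these are intended
and not local development changes.
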
 docker-compose.gpu.yaml |  2 +-
 docker-compose.yaml     | 15 +++++++++------
 2 files changed, 10 insertions(+), 7 deletions(-)

diff --git a/docker-compose.gpu.yaml b/docker-compose.gpu.yaml
index 3f52417..382eb36 100644
--- a/docker-compose.gpu.yaml
+++ b/docker-compose.gpu.yaml
@@ -38,7 +38,7 @@ services:
               count: 1
               capabilities: [gpu]
   localrecall:
-    image: quay.io/mudler/localrecall:master
+    image: quay.io/mudler/localrecall:main
     ports:
       - 8080
     environment:
diff --git a/docker-compose.yaml b/docker-compose.yaml
index a400f87..771886a 100644
--- a/docker-compose.yaml
+++ b/docker-compose.yaml
@@ -5,16 +5,16 @@ services:
     # Available images with CUDA, ROCm, SYCL, Vulkan
     # Image list (quay.io): https://quay.io/repository/go-skynet/local-ai?tab=tags
     # Image list (dockerhub): https://hub.docker.com/r/localai/localai
-    image: localai/localai:latest-cpu
+    image: local-ai
     command: 
-    # - rombo-org_rombo-llm-v3.0-qwen-32b # minimum suggested model
+    - rombo-org_rombo-llm-v3.0-qwen-32b # minimum suggested model
     - arcee-agent # (smaller)
     - granite-embedding-107m-multilingual
     healthcheck:
       test: ["CMD", "curl", "-f", "http://localhost:8080/readyz"]
-      interval: 10s
-      timeout: 20m
-      retries: 20
+      interval: 60s
+      timeout: 10m
+      retries: 120
     ports:
     - 8081:8080
     environment:
@@ -23,6 +23,9 @@ services:
     volumes:
       - ./volumes/models:/build/models:cached
       - ./volumes/images:/tmp/generated/images
+    devices:
+      - /dev/dri
+
     # decomment the following piece if running with Nvidia GPUs
     # deploy:
     #   resources:
@@ -32,7 +35,7 @@ services:
     #           count: 1
     #           capabilities: [gpu]
   localrecall:
-    image: quay.io/mudler/localrecall:master
+    image: quay.io/mudler/localrecall:main
     ports:
       - 8080
     environment: