From 6464a33912c62f087f81352ecf71aefcb4b1148f Mon Sep 17 00:00:00 2001 From: Richard Palethorpe Date: Mon, 7 Apr 2025 11:25:35 +0100 Subject: [PATCH] fix(docker): Use localrecall main tag instead of master Signed-off-by: Richard Palethorpe --- docker-compose.gpu.yaml | 2 +- docker-compose.yaml | 15 +++++++++------ 2 files changed, 10 insertions(+), 7 deletions(-) diff --git a/docker-compose.gpu.yaml b/docker-compose.gpu.yaml index 3f52417..382eb36 100644 --- a/docker-compose.gpu.yaml +++ b/docker-compose.gpu.yaml @@ -38,7 +38,7 @@ services: count: 1 capabilities: [gpu] localrecall: - image: quay.io/mudler/localrecall:master + image: quay.io/mudler/localrecall:main ports: - 8080 environment: diff --git a/docker-compose.yaml b/docker-compose.yaml index a400f87..771886a 100644 --- a/docker-compose.yaml +++ b/docker-compose.yaml @@ -5,16 +5,16 @@ services: # Available images with CUDA, ROCm, SYCL, Vulkan # Image list (quay.io): https://quay.io/repository/go-skynet/local-ai?tab=tags # Image list (dockerhub): https://hub.docker.com/r/localai/localai - image: localai/localai:latest-cpu + image: local-ai command: - # - rombo-org_rombo-llm-v3.0-qwen-32b # minimum suggested model + - rombo-org_rombo-llm-v3.0-qwen-32b # minimum suggested model - arcee-agent # (smaller) - granite-embedding-107m-multilingual healthcheck: test: ["CMD", "curl", "-f", "http://localhost:8080/readyz"] - interval: 10s - timeout: 20m - retries: 20 + interval: 60s + timeout: 10m + retries: 120 ports: - 8081:8080 environment: @@ -23,6 +23,9 @@ services: volumes: - ./volumes/models:/build/models:cached - ./volumes/images:/tmp/generated/images + devices: + - /dev/dri + # decomment the following piece if running with Nvidia GPUs # deploy: # resources: @@ -32,7 +35,7 @@ services: # count: 1 # capabilities: [gpu] localrecall: - image: quay.io/mudler/localrecall:master + image: quay.io/mudler/localrecall:main ports: - 8080 environment: