-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathcompose.yml
More file actions
31 lines (30 loc) · 1016 Bytes
/
compose.yml
File metadata and controls
31 lines (30 loc) · 1016 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# - Requirement: local file ./goinfer.ini
# - Build: DOCKER_BUILDKIT=1 docker compose build
# - Run: docker compose up
# - Stop: CTRL + C
# - Clean: docker compose down
services:
  # Single service; its image is built locally from ./Containerfile
  # using the build args below.
  goinfer-llama:
    image: goinfer-llama
    container_name: goinfer-llama
    build:
      context: .
      dockerfile: ./Containerfile
      args:
        # llama.cpp tags: https://github.com/ggml-org/llama.cpp/tags
        - llama_git_tag=b6131
        # Nvidia container images: https://hub.docker.com/r/nvidia/cuda
        - CUDA_VERSION=13.0
        - CUDA_PATCH=1
        - UBUNTU_VERSION=24.04
    # No need for arguments: an explicit null keeps the command declared
    # by the image (a bare `command:` parses to the same null value).
    command: null
    ports:
      # Quoted so the HOST:CONTAINER mapping is always read as a string.
      - "8080:8080"
    volumes:
      # GI_MODELS_DIR is also used by goinfer
      - ${GI_MODELS_DIR:-./models}:/models
      # NOTE(review): presumably build caches (ccache / Go) persisted on the
      # host between runs -- confirm against the Containerfile.
      - ${CCACHE_DIR:-./.ccache}:/root/.ccache
      - ${GO_CACHE_DIR:-./.go}:/root/go
      # Host ./goinfer.ini is bind-mounted at /app/goinfer.ini.
      - ./goinfer.ini:/app/goinfer.ini
    environment:
      # time.Unix() uses UTC instead of local time zone
      - TZ=UTC0
    # restart: unless-stopped