-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathportainer-stack-cuda.yml
More file actions
40 lines (39 loc) · 1.1 KB
/
Copy pathportainer-stack-cuda.yml
File metadata and controls
40 lines (39 loc) · 1.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
# Compose stack that runs the code-index API container with one NVIDIA GPU
# reserved and all of its persistent state kept on a single named volume.
services:
  code-index-api:
    image: dvcdsys/code-index:go-cu128
    container_name: code-index
    restart: unless-stopped
    ports:
      # Quoted so the host:container mapping is always read as a string.
      - "21847:21847"
    environment:
      # ${VAR} and ${VAR:-default} are interpolated by Compose at deploy time.
      # API_KEY has no default here; it resolves to an empty value if unset.
      - CIX_API_KEY=${API_KEY}
      - CIX_EMBEDDING_MODEL=${EMBEDDING_MODEL:-awhiteside/CodeRankEmbed-Q8_0-GGUF}
      # The Chroma directory, SQLite file and model cache all live under
      # /data, which is the mount point of the cix_data volume below.
      - CIX_CHROMA_PERSIST_DIR=/data/chroma
      - CIX_SQLITE_PATH=/data/sqlite/projects.db
      # NOTE(review): 524288 is presumably a byte count (512 KiB) - confirm.
      - CIX_MAX_FILE_SIZE=${MAX_FILE_SIZE:-524288}
      - CIX_EXCLUDED_DIRS=${EXCLUDED_DIRS:-node_modules,.git,.venv,__pycache__,dist,build,.next,.cache,.DS_Store}
      # NOTE(review): 99 presumably means "offload every layer" - confirm.
      - CIX_N_GPU_LAYERS=99
      # Same value (120) as healthcheck.start_period below.
      - CIX_LLAMA_STARTUP_TIMEOUT=120
      - CIX_GGUF_CACHE_DIR=/data/models
      - NVIDIA_VISIBLE_DEVICES=all
    volumes:
      - cix_data:/data
    deploy:
      resources:
        limits:
          memory: 10G
        reservations:
          memory: 2G
          # Reserve a single GPU through the nvidia device driver.
          devices:
            - driver: nvidia
              count: 1
              capabilities: [gpu]
    healthcheck:
      # The list form must begin with CMD (exec form), CMD-SHELL or NONE;
      # the binary and its flag follow as separate arguments.
      test: ["CMD", "/cix-server", "-healthcheck"]
      interval: 30s
      timeout: 10s
      # Failures during the first 120s do not count against `retries`.
      start_period: 120s
      retries: 3

# Named volume backing /data in the code-index-api service.
volumes:
  cix_data:
    driver: local