-
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdocker-compose.yml
56 lines (52 loc) · 1.38 KB
/
docker-compose.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
# Application stack: the API service, its Elasticsearch backend, and a
# llama.cpp inference server. Services reach each other by service name
# on the default Compose network.
services:
  # API service, built from the Dockerfile in this directory.
  app:
    container_name: fasten-app
    build:
      context: .
      dockerfile: Dockerfile
    environment:
      ES_HOST: http://elasticsearch:9200
      # NOTE(review): security is disabled on the elasticsearch service in
      # this file, so these credentials are presumably unused - confirm.
      # Never commit real secrets here.
      ES_USER: elastic
      ES_PASSWORD: changeme
      ES_INDEX_NAME: fasten-index
      EMBEDDING_MODEL_NAME: all-MiniLM-L6-v2
      # Must match the --port the llama service is started with (8080).
      LLM_HOST: http://llama:8080
    ports:
      - "8000:8000"
    volumes:
      - ./data:/app/data
    depends_on:
      # Start only after the elasticsearch healthcheck reports healthy.
      elasticsearch:
        condition: service_healthy
    restart: always
    command: >-
      uvicorn app.main:app --host 0.0.0.0 --port 8000 --reload

  # Single-node Elasticsearch with xpack security and HTTP TLS disabled.
  elasticsearch:
    container_name: fasten-elasticsearch
    image: docker.elastic.co/elasticsearch/elasticsearch:8.12.1
    environment:
      discovery.type: single-node
      xpack.security.enabled: "false"
      xpack.security.http.ssl.enabled: "false"
    ports:
      - "9200:9200"
    mem_limit: 512m
    volumes:
      # Named volume declared under the top-level `volumes` key.
      - esdata:/usr/share/elasticsearch/data
    healthcheck:
      # Healthy once the HTTP API answers the _cat/health request.
      test:
        - "CMD-SHELL"
        - "curl -fsSL http://localhost:9200/_cat/health || exit 1"
      interval: 30s
      timeout: 10s
      retries: 3

  # llama.cpp HTTP server serving a local GGUF model.
  llama:
    container_name: fasten-llama
    image: ghcr.io/ggerganov/llama.cpp:server
    volumes:
      - ./models:/models
    # The model path is absolute so it resolves inside the /models mount
    # regardless of the image's working directory. The server listens on
    # container port 8080, which is what LLM_HOST on the app points at.
    command: >-
      -m /models/Meta-Llama-3.1-8B-Instruct-F16-Q5_K_M.gguf
      -n 450 -c 2048 -t 10 --host 0.0.0.0 --port 8080
    ports:
      # Host port 8090 forwards to the container's listening port 8080.
      - "8090:8080"
# Named volumes managed by Docker.
volumes:
  # Mounted at /usr/share/elasticsearch/data by the elasticsearch service.
  esdata:
    driver: local