Skip to content

Commit 094d2f8

Browse files
committed
chore: test gpt-oss-120b, nemotron and qwen3
1 parent 926a90a commit 094d2f8

File tree

2 files changed

+8
-8
lines changed

2 files changed

+8
-8
lines changed

config/config.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -46,15 +46,15 @@ prompt_guard:
4646
# NOT supported: domain names (example.com), protocol prefixes (http://), paths (/api), ports in address (use 'port' field)
4747
vllm_endpoints:
4848
- name: "gpt-oss-120b-endpoint"
49-
address: "172.28.0.1" # Docker gateway IP to access host machine
49+
address: "192.168.48.1" # Host machine IP address
5050
port: 8001
5151
weight: 1
5252
- name: "qwen3-32b-endpoint"
53-
address: "172.28.0.1" # Docker gateway IP to access host machine
53+
address: "192.168.48.1" # Host machine IP address
5454
port: 8002
5555
weight: 1
5656
- name: "nemotron-super-endpoint"
57-
address: "172.28.0.1" # Docker gateway IP to access host machine
57+
address: "192.168.48.1" # Host machine IP address
5858
port: 8003
5959
weight: 1
6060

deploy/docker-compose/docker-compose.yml

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,7 @@ services:
2020
- HUGGINGFACE_HUB_CACHE=/root/.cache/huggingface
2121
- HF_HUB_ENABLE_HF_TRANSFER=1
2222
extra_hosts:
23-
- "host.docker.internal:172.28.0.1" # Allow container to reach host LLM endpoints
23+
- "host.docker.internal:172.32.0.1" # Allow container to reach host LLM endpoints
2424
networks:
2525
- semantic-network
2626
healthcheck:
@@ -43,7 +43,7 @@ services:
4343
- ./addons/envoy.yaml:/etc/envoy/envoy.yaml:ro,z
4444
command: ["/usr/local/bin/envoy", "-c", "/etc/envoy/envoy.yaml", "--component-log-level", "ext_proc:trace,router:trace,http:trace"]
4545
extra_hosts:
46-
- "host.docker.internal:172.28.0.1" # Allow container to reach host LLM endpoints
46+
- "host.docker.internal:172.32.0.1" # Allow container to reach host LLM endpoints
4747
depends_on:
4848
semantic-router:
4949
condition: service_healthy
@@ -67,7 +67,7 @@ services:
6767
- "8000:8000"
6868
networks:
6969
semantic-network:
70-
ipv4_address: 172.28.0.10
70+
ipv4_address: 172.32.0.10
7171
healthcheck:
7272
test: ["CMD", "curl", "-fsS", "http://localhost:8000/health"]
7373
interval: 10s
@@ -219,7 +219,7 @@ services:
219219
- hf-cache:/home/llmkatan/.cache/huggingface
220220
networks:
221221
semantic-network:
222-
ipv4_address: 172.28.0.20
222+
ipv4_address: 172.32.0.20
223223
command: ["llm-katan", "--model", "/app/models/Qwen/Qwen3-0.6B", "--served-model-name", "qwen3", "--host", "0.0.0.0", "--port", "8002"]
224224
healthcheck:
225225
test: ["CMD", "curl", "-fsS", "http://localhost:8002/health"]
@@ -278,7 +278,7 @@ networks:
278278
driver: bridge
279279
ipam:
280280
config:
281-
- subnet: 172.28.0.0/16
281+
- subnet: 172.32.0.0/16
282282

283283
volumes:
284284
models-cache:

0 commit comments

Comments
 (0)