diff --git a/recipes/gb300-fp8/1k1k/stp/low-latency.yaml b/recipes/gb300-fp8/1k1k/stp/low-latency.yaml index baaad52c..70f529a5 100644 --- a/recipes/gb300-fp8/1k1k/stp/low-latency.yaml +++ b/recipes/gb300-fp8/1k1k/stp/low-latency.yaml @@ -1,7 +1,7 @@ name: "gb300-1k1k-fp8-low-latency" model: - path: "dsfp8" + path: "dsr1-fp8" container: "lmsysorg/sglang:v0.5.8-cu130" precision: "fp8" diff --git a/recipes/gb300-fp8/1k1k/stp/max.yaml b/recipes/gb300-fp8/1k1k/stp/max.yaml index 22b5954c..5dd098d5 100644 --- a/recipes/gb300-fp8/1k1k/stp/max.yaml +++ b/recipes/gb300-fp8/1k1k/stp/max.yaml @@ -3,7 +3,7 @@ name: "gb300-1k1k-fp8-max" model: - path: "dsfp8" + path: "dsr1-fp8" container: "lmsysorg/sglang:v0.5.8-cu130" precision: "fp8" diff --git a/recipes/gb300-fp8/1k1k/stp/mid.yaml b/recipes/gb300-fp8/1k1k/stp/mid.yaml index d3b13f41..32766f4e 100644 --- a/recipes/gb300-fp8/1k1k/stp/mid.yaml +++ b/recipes/gb300-fp8/1k1k/stp/mid.yaml @@ -2,7 +2,7 @@ name: "gb300-1k1k-fp8-mid" model: - path: "dsfp8" + path: "dsr1-fp8" container: "lmsysorg/sglang:v0.5.8-cu130" precision: "fp8" diff --git a/recipes/gb300-fp8/8k1k/stp/low-latency.yaml b/recipes/gb300-fp8/8k1k/stp/low-latency.yaml index 7fd79ef9..914fe9d3 100644 --- a/recipes/gb300-fp8/8k1k/stp/low-latency.yaml +++ b/recipes/gb300-fp8/8k1k/stp/low-latency.yaml @@ -1,7 +1,7 @@ name: "gb300-8k1k-fp8-low-latency" model: - path: "dsfp8" + path: "dsr1-fp8" container: "lmsysorg/sglang:v0.5.8-cu130" precision: "fp8" diff --git a/recipes/gb300-fp8/8k1k/stp/max.yaml b/recipes/gb300-fp8/8k1k/stp/max.yaml index dbbc190a..2d112d20 100644 --- a/recipes/gb300-fp8/8k1k/stp/max.yaml +++ b/recipes/gb300-fp8/8k1k/stp/max.yaml @@ -3,7 +3,7 @@ name: "gb300-8k1k-fp8-max" model: - path: "dsfp8" + path: "dsr1-fp8" container: "lmsysorg/sglang:v0.5.8-cu130" precision: "fp8" diff --git a/recipes/gb300-fp8/8k1k/stp/mid.yaml b/recipes/gb300-fp8/8k1k/stp/mid.yaml index 6d7ffca6..9ede478c 100644 --- a/recipes/gb300-fp8/8k1k/stp/mid.yaml +++ b/recipes/gb300-fp8/8k1k/stp/mid.yaml @@ -3,7 +3,7 @@ name: "gb300-8k1k-fp8-mid" model: - path: "dsfp8" + path: "dsr1-fp8" container: "lmsysorg/sglang:v0.5.8-cu130" precision: "fp8" diff --git a/src/srtctl/cli/setup_head.py b/src/srtctl/cli/setup_head.py index 45a4e96b..91582e3f 100644 --- a/src/srtctl/cli/setup_head.py +++ b/src/srtctl/cli/setup_head.py @@ -11,11 +11,11 @@ import argparse import logging import os +import shutil import subprocess import sys import time from pathlib import Path -import shutil # Network configurations ETCD_CLIENT_PORT = 2379