diff --git a/pyproject.toml b/pyproject.toml index 39514d2e2a..6ee93ea899 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -111,15 +111,15 @@ override-dependencies = [ "torch; sys_platform == 'never'", "torchvision; sys_platform == 'never'", "triton; sys_platform == 'never'", - "transformer-engine @ git+https://github.com/NVIDIA/TransformerEngine.git@6a34b6574fa6c29d9d07fdcddf9812cbb1488878", + "transformer-engine @ git+https://github.com/NVIDIA/TransformerEngine.git@d9b7fc5770a88af06e2e9c2bd97b550614c3a69f", "mlflow>=3.5.0", - "cryptography>=43.0.0,<47" + "cryptography>=43.0.0,<47", + "nvidia-modelopt~=0.41.0", + "nvidia-resiliency-ext @ git+https://github.com/NVIDIA/nvidia-resiliency-ext.git@v0.4.1" # Requires a source install to compile cupti for cuda13 ] [tool.uv.sources] megatron-core = { path = "3rdparty/Megatron-LM/", editable = true } -nvidia-modelopt = { git = "https://github.com/NVIDIA/TensorRT-Model-Optimizer.git", rev = "0a4f0a8b933121f7af080261a0a5a7717f2c5d49" } -nvidia-resiliency-ext = { git = "https://github.com/NVIDIA/nvidia-resiliency-ext.git", rev = "v0.4.1" } # Requires a source install to compile cupti for cuda13 [project.optional-dependencies] recipes = [ diff --git a/uv.lock b/uv.lock index 925caa2e41..fa1aa7cbaf 100644 --- a/uv.lock +++ b/uv.lock @@ -21,9 +21,11 @@ prerelease-mode = "allow" overrides = [ { name = "cryptography", specifier = ">=43.0.0,<47" }, { name = "mlflow", specifier = ">=3.5.0" }, + { name = "nvidia-modelopt", specifier = "~=0.41.0" }, + { name = "nvidia-resiliency-ext", git = "https://github.com/NVIDIA/nvidia-resiliency-ext.git?rev=v0.4.1" }, { name = "torch", marker = "sys_platform == 'never'" }, { name = "torchvision", marker = "sys_platform == 'never'" }, - { name = "transformer-engine", git = "https://github.com/NVIDIA/TransformerEngine.git?rev=6a34b6574fa6c29d9d07fdcddf9812cbb1488878" }, + { name = "transformer-engine", git = "https://github.com/NVIDIA/TransformerEngine.git?rev=d9b7fc5770a88af06e2e9c2bd97b550614c3a69f" }, { name = "triton", marker = "sys_platform == 'never'" }, ] @@ -3055,7 +3057,7 @@ requires-dist = [ { name = "mlflow", specifier = ">=3.5.0" }, { name = "nemo-run", marker = "extra == 'recipes'", specifier = ">=0.5.0a0,<0.6.0" }, { name = "nvdlfw-inspect", marker = "extra == 'tensor-inspect'", specifier = "==0.2.1" }, - { name = "nvidia-resiliency-ext", git = "https://github.com/NVIDIA/nvidia-resiliency-ext.git?rev=v0.4.1" }, + { name = "nvidia-resiliency-ext", specifier = "~=0.4.1" }, { name = "omegaconf", specifier = ">=2.3.0" }, { name = "open-clip-torch", specifier = ">=3.2.0" }, { name = "pyyaml", specifier = ">=6.0.2" }, @@ -3132,7 +3134,7 @@ dev = [ { name = "megatron-energon", extra = ["av-decode"] }, { name = "multi-storage-client" }, { name = "nv-grouped-gemm" }, - { name = "nvidia-modelopt", marker = "sys_platform != 'darwin'" }, + { name = "nvidia-modelopt" }, { name = "nvidia-resiliency-ext" }, { name = "nvtx" }, { name = "onnxscript", version = "0.5.0", source = { registry = "https://pypi.org/simple" }, marker = "python_full_version >= '3.13'" }, @@ -7042,8 +7044,8 @@ wheels = [ [[package]] name = "transformer-engine" -version = "2.12.0.dev0+6a34b657" -source = { git = "https://github.com/NVIDIA/TransformerEngine.git?rev=6a34b6574fa6c29d9d07fdcddf9812cbb1488878#6a34b6574fa6c29d9d07fdcddf9812cbb1488878" } +version = "2.12.0+d9b7fc57" +source = { git = "https://github.com/NVIDIA/TransformerEngine.git?rev=d9b7fc5770a88af06e2e9c2bd97b550614c3a69f#d9b7fc5770a88af06e2e9c2bd97b550614c3a69f" } dependencies = [ { name = "einops" }, { name = "importlib-metadata" },