Skip to content

Commit 45266dc

Browse files
committed
Restore ART Megatron installer ownership
1 parent 1bffe46 commit 45266dc

3 files changed

Lines changed: 75 additions & 1577 deletions

File tree

pyproject.toml

Lines changed: 1 addition & 44 deletions
Original file line number | Diff line number | Diff line change
@@ -41,19 +41,6 @@ backend = [
4141
"nvidia-cudnn-frontend<1.21 ; sys_platform == 'linux'",
4242
"vllm @ https://github.com/vivekkalyan/vllm/releases/download/v0.17.0-art1/vllm-0.17.0%2Bart1-cp38-abi3-manylinux_2_31_x86_64.whl ; sys_platform == 'linux'",
4343
]
44-
megatron = [
45-
"torch==2.10.0",
46-
"quack-kernels==0.2.5",
47-
"apex",
48-
"transformer-engine==2.11.0",
49-
"transformer-engine-cu12==2.11.0",
50-
"transformer-engine-torch==2.11.0",
51-
"megatron-core==0.16.0rc0",
52-
"pybind11>=2.13.6",
53-
"megatron-bridge",
54-
"nvidia-ml-py==13.580.82",
55-
"ml-dtypes>=0.5.0 ; python_full_version < '3.13'",
56-
]
5744
langgraph = [
5845
"langchain-core>=0.3.51",
5946
"langgraph>=0.6.2",
@@ -91,6 +78,7 @@ packages = ["src/art", "src/mp_actors"]
9178

9279
[tool.hatch.build.targets.wheel.force-include]
9380
".agents/skills" = "art/skills"
81+
"src/art_megatron_install.py" = "art_megatron_install.py"
9482

9583
[tool.hatch.build]
9684
sources = ["src"]
@@ -138,34 +126,6 @@ override-dependencies = [
138126
"quack-kernels==0.2.5",
139127
]
140128
exclude-dependencies = ["pynvml", "emerging-optimizers"]
141-
no-build-isolation-package = ["apex", "transformer-engine", "transformer-engine-cu12", "transformer-engine-torch", "megatron-core", "megatron-bridge", "nv-grouped-gemm", "mamba-ssm", "causal-conv1d"]
142-
143-
[tool.uv.extra-build-dependencies]
144-
apex = ["torch>=2.8.0"]
145-
megatron-core = ["pybind11"]
146-
transformer-engine-torch = ["torch>=2.8.0"]
147-
148-
[tool.uv.extra-build-variables]
149-
apex = { APEX_CPP_EXT = "1", APEX_CUDA_EXT = "1", APEX_FAST_LAYER_NORM = "1", APEX_PARALLEL_BUILD = "16", NVCC_APPEND_FLAGS = "--threads 4" }
150-
transformer-engine-torch = { NVTE_NO_LOCAL_VERSION = "1" }
151-
152-
[[tool.uv.dependency-metadata]]
153-
name = "apex"
154-
version = "0.1"
155-
requires-dist = ["packaging"]
156-
157-
[[tool.uv.dependency-metadata]]
158-
name = "transformer-engine-torch"
159-
version = "2.11.0"
160-
requires-dist = [
161-
"einops",
162-
"onnx",
163-
"onnxscript",
164-
"packaging",
165-
"pydantic",
166-
"torch",
167-
"transformer-engine-cu12",
168-
]
169129

170130
[tool.ty.environment]
171131
python-version = "3.11"
@@ -238,6 +198,3 @@ dev = [
238198

239199
[tool.uv.sources]
240200
panza = { git = "https://github.com/corbt/panza.git" }
241-
apex = { git = "https://github.com/NVIDIA/apex.git", branch = "25.09" }
242-
megatron-bridge = { git = "https://github.com/NVIDIA-NeMo/Megatron-Bridge.git", rev = "75f2c5ad4afb702b57b4781a00f5291a66bcf183" }
243-
transformer-engine-torch = { git = "https://github.com/NVIDIA/TransformerEngine.git", tag = "v2.11", subdirectory = "transformer_engine/pytorch" }

src/art/megatron/setup.sh

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -7,9 +7,6 @@ export TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST:-9.0}"
77
apt-get update
88
apt-get install -y libcudnn9-headers-cuda-12 ninja-build
99

10-
# Python dependencies are declared in pyproject.toml extras.
11-
# Keep backend + megatron together so setup does not prune runtime deps (e.g. vllm).
12-
script_dir="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd)"
13-
repo_root="$(cd -- "${script_dir}/../../.." && pwd)"
14-
cd "${repo_root}"
15-
uv sync --extra backend --extra megatron --frozen --active
10+
# Python dependencies are installed through art_megatron_install so
11+
# downstream repos can reuse the same source of truth for versions and VCS pins.
12+
uv run python -m art_megatron_install

0 commit comments

Comments
 (0)