pixi manifest and install command (#726)

uralik · web-flow · commit b7c9c31594c8 · 2026-01-23T08:16:52.000-08:00
diff --git a/README.md b/README.md
@@ -32,6 +32,8 @@ You can also find our notebook tutorials (coming soon)
 
 torchforge requires PyTorch 2.9.0 with [Monarch](https://github.com/meta-pytorch/monarch), [vLLM](https://github.com/vllm-project/vllm), and [torchtitan](https://github.com/pytorch/torchtitan).
 
+### Conda
+
 Install torchforge with:
 
 ```bash
@@ -40,7 +42,7 @@ conda activate forge
 ./scripts/install.sh
 ```
 
-### ROCm Installation
+#### ROCm Installation
 
 ROCm users can install with the dedicated script:
 
@@ -61,6 +63,20 @@ The install script installs system dependencies along with torchforge. Note that
 
 Optional: By default, the packages installation uses conda. If you want to install system packages on the target machine instead of conda, you can pass the `--use-sudo` flag to the installation script: `./scripts/install.sh --use-sudo`.
 
+### Pixi
+
+Pixi combines the benefits of uv with access to conda-forge for system dependencies. [pixi.toml](./pixi.toml) provides a manifest of build tasks, with `install` as the combined task that runs every install step.
+
+Install pixi:
+```
+curl -fsSL https://pixi.sh/install.sh | bash
+```
+
+Install torchforge with pixi:
+```
+pixi run install
+```
+
 > **Note:** We are actively working on enabling pure `uv` installation. Currently, Conda is the recommended approach. `uv` support is not fully working at the moment but is being tracked in [issue #494](https://github.com/meta-pytorch/torchforge/issues/494).
 
 After install, you can run the following command and should see output confirming GRPO training is running (you need a minimum 3 GPU devices):
diff --git a/pixi.toml b/pixi.toml
@@ -0,0 +1,92 @@
+# Pixi configuration for Forge
+# This replaces the conda-based installation with the pixi environment manager
+#
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+
+[workspace]  # project metadata plus the conda channels and platforms to solve against
+name = "forge"
+description = "A PyTorch native platform for post-training generative AI models"
+version = "0.1.0"
+platforms = ["linux-64"]
+channels = ["conda-forge", "pytorch", "nvidia"]
+
+[system-requirements]  # minimum host kernel and CUDA versions declared for this workspace
+cuda = "12.8"
+linux = "5.10"
+
+# System-level packages resolved from the conda channels
+[dependencies]
+# Git is required for pip installs that point at git repositories
+git = "*"
+openssl = "*"
+python = "3.10.*"
+# RDMA and InfiniBand libraries (stand-in for the rdma-core / libibverbs system packages)
+rdma-core = "*"
+# uv performs the Python package installs in the tasks below
+uv = ">=0.1.0"
+
+# Packages for the `dev` feature (counterpart of the [dev] extras), sorted by name
+[feature.dev.dependencies]
+anyio = "*"
+pre-commit = "*"
+pytest = "*"
+pytest-asyncio = "*"
+pytest-cov = "*"
+pytest-timeout = "*"
+tensorboard = "*"
+tomli = ">=1.1.0"
+
+# Packages for the `docs` feature (counterpart of the [docs] extras); sphinx is pinned exactly
+[feature.docs.dependencies]
+matplotlib = "*"
+sphinx = "==7.2.6"
+
+[tasks]
+# Install steps, one pixi task per step; each task runs one or more `uv pip install` commands
+# uv will use the configuration from pyproject.toml [tool.uv] section
+install-pytorch = """
+    uv pip install torch==2.9.0 --index-url https://download.pytorch.org/whl/cu128
+"""
+
+# CRITICAL: the vLLM prerequisites (install-vllm-reqs, install-vllm-deps) must be installed BEFORE vLLM itself
+install-vllm-reqs = """
+    uv pip install -r .github/packaging/vllm_reqs_12_8.txt
+"""
+
+install-vllm-deps = """
+    uv pip install six && \
+    uv pip install "setuptools<80"
+"""
+
+# Install vLLM itself, only after the prerequisite tasks above have run
+install-vllm = """
+    uv pip install vllm --no-cache-dir --index-url https://download.pytorch.org/whl/preview/forge
+"""
+
+install-torchstore = """
+    uv pip install "git+https://github.com/meta-pytorch/torchstore.git@no-monarch-2025.12.17"
+"""
+
+install-forge = """
+    uv pip install -e ".[dev]"
+"""
+
+# Full install, following the install.sh sequence. NOTE(review): assumes pixi runs depends-on entries in listed order - confirm
+install = { depends-on = ["install-pytorch", "install-vllm-reqs", "install-vllm-deps", "install-vllm", "install-torchstore", "install-forge"] }
+
+# Smoke test: import torch, vllm and forge in turn; stops at the first failed import and exits non-zero
+test-install = """
+    python -c "import torch; print(f'PyTorch {torch.__version__} (CUDA: {torch.cuda.is_available()})')" && \
+    python -c "import vllm; print('vLLM imported successfully')" && \
+    python -c "import forge; print('forge imported successfully')"
+"""
+
+# Environments; all three are placed in the same "default" solve group
+[environments]
+default = { solve-group = "default" }
+docs = { solve-group = "default", features = ["docs"] }
+dev = { solve-group = "default", features = ["dev"] }
+
+[target.linux-64.activation]
+scripts = ["scripts/pixi_cuda_env.sh"]  # exports the CUDA variables and defines the python/python3 wrappers
diff --git a/scripts/pixi_cuda_env.sh b/scripts/pixi_cuda_env.sh
@@ -0,0 +1,40 @@
+#!/bin/bash
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+# CUDA environment activation script for Pixi
+# This script is automatically sourced when the pixi environment is activated
+
+# CUDA toolkit locations, all derived from the single versioned install prefix CUDA_HOME
+export CUDA_VERSION=12.8
+export CUDA_HOME="/usr/local/cuda-${CUDA_VERSION}"
+export CUDA_INCLUDE_DIRS="${CUDA_HOME}/include"
+export CUDA_CUDART_LIBRARY="${CUDA_HOME}/lib64/libcudart.so"
+export NVCC="${CUDA_HOME}/bin/nvcc"
+export CUDA_NVCC_EXECUTABLE="${NVCC}"
+export PATH="${CUDA_HOME}/bin:$PATH"
+
+# DO NOT set LD_LIBRARY_PATH globally - it breaks system tools
+# Instead, we use python wrapper functions below to set it only for Python processes
+
+# python/python3 wrappers: set LD_LIBRARY_PATH for the launched process only, never for the whole shell.
+# Priority: system CUDA driver (/usr/lib64) > CUDA toolkit (${CUDA_HOME}/lib64) > conda/pixi libs (skipped if CONDA_PREFIX is unset)
+# Use system CUDA driver (newer) instead of compat (outdated stub that may be incompatible)
+python()  {
+    LD_LIBRARY_PATH="/usr/lib64:${CUDA_HOME}/lib64${CONDA_PREFIX:+:${CONDA_PREFIX}/lib}${LD_LIBRARY_PATH:+:$LD_LIBRARY_PATH}" \
+    command python "$@"
+}
+python3() {
+    LD_LIBRARY_PATH="/usr/lib64:${CUDA_HOME}/lib64${CONDA_PREFIX:+:${CONDA_PREFIX}/lib}${LD_LIBRARY_PATH:+:$LD_LIBRARY_PATH}" \
+    command python3 "$@"
+}
+
+# Export functions to subshells when possible (best-effort, shell-dependent)
+if [ -n "${BASH_VERSION:-}" ]; then
+    export -f python python3 2>/dev/null || true
+elif [ -n "${ZSH_VERSION:-}" ]; then
+    typeset -fx python python3 >/dev/null 2>&1 || true
+fi