Skip to content

Add FSDP support to TiledMLP by preventing premature resharding during the tiled backward recompute loop. #2374

Add FSDP support to TiledMLP by preventing premature resharding during the tiled backward recompute loop.

Add FSDP support to TiledMLP by preventing premature resharding during the tiled backward recompute loop. #2374

Workflow file for this run

# Display name of this workflow.
name: NVIDIA GPU

# Events that start the workflow. Branch filters restrict push, pull_request
# and merge_group events to `main`.
on:
  push:
    branches:
      - main
  pull_request:
    branches:
      - main
  merge_group:
    types: [checks_requested]
    branches:
      - main
  workflow_dispatch:  # Enables manual trigger

# Runs are grouped by workflow name plus the first non-empty value of:
# pull request number, merge-group head ref, git ref. Starting a new run in a
# group cancels the run already in progress for that group.
concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.event.merge_group.head_ref || github.ref }}
  cancel-in-progress: true
# All four jobs share the same shape: check out the repository, set up
# Python 3.10, install the `modal` package, then launch one entry point from
# `dev.modal.tests` with `modal run`. Only the entry point differs per job.
#
# MODAL_TOKEN_ID / MODAL_TOKEN_SECRET are taken from repository secrets and
# exported to every step; presumably the modal CLI reads them to authenticate
# (TODO confirm against Modal's documentation).
#
# NOTE(review): every job is gated on `github.event_name == 'merge_group'`,
# so runs started by push, pull_request or workflow_dispatch skip all jobs.
# Confirm this is intended, in particular for the manual trigger.
jobs:
  # Launches `liger_correctness_tests`.
  nvi-correctness-tests:
    if: github.event_name == 'merge_group'
    runs-on: ubuntu-latest
    env:
      MODAL_TOKEN_ID: ${{ secrets.MODAL_TOKEN_ID }}
      MODAL_TOKEN_SECRET: ${{ secrets.MODAL_TOKEN_SECRET }}
    steps:
      - name: Checkout code
        uses: actions/checkout@v6

      - name: Set up Python
        uses: actions/setup-python@v6
        with:
          # Quoted so YAML keeps the string "3.10" instead of the float 3.1.
          python-version: '3.10'

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install modal

      - name: Run tests
        run: |
          modal run dev.modal.tests::liger_correctness_tests

  # Launches `liger_convergence_tests`.
  nvi-convergence-tests:
    if: github.event_name == 'merge_group'
    runs-on: ubuntu-latest
    env:
      MODAL_TOKEN_ID: ${{ secrets.MODAL_TOKEN_ID }}
      MODAL_TOKEN_SECRET: ${{ secrets.MODAL_TOKEN_SECRET }}
    steps:
      - name: Checkout code
        uses: actions/checkout@v6

      - name: Set up Python
        uses: actions/setup-python@v6
        with:
          # Quoted so YAML keeps the string "3.10" instead of the float 3.1.
          python-version: '3.10'

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install modal

      - name: Run tests
        run: |
          modal run dev.modal.tests::liger_convergence_tests

  # Launches `liger_oldest_v4_correctness_tests`. The job id names
  # transformers 4.52.0; the version pin itself is not visible in this file
  # (presumably set inside dev/modal/tests -- TODO confirm).
  nvi-correctness-tests-with-transformers-4-52-0:
    if: github.event_name == 'merge_group'
    runs-on: ubuntu-latest
    env:
      MODAL_TOKEN_ID: ${{ secrets.MODAL_TOKEN_ID }}
      MODAL_TOKEN_SECRET: ${{ secrets.MODAL_TOKEN_SECRET }}
    steps:
      - name: Checkout code
        uses: actions/checkout@v6

      - name: Set up Python
        uses: actions/setup-python@v6
        with:
          # Quoted so YAML keeps the string "3.10" instead of the float 3.1.
          python-version: '3.10'

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install modal

      - name: Run tests
        run: |
          modal run dev.modal.tests::liger_oldest_v4_correctness_tests

  # Launches `liger_oldest_v4_convergence_tests`. The job id names
  # transformers 4.52.0; the version pin itself is not visible in this file
  # (presumably set inside dev/modal/tests -- TODO confirm).
  nvi-convergence-tests-with-transformers-4-52-0:
    if: github.event_name == 'merge_group'
    runs-on: ubuntu-latest
    env:
      MODAL_TOKEN_ID: ${{ secrets.MODAL_TOKEN_ID }}
      MODAL_TOKEN_SECRET: ${{ secrets.MODAL_TOKEN_SECRET }}
    steps:
      - name: Checkout code
        uses: actions/checkout@v6

      - name: Set up Python
        uses: actions/setup-python@v6
        with:
          # Quoted so YAML keeps the string "3.10" instead of the float 3.1.
          python-version: '3.10'

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install modal

      - name: Run tests
        run: |
          modal run dev.modal.tests::liger_oldest_v4_convergence_tests