11absl-py==2.3.1 # via tensorboard
2- accelerate==1.10.1 # via peft, trl, -r requirements-cuda.txt, -r requirements-rocm.txt
3- aiofiles==24.1.0 # via -r requirements.txt
2+ accelerate==1.12.0 # via peft, trl, -r requirements-cuda.txt, -r requirements-rocm.txt
3+ aiofiles==25.1.0 # via -r requirements.txt
44aiohappyeyeballs==2.6.1 # via aiohttp
5- aiohttp==3.12.15 # via fsspec
5+ aiohttp==3.13.3 # via fsspec
66aiosignal==1.4.0 # via aiohttp
77annotated-types==0.7.0 # via pydantic
8- anyio==4.10.0 # via httpx, jupyter-server
8+ anyio==4.12.1 # via httpx, jupyter-server
99argon2-cffi==25.1.0 # via jupyter-server
1010argon2-cffi-bindings==25.1.0 # via argon2-cffi
11- arrow==1.3.0 # via isoduration
12- astroid==3.3.11 # via pylint
13- asttokens==3.0.0 # via stack-data
14- async-lru==2.0.5 # via jupyterlab
15- attrs==25.3.0 # via aiohttp, jsonschema, referencing
11+ arrow==1.4.0 # via isoduration
12+ astroid==4.0.3 # via pylint
13+ asttokens==3.0.1 # via stack-data
14+ async-lru==2.1.0 # via jupyterlab
15+ attrs==25.4.0 # via aiohttp, jsonschema, referencing
1616babel==2.17.0 # via jupyterlab-server
17- beautifulsoup4==4.13.5 # via nbconvert
18- bitsandbytes==0.47.0 # via -r requirements-cuda.txt
19- bleach==6.2.0 # via nbconvert
20- cachetools==6.2.0 # via tox
21- certifi==2025.8.3 # via httpcore, httpx, requests, sentry-sdk
22- cffi==1.17.1 # via argon2-cffi-bindings
23- cfgv==3.4.0 # via pre-commit
17+ beautifulsoup4==4.14.3 # via nbconvert
18+ bitsandbytes==0.49.1 # via -r requirements-cuda.txt
19+ bleach==6.3.0 # via nbconvert
20+ cachetools==6.2.4 # via tox
21+ causal-conv1d==1.6.0 # via mamba-ssm
22+ certifi==2026.1.4 # via httpcore, httpx, requests, sentry-sdk
23+ cffi==2.0.0 # via argon2-cffi-bindings
24+ cfgv==3.5.0 # via pre-commit
2425chardet==5.2.0 # via tox
25- charset-normalizer==3.4.3 # via requests
26- click==8.2.1 # via wandb
26+ charset-normalizer==3.4.4 # via requests
27+ click==8.3.1 # via wandb
2728colorama==0.4.6 # via tox
2829comm==0.2.3 # via ipykernel, ipywidgets
2930contourpy==1.3.3 # via matplotlib
3031cycler==0.12.1 # via matplotlib
31- datasets==4.0.0 # via trl, -r requirements.txt
32- debugpy==1.8.16 # via ipykernel
32+ datasets==4.5.0 # via trl, -r requirements.txt
33+ debugpy==1.8.19 # via ipykernel
3334decorator==5.2.1 # via ipython
34- deepspeed==0.17.5 # via -r requirements-deepspeed.txt
35+ deepspeed==0.18.4 # via -r requirements-deepspeed.txt
3536defusedxml==0.7.1 # via nbconvert
36- dill==0.3.8 # via datasets, multiprocess, pylint
37+ dill==0.4.0 # via datasets, multiprocess, pylint
3738distlib==0.4.0 # via virtualenv
38- einops==0.8.1 # via deepspeed, flash-attn
39- executing==2.2.0 # via stack-data
39+ einops==0.8.1 # via deepspeed, flash-attn, mamba-ssm
40+ executing==2.2.1 # via stack-data
4041fastjsonschema==2.21.2 # via nbformat
41- filelock==3.19.1 # via datasets, huggingface-hub, torch, tox, transformers, virtualenv
42+ filelock==3.20.3 # via datasets, huggingface-hub, torch, tox, transformers, virtualenv
4243flash-attn==2.7.4.post1 # via -c constraints-dev.txt.in, -r requirements-cuda.txt, -r requirements-rocm.txt
43- fonttools==4.59.2 # via matplotlib
44+ fonttools==4.61.1 # via matplotlib
4445fqdn==1.5.1 # via jsonschema
45- frozenlist==1.7.0 # via aiohttp, aiosignal
46- fsspec==2025.3.0 # via datasets, huggingface-hub, torch
46+ frozenlist==1.8.0 # via aiohttp, aiosignal
47+ fsspec==2025.10.0 # via datasets, huggingface-hub, torch
4748gitdb==4.0.12 # via gitpython
48- gitpython==3.1.45 # via wandb
49- grpcio==1.74.0 # via tensorboard
49+ gitpython==3.1.46 # via wandb
50+ grpcio==1.76.0 # via tensorboard
5051h11==0.16.0 # via httpcore
51- hf-xet==1.1.9 # via huggingface-hub
52+ hf-xet==1.2.0 # via huggingface-hub
5253hjson==3.1.0 # via deepspeed
5354httpcore==1.0.9 # via httpx
54- httpx==0.28.1 # via jupyterlab
55- huggingface-hub==0.34.4 # via accelerate, datasets, peft, tokenizers, transformers, -r requirements-dev.txt
56- identify==2.6.13 # via pre-commit
57- idna==3.10 # via anyio, httpx, jsonschema, requests, yarl
58- iniconfig==2.1.0 # via pytest
59- ipykernel==6.30.1 # via jupyter, jupyter-console, jupyterlab, -r requirements-dev.txt
60- ipython==9.5.0 # via ipykernel, ipywidgets, jupyter-console, -r requirements-dev.txt
55+ httpx==0.28.1 # via datasets, jupyterlab
56+ huggingface-hub==0.36.0 # via accelerate, datasets, kernels, peft, tokenizers, transformers, -r requirements-dev.txt
57+ identify==2.6.16 # via pre-commit
58+ idna==3.11 # via anyio, httpx, jsonschema, requests, yarl
59+ iniconfig==2.3.0 # via pytest
60+ ipykernel==7.1.0 # via jupyter, jupyter-console, jupyterlab, -r requirements-dev.txt
61+ ipython==9.9.0 # via ipykernel, ipywidgets, jupyter-console, -r requirements-dev.txt
6162ipython-pygments-lexers==1.1.1 # via ipython
62- ipywidgets==8.1.7 # via jupyter
63+ ipywidgets==8.1.8 # via jupyter
6364isoduration==20.11.0 # via jsonschema
64- isort==6.0.1 # via pylint, -r requirements-dev.txt
65+ isort==7.0.0 # via pylint, -r requirements-dev.txt
6566jedi==0.19.2 # via ipython
6667jinja2==3.1.6 # via jupyter-server, jupyterlab, jupyterlab-server, nbconvert, torch
67- json5==0.12.1 # via jupyterlab-server
68+ json5==0.13.0 # via jupyterlab-server
6869jsonpointer==3.0.0 # via jsonschema
69- jsonschema==4.25.1 # via jupyter-events, jupyterlab-server, nbformat
70- jsonschema-specifications==2025.4.1 # via jsonschema
70+ jsonschema==4.26.0 # via jupyter-events, jupyterlab-server, nbformat
71+ jsonschema-specifications==2025.9.1 # via jsonschema
7172jupyter==1.1.1 # via -r requirements-dev.txt
72- jupyter-client==8.6.3 # via ipykernel, jupyter-console, jupyter-server, nbclient
73+ jupyter-client==8.8.0 # via ipykernel, jupyter-console, jupyter-server, nbclient
7374jupyter-console==6.6.3 # via jupyter
74- jupyter-core==5.8.1 # via ipykernel, jupyter-client, jupyter-console, jupyter-server, jupyterlab, nbclient, nbconvert, nbformat
75+ jupyter-core==5.9.1 # via ipykernel, jupyter-client, jupyter-console, jupyter-server, jupyterlab, nbclient, nbconvert, nbformat
7576jupyter-events==0.12.0 # via jupyter-server
7677jupyter-lsp==2.3.0 # via jupyterlab
7778jupyter-server==2.17.0 # via jupyter-lsp, jupyterlab, jupyterlab-server, notebook, notebook-shim
78- jupyter-server-terminals==0.5.3 # via jupyter-server
79- jupyterlab==4.4.6 # via jupyter, notebook
79+ jupyter-server-terminals==0.5.4 # via jupyter-server
80+ jupyterlab==4.5.2 # via jupyter, notebook
8081jupyterlab-pygments==0.3.0 # via nbconvert
81- jupyterlab-server==2.27.3 # via jupyterlab, notebook
82- jupyterlab-widgets==3.0.15 # via ipywidgets
82+ jupyterlab-server==2.28.0 # via jupyterlab, notebook
83+ jupyterlab-widgets==3.0.16 # via ipywidgets
84+ kernels==0.11.7 # via -r requirements-cuda.txt
8385kiwisolver==1.4.9 # via matplotlib
84- lark==1.2.2 # via rfc3987-syntax
85- liger-kernel==0.6.2 # via -r requirements-cuda.txt
86- llvmlite==0.45.0 # via numba
87- markdown==3.8.2 # via tensorboard
86+ lark==1.3.1 # via rfc3987-syntax
87+ librt==0.7.8 # via mypy
88+ liger-kernel==0.6.4 # via -r requirements-cuda.txt
89+ llvmlite==0.46.0 # via numba
90+ mamba-ssm==2.3.0 # via -r requirements-cuda.txt, -r requirements-rocm.txt
91+ markdown==3.10 # via tensorboard
8892markdown-it-py==4.0.0 # via rich
89- markupsafe==3.0.2 # via jinja2, nbconvert, werkzeug
90- matplotlib==3.10.6 # via -r requirements-dev.txt
91- matplotlib-inline==0.1.7 # via ipykernel, ipython
93+ markupsafe==3.0.3 # via jinja2, nbconvert, werkzeug
94+ matplotlib==3.10.8 # via -r requirements-dev.txt
95+ matplotlib-inline==0.2.1 # via ipykernel, ipython
9296mccabe==0.7.0 # via pylint
9397mdurl==0.1.2 # via markdown-it-py
94- mistune==3.1.4 # via nbconvert
98+ mistune==3.2.0 # via nbconvert
9599mpmath==1.3.0 # via sympy
96- msgpack==1.1.1 # via deepspeed
97- multidict==6.6.4 # via aiohttp, yarl
98- multiprocess==0.70.16 # via datasets
99- mypy==1.17.1 # via -r requirements-dev.txt
100+ msgpack==1.1.2 # via deepspeed
101+ multidict==6.7.0 # via aiohttp, yarl
102+ multiprocess==0.70.18 # via datasets
103+ mypy==1.19.1 # via -r requirements-dev.txt
100104mypy-extensions==1.1.0 # via mypy
101- nbclient==0.10.2 # via nbconvert
105+ nbclient==0.10.4 # via nbconvert
102106nbconvert==7.16.6 # via jupyter, jupyter-server
103107nbformat==5.10.4 # via jupyter-server, nbclient, nbconvert
104108nest-asyncio==1.6.0 # via ipykernel
105- networkx==3.5 # via torch
106- ninja==1.13.0 # via deepspeed
107- nodeenv==1.9.1 # via pre-commit
108- notebook==7.4.5 # via jupyter
109+ networkx==3.6.1 # via torch
110+ ninja==1.13.0 # via causal-conv1d, deepspeed, mamba-ssm
111+ nodeenv==1.10.0 # via pre-commit
112+ notebook==7.5.2 # via jupyter
109113notebook-shim==0.2.4 # via jupyterlab, notebook
110- numba==0.62.1 # via -r requirements.txt
111- numpy==2.3.3 # via accelerate, bitsandbytes, contourpy, datasets, deepspeed, matplotlib, numba, pandas, peft, tensorboard, transformers, -r requirements-dev.txt, -r requirements.txt
114+ numba==0.63.1 # via -r requirements.txt
115+ numpy==2.3.5 # via accelerate, bitsandbytes, contourpy, datasets, deepspeed, matplotlib, numba, pandas, peft, tensorboard, transformers, -r requirements-dev.txt, -r requirements.txt
112116nvidia-cublas-cu12==12.4.5.8 # via nvidia-cudnn-cu12, nvidia-cusolver-cu12, torch
113117nvidia-cuda-cupti-cu12==12.4.127 # via torch
114118nvidia-cuda-nvrtc-cu12==12.4.127 # via torch
@@ -123,92 +127,90 @@ nvidia-nccl-cu12==2.21.5 # via torch
123127nvidia-nvjitlink-cu12==12.4.127 # via nvidia-cusolver-cu12, nvidia-cusparse-cu12, torch
124128nvidia-nvtx-cu12==12.4.127 # via torch
125129overrides==7.7.0 # via jupyter-server
126- packaging==25.0 # via accelerate, datasets, deepspeed, huggingface-hub, ipykernel, jupyter-events, jupyter-server, jupyterlab, jupyterlab-server, matplotlib, nbconvert, peft, pyproject-api, pytest, tensorboard, tox, transformers, wandb, -r requirements.txt
127- pandas==2.3.2 # via datasets
130+ packaging==25.0 # via accelerate, bitsandbytes, causal-conv1d, datasets, deepspeed, huggingface-hub, ipykernel, jupyter-events, jupyter-server, jupyterlab, jupyterlab-server, kernels, mamba-ssm, matplotlib, nbconvert, peft, pyproject-api, pytest, tensorboard, tox, transformers, trl, wandb, -r requirements.txt
131+ pandas==2.3.3 # via datasets
128132pandocfilters==1.5.1 # via nbconvert
129133parso==0.8.5 # via jedi
130- pathspec==0.12.1 # via mypy
131- peft==0.17.1 # via -r requirements.txt
134+ pathspec==1.0.3 # via mypy
135+ peft==0.18.1 # via -r requirements.txt
132136pexpect==4.9.0 # via ipython
133- pillow==11.3.0 # via matplotlib, tensorboard
134- platformdirs==4.4.0 # via jupyter-core, pylint, tox, virtualenv, wandb
137+ pillow==12.1.0 # via matplotlib, tensorboard
138+ platformdirs==4.5.1 # via jupyter-core, pylint, tox, virtualenv, wandb
135139pluggy==1.6.0 # via pytest, tox
136- pre-commit==4.3.0 # via -r requirements-dev.txt
137- prometheus-client==0.22.1 # via jupyter-server
140+ pre-commit==4.5.1 # via -r requirements-dev.txt
141+ prometheus-client==0.24.1 # via jupyter-server
138142prompt-toolkit==3.0.52 # via ipython, jupyter-console
139- propcache==0.3.2 # via aiohttp, yarl
140- protobuf==6.32.0 # via tensorboard, wandb
141- psutil==7.0.0 # via accelerate, deepspeed, ipykernel, peft
143+ propcache==0.4.1 # via aiohttp, yarl
144+ protobuf==6.33.4 # via tensorboard, wandb
145+ psutil==7.2.1 # via accelerate, deepspeed, ipykernel, peft
142146ptyprocess==0.7.0 # via pexpect, terminado
143147pure-eval==0.2.3 # via stack-data
144148py-cpuinfo==9.0.0 # via deepspeed, -r requirements.txt
145- pyarrow==21.0.0 # via datasets
146- pycparser==2.22 # via cffi
147- pydantic==2.11.7 # via deepspeed, pylint-pydantic, wandb, -r requirements.txt
148- pydantic-core==2.33.2 # via pydantic
149+ pyarrow==23.0.0 # via datasets
150+ pycparser==2.23 # via cffi
151+ pydantic==2.12.5 # via deepspeed, pylint-pydantic, wandb, -r requirements.txt
152+ pydantic-core==2.41.5 # via pydantic
149153pygments==2.19.2 # via ipython, ipython-pygments-lexers, jupyter-console, nbconvert, pytest, rich
150- pylint==3.3.8 # via pylint-plugin-utils, pylint-pydantic, -r requirements-dev.txt
154+ pylint==4.0.4 # via pylint-plugin-utils, pylint-pydantic, -r requirements-dev.txt
151155pylint-plugin-utils==0.9.0 # via pylint-pydantic
152- pylint-pydantic==0.3.5 # via -r requirements-dev.txt
153- pyparsing==3.2.3 # via matplotlib
154- pyproject-api==1.9.1 # via tox
155- pytest==8.4.1 # via -r requirements-dev.txt
156+ pylint-pydantic==0.4.1 # via -r requirements-dev.txt
157+ pyparsing==3.3.1 # via matplotlib
158+ pyproject-api==1.10.0 # via tox
159+ pytest==9.0.2 # via -r requirements-dev.txt
156160python-dateutil==2.9.0.post0 # via arrow, jupyter-client, matplotlib, pandas
157- python-json-logger==3.3.0 # via jupyter-events
161+ python-json-logger==4.0.0 # via jupyter-events
158162pytz==2025.2 # via pandas
159- pyyaml==6.0.2 # via accelerate, datasets, huggingface-hub, jupyter-events, peft, pre-commit, transformers, wandb, -r requirements.txt
160- pyzmq==27.0.2 # via ipykernel, jupyter-client, jupyter-console, jupyter-server
161- referencing==0.36.2 # via jsonschema, jsonschema-specifications, jupyter-events
162- regex==2025.8.29 # via transformers
163+ pyyaml==6.0.3 # via accelerate, datasets, huggingface-hub, jupyter-events, kernels, peft, pre-commit, transformers, wandb, -r requirements.txt
164+ pyzmq==27.1.0 # via ipykernel, jupyter-client, jupyter-console, jupyter-server
165+ referencing==0.37.0 # via jsonschema, jsonschema-specifications, jupyter-events
166+ regex==2026.1.15 # via transformers
163167requests==2.32.5 # via datasets, huggingface-hub, jupyterlab-server, transformers, wandb
164168rfc3339-validator==0.1.4 # via jsonschema, jupyter-events
165169rfc3986-validator==0.1.1 # via jsonschema, jupyter-events
166170rfc3987-syntax==1.1.0 # via jsonschema
167- rich==14.1.0 # via -r requirements.txt
168- rpds-py==0.27.1 # via jsonschema, referencing
169- ruff==0.12.11 # via -r requirements-dev.txt
170- safetensors==0.6.2 # via accelerate, peft, transformers
171- send2trash==1.8.3 # via jupyter-server
172- sentry-sdk==2.35.1 # via wandb
173- setuptools==80.9.0 # via jupyterlab, tensorboard
171+ rich==14.2.0 # via -r requirements.txt
172+ rpds-py==0.30.0 # via jsonschema, referencing
173+ ruff==0.14.13 # via -r requirements-dev.txt
174+ safetensors==0.7.0 # via accelerate, peft, transformers
175+ send2trash==2.1.0 # via jupyter-server
176+ sentry-sdk==2.49.0 # via wandb
177+ setuptools==80.9.0 # via jupyterlab, mamba-ssm, tensorboard
174178six==1.17.0 # via python-dateutil, rfc3339-validator
175179smmap==5.0.2 # via gitdb
176- sniffio==1.3.1 # via anyio
177- soupsieve==2.8 # via beautifulsoup4
180+ soupsieve==2.8.2 # via beautifulsoup4
178181stack-data==0.6.3 # via ipython
179182sympy==1.13.1 # via torch
180183tensorboard==2.20.0 # via -r requirements-dev.txt
181184tensorboard-data-server==0.7.2 # via tensorboard
182185terminado==0.18.1 # via jupyter-server, jupyter-server-terminals
183186tinycss2==1.4.0 # via bleach
184- tokenizers==0.22.0 # via transformers
185- tomlkit==0.13.3 # via pylint
186- torch==2.6.0 # via accelerate, bitsandbytes, deepspeed, flash-attn, liger-kernel, peft, -c constraints-dev.txt.in, -r requirements.txt
187- tornado==6.5.2 # via ipykernel, jupyter-client, jupyter-server, jupyterlab, notebook, terminado
188- tox==4.29.0 # via tox-current-env, -r requirements-dev.txt
187+ tokenizers==0.22.2 # via transformers
188+ tomlkit==0.14.0 # via pylint
189+ torch==2.6.0 # via accelerate, bitsandbytes, causal-conv1d, deepspeed, flash-attn, liger-kernel, mamba-ssm, peft, -c constraints-dev.txt.in, -r requirements.txt
190+ tornado==6.5.4 # via ipykernel, jupyter-client, jupyter-server, jupyterlab, notebook, terminado
191+ tox==4.34.1 # via tox-current-env, -r requirements-dev.txt
189192tox-current-env==0.0.16 # via -r requirements-dev.txt
190193tqdm==4.67.1 # via datasets, deepspeed, huggingface-hub, peft, transformers
191194traitlets==5.14.3 # via ipykernel, ipython, ipywidgets, jupyter-client, jupyter-console, jupyter-core, jupyter-events, jupyter-server, jupyterlab, matplotlib-inline, nbclient, nbconvert, nbformat
192- transformers==4.56.0 # via peft, trl, -r requirements.txt
193- triton==3.2.0 # via liger-kernel, torch
194- trl==0.22.1 # via -r requirements.txt
195- types-python-dateutil==2.9.0.20250822 # via arrow
196- types-pyyaml==6.0.12.20250822 # via -r requirements-dev.txt
197- types-requests==2.32.4.20250809 # via types-tqdm
195+ transformers==4.57.6 # via mamba-ssm, peft, trl, -r requirements.txt
196+ triton==3.2.0 # via liger-kernel, mamba-ssm, torch
197+ trl==0.27.0 # via -r requirements.txt
198+ types-pyyaml==6.0.12.20250915 # via -r requirements-dev.txt
199+ types-requests==2.32.4.20260107 # via types-tqdm
198200types-tqdm==4.67.0.20250809 # via -r requirements-dev.txt
199- typing-extensions==4.15.0 # via aiosignal, anyio, beautifulsoup4, huggingface-hub, ipython, mypy, pydantic, pydantic-core, referencing, torch, typing-inspection, wandb
200- typing-inspection==0.4.1 # via pydantic
201- tzdata==2025.2 # via pandas
201+ typing-extensions==4.15.0 # via aiosignal, anyio, beautifulsoup4, grpcio, huggingface-hub, ipython, mypy, pydantic, pydantic-core, referencing, torch, typing-inspection, wandb
202+ typing-inspection==0.4.2 # via pydantic
203+ tzdata==2025.3 # via arrow, pandas
202204uri-template==1.3.0 # via jsonschema
203- urllib3==2.5.0 # via requests, sentry-sdk, types-requests
204- virtualenv==20.34.0 # via pre-commit, tox
205- wandb==0.21.3 # via -r requirements-dev.txt
206- wcwidth==0.2.13 # via prompt-toolkit
207- webcolors==24.11.1 # via jsonschema
205+ urllib3==2.6.3 # via requests, sentry-sdk, types-requests
206+ virtualenv==20.36.1 # via pre-commit, tox
207+ wandb==0.24.0 # via -r requirements-dev.txt
208+ wcwidth==0.2.14 # via prompt-toolkit
209+ webcolors==25.10.0 # via jsonschema
208210webencodings==0.5.1 # via bleach, tinycss2
209- websocket-client==1.8.0 # via jupyter-server
210- werkzeug==3.1.3 # via tensorboard
211+ websocket-client==1.9.0 # via jupyter-server
212+ werkzeug==3.1.5 # via tensorboard
211213wheel==0.45.1 # via -r requirements.txt
212- widgetsnbextension==4.0.14 # via ipywidgets
213- xxhash==3.5.0 # via datasets
214- yarl==1.20.1 # via aiohttp
214+ widgetsnbextension==4.0.15 # via ipywidgets
215+ xxhash==3.6.0 # via datasets
216+ yarl==1.22.0 # via aiohttp
0 commit comments