Skip to content
Open
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
266 changes: 135 additions & 131 deletions constraints-dev.txt
Original file line number Diff line number Diff line change
@@ -1,114 +1,118 @@
absl-py==2.3.1 # via tensorboard
accelerate==1.10.1 # via peft, trl, -r requirements-cuda.txt, -r requirements-rocm.txt
aiofiles==24.1.0 # via -r requirements.txt
absl-py==2.4.0 # via tensorboard
accelerate==1.12.0 # via peft, trl, -r requirements-cuda.txt, -r requirements-rocm.txt
aiofiles==25.1.0 # via -r requirements.txt
aiohappyeyeballs==2.6.1 # via aiohttp
aiohttp==3.12.15 # via fsspec
aiohttp==3.13.3 # via fsspec
aiosignal==1.4.0 # via aiohttp
annotated-types==0.7.0 # via pydantic
anyio==4.10.0 # via httpx, jupyter-server
anyio==4.12.1 # via httpx, jupyter-server
argon2-cffi==25.1.0 # via jupyter-server
argon2-cffi-bindings==25.1.0 # via argon2-cffi
arrow==1.3.0 # via isoduration
astroid==3.3.11 # via pylint
asttokens==3.0.0 # via stack-data
async-lru==2.0.5 # via jupyterlab
attrs==25.3.0 # via aiohttp, jsonschema, referencing
babel==2.17.0 # via jupyterlab-server
beautifulsoup4==4.13.5 # via nbconvert
bitsandbytes==0.47.0 # via -r requirements-cuda.txt
bleach==6.2.0 # via nbconvert
cachetools==6.2.0 # via tox
certifi==2025.8.3 # via httpcore, httpx, requests, sentry-sdk
cffi==1.17.1 # via argon2-cffi-bindings
cfgv==3.4.0 # via pre-commit
arrow==1.4.0 # via isoduration
astroid==4.0.3 # via pylint
asttokens==3.0.1 # via stack-data
async-lru==2.1.0 # via jupyterlab
attrs==25.4.0 # via aiohttp, jsonschema, referencing
babel==2.18.0 # via jupyterlab-server
beautifulsoup4==4.14.3 # via nbconvert
bitsandbytes==0.49.1 # via -r requirements-cuda.txt
bleach==6.3.0 # via nbconvert
cachetools==7.0.0 # via tox
causal-conv1d==1.6.0 # via mamba-ssm
certifi==2026.1.4 # via httpcore, httpx, requests, sentry-sdk
cffi==2.0.0 # via argon2-cffi-bindings
cfgv==3.5.0 # via pre-commit
chardet==5.2.0 # via tox
charset-normalizer==3.4.3 # via requests
click==8.2.1 # via wandb
charset-normalizer==3.4.4 # via requests
click==8.3.1 # via typer-slim, wandb
colorama==0.4.6 # via tox
comm==0.2.3 # via ipykernel, ipywidgets
contourpy==1.3.3 # via matplotlib
cycler==0.12.1 # via matplotlib
datasets==4.0.0 # via trl, -r requirements.txt
debugpy==1.8.16 # via ipykernel
datasets==4.5.0 # via trl, -r requirements.txt
debugpy==1.8.20 # via ipykernel
decorator==5.2.1 # via ipython
deepspeed==0.17.5 # via -r requirements-deepspeed.txt
deepspeed==0.18.5 # via -r requirements-deepspeed.txt
defusedxml==0.7.1 # via nbconvert
dill==0.3.8 # via datasets, multiprocess, pylint
dill==0.4.0 # via datasets, multiprocess, pylint
distlib==0.4.0 # via virtualenv
einops==0.8.1 # via deepspeed, flash-attn
executing==2.2.0 # via stack-data
einops==0.8.2 # via deepspeed, flash-attn, mamba-ssm
executing==2.2.1 # via stack-data
fastjsonschema==2.21.2 # via nbformat
filelock==3.19.1 # via datasets, huggingface-hub, torch, tox, transformers, virtualenv
filelock==3.20.3 # via datasets, huggingface-hub, torch, tox, transformers, virtualenv
flash-attn==2.7.4.post1 # via -c constraints-dev.txt.in, -r requirements-cuda.txt, -r requirements-rocm.txt
fonttools==4.59.2 # via matplotlib
fonttools==4.61.1 # via matplotlib
fqdn==1.5.1 # via jsonschema
frozenlist==1.7.0 # via aiohttp, aiosignal
fsspec==2025.3.0 # via datasets, huggingface-hub, torch
frozenlist==1.8.0 # via aiohttp, aiosignal
fsspec==2025.10.0 # via datasets, huggingface-hub, torch
gitdb==4.0.12 # via gitpython
gitpython==3.1.45 # via wandb
grpcio==1.74.0 # via tensorboard
gitpython==3.1.46 # via wandb
grpcio==1.76.0 # via tensorboard
h11==0.16.0 # via httpcore
hf-xet==1.2.0 # via huggingface-hub
hjson==3.1.0 # via deepspeed
httpcore==1.0.9 # via httpx
httpx==0.28.1 # via jupyterlab
huggingface-hub==1.3.4 # via accelerate, datasets, peft, tokenizers, transformers, -r requirements-dev.txt
identify==2.6.13 # via pre-commit
idna==3.10 # via anyio, httpx, jsonschema, requests, yarl
iniconfig==2.1.0 # via pytest
ipykernel==6.30.1 # via jupyter, jupyter-console, jupyterlab, -r requirements-dev.txt
ipython==9.5.0 # via ipykernel, ipywidgets, jupyter-console, -r requirements-dev.txt
httpx==0.28.1 # via datasets, huggingface-hub, jupyterlab
huggingface-hub==1.3.5 # via accelerate, datasets, kernels, peft, tokenizers, transformers, -r requirements-dev.txt
identify==2.6.16 # via pre-commit
idna==3.11 # via anyio, httpx, jsonschema, requests, yarl
iniconfig==2.3.0 # via pytest
ipykernel==7.1.0 # via jupyter, jupyter-console, jupyterlab, -r requirements-dev.txt
ipython==9.9.0 # via ipykernel, ipywidgets, jupyter-console, -r requirements-dev.txt
ipython-pygments-lexers==1.1.1 # via ipython
ipywidgets==8.1.7 # via jupyter
ipywidgets==8.1.8 # via jupyter
isoduration==20.11.0 # via jsonschema
isort==6.0.1 # via pylint, -r requirements-dev.txt
isort==7.0.0 # via pylint, -r requirements-dev.txt
jedi==0.19.2 # via ipython
jinja2==3.1.6 # via jupyter-server, jupyterlab, jupyterlab-server, nbconvert, torch
json5==0.12.1 # via jupyterlab-server
json5==0.13.0 # via jupyterlab-server
jsonpointer==3.0.0 # via jsonschema
jsonschema==4.25.1 # via jupyter-events, jupyterlab-server, nbformat
jsonschema-specifications==2025.4.1 # via jsonschema
jsonschema==4.26.0 # via jupyter-events, jupyterlab-server, nbformat
jsonschema-specifications==2025.9.1 # via jsonschema
jupyter==1.1.1 # via -r requirements-dev.txt
jupyter-client==8.6.3 # via ipykernel, jupyter-console, jupyter-server, nbclient
jupyter-client==8.8.0 # via ipykernel, jupyter-console, jupyter-server, nbclient
jupyter-console==6.6.3 # via jupyter
jupyter-core==5.8.1 # via ipykernel, jupyter-client, jupyter-console, jupyter-server, jupyterlab, nbclient, nbconvert, nbformat
jupyter-core==5.9.1 # via ipykernel, jupyter-client, jupyter-console, jupyter-server, jupyterlab, nbclient, nbconvert, nbformat
jupyter-events==0.12.0 # via jupyter-server
jupyter-lsp==2.3.0 # via jupyterlab
jupyter-server==2.17.0 # via jupyter-lsp, jupyterlab, jupyterlab-server, notebook, notebook-shim
jupyter-server-terminals==0.5.3 # via jupyter-server
jupyterlab==4.4.6 # via jupyter, notebook
jupyter-server-terminals==0.5.4 # via jupyter-server
jupyterlab==4.5.3 # via jupyter, notebook
jupyterlab-pygments==0.3.0 # via nbconvert
jupyterlab-server==2.27.3 # via jupyterlab, notebook
jupyterlab-widgets==3.0.15 # via ipywidgets
jupyterlab-server==2.28.0 # via jupyterlab, notebook
jupyterlab-widgets==3.0.16 # via ipywidgets
kernels==0.12.1 # via -r requirements-cuda.txt
kiwisolver==1.4.9 # via matplotlib
lark==1.2.2 # via rfc3987-syntax
liger-kernel==0.6.2 # via -r requirements-cuda.txt
llvmlite==0.45.0 # via numba
markdown==3.8.2 # via tensorboard
lark==1.3.1 # via rfc3987-syntax
librt==0.7.8 # via mypy
liger-kernel==0.6.4 # via -r requirements-cuda.txt
llvmlite==0.46.0 # via numba
mamba-ssm==2.3.0 # via -r requirements-cuda.txt, -r requirements-rocm.txt
markdown==3.10.1 # via tensorboard
markdown-it-py==4.0.0 # via rich
markupsafe==3.0.2 # via jinja2, nbconvert, werkzeug
matplotlib==3.10.6 # via -r requirements-dev.txt
matplotlib-inline==0.1.7 # via ipykernel, ipython
markupsafe==3.0.3 # via jinja2, nbconvert, werkzeug
matplotlib==3.10.8 # via -r requirements-dev.txt
matplotlib-inline==0.2.1 # via ipykernel, ipython
mccabe==0.7.0 # via pylint
mdurl==0.1.2 # via markdown-it-py
mistune==3.1.4 # via nbconvert
mistune==3.2.0 # via nbconvert
mpmath==1.3.0 # via sympy
msgpack==1.1.1 # via deepspeed
multidict==6.6.4 # via aiohttp, yarl
multiprocess==0.70.16 # via datasets
mypy==1.17.1 # via -r requirements-dev.txt
msgpack==1.1.2 # via deepspeed
multidict==6.7.1 # via aiohttp, yarl
multiprocess==0.70.18 # via datasets
mypy==1.19.1 # via -r requirements-dev.txt
mypy-extensions==1.1.0 # via mypy
nbclient==0.10.2 # via nbconvert
nbconvert==7.16.6 # via jupyter, jupyter-server
nbclient==0.10.4 # via nbconvert
nbconvert==7.17.0 # via jupyter, jupyter-server
nbformat==5.10.4 # via jupyter-server, nbclient, nbconvert
nest-asyncio==1.6.0 # via ipykernel
networkx==3.5 # via torch
ninja==1.13.0 # via deepspeed
nodeenv==1.9.1 # via pre-commit
notebook==7.4.5 # via jupyter
networkx==3.6.1 # via torch
ninja==1.13.0 # via causal-conv1d, deepspeed, mamba-ssm
nodeenv==1.10.0 # via pre-commit
notebook==7.5.3 # via jupyter
notebook-shim==0.2.4 # via jupyterlab, notebook
numba==0.62.1 # via -r requirements.txt
numpy==2.3.3 # via accelerate, bitsandbytes, contourpy, datasets, deepspeed, matplotlib, numba, pandas, peft, tensorboard, transformers, -r requirements-dev.txt, -r requirements.txt
numba==0.63.1 # via -r requirements.txt
numpy==2.3.5 # via accelerate, bitsandbytes, contourpy, datasets, deepspeed, matplotlib, numba, pandas, peft, tensorboard, transformers, -r requirements-dev.txt, -r requirements.txt
nvidia-cublas-cu12==12.4.5.8 # via nvidia-cudnn-cu12, nvidia-cusolver-cu12, torch
nvidia-cuda-cupti-cu12==12.4.127 # via torch
nvidia-cuda-nvrtc-cu12==12.4.127 # via torch
Expand All @@ -123,92 +127,92 @@ nvidia-nccl-cu12==2.21.5 # via torch
nvidia-nvjitlink-cu12==12.4.127 # via nvidia-cusolver-cu12, nvidia-cusparse-cu12, torch
nvidia-nvtx-cu12==12.4.127 # via torch
overrides==7.7.0 # via jupyter-server
packaging==25.0 # via accelerate, datasets, deepspeed, huggingface-hub, ipykernel, jupyter-events, jupyter-server, jupyterlab, jupyterlab-server, matplotlib, nbconvert, peft, pyproject-api, pytest, tensorboard, tox, transformers, wandb, -r requirements.txt
pandas==2.3.2 # via datasets
packaging==26.0 # via accelerate, bitsandbytes, causal-conv1d, datasets, deepspeed, huggingface-hub, ipykernel, jupyter-events, jupyter-server, jupyterlab, jupyterlab-server, kernels, mamba-ssm, matplotlib, nbconvert, peft, pyproject-api, pytest, tensorboard, tox, tox-uv, transformers, trl, wandb, wheel, -r requirements.txt
pandas==3.0.0 # via datasets
pandocfilters==1.5.1 # via nbconvert
parso==0.8.5 # via jedi
pathspec==0.12.1 # via mypy
pathspec==1.0.4 # via mypy
peft==0.18.1 # via -r requirements.txt
pexpect==4.9.0 # via ipython
pillow==11.3.0 # via matplotlib, tensorboard
platformdirs==4.4.0 # via jupyter-core, pylint, tox, virtualenv, wandb
pillow==12.1.0 # via matplotlib, tensorboard
platformdirs==4.5.1 # via jupyter-core, pylint, tox, virtualenv, wandb
pluggy==1.6.0 # via pytest, tox
pre-commit==4.3.0 # via -r requirements-dev.txt
prometheus-client==0.22.1 # via jupyter-server
pre-commit==4.5.1 # via -r requirements-dev.txt
prometheus-client==0.24.1 # via jupyter-server
prompt-toolkit==3.0.52 # via ipython, jupyter-console
propcache==0.3.2 # via aiohttp, yarl
protobuf==6.32.0 # via tensorboard, wandb
psutil==7.0.0 # via accelerate, deepspeed, ipykernel, peft
propcache==0.4.1 # via aiohttp, yarl
protobuf==6.33.5 # via tensorboard, wandb
psutil==7.2.2 # via accelerate, deepspeed, ipykernel, peft
ptyprocess==0.7.0 # via pexpect, terminado
pure-eval==0.2.3 # via stack-data
py-cpuinfo==9.0.0 # via deepspeed, -r requirements.txt
pyarrow==21.0.0 # via datasets
pycparser==2.22 # via cffi
pydantic==2.11.7 # via deepspeed, pylint-pydantic, wandb, -r requirements.txt
pydantic-core==2.33.2 # via pydantic
pyarrow==23.0.0 # via datasets
pycparser==3.0 # via cffi
pydantic==2.12.5 # via deepspeed, pylint-pydantic, wandb, -r requirements.txt
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

⚠️ Potential issue | 🔴 Critical

🧩 Analysis chain

🏁 Script executed:

cat -n constraints-dev.txt | sed -n '145,160p'

Repository: instructlab/training

Length of output: 1129


🏁 Script executed:

cat -n constraints-dev.txt | sed -n '200,210p'

Repository: instructlab/training

Length of output: 798


🌐 Web query:

wandb 0.24.0 pydantic 2.12 UnsupportedFieldAttributeWarning compatibility

💡 Result:

pydantic.warnings.UnsupportedFieldAttributeWarning with Pydantic 2.12.x + wandb (including 0.24.0) is caused by how W&B defines some Annotated[...] type aliases in wandb/_pydantic/field_types.py:

  • Typename = Annotated[T, Field(repr=False, frozen=True, alias="__typename")]
  • GQLId = Annotated[StrictStr, Field(repr=False, frozen=True)]

In Pydantic 2.12, repr and frozen are treated as unsupported/ineffective when used in this “standalone FieldInfo inside a type alias” pattern, so Pydantic emits a warning during import; behavior is unchanged (it was already ignoring those attributes). [1]

What to do

  1. Best fix (eliminate warning): patch W&B locally (until your W&B version includes the change):

    • Edit .../site-packages/wandb/_pydantic/field_types.py
    • Remove repr=False, frozen=True from those Field(...) calls (keep alias="__typename" on Typename). [1]
  2. If you just want it quiet: suppress the warning in your app entrypoint:

    import warnings
    warnings.filterwarnings("ignore", category=UserWarning, module="pydantic")

    (Or target pydantic.warnings.UnsupportedFieldAttributeWarning if you import it.)

If you want, paste the exact warning traceback from your wandb 0.24.0 + pydantic 2.12 environment and I’ll point to the precise file/line(s) it’s coming from in your install.

Sources: [1]


Patch wandb locally to resolve Pydantic 2.12.5 UnsupportedFieldAttributeWarning.

wandb 0.24.0 does not resolve the UnsupportedFieldAttributeWarning with Pydantic 2.12.5. The warning occurs in wandb/_pydantic/field_types.py where repr=False, frozen=True are used in Field() calls within type aliases, which Pydantic 2.12+ treats as unsupported attributes. This will cause warnings during import.

Apply one of these fixes:

  1. Remove unsupported attributes from site-packages/wandb/_pydantic/field_types.py: Remove repr=False, frozen=True from the Field() calls (keep alias="__typename" on Typename).
  2. Suppress the warning in your entrypoint with warnings.filterwarnings("ignore", category=UserWarning, module="pydantic").

Also applies to: 206-206

🤖 Prompt for AI Agents
In `@constraints-dev.txt` at line 151, the wandb import triggers Pydantic
UnsupportedFieldAttributeWarning because Field(...) calls in
wandb/_pydantic/field_types.py use unsupported attributes; open that module and
remove the unsupported keyword args (repr=False, frozen=True) from the
Field(...) invocations (but keep alias="__typename" on the Typename alias), or
alternatively add a one-line suppression in your application entrypoint:
warnings.filterwarnings("ignore", category=UserWarning, module="pydantic") to
silence the warning; target the Field calls and the Typename alias in
wandb/_pydantic/field_types.py (or add the global warnings suppression at your
program start).

pydantic-core==2.41.5 # via pydantic
pygments==2.19.2 # via ipython, ipython-pygments-lexers, jupyter-console, nbconvert, pytest, rich
Comment on lines +151 to 153
Copy link

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

⚠️ Potential issue | 🟠 Major

🧩 Analysis chain

🌐 Web query:

Pydantic 2.12.x breaking changes migration guide

💡 Result:

Below are the important breaking changes introduced in Pydantic 2.12.x and a short, actionable migration checklist.

Key breaking changes (what changed and impact)

  • JSON Schema: dict-valued json_schema_extra is now merged rather than replaced — adjust code that relied on previous replace semantics when generating/modifying JSON Schema. [1]
  • Annotation handling/refactor: annotation injection for known/generic types was refactored and some annotation compatibility errors are moved to validation-time (not import-time) — tests that previously passed may now raise validation errors at runtime. Audit generics, Annotated metadata, and any custom Generic model usage. [1]
  • serialize_as_any / serialization behavior: serialize-as-any behavior changed (affects custom serializers, computed fields, and RootModel serialization); existing serializers may need updates. New flags like exclude_computed_fields and serialize options were added. Run serialization tests and review custom serializer implementations. [1][2]
  • Removal/changes in internal metadata: typed_dict_cls removed from CoreMetadata; don’t rely on that internal metadata. [1]
  • JSON Schema 'allOf' workarounds removed — code expecting the old workarounds in generated JSON Schema should be updated. [1]
  • Examples API: passing a dict to Examples is deprecated — update any code constructing Examples from dicts. [1]
  • Validator/validator-signature behavior: some changes to validator inspection and error messages (including fixes around evaluating annotations) — review model validators and after-model validators (classmethod after-model validators previously erroring were later changed to emit warnings in patch releases). [1][2]
  • Python 3.14 compatibility notes / MISSING sentinel: new MISSING sentinel and initial Python 3.14 support; be aware of MISSING semantics and Python-version-specific edge cases. [1][2]

Migration checklist (practical steps)

  1. Read the 2.12 changelog and release notes (linked below) to see full list of changes and follow-up patch fixes. [1][2].
  2. Pin pydantic-core to the compatible version used by 2.12 (use the release notes / pip metadata) and run your test suite under the target Python versions you support (especially 3.10–3.14). [2]
  3. Run the whole test suite with strict failure (serialization, validation, JSON schema, and any runtime-generate-schema code). Fix failures in:
    • custom validators/serializers (update signatures or logic per new inspection rules). [1][2]
    • serialization paths relying on serialize_as_any, RootModel, or computed fields (consider new exclude_computed_fields option). [1][2]
    • JSON Schema generation code (handle merged json_schema_extra; remove assumptions about 'allOf' workarounds). [1]
  4. Replace any reliance on internal CoreMetadata fields (typed_dict_cls) and stop passing dicts to Examples. [1]
  5. If you used Annotated metadata mutability patterns (re-using FieldInfo objects), review and replace with supported patterns (docs/examples updated). [2]
  6. If you saw after-model validator classmethod errors in 2.12.0, update to accept the new behavior or apply the patched warning semantics in later 2.12.x patch releases; consult the 2.12.x changelog for which patch fixed/regressed which behaviour. [2]
  7. When upgrading in production: roll out in a canary environment, pin to an explicit 2.12.x patch (not just 2.12), and iterate fixes before wide rollout.

Important links (read first)

  • Official changelog (detailed breaking-change list + patch notes). [1]
  • GitHub release notes for v2.12 (notes on specific fixes and follow-up patch releases). [2]
  • v2.12 announcement / upgrade blog post (high-level highlights and migration pointers). [3]
  • Version-compatibility policy (what the project considers breaking vs. allowed changes). [4]

References
[1] Pydantic changelog (v2.12 section).
[2] Pydantic GitHub releases (v2.12.0 → v2.12.x).
[3] Pydantic v2.12 announcement blog post.
[4] Pydantic version compatibility docs.

Would you like a targeted migration patch plan for your codebase? If so, paste a few representative models/serializers/validator snippets and I’ll produce exact changes.


🏁 Script executed:

# Check constraints-dev.txt for full context
head -n 160 constraints-dev.txt | tail -n 30

Repository: instructlab/training

Length of output: 1701


🏁 Script executed:

# Search for Pydantic imports and usage in codebase
rg -i "from pydantic|import pydantic" --type py -A 2 | head -50

Repository: instructlab/training

Length of output: 360


🏁 Script executed:

# Check for Pydantic model definitions in codebase
rg "BaseModel|ConfigDict|field_validator" --type py | head -30

Repository: instructlab/training

Length of output: 1015


🌐 Web query:

deepspeed pydantic 2.12 compatibility

💡 Result:

Short answer: DeepSpeed has migrated to Pydantic v2 (PRs/merges for v2 support exist), so it is generally compatible with Pydantic v2 releases — but you must use a matching pydantic_core version (Pydantic v2.12 enforces an exact pydantic-core pairing). If you see errors, upgrade DeepSpeed to the latest release/commit and ensure pydantic and pydantic-core versions match. (app.semanticdiff.com)

What to do if you hit problems

  • Upgrade DeepSpeed (pip install --upgrade deepspeed or use the repo's latest master/commit where Pydantic v2 migration was merged). (pypi.org)
  • Install matching pydantic_core for your pydantic version (Pydantic v2.12 will error if pydantic_core is incompatible). (pydantic.dev)
  • If errors persist, check DeepSpeed GitHub issues for similar reports (there are older pydantic-related issues) and file an issue with your ds_report output. (github.com)

If you want, tell me the DeepSpeed version and your installed pydantic / pydantic-core versions and I’ll verify compatibility and give exact pip commands.

Citations:


🌐 Web query:

wandb pydantic 2.12 compatibility requirements

💡 Result:

Short answer: Recent wandb SDK releases declare pydantic v2 compatibility (wandb added pydantic>=2.6,<3 in v0.19.0 and later relaxed support for v1/v2), so pydantic 2.12 is within the allowed range — but there are user-reported warnings/bugs when importing wandb with pydantic 2.12 that may require a patch or a temporary pin to an earlier 2.x release. [1][2][3]

Details / action:

  • wandb declared pydantic>=2.6,<3 as a dependency (v0.19.0+). [1]
  • Pydantic 2.12 was released upstream. [3]
  • There is a reported wandb GitHub issue describing warnings with pydantic 2.12+ (UnsupportedFieldAttributeWarning); consider pinning to a known-working 2.x (e.g., 2.11.x) until a wandb fix/release resolves it. [2]

Sources:
[1] wandb SDK release notes (v0.19.0 / changelog).
[2] wandb GitHub issue reporting UnsupportedFieldAttributeWarning with Pydantic 2.12+.
[3] Pydantic v2.12 release announcement.


🏁 Script executed:

# Read the config.py file to check for usage patterns affected by breaking changes
wc -l src/instructlab/training/config.py

Repository: instructlab/training

Length of output: 102


🏁 Script executed:

# Check the actual config.py implementation
cat -n src/instructlab/training/config.py | head -100

Repository: instructlab/training

Length of output: 3328


🏁 Script executed:

# Continue reading config.py to see model implementations and validators
cat -n src/instructlab/training/config.py | tail -n +100 | head -150

Repository: instructlab/training

Length of output: 5630


🏁 Script executed:

# Check if there are any custom serializers, computed fields, or RootModel usage
rg -i "computed_field|root_model|field_serializer|model_serializer|serialize_as_any" --type py

Repository: instructlab/training

Length of output: 46


🏁 Script executed:

# Check for any JSON schema generation or Examples usage in config
rg "json_schema|Examples|model_json_schema" --type py

Repository: instructlab/training

Length of output: 46


🏁 Script executed:

# Check rest of config.py for more details on LoraOptions and any other Config class usage
cat -n src/instructlab/training/config.py | sed -n '135,200p'

Repository: instructlab/training

Length of output: 2234


🏁 Script executed:

# Search for any old-style Config class usage (v1 pattern)
rg "class Config:" --type py -B 5

Repository: instructlab/training

Length of output: 413


🏁 Script executed:

# Check requirements.txt and constraints-dev.txt to understand version pinning strategy
cat requirements.txt | grep -i "pydantic\|deepspeed\|wandb"

Repository: instructlab/training

Length of output: 79


Migrate LoraOptions to Pydantic v2 ConfigDict and evaluate wandb compatibility with 2.12.5.

Pydantic 2.12.5 has documented breaking changes (JSON Schema merging, annotation handling, serialization behavior, and validator signatures). The pinned versions are compatible with deepspeed and pydantic-core, but:

  1. LoraOptions (line 135–136) uses deprecated v1-style class Config: — migrate use_enum_values = True to model_config = ConfigDict(use_enum_values=True) to ensure proper v2 behavior.

  2. wandb has reported UnsupportedFieldAttributeWarning issues with Pydantic 2.12+ — confirm that the current wandb version resolves these warnings, or consider pinning to an earlier 2.x release (e.g., 2.11.x) as a temporary workaround until wandb releases a compatible patch.

  3. Loosen the pydantic constraint in requirements.txt — currently pydantic>=2.7.0 is too broad given 2.12.x breaking changes; update to pydantic>=2.7.0,<2.13 or explicit 2.12.x series if testing confirms stability.

🤖 Prompt for AI Agents
In `@constraints-dev.txt` around lines 151–153, the LoraOptions dataclass uses a
v1-style inner class Config; replace that with Pydantic v2 syntax by adding
model_config = ConfigDict(use_enum_values=True) on LoraOptions (and remove the
class Config block) so enum serialization follows v2 semantics, then run tests.
Also verify wandb compatibility by checking the installed wandb version for
known UnsupportedFieldAttributeWarning with Pydantic 2.12+ and either
upgrade/downgrade wandb to a version that suppresses the warning or pin wandb
accordingly. Finally, tighten the pydantic requirement in requirements (change
loose "pydantic>=2.7.0" to a constrained range like "pydantic>=2.7.0,<2.13" or a
specific 2.12.x) after confirming tests pass.

pylint==3.3.8 # via pylint-plugin-utils, pylint-pydantic, -r requirements-dev.txt
pylint==4.0.4 # via pylint-plugin-utils, pylint-pydantic, -r requirements-dev.txt
pylint-plugin-utils==0.9.0 # via pylint-pydantic
pylint-pydantic==0.3.5 # via -r requirements-dev.txt
pyparsing==3.2.3 # via matplotlib
pyproject-api==1.9.1 # via tox
pytest==8.4.1 # via -r requirements-dev.txt
pylint-pydantic==0.4.1 # via -r requirements-dev.txt
pyparsing==3.3.2 # via matplotlib
pyproject-api==1.10.0 # via tox
pytest==9.0.2 # via -r requirements-dev.txt
python-dateutil==2.9.0.post0 # via arrow, jupyter-client, matplotlib, pandas
python-json-logger==3.3.0 # via jupyter-events
pytz==2025.2 # via pandas
pyyaml==6.0.2 # via accelerate, datasets, huggingface-hub, jupyter-events, peft, pre-commit, transformers, wandb, -r requirements.txt
pyzmq==27.0.2 # via ipykernel, jupyter-client, jupyter-console, jupyter-server
referencing==0.36.2 # via jsonschema, jsonschema-specifications, jupyter-events
regex==2025.8.29 # via transformers
requests==2.32.5 # via datasets, huggingface-hub, jupyterlab-server, transformers, wandb
python-json-logger==4.0.0 # via jupyter-events
pyyaml==6.0.3 # via accelerate, datasets, huggingface-hub, jupyter-events, kernels, peft, pre-commit, transformers, wandb, -r requirements.txt
pyzmq==27.1.0 # via ipykernel, jupyter-client, jupyter-console, jupyter-server
referencing==0.37.0 # via jsonschema, jsonschema-specifications, jupyter-events
regex==2026.1.15 # via transformers
requests==2.32.5 # via datasets, jupyterlab-server, wandb
rfc3339-validator==0.1.4 # via jsonschema, jupyter-events
rfc3986-validator==0.1.1 # via jsonschema, jupyter-events
rfc3987-syntax==1.1.0 # via jsonschema
rich==14.1.0 # via -r requirements.txt
rpds-py==0.27.1 # via jsonschema, referencing
ruff==0.12.11 # via -r requirements-dev.txt
safetensors==0.6.2 # via accelerate, peft, transformers
send2trash==1.8.3 # via jupyter-server
sentry-sdk==2.35.1 # via wandb
setuptools==80.9.0 # via jupyterlab, tensorboard
rich==14.3.2 # via -r requirements.txt
rpds-py==0.30.0 # via jsonschema, referencing
ruff==0.14.14 # via -r requirements-dev.txt
safetensors==0.7.0 # via accelerate, peft, transformers
send2trash==2.1.0 # via jupyter-server
sentry-sdk==2.51.0 # via wandb
setuptools==80.10.2 # via jupyterlab, mamba-ssm, tensorboard
shellingham==1.5.4 # via huggingface-hub
six==1.17.0 # via python-dateutil, rfc3339-validator
smmap==5.0.2 # via gitdb
sniffio==1.3.1 # via anyio
soupsieve==2.8 # via beautifulsoup4
soupsieve==2.8.3 # via beautifulsoup4
stack-data==0.6.3 # via ipython
sympy==1.13.1 # via torch
tensorboard==2.20.0 # via -r requirements-dev.txt
tensorboard-data-server==0.7.2 # via tensorboard
terminado==0.18.1 # via jupyter-server, jupyter-server-terminals
tinycss2==1.4.0 # via bleach
tokenizers==0.22.2 # via transformers
tomlkit==0.13.3 # via pylint
torch==2.6.0 # via accelerate, bitsandbytes, deepspeed, flash-attn, liger-kernel, peft, -c constraints-dev.txt.in, -r requirements.txt
tornado==6.5.2 # via ipykernel, jupyter-client, jupyter-server, jupyterlab, notebook, terminado
tox==4.29.0 # via tox-uv, -r requirements-dev.txt
tox-uv==1.25.0 # via -r requirements-dev.txt
tqdm==4.67.1 # via datasets, deepspeed, huggingface-hub, peft, transformers
tomlkit==0.14.0 # via pylint
torch==2.6.0 # via accelerate, bitsandbytes, causal-conv1d, deepspeed, flash-attn, liger-kernel, mamba-ssm, peft, -c constraints-dev.txt.in, -r requirements.txt
tornado==6.5.4 # via ipykernel, jupyter-client, jupyter-server, jupyterlab, notebook, terminado
tox==4.34.1 # via tox-uv, -r requirements-dev.txt
tox-uv==1.29.0 # via -r requirements-dev.txt
tqdm==4.67.2 # via datasets, deepspeed, huggingface-hub, peft, transformers
traitlets==5.14.3 # via ipykernel, ipython, ipywidgets, jupyter-client, jupyter-console, jupyter-core, jupyter-events, jupyter-server, jupyterlab, matplotlib-inline, nbclient, nbconvert, nbformat
transformers==5.0.0 # via peft, trl, -r requirements.txt
triton==3.2.0 # via liger-kernel, torch
trl==0.22.1 # via -r requirements.txt
types-python-dateutil==2.9.0.20250822 # via arrow
types-pyyaml==6.0.12.20250822 # via -r requirements-dev.txt
types-requests==2.32.4.20250809 # via types-tqdm
transformers==5.0.0 # via mamba-ssm, peft, trl, -r requirements.txt
triton==3.2.0 # via liger-kernel, mamba-ssm, torch
trl==0.27.1 # via -r requirements.txt
typer-slim==0.21.1 # via huggingface-hub, transformers
types-pyyaml==6.0.12.20250915 # via -r requirements-dev.txt
types-requests==2.32.4.20260107 # via types-tqdm
types-tqdm==4.67.0.20250809 # via -r requirements-dev.txt
typing-extensions==4.15.0 # via aiosignal, anyio, beautifulsoup4, huggingface-hub, ipython, mypy, pydantic, pydantic-core, referencing, torch, typing-inspection, wandb
typing-inspection==0.4.1 # via pydantic
tzdata==2025.2 # via pandas
typing-extensions==4.15.0 # via aiosignal, anyio, beautifulsoup4, grpcio, huggingface-hub, ipython, mypy, pydantic, pydantic-core, referencing, torch, typer-slim, typing-inspection, wandb
typing-inspection==0.4.2 # via pydantic
tzdata==2025.3 # via arrow
uri-template==1.3.0 # via jsonschema
urllib3==2.5.0 # via requests, sentry-sdk, types-requests
virtualenv==20.34.0 # via pre-commit, tox
wandb==0.21.3 # via -r requirements-dev.txt
wcwidth==0.2.13 # via prompt-toolkit
webcolors==24.11.1 # via jsonschema
urllib3==2.6.3 # via requests, sentry-sdk, types-requests
uv==0.9.28 # via tox-uv
virtualenv==20.36.1 # via pre-commit, tox
wandb==0.24.1 # via -r requirements-dev.txt
wcwidth==0.5.3 # via prompt-toolkit
webcolors==25.10.0 # via jsonschema
webencodings==0.5.1 # via bleach, tinycss2
websocket-client==1.8.0 # via jupyter-server
werkzeug==3.1.3 # via tensorboard
wheel==0.45.1 # via -r requirements.txt
widgetsnbextension==4.0.14 # via ipywidgets
xxhash==3.5.0 # via datasets
yarl==1.20.1 # via aiohttp
websocket-client==1.9.0 # via jupyter-server
werkzeug==3.1.5 # via tensorboard
wheel==0.46.3 # via -r requirements.txt
widgetsnbextension==4.0.15 # via ipywidgets
xxhash==3.6.0 # via datasets
yarl==1.22.0 # via aiohttp
Loading