|
156 | 156 | "bitsandbytes==0.47.0", |
157 | 157 | "braceexpand==0.1.7", |
158 | 158 | "certifi==2025.8.3", |
159 | | - "cffi==1.17.1", |
| 159 | + "cffi==2.0.0", |
160 | 160 | "chardet==5.2.0", |
161 | 161 | "charset-normalizer==3.4.3", # requests requires <4 |
162 | 162 | "git+https://github.com/BBC-Esq/chatterbox-light", |
|
166 | 166 | "colorama==0.4.6", |
167 | 167 | "coloredlogs==15.0.1", |
168 | 168 | "contourpy==1.3.3", # only required by matplotlib |
169 | | - "cryptography==45.0.6", # only required by unstructured and pdfminer.six |
| 169 | + "cryptography==45.0.7", # only required by unstructured and pdfminer.six |
170 | 170 | "ctranslate2==4.6.0", |
171 | 171 | "cycler==0.12.1", |
172 | 172 | "dataclasses-json==0.6.7", |
173 | 173 | "datasets==4.0.0", |
174 | | - "deepdiff==8.6.0", # required by unstructured |
| 174 | + "deepdiff==8.6.1", # required by unstructured |
175 | 175 | "Deprecated==1.2.18", # only needed by pikepdf |
176 | 176 | "deprecation==2.1.0", # only needed by ocrmypdf |
177 | 177 | "diffusers==0.35.1", # required by chatterbox-lite |
|
196 | 196 | "gTTS==2.5.4", |
197 | 197 | "h11==0.16.0", |
198 | 198 | "h5py==3.14.0", |
199 | | - "hf-xet==1.1.9", |
| 199 | + "hf-xet==1.1.10", |
200 | 200 | "html5lib==1.1", # only required by unstructured |
201 | 201 | "httpcore==1.0.9", |
202 | 202 | "httpx==0.28.1", |
|
209 | 209 | "importlib_metadata==8.7.0", |
210 | 210 | "Jinja2==3.1.6", |
211 | 211 | "jiter==0.10.0", # required by openai newer versions |
212 | | - "joblib==1.5.1", |
| 212 | + "joblib==1.5.2", |
213 | 213 | "jsonpatch==1.33", |
214 | 214 | "jsonpath-python==1.0.6", |
215 | 215 | "jsonpointer==3.0.0", |
216 | 216 | "kiwisolver==1.4.9", |
217 | 217 | "langchain==0.3.27", |
218 | 218 | "langchain-community==0.3.29", |
219 | | - "langchain-core==0.3.75", |
| 219 | + "langchain-core==0.3.76", |
220 | 220 | "langchain-huggingface==0.3.1", |
221 | | - "langchain-text-splitters==0.3.10", |
| 221 | + "langchain-text-splitters==0.3.11", |
222 | 222 | "langdetect==1.0.9", |
223 | 223 | "langsmith==0.4.14", |
224 | 224 | "llvmlite==0.44.0", # only required by numba |
225 | 225 | "lxml==6.0.1", |
226 | | - "Markdown==3.8.2", |
| 226 | + "Markdown==3.9", |
227 | 227 | "markdown-it-py==4.0.0", |
228 | 228 | "MarkupSafe==3.0.2", |
229 | 229 | "marshmallow==3.26.1", # dataclasses-json requires <4.0.0 |
230 | 230 | "matplotlib==3.10.6", # uniquely requires pyparsing, cycler, and kiwisolver |
231 | 231 | "mdurl==0.1.2", |
232 | | - "more-itertools==10.7.0", |
| 232 | + "more-itertools==10.8.0", |
233 | 233 | # "moshi==0.2.8", # installed at runtime if needed |
234 | 234 | "mpmath==1.3.0", # sympy 1.13.1 requires <1.4 |
235 | 235 | "msg-parser==1.2.0", |
|
245 | 245 | "ocrmypdf==16.10.4", |
246 | 246 | "olefile==0.47", |
247 | 247 | "onnx==1.19.0", # required by chatterbox-lite |
248 | | - "openai==1.102.0", # only required by chat_lm_studio.py script and whispers2t (if using openai vanilla backend) |
| 248 | + "openai==1.107.0", # only required by chat_lm_studio.py script and whispers2t (if using openai vanilla backend) |
249 | 249 | "openai-whisper==20250625", # only required by whisper_s2t (if using openai vanilla backend) |
250 | 250 | "openpyxl==3.1.5", |
251 | 251 | "optimum==1.27.0", |
|
255 | 255 | "packaging==25.0", |
256 | 256 | "pandas==2.3.2", |
257 | 257 | "pdfminer.six==20250506", # ocrmypdf 16.10.1 requires >=20220319 |
258 | | - "pikepdf==9.10.2", # only needed by ocrmypdf |
| 258 | + "pikepdf==9.11.0", # only needed by ocrmypdf |
259 | 259 | "pillow==11.3.0", |
260 | 260 | # "pi-heif==0.22.0", # only needed by ocrmypdf, but not for my usage of ocrmypdf |
261 | 261 | "pipdeptree", |
262 | 262 | "platformdirs==4.4.0", |
263 | 263 | "pluggy==1.6.0", # only needed by ocrmypdf |
264 | 264 | "propcache==0.3.2", |
265 | | - "protobuf==6.32.0", |
| 265 | + "protobuf==6.32.1", |
266 | 266 | "psutil==7.0.0", |
267 | 267 | "pyarrow==21.0.0", |
268 | 268 | "pybase16384==0.3.8", # only required by chattts |
269 | | - "pycparser==2.22", |
270 | | - "pydantic==2.11.7", |
271 | | - "pydantic_core==2.37.2", # pydantic 2.11.7 requires ==2.37.2; CAUTION, package checker is incorrect, check repo instead |
| 269 | + "pycparser==2.23", |
| 270 | + "pydantic==2.11.8", |
| 271 | + "pydantic_core==2.37.2", # pydantic 2.11.8 is noted as requiring 2.38.0, but this pin is still 2.37.2 - verify before installing; CAUTION, check pyproject.toml from pydantic repo instead |
272 | 272 | "pydantic-settings==2.10.1", # langchain-community requires >=2.4.0,<3.0.0 |
273 | 273 | "Pygments==2.19.2", |
274 | 274 | "PyOpenGL==3.1.10", |
|
285 | 285 | "python-oxmsg==0.0.2", # only required by unstructured library |
286 | 286 | "pytz==2025.2", |
287 | 287 | "PyYAML==6.0.2", |
288 | | - "rapidfuzz==3.14.0", |
289 | | - "regex==2025.8.29", |
| 288 | + "rapidfuzz==3.14.1", |
| 289 | + "regex==2025.9.1", |
290 | 290 | "requests==2.32.5", |
291 | 291 | "requests-toolbelt==1.0.0", |
292 | 292 | "rich==14.1.0", |
293 | 293 | "ruamel.yaml==0.18.15", |
294 | 294 | "ruamel.yaml.clib==0.2.12", |
295 | 295 | "s3tokenizer==0.2.0", # required by chatterbox-lite |
296 | 296 | "safetensors==0.6.2", |
297 | | - "scikit-learn==1.7.1", |
298 | | - "scipy==1.16.1", |
| 297 | + "scikit-learn==1.7.2", |
| 298 | + "scipy==1.16.2", |
299 | 299 | "sentence-transformers==4.1.0", |
300 | 300 | "sentencepiece==0.2.1", |
301 | 301 | "six==1.17.0", |
|
319 | 319 | "threadpoolctl==3.6.0", |
320 | 320 | "tiktoken==0.11.0", |
321 | 321 | "tiledb==0.34.2", |
322 | | - "tiledb-cloud==0.13.0", |
| 322 | + "tiledb-cloud==0.14.1", |
323 | 323 | "tiledb-vector-search==0.13.0", |
324 | 324 | "timm==1.0.19", |
325 | 325 | "tokenizers==0.22.0", |
326 | 326 | "tqdm==4.67.1", |
327 | | - "transformers==4.56.1", |
| 327 | + # "transformers==4.56.1", |
| 328 | + "git+https://github.com/huggingface/transformers@v4.56.0-Embedding-Gemma-preview", |
328 | 329 | "typing-inspection==0.4.1", # required by pydantic and pydantic-settings |
329 | 330 | "typing_extensions==4.15.0", |
330 | 331 | "unstructured-client==0.42.3", |
|
333 | 334 | "vector-quantize-pytorch==1.23.2", |
334 | 335 | "vocos==0.1.0", |
335 | 336 | "watchdog==6.0.0", |
336 | | - "webdataset==0.2.111", # only requires by Whisperspeech; next is 1.0.2 so hesitate to upgrade |
| 337 | + "webdataset==1.0.2", # only required by Whisperspeech; upgraded from 0.2.111 (major version jump, so watch for breakage) |
337 | 338 | "webencodings==0.5.1", # only required by html5lib |
338 | 339 | "wrapt==1.17.3", |
339 | 340 | "xlrd==2.0.2", |
|
628 | 629 | 'license': 'mit', |
629 | 630 | }, |
630 | 631 | ], |
631 | | - # 'Google': [ |
632 | | - # { |
633 | | - # 'name': 'embeddinggemma-300m', |
634 | | - # 'dimensions': 768, |
635 | | - # 'max_sequence': 2048, |
636 | | - # 'size_mb': 1210, |
637 | | - # 'repo_id': 'google/embeddinggemma-300m', |
638 | | - # 'cache_dir': 'google--embeddinggemma-300m', |
639 | | - # 'type': 'vector', |
640 | | - # 'parameters': '303m', |
641 | | - # 'precision': 'float32', |
642 | | - # 'license': 'gemma - commercial ok', |
643 | | - # }, |
644 | | - # ], |
| 632 | + 'Google': [ |
| 633 | + { |
| 634 | + 'name': 'embeddinggemma-300m', |
| 635 | + 'dimensions': 768, |
| 636 | + 'max_sequence': 2048, |
| 637 | + 'size_mb': 1210, |
| 638 | + 'repo_id': 'google/embeddinggemma-300m', |
| 639 | + 'cache_dir': 'google--embeddinggemma-300m', |
| 640 | + 'type': 'vector', |
| 641 | + 'parameters': '303m', |
| 642 | + 'precision': 'float32', |
| 643 | + 'license': 'gemma - commercial ok', |
| 644 | + }, |
| 645 | + ], |
645 | 646 | 'IBM': [ |
646 | 647 | { |
647 | 648 | 'name': 'Granite-30m-English', |
|
882 | 883 | 'avg_length': 975, |
883 | 884 | 'loader': 'loader_qwenvl', |
884 | 885 | 'vision_component': 'Custom ViT', |
885 | | - 'chat_component': 'Qwen2.5-VL-3B-Instruct', |
| 886 | + 'chat_component': 'Qwen2.5-3B-Instruct', |
886 | 887 | 'license': 'Custom Non-Commercial', |
887 | 888 | }, |
888 | 889 | 'InternVL3 - 8b': { |
|
910 | 911 | 'avg_length': 918, |
911 | 912 | 'loader': 'loader_qwenvl', |
912 | 913 | 'vision_component': 'Custom ViT', |
913 | | - 'chat_component': 'Qwen2.5-VL-3B-Instruct', |
| 914 | + 'chat_component': 'Qwen2.5-7B-Instruct', |
914 | 915 | 'license': 'Custom Non-Commercial', |
915 | 916 | }, |
916 | 917 | 'GLM-4.1V-9B-Thinking': { |
|
0 commit comments