|
112 | 112 | "array_api_compat==1.11.2", # only anndata requires |
113 | 113 | "async-timeout==5.0.1", |
114 | 114 | "attrs==25.3.0", |
115 | | - "av==14.2.0", |
| 115 | + "av==14.3.0", |
116 | 116 | "backoff==2.2.1", |
117 | 117 | "beautifulsoup4==4.13.4", |
118 | 118 | "bitsandbytes==0.45.5", |
119 | 119 | "braceexpand==0.1.7", |
120 | | - "certifi==2025.1.31", |
| 120 | + "certifi==2025.4.26", |
121 | 121 | "cffi==1.17.1", |
122 | 122 | "chardet==5.2.0", |
123 | | - "charset-normalizer==3.4.1", # requests requires <4 |
| 123 | + "charset-normalizer==3.4.2", # requests requires <4 |
124 | 124 | "chattts==0.2.3", |
125 | 125 | "click==8.1.8", |
126 | 126 | "cloudpickle==3.1.1", # only required by tiledb-cloud and 3+ is only supported by tiledb-cloud 0.13+ |
127 | 127 | "colorama==0.4.6", |
128 | 128 | "coloredlogs==15.0.1", |
129 | 129 | "contourpy==1.3.2", # only required by matplotlib |
130 | | - "cryptography==44.0.2", # only required by unstructured library |
| 130 | + "cryptography==44.0.3", # only required by unstructured library |
131 | 131 | "ctranslate2==4.6.0", |
132 | 132 | "cycler==0.12.1", |
133 | 133 | "dataclasses-json==0.6.7", |
134 | 134 | "datasets==3.5.0", |
135 | 135 | "deepdiff==8.4.2", # required by unstructured |
136 | 136 | "Deprecated==1.2.18", # only needed by pikepdf |
137 | 137 | "deprecation==2.1.0", # only needed by ocrmypdf |
138 | | - "dill==0.3.8", # datasets 3.5.0 requires <0.3.9; multiprocess 0.70.16 requires >=0.3.8 |
| 138 | + "dill==0.3.8", # datasets 3.5.1 requires <0.3.9; multiprocess 0.70.16 requires >=0.3.8 |
139 | 139 | "distro==1.9.0", |
140 | 140 | "docx2txt==0.9", |
141 | 141 | "einops==0.8.1", |
|
151 | 151 | "fonttools==4.57.0", # only required by matplotlib |
152 | 152 | "frozendict==2.4.6", |
153 | 153 | "frozenlist==1.5.0", |
154 | | - "fsspec==2024.12.0", # datasets 3.5.0 requires <=2024.12.0 |
| 154 | + "fsspec==2025.3.0", # datasets 3.5.1 requires <=2025.3.0 |
| 155 | + "fsspec[http]==2025.3.0", # datasets 3.5.1 requires <=2025.3.0 |
155 | 156 | "greenlet==3.2.1", |
156 | 157 | "gTTS==2.5.4", |
157 | 158 | "h11==0.16.0", |
|
168 | 169 | "importlib_metadata==8.7.0", |
169 | 170 | "Jinja2==3.1.6", |
170 | 171 | "jiter==0.9.0", # required by openai newer versions |
171 | | - "joblib==1.4.2", |
| 172 | + "joblib==1.5.0", |
172 | 173 | "jsonpatch==1.33", |
173 | 174 | "jsonpath-python==1.0.6", |
174 | 175 | "jsonpointer==3.0.0", |
175 | 176 | "kiwisolver==1.4.8", |
176 | | - "langchain==0.3.24", |
| 177 | + "langchain==0.3.25", |
177 | 178 | "langchain-community==0.3.23", |
178 | | - "langchain-core==0.3.56", |
| 179 | + "langchain-core==0.3.58", |
179 | 180 | "langchain-huggingface==0.1.2", |
180 | 181 | "langchain-text-splitters==0.3.8", |
181 | 182 | "langdetect==1.0.9", |
182 | | - "langsmith==0.3.38", |
| 183 | + "langsmith==0.3.42", |
183 | 184 | "llvmlite==0.44.0", # only required by numba |
184 | 185 | "lxml==5.4.0", |
185 | 186 | "Markdown==3.8", |
186 | 187 | "markdown-it-py==3.0.0", |
187 | 188 | "MarkupSafe==3.0.2", |
188 | | - "marshmallow==3.26.1", |
| 189 | + "marshmallow==3.26.1", # dataclasses-json==0.6.7 requires less than 4.0.0 |
189 | 190 | "matplotlib==3.10.1", # uniquely requires pyparsing==3.1.2 cycler==0.12.1 kiwisolver==1.4.5 |
190 | 191 | "mdurl==0.1.2", |
191 | 192 | "more-itertools==10.7.0", |
192 | 193 | "mpmath==1.3.0", # sympy 1.13.1 requires less than 1.4 |
193 | 194 | "msg-parser==1.2.0", |
194 | 195 | "multidict==6.4.3", |
195 | | - "multiprocess==0.70.16", # datasets 3.5.0 requires <0.70.17 |
| 196 | + "multiprocess==0.70.16", # datasets 3.5.1 requires <0.70.17 |
196 | 197 | "mypy-extensions==1.1.0", |
197 | 198 | "natsort==8.4.0", |
198 | 199 | "nest-asyncio==1.6.0", |
|
208 | 209 | "numpy==1.26.4", |
209 | 210 | "ocrmypdf==16.10.1", |
210 | 211 | "olefile==0.47", |
211 | | - "openai==1.76.0", # only required by chat_lm_studio.py script and whispers2t (if using openai vanilla backend) |
| 212 | + "openai==1.77.0", # only required by chat_lm_studio.py script and whispers2t (if using openai vanilla backend) |
212 | 213 | "openai-whisper==20240930", # only required by whisper_s2t (if using openai vanilla backend) |
213 | 214 | "openpyxl==3.1.5", |
214 | 215 | "optimum==1.24.0", |
215 | 216 | "ordered-set==4.1.0", |
216 | 217 | "orderly-set==5.4.0", # deepdiff 8.2.0 requires orderly-set>=5.3.0,<6 |
217 | | - "orjson==3.10.17", |
218 | | - "packaging==24.2", |
| 218 | + "orjson==3.10.18", |
| 219 | + "packaging==24.2", # langchain-core==0.3.58 requires less than 25 |
219 | 220 | "pandas==2.2.3", |
220 | 221 | "pdfminer.six==20250416", # only needed by ocrmypdf |
221 | 222 | "pikepdf==9.7.0", # only needed by ocrmypdf |
|
227 | 228 | "propcache==0.3.1", |
228 | 229 | "protobuf==6.30.2", |
229 | 230 | "psutil==7.0.0", |
230 | | - "pyarrow==19.0.1", |
| 231 | + "pyarrow==20.0.0", |
231 | 232 | "pybase16384==0.3.8", # only required by chattts |
232 | 233 | "pycparser==2.22", |
233 | | - "pydantic==2.11.3", |
234 | | - "pydantic_core==2.33.1", # pydantic 2.11.2 requires pydantic_core==2.33.1 |
235 | | - "pydantic-settings==2.8.1", |
| 234 | + "pydantic==2.11.3", # unstructured-client==0.34.0 requires pydantic>=2.11.2 |
| 235 | + "pydantic_core==2.33.1", # pydantic 2.11.3 requires pydantic_core==2.33.1; pydantic 2.11.4 requires pydantic_core==2.33.2 |
| 236 | + "pydantic-settings==2.8.1", # langchain-community==0.3.23 requires pydantic-settings>=2.4.0,<3.0.0 |
236 | 237 | "Pygments==2.19.1", |
237 | 238 | "PyOpenGL==3.1.9", |
238 | 239 | "PyOpenGL-accelerate==3.1.9", |
|
258 | 259 | "safetensors==0.5.3", |
259 | 260 | "scikit-learn==1.6.1", |
260 | 261 | "scipy==1.15.2", |
261 | | - "sentence-transformers==4.0.2", |
| 262 | + "sentence-transformers==4.1.0", |
262 | 263 | "sentencepiece==0.2.0", |
263 | 264 | "six==1.17.0", |
264 | 265 | "sniffio==1.3.1", |
|
272 | 273 | "tabulate==0.9.0", |
273 | 274 | "tblib==3.1.0", # only tiledb-cloud requires |
274 | 275 | "tenacity==9.1.2", |
275 | | - "termcolor==3.0.1", |
| 276 | + "termcolor==3.1.0", |
276 | 277 | "tessdata==1.0.0", |
277 | 278 | "tessdata.eng==1.0.0", |
278 | 279 | "threadpoolctl==3.6.0", |
|
289 | 290 | "unstructured-client==0.34.0", |
290 | 291 | "tzdata==2025.2", |
291 | 292 | "urllib3==2.4.0", # requests 2.32.3 requires <3 |
292 | | - "vector-quantize-pytorch==1.22.15", |
| 293 | + "vector-quantize-pytorch==1.22.16", |
293 | 294 | "vocos==0.1.0", |
294 | 295 | "watchdog==6.0.0", |
295 | 296 | "webdataset==0.2.111", # required by all TTS libraries |
|
416 | 417 | 'function': 'Qwen', |
417 | 418 | 'precision': 'bfloat16', |
418 | 419 | 'gated': False, |
419 | | - 'max_new_tokens': 4096, |
| 420 | + 'max_new_tokens': 8192, |
420 | 421 | }, |
421 | 422 | 'Mistral Small 3 - 24b': { |
422 | 423 | 'model': 'Mistral Small 3 - 24b', |
|
449 | 450 | 'function': 'Qwen', |
450 | 451 | 'precision': 'bfloat16', |
451 | 452 | 'gated': False, |
452 | | - 'max_new_tokens': 4096, |
| 453 | + 'max_new_tokens': 8192, |
453 | 454 | }, |
454 | 455 | 'GLM4-Z1 - 32b': { |
455 | 456 | 'model': 'GLM4-Z1 - 32b', |
|
1885 | 1886 | "folder": "tenacity" |
1886 | 1887 | }, |
1887 | 1888 | "Tile DB": { |
1888 | | - "URL": "https://docs.tiledb.com/main", |
| 1889 | + "URL": "https://tiledb-inc-tiledb.readthedocs-hosted.com/projects/tiledb-py/en/stable/python-api.html", |
1889 | 1890 | "folder": "tiledb", |
1890 | | - "scraper_class": "TileDBScraper" |
| 1891 | + # "scraper_class": "TileDBScraper" |
| 1892 | + "scraper_class": "ReadthedocsScraper" |
1891 | 1893 | }, |
1892 | 1894 | "tiledb-vector-search": { |
1893 | 1895 | "URL": "https://tiledb-inc.github.io/TileDB-Vector-Search/documentation/", |
|
0 commit comments