docling-project
diff --git a/‎CHANGELOG.md‎
Lines changed: 16 additions & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎docling/backend/msword_backend.py‎
Lines changed: 40 additions & 29 deletions b/‎docling/backend/msword_backend.py‎
Lines changed: 40 additions & 29 deletions
diff --git a/‎docling/cli/main.py‎
Lines changed: 8 additions & 18 deletions b/‎docling/cli/main.py‎
Lines changed: 8 additions & 18 deletions
diff --git a/‎docling/models/document_picture_classifier.py‎
Lines changed: 31 additions & 7 deletions b/‎docling/models/document_picture_classifier.py‎
Lines changed: 31 additions & 7 deletions
diff --git a/‎docling/models/picture_description_base_model.py‎
Lines changed: 12 additions & 0 deletions b/‎docling/models/picture_description_base_model.py‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎docling/models/vlm_models_inline/mlx_model.py‎
Lines changed: 3 additions & 8 deletions b/‎docling/models/vlm_models_inline/mlx_model.py‎
Lines changed: 3 additions & 8 deletions
diff --git a/‎docs/examples/advanced_chunking_and_serialization.ipynb‎
Lines changed: 13 additions & 14 deletions b/‎docs/examples/advanced_chunking_and_serialization.ipynb‎
Lines changed: 13 additions & 14 deletions
diff --git a/‎docs/examples/custom_convert.py‎
Lines changed: 11 additions & 8 deletions b/‎docs/examples/custom_convert.py‎
Lines changed: 11 additions & 8 deletions
@@ -1,3 +1,19 @@
+## [v2.67.0](https://github.com/docling-project/docling/releases/tag/v2.67.0) - 2026-01-09
+
+### Feature
+
+* Enrichment annotations in the new meta format ([#2859](https://github.com/docling-project/docling/issues/2859)) ([`aab3ff5`](https://github.com/docling-project/docling/commit/aab3ff5d82fc54864657c0c2ff8e0aa21461f23f))
+* Add XPU device support for Intel GPUs ([#2809](https://github.com/docling-project/docling/issues/2809)) ([`2b83fdd`](https://github.com/docling-project/docling/commit/2b83fdd0deeec0f1ad016cc78ea42d3144a86cad))
+* Add option to report timings details ([#2772](https://github.com/docling-project/docling/issues/2772)) ([`cbc6537`](https://github.com/docling-project/docling/commit/cbc6537ee856349cef9b1ed453310e269667534c))
+
+### Fix
+
+* Lock new deps and update python 3.14 warnings ([#2844](https://github.com/docling-project/docling/issues/2844)) ([`d9295df`](https://github.com/docling-project/docling/commit/d9295df30202e251c9e282a4d0ce61653c7268b6))
+* Correct type hint for table_structure_options usage ([#2823](https://github.com/docling-project/docling/issues/2823)) ([`a0530a2`](https://github.com/docling-project/docling/commit/a0530a271e5411bae96cfcb8a6ae23b3431a7462))
+* Transformers models lazy-loaded ([#2826](https://github.com/docling-project/docling/issues/2826)) ([`3ef4525`](https://github.com/docling-project/docling/commit/3ef45258b7de6f5efe13b1f5ba392d72e2854349))
+* Font download by passing font_path to RapidOcr ([#2822](https://github.com/docling-project/docling/issues/2822)) ([`ffafe58`](https://github.com/docling-project/docling/commit/ffafe58ad25e0ebdca44a41f8df9f691c9a393bf))
+* **cli:** Add Layout and Table models to --show-external-plugins ([#2832](https://github.com/docling-project/docling/issues/2832)) ([`ed57089`](https://github.com/docling-project/docling/commit/ed5708907fcd29e56b114ce7062c4c2693c67b6b))
+
 ## [v2.66.0](https://github.com/docling-project/docling/releases/tag/v2.66.0) - 2025-12-24
 
 ### Feature
 
@@ -1515,9 +1515,9 @@ def _is_rich_table_cell(self, cell: _Cell) -> bool:
     def _handle_pictures(
         self, drawing_blip: Any, doc: DoclingDocument
     ) -> list[RefItem]:
-        def get_docx_image(drawing_blip: Any) -> Optional[bytes]:
+        def get_docx_image(image: Any) -> Optional[bytes]:
             image_data: Optional[bytes] = None
-            rId = drawing_blip[0].get(
+            rId = image.get(
                 "{http://schemas.openxmlformats.org/officeDocument/2006/relationships}embed"
             )
             if rId in self.docx_obj.part.rels:
@@ -1527,36 +1527,47 @@ def get_docx_image(drawing_blip: Any) -> Optional[bytes]:
             return image_data
 
         elem_ref: list[RefItem] = []
-        level = self._get_level()
-        # Open the BytesIO object with PIL to create an Image
-        image_data: Optional[bytes] = get_docx_image(drawing_blip)
-        if image_data is None:
-            _log.warning("Warning: image cannot be found")
-            p1 = doc.add_picture(
-                parent=self.parents[level - 1],
-                caption=None,
-                content_layer=self.content_layer,
-            )
-            elem_ref.append(p1.get_ref())
-        else:
-            try:
-                image_bytes = BytesIO(image_data)
-                pil_image = Image.open(image_bytes)
-                p2 = doc.add_picture(
-                    parent=self.parents[level - 1],
-                    image=ImageRef.from_pil(image=pil_image, dpi=72),
-                    caption=None,
-                    content_layer=self.content_layer,
-                )
-                elem_ref.append(p2.get_ref())
-            except (UnidentifiedImageError, OSError):
-                _log.warning("Warning: image cannot be loaded by Pillow")
-                p3 = doc.add_picture(
+        if drawing_blip:
+            level = self._get_level()
+            # Multiple images share a PICTURE_AREA group; one image uses the parent
+            parent: Optional[NodeItem] = (
+                self.parents[level - 1]
+                if len(drawing_blip) == 1
+                else doc.add_group(
+                    label=GroupLabel.PICTURE_AREA,
                     parent=self.parents[level - 1],
-                    caption=None,
                     content_layer=self.content_layer,
                 )
-                elem_ref.append(p3.get_ref())
+            )
+            for image in drawing_blip:
+                image_data: Optional[bytes] = get_docx_image(image)
+                if image_data is None:
+                    _log.warning("Warning: image cannot be found")
+                    p1 = doc.add_picture(
+                        parent=parent,
+                        caption=None,
+                        content_layer=self.content_layer,
+                    )
+                    elem_ref.append(p1.get_ref())
+                else:
+                    try:
+                        image_bytes = BytesIO(image_data)
+                        pil_image = Image.open(image_bytes)
+                        p2 = doc.add_picture(
+                            parent=parent,
+                            image=ImageRef.from_pil(image=pil_image, dpi=72),
+                            caption=None,
+                            content_layer=self.content_layer,
+                        )
+                        elem_ref.append(p2.get_ref())
+                    except (UnidentifiedImageError, OSError):
+                        _log.warning("Warning: image cannot be loaded by Pillow")
+                        p3 = doc.add_picture(
+                            parent=parent,
+                            caption=None,
+                            content_layer=self.content_layer,
+                        )
+                        elem_ref.append(p3.get_ref())
         return elem_ref
 
     def _handle_drawingml(self, doc: DoclingDocument, drawingml_els: Any):
 
@@ -833,15 +833,10 @@ def convert(  # noqa: C901
 
                         pipeline_options.vlm_options = SMOLDOCLING_MLX
                     except ImportError:
-                        if sys.version_info < (3, 14):
-                            _log.warning(
-                                "To run SmolDocling faster, please install mlx-vlm:\n"
-                                "pip install mlx-vlm"
-                            )
-                        else:
-                            _log.warning(
-                                "You can run SmolDocling faster with MLX support, but it is unfortunately not yet available on Python 3.14."
-                            )
+                        _log.warning(
+                            "To run SmolDocling faster, please install mlx-vlm:\n"
+                            "pip install mlx-vlm"
+                        )
 
             elif vlm_model == VlmModelType.GRANITEDOCLING:
                 pipeline_options.vlm_options = GRANITEDOCLING_TRANSFORMERS
@@ -851,15 +846,10 @@ def convert(  # noqa: C901
 
                         pipeline_options.vlm_options = GRANITEDOCLING_MLX
                     except ImportError:
-                        if sys.version_info < (3, 14):
-                            _log.warning(
-                                "To run GraniteDocling faster, please install mlx-vlm:\n"
-                                "pip install mlx-vlm"
-                            )
-                        else:
-                            _log.warning(
-                                "You can run GraniteDocling faster with MLX support, but it is unfortunately not yet available on Python 3.14."
-                            )
+                        _log.warning(
+                            "To run GraniteDocling faster, please install mlx-vlm:\n"
+                            "pip install mlx-vlm"
+                        )
 
             elif vlm_model == VlmModelType.SMOLDOCLING_VLLM:
                 pipeline_options.vlm_options = SMOLDOCLING_VLLM
 
@@ -8,8 +8,11 @@
     NodeItem,
     PictureClassificationClass,
     PictureClassificationData,
+    PictureClassificationMetaField,
     PictureItem,
+    PictureMeta,
 )
+from docling_core.types.doc.document import PictureClassificationPrediction
 from PIL import Image
 from pydantic import BaseModel
 
@@ -169,17 +172,38 @@ def __call__(
         outputs = self.document_picture_classifier.predict(images)
 
         for item, output in zip(elements, outputs):
+            predicted_classes = [
+                PictureClassificationClass(
+                    class_name=pred[0],
+                    confidence=pred[1],
+                )
+                for pred in output
+            ]
+
+            # FIXME: annotations is deprecated, remove once all consumers use meta.classification
             item.annotations.append(
                 PictureClassificationData(
                     provenance="DocumentPictureClassifier",
-                    predicted_classes=[
-                        PictureClassificationClass(
-                            class_name=pred[0],
-                            confidence=pred[1],
-                        )
-                        for pred in output
-                    ],
+                    predicted_classes=predicted_classes,
                 )
             )
 
+            # Store classification in the new meta field
+            predictions = [
+                PictureClassificationPrediction(
+                    class_name=pred.class_name,
+                    confidence=pred.confidence,
+                    created_by="DocumentPictureClassifier",
+                )
+                for pred in predicted_classes
+            ]
+            classification_data = PictureClassificationMetaField(
+                predictions=predictions,
+            )
+
+            if item.meta is not None:
+                item.meta.classification = classification_data
+            else:
+                item.meta = PictureMeta(classification=classification_data)
+
             yield item
@@ -4,9 +4,11 @@
 from typing import List, Optional, Type, Union
 
 from docling_core.types.doc import (
+    DescriptionMetaField,
     DoclingDocument,
     NodeItem,
     PictureItem,
+    PictureMeta,
 )
 from docling_core.types.doc.document import (  # TODO: move import to docling_core.types.doc
     PictureDescriptionData,
@@ -80,9 +82,19 @@ def __call__(
         outputs = self._annotate_images(images)
 
         for item, output in zip(elements, outputs):
+            # FIXME: annotations is deprecated, remove once all consumers use meta.description
             item.annotations.append(
                 PictureDescriptionData(text=output, provenance=self.provenance)
             )
+
+            # Store description in the new meta field
+            if item.meta is None:
+                item.meta = PictureMeta()
+            item.meta.description = DescriptionMetaField(
+                text=output,
+                created_by=self.provenance,
+            )
+
             yield item
 
     @classmethod
 
@@ -55,14 +55,9 @@ def __init__(
                 from mlx_vlm.prompt_utils import apply_chat_template  # type: ignore
                 from mlx_vlm.utils import load_config  # type: ignore
             except ImportError:
-                if sys.version_info < (3, 14):
-                    raise ImportError(
-                        "mlx-vlm is not installed. Please install it via `pip install mlx-vlm` to use MLX VLM models."
-                    )
-                else:
-                    raise ImportError(
-                        "mlx-vlm is not installed. It is not yet available on Python 3.14."
-                    )
+                raise ImportError(
+                    "mlx-vlm is not installed. Please install it via `pip install mlx-vlm` to use MLX VLM models."
+                )
 
             repo_cache_folder = vlm_options.repo_id.replace("/", "--")
 
 
@@ -419,7 +419,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -451,19 +451,18 @@
     "        **kwargs: Any,\n",
     "    ) -> SerializationResult:\n",
     "        text_parts: list[str] = []\n",
-    "        for annotation in item.annotations:\n",
-    "            if isinstance(annotation, PictureClassificationData):\n",
-    "                predicted_class = (\n",
-    "                    annotation.predicted_classes[0].class_name\n",
-    "                    if annotation.predicted_classes\n",
-    "                    else None\n",
-    "                )\n",
-    "                if predicted_class is not None:\n",
-    "                    text_parts.append(f\"Picture type: {predicted_class}\")\n",
-    "            elif isinstance(annotation, PictureMoleculeData):\n",
-    "                text_parts.append(f\"SMILES: {annotation.smi}\")\n",
-    "            elif isinstance(annotation, PictureDescriptionData):\n",
-    "                text_parts.append(f\"Picture description: {annotation.text}\")\n",
+    "\n",
+    "        if item.meta is not None:\n",
+    "            if item.meta.classification is not None:\n",
+    "                main_pred = item.meta.classification.get_main_prediction()\n",
+    "                if main_pred is not None:\n",
+    "                    text_parts.append(f\"Picture type: {main_pred.class_name}\")\n",
+    "\n",
+    "            if item.meta.molecule is not None:\n",
+    "                text_parts.append(f\"SMILES: {item.meta.molecule.smi}\")\n",
+    "\n",
+    "            if item.meta.description is not None:\n",
+    "                text_parts.append(f\"Picture description: {item.meta.description.text}\")\n",
     "\n",
     "        text_res = \"\\n\".join(text_parts)\n",
     "        text_res = doc_serializer.post_process(text=text_res)\n",
 
@@ -43,6 +43,7 @@
 from docling.datamodel.base_models import InputFormat
 from docling.datamodel.pipeline_options import (
     PdfPipelineOptions,
+    TableStructureOptions,
 )
 from docling.document_converter import DocumentConverter, PdfFormatOption
 
@@ -65,7 +66,7 @@ def main():
     # pipeline_options = PdfPipelineOptions()
     # pipeline_options.do_ocr = False
     # pipeline_options.do_table_structure = True
-    # pipeline_options.table_structure_options.do_cell_matching = False
+    # pipeline_options.table_structure_options = TableStructureOptions(do_cell_matching=False)
 
     # doc_converter = DocumentConverter(
     #     format_options={
@@ -80,7 +81,7 @@ def main():
     # pipeline_options = PdfPipelineOptions()
     # pipeline_options.do_ocr = True
     # pipeline_options.do_table_structure = True
-    # pipeline_options.table_structure_options.do_cell_matching = True
+    # pipeline_options.table_structure_options = TableStructureOptions(do_cell_matching=True)
 
     # doc_converter = DocumentConverter(
     #     format_options={
@@ -95,7 +96,7 @@ def main():
     # pipeline_options = PdfPipelineOptions()
     # pipeline_options.do_ocr = False
     # pipeline_options.do_table_structure = True
-    # pipeline_options.table_structure_options.do_cell_matching = True
+    # pipeline_options.table_structure_options = TableStructureOptions(do_cell_matching=True)
 
     # doc_converter = DocumentConverter(
     #     format_options={
@@ -110,7 +111,9 @@ def main():
     pipeline_options = PdfPipelineOptions()
     pipeline_options.do_ocr = True
     pipeline_options.do_table_structure = True
-    pipeline_options.table_structure_options.do_cell_matching = True
+    pipeline_options.table_structure_options = TableStructureOptions(
+        do_cell_matching=True
+    )
     pipeline_options.ocr_options.lang = ["es"]
     pipeline_options.accelerator_options = AcceleratorOptions(
         num_threads=4, device=AcceleratorDevice.AUTO
@@ -128,7 +131,7 @@ def main():
     # pipeline_options.do_ocr = True
     # pipeline_options.ocr_options.use_gpu = False  # <-- set this.
     # pipeline_options.do_table_structure = True
-    # pipeline_options.table_structure_options.do_cell_matching = True
+    # pipeline_options.table_structure_options = TableStructureOptions(do_cell_matching=True)
 
     # doc_converter = DocumentConverter(
     #     format_options={
@@ -141,7 +144,7 @@ def main():
     # pipeline_options = PdfPipelineOptions()
     # pipeline_options.do_ocr = True
     # pipeline_options.do_table_structure = True
-    # pipeline_options.table_structure_options.do_cell_matching = True
+    # pipeline_options.table_structure_options = TableStructureOptions(do_cell_matching=True)
     # pipeline_options.ocr_options = TesseractOcrOptions()
 
     # doc_converter = DocumentConverter(
@@ -155,7 +158,7 @@ def main():
     # pipeline_options = PdfPipelineOptions()
     # pipeline_options.do_ocr = True
     # pipeline_options.do_table_structure = True
-    # pipeline_options.table_structure_options.do_cell_matching = True
+    # pipeline_options.table_structure_options = TableStructureOptions(do_cell_matching=True)
     # pipeline_options.ocr_options = TesseractCliOcrOptions()
 
     # doc_converter = DocumentConverter(
@@ -169,7 +172,7 @@ def main():
     # pipeline_options = PdfPipelineOptions()
     # pipeline_options.do_ocr = True
     # pipeline_options.do_table_structure = True
-    # pipeline_options.table_structure_options.do_cell_matching = True
+    # pipeline_options.table_structure_options = TableStructureOptions(do_cell_matching=True)
     # pipeline_options.ocr_options = OcrMacOptions()
 
     # doc_converter = DocumentConverter(