|
1 | 1 | from collections import deque |
| 2 | +from unittest.mock import Mock |
2 | 3 |
|
3 | 4 | import pytest |
4 | 5 | import yaml |
|
7 | 8 |
|
8 | 9 | from docling_core.types.doc.document import ( |
9 | 10 | CURRENT_VERSION, |
| 11 | + BoundingBox, |
10 | 12 | DocItem, |
11 | 13 | DoclingDocument, |
12 | 14 | DocumentOrigin, |
|
15 | 17 | KeyValueItem, |
16 | 18 | ListItem, |
17 | 19 | PictureItem, |
| 20 | + ProvenanceItem, |
18 | 21 | SectionHeaderItem, |
| 22 | + Size, |
19 | 23 | TableCell, |
20 | 24 | TableData, |
21 | 25 | TableItem, |
@@ -407,3 +411,127 @@ def test_version_doc(): |
407 | 411 | comp_version = f"{major_split[0]}.{minor_split[0]}.{int(patch_split[0]) + 1}" |
408 | 412 | doc = DoclingDocument(name="Untitled 1", version=comp_version) |
409 | 413 | assert doc.version == CURRENT_VERSION |
| 414 | + |
| 415 | + |
def test_docitem_get_image():
    """Exercise ``DocItem.get_image`` with missing and with usable page images.

    The document gets two pages: page 1 carries a page image, page 2 does not.
    Items that have no provenance, point at a page that was never added, or
    point at the image-less page must yield ``None``; an item located on
    page 1 must yield the expected crop.
    """
    document = DoclingDocument(name="Dummy")

    # Black 200x400 page image with a red 20x40 patch pasted at (20, 40).
    expected_crop = PILImage.new(mode="RGB", size=(20, 40), color=(255, 0, 0))
    page_image = PILImage.new(mode="RGB", size=(200, 400), color=(0, 0, 0))
    page_image.paste(expected_crop, box=(20, 40))

    # Page 1 has an image; page 2 is registered without one.
    document.add_page(
        page_no=1,
        size=Size(width=20, height=40),
        image=ImageRef.from_pil(page_image, dpi=72),
    )
    document.add_page(page_no=2, size=Size(width=20, height=40), image=None)

    # Scenarios that must return None, in order:
    #   None -> item without any provenance
    #   3    -> item on a page that was never added to the document
    #   2    -> item on a page that has no page image
    for page_no in (None, 3, 2):
        if page_no is None:
            provenance = []
        else:
            provenance = [
                ProvenanceItem(
                    page_no=page_no,
                    bbox=Mock(spec=BoundingBox),
                    charspan=(1, 2),
                )
            ]
        item = DocItem(self_ref="#", label=DocItemLabel.TEXT, prov=provenance)
        assert item.get_image(doc=document) is None

    # Item on the page that does have an image: the crop must match the patch.
    located_item = DocItem(
        self_ref="#",
        label=DocItemLabel.TEXT,
        prov=[
            ProvenanceItem(
                page_no=1,
                bbox=BoundingBox(l=2, t=4, r=4, b=8),
                charspan=(1, 2),
            )
        ],
    )
    cropped = located_item.get_image(doc=document)
    assert cropped is not None
    assert cropped.tobytes() == expected_crop.tobytes()
| 467 | + |
def test_floatingitem_get_image():
    """Exercise ``FloatingItem.get_image`` with and without an explicit image.

    The document gets two pages: page 1 carries a page image, page 2 does not.
    An item holding its own image must return that image; items without one
    are then checked against the same provenance scenarios as a plain
    ``DocItem``.
    """
    document = DoclingDocument(name="Dummy")

    # Black 200x400 page image with a red 20x40 patch pasted at (20, 40).
    expected_crop = PILImage.new(mode="RGB", size=(20, 40), color=(255, 0, 0))
    page_image = PILImage.new(mode="RGB", size=(200, 400), color=(0, 0, 0))
    page_image.paste(expected_crop, box=(20, 40))

    # Page 1 has an image; page 2 is registered without one.
    document.add_page(
        page_no=1,
        size=Size(width=20, height=40),
        image=ImageRef.from_pil(page_image, dpi=72),
    )
    document.add_page(page_no=2, size=Size(width=20, height=40), image=None)

    # Explicit image that differs from what the provenance would produce:
    # the item's own (green) image is the one expected back.
    own_image = PILImage.new(mode="RGB", size=(40, 80), color=(0, 255, 0))
    item_with_image = FloatingItem(
        self_ref="#",
        label=DocItemLabel.PICTURE,
        prov=[
            ProvenanceItem(
                page_no=1,
                bbox=BoundingBox(l=2, t=4, r=6, b=12),
                charspan=(1, 2),
            )
        ],
        image=ImageRef.from_pil(image=own_image, dpi=72),
    )
    returned_image = item_with_image.get_image(doc=document)
    assert returned_image is not None
    assert returned_image.tobytes() == own_image.tobytes()

    # Scenarios without an explicit image that must return None, in order:
    #   None -> no provenance at all
    #   3    -> provenance on a page that was never added to the document
    #   2    -> provenance on a page that has no page image
    for page_no in (None, 3, 2):
        if page_no is None:
            provenance = []
        else:
            provenance = [
                ProvenanceItem(
                    page_no=page_no,
                    bbox=Mock(spec=BoundingBox),
                    charspan=(1, 2),
                )
            ]
        item = FloatingItem(
            self_ref="#",
            label=DocItemLabel.PICTURE,
            prov=provenance,
            image=None,
        )
        assert item.get_image(doc=document) is None

    # No explicit image, but located on the page that has a page image:
    # the result must match the red patch.
    located_item = FloatingItem(
        self_ref="#",
        label=DocItemLabel.PICTURE,
        prov=[
            ProvenanceItem(
                page_no=1,
                bbox=BoundingBox(l=2, t=4, r=4, b=8),
                charspan=(1, 2),
            )
        ],
        image=None,
    )
    returned_image = located_item.get_image(doc=document)
    assert returned_image is not None
    assert returned_image.tobytes() == expected_crop.tobytes()
0 commit comments