Skip to content

Commit 8447714

Browse files
author
marwan37
committed
re-integrate docker settings and clean up config.yaml
1 parent f501c4a commit 8447714

File tree

3 files changed

+22
-14
lines changed

3 files changed

+22
-14
lines changed

omni-reader/configs/config.yaml

Lines changed: 0 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -15,18 +15,6 @@ parameters:
1515
input_image_paths: []
1616
selected_models: ["gpt4o", "granite", "llava34b", "pixtral", "gemma3", "llava-phi3"]
1717

18-
# Pipeline settings
19-
settings:
20-
docker:
21-
requirements:
22-
- "litellm>=1.10.0"
23-
- "openai>=1.10.0"
24-
- "pillow>=10.0.0"
25-
- "ollama>=0.1.0"
26-
- "jiwer>=3.0.0"
27-
- "textdistance>=4.6.0"
28-
- "polars>=0.19.19"
29-
3018
# Component-specific configurations
3119
steps:
3220
run_ocr:

omni-reader/pipelines/batch_pipeline.py

Lines changed: 11 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,10 +15,12 @@
1515
# limitations under the License.
1616
"""OCR Batch Pipeline implementation for processing images with multiple models."""
1717

18+
import os
1819
from typing import Any, Dict, List, Optional
1920

2021
from dotenv import load_dotenv
2122
from zenml import pipeline
23+
from zenml.config import DockerSettings
2224
from zenml.logger import get_logger
2325

2426
from steps import (
@@ -31,8 +33,16 @@
3133

3234
logger = get_logger(__name__)
3335

36+
docker_settings = DockerSettings(
37+
requirements_file="requirements.txt",
38+
environment={
39+
"OPENAI_API_KEY": os.getenv("OPENAI_API_KEY"),
40+
"MISTRAL_API_KEY": os.getenv("MISTRAL_API_KEY"),
41+
},
42+
)
43+
3444

35-
@pipeline
45+
@pipeline(settings={"docker": docker_settings})
3646
def ocr_batch_pipeline(
3747
image_paths: Optional[List[str]] = None,
3848
image_folder: Optional[str] = None,

omni-reader/pipelines/evaluation_pipeline.py

Lines changed: 11 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -15,11 +15,13 @@
1515
# limitations under the License.
1616
"""OCR Evaluation Pipeline implementation for comparing models using existing results."""
1717

18+
import os
1819
from typing import Any, Dict, List, Optional
1920

2021
import polars as pl
2122
from dotenv import load_dotenv
2223
from zenml import pipeline, step
24+
from zenml.config import DockerSettings
2325
from zenml.logger import get_logger
2426

2527
from steps import (
@@ -33,8 +35,16 @@
3335

3436
logger = get_logger(__name__)
3537

38+
docker_settings = DockerSettings(
39+
requirements_file="requirements.txt",
40+
environment={
41+
"OPENAI_API_KEY": os.getenv("OPENAI_API_KEY"),
42+
"MISTRAL_API_KEY": os.getenv("MISTRAL_API_KEY"),
43+
},
44+
)
45+
3646

37-
@pipeline
47+
@pipeline(settings={"docker": docker_settings})
3848
def ocr_evaluation_pipeline(
3949
model_names: List[str] = None,
4050
results_dir: str = "ocr_results",

0 commit comments

Comments
 (0)