@@ -15,7 +15,7 @@ def test_dag_loads(self):
1515 """Ensure the DAG is registered with the expected ID and task."""
1616 self .assertEqual (DAG .dag_id , "ocrmypdf_batch" )
1717 task_ids = [task .task_id for task in DAG .tasks ]
18- self .assertEqual (task_ids , ["run_ocrmypdf" , "move_processed_pdfs" , "success" ])
18+ self .assertEqual (task_ids , ["run_ocrmypdf" , "success" ])
1919
2020 @mock .patch ("centralized_metadata.optimize_pdf_dag.run_and_stream" )
2121 def test_process_pdfs_runs_command_per_file (self , mock_run_and_stream ):
@@ -26,21 +26,30 @@ def test_process_pdfs_runs_command_per_file(self, mock_run_and_stream):
2626 open (pdf_one , "wb" ).close ()
2727 open (pdf_two , "wb" ).close ()
2828
29+ def fake_run (command , prefix = None ):
30+ Path (command [5 ]).write_bytes (b"optimized" )
31+
32+ mock_run_and_stream .side_effect = fake_run
33+
2934 result = process_pdfs (params = {"pdf_directory" : tmp_dir })
3035
3136 self .assertEqual (
3237 result ,
3338 [
3439 {
35- "original" : pdf_one ,
40+ "original" : os .path .realpath (
41+ os .path .join (tmp_dir , "Originals" , "file_one.pdf" )
42+ ),
3643 "optimized" : os .path .realpath (
37- os .path .join (tmp_dir , "file_one_opti.pdf" )
44+ os .path .join (tmp_dir , "Optimized" , "file_one_opti.pdf" )
3845 ),
3946 },
4047 {
41- "original" : pdf_two ,
48+ "original" : os .path .realpath (
49+ os .path .join (tmp_dir , "Originals" , "file_two.pdf" )
50+ ),
4251 "optimized" : os .path .realpath (
43- os .path .join (tmp_dir , "file_two_opti.pdf" )
52+ os .path .join (tmp_dir , "Optimized" , "file_two_opti.pdf" )
4453 ),
4554 },
4655 ],
@@ -61,6 +70,13 @@ def test_process_pdfs_runs_command_per_file(self, mock_run_and_stream):
6170 )
6271 self .assertEqual (call_args .kwargs .get ("prefix" ), expected_file .name )
6372
73+ originals_dir = Path (tmp_dir ) / "Originals"
74+ optimized_dir = Path (tmp_dir ) / "Optimized"
75+ self .assertTrue ((originals_dir / "file_one.pdf" ).exists ())
76+ self .assertTrue ((originals_dir / "file_two.pdf" ).exists ())
77+ self .assertTrue ((optimized_dir / "file_one_opti.pdf" ).exists ())
78+ self .assertTrue ((optimized_dir / "file_two_opti.pdf" ).exists ())
79+
6480 @mock .patch ("centralized_metadata.optimize_pdf_dag.run_and_stream" )
6581 def test_process_pdfs_handles_empty_directory (self , mock_run_and_stream ):
6682 """Confirm we short-circuit gracefully when no PDFs exist."""
@@ -77,6 +93,11 @@ def test_process_pdfs_prefers_dag_run_conf(self, mock_run_and_stream):
7793 pdf_path = os .path .realpath (os .path .join (tmp_dir , "file.pdf" ))
7894 open (pdf_path , "wb" ).close ()
7995
96+ def fake_run (command , prefix = None ):
97+ Path (command [5 ]).write_text ("optimized" )
98+
99+ mock_run_and_stream .side_effect = fake_run
100+
80101 dag_run_mock = mock .Mock ()
81102 dag_run_mock .conf = {"pdf_directory" : tmp_dir }
82103
@@ -88,9 +109,11 @@ def test_process_pdfs_prefers_dag_run_conf(self, mock_run_and_stream):
88109 result ,
89110 [
90111 {
91- "original" : pdf_path ,
112+ "original" : os .path .realpath (
113+ os .path .join (tmp_dir , "Originals" , "file.pdf" )
114+ ),
92115 "optimized" : os .path .realpath (
93- os .path .join (tmp_dir , "file_opti.pdf" )
116+ os .path .join (tmp_dir , "Optimized" , "file_opti.pdf" )
94117 ),
95118 }
96119 ],
@@ -111,6 +134,11 @@ def test_process_pdfs_uses_share_root_and_relative_path(
111134 pdf_path = target_dir / "variable.pdf"
112135 pdf_path .touch ()
113136
137+ def fake_run (command , prefix = None ):
138+ Path (command [5 ]).write_bytes (b"optimized" )
139+
140+ mock_run_and_stream .side_effect = fake_run
141+
114142 def fake_variable_get (key , default_var = None ):
115143 if key == "OCR_PDF_SHARE_ROOT" :
116144 return share_root
@@ -126,8 +154,8 @@ def fake_variable_get(key, default_var=None):
126154 result ,
127155 [
128156 {
129- "original" : str (pdf_path .resolve ()),
130- "optimized" : str ((target_dir / "variable_opti.pdf" ).resolve ()),
157+ "original" : str ((target_dir / "Originals" / "variable.pdf" ).resolve ()),
158+ "optimized" : str ((target_dir / "Optimized" / "variable_opti.pdf" ).resolve ()),
131159 }
132160 ],
133161 )
0 commit comments