Update tests

cschloer · cschloer · commit 22540a70bb83 · 2025-08-28T13:14:23.000+02:00
diff --git a/data/test_floating_point_error2.xlsx b/data/test_floating_point_error2.xlsx
diff --git a/tests/processors/test_dump_to_s3.py b/tests/processors/test_dump_to_s3.py
@@ -298,15 +298,20 @@ def test_large_dump_s3():
     server = ThreadedMotoServer()
     server.start()
     os.environ["LAMINAR_S3_HOST"] = "http://localhost:5000"
-    
+
     # Disable checksum validation to fix moto compatibility issues
     # Monkey patch the checksum validation to avoid moto checksum mismatch
     import botocore.httpchecksum
+
     original_validate = botocore.httpchecksum.StreamingChecksumBody._validate_checksum
+
     def mock_validate_checksum(self):
         pass  # Skip checksum validation for moto
-    botocore.httpchecksum.StreamingChecksumBody._validate_checksum = mock_validate_checksum
-    
+
+    botocore.httpchecksum.StreamingChecksumBody._validate_checksum = (
+        mock_validate_checksum
+    )
+
     try:
         # create bucket and put objects
         conn = boto3.client("s3", endpoint_url="http://localhost:5000")
@@ -356,5 +361,70 @@ def mock_validate_checksum(self):
         assert datapackage.descriptor["count_of_rows"] == num_rows
     finally:
         # Restore original checksum validation
-        botocore.httpchecksum.StreamingChecksumBody._validate_checksum = original_validate
+        botocore.httpchecksum.StreamingChecksumBody._validate_checksum = (
+            original_validate
+        )
         server.stop()
+
+
+@mock_aws
+@pytest.mark.skipif(TEST_DEV, reason="test development")
+def test_dump_xlsx_rounding():
+    server = ThreadedMotoServer()
+    server.start()
+    os.environ["LAMINAR_S3_HOST"] = "http://localhost:5000"
+    # create bucket and put objects
+    conn = boto3.client("s3", endpoint_url="http://localhost:5000")
+    conn.create_bucket(Bucket="testing_bucket")
+    conn.create_bucket(Bucket="testing_dump_bucket")
+    conn.upload_file(
+        "data/test_floating_point_error2.xlsx",
+        "testing_bucket",
+        "test_floating_point_error2.xlsx",
+    )
+
+    flows = [
+        load(
+            {
+                "from": "s3://testing_bucket/test_floating_point_error2.xlsx",
+                "name": "res",
+                "format": "xlsx",
+                "sheet": 1,
+                "preserve_formatting": True,
+                "adjust_floating_point_error": True,
+                "infer_strategy": "strings",
+                "cast_strategy": "strings",
+            }
+        ),
+        dump_to_s3(
+            {
+                "prefix": "test",
+                "force-format": True,
+                "format": "csv",
+                "save_pipeline_spec": True,
+                "temporal_format_property": "outputFormat",
+                "bucket_name": "testing_dump_bucket",
+                "data_manager": "test",
+            }
+        ),
+    ]
+
+    rows, datapackage, _ = Flow(*flows).results()
+    body = (
+        conn.get_object(Bucket="testing_dump_bucket", Key="test/res.csv")["Body"]
+        .read()
+        .decode("utf-8")
+    )
+
+    assert len(body)
+    assert len(datapackage.resources) == 1
+    csv_file = io.StringIO(body)
+    reader = csv.reader(csv_file)
+    dumped_rows = []
+    for row in reader:
+        dumped_rows.append(row)
+
+    # print(dumped_rows)
+    assert dumped_rows[34][15] == rows[0][33]["ChlaYSI"]
+    assert dumped_rows[34][15] == "1.23"
+    server.stop()
diff --git a/tests/processors/test_load.py b/tests/processors/test_load.py
@@ -692,6 +692,7 @@ def test_load_csv_multiline_header():
     assert datapackage.resources[0].schema.fields[0].name == "1;5"
     assert datapackage.resources[0].schema.fields[2].name == "3;3"
 
+
 @pytest.mark.skipif(TEST_DEV, reason="test development")
 def test_floating_point_error():
     flows = [
@@ -701,6 +702,7 @@ def test_floating_point_error():
                 "name": "res",
                 "format": "xlsx",
                 "sheet": 1,
+                "adjust_floating_point_error": True,
                 "preserve_formatting": True,
                 "infer_strategy": "strings",
                 "cast_strategy": "strings",
@@ -712,3 +714,24 @@ def test_floating_point_error():
     assert len(rows) == 1
     assert str(rows[0][6]["Temp"]) == "23.5"
 
+
+@pytest.mark.skipif(TEST_DEV, reason="test development")
+def test_floating_point_error_2():
+    flows = [
+        load(
+            {
+                "from": "data/test_floating_point_error2.xlsx",
+                "name": "res",
+                "format": "xlsx",
+                "sheet": 1,
+                "adjust_floating_point_error": True,
+                "preserve_formatting": True,
+                "infer_strategy": "strings",
+                "cast_strategy": "strings",
+            }
+        )
+    ]
+    rows, datapackage, _ = Flow(*flows).results()
+
+    assert len(rows) == 1
+    assert str(rows[0][33]["ChlaYSI"]) == "1.23"