We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents bbadb72 + 68f1d95 · commit ae242dd · Copy full SHA for ae242dd
app/etl/transform.py
@@ -22,11 +22,14 @@ def transform(df: pd.DataFrame) -> pd.DataFrame:
22
23
# Handle duplicates
24
initial_rows = len(df_transformed)
25
- # TODO (Find & Fix): Duplicates are not removed
+ # Removing duplicates
26
+ df_transformed=df_transformed.drop_duplicates()
27
+
28
duplicates_removed = initial_rows - len(df_transformed)
29
if duplicates_removed > 0:
- # TODO (Find & Fix): Should log how many duplicates were removed
- pass
30
+ # Number of duplicates removed
31
+ print(f"✅ Removed {duplicates_removed} duplicate rows.")
32
33
34
# Handle null values in numeric columns
35
numeric_columns = df_transformed.select_dtypes(include=['number']).columns
0 commit comments