diff --git a/src/transform/clean.py b/src/transform/clean.py
index 0dfc348..ea4424a 100644
--- a/src/transform/clean.py
+++ b/src/transform/clean.py
@@ -18,7 +18,7 @@ def normalise_timestamps(df: pd.DataFrame, col: str) -> pd.DataFrame:
 def deduplicate(df: pd.DataFrame, key_cols: list[str]) -> pd.DataFrame:
     before = len(df)
     df = df.drop_duplicates(subset=key_cols, keep="last")
-    print(f"[clean] Dedup removed {before - len(df)} rows")
+    print(f"[clean] Deduplicated, removed {before - len(df)} rows")
     return df
 
 