Skip to content

Commit

Permalink
hotfix: remove NaN values from ratings first
Browse files: browse the repository at this point in the history
  • Loading branch information
threnjen committed Jan 11, 2025
1 parent ef9c8ef commit 2026a81
Showing 1 changed file with 1 addition and 0 deletions.
1 change: 1 addition & 0 deletions modules/ratings_data_cleaner/main.py
Original file line number Diff line number Diff line change
Expand Up @@ -118,6 +118,7 @@ def _create_table_from_data(self, all_entries: dict[list]) -> pd.DataFrame:

def _create_quality_review_table(self, df: pd.DataFrame) -> pd.DataFrame:
"""Create a cleaned and refined table of data"""
df = df[df["value"].notna()]

df["value"] = df["value"].replace(r"[^A-Za-z0-9 ]+", "", regex=True)
df["value"] = df["value"].str.lower().apply(lambda x: filter_stopwords(x))
Expand Down

0 comments on commit 2026a81

Please sign in to comment.