Skip to content

Commit

Permalink
fix pyspark logic
Browse files (browse the repository at this point in the history)
  • Loading branch information
uche-madu committed Oct 18, 2023
1 parent 734a3cc commit d8f9cec
Showing 1 changed file with 5 additions and 2 deletions.
7 changes: 5 additions & 2 deletions pyspark-scripts/config.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,9 @@
from dags.user_analytics import BUCKET_NAME


# Base name that every path below is prefixed with; the value carries no URI
# scheme. NOTE(review): presumably a GCS bucket name — confirm.
GCS_BUCKET = "deb-capstone"
# Prefix for the movie-review data: "<GCS_BUCKET>/project-data/movie_reviews".
MOVIE_FILES = "{}/project-data/movie_reviews".format(GCS_BUCKET)
# NOTE(review): MOVIES_METADATA_FILE_PATH is assigned twice in this view. Both
# expressions evaluate to the same string,
# "deb-capstone/project-data/movie_reviews/processed_files_metadata.txt": the
# first derives it from MOVIE_FILES, the second spells the whole path out from
# GCS_BUCKET, and the second assignment is the one that takes effect. The two
# lines look like the removed and added sides of the diff hunk above (the +/-
# markers are not visible here) — confirm before treating the repetition as a
# defect in config.py itself.
MOVIES_METADATA_FILE_PATH = "{}/processed_files_metadata.txt".format(MOVIE_FILES)
MOVIES_METADATA_FILE_PATH = "{}/project-data/movie_reviews/processed_files_metadata.txt".format(GCS_BUCKET)
# "<GCS_BUCKET>/models/sentiment_spark_nlp".
# NOTE(review): presumably where the sentiment model is stored — confirm.
MODEL_DIR = "{}/models/sentiment_spark_nlp".format(GCS_BUCKET)

# My HuggingFace sentiment model fine-tuned using IMDb movie reviews dataset.
@@ -15,4 +18,4 @@
# NOTE(review): presumably a BigQuery table name, going by the BQ_ prefix —
# confirm against the code that consumes it.
BQ_LOG_REVIEWS_TABLE = "review_logs"

# Prefix for the log-review data: "<GCS_BUCKET>/project-data/log_reviews".
# GCS_BUCKET is defined earlier in the module, outside this hunk.
LOG_FILES = "{}/project-data/log_reviews".format(GCS_BUCKET)
# NOTE(review): LOG_METADATA_FILE_PATH is assigned twice in this view. Both
# expressions produce "<GCS_BUCKET>/project-data/log_reviews/processed_files_metadata.txt":
# the first derives it from LOG_FILES, the second builds the whole path from
# GCS_BUCKET, and the second assignment is the one that takes effect. The two
# lines look like the removed and added sides of this diff hunk (the +/-
# markers are not visible here) — confirm before treating the repetition as a
# defect in config.py itself.
LOG_METADATA_FILE_PATH = "{}/processed_files_metadata.txt".format(LOG_FILES)
LOG_METADATA_FILE_PATH = "{}/project-data/log_reviews/processed_files_metadata.txt".format(GCS_BUCKET)

0 comments on commit d8f9cec

Please sign in to comment.