Skip to content

Commit

Permalink
Symlink output files to latest dir
Browse files Browse the repository at this point in the history
  • Loading branch information
lwrubel committed Jul 29, 2024
1 parent 99e12d4 commit 2dcf8fa
Showing 1 changed file with 14 additions and 3 deletions.
17 changes: 14 additions & 3 deletions rialto_airflow/dags/harvest.py
Original file line number Diff line number Diff line change
Expand Up @@ -126,11 +126,22 @@ def pubs_to_contribs(pubs, doi_sunet_pickle, authors_csv, snapshot_dir):
return str(output)

@task()
def publish(pubs_to_contribs, merge_publications):
    """
    Publish aggregate data to JupyterHub environment.

    Points the stable paths ``<data_dir>/latest/contributions.parquet`` and
    ``<data_dir>/latest/publications.parquet`` at the files produced by the
    current run by (re)creating them as symlinks.

    Args:
        pubs_to_contribs: path that the ``contributions.parquet`` link
            should point to (presumably the output of the
            ``pubs_to_contribs`` task -- confirm against the caller).
        merge_publications: path that the ``publications.parquet`` link
            should point to (presumably the output of the
            ``merge_publications`` task -- confirm against the caller).

    Returns:
        A ``(contributions_link, publications_link)`` tuple of the link
        paths as strings.
    """
    latest_dir = Path(data_dir) / "latest"
    # symlink_to() fails if the parent directory is missing, so make sure
    # it exists (first run on a fresh data directory).
    latest_dir.mkdir(parents=True, exist_ok=True)

    contribs_path = latest_dir / "contributions.parquet"
    pubs_path = latest_dir / "publications.parquet"

    for link, target in (
        (contribs_path, pubs_to_contribs),
        (pubs_path, merge_publications),
    ):
        # Path.exists() follows symlinks and reports False for a dangling
        # link (e.g. an old snapshot was deleted), which would leave the
        # stale link in place and make symlink_to() raise FileExistsError.
        # unlink() acts on the link itself; missing_ok covers the first run.
        link.unlink(missing_ok=True)
        link.symlink_to(target)

    return str(contribs_path), str(pubs_path)

snapshot_dir = setup()

Expand All @@ -156,7 +167,7 @@ def publish(dataset):

contribs = pubs_to_contribs(pubs, doi_sunet, authors_csv, snapshot_dir)

publish(contribs)
publish(contribs, pubs)


harvest()

0 comments on commit 2dcf8fa

Please sign in to comment.