# run-hydra-pspec.py
import numpy as np
import scipy.special
from pathlib import Path
from pprint import pprint
from resource import getrusage, RUSAGE_SELF
import os
import time
import sys
import json
from jsonargparse import ArgumentParser, ActionConfigFile
from jsonargparse.typing import Path_fr, Path_dw
from pyuvdata import UVData
from astropy.units import Quantity
import hydra_pspec as hp
from hydra_pspec.utils import (
form_pseudo_stokes_vis,
filter_freqs,
get_git_version_info,
add_mtime_to_filepath
)
try:
    from mpi4py import MPI
    HAVE_MPI = True
    comm = MPI.COMM_WORLD
    size = comm.Get_size()
    rank = comm.Get_rank()
except ImportError:
    HAVE_MPI = False
    print("This script requires MPI. Exiting.")
    sys.exit(1)
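# Everything below runs on every rank; data loading and output setup happen
# on rank 0 only, and the per-baseline work is scattered across ranks via MPI.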
parser = ArgumentParser()
parser.add_argument(
"--ant_str",
type=str,
default="cross",
help="Comma delimited list of antenna pairs joined by underscores, e.g. "
"'1_11,12_14'. Used via the `ant_str` kwarg in "
"`pyuvdata.UVData.select`."
)
parser.add_argument(
"--sigcov0",
type=str,
help="Path to a single file or a directory containing a per-baseline "
"initial guess for the EoR signal covariance. Files must be readable "
"by `np.load`."
)
parser.add_argument(
"--sigcov0_file",
type=str,
help="If passing a directory containing per-baseline initial guesses for "
"the EoR signal covariance to --sigcov0, --sigcov0_file specifies the"
" name of the file to load in each baseline's subdirectory."
)
parser.add_argument(
"--Nfgmodes",
type=int,
default=8,
help="Number of FG eigenmodes for FG model."
)
parser.add_argument(
"--fgmodes",
type=str,
help="Path to a single file or a directory containing per-baseline FG "
"model basis vector arrays with shape (Nfreqs, Nmodes). Files must "
"be readable by `np.load`."
)
parser.add_argument(
"--fgmodes_file",
type=str,
help="If passing a directory containing per-baseline FG eigenvectors to "
"--fgmodes, --fgmodes_file specifies the name of the file to load "
" in each baseline's subdirectory."
)
parser.add_argument(
"--freq_range",
type=str,
help="Frequencies to use in the data. Can be either a single frequency, "
"a comma delimited list of frequencies ('100,110,150'), or a minimum"
" and maximum frequency joined by '-' ('100-200'). Frequency string"
" cannot contain spaces."
)
parser.add_argument(
"--flags",
type=str,
help="Path to a single file or a directory containing per-baseline flags. "
"Files must be readable by `np.load` and must have the same shape as "
"the visibilities for a single baseline being analyzed. The flags "
"must be a boolean array where True and False correspond to flagged "
"(unused) and unflagged (used) data, respectively."
)
parser.add_argument(
"--flags_file",
type=str,
help="If passing a directory containing per-baseline flags to --flags, "
"--flags_file specifies the name of the file to load in each "
"baseline's subdirectory."
)
parser.add_argument(
"--noise",
type=str,
help="Path to a single file or a directory containing per-baseline noise. "
"Files must be readable by `np.load` and must have the same shape as "
"the visibilities for a single baseline being analyzed."
)
parser.add_argument(
"--noise_file",
type=str,
help="If passing a directory containing per-baseline noise to --noise, "
"--noise_file specifies the name of the file to load in each "
"baseline's subdirectory."
)
parser.add_argument(
"--noise_cov",
type=str,
help="Path to a single file or a directory containing per-baseline noise "
"covariance matrices. Files must be readable by `np.load`."
)
parser.add_argument(
"--noise_cov_file",
type=str,
help="If passing a directory containint per-baseline noise covariance "
"matrices to --noise_cov, --noise_cov_file specifies the name of the "
"file to load in each baseline's subdirectory."
)
parser.add_argument(
"--nsamples",
type=str,
help="Path to a single file or a directory containing per-baseline "
"Nsamples arrays. Files must be readable by `np.load` and must have "
"the same shape as the visibilities for a single baseline being "
"analyzed."
)
parser.add_argument(
"--nsamples_file",
type=str,
help="If passing a directory containing per-baseline nsamples to "
"--nsamples, --nsamples_file specifies the name of the file to load "
"in each baseline's subdirectory."
)
parser.add_argument(
"--n_ps_prior_bins",
type=int,
default=3,
help="Sets the number of bins to the left and right of the delay=0 mode "
"bound by the prior (set via --ps_prior_lo and --ps_prior_hi). If "
"n_ps_prior_bins is set to 3 (default), then 3 bins to the left and"
" 3 bins to the right of the delay=0 bin will be affected by the "
"prior."
)
parser.add_argument(
"--ps_prior_lo",
type=float,
default=0.0,
help="Sets the lower bound of the prior on the delay power spectrum. "
"Defaults to 0 which corresponds to no lower bound."
)
parser.add_argument(
"--ps_prior_hi",
type=float,
default=0.0,
help="Sets the upper bound of the prior on the delay power spectrum. "
"Defaults to 0 which corresponds to no upper bound."
)
parser.add_argument(
"--map_estimate",
action="store_true",
help="Calculate the maximum a posteriori estimate only (1 iteration)."
)
parser.add_argument(
"--Niter",
type=int,
default=100,
help="Number of iterations."
)
parser.add_argument(
"--seed",
type=int,
default=None,
help="Random seed for `numpy.random.seed`."
)
parser.add_argument(
"-v", "--verbose",
dest="verbose",
action="store_true",
default=False,
help="Display debug/timing statements."
)
parser.add_argument(
"--Nproc",
type=int,
default=1,
help="Number of multiprocess threads. Defaults to 1."
)
parser.add_argument(
"--out_dir",
type=Path_dw,
default="./",
help="Path to directory for writing output(s). Defaults to './'."
)
parser.add_argument(
"--dirname",
type=str,
help="Name of subdirectory for output(s). Files will be written to "
"`Path(args.out_dir) / args.dirname`. Defaults to "
"f'results-{freqs.min()}-{freqs.max()}MHz-Niter-{Niter}'."
)
parser.add_argument(
"--clobber",
action="store_true",
default=False,
help="Clobber existing files."
)
parser.add_argument(
"--write_Niter",
type=int,
default=100,
help="Number of iterations between output file writing. Smaller numbers "
"yield more overhead for I/O. Larger numbers risk losing more "
"samples if a job fails or times out."
)
parser.add_argument(
"file_paths",
type=Path_fr,
nargs="+",
help="Path(s) to UVData compatible visibility file."
)
parser.add_argument(
'--config',
action=ActionConfigFile
)
args = parser.parse_args()
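# A minimal sketch of how this script might be launched under MPI; the rank
# count, option values, and data file name below are hypothetical examples,
# not defaults:
#
#     mpirun -n 4 python run-hydra-pspec.py \
#         --ant_str "0_1,0_2,1_2" \
#         --freq_range 100-120 \
#         --Niter 500 \
#         --out_dir ./results \
#         data.uvh5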
def check_shape(shape, d_shape, desc=""):
assert shape == d_shape, (
f"The {desc} array has shape {shape} which does not match the "
f"shape of the per-baseline data, {d_shape}."
)
def check_load_path(fp):
"""
Check if file path `fp` points to a file (load) or directory (pass).
Parameters
----------
fp : str or Path
Path to file or directory.
"""
if not isinstance(fp, Path):
fp = Path(fp)
fp_is_dir = fp.is_dir()
if fp_is_dir:
return fp_is_dir, None
else:
data = np.load(fp)
return fp_is_dir, data
def split_data_for_scatter(data: list, n_ranks: int) -> list:
"""Split a list into a list of lists for MPI scattering"""
data_length = len(data)
quot, rem = divmod(data_length, n_ranks)
    if quot == 0:
        print(
            f"Error: Number of baselines ({data_length}) should be >= "
            f"the number of MPI ranks ({n_ranks})!"
        )
        sys.stdout.flush()
        comm.Abort()
# determine the size of each sub-task
counts = [quot + 1 if n < rem else quot for n in range(n_ranks)]
# determine the starting and ending indices of each sub-task
starts = [sum(counts[:n]) for n in range(n_ranks)]
ends = [sum(counts[:n + 1]) for n in range(n_ranks)]
    # convert the data into a list of sublists, one per rank
scatter_data = [data[starts[n]:ends[n]] for n in range(n_ranks)]
return scatter_data
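# Worked example of the split above: 7 items over 3 ranks gives
# counts = [3, 2, 2], so
#     split_data_for_scatter(list(range(7)), 3) == [[0, 1, 2], [3, 4], [5, 6]]
# (the first `rem` ranks each receive one extra item).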
if rank == 0:
time_load_start = time.perf_counter()
if "config" in args.__dict__:
print(f"Loading config file {str(args.config[0])}", end="\n\n")
pprint(args.__dict__)
print()
    if not args.file_paths:
        print("Must pass file(s) to analyze via the file_paths positional argument. Exiting.")
        sys.stdout.flush()
        comm.Abort()
else:
file_paths = sorted([Path(fp) for fp in args.file_paths])
nfiles = len(file_paths)
print(f"Reading {nfiles} file(s)")
uvd = UVData()
if args.freq_range:
uvd.read(file_paths[0], read_data=False)
freqs_in = uvd.freq_array
        if not uvd.future_array_shapes:
            # Remove the length-1 Nspws axis (old array shapes)
            freqs_in = freqs_in[0]
freqs_in = Quantity(freqs_in, unit="Hz")
freqs_to_keep = filter_freqs(args.freq_range, freqs_in)
freqs_to_keep = freqs_to_keep.to("Hz").value
else:
freqs_to_keep = None
uvd.read(file_paths, ant_str=args.ant_str, frequencies=freqs_to_keep)
uvd.conjugate_bls()
    # Sum XX and YY polarizations to obtain pseudo-Stokes I (pI)
    # visibilities and store them in the XX polarization
    uvd = form_pseudo_stokes_vis(uvd)
Nfreqs = uvd.Nfreqs
freqs = uvd.freq_array
    if not uvd.future_array_shapes:
        freqs = freqs[0]
freqs = Quantity(freqs, unit="Hz")
freq_str = (
f"{freqs.min().to('MHz').value:.3f}-"
+ f"{freqs.max().to('MHz').value:.3f}MHz"
)
# Output file set up
out_dir = Path(args.out_dir)
if not args.dirname:
out_dir /= f"results-{freq_str}-Niter-{args.Niter}"
else:
if args.map_estimate:
out_dir /= args.dirname + "-map-estimate"
else:
out_dir /= args.dirname
    if out_dir.exists() and not args.clobber:
        # Avoid overwriting existing outputs: add_mtime_to_filepath renames
        # the existing directory (appending its modification time to the
        # path) so a fresh directory can be created below
        add_mtime_to_filepath(out_dir)
out_dir.mkdir(exist_ok=True, parents=True)
print(f"\nWriting output(s) to {out_dir.absolute()}", end="\n\n")
results_dir = out_dir
# Catalog git version
    try:
        git_info = get_git_version_info()
    except Exception:
        git_info = ""
with open(out_dir / "git.json", "w") as f:
json.dump(git_info, f, indent=2)
# Catalog command line arguments
if args.clobber and os.path.isfile(out_dir / "args.json"):
# Remove existing file if clobber=True
os.remove(out_dir / "args.json")
parser.save(args, out_dir / "args.json", format="json_indented", skip_none=False)
if "SLURM_JOB_ID" in os.environ:
# If running in SLURM, create empty file named with the SLURM Job ID
(out_dir / os.environ["SLURM_JOB_ID"]).touch()
all_data_weights = []
for i_bl, antpair in enumerate(uvd.get_antpairs()):
bl_str = f"{antpair[0]}-{antpair[1]}"
# Get visibility data with shape (Ntimes, Nfreqs)
# pI visibilities stored in the XX polarization
d = uvd.get_data(antpair + ("xx",), force_copy=True)
bl_data_shape = d.shape
cov_ff_shape = (Nfreqs, Nfreqs)
fgmodes_shape = (Nfreqs, args.Nfgmodes)
if args.flags:
flags_path = Path(args.flags)
flags_path_is_dir, flags = check_load_path(flags_path)
if flags_path_is_dir:
bl_flags_path = flags_path / bl_str / args.flags_file
flags = np.load(bl_flags_path)
                check_shape(flags.shape, bl_data_shape, desc="flags")
else:
# FIXME: there is nothing currently in place to handle flags which
# differ between polarizations in `form_pseudo_stokes_vis`.
# Differing flags should be accounted for in the future, possibly
# via Nsamples.
flags = uvd.get_flags(antpair + ("xx",))
if args.nsamples:
nsamples_path = Path(args.nsamples)
nsamples_path_is_dir, nsamples = check_load_path(nsamples_path)
if nsamples_path_is_dir:
bl_nsamples_path = nsamples_path / bl_str / args.nsamples_file
nsamples = np.load(bl_nsamples_path)
                check_shape(nsamples.shape, bl_data_shape, desc="nsamples")
else:
nsamples = None
if args.noise:
noise_path = Path(args.noise)
noise_path_is_dir, noise = check_load_path(noise_path)
if noise_path_is_dir:
bl_noise_path = noise_path / bl_str / args.noise_file
noise = np.load(bl_noise_path)
                check_shape(noise.shape, bl_data_shape, desc="noise")
if nsamples is not None:
# Approximate the reduction in the noise from averaging
# together many data points by dividing by Nsamples
noise /= np.sqrt(nsamples)
# If passing an array of noise, the data should be noiseless
d += noise
if args.sigcov0:
sigcov0_path = Path(args.sigcov0)
sigcov0_path_is_dir, sigcov0 = check_load_path(sigcov0_path)
if sigcov0_path_is_dir:
bl_sigcov0_path = sigcov0_path / bl_str / args.sigcov0_file
sigcov0 = np.load(bl_sigcov0_path)
check_shape(sigcov0.shape, cov_ff_shape, desc="signal covariance")
else:
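            # Default initial guess: identity signal covariance (unit
            # variance, no frequency-frequency correlations)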
sigcov0 = np.eye(Nfreqs)
if args.noise_cov:
noise_cov_path = Path(args.noise_cov)
noise_cov_path_is_dir, noise_cov = check_load_path(noise_cov_path)
if noise_cov_path_is_dir:
bl_noise_cov_path = (
noise_cov_path / bl_str / args.noise_cov_file
)
noise_cov = np.load(bl_noise_cov_path)
check_shape(noise_cov.shape, cov_ff_shape, desc="noise covariance")
Ninv = np.linalg.inv(noise_cov)
else:
Ninv = np.eye(Nfreqs) / (10.)**2. # FIXME
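            # The fallback above is the inverse covariance of i.i.d. noise
            # with a hard-coded rms of 10 (in the data units): N = sigma^2 I
            # implies Ninv = I / sigma^2 with sigma = 10.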
if args.fgmodes:
fgmodes_path = Path(args.fgmodes)
fgmodes_path_is_dir, fgmodes = check_load_path(fgmodes_path)
if fgmodes_path_is_dir:
if not args.fgmodes_file:
# Look for a file with the default filename from
# hydra-pspec/scripts/calc-vis-cov-matrices.py
fgmodes_path = (
fgmodes_path / bl_str / f"evecs-{freq_str}.npy"
)
else:
fgmodes_path = fgmodes_path / bl_str / args.fgmodes_file
fgmodes = np.load(fgmodes_path)
fgmodes = fgmodes[:, :args.Nfgmodes]
check_shape(fgmodes.shape, fgmodes_shape, desc="fgmodes")
else:
# Generate approximate set of FG modes from Legendre polynomials
fgmodes = np.array([
scipy.special.legendre(i)(np.linspace(-1., 1., freqs.size))
for i in range(args.Nfgmodes)
]).T
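            # scipy.special.legendre(i) returns the degree-i Legendre
            # polynomial P_i as a callable; evaluating each on a regular grid
            # over [-1, 1] gives one smooth spectral basis vector per FG
            # mode, so `fgmodes` has shape (Nfreqs, Nfgmodes).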
bl_data_weights = {
"antpair": antpair,
"d": d,
"w": flags,
"fgmodes": fgmodes,
"S_initial": sigcov0,
"Ninv": Ninv,
"out_dir": out_dir
}
        if args.noise_cov:
            bl_data_weights["N"] = noise_cov
all_data_weights.append(bl_data_weights)
all_data_weights = split_data_for_scatter(all_data_weights, size)
time_load_end = time.perf_counter()
time_load = time_load_end - time_load_start
else:
all_data_weights = None
# Send per-baseline visibilities to each process
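# On the root rank, `all_data_weights` must be a sequence of length `size`;
# each rank receives one element (mpi4py's scatter defaults to root=0)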
list_of_baselines = comm.scatter(all_data_weights)
if rank == 0:
time_scatter_end = time.perf_counter()
time_scatter = time_scatter_end - time_load_end
write_times = []
ant_pairs = []
for data in list_of_baselines:
antpair = data["antpair"]
d = data["d"]
w = ~data["w"]
fgmodes = data["fgmodes"]
S_initial = data["S_initial"]
Ninv = data["Ninv"]
# Create a subdirectory in out_dir for each baseline
out_dir = data["out_dir"]
bl_str = f"{antpair[0]}-{antpair[1]}"
out_dir /= bl_str
out_dir.mkdir(exist_ok=True, parents=True)
# Power spectrum prior
# This has shape (2, Ndelays). The first dimension is for the upper and
# lower prior bounds respectively. If the prior for a given delay is
# set to zero, no prior is applied. Otherwise, the solution is restricted
# to be within the range ps_prior[1] < soln < ps_prior[0].
Nfreqs = d.shape[1]
ps_prior = np.zeros((2, Nfreqs))
if args.ps_prior_lo != 0 or args.ps_prior_hi != 0:
ps_prior_inds = slice(
Nfreqs//2 - args.n_ps_prior_bins,
Nfreqs//2 + args.n_ps_prior_bins + 1
)
ps_prior[0, ps_prior_inds] = args.ps_prior_hi
ps_prior[1, ps_prior_inds] = args.ps_prior_lo
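        # Example: with Nfreqs = 16 and n_ps_prior_bins = 3 (the default),
        # ps_prior_inds is slice(5, 12), i.e. the central delay bin (index 8)
        # plus three bins on either side receive the prior bounds.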
if rank == 0:
verbose = args.verbose
else:
verbose = False
if verbose:
print("Printing status messages for:")
print(f"Rank: {rank}")
print(f"Baseline: {antpair}", end="\n\n")
    # Calculate time-independent flags: keep a channel only if it is
    # unflagged at *every* time (equivalent to looping over channels and
    # checking whether any time is flagged)
    w_any = np.all(w, axis=0)
# Run Gibbs sampler
signal_cr, signal_S, signal_ps, fg_amps, chisq, ln_post, write_time = \
hp.pspec.gibbs_sample_with_fg(
d,
w_any, # FIXME: add functionality for time-dependent flags
S_initial,
fgmodes,
Ninv,
ps_prior,
Niter=args.Niter,
seed=args.seed,
map_estimate=args.map_estimate,
verbose=verbose,
nproc=args.Nproc,
write_Niter=args.write_Niter,
out_dir=out_dir
)
    ant_pairs.append(f"{antpair[0]}_{antpair[1]}")
write_times.append(write_time)
write_timings = {"rank": rank, "ant_pairs": ant_pairs, "write_times": write_times}
gathered_write_timings = comm.gather(write_timings)
pre_barrier = time.perf_counter()
comm.barrier()
post_barrier = time.perf_counter()
time_barrier = post_barrier - pre_barrier
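# Each rank's barrier wait time is a rough measure of load imbalance: ranks
# that finish their baselines early sit here until the slowest rank arrives.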
if rank == 0:
time_gibbs_stop = time.perf_counter()
time_gibbs = time_gibbs_stop - time_scatter_end
time_overall = time_gibbs_stop - time_load_start
timings = {}
timings["num_ranks"] = size
timings["num_baselines"] = len(uvd.get_antpairs())
timings["rank_0_timers"] = {"load_data": time_load,
"scatter": time_scatter,
"process": time_gibbs,
"barrier": time_barrier,
"total": time_overall}
timings["write_data"] = gathered_write_timings
with open(Path(results_dir, "timings.json"), "w") as f:
json.dump(timings, f, indent=2)
resources = getrusage(RUSAGE_SELF)
stats = {"ru_maxrss": resources.ru_maxrss,
"ru_utime": resources.ru_utime,
"ru_stime": resources.ru_stime
}
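    # Note: ru_maxrss is the peak resident set size of the rank-0 process
    # only; it is reported in kilobytes on Linux (bytes on macOS).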
with open(Path(results_dir, "resources.json"), "w") as f:
json.dump(stats, f, indent=2)