Skip to content

Commit

Permalink
Merge pull request #189 from greavess/patch-1
Browse files Browse the repository at this point in the history
Work around for .DynamicClusterCall error
  • Loading branch information
thierrygosselin authored Jun 5, 2024
2 parents a2d63d5 + 6b2c71b commit 7e1c321
Show file tree
Hide file tree
Showing 3 changed files with 19 additions and 18 deletions.
2 changes: 1 addition & 1 deletion R/detect_paralogs.R
Original file line number Diff line number Diff line change
Expand Up @@ -236,7 +236,7 @@ detect_paralogs <- function(

# Extract the depth/coverage info from GDS -----------------------------------
if (verbose) message("Extracting coverage...")
depth.info <- extract_coverage(gds = data, individuals = FALSE, coverage.stats = "sum") %>%
depth.info <- extract_coverage(gds = data, individuals = FALSE, coverage.stats = "sum", parallel.core = parallel.core) %>%
dplyr::mutate(dplyr::across(where(is.factor), .fns = as.character)) %>%
dplyr::left_join(
gds2tidy(gds = data, parallel.core = parallel.core) %>%
Expand Down
4 changes: 2 additions & 2 deletions R/filter_ma.R
Original file line number Diff line number Diff line change
Expand Up @@ -922,7 +922,8 @@ minor_allele_stats <- function(
ad = TRUE,
coverage.stats = "sum",
subsample.info = 1,
verbose = FALSE
verbose = FALSE,
parallel.core = parallel.core
) %$%
m.info
} else {
Expand Down Expand Up @@ -1103,4 +1104,3 @@ ma_one <- carrier::crate(function(x) {
mac.data$MAC_GLOBAL %<>% as.integer(.)
return(mac.data)
})#End ma_one

31 changes: 16 additions & 15 deletions R/gds.R
Original file line number Diff line number Diff line change
Expand Up @@ -1099,7 +1099,8 @@ extract_coverage <- function(
ad = TRUE,
coverage.stats = c("sum", "mean", "median", "iqr"),
subsample.info = 1,
verbose = TRUE
verbose = TRUE,
parallel.core = TRUE
) {

if (verbose) cli::cli_progress_step("Coverage ...")
Expand All @@ -1112,7 +1113,8 @@ extract_coverage <- function(
dp = TRUE,
ad = TRUE,
individuals = TRUE,
markers = TRUE
markers = TRUE,
parallel.core = TRUE
) {

coverage.stats <- match.arg(
Expand All @@ -1133,7 +1135,7 @@ extract_coverage <- function(
)

if (markers) {
dp_f_m <- function(gds, coverage.stats) {
dp_f_m <- function(gds, coverage.stats, parallel.core = TRUE) {

# Using switch instead was not optimal for additional options in the func...
if (coverage.stats == "sum") rad_cov_stats <- function(x) round(sum(x, na.rm = TRUE))
Expand All @@ -1148,11 +1150,11 @@ extract_coverage <- function(
FUN = rad_cov_stats,
as.is = "integer",
margin = "by.variant",
parallel = TRUE
parallel = parallel.core
)
}

dp.m <- purrr::map_dfc(.x = coverage.stats.l, .f = dp_f_m, gds = gds)
dp.m <- purrr::map_dfc(.x = coverage.stats.l, .f = dp_f_m, gds = gds, parallel.core = parallel.core)
}

if (individuals) {
Expand Down Expand Up @@ -1271,7 +1273,8 @@ extract_coverage <- function(
dp = dp,
ad = ad,
individuals = individuals,
markers = markers
markers = markers,
parallel.core = parallel.core
)

# required for individuals and markers
Expand Down Expand Up @@ -2319,7 +2322,7 @@ generate_stats <- function(
if (!rlang::has_name(m.info, "HET_OBS") || force.stats) {
m.info %<>%
dplyr::mutate(
HET_OBS = round(markers_het(gds), 6),
HET_OBS = round(markers_het(gds, parallel.core), 6),
FIS = round(markers_fis(gds), 6)
)
}
Expand Down Expand Up @@ -2540,7 +2543,7 @@ generate_stats <- function(
}

if (markers) {
dp_f_m <- function(gds, coverage.stats, dart.data) {
dp_f_m <- function(gds, coverage.stats, dart.data, parallel.core = TRUE) {
# Using switch instead was not optimal for additional options in the func...
if (coverage.stats == "sum") rad_cov_stats <- function(x) round(sum(x, na.rm = TRUE))
if (coverage.stats == "mean") rad_cov_stats <- function(x) round(mean(x, na.rm = TRUE))
Expand All @@ -2558,13 +2561,13 @@ generate_stats <- function(
FUN = rad_cov_stats,
as.is = "integer",
margin = "by.variant",
parallel = TRUE
parallel = parallel.core
)
}
return(x)
}

dp.m <- purrr::map_dfc(.x = coverage.stats.l, .f = dp_f_m, gds = gds, dart.data = dart.data)
dp.m <- purrr::map_dfc(.x = coverage.stats.l, .f = dp_f_m, gds = gds, dart.data = dart.data, parallel.core = parallel.core)
}

if (individuals) {
Expand Down Expand Up @@ -2860,7 +2863,7 @@ generate_stats <- function(
corr.info <- stringi::stri_join(corr.info, cmt)
}
if (coverage) {
if (stats::sd(i.info$COVERAGE_MEAN) != 0) {
if (stats::sd(i.info$COVERAGE_MEAN, na.rm = TRUE) != 0) {
cc <- ceiling(stats::cor(i.info$COVERAGE_TOTAL, i.info$COVERAGE_MEAN, use = "pairwise.complete.obs") * 100) / 100
} else {
cc <- "NA"
Expand Down Expand Up @@ -3061,15 +3064,15 @@ individual_het <- function(gds) {
#' @rdname markers_het
#' @keywords internal
#' @export
markers_het <- function(gds) {
markers_het <- function(gds, parallel.core = TRUE) {
# PLAN A
SeqArray::seqApply(
gdsfile = gds,
var.name = "$dosage_alt",
FUN = function(x) sum(x == 1, na.rm = TRUE) / sum(!is.na(x)),
margin = "by.variant",
as.is = "double",
parallel = TRUE
parallel = parallel.core
)
# PLAN B
# not faster... strange because for sample it is faster...
Expand Down Expand Up @@ -3360,5 +3363,3 @@ write_gds <- function(
if (open) data.gds <- read_rad(data.gds, verbose = FALSE)
return(data.gds)
} # End write_gds


0 comments on commit 7e1c321

Please sign in to comment.