cmu-delphi
diff --git a/‎DESCRIPTION
Lines changed: 1 addition & 1 deletion b/‎DESCRIPTION
Lines changed: 1 addition & 1 deletion
diff --git a/‎NAMESPACE
Lines changed: 2 additions & 22 deletions b/‎NAMESPACE
Lines changed: 2 additions & 22 deletions
diff --git a/‎R/dist_quantiles.R
Lines changed: 31 additions & 228 deletions b/‎R/dist_quantiles.R
Lines changed: 31 additions & 228 deletions
@@ -36,7 +36,7 @@ Imports:
     generics,
     ggplot2,
     glue,
-    hardhat (>= 1.3.0),
+    hardhat (>= 1.4.0.9002),
     lifecycle,
     lubridate,
     magrittr,
 
@@ -2,8 +2,6 @@
 
 S3method(Add_model,epi_workflow)
 S3method(Add_model,workflow)
-S3method(Math,dist_quantiles)
-S3method(Ops,dist_quantiles)
 S3method(Remove_model,epi_workflow)
 S3method(Remove_model,workflow)
 S3method(Update_model,epi_workflow)
@@ -48,13 +46,9 @@ S3method(fit,epi_workflow)
 S3method(flusight_hub_formatter,canned_epipred)
 S3method(flusight_hub_formatter,data.frame)
 S3method(forecast,epi_workflow)
-S3method(format,dist_quantiles)
-S3method(is.na,dist_quantiles)
-S3method(is.na,distribution)
 S3method(key_colnames,epi_workflow)
 S3method(key_colnames,recipe)
-S3method(mean,dist_quantiles)
-S3method(median,dist_quantiles)
+S3method(mean,quantile_pred)
 S3method(predict,epi_workflow)
 S3method(predict,flatline)
 S3method(prep,check_enough_train_data)
@@ -101,7 +95,7 @@ S3method(print,step_lag_difference)
 S3method(print,step_naomit)
 S3method(print,step_population_scaling)
 S3method(print,step_training_window)
-S3method(quantile,dist_quantiles)
+S3method(quantile,quantile_pred)
 S3method(refresh_blueprint,default_epi_recipe_blueprint)
 S3method(residuals,flatline)
 S3method(run_mold,default_epi_recipe_blueprint)
@@ -125,8 +119,6 @@ S3method(tidy,check_enough_train_data)
 S3method(tidy,frosting)
 S3method(tidy,layer)
 S3method(update,layer)
-S3method(vec_ptype_abbr,dist_quantiles)
-S3method(vec_ptype_full,dist_quantiles)
 S3method(weighted_interval_score,default)
 S3method(weighted_interval_score,dist_default)
 S3method(weighted_interval_score,dist_quantiles)
@@ -160,7 +152,6 @@ export(climate_args_list)
 export(climatological_forecaster)
 export(default_epi_recipe_blueprint)
 export(detect_layer)
-export(dist_quantiles)
 export(epi_recipe)
 export(epi_recipe_blueprint)
 export(epi_workflow)
@@ -230,7 +221,6 @@ export(update_frosting)
 export(update_model)
 export(validate_layer)
 export(weighted_interval_score)
-import(distributional)
 import(epidatasets)
 import(epiprocess)
 import(parsnip)
@@ -325,14 +315,11 @@ importFrom(rlang,list2)
 importFrom(rlang,set_names)
 importFrom(rlang,sym)
 importFrom(stats,as.formula)
-importFrom(stats,family)
 importFrom(stats,lm)
-importFrom(stats,median)
 importFrom(stats,model.frame)
 importFrom(stats,na.omit)
 importFrom(stats,poly)
 importFrom(stats,predict)
-importFrom(stats,qnorm)
 importFrom(stats,quantile)
 importFrom(stats,residuals)
 importFrom(tibble,as_tibble)
@@ -346,13 +333,6 @@ importFrom(tidyr,pivot_wider)
 importFrom(tidyr,unnest)
 importFrom(tidyselect,all_of)
 importFrom(utils,capture.output)
-importFrom(vctrs,as_list_of)
-importFrom(vctrs,field)
-importFrom(vctrs,new_rcrd)
-importFrom(vctrs,new_vctr)
 importFrom(vctrs,vec_cast)
 importFrom(vctrs,vec_data)
-importFrom(vctrs,vec_ptype_abbr)
-importFrom(vctrs,vec_ptype_full)
-importFrom(vctrs,vec_recycle_common)
 importFrom(workflows,extract_preprocessor)
@@ -1,209 +1,68 @@
-#' @importFrom vctrs field vec_cast new_rcrd
-new_quantiles <- function(values = double(1), quantile_levels = double(1)) {
-  arg_is_probabilities(quantile_levels)
-
-  vec_cast(values, double())
-  vec_cast(quantile_levels, double())
-  values <- unname(values)
-  if (length(values) == 0L) {
-    return(new_rcrd(
-      list(
-        values = rep(NA_real_, length(quantile_levels)),
-        quantile_levels = quantile_levels
-      ),
-      class = c("dist_quantiles", "dist_default")
-    ))
-  }
-  stopifnot(length(values) == length(quantile_levels))
-
-  stopifnot(!vctrs::vec_duplicate_any(quantile_levels))
-  if (is.unsorted(quantile_levels)) {
-    o <- vctrs::vec_order(quantile_levels)
-    values <- values[o]
-    quantile_levels <- quantile_levels[o]
-  }
-  if (is.unsorted(values, na.rm = TRUE)) {
-    cli_abort("`values[order(quantile_levels)]` produces unsorted quantiles.")
-  }
-
-  new_rcrd(list(values = values, quantile_levels = quantile_levels),
-    class = c("dist_quantiles", "dist_default")
-  )
-}
-
-
-
-#' @importFrom vctrs vec_ptype_abbr vec_ptype_full
-#' @export
-vec_ptype_abbr.dist_quantiles <- function(x, ...) "dist_qntls"
-#' @export
-vec_ptype_full.dist_quantiles <- function(x, ...) "dist_quantiles"
-
-#' @export
-format.dist_quantiles <- function(x, digits = 2, ...) {
-  m <- suppressWarnings(median(x))
-  paste0("quantiles(", round(m, digits), ")[", vctrs::vec_size(x), "]")
-}
-
-
-#' A distribution parameterized by a set of quantiles
-#'
-#' @param values A vector (or list of vectors) of values.
-#' @param quantile_levels A vector (or list of vectors) of probabilities
-#'   corresponding to `values`.
-#'
-#' When creating multiple sets of `values`/`quantile_levels` resulting in
-#' different distributions, the sizes must match. See the examples below.
-#'
-#' @return A vector of class `"distribution"`.
-#'
-#' @export
-#'
-#' @examples
-#' dist_quantiles(1:4, 1:4 / 5)
-#' dist_quantiles(list(1:3, 1:4), list(1:3 / 4, 1:4 / 5))
-#' dstn <- dist_quantiles(list(1:4, 8:11), c(.2, .4, .6, .8))
-#' dstn
-#'
-#' quantile(dstn, p = c(.1, .25, .5, .9))
-#' median(dstn)
-#'
-#' # it's a bit annoying to inspect the data
-#' distributional::parameters(dstn[1])
-#' nested_quantiles(dstn[1])[[1]]
-#'
-#' @importFrom vctrs as_list_of vec_recycle_common new_vctr
-dist_quantiles <- function(values, quantile_levels) {
-  if (!is.list(quantile_levels)) {
-    assert_numeric(quantile_levels, lower = 0, upper = 1, any.missing = FALSE, min.len = 1L)
-    quantile_levels <- list(quantile_levels)
-  }
-  if (!is.list(values)) {
-    if (length(values) == 0L) values <- NA_real_
-    values <- list(values)
-  }
-
-  values <- as_list_of(values, .ptype = double())
-  quantile_levels <- as_list_of(quantile_levels, .ptype = double())
-  args <- vec_recycle_common(values = values, quantile_levels = quantile_levels)
-
-  qntls <- as_list_of(
-    map2(args$values, args$quantile_levels, new_quantiles),
-    .ptype = new_quantiles(NA_real_, 0.5)
-  )
-  new_vctr(qntls, class = "distribution")
-}
-
-validate_dist_quantiles <- function(values, quantile_levels) {
-  map(quantile_levels, arg_is_probabilities)
-  common_length <- vctrs::vec_size_common( # aborts internally
-    values = values,
-    quantile_levels = quantile_levels
-  )
-  length_diff <- vctrs::list_sizes(values) != vctrs::list_sizes(quantile_levels)
-  if (any(length_diff)) {
-    cli_abort(c(
-      "`values` and `quantile_levels` must have common length.",
-      i = "Mismatches found at position(s): {.val {which(length_diff)}}."
-    ))
-  }
-  level_duplication <- map_lgl(quantile_levels, vctrs::vec_duplicate_any)
-  if (any(level_duplication)) {
-    cli_abort(c(
-      "`quantile_levels` must not be duplicated.",
-      i = "Duplicates found at position(s): {.val {which(level_duplication)}}."
-    ))
-  }
-}
-
-
-is_dist_quantiles <- function(x) {
-  is_distribution(x) & all(stats::family(x) == "quantiles")
-}
-
-
-
-#' @export
-#' @importFrom stats median qnorm family
-median.dist_quantiles <- function(x, na.rm = FALSE, ..., middle = c("cubic", "linear")) {
-  quantile_levels <- field(x, "quantile_levels")
-  values <- field(x, "values")
-  # we have exactly that quantile
-  if (0.5 %in% quantile_levels) {
-    return(values[match(0.5, quantile_levels)])
-  }
-  # if there's only 1 quantile_level (and it isn't 0.5), or the smallest quantile is larger than 0.5 or the largest smaller than 0.5, or if every value is NA, return NA
-  if (length(quantile_levels) < 2 || min(quantile_levels) > 0.5 || max(quantile_levels) < 0.5 || all(is.na(values))) {
-    return(NA)
-  }
-  if (length(quantile_levels) < 3 || min(quantile_levels) > .25 || max(quantile_levels) < .75) {
-    return(stats::approx(quantile_levels, values, xout = 0.5)$y)
-  }
-  quantile(x, 0.5, ..., middle = middle)
-}
 
 # placeholder to avoid errors, but not ideal
 #' @export
-mean.dist_quantiles <- function(x, na.rm = FALSE, ..., middle = c("cubic", "linear")) {
-  median(x, ..., middle = middle)
+mean.quantile_pred <- function(x, na.rm = FALSE, ...) {
+  stats::median(x, ...) # namespaced: this patch drops importFrom(stats, median)
 }
 
 #' @export
 #' @importFrom stats quantile
-#' @import distributional
-quantile.dist_quantiles <- function(x, p, ..., middle = c("cubic", "linear")) {
+quantile.quantile_pred <- function(x, p, ..., middle = c("cubic", "linear")) {
   arg_is_probabilities(p)
   p <- sort(p)
-  middle <- match.arg(middle)
+  middle <- rlang::arg_match(middle)
   quantile_extrapolate(x, p, middle)
 }
 
 
 quantile_extrapolate <- function(x, tau_out, middle) {
-  tau <- field(x, "quantile_levels")
-  qvals <- field(x, "values")
-  nas <- is.na(qvals)
-  if (all(nas)) {
-    return(rep(NA, times = length(tau_out)))
-  }
-  qvals_out <- rep(NA, length(tau_out))
-  qvals <- qvals[!nas]
-  tau <- tau[!nas]
+  tau <- x %@% "quantile_levels"
+  qvals <- as.matrix(x)
 
   # short circuit if we aren't actually extrapolating
   # matches to ~15 decimals
   if (all(tau_out %in% tau)) {
-    return(qvals[match(tau_out, tau)])
+    return(hardhat::quantile_pred(
+      qvals[, match(tau_out, tau), drop = FALSE], tau_out
+    ))
   }
   if (length(tau) < 2) {
-    cli_abort(
-      "Quantile extrapolation is not possible with fewer than 2 quantiles."
-    )
-    return(qvals_out)
+    cli_abort(paste(
+      "Quantile extrapolation is not possible when fewer than 2 quantiles",
+      "are available."
+    ))
   }
+  qvals_out <- map(
+    vctrs::vec_chop(qvals),
+    ~ extrapolate_quantiles_single(.x, tau, tau_out, middle)
+  ) # a list (one entry per row of qvals); bound into a matrix below
 
+  hardhat::quantile_pred(do.call(rbind, qvals_out), tau_out)
+}
+
+extrapolate_quantiles_single <- function(qvals, tau, tau_out, middle) {
   indl <- tau_out < min(tau)
   indr <- tau_out > max(tau)
   indm <- !indl & !indr
+  qvals_out <- rep(NA, length(tau_out))
 
   if (middle == "cubic") {
     method <- "cubic"
-    result <- tryCatch(
-      {
-        Q <- stats::splinefun(tau, qvals, method = "hyman")
-        quartiles <- Q(c(.25, .5, .75))
-      },
-      error = function(e) {
-        return(NA)
-      }
-    )
+    result <- tryCatch({
+      Q <- stats::splinefun(tau, qvals, method = "hyman")
+      quartiles <- Q(c(.25, .5, .75))
+    },
+    error = function(e) {
+      return(NA)
+    })
   }
   if (middle == "linear" || any(is.na(result))) {
     method <- "linear"
     quartiles <- stats::approx(tau, qvals, c(.25, .5, .75))$y
   }
   if (any(indm)) {
-    qvals_out[indm] <- switch(method,
+    qvals_out[indm] <- switch(
+      method,
       linear = stats::approx(tau, qvals, tau_out[indm])$y,
       cubic = Q(tau_out[indm])
     )
@@ -242,59 +101,3 @@ tail_extrapolate <- function(tau_out, qv) {
   m <- diff(y) / diff(x)
   m * (x0 - x[1]) + y[1]
 }
-
-
-#' @method Math dist_quantiles
-#' @export
-Math.dist_quantiles <- function(x, ...) {
-  quantile_levels <- field(x, "quantile_levels")
-  values <- field(x, "values")
-  values <- vctrs::vec_math(.Generic, values, ...)
-  new_quantiles(values = values, quantile_levels = quantile_levels)
-}
-
-#' @method Ops dist_quantiles
-#' @export
-Ops.dist_quantiles <- function(e1, e2) {
-  is_quantiles <- c(
-    inherits(e1, "dist_quantiles"),
-    inherits(e2, "dist_quantiles")
-  )
-  is_dist <- c(inherits(e1, "dist_default"), inherits(e2, "dist_default"))
-  tau1 <- tau2 <- NULL
-  if (is_quantiles[1]) {
-    q1 <- field(e1, "values")
-    tau1 <- field(e1, "quantile_levels")
-  }
-  if (is_quantiles[2]) {
-    q2 <- field(e2, "values")
-    tau2 <- field(e2, "quantile_levels")
-  }
-  tau <- union(tau1, tau2)
-  if (all(is_dist)) {
-    cli_abort(
-      "You can't perform arithmetic between two distributions like this."
-    )
-  } else {
-    if (is_quantiles[1]) {
-      q2 <- e2
-    } else {
-      q1 <- e1
-    }
-  }
-  q <- vctrs::vec_arith(.Generic, q1, q2)
-  new_quantiles(values = q, quantile_levels = tau)
-}
-
-#' @method is.na distribution
-#' @export
-is.na.distribution <- function(x) {
-  sapply(vec_data(x), is.na)
-}
-
-#' @method is.na dist_quantiles
-#' @export
-is.na.dist_quantiles <- function(x) {
-  q <- field(x, "values")
-  all(is.na(q))
-}