From 542a9561357ed774c02d7ab87f355fefd5e9c826 Mon Sep 17 00:00:00 2001
From: Dan McGraw <daniel.e.mcgraw@usace.army.mil>
Date: Mon, 18 May 2026 11:52:20 -0600
Subject: [PATCH 1/2] Fixed bug with pmf_stage > pmf_mean. Replaced with abs()
 to prevent undefined results and flexibility for higher or lower shift. Added
 support for 3 stage input (best, low, high) as well. In this case, sigma is
 calculated from the three

---
 R/rejection_sampling.R | 139 ++++++++++++++++++++++++++++-------------
 1 file changed, 97 insertions(+), 42 deletions(-)

diff --git a/R/rejection_sampling.R b/R/rejection_sampling.R
index 8bce429..135a578 100644
--- a/R/rejection_sampling.R
+++ b/R/rejection_sampling.R
@@ -28,19 +28,26 @@ thin_samples <- function(n, z_sorted, stage_sorted) {
 #'
 #' Computes the parameters of a three-parameter lognormal distribution for use
 #' as a probabilistic maximum stage (PMF) in rejection sampling. The shift
-#' parameter defines the lower bound of the distribution.
+#' parameter defines the hard lower bound of the distribution. The function
+#' supports two modes: (1) supplying a best estimate and assuming sigma, or
+#' (2) supplying a best estimate, low, and high to solve for sigma numerically.
 #'
-#' @param pmf_shift Numeric. Lower bound (shift) of the lognormal distribution.
-#'   Must be greater than \code{pmf_mean}.
-#' @param pmf_mean Numeric. Mean of the PMF stage distribution. Must be less
-#'   than \code{pmf_shift}.
-#' @param pmf_sigma Numeric. Standard deviation on the log scale. Defaults to
-#'   \code{0.5}.
+#' @param pmf_shift Numeric. Hard lower bound (shift) of the lognormal
+#'   distribution. Must be less than all of \code{pmf_best}, \code{pmf_low},
+#'   and \code{pmf_high}.
+#' @param pmf_best Numeric. Best estimate (mean) of the PMF stage distribution.
+#' @param pmf_sigma Numeric. Standard deviation on the log scale. Required if
+#'   \code{pmf_low} and \code{pmf_high} are not supplied. Defaults to
+#'   \code{NULL}.
+#' @param pmf_low Numeric. Low estimate of PMF stage (5th percentile). Optional.
+#'   If supplied, \code{pmf_high} must also be supplied.
+#' @param pmf_high Numeric. High estimate of PMF stage (95th percentile).
+#'   Optional. If supplied, \code{pmf_low} must also be supplied.
 #'
 #' @return A named list with the following elements:
 #' \describe{
-#'   \item{pmf_shift}{Lower bound of the distribution.}
-#'   \item{pmf_mean}{Mean of the distribution.}
+#'   \item{pmf_shift}{Hard lower bound of the distribution.}
+#'   \item{pmf_best}{Best estimate of PMF stage.}
 #'   \item{pmf_sigma}{Standard deviation on the log scale.}
 #'   \item{pmf_mu}{Derived location parameter on the log scale.}
 #'   \item{pmf_p05}{5th percentile of the PMF stage distribution.}
@@ -48,37 +55,84 @@ thin_samples <- function(n, z_sorted, stage_sorted) {
 #' }
 #'
 #' @examples
-#' pmf <- pmf_stage_lognormal(pmf_shift = 1200, pmf_mean = 1150, pmf_sigma = 0.5)
-#' pmf$pmf_p05
-#' pmf$pmf_p95
+#' # Mode 1: assume sigma
+#' pmf <- pmf_stage_lognormal(pmf_shift = 239, pmf_best = 241.9, pmf_sigma = 0.5)
 #'
+#' # Mode 2: solve for sigma from low/high estimates
+#' pmf <- pmf_stage_lognormal(pmf_shift = 239, pmf_best = 241.9,
+#'                             pmf_low = 239, pmf_high = 245)
 #' @export
-pmf_stage_lognormal <- function(pmf_shift, pmf_mean, pmf_sigma = 0.5){
-  if (pmf_mean >= pmf_shift) {
-    cli::cli_abort(c(
-      "{.arg pmf_mean} must be less than {.arg pmf_shift}.",
-      "x" = "{.arg pmf_mean} is {.val {pmf_mean}} but {.arg pmf_shift} is {.val {pmf_shift}}."
-    ))
-  }
+pmf_stage_lognormal <- function(pmf_shift, pmf_best,
+                                pmf_sigma = NULL,
+                                pmf_low   = NULL,
+                                pmf_high  = NULL) {
+
+  # Use inputs to determine which functional mode.
+  # No pmf_low or pmf high? -> Must assume sigma = 0.5
+  if (!is.null(pmf_low) && !is.null(pmf_high)) {
+    if (pmf_shift > pmf_low) {
+      cli::cli_abort(c(
+        "{.arg pmf_shift} must be less than {.arg pmf_low}.",
+        "x" = "{.arg pmf_shift} is {.val {pmf_shift}} but {.arg pmf_low} is {.val {pmf_low}}."
+      ))
+    }
+    if (pmf_low >= pmf_best) {
+      cli::cli_abort(c(
+        "{.arg pmf_low} must be less than {.arg pmf_best}.",
+        "x" = "{.arg pmf_low} is {.val {pmf_low}} but {.arg pmf_best} is {.val {pmf_best}}."
+      ))
+    }
+    if (pmf_best >= pmf_high) {
+      cli::cli_abort(c(
+        "{.arg pmf_best} must be less than {.arg pmf_high}.",
+        "x" = "{.arg pmf_best} is {.val {pmf_best}} but {.arg pmf_high} is {.val {pmf_high}}."
+      ))
+    }
 
-  # Derive mu ====
-  pmf_mu    <- log(pmf_mean - pmf_shift) - (pmf_sigma^2 / 2)
+    # --- Mode 2: solve for sigma ---
+    sigma_obj <- function(sigma) {
+      mu          <- log(pmf_best - pmf_shift) - sigma^2 / 2
+      implied_p05 <- pmf_shift + qlnorm(0.05, mu, sigma)
+      implied_p95 <- pmf_shift + qlnorm(0.95, mu, sigma)
+      (implied_p05 - pmf_low)^2 + (implied_p95 - pmf_high)^2
+    }
+    pmf_sigma <- optimise(sigma_obj, interval = c(1e-6, 10))$minimum
+
+  } else {
 
-  # Summary stats
-  # pmf_median <- pmf_shift + exp(pmf_mu)
-  # pmf_sd     <- sqrt((exp(pmf_sigma^2) - 1) * exp(2 * pmf_mu + pmf_sigma^2))
-  pmf_p05    <- pmf_shift + qlnorm(0.05, pmf_mu, pmf_sigma)
-  pmf_p95    <- pmf_shift + qlnorm(0.95, pmf_mu, pmf_sigma)
+    # --- Mode 1: sigma supplied ---
+    if (is.null(pmf_sigma)) {
+      cli::cli_abort(
+        "Either {.arg pmf_sigma} or both {.arg pmf_low} and {.arg pmf_high} must be supplied."
+      )
+    }
+    if (pmf_sigma <= 0) {
+      cli::cli_abort(c(
+        "{.arg pmf_sigma} must be positive.",
+        "x" = "{.arg pmf_sigma} is {.val {pmf_sigma}}."
+      ))
+    }
+    if (pmf_shift >= pmf_best) {
+      cli::cli_abort(c(
+        "{.arg pmf_shift} must be less than {.arg pmf_best}.",
+        "x" = "{.arg pmf_shift} is {.val {pmf_shift}} but {.arg pmf_best} is {.val {pmf_best}}."
+      ))
+    }
+  }
 
-  # create pmf_stage_LN as a list
-  pmf_stage_LN <- list(pmf_shift = pmf_shift,
-                       pmf_mean = pmf_mean,
-                       pmf_sigma = pmf_sigma,
-                       pmf_mu = pmf_mu,
-                       pmf_p05 = pmf_p05,
-                       pmf_p95 = pmf_p95)
+  # --- Derive mu and quantiles ---
+  pmf_mu  <- log(pmf_best - pmf_shift) - (pmf_sigma^2 / 2)
+  pmf_p05 <- pmf_shift + qlnorm(0.05, pmf_mu, pmf_sigma)
+  pmf_p95 <- pmf_shift + qlnorm(0.95, pmf_mu, pmf_sigma)
 
-  return(pmf_stage_LN)
+  list(
+    pmf_shift = pmf_shift,
+    pmf_best  = pmf_best,
+    pmf_sigma = pmf_sigma,
+    pmf_mu    = pmf_mu,
+    pmf_p05   = pmf_p05,
+    pmf_p95   = pmf_p95
+  )
 }
 
 #' Rejection Sampling of Stage Bounded by a Probabilistic Maximum Stage
@@ -106,27 +160,28 @@ pmf_stage_lognormal <- function(pmf_shift, pmf_mean, pmf_sigma = 0.5){
 #'
 #' @examples
 #' \dontrun{
-#' pmf <- pmf_stage_lognormal(pmf_shift = 1200, pmf_mean = 1150, pmf_sigma = 0.5)
+#' pmf_ln <- pmf_stage_lognormal(pmf_shift = 239, pmf_best = 241.9, pmf_sigma = 0.5)
 #'
 #' result <- rejection_sampling_stage(
-#'   pmf_stage_LN  = pmf,
+#'   pmf_stage_LN  = pmf_ln,
 #'   stage_freq_df = my_stage_freq_df,
 #'   n_samples     = 1e7
 #' )
 #' }
 #'
 #' @export
-rejection_sampling_stage <- function(pmf_stage_LN, stage_freq_df = NULL, aep = NULL, stage = NULL, n_samples = 1E7){
+rejection_sampling_stage <- function(pmf_stage_LN, stage_freq_df = NULL, aep = NULL, stage = NULL, n_samples = 1e7){
   # Resolve inputs
   if (!is.null(stage_freq_df)) {
     if (!is.null(aep) || !is.null(stage)) {
       cli::cli_abort("Provide either {.arg stage_freq_df} or {.arg aep}/{.arg stage}, not both.")
     }
-    aep   <- stage_freq_df[[1]]
-    stage <- stage_freq_df[[2]]
+    aep_vals   <- stage_freq_df[[1]]
+    stage_vals <- stage_freq_df[[2]]
 
   } else if (!is.null(aep) && !is.null(stage)) {
-    # use as-is
+    aep_vals   <- aep
+    stage_vals <- stage
 
   } else {
     cli::cli_abort(c(
@@ -141,8 +196,8 @@ rejection_sampling_stage <- function(pmf_stage_LN, stage_freq_df = NULL, aep = N
   pmf_sigma <- pmf_stage_LN[["pmf_sigma"]]
 
   # Transform to z-space for interpolation function ============================
-  z_aep <- qnorm(1-aep)
-  zaep_stage <- approxfun(z_aep, stage, rule = 2)
+  z_aep <- qnorm(1-aep_vals)
+  zaep_stage <- approxfun(z_aep, stage_vals, rule = 2)
 
   # First sample rejection =====================================================
   # Sample AEPs

From 4f027df588cd95db57140f933e496a1cb96b1617 Mon Sep 17 00:00:00 2001
From: Dan McGraw <daniel.e.mcgraw@usace.army.mil>
Date: Mon, 18 May 2026 11:55:09 -0600
Subject: [PATCH 2/2] updated subsequent documentation

---
 R/rejection_sampling.R          | 12 ++++-----
 man/pmf_stage_lognormal.Rd      | 43 +++++++++++++++++++++++----------
 man/rejection_sampling_stage.Rd |  4 +--
 3 files changed, 38 insertions(+), 21 deletions(-)

diff --git a/R/rejection_sampling.R b/R/rejection_sampling.R
index 135a578..5f07e3b 100644
--- a/R/rejection_sampling.R
+++ b/R/rejection_sampling.R
@@ -28,20 +28,20 @@ thin_samples <- function(n, z_sorted, stage_sorted) {
 #'
 #' Computes the parameters of a three-parameter lognormal distribution for use
 #' as a probabilistic maximum stage (PMF) in rejection sampling. The shift
-#' parameter defines the hard lower bound of the distribution. The function
-#' supports two modes: (1) supplying a best estimate and assuming sigma, or
+#' parameter defines the lower or upper bound of the distribution (typically, the lower value).
+#' The function supports two modes: (1) supplying a best estimate and assuming sigma, or
 #' (2) supplying a best estimate, low, and high to solve for sigma numerically.
 #'
 #' @param pmf_shift Numeric. Hard lower bound (shift) of the lognormal
 #'   distribution. Must be less than all of \code{pmf_best}, \code{pmf_low},
 #'   and \code{pmf_high}.
 #' @param pmf_best Numeric. Best estimate (mean) of the PMF stage distribution.
-#' @param pmf_sigma Numeric. Standard deviation on the log scale. Required if
+#' @param pmf_sigma Numeric. Assumed standard deviation on the log scale. Required if
 #'   \code{pmf_low} and \code{pmf_high} are not supplied. Defaults to
-#'   \code{NULL}.
-#' @param pmf_low Numeric. Low estimate of PMF stage (5th percentile). Optional.
+#'   \code{NULL}. Suggested value = 0.5.
+#' @param pmf_low Numeric. Low estimate of PMF stage (assumed 5th percentile). Optional.
 #'   If supplied, \code{pmf_high} must also be supplied.
-#' @param pmf_high Numeric. High estimate of PMF stage (95th percentile).
+#' @param pmf_high Numeric. High estimate of PMF stage (assumed 95th percentile).
 #'   Optional. If supplied, \code{pmf_low} must also be supplied.
 #'
 #' @return A named list with the following elements:
diff --git a/man/pmf_stage_lognormal.Rd b/man/pmf_stage_lognormal.Rd
index 8b1e269..9d0580d 100644
--- a/man/pmf_stage_lognormal.Rd
+++ b/man/pmf_stage_lognormal.Rd
@@ -4,23 +4,36 @@
 \alias{pmf_stage_lognormal}
 \title{Parameterize a Three-Parameter Lognormal PMF for Stage}
 \usage{
-pmf_stage_lognormal(pmf_shift, pmf_mean, pmf_sigma = 0.5)
+pmf_stage_lognormal(
+  pmf_shift,
+  pmf_best,
+  pmf_sigma = NULL,
+  pmf_low = NULL,
+  pmf_high = NULL
+)
 }
 \arguments{
-\item{pmf_shift}{Numeric. Lower bound (shift) of the lognormal distribution.
-Must be greater than \code{pmf_mean}.}
+\item{pmf_shift}{Numeric. Hard lower bound (shift) of the lognormal
+distribution. Must be less than all of \code{pmf_best}, \code{pmf_low},
+and \code{pmf_high}.}
 
-\item{pmf_mean}{Numeric. Mean of the PMF stage distribution. Must be less
-than \code{pmf_shift}.}
+\item{pmf_best}{Numeric. Best estimate (mean) of the PMF stage distribution.}
 
-\item{pmf_sigma}{Numeric. Standard deviation on the log scale. Defaults to
-\code{0.5}.}
+\item{pmf_sigma}{Numeric. Assumed standard deviation on the log scale. Required if
+\code{pmf_low} and \code{pmf_high} are not supplied. Defaults to
+\code{NULL}. Suggested value = 0.5.}
+
+\item{pmf_low}{Numeric. Low estimate of PMF stage (assumed 5th percentile). Optional.
+If supplied, \code{pmf_high} must also be supplied.}
+
+\item{pmf_high}{Numeric. High estimate of PMF stage (assumed 95th percentile).
+Optional. If supplied, \code{pmf_low} must also be supplied.}
 }
 \value{
 A named list with the following elements:
 \describe{
-\item{pmf_shift}{Lower bound of the distribution.}
-\item{pmf_mean}{Mean of the distribution.}
+\item{pmf_shift}{Hard lower bound of the distribution.}
+\item{pmf_best}{Best estimate of PMF stage.}
 \item{pmf_sigma}{Standard deviation on the log scale.}
 \item{pmf_mu}{Derived location parameter on the log scale.}
 \item{pmf_p05}{5th percentile of the PMF stage distribution.}
@@ -30,11 +43,15 @@ A named list with the following elements:
 \description{
 Computes the parameters of a three-parameter lognormal distribution for use
 as a probabilistic maximum stage (PMF) in rejection sampling. The shift
-parameter defines the lower bound of the distribution.
+parameter defines the lower or upper bound of the distribution (typically, the lower value).
+The function supports two modes: (1) supplying a best estimate and assuming sigma, or
+(2) supplying a best estimate, low, and high to solve for sigma numerically.
 }
 \examples{
-pmf <- pmf_stage_lognormal(pmf_shift = 1200, pmf_mean = 1150, pmf_sigma = 0.5)
-pmf$pmf_p05
-pmf$pmf_p95
+# Mode 1: assume sigma
+pmf <- pmf_stage_lognormal(pmf_shift = 239, pmf_best = 241.9, pmf_sigma = 0.5)
 
+# Mode 2: solve for sigma from low/high estimates
+pmf <- pmf_stage_lognormal(pmf_shift = 239, pmf_best = 241.9,
+                            pmf_low = 239, pmf_high = 245)
 }
diff --git a/man/rejection_sampling_stage.Rd b/man/rejection_sampling_stage.Rd
index a2f5ade..c9e061b 100644
--- a/man/rejection_sampling_stage.Rd
+++ b/man/rejection_sampling_stage.Rd
@@ -40,10 +40,10 @@ assigned Weibull plotting positions for use in frequency analysis.
 }
 \examples{
 \dontrun{
-pmf <- pmf_stage_lognormal(pmf_shift = 1200, pmf_mean = 1150, pmf_sigma = 0.5)
+pmf_ln <- pmf_stage_lognormal(pmf_shift = 239, pmf_best = 241.9, pmf_sigma = 0.5)
 
 result <- rejection_sampling_stage(
-  pmf_stage_LN  = pmf,
+  pmf_stage_LN  = pmf_ln,
   stage_freq_df = my_stage_freq_df,
   n_samples     = 1e7
 )