From e1d8053a07d745fb5dd019bd5283ed204721ae3a Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Tue, 13 Aug 2024 20:55:41 +0100 Subject: [PATCH 01/17] SafePoisson with safety for large means --- EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl | 5 +- EpiAware/src/EpiAwareUtils/SafePoisson.jl | 262 ++++++++++++++++++++ 2 files changed, 265 insertions(+), 2 deletions(-) create mode 100644 EpiAware/src/EpiAwareUtils/SafePoisson.jl diff --git a/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl b/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl index 14442e9ab..f74163a34 100644 --- a/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl +++ b/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl @@ -8,13 +8,13 @@ using ..EpiAwareBase using DataFramesMeta: DataFrame, @rename! using DynamicPPL: Model, fix, condition, @submodel, @model using MCMCChains: Chains -using Random: AbstractRNG +using Random: AbstractRNG, randexp using Tables: rowtable using Distributions, DocStringExtensions, QuadGK, Statistics, Turing #Export Structures -export HalfNormal, DirectSample +export HalfNormal, DirectSample, SafePoisson #Export functions export scan, spread_draws, censored_pmf, get_param_array, prefix_submodel @@ -32,5 +32,6 @@ include("turing-methods.jl") include("DirectSample.jl") include("post-inference.jl") include("get_param_array.jl") +include("SafePoisson.jl") end diff --git a/EpiAware/src/EpiAwareUtils/SafePoisson.jl b/EpiAware/src/EpiAwareUtils/SafePoisson.jl new file mode 100644 index 000000000..9a2059b3a --- /dev/null +++ b/EpiAware/src/EpiAwareUtils/SafePoisson.jl @@ -0,0 +1,262 @@ +@doc raw" +Create a Poisson distribution with the specified mean that avoids `InExactError` +when the mean is too large. + +# Arguments: +using Base: disable_text_style + +- `λ`: The mean of the Poisson distribution. + +# Returns: + +- A `SafePoisson` distribution with the specified mean. 
+ +# Examples: + +```jldoctest SafePoisson +using EpiAware, Distributions + +bigλ = exp(48.0) #Large value of λ +d = SafePoisson(bigλ) +# output +EpiAware.EpiAwareUtils.SafePoisson{Float64}(λ=7.016735912097631e20) +``` + +```jldoctest SafePoisson +cdf(d, 2) +# output +0.0 +``` + +```jldoctest SafePoisson +logpdf(d, 100) +# output +-7.016735912097631e20 +``` + +```jldoctest SafePoisson +mean(d) +# output +7.016735912097631e20 +``` + +```jldoctest SafePoisson +var(d) +# output +7.016735912097631e20 +``` +" +struct SafePoisson{T <: Real} <: ContinuousUnivariateDistribution + λ::T + + SafePoisson{T}(λ::Real) where {T <: Real} = new{T}(λ) + SafePoisson(λ::Real) = SafePoisson{eltype(λ)}(λ) +end + +# Default outer constructor +SafePoisson() = SafePoisson{Float64}(1.0) + +# helper functions +_poisson(d::SafePoisson) = Poisson{typeof(d.λ)}(d.λ) + +# ineffiecient but safe floor function to integer, which can handle large values o +function _safe_int_floor(x::Real) + try + return floor(Int, x) + catch + return floor(BigInt, x) + end +end + +function _safe_int_round(x::Real) + try + return round(Int, x) + catch + return round(BigInt, x) + end +end + +### Parameters + +Distributions.params(d::SafePoisson) = _poisson(d) |> params +Distributions.partype(::SafePoisson{T}) where {T} = T +Distributions.rate(d::SafePoisson) = d.λ + +### Statistics + +Distributions.mean(d::SafePoisson) = d.λ +Distributions.mode(d::SafePoisson) = _safe_int_floor(d.λ) +Distributions.var(d::SafePoisson) = d.λ +Distributions.skewness(d::SafePoisson) = one(typeof(d.λ)) / sqrt(d.λ) +Distributions.kurtosis(d::SafePoisson) = one(typeof(d.λ)) / d.λ + +function Distributions.entropy(d::SafePoisson{T}) where T<:Real + entropy(_poisson(d)) +end + +Distributions.kldivergence(p::SafePoisson, q::SafePoisson) = kldivergence(_poisson(p), _poisson(q)) + +### Evaluation + +Distributions.mgf(d::SafePoisson, t::Real) = mgf(_poisson(d), t) +Distributions.cgf(d::SafePoisson, t) = cgf(_poisson(d), t) +Distributions.cf(d::SafePoisson, t::Real) = cf(_poisson(d), t) +Distributions.logpdf(d::SafePoisson, x::Integer) = logpdf(_poisson(d), x) +Distributions.pdf(d::SafePoisson, x::Integer) = pdf(_poisson(d), x) +Distributions.cdf(d::SafePoisson, x::Integer) = cdf(_poisson(d), x) +Distributions.ccdf(d::SafePoisson, x::Integer) = ccdf(_poisson(d), x) +Distributions.quantile(d::SafePoisson, q::Real) = quantile(_poisson(d), q) + +### Support + +Base.minimum(d::SafePoisson) = 0 +Base.maximum(d::SafePoisson) = Inf +Distributions.insupport(d::SafePoisson, x::Integer) = x >= 0 + +### Sampling +### Taken from FastPoisson.jl https://github.com/SciML/PoissonRandom.jl/blob/master/src/PoissonRandom.jl + + +count_rand(λ) = count_rand(Random.GLOBAL_RNG, λ) +function count_rand(rng::AbstractRNG, λ) + n = 0 + c = randexp(rng) + while c < λ + n += 1 + c += randexp(rng) + end + return n +end + +# Algorithm from: +# +# J.H. Ahrens, U. Dieter (1982) +# "Computer Generation of Poisson Deviates from Modified Normal Distributions" +# ACM Transactions on Mathematical Software, 8(2):163-179 +# +# For μ sufficiently large, (i.e. 
>= 10.0) +# +ad_rand(λ) = ad_rand(Random.GLOBAL_RNG, λ) +function ad_rand(rng::AbstractRNG, λ) + s = sqrt(λ) + d = 6.0 * λ^2 + L = _safe_int_floor(λ - 1.1484) + # Step N + G = λ + s * randn(rng) + + if G >= 0.0 + K = _safe_int_floor(G) + # Step I + if K >= L + return K + end + + # Step S + U = rand(rng) + if d * U >= (λ - K)^3 + return K + end + + # Step P + px, py, fx, fy = procf(λ, K, s) + + # Step Q + if fy * (1 - U) <= py * exp(px - fx) + return K + end + end + + while true + # Step E + E = randexp(rng) + U = 2.0 * rand(rng) - 1.0 + T = 1.8 + copysign(E, U) + if T <= -0.6744 + continue + end + + K = _safe_int_floor(λ + s * T) + px, py, fx, fy = procf(λ, K, s) + c = 0.1069 / λ + + # Step H + @fastmath if c * abs(U) <= py * exp(px + E) - fy * exp(fx + E) + return K + end + end +end + +# log(1+x)-x +# accurate ~2ulps for -0.227 < x < 0.315 +function log1pmx_kernel(x::Float64) + r = x / (x + 2.0) + t = r * r + w = @evalpoly(t, + 6.66666666666666667e-1, # 2/3 + 4.00000000000000000e-1, # 2/5 + 2.85714285714285714e-1, # 2/7 + 2.22222222222222222e-1, # 2/9 + 1.81818181818181818e-1, # 2/11 + 1.53846153846153846e-1, # 2/13 + 1.33333333333333333e-1, # 2/15 + 1.17647058823529412e-1) # 2/17 + hxsq = 0.5 * x * x + r * (hxsq + w * t) - hxsq +end + +# use naive calculation or range reduction outside kernel range. +# accurate ~2ulps for all x +function log1pmx(x::Float64) + if !(-0.7 < x < 0.9) + return log1p(x) - x + elseif x > 0.315 + u = (x - 0.5) / 1.5 + return log1pmx_kernel(u) - 9.45348918918356180e-2 - 0.5 * u + elseif x > -0.227 + return log1pmx_kernel(x) + elseif x > -0.4 + u = (x + 0.25) / 0.75 + return log1pmx_kernel(u) - 3.76820724517809274e-2 + 0.25 * u + elseif x > -0.6 + u = (x + 0.5) * 2.0 + return log1pmx_kernel(u) - 1.93147180559945309e-1 + 0.5 * u + else + u = (x + 0.625) / 0.375 + return log1pmx_kernel(u) - 3.55829253011726237e-1 + 0.625 * u + end +end + +# Procedure F +function procf(λ, K::Int, s::Float64) + # can be pre-computed, but does not seem to affect performance + ω = 0.3989422804014327 / s + b1 = 0.041666666666666664 / λ + b2 = 0.3 * b1 * b1 + c3 = 0.14285714285714285 * b1 * b2 + c2 = b2 - 15.0 * c3 + c1 = b1 - 6.0 * b2 + 45.0 * c3 + c0 = 1.0 - b1 + 3.0 * b2 - 15.0 * c3 + + if K < 10 + px = -float(λ) + py = λ^K / factorial(K) + else + δ = 0.08333333333333333 / K + δ -= 4.8 * δ^3 + V = (λ - K) / K + px = K * log1pmx(V) - δ # avoids need for table + py = 0.3989422804014327 / sqrt(K) + end + X = (K - λ + 0.5) / s + X2 = X^2 + fx = -0.5 * X2 # missing negation in pseudo-algorithm, but appears in fortran code. + fy = ω * (((c3 * X2 + c2) * X2 + c1) * X2 + c0) + return px, py, fx, fy +end + +pois_rand(λ) = pois_rand(Random.GLOBAL_RNG, λ) +pois_rand(rng::AbstractRNG, λ) = λ < 6 ? count_rand(rng, λ) : ad_rand(rng, λ) + +function Base.rand(rng::AbstractRNG, d::SafePoisson) + pois_rand(rng, d.λ) +end From ca84aaf37e504969e8972bbe06f5d4c48380b1b8 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Tue, 13 Aug 2024 23:32:33 +0100 Subject: [PATCH 02/17] better selection for conversion to Int or BigInt --- EpiAware/src/EpiAwareUtils/SafePoisson.jl | 15 ++++++++------- 1 file changed, 8 insertions(+), 7 deletions(-) diff --git a/EpiAware/src/EpiAwareUtils/SafePoisson.jl b/EpiAware/src/EpiAwareUtils/SafePoisson.jl index 9a2059b3a..2cc949600 100644 --- a/EpiAware/src/EpiAwareUtils/SafePoisson.jl +++ b/EpiAware/src/EpiAwareUtils/SafePoisson.jl @@ -3,7 +3,6 @@ Create a Poisson distribution with the specified mean that avoids `InExactError` when the mean is too large. 
# Arguments: -using Base: disable_text_style - `λ`: The mean of the Poisson distribution. @@ -59,19 +58,21 @@ SafePoisson() = SafePoisson{Float64}(1.0) # helper functions _poisson(d::SafePoisson) = Poisson{typeof(d.λ)}(d.λ) -# ineffiecient but safe floor function to integer, which can handle large values o +# ineffiecient but safe floor function to integer, which can handle large values of x function _safe_int_floor(x::Real) - try + Tf = typeof(x) + if (Tf(typemin(Int))-one(Tf)) < x < (Tf(typemax(Int))+one(Tf)) return floor(Int, x) - catch + else return floor(BigInt, x) end end function _safe_int_round(x::Real) - try + Tf = typeof(x) + if (Tf(typemin(Int))-one(Tf)) < x < (Tf(typemax(Int))+one(Tf)) return round(Int, x) - catch + else return round(BigInt, x) end end @@ -114,7 +115,7 @@ Base.maximum(d::SafePoisson) = Inf Distributions.insupport(d::SafePoisson, x::Integer) = x >= 0 ### Sampling -### Taken from FastPoisson.jl https://github.com/SciML/PoissonRandom.jl/blob/master/src/PoissonRandom.jl +### Taken from PoissonRandom.jl https://github.com/SciML/PoissonRandom.jl/blob/master/src/PoissonRandom.jl count_rand(λ) = count_rand(Random.GLOBAL_RNG, λ) From ed6968247fafa9f63b834223ecf11eb1076588e7 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Tue, 13 Aug 2024 23:32:43 +0100 Subject: [PATCH 03/17] add SafeNegativeBinomial --- EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl | 3 +- .../src/EpiAwareUtils/SafeNegativeBinomial.jl | 126 ++++++++++++++++++ 2 files changed, 128 insertions(+), 1 deletion(-) create mode 100644 EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl diff --git a/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl b/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl index f74163a34..532747869 100644 --- a/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl +++ b/EpiAware/src/EpiAwareUtils/EpiAwareUtils.jl @@ -14,7 +14,7 @@ using Tables: rowtable using Distributions, DocStringExtensions, QuadGK, Statistics, Turing #Export Structures -export HalfNormal, DirectSample, SafePoisson +export HalfNormal, DirectSample, SafePoisson, SafeNegativeBinomial #Export functions export scan, spread_draws, censored_pmf, get_param_array, prefix_submodel @@ -33,5 +33,6 @@ include("DirectSample.jl") include("post-inference.jl") include("get_param_array.jl") include("SafePoisson.jl") +include("SafeNegativeBinomial.jl") end diff --git a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl new file mode 100644 index 000000000..9d8d14855 --- /dev/null +++ b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl @@ -0,0 +1,126 @@ +@doc raw" +Create a Negative binomial distribution with the specified mean that avoids `InExactError` +when the mean is too large. + + +# Parameterisation: +We are using a mean and cluster factorization of the negative binomial distribution such +that the variance to mean relationship is: + +```math +\sigma^2 = \mu + \alpha^2 \mu^2 +``` + +The reason for this parameterisation is that at sufficiently large mean values (i.e. `μ > 1 / α`) `α` is approximately equal to the +standard fluctuation of the distribution, e.g. if `α = 0.05` we expect typical fluctuations of samples from the negative binomial to be +about 5% of the mean when the mean is notably larger than 20. Otherwise, we expect approximately Poisson noise. In our opinion, this +parameterisation is useful for specifying the distribution in a way that is easier to reason on priors for `α`. + +# Arguments: + +- `μ`: The mean of the Negative binomial distribution. 
+- `α`: The cluster factor of the Negative binomial distribution. + +# Returns: + +- A `SafePoisson` distribution with the specified mean. + +# Examples: + +```jldoctest SafeNegativeBinomial +using EpiAware, Distributions + +bigλ = exp(48.0) #Large value of λ +α = 0.05 +d = SafeNegativeBinomial(bigλ, α) +# output +EpiAware.EpiAwareUtils.SafeNegativeBinomial{Float64}(μ=7.016735912097631e20, α=0.05) +``` + +```jldoctest SafeNegativeBinomial +cdf(d, 2) +# output +8.523453224359909e-90 +``` + +```jldoctest SafeNegativeBinomial +logpdf(d, 100) +# output +-194.3125906630495 +``` + +```jldoctest SafeNegativeBinomial +mean(d) +# output +7.016735912097631e20 +``` + +```jldoctest SafeNegativeBinomial +var(d) +# output +1.2308645715030148e39 +``` +" +struct SafeNegativeBinomial{T<:Real} <: DiscreteUnivariateDistribution + μ::T + α::T + + function SafeNegativeBinomial{T}(μ::T, α::T) where {T <: Real} + return new{T}(μ, α) + end + SafeNegativeBinomial(μ::Real, α::Real) = SafeNegativeBinomial{eltype(μ)}(μ, α) +end + +# helper function +function _negbin(d::SafeNegativeBinomial) + μ² = d.μ^2 + ex_σ² = sqrt(d.α) * μ² + p = d.μ / (d.μ + ex_σ²) + r = μ² / ex_σ² + return NegativeBinomial(r, p) +end + +#### Parameters + +Distributions.params(d::SafeNegativeBinomial) = _negbin(d) |> params +Distributions.partype(::SafeNegativeBinomial{T}) where {T} = T + +Distributions.succprob(d::SafeNegativeBinomial) = _negbin(d).p +Distributions.failprob(d::SafeNegativeBinomial{T}) where {T} = one(T) - _negbin(d).p + +#### Statistics + +Distributions.mean(d::SafeNegativeBinomial) = d.μ +Distributions.var(d::SafeNegativeBinomial) = d.μ + d.α^2 * d.μ^2 +Distributions.std(d::SafeNegativeBinomial) = sqrt(var(d)) +Distributions.skewness(d::SafeNegativeBinomial) = _negbin(d) |> skewness +Distributions.kurtosis(d::SafeNegativeBinomial) = _negbin(d) |> kurtosis +Distributions.mode(d::SafeNegativeBinomial) = _negbin(d) |> mode +Distributions.kldivergence(p::SafeNegativeBinomial, q::SafeNegativeBinomial) = kldivergence(_negbin(p), _negbin(q)) + +#### Evaluation & Sampling + +Distributions.logpdf(d::SafeNegativeBinomial, k::Real) = logpdf(_negbin(d), k) + +Distributions.cdf(d::SafeNegativeBinomial, x::Real) = cdf(_negbin(d), x) +Distributions.ccdf(d::SafeNegativeBinomial, x::Real) = ccdf(_negbin(d), x) +Distributions.logcdf(d::SafeNegativeBinomial, x::Real) = logcdf(_negbin(d), x) +Distributions.logccdf(d::SafeNegativeBinomial, x::Real) = logccdf(_negbin(d), x) +Distributions.quantile(d::SafeNegativeBinomial, q::Real) = quantile(_negbin(d), q) +Distributions.cquantile(d::SafeNegativeBinomial, q::Real) = cquantile(_negbin(d), q) +Distributions.invlogcdf(d::SafeNegativeBinomial, lq::Real) = invlogcdf(_negbin(d), lq) +Distributions.invlogccdf(d::SafeNegativeBinomial, lq::Real) = invlogccdf(_negbin(d), lq) + +## sampling +function Base.rand(rng::AbstractRNG, d::SafeNegativeBinomial) + _d = _negbin(d) + if isone(_d.p) + return 0 + else + return rand(rng, SafePoisson(rand(rng, Gamma(_d.r, (1 - _d.p)/_d.p)))) + end +end + +Distributions.mgf(d::SafeNegativeBinomial, t::Real) = mgf(_negbin(d), t) +Distributions.cgf(d::SafeNegativeBinomial, t) = cgf(_negbin(d), t) +Distributions.cf(d::SafeNegativeBinomial, t::Real) = cf(_negbin(d), t) From 693569881502cce69fa9ad647b9e7ca646710316 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 00:04:46 +0100 Subject: [PATCH 04/17] add unit tests to doctests --- .../src/EpiAwareUtils/SafeNegativeBinomial.jl | 15 +++-- .../EpiAwareUtils/SafeNegativeBinomial.jl | 62 +++++++++++++++++++ 
EpiAware/test/EpiAwareUtils/SafePoisson.jl | 57 +++++++++++++++++ 3 files changed, 130 insertions(+), 4 deletions(-) create mode 100644 EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl create mode 100644 EpiAware/test/EpiAwareUtils/SafePoisson.jl diff --git a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl index 9d8d14855..47085e682 100644 --- a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl @@ -23,7 +23,7 @@ parameterisation is useful for specifying the distribution in a way that is easi # Returns: -- A `SafePoisson` distribution with the specified mean. +- A `SafeNegativeBinomial` distribution with the specified mean. # Examples: @@ -40,13 +40,13 @@ EpiAware.EpiAwareUtils.SafeNegativeBinomial{Float64}(μ=7.016735912097631e20, α ```jldoctest SafeNegativeBinomial cdf(d, 2) # output -8.523453224359909e-90 +0.0 ``` ```jldoctest SafeNegativeBinomial logpdf(d, 100) # output --194.3125906630495 +-16556.546939786767 ``` ```jldoctest SafeNegativeBinomial @@ -74,12 +74,19 @@ end # helper function function _negbin(d::SafeNegativeBinomial) μ² = d.μ^2 - ex_σ² = sqrt(d.α) * μ² + ex_σ² = d.α^2 * μ² p = d.μ / (d.μ + ex_σ²) r = μ² / ex_σ² return NegativeBinomial(r, p) end +### Support + +Base.minimum(d::SafeNegativeBinomial) = 0 +Base.maximum(d::SafeNegativeBinomial) = Inf +Distributions.insupport(d::SafeNegativeBinomial, x::Integer) = x >= 0 + + #### Parameters Distributions.params(d::SafeNegativeBinomial) = _negbin(d) |> params diff --git a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl new file mode 100644 index 000000000..a6675aca8 --- /dev/null +++ b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl @@ -0,0 +1,62 @@ +@testitem "Testing SafeNegativeBinomial Constructor " begin + μ = 10.0 + α = 0.05 + dist = SafeNegativeBinomial(μ, α) + @test typeof(dist) <: SafeNegativeBinomial +end + +@testitem "Check distribution properties of SafeNegativeBinomial" begin + using Distributions, HypothesisTests, StatsBase + μ = 10.0 + α = 0.05 + dist = SafeNegativeBinomial(μ, α) + #Check Distributions.jl mean function + @test mean(dist) ≈ μ + @test var(dist) ≈ μ + α^2 * μ^2 + samples = [rand(dist) for _ in 1:100_000] + #Check mean from direct sampling of Distributions version and ANOVA and Variance F test comparisons + _dist = EpiAware.EpiAwareUtils._negbin(dist) + direct_samples = rand(_dist, 100_000) + mean_pval = OneWayANOVATest(samples, direct_samples) |> pvalue + @test mean_pval > 1e-6 #Very unlikely to fail if the model is correctly implemented + var_pval = VarianceFTest(samples, direct_samples) |> pvalue + @test var_pval > 1e-6 #Very unlikely to fail if the model is correctly implemented + @test isapprox(var(dist), var(direct_samples), atol = 0.1) + + @testset "Check quantiles" begin + for q in [0.1, 0.25, 0.5, 0.75, 0.9] + @test isapprox(quantile(dist, q), quantile(direct_samples, q), atol = 0.1) + end + end + + @testset "Check support boundaries" begin + @test minimum(dist) == 0 + @test maximum(dist) == Inf + end + + @testset "Check logpdf against Distributions" begin + for x in 0:10:100 + @test isapprox(logpdf(dist, x), + logpdf(_dist, x), atol = 0.1) + end + end + + @testset "Check CDF" begin + x = 0:10:100 + @test isapprox(cdf(dist, x), ecdf(direct_samples)(x), atol = 0.05) + end +end + +@testitem "Testing safety of rand call for SafeNegativeBinomial at large values" begin + using Distributions + bigμ = exp(48.0) #Large value of 
λ + α = 0.05 + dist = SafeNegativeBinomial(bigμ, α) + @testset "Large value of mean samples a BigInt with SafePoisson" begin + @test rand(dist) isa BigInt + end + @testset "Large value of mean sample failure with Poisson" begin + _dist = EpiAware.EpiAwareUtils._negbin(dist) + @test_throws InexactError rand(_dist) + end +end diff --git a/EpiAware/test/EpiAwareUtils/SafePoisson.jl b/EpiAware/test/EpiAwareUtils/SafePoisson.jl new file mode 100644 index 000000000..8af0ced22 --- /dev/null +++ b/EpiAware/test/EpiAwareUtils/SafePoisson.jl @@ -0,0 +1,57 @@ +@testitem "Testing SafePoisson Constructor " begin + λ = 10.0 + dist = SafePoisson(λ) + @test typeof(dist) <: SafePoisson +end + +@testitem "Check distribution properties of SafePoisson" begin + using Distributions, HypothesisTests, StatsBase + λ = 10.0 + dist = SafePoisson(λ) + #Check Distributions.jl mean function + @test mean(dist) ≈ λ + samples = [rand(dist) for _ in 1:100_000] + #Check mean from direct sampling of Distributions version and ANOVA and Variance F test comparisons + direct_samples = rand(Poisson(λ), 100_000) + mean_pval = OneWayANOVATest(samples, direct_samples) |> pvalue + @test mean_pval > 1e-6 #Very unlikely to fail if the model is correctly implemented + var_pval = VarianceFTest(samples, direct_samples) |> pvalue + @test var_pval > 1e-6 #Very unlikely to fail if the model is correctly implemented + @test isapprox(var(dist), var(direct_samples), atol = 0.1) + + @testset "Check quantiles" begin + for q in [0.1, 0.25, 0.5, 0.75, 0.9] + @test isapprox(quantile(dist, q), quantile(direct_samples, q), atol = 0.1) + end + end + + @testset "Check support boundaries" begin + @test minimum(dist) == 0 + @test maximum(dist) == Inf + end + + @testset "Check logpdf against Distributions" begin + for x in 0:10:100 + @test isapprox(logpdf(dist, x), + logpdf(Poisson(λ), x), atol = 0.1) + end + end + + @testset "Check CDF" begin + x = 0:10:100 + @test isapprox(cdf(dist, x), ecdf(direct_samples)(x), atol = 0.05) + end +end + +@testitem "Testing safety of rand call for SafePoisson at large values" begin + using Distributions + bigλ = exp(48.0) #Large value of λ + dist = SafePoisson(bigλ) + @testset "Large value of mean samples a BigInt with SafePoisson" begin + @test rand(dist) isa BigInt + end + @testset "Large value of mean sample failure with Poisson" begin + _dist = Poisson(dist.λ) + @test_throws InexactError rand(_dist) + end +end From 67924eb9e8fc4b5c123868fd1e1a722cb88f6f38 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 00:05:19 +0100 Subject: [PATCH 05/17] reformat --- EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl | 9 +++++---- EpiAware/src/EpiAwareUtils/SafePoisson.jl | 11 ++++++----- 2 files changed, 11 insertions(+), 9 deletions(-) diff --git a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl index 47085e682..f9725b89e 100644 --- a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl @@ -61,7 +61,7 @@ var(d) 1.2308645715030148e39 ``` " -struct SafeNegativeBinomial{T<:Real} <: DiscreteUnivariateDistribution +struct SafeNegativeBinomial{T <: Real} <: DiscreteUnivariateDistribution μ::T α::T @@ -86,7 +86,6 @@ Base.minimum(d::SafeNegativeBinomial) = 0 Base.maximum(d::SafeNegativeBinomial) = Inf Distributions.insupport(d::SafeNegativeBinomial, x::Integer) = x >= 0 - #### Parameters Distributions.params(d::SafeNegativeBinomial) = _negbin(d) |> params @@ -103,7 +102,9 @@ 
Distributions.std(d::SafeNegativeBinomial) = sqrt(var(d)) Distributions.skewness(d::SafeNegativeBinomial) = _negbin(d) |> skewness Distributions.kurtosis(d::SafeNegativeBinomial) = _negbin(d) |> kurtosis Distributions.mode(d::SafeNegativeBinomial) = _negbin(d) |> mode -Distributions.kldivergence(p::SafeNegativeBinomial, q::SafeNegativeBinomial) = kldivergence(_negbin(p), _negbin(q)) +function Distributions.kldivergence(p::SafeNegativeBinomial, q::SafeNegativeBinomial) + kldivergence(_negbin(p), _negbin(q)) +end #### Evaluation & Sampling @@ -124,7 +125,7 @@ function Base.rand(rng::AbstractRNG, d::SafeNegativeBinomial) if isone(_d.p) return 0 else - return rand(rng, SafePoisson(rand(rng, Gamma(_d.r, (1 - _d.p)/_d.p)))) + return rand(rng, SafePoisson(rand(rng, Gamma(_d.r, (1 - _d.p) / _d.p)))) end end diff --git a/EpiAware/src/EpiAwareUtils/SafePoisson.jl b/EpiAware/src/EpiAwareUtils/SafePoisson.jl index 2cc949600..eb4c434fa 100644 --- a/EpiAware/src/EpiAwareUtils/SafePoisson.jl +++ b/EpiAware/src/EpiAwareUtils/SafePoisson.jl @@ -61,7 +61,7 @@ _poisson(d::SafePoisson) = Poisson{typeof(d.λ)}(d.λ) # ineffiecient but safe floor function to integer, which can handle large values of x function _safe_int_floor(x::Real) Tf = typeof(x) - if (Tf(typemin(Int))-one(Tf)) < x < (Tf(typemax(Int))+one(Tf)) + if (Tf(typemin(Int)) - one(Tf)) < x < (Tf(typemax(Int)) + one(Tf)) return floor(Int, x) else return floor(BigInt, x) @@ -70,7 +70,7 @@ end function _safe_int_round(x::Real) Tf = typeof(x) - if (Tf(typemin(Int))-one(Tf)) < x < (Tf(typemax(Int))+one(Tf)) + if (Tf(typemin(Int)) - one(Tf)) < x < (Tf(typemax(Int)) + one(Tf)) return round(Int, x) else return round(BigInt, x) @@ -91,11 +91,13 @@ Distributions.var(d::SafePoisson) = d.λ Distributions.skewness(d::SafePoisson) = one(typeof(d.λ)) / sqrt(d.λ) Distributions.kurtosis(d::SafePoisson) = one(typeof(d.λ)) / d.λ -function Distributions.entropy(d::SafePoisson{T}) where T<:Real +function Distributions.entropy(d::SafePoisson{T}) where {T <: Real} entropy(_poisson(d)) end -Distributions.kldivergence(p::SafePoisson, q::SafePoisson) = kldivergence(_poisson(p), _poisson(q)) +function Distributions.kldivergence(p::SafePoisson, q::SafePoisson) + kldivergence(_poisson(p), _poisson(q)) +end ### Evaluation @@ -117,7 +119,6 @@ Distributions.insupport(d::SafePoisson, x::Integer) = x >= 0 ### Sampling ### Taken from PoissonRandom.jl https://github.com/SciML/PoissonRandom.jl/blob/master/src/PoissonRandom.jl - count_rand(λ) = count_rand(Random.GLOBAL_RNG, λ) function count_rand(rng::AbstractRNG, λ) n = 0 From d315aecaf428c1e5232e7e36550664e69beba0fb Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 00:43:29 +0100 Subject: [PATCH 06/17] Add type promotion so AD works with distribution constructor --- EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl index f9725b89e..713beb7b0 100644 --- a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl @@ -68,9 +68,15 @@ struct SafeNegativeBinomial{T <: Real} <: DiscreteUnivariateDistribution function SafeNegativeBinomial{T}(μ::T, α::T) where {T <: Real} return new{T}(μ, α) end - SafeNegativeBinomial(μ::Real, α::Real) = SafeNegativeBinomial{eltype(μ)}(μ, α) end +#Outer constructors make AD work +function SafeNegativeBinomial(μ::T, α::T) where {T <: Real} + return SafeNegativeBinomial{T}(μ, 
α) +end + +SafeNegativeBinomial(μ::Real, α::Real) = SafeNegativeBinomial(promote(μ, α)...) + # helper function function _negbin(d::SafeNegativeBinomial) μ² = d.μ^2 From 583dd2ecb0728ff221b367998e4dcc952a0c4ec3 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 00:43:47 +0100 Subject: [PATCH 07/17] Add logpdf grad call unit tests for Safe discrete dists --- .../EpiAwareUtils/SafeNegativeBinomial.jl | 23 +++++++++++++++++++ EpiAware/test/EpiAwareUtils/SafePoisson.jl | 23 +++++++++++++++++++ EpiAware/test/Project.toml | 3 +++ 3 files changed, 49 insertions(+) diff --git a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl index a6675aca8..4286ab164 100644 --- a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl @@ -60,3 +60,26 @@ end @test_throws InexactError rand(_dist) end end + +@testitem "Check gradients can be evaluated for logpdf of SafeNegativeBinomial" begin + using Distributions, ReverseDiff, FiniteDifferences, ForwardDiff + log_μ = 48. #Plausible large value to hit with a log scale random walk over a number of time steps + α = 0.05 + + # Make a helper function for grad calls + f(x) = SafeNegativeBinomial(exp(x[1]), α) |> nb -> logpdf(nb, 100) + g_fin_diff = grad(central_fdm(5, 1), f, [log_μ])[1] + + # Compiled ReverseDiff version + input = randn(1) + const f_tape = ReverseDiff.GradientTape(f, input) + const compiled_f_tape = ReverseDiff.compile(f_tape) + cfg = ReverseDiff.GradientConfig(input) + g_rvd = ReverseDiff.gradient(f, [log_μ], cfg) + + # ForwardDiff version + g_fd = ForwardDiff.gradient(f, [log_μ]) + + @test g_fin_diff ≈ g_rvd + @test g_fin_diff ≈ g_fd +end diff --git a/EpiAware/test/EpiAwareUtils/SafePoisson.jl b/EpiAware/test/EpiAwareUtils/SafePoisson.jl index 8af0ced22..49ed1e566 100644 --- a/EpiAware/test/EpiAwareUtils/SafePoisson.jl +++ b/EpiAware/test/EpiAwareUtils/SafePoisson.jl @@ -55,3 +55,26 @@ end @test_throws InexactError rand(_dist) end end + +@testitem "Check gradients can be evaluated for logpdf of SafePoisson" begin + using Distributions, ReverseDiff, FiniteDifferences, ForwardDiff + log_μ = 48. 
#Plausible large value to hit with a log scale random walk over a number of time steps + α = 0.05 + + # Make a helper function for grad calls + f(x) = SafePoisson(exp(x[1])) |> poi -> logpdf(poi, 100) + g_fin_diff = grad(central_fdm(5, 1), f, [log_μ])[1] + + # Compiled ReverseDiff version + input = randn(1) + const f_tape = ReverseDiff.GradientTape(f, input) + const compiled_f_tape = ReverseDiff.compile(f_tape) + cfg = ReverseDiff.GradientConfig(input) + g_rvd = ReverseDiff.gradient(f, [log_μ], cfg) + + # ForwardDiff version + g_fd = ForwardDiff.gradient(f, [log_μ]) + + @test g_fin_diff ≈ g_rvd + @test g_fin_diff ≈ g_fd +end diff --git a/EpiAware/test/Project.toml b/EpiAware/test/Project.toml index f944a2595..95298f7be 100644 --- a/EpiAware/test/Project.toml +++ b/EpiAware/test/Project.toml @@ -5,12 +5,15 @@ DataFramesMeta = "1313f7d8-7da2-5740-9ea0-a2ca25f37964" Distributions = "31c24e10-a181-5473-b8eb-7969acd0382f" Documenter = "e30172f5-a6a5-5a46-863b-614d45cd2de4" DynamicPPL = "366bfd00-2699-11ea-058f-f148b4cae6d8" +FiniteDifferences = "26cc04aa-876d-5657-8c51-4c34ba976000" +ForwardDiff = "f6369f11-7733-5829-9624-2563aa707210" HypothesisTests = "09f84164-cd44-5f33-b23f-e6b0d136a0d5" LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e" LogExpFunctions = "2ab3a3ac-af41-5b50-aa03-7779005ae688" MCMCChains = "c7f686f2-ff18-58e9-bc7b-31028e88f75d" Pathfinder = "b1d3bc72-d0e7-4279-b92f-7fa5d6d2d454" Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c" +ReverseDiff = "37e2e3b7-166d-5795-8a7a-e32c996b4267" SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf" Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2" StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91" From f165ebcfb3ca845f8a70740d563c4d17497cefad Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 01:04:06 +0100 Subject: [PATCH 08/17] reformat --- EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl | 2 +- EpiAware/test/EpiAwareUtils/SafePoisson.jl | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl index 4286ab164..982f9d821 100644 --- a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl @@ -63,7 +63,7 @@ end @testitem "Check gradients can be evaluated for logpdf of SafeNegativeBinomial" begin using Distributions, ReverseDiff, FiniteDifferences, ForwardDiff - log_μ = 48. #Plausible large value to hit with a log scale random walk over a number of time steps + log_μ = 48.0 #Plausible large value to hit with a log scale random walk over a number of time steps α = 0.05 # Make a helper function for grad calls diff --git a/EpiAware/test/EpiAwareUtils/SafePoisson.jl b/EpiAware/test/EpiAwareUtils/SafePoisson.jl index 49ed1e566..d28d19a56 100644 --- a/EpiAware/test/EpiAwareUtils/SafePoisson.jl +++ b/EpiAware/test/EpiAwareUtils/SafePoisson.jl @@ -58,7 +58,7 @@ end @testitem "Check gradients can be evaluated for logpdf of SafePoisson" begin using Distributions, ReverseDiff, FiniteDifferences, ForwardDiff - log_μ = 48. 
#Plausible large value to hit with a log scale random walk over a number of time steps + log_μ = 48.0 #Plausible large value to hit with a log scale random walk over a number of time steps α = 0.05 # Make a helper function for grad calls From bc82075b8a42148c9dc5c1c7eb4db26280eb74c8 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 13:07:20 +0100 Subject: [PATCH 09/17] change neg bin param to (r, p) --- .../src/EpiAwareUtils/SafeNegativeBinomial.jl | 61 +++++++++---------- .../EpiAwareUtils/SafeNegativeBinomial.jl | 39 +++++++++--- 2 files changed, 58 insertions(+), 42 deletions(-) diff --git a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl index 713beb7b0..5a8f6f2eb 100644 --- a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl @@ -11,15 +11,15 @@ that the variance to mean relationship is: \sigma^2 = \mu + \alpha^2 \mu^2 ``` -The reason for this parameterisation is that at sufficiently large mean values (i.e. `μ > 1 / α`) `α` is approximately equal to the -standard fluctuation of the distribution, e.g. if `α = 0.05` we expect typical fluctuations of samples from the negative binomial to be +The reason for this parameterisation is that at sufficiently large mean values (i.e. `r > 1 / p`) `p` is approximately equal to the +standard fluctuation of the distribution, e.g. if `p = 0.05` we expect typical fluctuations of samples from the negative binomial to be about 5% of the mean when the mean is notably larger than 20. Otherwise, we expect approximately Poisson noise. In our opinion, this -parameterisation is useful for specifying the distribution in a way that is easier to reason on priors for `α`. +parameterisation is useful for specifying the distribution in a way that is easier to reason on priors for `p`. # Arguments: -- `μ`: The mean of the Negative binomial distribution. -- `α`: The cluster factor of the Negative binomial distribution. +- `r`: The number of successes, although this can be extended to a continous number. +- `p`: Success rate. 
# Returns: @@ -30,15 +30,19 @@ parameterisation is useful for specifying the distribution in a way that is easi ```jldoctest SafeNegativeBinomial using EpiAware, Distributions -bigλ = exp(48.0) #Large value of λ -α = 0.05 -d = SafeNegativeBinomial(bigλ, α) +bigμ = exp(48.0) #Large value of μ +σ² = bigμ + 0.05 * bigμ^2 #Large variance + +# We can calculate the success rate from the mean to variance relationship +p = bigμ / σ² +r = bigμ * p / (1 - p) +d = SafeNegativeBinomial(r, p) # output -EpiAware.EpiAwareUtils.SafeNegativeBinomial{Float64}(μ=7.016735912097631e20, α=0.05) +EpiAware.EpiAwareUtils.SafeNegativeBinomial{Float64}(r=20.0, p=2.85032816548187e-20) ``` ```jldoctest SafeNegativeBinomial -cdf(d, 2) +cdf(d, 100) # output 0.0 ``` @@ -46,7 +50,7 @@ cdf(d, 2) ```jldoctest SafeNegativeBinomial logpdf(d, 100) # output --16556.546939786767 +-850.1397180331871 ``` ```jldoctest SafeNegativeBinomial @@ -58,33 +62,27 @@ mean(d) ```jldoctest SafeNegativeBinomial var(d) # output -1.2308645715030148e39 +2.4617291430060293e40 ``` " struct SafeNegativeBinomial{T <: Real} <: DiscreteUnivariateDistribution - μ::T - α::T + r::T + p::T - function SafeNegativeBinomial{T}(μ::T, α::T) where {T <: Real} - return new{T}(μ, α) + function SafeNegativeBinomial{T}(r::T, p::T) where {T <: Real} + return new{T}(r, p) end end #Outer constructors make AD work -function SafeNegativeBinomial(μ::T, α::T) where {T <: Real} - return SafeNegativeBinomial{T}(μ, α) +function SafeNegativeBinomial(r::T, p::T) where {T <: Real} + return SafeNegativeBinomial{T}(r, p) end -SafeNegativeBinomial(μ::Real, α::Real) = SafeNegativeBinomial(promote(μ, α)...) +SafeNegativeBinomial(r::Real, p::Real) = SafeNegativeBinomial(promote(r, p)...) # helper function -function _negbin(d::SafeNegativeBinomial) - μ² = d.μ^2 - ex_σ² = d.α^2 * μ² - p = d.μ / (d.μ + ex_σ²) - r = μ² / ex_σ² - return NegativeBinomial(r, p) -end +_negbin(d::SafeNegativeBinomial) =NegativeBinomial(d.r, d.p) ### Support @@ -102,9 +100,9 @@ Distributions.failprob(d::SafeNegativeBinomial{T}) where {T} = one(T) - _negbin( #### Statistics -Distributions.mean(d::SafeNegativeBinomial) = d.μ -Distributions.var(d::SafeNegativeBinomial) = d.μ + d.α^2 * d.μ^2 -Distributions.std(d::SafeNegativeBinomial) = sqrt(var(d)) +Distributions.mean(d::SafeNegativeBinomial) = _negbin(d) |> mean +Distributions.var(d::SafeNegativeBinomial) = _negbin(d) |> var +Distributions.std(d::SafeNegativeBinomial) = _negbin(d) |> std Distributions.skewness(d::SafeNegativeBinomial) = _negbin(d) |> skewness Distributions.kurtosis(d::SafeNegativeBinomial) = _negbin(d) |> kurtosis Distributions.mode(d::SafeNegativeBinomial) = _negbin(d) |> mode @@ -127,11 +125,10 @@ Distributions.invlogccdf(d::SafeNegativeBinomial, lq::Real) = invlogccdf(_negbin ## sampling function Base.rand(rng::AbstractRNG, d::SafeNegativeBinomial) - _d = _negbin(d) - if isone(_d.p) + if isone(d.p) return 0 else - return rand(rng, SafePoisson(rand(rng, Gamma(_d.r, (1 - _d.p) / _d.p)))) + return rand(rng, SafePoisson(rand(rng, Gamma(d.r, (1 - d.p) / d.p)))) end end diff --git a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl index 982f9d821..dc39eebac 100644 --- a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl @@ -1,7 +1,12 @@ @testitem "Testing SafeNegativeBinomial Constructor " begin μ = 10.0 α = 0.05 - dist = SafeNegativeBinomial(μ, α) + # calculate the r, p parameters + σ² = μ + α * μ^2 + p = μ / σ² + r = μ * p / (1 - p) 
+ + dist = SafeNegativeBinomial(r, p) @test typeof(dist) <: SafeNegativeBinomial end @@ -9,10 +14,15 @@ end using Distributions, HypothesisTests, StatsBase μ = 10.0 α = 0.05 - dist = SafeNegativeBinomial(μ, α) + # calculate the r, p parameters + σ² = μ + α * μ^2 + p = μ / σ² + r = μ * p / (1 - p) + + dist = SafeNegativeBinomial(r, p) #Check Distributions.jl mean function @test mean(dist) ≈ μ - @test var(dist) ≈ μ + α^2 * μ^2 + @test var(dist) ≈ σ² samples = [rand(dist) for _ in 1:100_000] #Check mean from direct sampling of Distributions version and ANOVA and Variance F test comparisons _dist = EpiAware.EpiAwareUtils._negbin(dist) @@ -49,9 +59,14 @@ end @testitem "Testing safety of rand call for SafeNegativeBinomial at large values" begin using Distributions - bigμ = exp(48.0) #Large value of λ + μ = exp(48.0) #Large value of λ α = 0.05 - dist = SafeNegativeBinomial(bigμ, α) + # calculate the r, p parameters + σ² = μ + α * μ^2 + p = μ / σ² + r = μ * p / (1 - p) + + dist = SafeNegativeBinomial(r, p) @testset "Large value of mean samples a BigInt with SafePoisson" begin @test rand(dist) isa BigInt end @@ -63,22 +78,26 @@ end @testitem "Check gradients can be evaluated for logpdf of SafeNegativeBinomial" begin using Distributions, ReverseDiff, FiniteDifferences, ForwardDiff - log_μ = 48.0 #Plausible large value to hit with a log scale random walk over a number of time steps + μ = exp(48.0) #Large value of λ α = 0.05 + # calculate the r, p parameters + σ² = μ + α * μ^2 + p = μ / σ² + r = μ * p / (1 - p) # Make a helper function for grad calls - f(x) = SafeNegativeBinomial(exp(x[1]), α) |> nb -> logpdf(nb, 100) - g_fin_diff = grad(central_fdm(5, 1), f, [log_μ])[1] + f(x) = SafeNegativeBinomial(exp(x[1]), p) |> nb -> logpdf(nb, 100) + g_fin_diff = grad(central_fdm(5, 1), f, [log(r)])[1] # Compiled ReverseDiff version input = randn(1) const f_tape = ReverseDiff.GradientTape(f, input) const compiled_f_tape = ReverseDiff.compile(f_tape) cfg = ReverseDiff.GradientConfig(input) - g_rvd = ReverseDiff.gradient(f, [log_μ], cfg) + g_rvd = ReverseDiff.gradient(f, [log(r)], cfg) # ForwardDiff version - g_fd = ForwardDiff.gradient(f, [log_μ]) + g_fd = ForwardDiff.gradient(f, [log(r)]) @test g_fin_diff ≈ g_rvd @test g_fin_diff ≈ g_fd From f36c6136491ca15cba8ad8cc02b89c9a1c28c477 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 13:37:57 +0100 Subject: [PATCH 10/17] Update utils.jl --- EpiAware/src/EpiObsModels/utils.jl | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/EpiAware/src/EpiObsModels/utils.jl b/EpiAware/src/EpiObsModels/utils.jl index ccb0227f6..33a46949f 100644 --- a/EpiAware/src/EpiObsModels/utils.jl +++ b/EpiAware/src/EpiObsModels/utils.jl @@ -40,8 +40,8 @@ A `NegativeBinomial` distribution object. 
""" function NegativeBinomialMeanClust(μ, α) μ² = μ^2 - ex_σ² = α * μ² - p = μ / (μ + ex_σ²) - r = μ² / ex_σ² - return NegativeBinomial(r, p) + σ² = μ + α * μ² + p = μ / σ² + r = 1 / α + return SafeNegativeBinomial(r, p) end From b06f6b3555d6d03600d03b8e683030fb9d91d048 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 13:38:48 +0100 Subject: [PATCH 11/17] reformat --- EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl index 5a8f6f2eb..41a51641a 100644 --- a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl @@ -82,7 +82,7 @@ end SafeNegativeBinomial(r::Real, p::Real) = SafeNegativeBinomial(promote(r, p)...) # helper function -_negbin(d::SafeNegativeBinomial) =NegativeBinomial(d.r, d.p) +_negbin(d::SafeNegativeBinomial) = NegativeBinomial(d.r, d.p) ### Support From bf9145c7130983550e19413627bc0f2eaaef367f Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 14:01:56 +0100 Subject: [PATCH 12/17] change empirical var test to more principled approach --- EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl | 12 +++++++----- EpiAware/test/EpiAwareUtils/SafePoisson.jl | 9 ++++++--- 2 files changed, 13 insertions(+), 8 deletions(-) diff --git a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl index dc39eebac..8c828e49d 100644 --- a/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/test/EpiAwareUtils/SafeNegativeBinomial.jl @@ -23,16 +23,18 @@ end #Check Distributions.jl mean function @test mean(dist) ≈ μ @test var(dist) ≈ σ² - samples = [rand(dist) for _ in 1:100_000] + n = 100_000 + samples = [rand(dist) for _ in 1:n] #Check mean from direct sampling of Distributions version and ANOVA and Variance F test comparisons - _dist = EpiAware.EpiAwareUtils._negbin(dist) - direct_samples = rand(_dist, 100_000) + _dist = NegativeBinomial(r, p) + direct_samples = rand(_dist, n) mean_pval = OneWayANOVATest(samples, direct_samples) |> pvalue @test mean_pval > 1e-6 #Very unlikely to fail if the model is correctly implemented var_pval = VarianceFTest(samples, direct_samples) |> pvalue @test var_pval > 1e-6 #Very unlikely to fail if the model is correctly implemented - @test isapprox(var(dist), var(direct_samples), atol = 0.1) - + # Check that the variance is closer than 6 std of estimator to the direct samples + # very unlikely failure if the model is correctly implemented + @test abs(var(dist) - var(direct_samples)) < 6 * var(_dist)^2 * sqrt(2 / n) @testset "Check quantiles" begin for q in [0.1, 0.25, 0.5, 0.75, 0.9] @test isapprox(quantile(dist, q), quantile(direct_samples, q), atol = 0.1) diff --git a/EpiAware/test/EpiAwareUtils/SafePoisson.jl b/EpiAware/test/EpiAwareUtils/SafePoisson.jl index d28d19a56..f8fa89cad 100644 --- a/EpiAware/test/EpiAwareUtils/SafePoisson.jl +++ b/EpiAware/test/EpiAwareUtils/SafePoisson.jl @@ -10,14 +10,17 @@ end dist = SafePoisson(λ) #Check Distributions.jl mean function @test mean(dist) ≈ λ - samples = [rand(dist) for _ in 1:100_000] + n = 100_000 + samples = [rand(dist) for _ in 1:n] #Check mean from direct sampling of Distributions version and ANOVA and Variance F test comparisons - direct_samples = rand(Poisson(λ), 100_000) + direct_samples = rand(Poisson(λ), n) mean_pval = OneWayANOVATest(samples, direct_samples) |> pvalue @test mean_pval > 1e-6 
#Very unlikely to fail if the model is correctly implemented var_pval = VarianceFTest(samples, direct_samples) |> pvalue @test var_pval > 1e-6 #Very unlikely to fail if the model is correctly implemented - @test isapprox(var(dist), var(direct_samples), atol = 0.1) + # Check that the variance is closer than 6 std of estimator to the direct samples + # very unlikely failure if the model is correctly implemented + @test abs(var(dist) - var(direct_samples)) < 6 * var(Poisson(λ))^2 * sqrt(2 / n) @testset "Check quantiles" begin for q in [0.1, 0.25, 0.5, 0.75, 0.9] From 239fe3b7658aae4158035636ca9a894a0cbd7efc Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 15:22:46 +0100 Subject: [PATCH 13/17] add default nadapts rather than just 50% of target sampling --- EpiAware/src/EpiInference/NUTSampler.jl | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/EpiAware/src/EpiInference/NUTSampler.jl b/EpiAware/src/EpiInference/NUTSampler.jl index c3c69e926..b7639859b 100644 --- a/EpiAware/src/EpiInference/NUTSampler.jl +++ b/EpiAware/src/EpiInference/NUTSampler.jl @@ -24,6 +24,8 @@ The `NUTSampler` struct represents using the No-U-Turn Sampler (NUTS) to sample ndraws::Int "The metric type to use for the HMC sampler." metricT::M = DiagEuclideanMetric + "number of adaptation steps" + nadapts::Int = 250 end @doc raw" @@ -51,6 +53,7 @@ function _apply_nuts(model, method, prev_result; kwargs...) method.mcmc_parallel, method.ndraws ÷ method.nchains, method.nchains; + nadapts = method.nadapts, kwargs...) end @@ -69,5 +72,6 @@ function _apply_nuts(model, method, prev_result::PathfinderResult; kwargs...) method.ndraws ÷ method.nchains, method.nchains; init_params = init_params, + nadapts = method.nadapts, kwargs...) end From d2d617c24a90088d3343826b132072c752d763e7 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 15:23:14 +0100 Subject: [PATCH 14/17] Update NUTSampler.jl --- EpiAware/src/EpiInference/NUTSampler.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/EpiAware/src/EpiInference/NUTSampler.jl b/EpiAware/src/EpiInference/NUTSampler.jl index b7639859b..fc05d72a7 100644 --- a/EpiAware/src/EpiInference/NUTSampler.jl +++ b/EpiAware/src/EpiInference/NUTSampler.jl @@ -25,7 +25,7 @@ The `NUTSampler` struct represents using the No-U-Turn Sampler (NUTS) to sample "The metric type to use for the HMC sampler." metricT::M = DiagEuclideanMetric "number of adaptation steps" - nadapts::Int = 250 + nadapts::Int = 500 end @doc raw" From cf07966a45aed4ff79cec11e992b8d648523659a Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 17:34:21 +0100 Subject: [PATCH 15/17] set dist check_args = false --- EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl | 2 +- EpiAware/src/EpiAwareUtils/SafePoisson.jl | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl index 41a51641a..3a32de966 100644 --- a/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl +++ b/EpiAware/src/EpiAwareUtils/SafeNegativeBinomial.jl @@ -82,7 +82,7 @@ end SafeNegativeBinomial(r::Real, p::Real) = SafeNegativeBinomial(promote(r, p)...) 
# helper function -_negbin(d::SafeNegativeBinomial) = NegativeBinomial(d.r, d.p) +_negbin(d::SafeNegativeBinomial) = NegativeBinomial(d.r, d.p; check_args = false) ### Support diff --git a/EpiAware/src/EpiAwareUtils/SafePoisson.jl b/EpiAware/src/EpiAwareUtils/SafePoisson.jl index eb4c434fa..a4b7f13ca 100644 --- a/EpiAware/src/EpiAwareUtils/SafePoisson.jl +++ b/EpiAware/src/EpiAwareUtils/SafePoisson.jl @@ -56,7 +56,7 @@ end SafePoisson() = SafePoisson{Float64}(1.0) # helper functions -_poisson(d::SafePoisson) = Poisson{typeof(d.λ)}(d.λ) +_poisson(d::SafePoisson) = Poisson(d.λ; check_args=false) # ineffiecient but safe floor function to integer, which can handle large values of x function _safe_int_floor(x::Real) From 7e57378bc3cc6ba80734510ba575b8a9ba98c49c Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 17:36:05 +0100 Subject: [PATCH 16/17] Set nadapts to Turing Default --- EpiAware/src/EpiInference/NUTSampler.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/EpiAware/src/EpiInference/NUTSampler.jl b/EpiAware/src/EpiInference/NUTSampler.jl index fc05d72a7..fcf99f24a 100644 --- a/EpiAware/src/EpiInference/NUTSampler.jl +++ b/EpiAware/src/EpiInference/NUTSampler.jl @@ -25,7 +25,7 @@ The `NUTSampler` struct represents using the No-U-Turn Sampler (NUTS) to sample "The metric type to use for the HMC sampler." metricT::M = DiagEuclideanMetric "number of adaptation steps" - nadapts::Int = 500 + nadapts::Int = -1 #This uses the Turing NUTS number of adaptation steps default which is half of the number of draws end @doc raw" From 00dee998d2cd22785e077166edfce9747db01885 Mon Sep 17 00:00:00 2001 From: Samuel Brand Date: Wed, 14 Aug 2024 17:36:55 +0100 Subject: [PATCH 17/17] reformat --- EpiAware/src/EpiAwareUtils/SafePoisson.jl | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/EpiAware/src/EpiAwareUtils/SafePoisson.jl b/EpiAware/src/EpiAwareUtils/SafePoisson.jl index a4b7f13ca..57a541325 100644 --- a/EpiAware/src/EpiAwareUtils/SafePoisson.jl +++ b/EpiAware/src/EpiAwareUtils/SafePoisson.jl @@ -56,7 +56,7 @@ end SafePoisson() = SafePoisson{Float64}(1.0) # helper functions -_poisson(d::SafePoisson) = Poisson(d.λ; check_args=false) +_poisson(d::SafePoisson) = Poisson(d.λ; check_args = false) # ineffiecient but safe floor function to integer, which can handle large values of x function _safe_int_floor(x::Real)
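
For reference, a short usage sketch that pulls together the pieces introduced across these patches: the mean/cluster-factor parameterisation documented in the `SafeNegativeBinomial` docstring, the `(r, p)` conversion used by `NegativeBinomialMeanClust` in `EpiObsModels/utils.jl`, and the `BigInt` fallback exercised by the unit tests. It assumes a Julia session with this version of EpiAware plus Distributions loaded; the numeric outputs noted in comments are indicative only.

```julia
# Minimal sketch, assuming EpiAware (with these patches) and Distributions are available.
using EpiAware, Distributions

μ = exp(48.0)        # mean large enough that rand(Poisson(μ)) throws InexactError
α = 0.05             # cluster factor, so that σ² = μ + α * μ^2

# Convert the (μ, α) parameterisation to the (r, p) parameters expected by
# SafeNegativeBinomial; this mirrors NegativeBinomialMeanClust in utils.jl.
σ² = μ + α * μ^2
p = μ / σ²
r = 1 / α

d = SafeNegativeBinomial(r, p)

mean(d)              # ≈ μ, i.e. ≈ 7.0e20
logpdf(d, 100)       # finite log-density, no overflow at this mean
rand(d)              # sampled count; a BigInt at means this large (see the unit tests)

# SafePoisson behaves analogously for the Poisson case.
dp = SafePoisson(μ)
rand(dp)             # also expected to be a BigInt here
```
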