JuliaStats · ForceBru · Jun 4, 2025 · Jun 4, 2025 · Jun 4, 2025 · Jun 4, 2025
diff --git a/docs/src/univariate.md b/docs/src/univariate.md
@@ -244,6 +244,20 @@ GeneralizedExtremeValue
 plotdensity((0, 30), GeneralizedExtremeValue, (0, 1, 1)) # hide
 ```
 
+```@docs
+GeneralizedHyperbolic
+```
+```@example plotdensity
+plotdensity((-8, 8), GeneralizedHyperbolic, (3, 2, 1, -1, 1/2)) # hide
+```
+
+```@docs
+GeneralizedInverseGaussian
+```
+```@example plotdensity
+plotdensity((0, 20), GeneralizedInverseGaussian, (3, 8, -1/2)) # hide
+```
+
 ```@docs
 GeneralizedPareto
 ```

diff --git a/src/Distributions.jl b/src/Distributions.jl
@@ -100,6 +100,8 @@ export
     FullNormalCanon,
     Gamma,
     DiscreteNonParametric,
+    GeneralizedHyperbolic,
+    GeneralizedInverseGaussian,
     GeneralizedPareto,
     GeneralizedExtremeValue,
     Geometric,

diff --git a/src/univariate/continuous/generalizedhyperbolic.jl b/src/univariate/continuous/generalizedhyperbolic.jl
@@ -0,0 +1,328 @@
+@doc raw"""
+    GeneralizedHyperbolic(α, β, δ, μ=0, λ=1)
+
+The *generalized hyperbolic (GH) distribution* with traditional parameters:
+
+- $\alpha>0$ (shape);
+- $-\alpha<\beta<\alpha$ (skewness);
+- $\delta>0$ ("scale", but not really, because it appears as an argument to the modified Bessel function of the 2nd kind in the normalizing constant);
+- $\mu\in\mathbb R$ (location);
+- $\lambda\in\mathbb R$ is a shape parameter, where $\lambda\neq 1$ makes the distribution "generalized"
+
+has probability density function:
+
+```math
+\frac{
+ (\gamma/\delta)^{\lambda}
+}{
+ \sqrt{2\pi} K_{\lambda}(\delta \gamma)
+}
+e^{\beta (x-\mu)}
+\frac{
+ K_{\lambda-1/2}\left(\alpha\sqrt{\delta^2 + (x-\mu)^2}\right)
+}{
+ \left(\alpha^{-1} \sqrt{\delta^2 + (x-\mu)^2}\right)^{1/2 - \lambda}
+}, \quad\gamma=\sqrt{\alpha^2 - \beta^2}
+```
+
+These parameters are actually stored in `struct GeneralizedHyperbolic{T<:Real}`.
+
+External links:
+
+* [Generalized hyperbolic distribution on Wikipedia](https://en.wikipedia.org/wiki/Generalised_hyperbolic_distribution).
+* [`HyperbolicDistribution` in Wolfram language](https://reference.wolfram.com/language/ref/HyperbolicDistribution.html).
+"""
+struct GeneralizedHyperbolic{T<:Real} <: ContinuousUnivariateDistribution
+    α::T
+    β::T
+    δ::T
+    μ::T
+    λ::T
+    function GeneralizedHyperbolic(α::T, β::T, δ::T, μ::T=zero(T), λ::T=one(T); check_args::Bool=true) where T<:Real
+        check_args && @check_args GeneralizedHyperbolic (α, α > zero(α)) (δ, δ > zero(δ)) (β, -α < β < α)
+        new{T}(α, β, δ, μ, λ)
+    end
+end
+
+GeneralizedHyperbolic(α::Real, β::Real, δ::Real, μ::Real=0, λ::Real=1; check_args::Bool=true) =
+    GeneralizedHyperbolic(promote(α, β, δ, μ, λ)...; check_args)
+
+@doc raw"""
+    GeneralizedHyperbolic(Val(:locscale), z, p=0, μ=0, σ=1, λ=1)
+
+Location-scale parameterization [1] of the generalized hyperbolic distribution with parameters
+
+- $z>0$ (shape);
+- $p\in\mathbb R$ measures skewness ($p=0$ results in a symmetric distribution);
+- $\mu\in\mathbb R$ and $\sigma>0$ are location and scale;
+- $\lambda\in\mathbb R$ is a shape parameter, where $\lambda\neq 1$ makes the distribution "generalized"
+
+has probability density function:
+
+```math
+\frac{\sqrt z}{
+ \sqrt{2\pi} K_{\lambda}(z)
+}
+e^{p z \cdot\varepsilon}
+\sqrt{
+ \left(\frac{1+\varepsilon^2}{1+p^2}\right)^{\lambda - 1/2}
+}
+K_{\lambda-1/2}\left[
+ z \sqrt{(1+p^2)(1+\varepsilon^2)}
+\right]
+```
+
+These parameters are _not_ stored in `struct GeneralizedHyperbolic`.
+Use `params(d, Val(:locscale))`, where `d` is an instance of `GeneralizedHyperbolic`, to retrieve them.
+
+Advantages of this parameterization:
+
+- It's truly location-scale, whereas $\delta$ in the traditional parameterization isn't a true scale parameter.
+- All parameters are either positive or unconstrained. The traditional parameterization has the complicated linear constraint $-\alpha<\beta<\alpha$.
+
+References:
+
+1. Puig, Pedro, and Michael A. Stephens. “Goodness-of-Fit Tests for the Hyperbolic Distribution.” The Canadian Journal of Statistics / La Revue Canadienne de Statistique 29, no. 2 (2001): 309–20. https://doi.org/10.2307/3316079.
+"""
+GeneralizedHyperbolic(::Val{:locscale}, z::Real, p::Real=0, μ::Real=0, σ::Real=1, λ::Real=1; check_args::Bool=true) =
+	GeneralizedHyperbolic(z * sqrt(1 + p^2)/σ, z * p / σ, σ, μ, λ; check_args)
+
+params(d::GeneralizedHyperbolic) = (d.α, d.β, d.δ, d.μ, d.λ)
+params(d::GeneralizedHyperbolic, ::Val{:locscale}) = begin
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    (; z=δ * γ, p=β / γ, μ, σ=δ, λ)
+end
+partype(::GeneralizedHyperbolic{T}) where T = T
+
+@distr_support GeneralizedHyperbolic -Inf Inf
+
+"Fit quadratic `y = ax^2 + bx + c` through 3 points (x, y), return coefficients `(a, b)`."
+function _fit_quadratic(x1, y1, x2, y2, x3, y3)
+    @assert x1 <= x2 <= x3
+    denom = (x1-x2) * (x1-x3) * (x2-x3) # < 0
+    a = (
+        x3 * (y2-y1) + x2 * (y1-y3) + x1 * (y3-y2)
+    ) / denom
+    b = (
+        x3^2 * (y1-y2) + x1^2 * (y2-y3) + x2^2 * (y3-y1)
+    ) / denom
+    (a, b)
+end
+
+"""
+    mode(::GeneralizedHyperbolic)
+
+- Exact formulae are used for λ=1 and λ=2.
+- For other values of λ quadratic fit search is used. The initial bracket `lo < mode < hi` is computed based on
+inequalities from [1, eq. 2.27].
+
+## References
+
+1. Robert E. Gaunt, Milan Merkle, "On bounds for the mode and median of the generalized hyperbolic and related distributions", Journal of Mathematical Analysis and Applications, Volume 493, Issue 1, 2021, 124508, ISSN 0022-247X, https://doi.org/10.1016/j.jmaa.2020.124508.
+"""
+function mode(d::GeneralizedHyperbolic)
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    if λ ≈ 1
+        μ + β * δ / γ # Wolfram
+    elseif λ ≈ 2
+        μ + β / α / γ^2 * (α + sqrt(β^2 + (α * δ * γ)^2)) # Wolfram
+    else
+        # FIXME: quadratic fit search should probably be factored into a separate function
+        lo, hi = let # Bounds for the bracketing interval
+            EX = mean(d)
+            # eq. 2.27 from the paper: EX - upper < mode < EX - lower for β>0.
+            # When β<0, the inequality is reversed.
+            lower = β/γ^2 * (
+                1/2 + sqrt(λ^2 + δ^2 * γ^2) - sqrt((λ - 1/2)^2 + δ^2 * γ^2)
+            )
+            upper = β/γ^2 * (
+                5/2 + sqrt((λ + 1)^2 + δ^2 * γ^2) - sqrt((λ - 3/2)^2 + δ^2 * γ^2)
+            )
+            if β < 0
+                upper, lower = lower, upper
+            end
+            EX - upper, EX - lower
+        end
+
+        # Minimize negative log-PDF using quadratic fit search
+        x1, x2, x3 = lo, (lo + hi)/2, hi # invariant: x1 < x2 < x3
+        xopt = x2
+        y1, y2, y3 = -logpdf(d, x1), -logpdf(d, x2), -logpdf(d, x3)
+        a, b = _fit_quadratic(x1, y1, x2, y2, x3, y3)
+        if a < 0
+            @warn "Quadratic points up instead of down: a=$a."
+            return xopt
+        end
+        (!isfinite(a) || !isfinite(b)) && return xopt
+        niter = 0
+        while x3 - x1 > 1e-6
+            niter += 1
+            xopt = -b / (2a)
+            yopt = -logpdf(d, xopt)
+
+            if xopt < x2
+                if yopt > y2
+                    x1, y1 = xopt, yopt
+                else
+                    x2, x3 = xopt, x2
+                    y2, y3 = yopt, y2
+                end
+            else # xopt > x2
+                if yopt > y2
+                    x3, y3 = xopt, yopt
+                else
+                    x1, x2 = x2, xopt
+                    y1, y2 = y2, yopt
+                end
+            end
+
+            a, b = _fit_quadratic(x1, y1, x2, y2, x3, y3)
+            if !isfinite(a) || !isfinite(b)
+                (abs(x2 - x1) < 1e-6 || abs(x3 - x2) < 1e-6) && break
+                @warn "Failed to build quadratic" (; niter, x1, y1, x2, y2, x3, y3)
+                break
+            end
+        end
+        xopt
+    end
+end
+
+mean(d::GeneralizedHyperbolic) = begin
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+    μ + β * δ / γ * besselk(1 + λ, δ * γ) / besselk(λ, δ * γ)
+end
+
+var(d::GeneralizedHyperbolic) = begin
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    t0 = besselk(0 + λ, δ * γ)
+    t1 = besselk(1 + λ, δ * γ)
+    t2 = besselk(2 + λ, δ * γ)
+    δ / γ * t1/t0 - (β * δ / γ * t1/t0)^2 + (β * δ / γ)^2 * t2/t0
+end
+
+skewness(d::GeneralizedHyperbolic) = begin
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    t0 = besselk(0 + λ, δ * γ)
+    t1 = besselk(1 + λ, δ * γ)
+    t2 = besselk(2 + λ, δ * γ)
+    t3 = besselk(3 + λ, δ * γ)
+    (
+        -3β * (δ / γ * t1/t0)^2 + 2 * (β * δ / γ * t1/t0)^3 + 3β * (δ / γ)^2 * t2/t0
+        - 3 * (β * δ / γ)^3 * t1*t2/t0^2 + (β * δ / γ)^3 * t3/t0
+    ) / sqrt(
+        δ / γ * t1/t0 - (β * δ / γ * t1/t0)^2 + (β * δ / γ)^2 * t2/t0
+    )^3
+end
+
+kurtosis(d::GeneralizedHyperbolic) = begin
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    t0 = besselk(0 + λ, δ * γ)
+    t1 = besselk(1 + λ, δ * γ)
+    t2 = besselk(2 + λ, δ * γ)
+    t3 = besselk(3 + λ, δ * γ)
+    t4 = besselk(4 + λ, δ * γ)
+    (
+        3 * γ^2 * t0^3 * t2 + 6 * β^2 * γ * δ * t0 * (t1^3 - 2t0 * t1 * t2 + t0^2 * t3)
+        + β^4 * δ^2 * (-3 * t1^4 + 6t0 * t1^2 * t2 - 4 * t0^2 * t1 * t3 + t0^3 * t4)
+    ) / (
+        γ * t0 * t1 + β^2 * δ * (-t1^2 + t0 * t2)
+    )^2 - 3 # EXCESS kurtosis
+end
+
+logpdf(d::GeneralizedHyperbolic, x::Real) = begin
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    function logbesselk(v::Real, x::Real, K::Integer=5)
+        if x > 600
+            # Asymptotic expansion, works for massive values of `x` on the order of 10^3, 10^4 and higher.
+            # Important, because otherwise PDF becomes exactly zero `exp(-Inf)==0` way too early.
+            μ = 4v^2
+            term = one(x)
+            s = one(x)
+            for k in 1:K
+                term *= (μ - (2k-1)^2) / (k * 8x)
+                s += term
+            end
+            (log(π) - log(2x))/2 - x + log(abs(s))
+        else
+            log(besselk(v, x)) # Returns `-Inf` for x>600
+        end
+    end
+
+    (
+        -0.5log(2π) - logbesselk(λ, γ * δ) + λ * (log(γ) - log(δ))
+        + β * (x - μ)
+        + (λ - 1/2) * (0.5log(δ^2 + (x - μ)^2) - log(α))
+        + logbesselk(λ - 1/2, α * sqrt(δ^2 + (x - μ)^2))
+    )
+end
+
+cdf(d::GeneralizedHyperbolic, x::Real) =
+	if isinf(x)
+		(x < 0) ? zero(x) : one(x)
+	elseif isnan(x)
+		typeof(x)(NaN)
+	else
+        quadgk(z -> pdf(d, z), -Inf, x, maxevals=10^4)[1]
+	end
+
+@quantile_newton GeneralizedHyperbolic
+
+mgf(d::GeneralizedHyperbolic, t::Number) = begin
+    α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    g = sqrt(α^2 - (t + β)^2)
+    exp(t * μ) / g^λ * sqrt((α - β) * (α + β))^λ * besselk(λ, g * δ) / besselk(λ, γ * δ)
+end
+
+cf(d::GeneralizedHyperbolic, t::Number) = mgf(d, 1im * t)
+
+@doc raw"""
+    rand(::AbstractRNG, ::GeneralizedHyperbolic)
+
+Sample from `GeneralizedHyperbolic(α, β, δ, μ, λ)` using its mixture representation:
+
+```math
+\begin{aligned}
+\gamma &= \sqrt{\alpha^2 - \beta^2}\\
+V &\sim \mathrm{GeneralizedInverseGaussian}(\delta / \gamma, \delta^2, \lambda)\\
+\xi &= \mu + \beta V + \sqrt{V} \varepsilon, \quad\varepsilon \sim \mathcal N(0,1)
+\end{aligned}
+```
+
+Then ξ is distributed as `GeneralizedHyperbolic(α, β, δ, μ, λ)`.
+
+Verified in Wolfram Mathematica:
+
+```
+In:= TransformedDistribution[\[Mu] + \[Beta]*V + 
+  Sqrt[V] \[Epsilon], {\[Epsilon] \[Distributed] NormalDistribution[],
+   V \[Distributed] 
+   InverseGaussianDistribution[\[Delta]/
+     Sqrt[\[Alpha]^2 - \[Beta]^2], \[Delta]^2, \[Lambda]]}]
+
+Out= HyperbolicDistribution[\[Lambda], \[Alpha], \[Beta], \[Delta], \[Mu]]
+```
+
+Note that here λ is the first parameter, while in this implementation it's the _last_ one.
+"""
+rand(rng::AbstractRNG, d::GeneralizedHyperbolic) = begin
+	α, β, δ, μ, λ = params(d)
+    γ = sqrt(α^2 - β^2)
+
+    V = rand(rng, GeneralizedInverseGaussian(δ/γ, δ^2, λ))
+    μ + β * V + sqrt(V) * randn(rng)
+end