normal_distribution_mod: set distribution_params_types

jla commit message: Functions inv_std_normal_cdf and set_normal_params_from_ens now set the appropriate values for the bounded_below, bounded_above, lower_bound and upper_bound components of the distribution_params_type. The distribution_params_type was changed to intent out in set_normal_params_from_ens. The magic number definition of the maximum delta in the inv_cdf root searching routine was changed to be a parameter but the value of 1e-8 was unchanged. A comment notes that changing this parameter to 1e-9 allows all of Ian Groom’s KDE distribution tests to pass. HK note, assuming this is if you use inv_cdf from normal_distribution_mod rather than rootfinding mode with KDE. fixes #787
NCAR · Dec 26, 2024 · b9e67b4 · b9e67b4
1 parent be7f568
commit b9e67b4
Showing 1 changed file with 22 additions and 5 deletions.
diff --git a/assimilation_code/modules/assimilation/normal_distribution_mod.f90 b/assimilation_code/modules/assimilation/normal_distribution_mod.f90
@@ -61,6 +61,7 @@ subroutine test_normal
                                   1e-5_r8, 1e-4_r8, 1e-3_r8, 1e-2_r8, 1e-1_r8, 1e-0_r8]
 
 ! Compare to matlab 
+write(*, *) 'Absolute value of differences should be less than 1e-15'
 ! Absolute value of differences should be less than 1e-15
 do i = 1, 7
    cdf_diff(i) = normal_cdf(mx(i), mmean(i), msd(i)) - mcdf(i)
@@ -157,6 +158,9 @@ function inv_weighted_normal_cdf(alpha, mean, sd, q) result(x)
 real(r8) :: normalized_q
 
 ! VARIABLES THROUGHOUT NEED TO SWITCH TO DIGITS_12
+! The comment above is not consistent with the performance of these routines 
+! as validated by test_normal. There is no evidence that this is still
+! required.
 
 ! Can search in a standard normal, then multiply by sd at end and add mean
 ! Divide q by alpha to get the right place for weighted normal
@@ -196,8 +200,6 @@ function approx_inv_normal_cdf(quantile_in) result(x)
 real(r8), intent(in) :: quantile_in
 
 ! This is used to get a good first guess for the search in inv_std_normal_cdf
-! The params argument is not needed here but is required for consistency &
-! with other distributions
 
 ! normal inverse
 ! translate from http://home.online.no/~pjacklam/notes/invnorm
@@ -285,14 +287,17 @@ function inv_std_normal_cdf(quantile) result(x)
 ! Given a quantile q, finds the value of x for which the standard normal cdf
 ! has approximately this quantile
 
-! Where should the stupid p type come from
 type(distribution_params_type) :: p
 real(r8) :: mean, sd
 
 ! Set the mean and sd to 0 and 1 for standard normal
 mean        = 0.0_r8;     sd          = 1.0_r8
 p%params(1) = mean;       p%params(2) = sd
 
+! Normal is unbounded
+p%bounded_below = .false.;       p%bounded_above = .false.
+p%lower_bound   = missing_r8;    p%upper_bound   = missing_r8
+
 x = inv_std_normal_cdf_params(quantile, p)
 
 end function inv_std_normal_cdf
@@ -301,6 +306,10 @@ end function inv_std_normal_cdf
 
 function inv_cdf(quantile_in, cdf, first_guess, p) result(x)
 
+! This routine is used for many distributions, not just the normal distribution
+! Could be moved to its own module for clarity or combined with Ian Groom's
+! rootfinding module as an option. 
+
 interface
    function cdf(x, p)
       use types_mod, only : r8
@@ -338,6 +347,11 @@ function first_guess(quantile, p)
 ! Limit on number of times to halve the increment; No deep thought.
 integer, parameter :: max_half_iterations = 25
 
+! Largest delta for computing centered difference derivative
+! Changing this can affect accuracy for specific applications like Ian Grooms KDE
+! Changing to 1e-9 allows all of the KDE tests to PASS
+real(r8), parameter :: max_delta = 1e-8_r8
+
 real(r8) :: quantile
 real(r8) :: reltol, dq_dx, delta
 real(r8) :: x_guess, q_guess, x_new, q_new, del_x, del_q, del_q_old, q_old
@@ -387,7 +401,7 @@ function first_guess(quantile, p)
    ! Analytically, the PDF is derivative of CDF but this can be numerically inaccurate for extreme values
    ! Use numerical derivatives of the CDF to get more accurate inversion
    ! These values for the delta for the approximation work with Gfortran
-   delta = max(1e-8_r8, 1e-8_r8 * abs(x_guess))
+   delta = max(max_delta, max_delta * abs(x_guess))
    dq_dx = (cdf(x_guess + delta, p) - cdf(x_guess - delta, p)) / (2.0_r8 * delta)
    ! Derivative of 0 means we're not going anywhere else
    if(dq_dx <= 0.0_r8) then
@@ -482,14 +496,17 @@ subroutine set_normal_params_from_ens(ens, num, p)
 
 integer,                        intent(in)                         :: num
 real(r8),                       intent(in)                        :: ens(num)
-type(distribution_params_type), intent(inout) :: p
+type(distribution_params_type), intent(out) :: p
 
 ! Set up the description of the normal distribution defined by the ensemble
 p%distribution_type = NORMAL_DISTRIBUTION
 
 ! The two meaningful params are the mean and standard deviation
 call normal_mean_sd(ens, num, p%params(1), p%params(2))
 
+! Normal is unbounded
+p%bounded_below = .false.;       p%bounded_above = .false.
+p%lower_bound   = missing_r8;    p%upper_bound   = missing_r8
 
 end subroutine set_normal_params_from_ens