Source code for cratermaker.utils.montecarlo_utils

from typing import Any

import numpy as np
from numba import njit
from numpy import cross
from numpy.linalg import norm
from numpy.random import Generator
from numpy.typing import NDArray
from scipy.stats import truncnorm
from uxarray import Grid

from cratermaker.constants import FloatLike
from cratermaker.core.base import _rng_init



[docs]
def get_random_location(
    size: int = 1,
    rng: Generator | None = None,
    rng_seed: int | None = None,
    rng_state: dict | None = None,
    **kwargs: Any,
) -> NDArray[np.float64]:
    """
    Draw random points that are uniformly distributed over the surface of a sphere.

    Two independent uniform deviates are drawn per point. The first is mapped linearly onto longitude, and the second is
    passed through an arccosine so that the resulting latitudes are area-weighted rather than bunched towards the poles.

    Parameters
    ----------
    size : int, optional
        The number of points to generate (default 1). The value is forwarded unchanged as the shape argument of the
        underlying NumPy calls.
    rng : numpy.random.Generator | None
        |rng|
    rng_seed : Any type allowed by the rng_seed argument of numpy.random.Generator, optional
        |rng_seed|
    rng_state : dict, optional
        |rng_state|
    **kwargs : Any
        |kwargs|

    Returns
    -------
    A structured numpy array of shape `size` with dtype [('lon', 'f8'), ('lat', 'f8')]. Longitudes are in degrees in the
    range [-180, 180] and latitudes are in degrees in the range [-90, 90].
    """
    rng, _ = _rng_init(rng=rng, rng_seed=rng_seed, rng_state=rng_state, **kwargs)

    # The azimuthal deviate is drawn before the polar one; keep this order so seeded runs are reproducible.
    azimuth_draw = rng.uniform(size=size)
    polar_draw = rng.uniform(size=size)

    # Azimuth spans [0, 2*pi); the arccos maps a uniform deviate onto an area-weighted colatitude in [0, pi].
    azimuth = 2 * np.pi * azimuth_draw
    colatitude = np.arccos(2 * polar_draw - 1)

    points = np.empty(size, dtype=[("lon", "f8"), ("lat", "f8")])

    # Shift so that longitude is centred on zero and colatitude becomes latitude, then convert to degrees.
    points["lon"] = np.rad2deg(azimuth - np.pi).reshape(size)
    points["lat"] = np.rad2deg(colatitude - np.pi / 2.0).reshape(size)

    return points



@njit
def _get_one_random_location(face_nodes, node_x, node_y, node_z, rng_vals):
    """
    Pick one random point inside a single polygonal face.

    The face is split into a fan of triangles that all share the first valid node. One triangle is chosen with
    probability proportional to its (planar) area, and a point is then drawn uniformly inside that triangle using
    barycentric weights.

    Parameters
    ----------
    face_nodes : 1-D integer array
        Node indices of the face. Negative entries are ignored.
    node_x, node_y, node_z : 1-D float arrays
        Cartesian coordinates of every node, indexed by the values in `face_nodes`.
    rng_vals : 1-D float array with at least 3 entries
        Pre-drawn random numbers. Entry 0 selects the triangle; entries 1 and 2 place the point inside it.
        NOTE(review): the caller supplies values from `Generator.random`, i.e. in [0, 1) - confirm for other callers.

    Returns
    -------
    1-D float array of length 3
        Cartesian coordinates of the sampled point, lying in the plane of the chosen triangle.

    Raises
    ------
    ValueError
        If the face has fewer than three valid nodes.
    """
    valid_nodes = face_nodes[face_nodes >= 0]
    n_valid = len(valid_nodes)
    n_tris = n_valid - 2
    if n_tris < 1:
        raise ValueError("A face must have at least three valid nodes")

    vertices = np.empty((n_valid, 3), dtype=np.float64)
    for i in range(n_valid):
        idx = valid_nodes[i]
        vertices[i, 0] = node_x[idx]
        vertices[i, 1] = node_y[idx]
        vertices[i, 2] = node_z[idx]

    # Fan triangulation about vertex 0: triangle j uses vertices (0, j + 1, j + 2).
    v0 = vertices[0]
    areas = np.empty(n_tris)
    for j in range(n_tris):
        areas[j] = 0.5 * norm(cross(vertices[j + 1] - v0, vertices[j + 2] - v0))
    areas /= areas.sum()
    cum_areas = np.cumsum(areas)

    # Triangle selection. Rounding in the normalisation can leave the last cumulative value slightly below the random
    # draw, in which case searchsorted returns n_tris. Indexing is not bounds-checked inside jitted code, so clamp.
    tri_idx = np.searchsorted(cum_areas, rng_vals[0])
    if tri_idx >= n_tris:
        tri_idx = n_tris - 1
    v1 = vertices[tri_idx + 1]
    v2 = vertices[tri_idx + 2]

    # Uniform sampling in a triangle: reflect draws that land in the far half of the unit square.
    r1, r2 = rng_vals[1], rng_vals[2]
    if r1 + r2 > 1.0:
        r1, r2 = 1.0 - r1, 1.0 - r2
    r0 = 1.0 - r1 - r2
    return r0 * v0 + r1 * v1 + r2 * v2


def get_random_location_on_face(
    grid: Grid,
    face_index: int | NDArray[np.int64],
    rng: Generator | None = None,
    rng_seed: int | None = None,
    rng_state: dict | None = None,
    **kwargs: Any,
) -> NDArray[np.float64]:
    """
    Draw one random location inside each requested face of an unstructured mesh.

    Parameters
    ----------
    grid : uxarray.Grid
        The grid object that supplies the face-node connectivity and the Cartesian node coordinates.
    face_index : int | NDArray[np.int64]
        A face index, or an array of face indices, for which to draw a sample. A scalar is treated as a one-element
        array.
    rng : numpy.random.Generator | None
        |rng|
    rng_seed : Any type allowed by the rng_seed argument of numpy.random.Generator, optional
        |rng_seed|
    rng_state : dict, optional
        |rng_state|
    **kwargs : Any
        |kwargs|

    Returns
    -------
    A structured numpy array with dtype [('lon', 'f8'), ('lat', 'f8')] holding one entry per element of `face_index`.
    """
    from uxarray.grid import coordinates

    rng, _ = _rng_init(rng=rng, rng_seed=rng_seed, rng_state=rng_state, **kwargs)

    # Promote a scalar index to a 1-D array so that single and multiple faces share one code path
    face_index = np.atleast_1d(face_index)
    n_faces = len(face_index)
    connectivity = grid.face_node_connectivity[face_index, :].values

    xs = grid.node_x.values
    ys = grid.node_y.values
    zs = grid.node_z.values

    # All random numbers are drawn up front: three per face (triangle choice plus two in-triangle weights)
    draws = rng.random((n_faces, 3))

    locations = np.empty(n_faces, dtype=[("lon", "f8"), ("lat", "f8")])
    for k in range(n_faces):
        row = connectivity[k]
        # Entries below zero do not refer to a node and are dropped
        corners = row[row >= 0]
        point = _get_one_random_location(corners, xs, ys, zs, rng_vals=draws[k, :])
        lon, lat = coordinates._xyz_to_lonlat_deg(*point)
        locations["lon"][k] = np.float64(lon)
        locations["lat"][k] = np.float64(lat)

    return locations



[docs]
def get_random_impact_angle(
    size: int | tuple[int, ...] = 1,
    rng: Generator | None = None,
    rng_seed: int | None = None,
    rng_state: dict | None = None,
    **kwargs: Any,
) -> NDArray[np.float64]:
    """
    Sample impact angles from a distribution that peaks at 45 degrees.

    The angle is obtained as arcsin(sqrt(u)) for a uniform deviate u, which gives a probability density proportional
    to sin(2 * angle) on the interval from 0 to 90 degrees. For the theory, see Shoemaker (1962) "Interpretation of
    lunar craters."

    Parameters
    ----------
    size : int or tuple of ints, optional
        The number of samples to generate (default 1). If the shape is (m, n, k), then m * n * k samples are drawn.
    rng : numpy.random.Generator | None
        |rng|
    rng_seed : Any type allowed by the rng_seed argument of numpy.random.Generator, optional
        |rng_seed|
    rng_state : dict, optional
        |rng_state|
    **kwargs : Any
        |kwargs|

    Returns
    -------
    ndarray of np.float64
        An array of impact angles (in degrees) with shape `size`.
    """
    rng, _ = _rng_init(rng=rng, rng_seed=rng_seed, rng_state=rng_state, **kwargs)

    # Inverse-transform sampling: the cumulative distribution is sin(angle)**2
    sin_angle = np.sqrt(rng.uniform(size=size))
    return np.rad2deg(np.arcsin(sin_angle))



def get_random_impact_direction(
    size: int | tuple[int, ...] = 1,
    rng: Generator | None = None,
    rng_seed: int | None = None,
    rng_state: dict | None = None,
    **kwargs: Any,
) -> NDArray[np.float64]:
    """
    Sample impact directions uniformly over a full circle.

    Parameters
    ----------
    size : int or tuple of ints, optional
        The number of samples to generate (default 1). If the shape is (m, n, k), then m * n * k samples are drawn.
    rng : numpy.random.Generator | None
        |rng|
    rng_seed : Any type allowed by the rng_seed argument of numpy.random.Generator, optional
        |rng_seed|
    rng_state : dict, optional
        |rng_state|
    **kwargs : Any
        |kwargs|

    Returns
    -------
    ndarray of np.float64
        An array of impact directions (in degrees) drawn uniformly between 0 and 360, with shape `size`.
    """
    rng, _ = _rng_init(rng=rng, rng_seed=rng_seed, rng_state=rng_state, **kwargs)

    return rng.uniform(low=0.0, high=360.0, size=size)



[docs]
def get_random_size(
    diameters: NDArray[np.float64],
    cdf: NDArray[np.float64],
    size: int | tuple[int, ...] | None = None,
    mu: int | tuple[int, ...] | None = None,
    rng: Generator | None = None,
    rng_seed: int | None = None,
    rng_state: dict | None = None,
    **kwargs: Any,
) -> NDArray[np.float64]:
    """
    Sample diameters from a cumulative size-frequency distribution (SFD).

    Given an array of diameters and the matching cumulative distribution function (CDF), this function generates new diameter values that follow the specified distribution. The SFD is treated as a continuous function that interpolates between the provided diameters, which are assumed to represent a power-law distribution.

    Parameters
    ----------
    diameters : array_like
        An array of diameters from which the SFD is constructed. Must be 1-dimensional, contain at least two values, and be strictly positive.
    cdf : array_like
        The cumulative distribution function corresponding to `diameters`. Must be 1-dimensional, the same size as `diameters`, strictly positive, and monotonically increasing with decreasing diameter value. Integer-valued input is accepted; it is converted to floating point internally.
    size : int or tuple of ints, optional
        The number of samples to generate. If the shape is (m, n, k), then m * n * k samples are drawn. If size is None and mu is None then a single value is returned. Note: mu and size are mutually exclusive.
    mu : int or tuple of ints, optional
        The expected number of samples. The actual number is drawn from a Poisson random number generator with this mean. Note: mu and size are mutually exclusive.
    rng : numpy.random.Generator | None
        |rng|
    rng_seed : Any type allowed by the rng_seed argument of numpy.random.Generator, optional
        |rng_seed|
    rng_state : dict, optional
        |rng_state|
    **kwargs : Any
        |kwargs|

    Returns
    -------
    ndarray of np.float64
        An array of sampled diameter values from the SFD.

    Raises
    ------
    ValueError
        If `diameters` or `cdf` is a scalar, is not 1-dimensional, has fewer than two elements, contains non-positive values, if the two differ in size, if the CDF does not increase monotonically with decreasing diameter, or if both `size` and `mu` are given.

    Notes
    -----
    The SFD is assumed to be a continuous distribution that follows a power-law between the provided discrete diameter values. Linear interpolation in log-space is used to sample new values between the known diameters.
    A small amount of random noise (a relative perturbation of up to 1e-8 of the diameter value) is added to the final diameter value to ensure that diameter values are unlikely to be identical, even when an input CDF could lead to identical diameter values.
    The inputs are never modified.

    Examples
    --------
    >>> diameters = np.array([100.0, 56.0, 32.0, 18.0, 10.0])
    >>> ncumul = np.array([0.01, 0.06, 0.21, 0.51, 1.0])
    >>> sizes = get_random_size(diameters, cdf=ncumul, size=4)
    >>> sizes.shape
    (4,)
    """
    rng, _ = _rng_init(rng=rng, rng_seed=rng_seed, rng_state=rng_state, **kwargs)

    # Check that the shapes and sizes of diameters and cdf are compatible
    if np.isscalar(diameters) or np.isscalar(cdf):
        raise ValueError("The 'diameters' and 'cdf' arguments must be arrays")

    # Accept any array-like (lists, integer arrays, ...) and work in floating point from here on, so the
    # normalisation and logarithms below cannot fail on a dtype cast
    diameters = np.asarray(diameters, dtype=np.float64)
    cdf = np.asarray(cdf, dtype=np.float64)

    if diameters.ndim != 1:
        raise ValueError("The 'diameters' argument must be a 1-dimensional array")
    if cdf.ndim != 1:
        raise ValueError("The 'cdf' argument must be a 1-dimensional array")
    if diameters.size != cdf.shape[0]:
        raise ValueError("The 'diameters' array must have the same size as axis 0 of 'cdf'")
    if diameters.size < 2:
        raise ValueError("The 'diameters' and 'cdf' arguments must have at least two elements")
    if np.any(diameters <= 0.0):
        raise ValueError("All values in the 'diameters' argument must be positive")
    if np.any(cdf <= 0.0):
        raise ValueError("All values in the 'cdf' argument must be positive")
    if size is None and mu is None:
        size = 1
    elif size is not None and mu is not None:
        raise ValueError("The 'size' and 'mu' arguments are mutually exclusive")
    elif size is None and mu is not None:
        size = rng.poisson(mu)

    # Sort the diameters in descending order and carry the cdf along with them
    sorted_indices = np.argsort(diameters)[::-1]
    sorted_diameters = diameters[sorted_indices]
    sorted_cdf = cdf[sorted_indices]

    # Check to make sure that the CDF is correctly specified so that as diameter is decreasing it is monotonically increasing
    is_monotonic_increasing = np.all(np.diff(sorted_cdf) >= 0)
    if not is_monotonic_increasing:
        raise ValueError("The CDF must be monotonically increasing with decreasing diameter.")

    # Normalize the cdf (out of place, so no caller data is touched) and put it in logspace
    sorted_cdf = sorted_cdf / sorted_cdf[-1]
    log_sorted_cdf = np.log(sorted_cdf)

    # Generate uniform random numbers for the entire sample size
    u = rng.uniform(low=sorted_cdf[0], high=sorted_cdf[-1], size=size)
    u = np.log(u)

    # np.log collapses a zero-dimensional draw to a scalar; promote it back to an array
    if np.isscalar(u):
        u = np.array([u])

    # Flatten u to work with it as a 1D array
    original_shape = u.shape
    u = u.flatten()

    # Find the indices where the random numbers would be inserted to maintain order
    # Use the right side of the interval to avoid edge effects for when u == sorted_cdf[0]
    indices = np.searchsorted(log_sorted_cdf, u, side="right")

    # rng.uniform is nominally half-open, but rounding can make it return the upper limit. Clip so that both
    # indices - 1 and indices always address a valid interval of the table.
    indices = np.clip(indices, 1, log_sorted_cdf.size - 1)

    log_diam_low = np.log(sorted_diameters[indices - 1])
    log_diam_high = np.log(sorted_diameters[indices])
    log_nval_low = log_sorted_cdf[indices - 1]
    log_nval_high = log_sorted_cdf[indices]

    # Linear interpolation in log-log space, i.e. a power law between neighbouring table entries
    fractions = (u - log_nval_low) / (log_nval_high - log_nval_low)
    log_diam_interp = log_diam_low + fractions * (log_diam_high - log_diam_low)
    new_diameters = np.exp(log_diam_interp)

    # Reshape new_diameters to the original shape of u
    new_diameters = new_diameters.reshape(original_shape)

    # Add a small random noise to the diameters
    noise = 1e-8 * rng.uniform(size=new_diameters.shape)
    new_diameters *= 1 + noise
    return new_diameters




[docs]
def get_random_velocity(
    vmean: np.float64,
    vescape: np.float64 | None = None,
    size: int | tuple[int, ...] = 1,
    rng: Generator | None = None,
    rng_seed: int | None = None,
    rng_state: dict | None = None,
    **kwargs: Any,
) -> NDArray[np.float64]:
    """
    Sample impact velocities from a Maxwellian distribution given a mean velocity. Optionally account for the escape velocity.

    Each speed is the magnitude of a 3-component vector whose components are independent zero-mean normal deviates, with the standard deviation chosen so that the mean speed equals `vmean`.

    Parameters
    ----------
    vmean : np.float64
        The mean velocity of the distribution.
    vescape : np.float64 | None, optional
        The escape velocity of the target body. If None, the escape velocity is not used in the calculation, and the distribution will be a Maxwellian. If it is included, then the distribution will depend on the value of vmean. If vmean > vescape, then the distribution will be adjusted so that the escape velocity is the minimum velocity by computing an encounter velocity then summing the encounter and escape velocities in quadrature. If vmean <= vescape, then the distribution will be a Maxwellian truncated so that every sample is below vescape.
    size : int or tuple of ints, optional
        The number of samples to generate (default 1). If the shape is (m, n, k), then m * n * k samples are drawn.
    rng : numpy.random.Generator | None
        |rng|
    rng_seed : Any type allowed by the rng_seed argument of numpy.random.Generator, optional
        |rng_seed|
    rng_state : dict, optional
        |rng_state|
    **kwargs : Any
        |kwargs|

    Returns
    -------
    ndarray
        An array of impact velocities, in the same units as `vmean`.

    Raises
    ------
    ValueError
        If vmean <= vescape and vescape is not positive, because no speed can fall below such a limit.
    """
    rng, _ = _rng_init(rng=rng, rng_seed=rng_seed, rng_state=rng_state, **kwargs)

    if vescape is not None:
        if vmean > vescape:
            # Sample the encounter speed, then add the escape speed in quadrature
            vencounter = np.sqrt(vmean**2 - vescape**2)
            velocities = get_random_velocity(vencounter, rng=rng, size=size)
            return np.sqrt(velocities**2 + vescape**2)

        if vescape <= 0:
            # Speeds are non-negative, so the rejection loop below could never finish
            raise ValueError("The 'vescape' argument must be positive when 'vmean' does not exceed it")

        # Rejection sampling. Start from +inf in an explicitly floating-point array: every slot is flagged for
        # drawing on the first pass, and an integer `vescape` cannot turn this into an integer array that would
        # truncate the samples on assignment.
        velocities = np.full(size, np.inf, dtype=np.float64)
        while True:
            # The same mask drives both resampling and termination, so a sample exactly equal to vescape is
            # redrawn rather than stalling the loop
            rejected = velocities >= vescape
            n_rejected = int(np.count_nonzero(rejected))
            if n_rejected == 0:
                return velocities
            velocities[rejected] = get_random_velocity(vmean, rng=rng, size=n_rejected)

    # The mean speed of a Maxwellian is sigma * sqrt(8 / pi)
    sigma = vmean / np.sqrt(8 / np.pi)

    vx = rng.normal(0, sigma, size=size)
    vy = rng.normal(0, sigma, size=size)
    vz = rng.normal(0, sigma, size=size)
    velocities = np.sqrt(vx**2 + vy**2 + vz**2)

    return velocities




[docs]
def bounded_norm(
    loc: FloatLike,
    scale: FloatLike,
    size: int | tuple[int, ...] = 1,
    lower_bound: FloatLike | None = None,
    upper_bound: FloatLike | None = None,
    rng: Generator | None = None,
    rng_seed: int | None = None,
    rng_state: dict | None = None,
    **kwargs: Any,
) -> FloatLike:
    """
    Sample from a truncated normal distribution.

    The distribution is cut off at `lower_bound` and `upper_bound`. Any bound that is not supplied defaults to one standard deviation away from the mean on the corresponding side.

    Parameters
    ----------
    loc : FloatLike
       Mean of the underlying (untruncated) normal distribution.
    scale : FloatLike
       Standard deviation of the underlying normal distribution. It also sets the distance of any default bound from the mean.
    size : int or tuple of ints, optional
        The number of samples to generate (default 1). If the shape is (m, n, k), then m * n * k samples are drawn.
    lower_bound : FloatLike | None, optional
        The lower bound of the distribution. If None, the lower bound is set to loc - scale.
    upper_bound : FloatLike | None, optional
        The upper bound of the distribution. If None, the upper bound is set to loc + scale.
    rng : numpy.random.Generator | None
        |rng|
    rng_seed : Any type allowed by the rng_seed argument of numpy.random.Generator, optional
        |rng_seed|
    rng_state : dict, optional
        |rng_state|
    **kwargs : Any
        |kwargs|

    Returns
    -------
    FloatLike
       Samples drawn from the normal distribution truncated to the interval between the lower and upper bounds.
    """
    rng, _ = _rng_init(rng=rng, rng_seed=rng_seed, rng_state=rng_state, **kwargs)

    low = loc - scale if lower_bound is None else lower_bound
    high = loc + scale if upper_bound is None else upper_bound

    # truncnorm takes its clip points in units of standard deviations measured from the mean
    clip_low = (low - loc) / scale
    clip_high = (high - loc) / scale

    distribution = truncnorm(clip_low, clip_high, loc=loc, scale=scale)
    return distribution.rvs(size, random_state=rng)