Descriptive Statistics

`circ_r(alpha=None, w=None, Cbar=None, Sbar=None)`

Circular mean resultant vector length (r).

\[ r = \sqrt{\bar{C}^2 + \bar{S}^2} \]

Parameters:

Name	Type	Description	Default
`alpha`	`Optional[ndarray]`	Angles in radian.	`None`
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`Cbar`	`Optional[float]`	Precomputed intermediate values	`None`
`Sbar`	`Optional[float]`	Precomputed intermediate values	`None`

Returns:

Name	Type	Description
`r`	`float`	Resultant vector length

References

Implementation of Example 26.5 (Zar, 2010)

Source code in pycircstat2/descriptive.py

def circ_r(
    alpha: Optional[np.ndarray] = None,
    w: Optional[np.ndarray] = None,
    Cbar: Optional[float] = None,
    Sbar: Optional[float] = None,
) -> float:
    r"""
    Length of the circular mean resultant vector (r).

    $$
    r = \sqrt{\bar{C}^2 + \bar{S}^2}
    $$

    Parameters
    ----------
    alpha: np.array (n, )
        Angles in radian. Only needed when `Cbar` or `Sbar` is missing.
    w: np.array (n,)
        Frequencies or weights. When omitted, ones shaped like `alpha`
        are used.
    Cbar, Sbar: float
        Precomputed intermediate values. When both are supplied they are
        used as-is and `alpha` / `w` are not touched.

    Returns
    -------
    r: float
        Resultant vector length

    Raises
    ------
    ValueError
        If `Cbar` or `Sbar` is missing and `alpha` is None.

    References
    ----------
    Implementation of Example 26.5 (Zar, 2010)
    """
    components_given = Cbar is not None and Sbar is not None

    if not components_given:
        # The components have to be derived from the raw angles.
        if alpha is None:
            raise ValueError("`alpha` is required if `Cbar` and `Sbar` are not provided.")
        if w is None:
            w = np.ones_like(alpha)
        Cbar, Sbar = compute_C_and_S(alpha, w)

    return np.sqrt(Cbar**2 + Sbar**2)

`circ_mean(alpha, w=None)`

Circular mean (m).

\[\cos\bar\theta = C/R,\space \sin\bar\theta = S/R\]

or

\[ \bar\theta = \begin{cases} \tan^{-1}\left(S/C\right), & \text{if } S > 0, C > 0 \\ \tan^{-1}\left(S/C\right) + \pi, & \text{if } C < 0 \\ \tan^{-1}\left(S/C\right) + 2\pi, & \text{if } S < 0, C > 0 \end{cases} \]

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`Optional[ndarray]`	Frequencies or weights	`None`

Returns:

Name	Type	Description
`m`	`float or NaN`	Circular mean

Note

Implementation of Example 26.5 (Zar, 2010)

Source code in pycircstat2/descriptive.py

def circ_mean(
    alpha: np.ndarray,
    w: Optional[np.ndarray] = None,
) -> float:
    r"""
    Circular mean (m).

    $$\cos\bar\theta = C/R,\space \sin\bar\theta = S/R$$

    or

    $$
    \bar\theta =
    \begin{cases}
    \tan^{-1}\left(S/C\right), & \text{if } S > 0, C > 0 \\
    \tan^{-1}\left(S/C\right) + \pi, & \text{if } C < 0 \\
    \tan^{-1}\left(S/C\right) + 2\pi, & \text{if } S < 0, C > 0
    \end{cases}
    $$

    Parameters
    ----------
    alpha: np.array (n, )
        Angles in radian.
    w: np.array (n,)
        Frequencies or weights. When omitted, ones shaped like `alpha`
        are used.

    Returns
    -------
    m: float or NaN
        Circular mean. The direction is set to NaN when the resultant
        vector length is numerically zero (`np.isclose(r, 0)`).

    Note
    ----
    Implementation of Example 26.5 (Zar, 2010)
    """
    weights = np.ones_like(alpha) if w is None else w

    # mean resultant vector length
    Cbar, Sbar = compute_C_and_S(alpha, weights)
    r = circ_r(alpha, weights, Cbar, Sbar)

    # angular mean: undefined when the resultant vector vanishes
    m = np.nan if np.isclose(r, 0) else np.arctan2(Sbar, Cbar)

    return float(angmod(m))

`circ_mean_and_r(alpha, w=None)`

Circular mean (m) and resultant vector length (r).

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`Optional[ndarray]`	Frequencies or weights	`None`

Returns:

Name	Type	Description
`m`	`float or NaN`	Circular mean
`r`	`float`	Resultant vector length

Note

Implementation of Example 26.5 (Zar, 2010)

Source code in pycircstat2/descriptive.py

def circ_mean_and_r(
    alpha: np.ndarray,
    w: Optional[np.ndarray] = None,
) -> Tuple[float, float]:
    """
    Circular mean (m) together with the resultant vector length (r).

    Parameters
    ----------
    alpha: np.array (n, )
        Angles in radian.
    w: np.array (n,)
        Frequencies or weights. When omitted, ones shaped like `alpha`
        are used.

    Returns
    -------
    m: float or NaN
        Circular mean. NaN when `r` is numerically zero
        (`np.isclose(r, 0)`).
    r: float
        Resultant vector length

    Note
    ----
    Implementation of Example 26.5 (Zar, 2010)
    """
    weights = np.ones_like(alpha) if w is None else w

    # mean resultant vector length
    Cbar, Sbar = compute_C_and_S(alpha, weights)
    r = circ_r(alpha, weights, Cbar, Sbar)

    # angular mean: no direction can be assigned to a vanishing resultant
    if np.isclose(r, 0):
        return float(np.nan), r

    return float(angmod(np.arctan2(Sbar, Cbar))), r

`circ_mean_and_r_of_means(circs=None, ms=None, rs=None)`

The Mean of a set of Mean Angles

Parameters:

Name	Type	Description	Default
`circs`	`Union[list, None]`	a list of Circular Objects	`None`
`ms`	`Optional[ndarray]`	a set of mean angles in radian	`None`
`rs`	`Optional[ndarray]`	a set of mean resultant vector lengths	`None`

Returns:

Name	Type	Description
`m`	`float`	mean of means in radian
`r`	`float`	mean of mean resultant vector lengths

Source code in pycircstat2/descriptive.py

def circ_mean_and_r_of_means(
    circs: Union[list, None] = None,
    ms: Optional[np.ndarray] = None,
    rs: Optional[np.ndarray] = None,
) -> Tuple[float, float]:
    """Mean of a set of mean angles (second-order mean).

    Parameters
    ----------
    circs: list
        a list of Circular Objects; each element must expose `.mean`
        and `.r`. When given, `ms` and `rs` are taken from these objects.

    ms: np.array (n, )
        a set of mean angles in radian

    rs: np.array (n, )
        a set of mean resultant vector lengths

    Returns
    -------
    m: float
        mean of means in radian

    r: float
        mean of mean resultant vector lengths

    """

    if circs is not None:
        # Pull (mean, r) out of every object and split into two arrays.
        pairs = [(circ.mean, circ.r) for circ in circs]
        ms, rs = map(np.array, zip(*pairs))
    else:
        assert isinstance(ms, np.ndarray) and isinstance(rs, np.ndarray), (
            "If `circs` is None, then `ms` and `rs` are needed."
        )

    # Average of the rectangular coordinates of the individual mean vectors.
    x_bar = np.mean(np.cos(ms) * rs)
    y_bar = np.mean(np.sin(ms) * rs)
    r = np.sqrt(x_bar**2 + y_bar**2)

    # Direction of the normalised grand mean vector.
    m = angmod(np.arctan2(y_bar / r, x_bar / r))

    return float(m), r

`circ_moment(alpha, w=None, p=1, mean=None, centered=False)`

Compute the p-th circular moment.

\[ m^{\prime}_{p} = \bar{C}_{p} + i\bar{S}_{p} \]

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`Optional[ndarray]`	Frequencies or weights. If None, equal weights are used.	`None`
`p`	`int`	Order of the moment to compute.	`1`
`mean`	`Union[float, ndarray, None]`	Precomputed circular mean. If None, mean is computed internally.	`None`
`centered`	`bool`	If True, center alpha by subtracting the mean.	`False`

Returns:

Name	Type	Description
`mp`	`complex`	The p-th circular moment as a complex number.

Note

Implementation of Equation 2.24 (Fisher, 1993).

Source code in pycircstat2/descriptive.py

def circ_moment(
    alpha: np.ndarray,
    w: Optional[np.ndarray] = None,
    p: int = 1,
    mean: Union[float, np.ndarray, None] = None,
    centered: bool = False,
) -> complex:
    r"""
    Compute the p-th circular moment.

    $$
    m^{\prime}_{p} = \bar{C}_{p} + i\bar{S}_{p}
    $$

    Parameters
    ----------
    alpha: np.ndarray
        Angles in radian.
    w: np.ndarray, optional
        Frequencies or weights. If None, equal weights are used.
    p: int, optional
        Order of the moment to compute.
    mean: float, optional
        Precomputed circular mean. If None, it is computed internally
        when `centered` is True and set to 0.0 otherwise. A supplied
        value is always forwarded to `compute_C_and_S`.
    centered: bool, optional
        If True, center alpha by subtracting the mean. Only consulted
        when `mean` is None.

    Returns
    -------
    mp: complex
        The p-th circular moment as a complex number.

    Note
    ----
    Implementation of Equation 2.24 (Fisher, 1993).
    """
    weights = np.ones_like(alpha) if w is None else w

    if mean is None:
        if centered:
            mean = circ_mean(alpha, weights)
        else:
            mean = 0.0

    cos_part, sin_part = compute_C_and_S(alpha, weights, p, mean)

    return cos_part + 1j * sin_part

`circ_dispersion(alpha, w=None, mean=None)`

Sample Circular Dispersion, defined by Equation 2.28 (Fisher, 1993):

\[ \hat\delta = (1 - \hat\rho_{2})/(2 \hat\rho_{1}^{2}) \]

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`mean`		Precomputed circular mean.	`None`

Returns:

Name	Type	Description
`dispersion`	`float`	Sample Circular Dispersion

Source code in pycircstat2/descriptive.py

def circ_dispersion(
    alpha: np.ndarray,
    w: Optional[np.ndarray] = None,
    mean=None,
) -> float:
    r"""
    Sample Circular Dispersion, defined by Equation 2.28 (Fisher, 1993):

    $$
    \hat\delta = (1 - \hat\rho_{2})/(2 \hat\rho_{1}^{2})
    $$

    Parameters
    ----------

    alpha: np.array, (n, )
        Angles in radian.
    w: None or np.array, (n)
        Frequencies or weights. When omitted, ones shaped like `alpha`
        are used.
    mean: None or float
        Precomputed circular mean; passed through to `circ_moment`.

    Returns
    -------
    dispersion: float
        Sample Circular Dispersion
    """

    weights = np.ones_like(alpha) if w is None else w

    # Moduli of the first and second moments, eq(2.26) and eq(2.27).
    first_moment = circ_moment(alpha=alpha, w=weights, p=1, mean=mean, centered=False)
    second_moment = circ_moment(alpha=alpha, w=weights, p=2, mean=mean, centered=False)
    rho1 = np.abs(first_moment)
    rho2 = np.abs(second_moment)

    return (1 - rho2) / (2 * rho1**2)  # eq(2.28)

`circ_skewness(alpha, w=None)`

Circular skewness, as defined by Equation 2.29 (Fisher, 1993):

\[\hat s = [\hat\rho_2 \sin(\hat\mu_2 - 2 \hat\mu_1)] / (1 - \hat\rho_1)^{\frac{3}{2}}\]

But unlike the implementation of Fisher (1993), here we followed Pewsey et al. (2014) by NOT centering the second moment.

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`Optional[ndarray]`	Frequencies or weights	`None`

Returns:

Name	Type	Description
`skewness`	`float`	Circular Skewness

Source code in pycircstat2/descriptive.py

def circ_skewness(alpha: np.ndarray, w: Optional[np.ndarray] = None) -> float:
    r"""
    Circular skewness, as defined by Equation 2.29 (Fisher, 1993):

    $$\hat s = [\hat\rho_2 \sin(\hat\mu_2 - 2 \hat\mu_1)] / (1 - \hat\rho_1)^{\frac{3}{2}}$$

    But unlike the implementation of Fisher (1993), here we followed Pewsey et al. (2014) by **NOT** centering the second moment.

    Parameters
    ----------

    alpha: np.array, (n, )
        Angles in radian.
    w: None or np.array, (n)
        Frequencies or weights. When omitted, ones shaped like `alpha`
        are used.

    Returns
    -------
    skewness: float
        Circular Skewness
    """

    weights = np.ones_like(alpha) if w is None else w

    first_moment = circ_moment(alpha=alpha, w=weights, p=1, mean=None, centered=False)
    second_moment = circ_moment(alpha=alpha, w=weights, p=2, mean=None, centered=False)  # eq(2.27)

    # `convert_moment` results are unpacked as (direction, length) pairs.
    mu1, rho1 = convert_moment(first_moment)
    mu2, rho2 = convert_moment(second_moment)

    numerator = rho2 * np.sin(mu2 - 2 * mu1)
    denominator = (1 - rho1) ** 1.5

    return numerator / denominator

`circ_kurtosis(alpha, w=None)`

Circular kurtosis, as defined by Equation 2.30 (Fisher, 1993):

\[\hat k = [\hat\rho_2 \cos(\hat\mu_2 - 2 \hat\mu_1) - \hat\rho_1^4] / (1 - \hat\rho_1)^{2}\]

But unlike the implementation of Fisher (1993), here we followed Pewsey et al. (2014) by NOT centering the second moment.

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`Optional[ndarray]`	Frequencies or weights	`None`

Returns:

Name	Type	Description
`kurtosis`	`float`	Circular Kurtosis

Source code in pycircstat2/descriptive.py

def circ_kurtosis(alpha: np.ndarray, w: Optional[np.ndarray] = None) -> float:
    r"""
    Circular kurtosis, as defined by Equation 2.30 (Fisher, 1993):

    $$\hat k = [\hat\rho_2 \cos(\hat\mu_2 - 2 \hat\mu_1) - \hat\rho_1^4] / (1 - \hat\rho_1)^{2}$$

    But unlike the implementation of Fisher (1993), here we followed Pewsey et al. (2014) by **NOT** centering the second moment.

    Parameters
    ----------

    alpha: np.array, (n, )
        Angles in radian.
    w: None or np.array, (n)
        Frequencies or weights. When omitted, ones shaped like `alpha`
        are used.

    Returns
    -------
    kurtosis: float
        Circular Kurtosis
    """

    weights = np.ones_like(alpha) if w is None else w

    first_moment = circ_moment(alpha=alpha, w=weights, p=1, mean=None, centered=False)
    second_moment = circ_moment(alpha=alpha, w=weights, p=2, mean=None, centered=False)  # eq(2.27)

    # `convert_moment` results are unpacked as (direction, length) pairs.
    mu1, rho1 = convert_moment(first_moment)
    mu2, rho2 = convert_moment(second_moment)

    numerator = rho2 * np.cos(mu2 - 2 * mu1) - rho1**4
    denominator = (1 - rho1) ** 2

    return numerator / denominator

`angular_var(alpha=None, w=None, r=None, bin_size=None)`

Angular variance

Parameters:

Name	Type	Description	Default
`alpha`	`Optional[ndarray]`	Angles in radian.	`None`
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`r`	`Optional[float]`	Resultant vector length	`None`
`bin_size`	`Optional[float]`	Interval size of grouped data. Needed for correcting biased r.	`None`

Returns:

Name	Type	Description
`angular_variance`	`float`	Angular variance, range from 0 to 2.

References

Batschelet (1965, 1981), from Section 26.5 of Zar (2010)

Source code in pycircstat2/descriptive.py

def angular_var(
    alpha: Optional[np.ndarray] = None,
    w: Optional[np.ndarray] = None,
    r: Optional[float] = None,
    bin_size: Optional[float] = None,
) -> float:
    r"""
    Angular variance, i.e. twice the circular variance from `circ_var`.

    Parameters
    ----------
    alpha: np.array (n, ) or None
        Angles in radian.
    w: np.array (n,) or None
        Frequencies or weights
    r: float or None
        Resultant vector length
    bin_size: float
        Interval size of grouped data. Needed for correcting biased r.

    Returns
    -------
    angular_variance: float
        Angular variance, range from 0 to 2.

    References
    ----------
    - Batschelet (1965, 1981), from Section 26.5 of Zar (2010)
    """

    # All arguments are forwarded unchanged; validation happens in `circ_var`.
    return 2 * circ_var(alpha=alpha, w=w, r=r, bin_size=bin_size)

`angular_std(alpha=None, w=None, r=None, bin_size=None)`

Angular (standard) deviation

\[ s = \sqrt{2V} = \sqrt{2(1 - r)} \]

Parameters:

Name	Type	Description	Default
`alpha`	`Optional[ndarray]`	Angles in radian.	`None`
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`r`	`Optional[float]`	Resultant vector length	`None`
`bin_size`	`Optional[float]`	Interval size of grouped data. Needed for correcting biased r.	`None`

Returns:

Name	Type	Description
`angular_std`	`float`	Angular (standard) deviation, range from 0 to sqrt(2).

References

Equation 26.20 of Zar (2010)

Source code in pycircstat2/descriptive.py

def angular_std(
    alpha: Optional[np.ndarray] = None,
    w: Optional[np.ndarray] = None,
    r: Optional[float] = None,
    bin_size: Optional[float] = None,
) -> float:
    r"""
    Angular (standard) deviation, the square root of `angular_var`.

    $$
    s = \sqrt{2V} = \sqrt{2(1 - r)}
    $$

    Parameters
    ----------
    alpha: np.array (n, ) or None
        Angles in radian.
    w: np.array (n,) or None
        Frequencies or weights
    r: float or None
        Resultant vector length
    bin_size: float
        Interval size of grouped data. Needed for correcting biased r.

    Returns
    -------
    angular_std: float
        Angular (standard) deviation, range from 0 to sqrt(2).

    References
    ----------
    - Equation 26.20 of Zar (2010)
    """

    # All arguments are forwarded unchanged to `angular_var`.
    return np.sqrt(angular_var(alpha=alpha, w=w, r=r, bin_size=bin_size))

`circ_var(alpha=None, w=None, r=None, bin_size=None)`

Circular variance

\[ V = 1 - r \]

Parameters:

Name	Type	Description	Default
`alpha`	`Optional[ndarray]`	Angles in radian.	`None`
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`r`	`Optional[float]`	Resultant vector length	`None`
`bin_size`	`Optional[float]`	Interval size of grouped data. Needed for correcting biased r.	`None`

Returns:

Name	Type	Description
`variance`	`float`	Circular variance, range from 0 to 1.

References

Equation 2.11 of Fisher (1993)
Equation 26.17 of Zar (2010)

Source code in pycircstat2/descriptive.py

def circ_var(
    alpha: Optional[np.ndarray] = None,
    w: Optional[np.ndarray] = None,
    r: Optional[float] = None,
    bin_size: Optional[float] = None,
) -> float:
    r"""
    Circular variance

    $$ V = 1 - r $$

    Parameters
    ----------
    alpha: np.array (n, ) or None
        Angles in radian. Required when `r` is None, and when `bin_size`
        has to be inferred from unequal weights.
    w: np.array (n,) or None
        Frequencies or weights. If they are not all equal to the first
        weight and `bin_size` is None, the bin size is taken as the
        smallest difference between consecutive entries of `alpha`.
    r: float or None
        Resultant vector length. Computed with `circ_r` when None.
    bin_size: float
        Interval size of grouped data. Needed for correcting biased r.
        No correction is applied when it is None or 0.

    Returns
    -------
    variance: float
        Circular variance, range from 0 to 1.

    Raises
    ------
    ValueError
        If `alpha` is None while it is needed to compute `r` or to infer
        `bin_size`.

    References
    ----------
    - Equation 2.11 of Fisher (1993)
    - Equation 26.17 of Zar (2010)
    """

    # Fall back to computing `r` from the data when it was not supplied.
    if r is None:
        if alpha is None:
            raise ValueError("If `r` is None, then `alpha` is required to compute it.")
        r = circ_r(alpha, w)  # `circ_r` substitutes unit weights for `w=None`

    # Infer the bin size from the angle spacing for unequally weighted data.
    if bin_size is None and w is not None:
        if not np.all(w == w[0]):
            if alpha is None:
                raise ValueError("If `bin_size` is None but `w` is provided, `alpha` must be given.")
            bin_size = float(np.diff(alpha).min())

    # Grouping correction of `r`; skipped for ungrouped data.
    if bin_size is None or bin_size == 0:
        rc = r
    else:
        rc = r * (bin_size / (2 * np.sin(bin_size / 2)))

    return 1 - rc

`circ_std(alpha=None, w=None, r=None, bin_size=None)`

Circular standard deviation (s).

\[ s = \sqrt{-2 \ln(1 - V)} \]

Parameters:

Name	Type	Description	Default
`alpha`	`Optional[ndarray]`	Angles in radian.	`None`
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`r`	`Optional[float]`	Resultant vector length	`None`
`bin_size`	`Optional[float]`	Interval size of grouped data. Needed for correcting biased r.	`None`

Returns:

Name	Type	Description
`s`	`float`	Circular standard deviation.

References

Implementation of Equation 26.15-16/20-21 (Zar, 2010)

Source code in pycircstat2/descriptive.py

def circ_std(
    alpha: Optional[np.ndarray] = None,
    w: Optional[np.ndarray] = None,
    r: Optional[float] = None,
    bin_size: Optional[float] = None,
) -> float:
    r"""
    Circular standard deviation (s).

    $$ s = \sqrt{-2 \ln(1 - V)} $$

    where V is the circular variance returned by `circ_var`.

    Parameters
    ----------
    alpha: np.array (n, ) or None
        Angles in radian.
    w: np.array (n,) or None
        Frequencies or weights
    r: float or None
        Resultant vector length
    bin_size: float
        Interval size of grouped data.
        Needed for correcting biased r.

    Returns
    -------
    s: float
        Circular standard deviation.

    References
    ----------
    Implementation of Equation 26.15-16/20-21 (Zar, 2010)
    """
    variance = circ_var(alpha=alpha, w=w, r=r, bin_size=bin_size)

    # eq(26.21): 1 - V is the (bin-corrected) resultant vector length
    return np.sqrt(-2 * np.log(1 - variance))

`circ_median(alpha, w=None, method='deviation', return_average=True, average_method='all')`

Circular median.

Two ways to compute the circular median for ungrouped data (Fisher, 1993):

deviation: find the angle that has the minimal mean deviation.
count: find the angle that equally divides the number of points on its right and left.

For grouped data, we use the method described in Mardia (1972).

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`method`	`str`	For ungrouped data, there are two ways to compute the median: `deviation` or `count`. Set to `none` to return np.nan.	`'deviation'`
`return_average`	`bool`	Return the average of the median	`True`
`average_method`	`str`	all: circular mean of all medians unique: circular mean of unique medians	`'all'`

Returns:

Name	Type	Description
`median`	`float or NaN`

References

For ungrouped data: Section 2.3.2 of Fisher (1993)
For grouped data: Mardia (1972)

Source code in pycircstat2/descriptive.py

def circ_median(
    alpha: np.ndarray,
    w: Optional[np.ndarray] = None,
    method: str = "deviation",
    return_average: bool = True,
    average_method: str = "all",
) -> Union[float, np.ndarray]:
    r"""
    Circular median.

    Two ways to compute the circular median for ungrouped data (Fisher, 1993):

    - `deviation`: find the angle that has the minimal mean deviation.
    - `count`: find the angle that equally divides the number of points on its right and left.

    For grouped data, we use the method described in Mardia (1972).

    Parameters
    ----------
    alpha: np.array (n, )
        Angles in radian.
    w: np.array (n,) or None
        Frequencies or weights. Data are treated as grouped as soon as
        any weight differs from 1; `method` is ignored in that case.
    method: str
        - For ungrouped data, there are two ways
          to compute the median:
            - deviation
            - count
        - Set to `none` to return np.nan.
    return_average: bool
        Return the average of the median
    average_method: str
        - all: circular mean of all medians
        - unique: circular mean of unique medians

    Returns
    -------
    median: float or NaN

    Raises
    ------
    ValueError
        If `method` (ungrouped data) or `average_method` is not one of
        the supported values.

    References
    ----------
    - For ungrouped data: Section 2.3.2 of Fisher (1993)
    - For grouped data: Mardia (1972)
    """

    weights = np.ones_like(alpha) if w is None else w

    if np.all(weights == 1):
        # ungrouped data
        if method == "count":
            # the data point(s) splitting the sample into two halves
            median = _circ_median_count(alpha)
        elif method == "deviation":
            # the angle with the minimal mean deviation
            median = _circ_median_mean_deviation(alpha)
        elif method == "none" or method is None:
            median = np.nan
        else:
            raise ValueError(
                f"Method `{method}` for `circ_median` is not supported.\nTry `deviation` or `count`"
            )
    else:
        # grouped data
        median = _circ_median_grouped(alpha, weights)

    if return_average:
        # Collapse the candidate median(s) into one value via the circular mean.
        if average_method == "all":
            candidates = np.asarray(median)
        elif average_method == "unique":
            candidates = np.unique(median)
        else:
            raise ValueError(
                f"Average method `{average_method}` is not supported.\nTry `all` or `unique`."
            )
        median = circ_mean(alpha=candidates)

    return angmod(median)

`circ_mean_deviation_chuncked(alpha, beta, chunk_size=1000)`

Optimized circular mean deviation with chunking.

\[ \delta = \pi - \frac{1}{n} \sum^{n}_{1}\left| \pi - \left| \alpha - \beta \right| \right| \]

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Data in radians.	required
`beta`	`ndarray`	Reference angles in radians.	required
`chunk_size`	`int`	Number of rows to process in chunks.	`1000`

Returns:

Type	Description
`ndarray`	Circular mean deviation.

Source code in pycircstat2/descriptive.py

def circ_mean_deviation_chuncked(
    alpha: Union[np.ndarray, float, int, list],
    beta: Union[np.ndarray, float, int, list],
    chunk_size: int = 1000,
) -> np.ndarray:
    r"""
    Optimized circular mean deviation with chunking.

    $$
    \delta = \pi - \frac{1}{n} \sum^{n}_{i=1}\left| \pi - \left| \alpha_i - \beta \right| \right|
    $$

    The reference angles are processed `chunk_size` at a time so that the
    intermediate (chunk, n) distance matrix stays small.

    Parameters
    ----------
    alpha : np.ndarray, list, int or float
        Data in radians.
    beta : np.ndarray, list, int or float
        Reference angles in radians.
    chunk_size : int
        Number of reference angles to process per chunk. Must be >= 1.

    Returns
    -------
    np.ndarray
        Circular mean deviation for every reference angle, rounded to
        5 decimals.

    Raises
    ------
    ValueError
        If `chunk_size` is smaller than 1.
    """
    # `np.atleast_1d(np.asarray(x))` turns scalars AND lists into 1-D arrays.
    # Wrapping with `np.array([x])` would turn a list into a (1, n) matrix
    # and break the broadcasting below.
    alpha = np.atleast_1d(np.asarray(alpha))
    beta = np.atleast_1d(np.asarray(beta))

    if chunk_size < 1:
        # A negative step would make `range` empty and silently return zeros.
        raise ValueError("`chunk_size` must be a positive integer.")

    n = len(beta)
    result = np.zeros(n)

    for start in range(0, n, chunk_size):
        stop = start + chunk_size
        beta_chunk = beta[start:stop]
        # Rows index reference angles, columns index data points.
        angdist = np.pi - np.abs(np.pi - np.abs(alpha - beta_chunk[:, None]))
        result[start:stop] = np.mean(angdist, axis=1).round(5)

    return result

`circ_mean_deviation(alpha, beta)`

Circular mean deviation.

\[ \delta = \pi - \frac{1}{n} \sum^{n}_{i=1} \left| \pi - \left| \alpha_i - \beta \right| \right| \]

It is the mean angular distance from one data point to all others. The circular median of a set of data should be the point with minimal circular mean deviation.

Parameters:

Name	Type	Description	Default
`alpha`	`Union[ndarray, float, int, list]`	Data in radian.	required
`beta`	`Union[ndarray, float, int, list]`	reference angle in radian.	required

Returns:

Type	Description
`circular mean deviation: np.array`

Note

eq 2.32, Section 2.3.2, Fisher (1993)

Source code in pycircstat2/descriptive.py

def circ_mean_deviation(
    alpha: Union[np.ndarray, float, int, list],
    beta: Union[np.ndarray, float, int, list],
) -> np.ndarray:
    r"""
    Circular mean deviation.

    $$
    \delta = \pi - \frac{1}{n} \sum^{n}_{i=1} \left| \pi - \left| \alpha_i - \beta \right| \right|
    $$

    It is the mean angular distance from one reference angle to all data
    points. The circular median of a set of data should be the point with
    minimal circular mean deviation.

    Parameters
    ----------
    alpha: np.array, list, int or float
        Data in radian.
    beta: np.array, list, int or float
        reference angle in radian.

    Returns
    -------
    circular mean deviation: np.array
        One value per reference angle in `beta`, rounded to 5 decimals.

    Note
    ----
    eq 2.32, Section 2.3.2, Fisher (1993)
    """
    # `np.atleast_1d(np.asarray(x))` turns scalars AND lists into 1-D arrays.
    # Wrapping with `np.array([x])` would turn a list into a (1, n) matrix,
    # so the mean below would no longer run over the data points.
    alpha = np.atleast_1d(np.asarray(alpha))
    beta = np.atleast_1d(np.asarray(beta))

    # Rows index reference angles, columns index data points.
    folded = np.abs(np.pi - np.abs(alpha - beta[:, None]))

    return (np.pi - np.mean(folded, 1)).round(5)

`circ_mean_ci(alpha=None, w=None, mean=None, r=None, n=None, ci=0.95, method='approximate', B=2000)`

Confidence interval of circular mean.

There are three methods to compute the confidence interval of circular mean:

approximate: for n > 8
bootstrap: for 8 < n < 25
dispersion: for n >= 25

Approximate Method

For n as small as 8, and r \(\le\) 0.9, r \(>\) \(\sqrt{\chi^{2}_{\alpha, 1}/2n}\), the confidence interval can be approximated by:

\[ \delta = \arccos\left(\sqrt{\frac{2n(2R^{2} - n\chi^{2}_{\alpha, 1})}{4n - \chi^{2}_{\alpha, 1}}} /R \right) \]

For r \(\ge\) 0.9,

\[ \delta = \arccos \left(\sqrt{n^2 - (n^2 - R^2)e^{\chi^2_{\alpha, 1}/n} } /R \right) \]

Bootstrap Method

For 8 \(<\) n \(<\) 25, the confidence interval can be computed by bootstrapping the data.

Dispersion Method

For n \(\ge\) 25, the confidence interval can be computed by the circular dispersion:

\[ \hat\sigma = \hat\delta / n\]

where \(\hat\delta\) is the sample circular dispersion (see circ_dispersion). The confidence interval is then:

\[(\hat\mu - \sin^{-1}(z_{\frac{1}{2}\alpha}\hat\sigma),\space \hat\mu + \sin^{-1}(z_{\frac{1}{2}\alpha} \hat\sigma))\]

Parameters:

Name	Type	Description	Default
`alpha`	`Optional[ndarray]`	Angles in radian.	`None`
`w`	`Optional[ndarray]`	Frequencies or weights	`None`
`mean`	`Optional[float]`	Precomputed circular mean.	`None`
`r`	`Optional[float]`	Precomputed resultant vector length.	`None`
`n`	`Union[int, None]`	Sample size.	`None`
`ci`	`float`	Confidence interval (default is 0.95).	`0.95`
`method`	`str`	approximate: for n > 8 bootstrap: for n < 25 dispersion: for n >= 25	`'approximate'`
`B`	`int`	Number of samples for bootstrap.	`2000`

Returns:

Name	Type	Description
`lower_bound`	`float`	Lower bound of the confidence interval.
`upper_bound`	`float`	Upper bound of the confidence interval.

References

Section 26.7, Zar (2010)
Section 4.4.4a/b, Fisher (1993)

Source code in pycircstat2/descriptive.py

def circ_mean_ci(
    alpha: Optional[np.ndarray] = None,
    w: Optional[np.ndarray] = None,
    mean: Optional[float] = None,
    r: Optional[float] = None,
    n: Union[int, None] = None,
    ci: float = 0.95,
    method: str = "approximate",
    B: int = 2000,  # number of samples for bootstrap
) -> tuple[float, float]:
    r"""
    Confidence interval of circular mean.

    There are three methods to compute the confidence interval of circular mean:

    - `approximate`: for n > 8
    - `bootstrap`: for 8 < n < 25
    - `dispersion`: for n >= 25

    ### Approximate Method

    For n as small as 8, and r $\le$ 0.9, r $>$ $\sqrt{\chi^{2}_{\alpha, 1}/2n}$, the confidence interval can be approximated by:

    $$
    \delta = \arccos\left(\sqrt{\frac{2n(2R^{2} - n\chi^{2}_{\alpha, 1})}{4n - \chi^{2}_{\alpha, 1}}} /R \right)
    $$

    For r $\ge$ 0.9,

    $$
    \delta = \arccos \left(\sqrt{n^2 - (n^2 - R^2)e^{\chi^2_{\alpha, 1}/n} } /R \right)
    $$

    ### Bootstrap Method

    For 8 $<$ n $<$ 25, the confidence interval can be computed by bootstrapping the data.

    ### Dispersion Method

    For n $\ge$ 25, the confidence interval can be computed by the circular dispersion:

    $$ \hat\sigma = \hat\delta / n$$

    where $\hat\delta$ is the sample circular dispersion (see `circ_dispersion`). The confidence interval is then:

    $$(\hat\mu - \sin^{-1}(z_{\frac{1}{2}\alpha}\hat\sigma),\space \hat\mu + \sin^{-1}(z_{\frac{1}{2}\alpha} \hat\sigma))$$

    Parameters
    ----------
    alpha: np.array (n, )
        Angles in radian. Required for the `bootstrap` and `dispersion`
        methods.
    w: np.array (n,) or None
        Frequencies or weights
    mean: float or None
        Precomputed circular mean.
    r: float or None
        Precomputed resultant vector length.
    n: int or None
        Sample size.
    ci: float
        Confidence interval (default is 0.95).
    method: str
        - approximate: for n > 8
        - bootstrap: for n < 25
        - dispersion: for n >= 25
    B: int
        Number of samples for bootstrap.

    Returns
    -------
    lower_bound: float
        Lower bound of the confidence interval.
    upper_bound: float
        Upper bound of the confidence interval.

    Raises
    ------
    ValueError
        If `method` is not one of the supported names, or if `alpha` is
        None for a method that needs the raw data.

    References
    ----------
    - Section 26.7, Zar (2010)
    - Section 4.4.4a/b, Fisher (1993)
    """

    #  n > 8, according to Ch 26.7 (Zar, 2010)
    if method == "approximate":
        lb, ub = _circ_mean_ci_approximate(
            alpha=alpha, w=w, mean=mean, r=r, n=n, ci=ci
        )

    elif method in ("bootstrap", "dispersion"):
        # Both methods work on the raw angles. Report a missing `alpha`
        # explicitly instead of claiming the method is unsupported.
        if alpha is None:
            raise ValueError(
                f"`alpha` is required for method `{method}` of `circ_mean_ci`."
            )

        # n < 25, according to 4.4.4a (Fisher, 1993, P75)
        if method == "bootstrap":
            lb, ub = _circ_mean_ci_bootstrap(alpha=alpha, B=B, ci=ci)
        # n >= 25, according to 4.4.4b (Fisher, 1993, P75)
        else:
            lb, ub = _circ_mean_ci_dispersion(alpha=alpha, w=w, mean=mean, ci=ci)

    else:
        raise ValueError(
            f"Method `{method}` for `circ_mean_ci` is not supported.\nTry `dispersion`, `approximate` or `bootstrap`"
        )

    return float(angmod(lb)), float(angmod(ub))

`circ_median_ci(median=None, alpha=None, w=None, method='deviation', ci=0.95)`

Confidence interval for circular median

For n > 15, the confidence interval can be computed by:

\[ m = 1 + \text{integer part of} \frac{1}{2} n^{1/2} z_{\frac{1}{2}\alpha} \]

For n \(\le\) 15, the confidence interval can be selected from the table in Fisher (1993).

Parameters:

Name	Type	Description	Default
`median`	`Optional[float]`	Circular median.	`None`
`alpha`	`Optional[ndarray]`	Data in radian.	`None`
`w`	`Optional[ndarray]`	Frequencies or weights	`None`

Returns:

Type	Description
`lower, upper, ci: tuple`	confidence intervals and alpha-level

Note

Implementation of section 4.4.2 (Fisher,1993)

Source code in pycircstat2/descriptive.py

def circ_median_ci(
    median: Optional[float] = None,
    alpha: Optional[np.ndarray] = None,
    w: Optional[np.ndarray] = None,
    method: str = "deviation",
    ci: float = 0.95,
) -> tuple:
    r"""Confidence interval for circular median

    For n > 15, the confidence interval can be computed by:

    $$
    m = 1 + \text{integer part of} \frac{1}{2} n^{1/2} z_{\frac{1}{2}\alpha}
    $$

    For n $\le$ 15, the confidence interval can be selected from the table in Fisher (1993).

    Parameters
    ----------
    median: float or None
        Circular median. If None, it is computed from `alpha` with `circ_median`.
    alpha: np.array or None
        Data in radian. Always required, because the interval bounds are
        picked from the sorted observations.
    w: np.array or None
        Frequencies or weights. Only forwarded to `circ_median` when `median`
        has to be computed; defaults to all ones in that case.
    method: str
        Forwarded to `circ_median` when `median` has to be computed.
    ci: float
        Requested confidence level. Only honoured for n > 15; for 3 <= n <= 15
        the tabulated level replaces it in the returned tuple.

    Returns
    -------
    lower, upper, ci: tuple
        Lower bound, upper bound and the confidence level the interval
        corresponds to. For n < 3 both bounds are NaN.

    Raises
    ------
    ValueError
        If `alpha` is None.

    Note
    ----
    Implementation of section 4.4.2 (Fisher,1993)
    """

    if median is None:
        if alpha is None:
            raise ValueError("If `median` is None, then `alpha` is needed.")
        if w is None:
            w = np.ones_like(alpha)
        median = float(circ_median(alpha=alpha, w=w, method=method, return_average=True))

    if alpha is None:
        raise ValueError(
            "`alpha` is needed for computing the confidence interval for circular median."
        )

    n = len(alpha)
    alpha = np.sort(alpha)

    # Selected confidence intervals for the median direction for n <= 15,
    # from A6, Fisher, 1993: n -> (lower index, upper index, confidence level).
    # Only the widest CI is kept when the table lists more than one.
    small_sample_table = {
        3: (0, 2, 0.75),
        4: (0, 3, 0.875),
        5: (0, 4, 0.937),
        6: (0, 5, 0.97),
        7: (0, 6, 0.984),
        8: (0, 7, 0.992),
        9: (0, 8, 0.996),
        10: (1, 8, 0.978),
        11: (1, 9, 0.99),
        12: (2, 9, 0.962),
        13: (2, 10, 0.978),
        14: (3, 10, 0.937),
        15: (2, 12, 0.965),
    }

    if n > 15:
        z = norm.ppf(1 - 0.5 * (1 - ci))

        offset = int(1 + np.floor(0.5 * np.sqrt(n) * z))  # fisher:eq(4.19)

        # Compare at 5 decimals so that a median equal to an observation is
        # recognised despite floating-point noise.
        alpha_rounded = alpha.round(5)
        median_rounded = np.round(median, 5)

        below = np.where(alpha_rounded < median_rounded)[0]
        # If nothing lies below the median (to 5 decimals), the closest index
        # "below" in a circular sense is the last sorted observation.
        idx_median = below[-1] if len(below) > 0 else n - 1

        idx_lb = idx_median - offset + 1
        idx_ub = idx_median + offset
        if np.any(alpha_rounded == median_rounded):  # don't count the median per se
            idx_ub += 1

        # Wrap both indices around the circle. The modulo also covers
        # idx_ub == n, which previously slipped through the `> n` test and
        # indexed one element past the end of `alpha`.
        idx_lb = int(idx_lb) % n
        idx_ub = int(idx_ub) % n

        lower, upper = alpha[idx_lb], alpha[idx_ub]

        if not is_within_circular_range(median, lower, upper):
            lower, upper = upper, lower

    elif n in small_sample_table:
        idx_lb, idx_ub, ci = small_sample_table[n]
        lower, upper = alpha[idx_lb], alpha[idx_ub]

    else:
        # n < 3: no tabulated interval is available.
        lower, upper = np.nan, np.nan

    return (angmod(lower), angmod(upper), ci)

`circ_kappa(r, n=None)`

Estimate kappa by approximation.

\[ \hat\kappa_{ML} = \begin{cases} 2r + r^3 + 5r^5/6, & \text{if } r < 0.53 \\ -0.4 + 1.39 r + 0.43 / (1 - r), & \text{if } 0.53 \le r < 0.85\\ 1 / (r^3 - 4r^2 + 3r), & \text{if } r \ge 0.85 \end{cases} \]

For \(n \le 15\) and \(r < 0.7\):

\[ \hat\kappa = \begin{cases} \max\left(\hat\kappa - \frac{2}{n\hat\kappa}, 0\right), & \text{if } \hat\kappa < 2 \\ \frac{(n - 1)^3 \hat\kappa}{n^3 + n}, & \text{if } \hat\kappa \ge 2 \end{cases} \]

Parameters:

Name	Type	Description	Default
`r`	`float`	Resultant vector length	required
`n`	`Union[int, None]`	Sample size. If n is not None, the adjustment for small sample size will be applied.	`None`

Returns:

Name	Type	Description
`kappa`	`float`	Concentration parameter

Reference

Section 4.5.5 (P88, Fisher, 1993)

Source code in pycircstat2/descriptive.py

def circ_kappa(r: float, n: Union[int, None] = None) -> float:
    r"""Estimate kappa by approximation.

    $$
    \hat\kappa_{ML} =
    \begin{cases}
        2r + r^3 + 5r^5/6, & \text{if } r < 0.53  \\
        -0.4 + 1.39 r + 0.43 / (1 - r), & \text{if } 0.53 \le r < 0.85\\
        1 / (r^3 - 4r^2 + 3r), & \text{if } r \ge 0.85
    \end{cases}
    $$

    For $n \le 15$ and $r < 0.7$:

    $$
    \hat\kappa =
    \begin{cases}
        \max\left(\hat\kappa - \frac{2}{n\hat\kappa}, 0\right), & \text{if } \hat\kappa < 2 \\
        \frac{(n - 1)^3 \hat\kappa}{n^3 + n}, & \text{if } \hat\kappa \ge 2
    \end{cases}
    $$


    Parameters
    ----------
    r: float
        Resultant vector length (scalar).
    n: int or None
        Sample size. If n is not None, the adjustment for small sample size
        is applied when n <= 15 and r < 0.7.

    Returns
    -------
    kappa: float
        Concentration parameter

    Reference
    ---------
    Section 4.5.5 (P88, Fisher, 1993)
    """

    # eq 4.40
    if r < 0.53:
        kappa = 2 * r + r**3 + 5 * r**5 / 6
    elif r < 0.85:
        kappa = -0.4 + 1.39 * r + 0.43 / (1 - r)
    else:
        denom = r**3 - 4 * r**2 + 3 * r
        if denom != 0:
            kappa = 1 / denom
        else:
            # The denominator vanishes at r == 1.
            # NOTE(review): 1 / denom diverges as r -> 1, so a tiny kappa
            # looks questionable; the historical fallback is kept so that
            # existing callers see the same value.
            kappa = 1e-16

    # eq 4.41
    if n is not None and n <= 15 and r < 0.7:
        if kappa < 2:
            if kappa == 0:
                # kappa - 2 / (n * kappa) tends to -inf as kappa -> 0, so the
                # clipped estimate is 0; this also avoids dividing by zero.
                kappa = 0.0
            else:
                kappa = max(kappa - 2 * 1 / (n * kappa), 0.0)
        else:
            kappa = (n - 1) ** 3 * kappa / (n**3 + n)

    return kappa

`circ_dist(x, y=None, metric='center', return_sum=False)`

Compute the element-wise circular distance between two arrays of angles.

Parameters:

Name	Type	Description	Default
`x`	`array - like`	First sample of circular data (radians).	required
`y`	`array - like`	Second sample of circular data (radians). If None, computes element-wise distances within `x` itself.	`None`
`metric`	`str`	Distance metric to use, options: - "center" (default): Standard circular difference wrapped to [-π, π]. - "geodesic": π - \|π - \|x - y\|\|. - "angularseparation": 1 - cos(x - y). - "chord": sqrt(2 * (1 - cos(x - y))).	`'center'`
`return_sum`	`bool`	If True, returns the sum of all computed distances (like R's `dist.circular()`).	`False`

Returns:

Type	Description
`array`	Element-wise distance values based on the chosen metric.

Source code in pycircstat2/descriptive.py

def circ_dist(
    x: Union[np.ndarray, float],
    y: Optional[Union[np.ndarray, float]] = None,
    metric: str = "center",
    return_sum: bool = False,
) -> Union[np.ndarray, float]:
    r"""
    Element-wise circular distance between two (broadcastable) sets of angles.

    Parameters
    ----------
    x : array-like
        First sample of circular data (radians).
    y : array-like, optional
        Second sample of circular data (radians). When omitted, `x` is
        compared with itself element by element.
    metric : str, optional
        Which distance to evaluate:
        - "center" (default): argument of exp(ix) / exp(iy), i.e. the signed
          difference wrapped onto the principal branch.
        - "geodesic": π - |π - |x - y||.
        - "angularseparation": 1 - cos(x - y).
        - "chord": sqrt(2 * (1 - cos(x - y))).
    return_sum : bool, optional
        If True, the distances are summed and a single float is returned
        (like R's `dist.circular()`).

    Returns
    -------
    array or float
        The distances for the chosen metric, or their sum if `return_sum`.

    Raises
    ------
    ValueError
        If the shapes of `x` and `y` cannot be broadcast together, or if
        `metric` is not one of the supported names.
    """
    first = np.asarray(x)
    second = first if y is None else np.asarray(y)

    # Fail early, with a readable message, when the operands cannot broadcast.
    try:
        np.broadcast_shapes(first.shape, second.shape)
    except ValueError:
        raise ValueError(
            f"Shapes {first.shape} and {second.shape} are incompatible for broadcasting."
        )

    # Each formula is wrapped in a thunk so only the requested one is evaluated.
    formulas = (
        ("center", lambda: np.angle(np.exp(1j * first) / np.exp(1j * second))),
        ("geodesic", lambda: np.pi - np.abs(np.pi - np.abs(first - second))),
        ("angularseparation", lambda: 1 - np.cos(first - second)),
        ("chord", lambda: np.sqrt(2 * (1 - np.cos(first - second)))),
    )

    for label, formula in formulas:
        if metric == label:
            distances = formula()
            break
    else:
        raise ValueError(f"Unknown metric: {metric}")

    if return_sum:
        return np.sum(distances).astype(float)
    return distances

`circ_pairdist(x, y=None, metric='center', return_sum=False)`

Compute the pairwise circular distance between all elements in x and y.

Parameters:

Name	Type	Description	Default
`x`	`array - like`	First sample of circular data (radians).	required
`y`	`array - like`	Second sample of circular data (radians). If None, computes pairwise distances within `x` itself.	`None`
`metric`	`str`	Distance metric to use (same options as `circ_dist`).	`'center'`
`return_sum`	`bool`	If True, returns the sum of all computed distances (like R's `dist.circular()`).	`False`

Returns:

Type	Description
`ndarray`	Pairwise distance matrix where entry (i, j) is the circular distance between x[i] and y[j] based on the chosen metric.

Source code in pycircstat2/descriptive.py

def circ_pairdist(
    x: np.ndarray,
    y: Optional[np.ndarray] = None,
    metric: str = "center",
    return_sum: bool = False,
) -> Union[np.ndarray, float]:
    r"""
    All-pairs circular distance between the elements of `x` and `y`.

    Parameters
    ----------
    x : array-like
        First sample of circular data (radians).
    y : array-like, optional
        Second sample of circular data (radians). When omitted, the pairs are
        formed within `x` itself.
    metric : str, optional
        Distance metric, passed through to `circ_dist`.
    return_sum : bool, optional
        Passed through to `circ_dist`; if True the sum of all pairwise
        distances is returned (like R's `dist.circular()`).

    Returns
    -------
    ndarray or float
        Matrix whose entry (i, j) is the distance between x[i] and y[j] under
        the chosen metric, or the sum of that matrix if `return_sum`.
    """
    rows = np.asarray(x)
    cols = rows if y is None else np.asarray(y)

    # A column of x against a row of y broadcasts to the full (n, m) grid.
    return circ_dist(
        rows[:, np.newaxis],
        cols[np.newaxis, :],
        metric=metric,
        return_sum=return_sum,
    )

`convert_moment(mp)`

Convert complex moment to polar coordinates.

Parameters:

Name	Type	Description	Default
`mp`	`complex`	Complex moment	required

Returns:

Name	Type	Description
`u`	`float`	Angle in radian
`r`	`float`	Magnitude

Source code in pycircstat2/descriptive.py

def convert_moment(
    mp: complex,
) -> Tuple[float, float]:
    """
    Express a complex moment as an (angle, magnitude) pair.

    Parameters
    ----------
    mp: complex
        Complex moment

    Returns
    -------
    u: float
        Argument of `mp` in radian, after being passed through `angmod`
    r: float
        Modulus of `mp`

    """

    magnitude = np.abs(mp)
    raw_angle = float(np.angle(mp))
    direction = float(angmod(raw_angle))

    return direction, magnitude

`compute_C_and_S(alpha, w, p=1, mean=0.0)`

Compute the intermediate values Cbar and Sbar.

\[ \displaylines{ \bar{C}_{p} = \frac{\sum_{i=1}^{n} w_{i} \cos(p(\alpha_{i} - \mu))}{n} \\ \bar{S}_{p} = \frac{\sum_{i=1}^{n} w_{i} \sin(p(\alpha_{i} - \mu))}{n} } \]

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian.	required
`w`	`ndarray`	Frequencies or weights.	required
`p`	`int`	Order of the moment (default is 1, for the first moment).	`1`
`mean`	`Union[float, ndarray]`	Mean angle (μ) to center the computation (default is 0.0).	`0.0`

Returns:

Name	Type	Description
`Cbar`	`float`	Weighted mean cosine for the given moment.
`Sbar`	`float`	Weighted mean sine for the given moment.

Source code in pycircstat2/descriptive.py

def compute_C_and_S(
    alpha: np.ndarray,
    w: np.ndarray,
    p: int = 1,
    mean: Union[float, np.ndarray] = 0.0,
) -> Tuple[float, float]:
    r"""
    Weighted mean cosine and sine of the (centred) angles for the p-th moment.

    $$
    \displaylines{
    \bar{C}_{p} = \frac{\sum_{i=1}^{n} w_{i} \cos(p(\alpha_{i} - \mu))}{n} \\
    \bar{S}_{p} = \frac{\sum_{i=1}^{n} w_{i} \sin(p(\alpha_{i} - \mu))}{n}
    }
    $$

    Here the denominator $n$ is the sum of the weights `w`.

    Parameters
    ----------
    alpha: np.ndarray
        Angles in radian.
    w: np.ndarray
        Frequencies or weights.
    p: int, optional
        Order of the moment (default is 1, for the first moment).
    mean: float, optional
        Angle (μ) subtracted from `alpha` before the moment is taken
        (default is 0.0).

    Returns
    -------
    Cbar: float
        Weighted mean cosine for the given moment.
    Sbar: float
        Weighted mean sine for the given moment.
    """
    total_weight = np.sum(w)
    phase = p * (alpha - mean)

    cos_part = np.sum(w * np.cos(phase))
    sin_part = np.sum(w * np.sin(phase))

    return cos_part / total_weight, sin_part / total_weight

`compute_hdi(samples, ci=0.95)`

Compute the Highest Density Interval (HDI) for circular data.

Parameters:

Name	Type	Description	Default
`samples`	`ndarray`	Bootstrap samples of the circular mean in radians.	required
`ci`	`float`	Credible interval (default is 0.95 for 95% HDI).	`0.95`

Returns:

Name	Type	Description
`hdi`	`tuple`	Lower and upper bounds of the HDI in radians.

Source code in pycircstat2/descriptive.py

def compute_hdi(samples: np.ndarray, ci: float = 0.95) -> tuple[float, float]:
    """
    Compute the Highest Density Interval (HDI) for circular data.

    The samples are wrapped and sorted, and every arc that starts at one
    sample and ends `floor(ci * n)` samples further along the circle is
    considered, including arcs that pass through the 0 / 2π seam. The
    shortest such arc is returned.

    Parameters
    ----------
    samples : np.ndarray
        Bootstrap samples of the circular mean in radians.
    ci : float, optional
        Credible interval (default is 0.95 for 95% HDI). Must lie in (0, 1].

    Returns
    -------
    hdi : tuple
        Lower and upper bounds of the HDI in radians. When the shortest arc
        crosses the seam, the lower bound is numerically larger than the
        upper bound.

    Raises
    ------
    ValueError
        If `ci` is outside (0, 1], or if there are too few samples for the
        requested interval (`floor(ci * n) == 0`).
    """
    if not 0 < ci <= 1:
        raise ValueError("`ci` must be in the interval (0, 1].")

    # Wrap samples for circular consistency, then sort them.
    # NOTE(review): the seam handling below assumes `angmod` maps onto one
    # full turn starting at 0, as the original comment states -- confirm.
    sorted_samples = np.sort(np.asarray(angmod(samples), dtype=float))

    n_samples = len(sorted_samples)
    interval_idx = int(np.floor(ci * n_samples))
    if interval_idx == 0:
        raise ValueError("Insufficient data to compute HDI.")

    # An arc can span at most all n samples (n - 1 steps); this keeps
    # ci == 1.0 well-defined instead of leaving the result unbound.
    span = min(interval_idx, n_samples - 1)

    start = np.arange(n_samples)
    stop = start + span
    crosses_seam = stop >= n_samples

    # Arc length from each start sample to its end sample. Arcs that run
    # past the last sorted sample continue from the first one, so one full
    # turn is added to their (non-positive) raw difference.
    widths = sorted_samples[stop % n_samples] - sorted_samples
    widths[crosses_seam] += 2 * np.pi

    # argmin returns the first minimum, matching a strict `<` scan in which
    # the non-wrapping arcs are visited first.
    best = int(np.argmin(widths))
    lower = float(sorted_samples[best])
    upper = float(sorted_samples[stop[best] % n_samples])

    return lower, upper

`compute_smooth_params(r, n)`

Parameters:

Name	Type	Description	Default
`r`	`float`	resultant vector length	required
`n`	`int`	sample size	required

Returns:

Name	Type	Description
`h`	`float`	smoothing parameter

Reference

Section 2.2 (P26, Fisher, 1993)

Source code in pycircstat2/descriptive.py

def compute_smooth_params(r: float, n: int) -> float:
    """
    Derive the smoothing parameter from the resultant length and sample size.

    Parameters
    ----------
    r: float
        resultant vector length
    n: int
        sample size

    Returns
    -------
    h: float
        smoothing parameter

    Reference
    ---------
    Section 2.2 (P26, Fisher, 1993)
    """

    concentration = circ_kappa(r, n)
    inv_sqrt_kappa = 1 / np.sqrt(concentration)  # eq 2.3

    # eq 2.4
    return np.sqrt(7) * inv_sqrt_kappa / np.power(n, 0.2)

`nonparametric_density_estimation(alpha, h, radius=1)`

Nonparametric density estimates with a quartic kernel function.

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radian	required
`h`	`float`	Smoothing parameters	required
`radius`	`float`	radius of the plotted circle	`1`

Returns:

Name	Type	Description
`x`	`ndarray(100)`	grid
`f`	`ndarray(100)`	density

Reference

Section 2.2 (P26, Fisher, 1993)

Source code in pycircstat2/descriptive.py

def nonparametric_density_estimation(
    alpha: np.ndarray,  # angles in radian
    h: float,  # smoothing parameters
    radius: float = 1,  # radius of the plotted circle
) -> tuple:
    """Quartic-kernel nonparametric density estimate on a
    fixed grid of 100 points spanning 0 to 2π.

    Parameters
    ----------
    alpha: np.ndarray (n, )
        Angles in radian
    h: float
        Smoothing parameters
    radius: float
        radius of the plotted circle

    Returns
    -------
    x: np.ndarray (100, )
        grid
    f: np.ndarray (100, )
        density, transformed as ``radius * sqrt(1 + pi * f) - radius``

    Reference
    ---------
    Section 2.2 (P26, Fisher, 1993)
    """

    n_obs = len(alpha)
    grid = np.linspace(0, 2 * np.pi, 100)

    # Shorter-way-round distance from every grid point to every observation,
    # capped at h so that the kernel term below is zero beyond the bandwidth.
    gap = np.abs(grid[:, None] - alpha)
    arc = np.minimum(gap, 2 * np.pi - gap)
    capped = np.minimum(arc, h)

    kernel_total = np.sum((1 - capped**2 / h**2) ** 2, 1)
    density = 0.9375 * kernel_total / n_obs / h

    scaled = radius * np.sqrt(1 + np.pi * density) - radius

    return grid, scaled

`circ_range(alpha)`

Compute the circular range of angular data.

The circular range is the difference between the maximum and minimum angles in the dataset, adjusted for circular continuity.

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Angles in radians.	required

Returns:

Type	Description
`float`	Circular range, a measure of clustering (smaller = more clustered).

Reference

P162, Section 7.2.3 of Jammalamadaka, S. Rao and SenGupta, A. (2001)

Source code in pycircstat2/descriptive.py

def circ_range(alpha: np.ndarray) -> np.float64:
    """
    Compute the circular range of angular data.

    The angles are reduced modulo 2π and sorted; the result is 2π minus the
    largest gap between neighbouring angles, where the gap from the last
    angle back round to the first is included.

    Parameters
    ----------
    alpha : np.ndarray
        Angles in radians.

    Returns
    -------
    float
        Circular range (2π minus the largest spacing).

    Reference
    ---------
    P162, Section 7.2.3 of Jammalamadaka, S. Rao and SenGupta, A. (2001)
    """
    full_turn = 2 * np.pi
    ordered = np.sort(alpha % full_turn)

    # Prepending the last angle shifted back by one turn makes the first
    # difference the wrap-around gap between the last and first angles.
    wrap_anchor = ordered[-1] - full_turn
    gaps = np.diff(ordered, prepend=wrap_anchor)

    largest_gap = np.max(gaps)
    return full_turn - largest_gap

`circ_quantile(alpha, probs=np.array([0, 0.25, 0.5, 0.75, 1.0]), type=7)`

Compute quantiles for circular data.

This function computes quantiles for circular data by shifting the data to be centered around the circular median, applying a linear quantile function, and then shifting back.

Parameters:

Name	Type	Description	Default
`alpha`	`ndarray`	Sample of circular data (radians).	required
`probs`	`float or ndarray`	Probabilities at which to compute quantiles. Default is `[0, 0.25, 0.5, 0.75, 1.0]`.	`array([0, 0.25, 0.5, 0.75, 1.0])`
`type`	`int`	Quantile algorithm type (default `7`, matches R’s default quantile type).	`7`

Returns:

Type	Description
`ndarray`	Circular quantiles.

References

R's quantile.circular from the circular package.
Fisher (1993), Section 2.3.2.

Source code in pycircstat2/descriptive.py

def circ_quantile(
    alpha: np.ndarray,
    probs: Union[float, np.ndarray] = np.array([0, 0.25, 0.5, 0.75, 1.0]),
    type: int = 7,
) -> np.ndarray:
    """
    Compute quantiles for circular data.

    This function computes quantiles for circular data by shifting the
    data to be centered around the circular median, applying a linear quantile function,
    and then shifting back.

    Parameters
    ----------
    alpha : np.ndarray
        Sample of circular data (radians).
    probs : float or np.ndarray, optional
        Probabilities at which to compute quantiles. Default is `[0, 0.25, 0.5, 0.75, 1.0]`.
    type : int, optional
        Quantile algorithm type (default `7`, matches R’s default quantile type).
        `7` selects NumPy's "linear" method; any other value selects "midpoint".

    Returns
    -------
    np.ndarray
        Circular quantiles, reduced modulo 2π. All NaN (float dtype) when the
        circular median is NaN.

    References
    ----------
    - R's `quantile.circular` from the `circular` package.
    - Fisher (1993), Section 2.3.2.
    """

    # Convert to numpy array
    alpha = np.asarray(alpha)
    probs = np.atleast_1d(probs)

    # Compute circular median
    circular_median = circ_median(alpha)

    # If the median is NaN (e.g., uniform data), return NaNs.
    # np.full with the default float dtype is used rather than np.full_like,
    # which would inherit an integer dtype from e.g. probs=[0, 1] and could
    # not represent NaN.
    if np.isnan(circular_median):
        return np.full(probs.shape, np.nan)

    # Transform data relative to circular median, onto (-π, π]
    shifted_alpha = (alpha - circular_median) % (2 * np.pi)
    shifted_alpha = np.where(
        shifted_alpha > np.pi, shifted_alpha - 2 * np.pi, shifted_alpha
    )

    # Compute linear quantiles on transformed data
    linear_quantiles = np.quantile(
        shifted_alpha, probs, method="linear" if type == 7 else "midpoint"
    )

    # Transform back to original circular space
    circular_quantiles = (linear_quantiles + circular_median) % (2 * np.pi)

    return circular_quantiles