Source code for pwkit.kbn_conf

# -*- mode: python; coding: utf-8 -*-
# Copyright 2014 Peter Williams <peter@newton.cx> and collaborators.
# Licensed under the MIT License.

"""pwkit.kbn_conf - calculate Poisson-like confidence intervals assuming a background

This module implements the Bayesian confidence intervals for Poisson processes
in a background using the approach described in Kraft, Burrows, & Nousek
(1991). That paper provides tables of values; this module can calculate
intervals for arbitrary inputs. Requires `scipy`.

This implementation almost directly transcribes the equations. We do, however,
work in log-gamma space to try to avoid overflows with large values of N or B.

Functions:

kbn_conf     - Compute a single confidence limit.
vec_kbn_conf - Vectorized version of `kbn_conf`.

TODO: tests!

"""
from __future__ import absolute_import, division, print_function, unicode_literals

__all__ = str("kbn_conf vec_kbn_conf").split()

from numpy import exp, log, vectorize
from scipy.special import gammaln
from scipy.integrate import quad
from scipy.optimize import newton


def _cconst(N, B):
    s = 0.0
    lnb = log(B)

    for n in range(N + 1):
        s += exp(-B + n * lnb - gammaln(n + 1))

    return 1.0 / s


def _fcnb(C, N, B, S):
    return C * exp(-(S + B) + N * log(S + B) - gammaln(N + 1))


def _fnb(N, B, S):
    return _fcnb(_cconst(N, B), N, B, S)


[docs] def kbn_conf(N, B, CL): """Given a (integer) number of observed Poisson events `N` and a (real) expected number of background events `B` and a confidence limit `CL` (between 0 and 1), return the confidence interval on the source event rate. Returns: (Smin, Smax) This interval is calculated using the Bayesian formalism of Kraft, Burrows, & Nousek (1991), which assumes no uncertainty in `B` and returns the smallest possible interval that satisfies the above properties. Example: in a certain time interval, 3 events were recorded. Based on external knowledge, it is expected that on average 0.5 background events will be recorded in the same interval. The 95% confidence interval on the source event rate is >>> kbn_conf.kbn_conf (3, 0.5, 0.95) <<< (0.22156, 7.40188) which agrees with the entry in Table 2 of KBN91. Reference info: 1991ApJ...374..344K, doi:10.1086/170124 """ tol = 1e-6 origN = N try: N = int(N) assert N == origN except Exception: raise ValueError("N must be an integer") CL = float(CL) if CL <= 0.0 or CL >= 1.0: raise ValueError("CL must be between 0 and 1, noninclusive") B = float(B) if B < 0: raise ValueError("B must be nonnegative") # OK, arg-checking is out of the way. Precompute some things ... C = _cconst(N, B) f = lambda s: _fcnb(C, N, B, s) # The goal is find Smin and Smax such that the integral of _fnb between # Smin and Smax is CL, and _fnb (Smin) = _fnb (Smax). Follow the # suggestion in Kraft, Burrows, & Nousek (1991) and start at the # maximum-probability value, integrating outwards trying to maintain the # constraints. We have to be careful because smin cannot go below zero, # and to ignore the enormous typo ("local maximum at S = B + N"!) in the # paper! smin = smax = max(N - B, 0.0) fmin = f(smin) fmax = f(smax) conf = 0.0 while conf < CL: if smin == 0.0 or fmin < fmax: stepsize = max(0.2 * abs(CL - conf) / CL / fmax, tol) conf += quad(f, smax, smax + stepsize)[0] smax += stepsize fmax = f(smax) else: stepsize = max(min(0.2 * abs(CL - conf) / CL / fmin, 0.1 * smin), tol) if smin - stepsize < tol: conf += quad(f, 0, smin)[0] smin = 0.0 else: conf += quad(f, smin - stepsize, smin)[0] smin -= stepsize fmin = f(smin) return smin, smax
vec_kbn_conf = vectorize( kbn_conf, otypes=[float, float], doc="""Vectorized form of `kbn_conf`. All three inputs must be broadcastable to a common shape.""", )