emod_analysis

`binom_vec(yobs, ysim)`

Source code in local_python/py_assets_common/emod_analysis.py

def binom_vec(yobs, ysim):
    '''
    Sum a binomial log-likelihood over paired count data.

    For entry ``i`` the event probability is ``1 - ysim[i]``, capped from
    above at ``1 - 1e-7``. Entries whose total ``N`` is zero contribute
    nothing. When the count ``k`` lies strictly between 0 and ``N`` the
    binomial coefficient is replaced by its Stirling approximation; the
    ``k == 0`` and ``k == N`` cases are evaluated exactly.

    Args:
        yobs: Pair of sequences; ``yobs[0]`` holds the counts (k) and
            ``yobs[1]`` holds the matching totals (N).

        ysim: Sequence of simulated values, indexed in step with the counts.

    Returns:
        Total log-likelihood summed over the entries with non-zero ``N``.

    Raises:
        Exception: If the data are impossible under the probability (a
            probability of exactly 0 with ``k > 0``, or of exactly 1 with
            ``k < N``).
    '''

    counts = yobs[0]
    totals = yobs[1]
    loglik = 0

    for idx, k in enumerate(counts):
        # Probability is the complement of the simulated value, kept below 1
        p = min(1-ysim[idx], 1-1e-7)
        N = totals[idx]

        # Nothing was observed for this entry
        if (N == 0):
            continue

        impossible = (p == 0 and k > 0) or (p == 1 and k < N)
        if impossible:
            raise Exception('Bad binomial data')

        if (k == 0):
            # Binomial coefficient is 1; only the (1-p)^N factor remains
            loglik = loglik + N*np.log(1-p)
        elif (k == N):
            # Binomial coefficient is 1; only the p^k factor remains
            loglik = loglik + k*np.log(p)
        else:
            # Interior case: Stirling approximation for ln C(N, k)
            loglik += k*np.log(p+1e-10) + (N-k)*np.log(1-p+1e-10) + \
                N*np.log(N/(N-k)) - k*np.log(k/(N-k)) + \
                0.5*np.log(N/k/2/np.pi/(N-k))

    return loglik

`gauss_opt(yobs, ysim)`

Source code in local_python/py_assets_common/emod_analysis.py

def gauss_opt(yobs, ysim):
    '''
    Gaussian log-likelihood of observed fractions, maximized over a noise
    scale factor.

    Observed fractions ``yobs[0]/yobs[1]`` are compared with simulated
    fractions ``ysim[0]/ysim[1]``. Entries whose observed denominator is not
    positive are dropped. Each remaining entry is assigned a variance of
    ``yscal**2 / N``, and ``log(yscal)`` is found by a step-limited Newton
    iteration on the derivatives returned by `gauss_vec`.

    Args:
        yobs: Pair of sequences; numerators (k) then denominators (N).

        ysim: Pair of sequences; simulated numerators then denominators.

    Returns:
        llik: Log-likelihood from the last `gauss_vec` evaluation.

        yscal: Fitted scale factor.

    Raises:
        RuntimeError: If the Newton step becomes NaN or the iteration does
            not converge. This happens, for example, when every residual is
            exactly zero and the likelihood has no finite maximum.
    '''

    k = np.array(yobs[0])
    N = np.array(yobs[1])
    mu = np.array(ysim[0])/(np.array(ysim[1])+EPS)
    x = k/(N+EPS)

    valid = N > 0
    sig2 = 1.0/N[valid]
    dmu2 = np.power(x-mu, 2.0)[valid]

    lyscal = 0.0
    max_iter = 10000  # Far above what a converging fit needs

    for _ in range(max_iter):
        (llik, G, H) = gauss_vec(dmu2, sig2, np.exp(lyscal))

        # H is a negated sum of non-negative terms, so it is never positive.
        # Subtract EPS (assumed to be a small positive constant) so the
        # guard keeps the denominator away from zero without flipping its
        # sign and reversing the step direction.
        sstptot = G/(H-EPS)

        # A NaN step can never satisfy the convergence test below
        if (np.isnan(sstptot)):
            raise RuntimeError('gauss_opt: Newton step is NaN; '
                               'scale factor cannot be estimated.')

        # Step size control
        if (abs(sstptot) > 5.0):
            sstptot = np.sign(sstptot)*5.0

        lyscal = lyscal - sstptot

        if (abs(sstptot) < 1.0e-4):
            return (llik, np.exp(lyscal))

    raise RuntimeError('gauss_opt: Newton iteration did not converge.')

`gauss_vec(dmu2, sig2, yscal=1.0)`

Source code in local_python/py_assets_common/emod_analysis.py

def gauss_vec(dmu2, sig2, yscal=1.0):
    '''
    Evaluate a Gaussian log-likelihood and its derivatives in log(yscal).

    Each variance in ``sig2`` is multiplied by ``yscal**2`` before use.

    Args:
        dmu2: Squared residuals.

        sig2: Variances matching ``dmu2``, before scaling.

        yscal: Multiplier applied to the standard deviations.

    Returns:
        llik: Summed Gaussian log-likelihood.

        G: First derivative of ``llik`` with respect to ``log(yscal)``.

        H: Second derivative of ``llik`` with respect to ``log(yscal)``.
    '''

    # Squared residuals in units of the scaled variance
    scaled_sq = dmu2/(sig2*yscal*yscal)
    log_norm = np.log(2*np.pi*sig2*yscal*yscal)

    llik = -0.5*np.sum(scaled_sq + log_norm)
    G = 1.0*np.sum(scaled_sq-1.0)
    H = -2.0*np.sum(scaled_sq)

    return (llik, G, H)

`multinom_vec(yobs, ysim)`

Source code in local_python/py_assets_common/emod_analysis.py

def multinom_vec(yobs, ysim):
    '''
    Multinomial log-likelihood of observed counts given simulated values,
    using Stirling's approximation for the factorial terms.

    A small offset (0.1) is added to every simulated value so no category has
    zero weight; category probabilities are the offset values divided by
    their total. Negative observations are excluded together with their
    simulated values. A zero observation adds nothing to the log terms but
    its simulated value still counts toward the normalizing total.

    Args:
        yobs: Sequence of observed counts. Negative entries are skipped.

        ysim: Sequence of simulated values, indexed in step with ``yobs``.

    Returns:
        Approximate multinomial log-likelihood; 0.0 when no positive count
        was observed.
    '''

    mlam = 0.1  # Offset keeping simulated weights strictly positive
    lliktot = 0.0
    yobstot = 0.0
    ysimtot = 0.0

    for k1, obs in enumerate(yobs):
        yobsval = float(obs)
        ysimval = float(ysim[k1])

        # Negative (or NaN) observations are left out entirely
        if not (yobsval >= 0):
            continue

        ysimtot = ysimtot + ysimval + mlam

        # k*ln(p/k) -> 0 as k -> 0 and ln(0!) = 0, so a zero count has no
        # log contribution; evaluating the expression would divide by zero.
        if (yobsval > 0):
            lliktot = lliktot + yobsval*np.log((ysimval + mlam)/yobsval) \
                              - 0.5*np.log(2.0*np.pi*yobsval)
            yobstot = yobstot + yobsval

    if (yobstot > 0):
        lliktot = lliktot + yobstot*np.log(yobstot/ysimtot) + \
                              0.5*np.log(2.0*np.pi*yobstot)

    return lliktot

`norpois_opt(yobs, ysim)`

Preferred entry point for the `norpois_vec` function, which calculates a Poisson-based estimate of log-likelihood for a timeseries. This function determines the coefficients of the scale factor by maximizing the log-likelihood.

Maximum-likelihood scale factor coefficients may take unreasonable values (e.g., reporting rates greater than 100%). Unreasonable scaling coefficients occur when simulation outcomes are a very poor match to observed values.

Parameters:

Name	Type	Description	Default
`yobs`	`list[float]`	List of observed timeseries values.	required
`ysim`	`list[float]`	List of simulated timeseries values. May be longer than the list of observed values.	required

Returns:

Name	Type	Description
`Ltot`	`float`	Calculated log-likelihood estimator.
`pvec`	`[float, float]`	The [mval, bval] parameters that maximize the log-likelihood.

Source code in local_python/py_assets_common/emod_analysis.py

def norpois_opt(yobs: list[float], ysim: list[float]):
    '''
    Preferred entry point for the `norpois_vec` function, which calculates a
    Poisson-based estimate of log-likelihood for a timeseries. This function
    determines the coefficients of the scale factor by maximizing the
    log-likelihood with repeated Newton steps.

    Maximum-likelihood scale factor coefficients may take unreasonable
    values (e.g., reporting rates greater than 100%). Unreasonable scaling
    coefficients occur when simulation outcomes are a very poor match to
    observed values.

    Args:
        yobs: List of observed timeseries values.

        ysim: List of simulated timeseries values. May be longer than
            the list of observed values.

    Returns:
        Ltot (float): Calculated log-likelihood estimator.

        pvec ([float, float]): The [mval, bval] parameters that maximize the
            log-likelihood.

    Raises:
        ValueError: If ``ysim`` is shorter than ``yobs``.

        RuntimeError: If the Newton step becomes NaN (for example after the
            scale factor overflows) or the iteration does not converge.
    '''

    # May have more simulated outcomes than observed outcomes
    if (len(ysim) < len(yobs)):
        raise ValueError("Simulation vector is too short.")

    max_iter = 10000  # Far above what a converging fit needs
    x = np.zeros((2, 1))

    for _ in range(max_iter):
        (Ltot, dval) = norpois_vec(yobs, ysim, x[0, 0], x[1, 0])

        dmag = np.max(np.abs(dval))

        # A NaN step propagates into every later evaluation, so the
        # convergence check below could never succeed
        if (np.isnan(dmag)):
            raise RuntimeError("norpois_opt: Newton step is NaN; "
                               "scale factor cannot be estimated.")

        # Convergence check
        if (dmag < 1.0e-5):
            pvec = [float(x[0, 0]), float(x[1, 0])]
            return (Ltot, pvec)

        x = x - dval

    raise RuntimeError("norpois_opt: Newton iteration did not converge.")

`norpois_vec(yobs, ysim, mval=0.0, bval=0.0)`

Poisson-based estimation of log-likelihood for a timeseries. The vector of observed values is used as the occurrences (k) and the vector of simulated values is used as the rates (lam). Stirling's approximation is applied to the factorial term: $\ln P = k\,\ln(\mathrm{lam}/k) - \mathrm{lam} + k - 0.5\,\ln(2\pi k)$

A small positive value is added to the simulated rates so they are never exactly zero. The adjusted rates are then modified by a scale factor that represents the case to infection ratio. Scale factor adjustments have an exp(m*x + b) form that allows for changes over time. The values in the timeseries are assumed to be equally spaced, so the x value in the scale factor is the index of the value in the vector: $\mathrm{lam} = (\mathrm{ysim} + \mathrm{delt})\,\exp(\mathrm{mval}\cdot x + \mathrm{bval})$ and $k = \mathrm{yobs}$.

First and second derivatives of probability with respect to mval and bval coefficients in the scale factor are also calculated.

Parameters:

Name	Type	Description	Default
`yobs`	`list[float]`	List of observed timeseries values.	required
`ysim`	`list[float]`	List of simulated timeseries values. May be longer than the list of observed values.	required
`mval`	`float`	Linear parameter in scale factor calculations.	`0.0`
`bval`	`float`	Constant parameter in scale factor calculations.	`0.0`

Returns:

Name	Type	Description
`Ltot`	`float`	Calculated log-likelihood estimator.
`dval`	`[float, float]`	Estimated Newton-step to adjust [mval, bval] parameters when maximizing log-likelihood.

Source code in local_python/py_assets_common/emod_analysis.py

def norpois_vec(yobs: list[float], ysim: list[float],
                mval: float = 0.0, bval: float = 0.0):
    '''
    Poisson log-likelihood of a timeseries, plus the Newton step for the
    scale factor coefficients.

    Observed values are the occurrences (k) and simulated values give the
    rates (lam). For positive k the factorial is replaced by Stirling's
    approximation:
        ln P = k*ln(lam/k) - lam + k - 0.5*ln(2*pi*k)
    For k equal to zero the exact value ``ln P = -lam`` is used. Observed
    values that are neither positive nor zero are skipped.

    The rate at index ``x`` is the simulated value plus a small positive
    offset (so it is never exactly zero), multiplied by a scale factor of
    the form `exp(m*x + b)`:
        lam = (ysim + delt)*exp(mval*x + bval)
    The index is used as ``x``, so values are treated as equally spaced.

    The gradient and Hessian of the log-likelihood with respect to `mval`
    and `bval` are accumulated alongside the total.

    Args:
        yobs: List of observed timeseries values.

        ysim: List of simulated timeseries values. May be longer than
            the list of observed values.

        mval: Linear parameter in scale factor calculations.

        bval: Constant parameter in scale factor calculations.

    Returns:
        Ltot (float): Calculated log-likelihood estimator.

        dval ([float, float]): Estimated Newton-step to adjust [mval, bval]
            parameters when maximizing log-likelihood; a (2, 1) array
            solving ``Hessian @ dval = gradient``.
    '''

    delt = 0.01  # Small positive value (FLT_EPS is way too small)

    loglik = 0.0
    grad = np.zeros((2, 1))
    hess = np.zeros((2, 2))

    # Each timeseries value is evaluated serially
    for idx, obs in enumerate(yobs):
        k = float(obs)
        lam = (float(ysim[idx]) + delt)*np.exp(mval*idx + bval)

        if (k > 0):
            loglik += k*np.log(lam/k) - lam + \
                      k - 0.5*np.log(2.0*np.pi*k)
        elif (k == 0):
            loglik += -lam
        else:
            # Neither positive nor zero: not part of the likelihood
            continue

        # Derivatives share one form; the k terms vanish when k is zero
        grad[0, 0] += k*idx - lam*idx
        grad[1, 0] += k - lam

        hess[0, 0] += -lam*idx*idx
        hess[0, 1] += -lam*idx
        hess[1, 0] += -lam*idx
        hess[1, 1] += -lam

    dval = np.linalg.solve(hess, grad)

    return (loglik, dval)