splineknots.py

import numpy as _N
import patsy
#import LOST.utilities as _U
import ka_tools.utilities as _U
import matplotlib.pyplot as _plt
from LOST.utildirs import setFN
from filter import gauKer

v = 5
c = 5
def genKnts(tscl, xMax):
    """
    generate a set of knots for history term.
    """
    knts = _N.empty(6)
    ck   = 0   #  current knot
    TSCL = int(1.5*tscl)
    knts[0:3] = TSCL *_N.random.rand(3)
    knts[3:]  = TSCL + (xMax - TSCL)*_N.random.rand(3)
    return _N.sort(knts)

# def hazzard(dt, TR, bindat, tsclPct=0.85):
#     ####  Suggest knots for history term

#     isis    = _U.fromBinDat(bindat, ISIs=True)
#     ecdf    = _sma.distributions.ECDF(isis)
#     xs      = _N.arange(0, max(isis))        #  in units of ms.
#     cdf     = ecdf(_N.arange(0, max(isis)))  # value of cdf from [0, 1)
#     tscl    = _N.where(cdf > tsclPct)[0][0]
#     dt      = 0.001

#     S  = 1 - cdf

#     haz = -(_N.diff(S) / (0.5*(S[0:-1]+S[1:])))/dt   #  Units of Hz
#     #  defined on xs[0:-1]
#     haz[_N.where(haz == 0)[0]] = 0.0001    #  need this because log
#     #  rough frequency
#     #nSpks = len(isis) + TR
#     #Hz = float(nSpks) / (TR*N*dt)
#     nhaz = haz / _N.mean(haz[int(1.5*tscl):int(2.5*tscl)])  #  

#     #nhaz = haz / Hz
#     return xs, nhaz, tscl


# def suggestHistKnots(dt, TR, bindat, tsclPct=0.85, outfn="fittedL2.dat"):
#     global v, c
#     xs, nhaz, tscl = hazzard(dt, TR, bindat, tsclPct=tsclPct)

#     ITERS   = 1000
#     allKnts = _N.empty((ITERS, 6))
#     r2s    = _N.empty(ITERS)

#     ac = _N.zeros(c)
#     for tr in range(ITERS):
#         bGood = False
#         while not bGood:
#             knts = genKnts(tscl, xs[-1]*0.9)

#             B  = patsy.bs(xs[0:-1], knots=knts, include_intercept=True)

#             Bc = B[:, v:];   Bv = B[:, 0:v]

#             try:
#                 iBvTBv = _N.linalg.inv(_N.dot(Bv.T, Bv))
#                 bGood = True
#             except _N.linalg.linalg.LinAlgError:
#                 print "Linalg Error"

#         av = _N.dot(iBvTBv, _N.dot(Bv.T, _N.log(nhaz) - _N.dot(Bc, ac)))
#         a = _N.array(av.tolist() + ac.tolist())

#         #  Now fit where the last few nots are fixed
#         splFt          = _N.exp(_N.dot(B, a))
#         df             = nhaz - splFt
#         r2s[tr]        = _N.dot(df[0:int(tscl)], df[0:int(tscl)])
#         allKnts[tr, :] = knts

#     bstKnts = allKnts[_N.where(r2s == r2s.min())[0][0], :]

#     B  = patsy.bs(xs[0:-1], knots=bstKnts, include_intercept=True)
#     Bc = B[:, v:];   Bv = B[:, 0:v]
#     iBvTBv = _N.linalg.inv(_N.dot(Bv.T, Bv))
#     av = _N.dot(iBvTBv, _N.dot(Bv.T, _N.log(nhaz) - _N.dot(Bc, ac)))
#     a = _N.array(av.tolist() + ac.tolist())
#     #  Now fit where the last few nots are fixed
#     lmd2          = _N.exp(_N.dot(B, a))

#     return bstKnts, lmd2, nhaz, tscl

# def suggestHistKnotsFromLam(xs, nhaz, outfn="fittedL2.dat"):
#     global v, c

#     ITERS   = 1000
#     allKnts = _N.empty((ITERS, 6))
#     r2s    = _N.empty(ITERS)

#     ac = _N.zeros(c)
#     for tr in range(ITERS):
#         bGood = False
#         while not bGood:
#             knts = genKnts(tscl, xs[-1]*0.9)

#             B  = patsy.bs(xs[0:-1], knots=knts, include_intercept=True)

#             Bc = B[:, v:];   Bv = B[:, 0:v]

#             try:
#                 iBvTBv = _N.linalg.inv(_N.dot(Bv.T, Bv))
#                 bGood = True
#             except _N.linalg.linalg.LinAlgError:
#                 print "Linalg Error"

#         av = _N.dot(iBvTBv, _N.dot(Bv.T, _N.log(nhaz) - _N.dot(Bc, ac)))
#         a = _N.array(av.tolist() + ac.tolist())

#         #  Now fit where the last few nots are fixed
#         splFt          = _N.exp(_N.dot(B, a))
#         df             = nhaz - splFt
#         r2s[tr]        = _N.dot(df[0:int(tscl)], df[0:int(tscl)])
#         allKnts[tr, :] = knts

#     bstKnts = allKnts[_N.where(r2s == r2s.min())[0][0], :]

#     B  = patsy.bs(xs[0:-1], knots=bstKnts, include_intercept=True)
#     Bc = B[:, v:];   Bv = B[:, 0:v]
#     iBvTBv = _N.linalg.inv(_N.dot(Bv.T, Bv))
#     av = _N.dot(iBvTBv, _N.dot(Bv.T, _N.log(nhaz) - _N.dot(Bc, ac)))
#     a = _N.array(av.tolist() + ac.tolist())
#     #  Now fit where the last few nots are fixed
#     lmd2          = _N.exp(_N.dot(B, a))

#     return bstKnts, lmd2, nhaz, tscl


def suggestPSTHKnots(dt, TR, N, bindat, bnsz=10, psth_knts=10, psth_run=False):
    """
    bnsz   binsize used to calculate approximate PSTH
    """
    rszd = False
    if N % bnsz != 0:
        rszd = True
        pcs = _N.ceil(N/bnsz)
        bnsz = int(_N.floor(N / pcs))

    spkts  = _U.fromBinDat(bindat, SpkTs=True)

    #  apsth needs to be same size as N.  ie N%bnsz needs to be 0
    h, bs = _N.histogram(spkts, bins=_N.linspace(0, N, (N//bnsz)+1))

    fs     = (h / (TR * bnsz * dt))
    _apsth = _N.repeat(fs, bnsz)    #    piecewise boxy approximate PSTH
    if rszd:
        apsth = _N.zeros(N)
        apsth[0:(N//bnsz)*bnsz] = _apsth
        apsth[(N//bnsz)*bnsz:]  = apsth[(N//bnsz)*bnsz-1]
    else:
        apsth = _apsth

    apsth *= dt
    gk = gauKer(5) 
    gk /= _N.sum(gk)
    f_apsth = _N.convolve(apsth, gk, mode="same")
    dpsth_pctl = _N.cumsum(_N.abs(_N.diff(f_apsth)))
    dpsth_pctl /= dpsth_pctl[-1]
    dpsth_pctl[0] = 0

    ITERS = 40
    x     = _N.linspace(0., N-1, N, endpoint=False)  # in units of ms.
    r2s   = _N.empty(ITERS)
    best_r2s = _N.zeros(5)

    for iknts in range(5, 6):
        allKnts = _N.empty((ITERS, iknts))
        allCoeffs  = []

        tAvg  = 1./iknts
        tsMin = tAvg*0.5
        tsMax = tAvg*1.5

        for it in range(ITERS):
            knt_inds = _N.zeros(iknts+1)
            bGood = False
            while not bGood:
                try:
                    #pieces  = tsMin + _N.random.rand(iknts+1)*(tsMax-tsMin)
                    rnd_pctls   = _N.sort(_N.random.rand(iknts+1))

                    #pieces  = tsMin + _N.random.rand(iknts+1)*(tsMax-tsMin)
                    for i in range(iknts+1):
                        iHere = _N.where((rnd_pctls[i] >= dpsth_pctl[0:-1]) & (rnd_pctls[i] < dpsth_pctl[1:]))[0]
                        knt_inds[i] = iHere[0]

                    # knts    = _N.empty(iknts+1)

                    # knts[0] = pieces[0]
                    # for i in range(1, iknts+1):
                    #     knts[i] = knts[i-1] + pieces[i]
                    # knts /= knts[-1]
                    # knts[0:-1] *= N
                    #knts  = _N.sort((0.1 + 0.85*_N.random.rand(iknts))*N)
                    B     = patsy.bs(x, knots=(knt_inds[0:-1]), include_intercept=True)
                    iBTB   = _N.linalg.inv(_N.dot(B.T, B))
                    bGood  = True
                except _N.linalg.linalg.LinAlgError:
                    print("Linalg Error or Value Error in suggestPSTHKnots")
                except ValueError:
                    print("Linalg Error or Value Error in suggestPSTHKnots")


            #a     = _N.dot(iBTB, _N.dot(B.T, _N.log(apsth)))
            a     = _N.dot(iBTB, _N.dot(B.T, apsth))
            #ft    = _N.exp(_N.dot(B, a))
            ft    = _N.dot(B, a)
            r2s[it] = _N.dot(ft - apsth, ft - apsth)
            allKnts[it, :] = knt_inds[0:-1]
            allCoeffs.append(a)

        mnIt = _N.where(r2s == r2s.min())[0][0]
        best_r2s[iknts-10] = r2s[mnIt]
    knts = allKnts[mnIt]
    cfs  = allCoeffs[mnIt]
    B     = patsy.bs(x, knots=knts, include_intercept=True)

    if psth_run:
        fig = _plt.figure()
        _plt.plot(_N.dot(B, cfs))
        _plt.plot(apsth)

    return knts, apsth, cfs

def display(N, dt, tscl, nhaz, apsth, lambda2, psth, histknts, psthknts, dir=None):
    """
    N        length of trial, also time in ms
    tscl
    nhaz     normalized hazzard function.  calculated under assumption of stationarity of psth
    apsth    approximate stepwise psth
    lambda2  ground truth   lambda2 term
    psth     ground truth   lambda1 term
    """
    global v, c

    x  = _N.linspace(0., N-1, N, endpoint=False)  # in units of ms.

    theknts = [histknts, psthknts]
    for f in range(1, 3):
        knts = theknts[f-1]
        
        if f == 1:
            fig, ax = _plt.subplots(figsize=(6, 4))
            B  = patsy.bs(x[0:len(nhaz)], knots=knts, include_intercept=True)
            Bc = B[:, v:];    Bv = B[:, 0:v]
            ac = _N.zeros(c)
            iBvTBv = _N.linalg.inv(_N.dot(Bv.T, Bv))

            av = _N.dot(iBvTBv, _N.dot(Bv.T, _N.log(nhaz) - _N.dot(Bc, ac)))

            a = _N.array(av.tolist() + ac.tolist())
            _plt.plot(x[0:len(nhaz)], nhaz, color="grey", lw=2)   #  empirical
            ymax = -1
            if lambda2 is not None:
                _plt.plot(lambda2, color="red", lw=2)               #  ground truth
                ymax = max(lambda2)
            _plt.ylim(0, max(ymax, max(nhaz[0:tscl]))*1.1)
            _plt.xlim(0, 3*tscl)
            splFt = _N.exp(_N.dot(B, a))
            _plt.plot(splFt)
            ax.spines["top"].set_visible(False)
            ax.spines["right"].set_visible(False)
            ax.xaxis.set_ticks_position("bottom")
            ax.yaxis.set_ticks_position("left")
            _plt.savefig(setFN("hist.eps", dir=dir))
            _plt.xlim(0, tscl)
            #_plt.grid()
            _plt.savefig(setFN("histZ.eps", dir=dir))
            _plt.close()
        else:
            fig = _plt.figure()
            B  = patsy.bs(x, knots=knts, include_intercept=True)
            iBTB   = _N.linalg.inv(_N.dot(B.T, B))
            a     = _N.dot(iBTB, _N.dot(B.T, _N.log(apsth)))
            _plt.plot(x, apsth, color="grey", lw=2)   #  empirical
            if psth is not None:
                fHz   = ((_N.exp(psth)*dt) / (1 + dt*_N.exp(psth))) / dt
                _plt.plot(fHz, color="red", lw=2)               #  ground truth

            splFt = _N.exp(_N.dot(B, a))
            _plt.plot(splFt)
            _plt.savefig(setFN("psth.eps", dir=dir))
            _plt.close()

"""
def reasonableHist(lmd, maxH=1.2):
    L = lmd.shape[0]
    cmpLmd = _N.array(lmd)  #  compressed lambda

    maxAmp = _N.max(lmd-1)
    bAbv    = False
    bFellOnce=False
    bForce1 = False   #  force it to be 1 hereafter
    
    for i in range(L):
        if (not bAbv) and lmd[i] > 1:
            bAbv = True
            
        if (lmd[i] > 1):
            cmpLmd[i] = 1 + ((lmd[i] - 1) / maxAmp) * (maxH - 1)
        elif (lmd[i] < 1) and bAbv:
            cmpLmd[i] = 1

        if bAbv and (not bFellOnce):
            if lmd[i] < lmd[i-1]:
                bFellOnce = True

        if (not bForce1) and bAbv and (lmd[i] > lmd[i-1]) and bFellOnce:
            bForce1 = True
            cmpLmd[i] = 1
        if bForce1:
            cmpLmd[i] = 1

            
    return cmpLmd
"""

def reasonableHistory(lmd, maxH=1.2, cutoff=100):
    """
    search for max between 0 and cutoff
    """
    L = lmd.shape[0]
    cmpLmd = _N.array(lmd)  #  compressed lambda

    maxAmp = _N.max(lmd-1)
    bAbv    = False
    bFellOnce=False
    bForce1 = False   #  force it to be 1 hereafter
    
    for i in range(L):
        if (not bAbv) and lmd[i] > 1:
            bAbv = True
            
        if (lmd[i] > 1):
            cmpLmd[i] = 1 + ((lmd[i] - 1) / maxAmp) * (maxH - 1)
        elif (lmd[i] < 1) and bAbv:
            cmpLmd[i] = 1

        if bAbv and (not bFellOnce):
            if lmd[i] < lmd[i-1]:
                bFellOnce = True

        if (not bForce1) and bAbv and (lmd[i] > lmd[i-1]) and bFellOnce:
            bForce1 = True
            cmpLmd[i] = 1
        if bForce1:
            cmpLmd[i] = 1

            
    return cmpLmd

def reasonableHistory2(lmd, maxH=1.2, strT=1, cutoff=100, dcyTS=60):
    """
    search for max between 0 and cutoff
    stretchT
    """
    hiest = max(lmd[0:cutoff])
    L = lmd.shape[0]
    cmpLmd = _N.empty(dcyTS)  #  compressed lambda

    ihiest= _N.where(lmd == hiest)[0][0]

    ###  
    x    = _N.linspace(0, ihiest, ihiest+1)

    for i in range(ihiest + 1):
        cmpLmd[i] = lmd[i] * (maxH / hiest)
    
    print(ihiest)
    if strT > 1:

        nIDP   = int((ihiest+1)*strT)   #  number of interpolated data points
        xI     = _N.linspace(0, ihiest, nIDP)
        cI     = _N.interp(xI, x, cmpLmd[0:ihiest+1])

        cmpLmd[0:nIDP] = cI
        ihiest = int(ihiest*strT)

    dy  = (maxH - 1) / float(dcyTS - ihiest)
    for i in range(ihiest + 1, dcyTS):
        cmpLmd[i] = maxH -  (i - ihiest) * dy

    return cmpLmd


def findAndSaturateHist(cl, refrT=30, MAXcl=None):
    """
    how high
    """
    ITERS = 1000

    dgr   = 2
    ktl   = _N.empty(dgr+1)
    cktl  = _N.zeros(dgr+2)
    xs    = _N.linspace(0, 1, refrT)
    scr   = _N.empty(ITERS)

    aS    = _N.empty((ITERS, dgr+4))
    kts   = _N.empty((ITERS, dgr))

    lcl   = _N.log(cl)
    for it in range(ITERS):
        bOK = False
        while not bOK:
            try:
                ktl = _N.random.rand(dgr+1) 

                for d in range(1, dgr+2):
                    cktl[d] = cktl[d-1] + ktl[d-1]
                cktl /= cktl[-1]

                B  = patsy.bs(xs, knots=cktl[1:-1], include_intercept=True)

                iBvTBv = _N.linalg.inv(_N.dot(B.T, B))

                a  = _N.dot(iBvTBv, _N.dot(B.T, lcl))

                ftd = _N.exp(_N.dot(B, a))
                scr[it] = _N.sum((ftd - cl)**2)

                aS[it] = a
                kts[it] = cktl[1:-1]
                bOK = True
            except _N.linalg.linalg.LinAlgError:
                print("LinAlgError in findAndSaturateHist part 1")

    bI      = _N.where(scr == _N.min(scr))[0][0]

    bestKts = kts[bI]
    bestAs  = aS[bI]

    ######
    B  = patsy.bs(xs, knots=bestKts, include_intercept=True)
    ftdC = _N.exp(_N.dot(B, bestAs))

    if MAXcl is not None:
        #  now compress, and 
        MAX = _N.max(ftdC[0:refrT])
        maxInd = _N.where(ftdC == MAX)[0][0]
        ftdC[maxInd:] = _N.linspace(MAX, 1, refrT-maxInd)

        bg1Inds = _N.where(ftdC > 1)[0]

        ftdC[bg1Inds] = (((ftdC[bg1Inds] - 1) / (MAX - 1)) * (MAXcl-1)) +1
        lt1Inds = _N.where(ftdC[refrT:] < 1)[0]
        ftdC[refrT+lt1Inds] = 1
    
    lftdC = _N.log(ftdC)
    for it in range(ITERS):
        bOK = False
        while not bOK:
            try:
                ktl = _N.random.rand(dgr+1) 

                for d in range(1, dgr+2):
                    cktl[d] = cktl[d-1] + ktl[d-1]
                cktl /= cktl[-1]

                B  = patsy.bs(xs, knots=cktl[1:-1], include_intercept=True)

                iBvTBv = _N.linalg.inv(_N.dot(B.T, B))

                a  = _N.dot(iBvTBv, _N.dot(B.T, lftdC))

                ftd = _N.exp(_N.dot(B, a))
                scr[it] = _N.sum((ftd - ftdC)**2)

                aS[it] = a
                kts[it] = cktl[1:-1]
                bOK = True
            except _N.linalg.linalg.LinAlgError:
                print("LinAlgError in findAndSaturateHist part 2")


    bI      = _N.where(scr == _N.min(scr))[0][0]

    bestKts = kts[bI]
    bestAs  = aS[bI]
    
    return xs, bestKts, bestAs