#!pip install git+https://github.com/compi1234/pyspch.git
try:
    import pyspch
except ModuleNotFoundError:
    try:
        print(
        """
        To enable this notebook on platforms as Google Colab, 
        install the pyspch package and dependencies by running following code:

        !pip install git+https://github.com/compi1234/pyspch.git
        """
        )
    except ModuleNotFoundError:
        raise

%matplotlib inline    
import sys, os,time
import numpy as np
import pandas as pd
from IPython.display import display, HTML, clear_output
import ipywidgets as widgets
import matplotlib.pyplot as plt
import matplotlib as mpl
import seaborn as sns

import pyspch.stats.probdist as Densities
from pyspch.stats import libhmm

# print all variable statements
from IPython.core.interactiveshell import InteractiveShell
InteractiveShell.ast_node_interactivity = "all"
# graphical and print preferences
cmap_1 = sns.light_palette("caramel",50,input="xkcd")
cmap_2 = sns.light_palette("caramel",50,input="xkcd")[0:25]
cmap_3 = sns.light_palette("caramel",50,input="xkcd")[25:50]
cmap = cmap_2
pd.options.display.float_format = '{:,.3f}'.format

# catch future warnings -- occurring in matplotlib
import warnings
warnings.simplefilter(action='ignore', category=FutureWarning)

mpl.rcParams['figure.figsize'] = [12.0, 6.0]
#mpl.rcParams['ps.papersize'] = 'A4'
mpl.rcParams['xtick.labelsize'] = 14
mpl.rcParams['ytick.labelsize'] = 14
mpl.rcParams['axes.titlepad'] = 15
mpl.rcParams['axes.titlesize'] = 'large'
mpl.rcParams['axes.linewidth'] = 2
mpl.rc('lines', linewidth=3, color='k')

%%HTML
<style type="text/css">
table.dataframe td, table.dataframe th {
    border: 2px  black solid !important;
    column-width: 60px;
    color: black !important;
}

imat = np.array([1.0, 0.0, 0.])
tmat = np.array([[.6,.4,0.],[0.,.5,.5],[0.,0.,1.]]) 
hmm1 = libhmm.HMM(n_states=3,prob_style="lin",obs_model=dd1,
                  transmat=tmat,initmat=imat)
hmm1.print_model()

HMM STATE MODEL
=================

OBSERVATION MODEL
=================

++ Feature (0) ++

Xl=np.array(['A','B','B','A','B']).reshape(-1,1)
X = dd1.lbl2indx(Xl)
obs_probs = dd1.predict_prob(X)

print("OBSERVATION LABELS\n")
pd.DataFrame(Xl.T)
print("OBSERVATIONS (INDICES)\n")
pd.DataFrame(X.T) 

print("OBSERVATION PROBABILITIES\n")
pd.DataFrame(obs_probs.T,index=dd1.classes_)

OBSERVATION LABELS

OBSERVATIONS (INDICES)

OBSERVATION PROBABILITIES

tr = libhmm.Trellis(hmm1)
tr.viterbi_pass(X.reshape(-1,1))
tr.obs_probs.T, tr.probs.T, tr.backptrs.T

(array([[0.7, 0.3, 0.3, 0.7, 0.3],
        [0.1, 0.9, 0.9, 0.1, 0.9],
        [0.6, 0.4, 0.4, 0.6, 0.4]]),
 array([[0.7       , 0.126     , 0.02268   , 0.0095256 , 0.00171461],
        [0.        , 0.252     , 0.1134    , 0.00567   , 0.00342922],
        [0.        , 0.        , 0.0504    , 0.03402   , 0.013608  ]]),
 array([[ 0,  0,  0,  0,  0],
        [ 1,  0,  1,  1,  0],
        [ 2, -1,  1,  1,  2]]))

print("Key results for Viterbi Pass\n================================")
print("Sequence Probability: %.4f \nEnd-state: %d" %(tr.seq_prob,tr.end_state))
print("Alignment:",tr.hmm.states[tr.backtrace()])

Key results for Viterbi Pass
================================
Sequence Probability: 0.0136 
End-state: 2
Alignment: [0 1 1 2 2]

tr.print_trellis(X=Xl)

Observations

Observation Probabilities

Trellis Probabilities (Viterbi)

Alignment

Sequence Probability: 1.36e-02

tr.plot_trellis(xticks=Xl.flatten(),plot_obs_probs=True,plot_backptrs=True,plot_alignment=True,
                plot_norm=True,cmap=cmap_1,vmin=0.,vmax=2,cmapf=cmap_2)

tr2 = libhmm.Trellis(hmm1,style='Forward')
tr2.forward_pass(X.reshape(-1,1))
tr2.print_trellis()

Observation Probabilities

Trellis Probabilities (Forward)

Sequence Probability: 3.29e-02

em1 = np.array( [ [ .05,.1,.85], [.1,.75,.15], [.5,.3,.2], [.2,.4,.4] ] )
em2 = np.array( [ [.9,.1], [.7,.3], [.1,.9], [.9,.1] ] )
dd2 = Densities.Discrete(feature_probs=[em1,em2],
                   labels=[['H','M','L'],['U','V']],
                   classes=[ 'sil', 'm', 'iy', 's'])

dd2.print_model()

++ Feature (0) ++

++ Feature (1) ++

imat = np.array([1.0, 0.0, 0.0, 0.0])
tmat = np.array([[.8,.2,0.,0.],[0.,.8,.2,0.],[0.,0.,.8,.2],[.2,0.,0.,.8]]) 
hmm2 = libhmm.HMM(n_states=4,prob_style="lin",obs_model=dd2,
                  transmat=tmat,initmat=imat)
hmm2.print_model()

HMM STATE MODEL
=================

OBSERVATION MODEL
=================

++ Feature (0) ++

++ Feature (1) ++

hmm2.__dict__

{'_Debug': False,
 'prob_style': 'lin',
 'prob_floor': 1e-39,
 'obs_model': <pyspch.stats.probdist.Discrete at 0x27f0f44f850>,
 'n_classes': 4,
 'states': array([0, 1, 2, 3]),
 'n_states': 4,
 'obs_indx': array([0, 1, 2, 3]),
 'transmat': array([[0.8, 0.2, 0. , 0. ],
        [0. , 0.8, 0.2, 0. ],
        [0. , 0. , 0.8, 0.2],
        [0.2, 0. , 0. , 0.8]]),
 'initmat': array([1., 0., 0., 0.]),
 'end_states': array([0, 1, 2, 3])}

X2l = np.array( [ ['L','U'], ['M','U'], ['L','V'], ['M','U'], 
            ['L','U'], ['H','V'], ['H','V'],['M','V'],['M','U'] ,['L','U']])
X2 = dd2.lbl2indx(X2l)
X2

array([[2, 0],
       [1, 0],
       [2, 1],
       [1, 0],
       [2, 0],
       [0, 1],
       [0, 1],
       [1, 1],
       [1, 0],
       [2, 0]])

# force finalization in SIL
hmm2.end_states = np.array([0])
# the Normalize flag normalizes the max observation probability in each frame to 1.
tr = libhmm.Trellis(hmm2,Normalize=True)
tr.viterbi_pass(X2)
tr.obs_probs.T, tr.probs.T, tr.backptrs.T

(array([[0.765, 0.09 , 0.085, 0.09 , 0.765, 0.005, 0.005, 0.01 , 0.09 ,
         0.765],
        [0.105, 0.525, 0.045, 0.525, 0.105, 0.03 , 0.03 , 0.225, 0.525,
         0.105],
        [0.02 , 0.03 , 0.18 , 0.03 , 0.02 , 0.45 , 0.45 , 0.27 , 0.03 ,
         0.02 ],
        [0.36 , 0.36 , 0.04 , 0.36 , 0.36 , 0.02 , 0.02 , 0.04 , 0.36 ,
         0.36 ]]),
 array([[1.00000000e+00, 6.85714286e-01, 1.00000000e+00, 2.22040816e-01,
         1.00000000e+00, 7.18989310e-02, 7.98877011e-04, 1.02880658e-04,
         9.25925926e-03, 5.31250000e-01],
        [0.00000000e+00, 1.00000000e+00, 7.72058824e-01, 1.00000000e+00,
         6.18151672e-01, 2.66666667e-01, 1.77777778e-02, 1.48148148e-02,
         8.64197531e-02, 2.52057613e-02],
        [0.00000000e+00, 0.00000000e+00, 7.72058824e-01, 5.71428571e-02,
         2.94357939e-02, 1.00000000e+00, 1.00000000e+00, 1.00000000e+00,
         3.33333333e-01, 1.85185185e-02],
        [0.00000000e+00, 0.00000000e+00, 0.00000000e+00, 1.71428571e-01,
         3.63321799e-01, 1.04489796e-01, 1.11111111e-02, 3.70370370e-02,
         1.00000000e+00, 1.00000000e+00]]),
 array([[ 0,  0,  0,  0,  0,  0,  0,  3,  3,  3],
        [ 1,  0,  1,  1,  1,  1,  1,  1,  1,  1],
        [ 2, -1,  1,  2,  1,  1,  2,  2,  2,  2],
        [ 3, -1, -1,  2,  3,  3,  2,  2,  2,  3]]))

tr.plot_trellis(xticks=X2,plot_obs_probs=True,plot_backptrs=True,plot_alignment=True,
                plot_norm=True,cmap=cmap_1,vmin=0.,vmax=2,cmapf=cmap_2,fmt=".2e")

print("Alignment\n")
pd.DataFrame(tr.hmm.states[tr.backtrace()]).T 
print("Sequence Likelihood: %.3e" % tr.seq_prob)
print("Trellis scale in final column: %.3e" % tr.scale)

Alignment

Sequence Likelihood: 7.865e-09
Trellis scale in final column: 1.480e-08

states = ['sil_1','m','iy','s','sil_2']
imat = np.array([1.0, 0.0, 0.0, 0.0, 0.0])
tmat = np.array([[.8,.2,0.,0.,0.],[0.,.8,.2,0.,0.],[0.,0.,.8,.2,0.],[0.,0.,0.,.8,.2],
                [0.,0.,0.,0.,1.]]) 
obs_indx = [0,1,2,3,0]
hmm3 = libhmm.HMM(n_states=5,states=states,prob_style="lin",obs_model=dd2,obs_indx=obs_indx,
                  transmat=tmat,initmat=imat)
hmm3.print_model()

HMM STATE MODEL
=================

OBSERVATION MODEL
=================

++ Feature (0) ++

++ Feature (1) ++

# force finalization in SIL
hmm3.end_states = np.array([4])
# the Normalize flag normalizes the max observation probability in each frame to 1.
tr = libhmm.Trellis(hmm3,Normalize=True)
tr.viterbi_pass(X2)
#tr.obs_probs.T, tr.probs.T, tr.backptrs.T
tr.plot_trellis(xticks=X2,plot_obs_probs=True,plot_backptrs=True,plot_alignment=True,
                plot_norm=True,cmap=cmap_1,vmin=0.,vmax=2,cmapf=cmap_2,fmt=".2e")

print("Alignment\n")
pd.DataFrame(tr.hmm.states[tr.backtrace()]).T 
print("Sequence Likelihood: %.3e" % tr.seq_prob)
print("Trellis scale in final column: %.3e" % tr.scale)

Alignment

Sequence Likelihood: 7.865e-09
Trellis scale in final column: 1.480e-08

	S0	S1	S2
P(0\|.)	0.700	0.100	0.600
P(1\|.)	0.300	0.900	0.400

	0	1	2
P(0\|.)	0.600	0.000	0.000
P(1\|.)	0.400	0.500	0.000
P(2\|.)	0.000	0.500	1.000

	S0	S1	S2
P(0\|.)	0.700	0.100	0.600
P(1\|.)	0.300	0.900	0.400

	0	1	2	3	4
S0	0.700	0.300	0.300	0.700	0.300
S1	0.100	0.900	0.900	0.100	0.900
S2	0.600	0.400	0.400	0.600	0.400

	0	1	2	3	4
0	0.700	0.300	0.300	0.700	0.300
1	0.100	0.900	0.900	0.100	0.900
2	0.600	0.400	0.400	0.600	0.400

HMM EXAMPLES¶

(b) The state Model of the HMM¶

(c) An Observation Stream¶

Trellis Computations: (Viterbi, Forward Algorithm)¶

Forward Pass Probabilities¶

2. COMPLETION and BACKTRACING¶

3. Forward Algorithm Example¶

Example 2: Multi-D Discrete Features¶

Having different states with shared observation models¶

	0	1	2	3	4
0	0.700	0.126	0.023	0.010	0.002
1	0.000	0.252	0.113	0.006	0.003
2	0.000	0.000	0.050	0.034	0.014

	0	1	2	3
P(0\|.)	0.800	0.000	0.000	0.200
P(1\|.)	0.200	0.800	0.000	0.000
P(2\|.)	0.000	0.200	0.800	0.000
P(3\|.)	0.000	0.000	0.200	0.800

	sil_1	m	iy	s	sil_2
P(sil_1\|.)	0.800	0.000	0.000	0.000	0.000
P(m\|.)	0.200	0.800	0.000	0.000	0.000
P(iy\|.)	0.000	0.200	0.800	0.000	0.000
P(s\|.)	0.000	0.000	0.200	0.800	0.000
P(sil_2\|.)	0.000	0.000	0.000	0.200	1.000