# Do the imports #
##################
#
%matplotlib inline
import os,sys 
import numpy as np
import math

import pandas as pd
from IPython.display import display, Audio, HTML, clear_output
import ipywidgets as widgets
from ipywidgets import Box, HBox, VBox, Layout,interactive
import seaborn as sns
import matplotlib.pyplot as plt
import matplotlib as mpl
#

import pyspch.sp as Sps
import pyspch.core as Spch
import pyspch.display as Spd
import pyspch.dtw as dtw

    
# Widen the notebook layout so that cells stretch over (almost) the full screen.
display(HTML(data="""
<style>
    div#notebook-container    { width: 95%; }
    div#menubar-container     { width: 65%; }
    div#maintoolbar-container { width: 99%; }
</style>
"""))

# Default matplotlib appearance for the figures created below.
mpl.rcParams.update({
    'figure.figsize': [12.0, 8.0],
    'font.size': 12,
    'legend.fontsize': 'large',
    'figure.titlesize': 'large',
})

# Toy example: align a 6-element sequence (x1d) with a 3-element sequence (y1d).
x1d = np.array([.05, -.1, 0.77, .335, .95, 1.75])
y1d = np.array([0., 1., 2.])
# Plotting arguments shared by the trellis plots of this example.
plt_args = dict(
    xy_annot=True,
    ftr_annot=True,
    fig_width=5,
    ftr_scale=.15,
    fmt="{:.2f}",
    text_size="xx-small",
)
# result='details' yields the intermediate matrices and the backpointers
# next to the distance and the alignment trace.
dist, trace, ld_matrix, cd_matrix, bptrs = dtw.dtw(
    x1d, y1d, trans='DTW', result='details')
print("DTW distance: %.3f " % dist)
dtw.plot_trellis(x=x1d, y=y1d, xy_mat=cd_matrix, trace=trace, **plt_args)

# Output: DTW distance: 0.573

# STEP 1: compute the local distance matrix
fig1 = dtw.plot_trellis(x=x1d, y=y1d, xy_mat=ld_matrix, **plt_args)
fig1

# STEP 2: compute the cumulative distance matrix and add backpointers
fig2 = dtw.plot_trellis(
    x=x1d, y=y1d, xy_mat=cd_matrix, bptrs=bptrs, **plt_args)
fig2

# STEP 3: follow the backpointers in reverse order, from end to beginning,
# to find the optimal alignment
# (alternative plot options: xy_annot=True,ftr_annot=True,fig_width=4,fmt="{:.3f}",text_size="x-small")
fig3 = dtw.plot_trellis(
    x=x1d, y=y1d, xy_mat=cd_matrix, trace=trace, **plt_args)
display(fig3)

# the local and cumulative distance matrices can also be plotted side by side
fig = dtw.plot_trellis2(
    x1d, y1d, ld_matrix, cd_matrix,
    trace=trace, figsize=(10, 4), **plt_args)
display(fig)

# Compute "warped" versions of x and y on the basis of an alignment.
# Note: a warping obtained on one set of features can be applied to another
# set, given that the feature sequences are equally long for both processing types.
x_wp, y_wp = dtw.warp(x1d, y1d, trace)
pd.DataFrame((x_wp, y_wp))

# Show both warped sequences as an annotated two-row heatmap.
f, ax = plt.subplots(figsize=(8, 2))
ax.invert_yaxis()
dtw.text_heatmap(
    np.array([x_wp, y_wp]),
    ax=ax, annot=True, edgecolor='k', cmap='YlOrBr', alpha=.75)

# A longer 1-D example: 11 values in x1d against 8 values in y1d.
x1d = np.array([.05, 1.3, 1.7, 0.77, -1., 0., -0.5, .95, 1.75, 2.7, .3])
y1d = np.array([0., 1., 2., 0., .5, 2, 1., 0.])
# Plotting arguments for this example (wider figure, no feature annotation).
plt_args = dict(
    xy_annot=True,
    ftr_annot=False,
    fig_width=10,
    ftr_scale=.05,
    fmt="{:.2f}",
    text_size="xx-small",
)
dist, trace, ld_matrix, cd_matrix, bptrs = dtw.dtw(
    x1d, y1d, trans='DTW', result='details')
print("DTW distance: %.3f " % dist)

# Cumulative distances with backpointers and trace, then both matrices side by side.
dtw.plot_trellis(
    x=x1d, y=y1d, xy_mat=cd_matrix, bptrs=bptrs, trace=trace, **plt_args)
dtw.plot_trellis2(
    x1d, y1d, ld_matrix, cd_matrix, bptrs=bptrs, trace=trace, **plt_args)

# Output: DTW distance: 3.360

# Two-column feature sequences: x2d has shape (7, 2), y2d has shape (5, 2).
# (longer alternative for x2d:
#  np.array([[0.,1.,2.,1.,0.,0.1,-0.1,0.,.05],[0.3,1.3,1.5,1.5,1.,0.3,-0.24,0.3,.05]]).T)
x2d = np.array([
    [0., 1., 2., 1., 0., 0.1, .05],
    [0.3, 1.3, 1.5, 1.5, 1., 0.3, .05],
]).T
# y2d gets uniform noise in [0, 0.1) added; the random generator is not
# seeded, so its values differ from run to run.
y2d = np.array([
    [0., 0., 0., 1., 2],
    [1., 1., 1., 1., -1],
]).T + .1 * np.random.rand(5, 2)
# Plotting arguments, including nested style dictionaries for the
# distance matrix, the backpointers and the feature panels.
plt_args = dict(
    fig_width=8,
    xy_annot=True,
    ftr_annot=True,
    xy_args=dict(alpha=.2, edgecolor='k'),
    bptr_args=dict(color='orange', linewidth=3),
    ftr_args=dict(cmap='YlOrBr', edgecolor='g', alpha=.3),
)

# By increasing the costs for off-diagonal transitions, you force the
# alignment to become maximally diagonal.
x_ftrs = x2d
y_ftrs = y2d
# case 1: small off-diagonal costs (1.2); case 2: large off-diagonal costs (2.)
# 'm' lists one cost per (dx, dy) step; the diagonal step (-1, -1) keeps 1.0.
for off_diag_cost in (1.2, 2.):
    trans = {
        'dx': [-1, -1, 0],
        'dy': [-1, 0, -1],
        'm': [1.0, off_diag_cost, off_diag_cost],
    }
    dist, trace, ld_matrix, cd_matrix, bptrs = dtw.dtw(
        x_ftrs, y_ftrs, trans=trans, result='details')
    fig = dtw.plot_trellis(
        x=x_ftrs, y=y_ftrs, xy_mat=ld_matrix, trace=trace, **plt_args)
    display(fig)

# Align the same features with the named 'ITX3' transition set (CLIP=False)
# and plot the alignment on the cumulative distance matrix.
dist, trace, ld_matrix, cd_matrix, bptrs = dtw.dtw(
    x_ftrs, y_ftrs, trans='ITX3', result='details', CLIP=False)
fig = dtw.plot_trellis(
    x=x_ftrs, y=y_ftrs, xy_mat=cd_matrix, trace=trace, **plt_args)
display(fig)
print("DTW distance = ", dist)

# Output (the distance varies per run: y2d contains unseeded random noise):
# C:\Users\compi\anaconda3\envs\py310\lib\site-packages\matplotlib\colors.py:1355: RuntimeWarning: invalid value encountered in divide
#   resdat /= (vmax - vmin)
#
# DTW distance =  10.307493819563167

# Align x2d against a shortened reference made of rows 0, 3 and 4 of y2d.
x_ftrs = x2d
y_ftrs = y2d[[0, 3, 4], :]
dist, trace, ld_matrix, cd_matrix, bptrs = dtw.dtw(
    x_ftrs, y_ftrs, trans='DTW', result='details', CLIP=False)
fig = dtw.plot_trellis(
    x=x_ftrs, y=y_ftrs, xy_mat=ld_matrix, trace=trace, **plt_args)
display(fig)
print("DTW distance = ", dist)

# Output (varies per run: y2d contains unseeded random noise): DTW distance =  9.338238609939435

# Base URL of the sample data.
# (named data_root rather than dir, so the builtin dir() is not shadowed)
data_root = 'https://homes.esat.kuleuven.be/~spchlab/data/'
# sa1: she had your dark suit in greasy washwater all year
# sa2: don't ask me to carry an oily rag like that
# note there are some word segmentation errors in sa1, phn segmentations are OK
yname = data_root + 'timit/audio/train/dr1/fcjf0/sa2'
xname = data_root + 'timit/audio/train/dr1/fdaw0/sa2'
#
#yname = data_root+'digits/5752'
#xname = data_root+'digits/2927'
xwavdata, x_sr = Spch.load(xname + ".wav")
ywavdata, y_sr = Spch.load(yname + ".wav")
# A single sample rate `sr` is used for both recordings in the code that
# follows, so fail loudly here instead of silently applying the rate of
# the y recording to the x recording.
if x_sr != y_sr:
    raise ValueError(
        "sample rates differ: %s (%s.wav) vs %s (%s.wav)"
        % (x_sr, xname, y_sr, yname))
sr = y_sr

# Word segmentations (.wrd files) for both utterances; dt is the duration
# of one sample.
xsegdata = Spch.read_seg_file(xname + ".wrd", dt=1/sr, fmt='float32')
ysegdata = Spch.read_seg_file(yname + ".wrd", dt=1/sr, fmt='float32')
# compute a spectrogram with default parameters

# Analysis settings: frame shift and frame length in seconds, plus the
# same quantities converted to a number of samples.
n_mels = None
shift = 0.01
length = 0.03
n_shift = int(shift * sr)
n_length = int(length * sr)
#
# For each utterance: a spectrogram without pre-emphasis and without mel
# filterbank, and a 24-band mel spectrogram.
xspgdata = Sps.spectrogram(
    xwavdata, sample_rate=sr, f_shift=shift, preemp=0., n_mels=None)
xmeldata = Sps.spectrogram(
    xwavdata, sample_rate=sr, f_shift=shift, n_mels=24)
nparam, xnfr = xspgdata.shape
# Step between spectrogram rows, used as `dy` in the plots.
# NOTE(review): presumably the rows span 0 .. sr/2 linearly - confirm.
d_freq = sr / (2. * (nparam - 1))
yspgdata = Sps.spectrogram(
    ywavdata, sample_rate=sr, f_shift=shift, preemp=0., n_mels=None)
ymeldata = Sps.spectrogram(
    ywavdata, sample_rate=sr, f_shift=shift, n_mels=24)

# Just display the waveform, spectrogram and mel spectrogram of both sentences.
# The x utterance is shown together with its word segmentation.
fig = Spd.PlotSpgFtrs(
    wavdata=xwavdata, spgdata=xspgdata, segdata=[xsegdata],
    img_ftrs=[xmeldata], sample_rate=sr, dy=d_freq, figsize=(14, 8))
display(fig)
#
# The y utterance is shown without segmentation (segwav=ysegdata is left out).
fig = Spd.PlotSpgFtrs(
    wavdata=ywavdata, spgdata=yspgdata,
    img_ftrs=[ymeldata], sample_rate=sr, dy=d_freq, figsize=(14, 8))
display(fig)

# Plot styling for the speech example.
plt_args = dict(
    fig_width=10,
    ftr_scale=.1,
    ftr_args=dict(cmap='jet', edgecolor=None),
    xy_args=dict(cmap='Greys', alpha=1),
)
# Align on the mel spectrograms, transposed before being passed to dtw.dtw.
x_ftrs = xmeldata.T
y_ftrs = ymeldata.T
# alternative: align on the spectrograms instead
#x_ftrs = xspgdata.T
#y_ftrs = yspgdata.T

# The backpointers (last return value) are not needed here.
cost, trace, ld_matrix, cd_matrix, _ = dtw.dtw(
    x_ftrs, y_ftrs, trans='ITY', result='details')
fig = dtw.plot_trellis(
    xy_mat=ld_matrix, trace=trace, y=y_ftrs, x=x_ftrs, **plt_args)
#fig = dtw.plot_trellis(xy_mat=ld_matrix,x=x_ftrs,y=y_ftrs)
#fig = dtw.plot_trellis(xy_mat=ld_matrix,trace=trace,y=yspgdata[0:255,:].T,x=xspgdata[0:255,:].T,**plt_args)
fig

# Alignment between the two feature sequences.
dtw.plot_align(
    x_ftrs, y_ftrs, trace, cmap='jet', down_sample=3, figsize=(14, 4))

# Same alignment, with the waveforms and word segmentations added.
dtw.plot_align(
    x_ftrs, y_ftrs, trace,
    x_wav=xwavdata, y_wav=ywavdata, sr=sr,
    x_seg=xsegdata, y_seg=ysegdata,
    cmap='jet', segcolor='k', down_sample=4, figsize=(14, 6))

# Warp both feature sequences along the alignment and plot the result
# (no trace is passed for the warped sequences).
x_wp, y_wp = dtw.warp(x_ftrs, y_ftrs, trace)
dtw.plot_align(
    x_wp, y_wp, None, cmap='jet', down_sample=3, figsize=(14, 6))

# Use the mel warping function to warp the spectrogram data
x_wpspg, y_wpspg = dtw.warp(xspgdata.T, yspgdata.T, trace)
dtw.plot_align(
    x_wpspg, y_wpspg, None, cmap='jet', down_sample=3, figsize=(14, 6))

#
import librosa
def glim_synt(x, sample_rate=8000, shift=0.01):
    """Synthesize a waveform from a dB-scaled spectrogram with Griffin-Lim.

    Parameters
    ----------
    x : array
        Spectrogram in dB; it is converted with ``librosa.db_to_power``
        and square-rooted to obtain magnitudes.
    sample_rate : int, optional
        Sampling rate in Hz, used only to derive the hop length.
    shift : float, optional
        Frame shift in seconds.

    Returns
    -------
    The signal returned by ``librosa.griffinlim``.
    """
    # frame shift expressed in samples (truncated towards zero)
    frame_hop = int(shift * sample_rate)
    # dB -> power -> magnitude
    magnitude = librosa.db_to_power(x) ** 0.5
    return librosa.griffinlim(magnitude, hop_length=frame_hop)

# Resynthesize audio from the warped spectrograms, transposed back
# before being passed to Sps.synth_griffinlim.
x_syn = Sps.synth_griffinlim(x_wpspg.T, sample_rate=sr)
y_syn = Sps.synth_griffinlim(y_wpspg.T, sample_rate=sr)
# Plot both resynthesized signals, one per subplot.
fig, ax = plt.subplots(2)
ax[0].plot(x_syn)
ax[1].plot(y_syn)
# Audio players: original and warped version of each speaker ...
print("Original spkr1")
display(Audio(xwavdata, rate=sr))
print("Warped spkr1")
display(Audio(x_syn, rate=sr))
print("Original spkr2")
display(Audio(ywavdata, rate=sr))
print("Warped spkr2")
display(Audio(y_syn, rate=sr))
# ... and the sum of the two warped signals.
print("Duo Speech")
display(Audio(x_syn + y_syn, rate=sr))