
Waveforms and Segmentations¶

This notebook loads a sampled data file and corresponding transcriptions and segmentations, either from data provided with pyspch or residing remotely.

It is built as a demonstration notebook with elaborate documentation of what is going on.
Therefore it is ideal as a first-time use case for spchlab and pyspch.


Setting up pyspch¶

spchlab is a collection of notebooks for demonstrations and exercises on speech processing and speech recognition. A spchlab notebook, such as this one, may be invoked locally on your computer or in a cloud computing environment such as Google Colab. Almost all spchlab notebooks need the pyspch package to be installed so that you can do the necessary imports.
If you don't have pyspch preinstalled, uncomment the line "!pip install git+ ..." and run this cell. On Google Colab you need to install pyspch as well!

!pip install git+https://github.com/compi1234/pyspch.git

After that you should be able to run all the rest of the notebook. At the end you may close the notebook. However, if you intend to come back for more exercises, just leave the notebook open to avoid having to run the installation procedure again.

In [1]:
#
#!pip install git+https://github.com/compi1234/pyspch.git
#
try:
    import pyspch
except ModuleNotFoundError:
    # pyspch is not installed: explain how to get it, then re-raise
    print(
    """
    To enable this notebook on platforms such as Google Colab,
    install the pyspch package and dependencies by running the following code:

    !pip install git+https://github.com/compi1234/pyspch.git
    """
    )
    raise

Doing the imports¶

The first real cell in any notebook will be a number of imports.
Apart from the imports of the necessary pyspch modules, you will recognize most of the others if you have done any data science in Python before: matplotlib for plotting, pandas for data structures, numpy for computations, sklearn for basic machine learning tools, ...
In the more complex notebooks with neural networks you will also see pytorch and torchaudio.

In [2]:
%matplotlib inline
import os,sys
import matplotlib as mpl
import matplotlib.pyplot as plt
import numpy as np

import pyspch.core as Sp
import pyspch.sp as Sps
import pyspch.display as Spd
import pkg_resources   # deprecated in favor of importlib.resources -- change pending -- TBD
# code to use then:
#import importlib_resources
#for entry in importlib_resources.files('pyspch.data.demo').iterdir():
#    print(entry, entry.name)


import ipywidgets as widgets
from IPython.display import display, clear_output, Audio, HTML
def box_layout():
    return widgets.Layout(
        border='solid 1px black',
        margin='0px 10px 10px 0px',
        padding='5px 5px 5px 5px'
    )
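
As an aside, here is a runnable version of the importlib.resources-based replacement sketched in the comments above. This is a minimal sketch, assuming Python 3.9+ and that pyspch.data.demo is importable as a package (as the commented-out code suggests):

# pkg_resources-free listing of the demo data, per the comment above
import importlib.resources
for entry in importlib.resources.files('pyspch.data.demo').iterdir():
    print(entry.name)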

Loading Example data¶

The pyspch package comes with a convenience load_data() function that recognizes common extensions for sampled data and several forms of transcriptions and processed data. load_data() can be used to access demo data that is included in the pyspch package (just specify the full pathname within the package) or to access other resources, locally or via URL; just add root=my_resource_rootdir as an extra argument.

A number of demo waveforms and selected transcriptions are available in the demo/, digits/, coding/, ... subdirectories of the package data directory.
For sampled data files load_data() returns (data, sampling_rate); for all other types of files it just returns data.
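
For instance, loading the same data from some other location would look like this; a minimal sketch, where my_resource_rootdir is a hypothetical local directory or URL, not part of the demo data:

# load from a hypothetical external root instead of the package data
y, sr = Sp.load_data("demo/friendly.wav", root="my_resource_rootdir/")   # sampled data: (data, rate)
segwrd = Sp.load_data("demo/friendly.wrd", root="my_resource_rootdir/")  # other files: data only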

In [3]:
# when loading sampled data, both the data and the sampling rate are returned
y,sr = Sp.load_data( "demo/friendly.wav")  
print("sampling rate=",sr)
plt.plot(y);
sampling rate= 8000
[Figure: waveform plot of demo/friendly.wav]

Transcribing, Segmenting and Recognizing Speech¶

Speech is a continuous signal without clear boundaries between successive sounds. Written language, on the other hand, is a sequence of discrete symbols. A discrete transcription of such a continuous signal, including segment boundaries, is referred to as a segmentation.
Making such segmentations presumes that two levels of discretization are possible and plausible:

  • boundaries in time between two successive sounds
  • categorical classification of elementary speech sounds

As you will observe when working with speech, this is far from trivial. Related to this paradox, don't forget that you learned to listen before you were one year old, you learned to speak as a toddler, and you only learned about written language when you were six.
Listening and speaking came intuitively; writing was hard work at school.

Observe that different levels of transcription show greatly different levels of ambiguity. Humans are excellent at transcribing speech into words if the quality of the speech is good. By contrast, segmentations at the letter or phoneme level made by different people are highly ambiguous, both in terms of transcription and boundaries.

We don't speak as formally as a transcription would suggest, and some speakers swallow more sounds than others ... These are just a few of the considerations that make speech recognition a non-trivial problem.

Transcriptions and Alignments in pyspch¶

The Spd.PlotWaveform() routine yields a waveform plot with a correctly labeled time axis and the option of overlaying the plot with a given segmentation.

A segmentation contains a collection of (start_time, end_time, symbol) entries, typically assembled in a pandas DataFrame.
Commonly used segmentations and file extensions are:

  • .wrd: a word level segmentation
  • .syl: a syllabic segmentation
  • .gra: a graphemic segmentation (using letters and letter groups)
  • .phn: a phonetic segmentation

Segmentations may (or may not) contain non-speech symbols such as sil (silence), xxx (background noise), hhh (hesitation noise), ggg (garbled speech noise), ... Note that these non-speech symbols, except for silence, are not well standardized.
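
To make this data structure concrete, here is a minimal hand-made segmentation; a sketch with illustrative timing values, using the t0/t1/seg column names that appear in the loaded segmentations below:

import pandas as pd
# a word-level segmentation as a DataFrame: one row per (start_time, end_time, symbol)
seg = pd.DataFrame({
    "t0":  [0.00, 0.50],          # illustrative start times (seconds)
    "t1":  [0.50, 1.04],          # illustrative end times (seconds)
    "seg": ["friendly", "computers"],
})
print(seg)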

In [4]:
name = "demo/friendly"
segwrd = Sp.load_data(name+".wrd")
seg = Sp.load_data(name+".phn")
print("Phonetic segmentation of: ","'"+" ".join(segwrd.seg)+"'")
seg.T
Phonetic segmentation of:  'friendly computers'
Out[4]:
        0     1     2     3     4     5     6     7     8     9    10    11    12    13    14    15    16    17
t0   0.01  0.05  0.07  0.17  0.25  0.28  0.32  0.44  0.49  0.52  0.61  0.64  0.69  0.72  0.81  0.88  0.96  1.00
t1   0.05  0.07  0.17  0.25  0.28  0.32  0.44  0.49  0.52  0.61  0.64  0.69  0.72  0.81  0.88  0.96  1.00  1.04
seg     f     r    eh     n     d     l    iy   sil     k    ah     m     p     y    uw     t    eh     r     z
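
As a side note (not part of the original cell): since the segmentation is a plain DataFrame, ordinary pandas operations apply, e.g. deriving per-segment durations from the t0 and t1 columns shown above:

# per-segment durations in seconds, from the columns in the table above
dur = seg.t1 - seg.t0
print(dur.sum())   # total segmented duration: about 1.03 s for this file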
In [5]:
name = "demo/friendly"
wavdata,sr = Sp.load_data(name+".wav")
seg = Sp.load_data(name+".gra")
Spd.PlotWaveform(wavdata,sample_rate=sr,seg=seg,title="Waveform Plot with Graphemic Segmentation")
Out[5]:
[Figure: waveform plot with graphemic segmentation overlay]

Example GUI¶

This GUI gathers all .wav files in a given subdirectory of the package data and lets you select a file via a dropdown menu. It then looks for corresponding segmentations. You can listen to the audio as well.

In [6]:
class Signals(widgets.VBox):
    def __init__(self,dir="demo/",figsize=(12,6),dpi=100):
        super().__init__()
        self.dir = dir
        self.transcript = "bla bla"
        
        # list all files in the package data subdirectory
        # (os.listdir(self.dir) would work for local installs only)
        all_files = pkg_resources.resource_listdir('pyspch', "data/" + self.dir)
        print(all_files)
        # keep the basenames of all .wav files
        self.names = [name[:-len(".wav")] for name in all_files if name.endswith(".wav")]
        print(self.names)
        self.wg_signals = widgets.Dropdown(options=self.names,value=self.names[0],description="Signal") 
        self.wg_signals.observe(self.signals_observe,'value')  
        self.wg_rate = widgets.IntText(
            value=0,
            description='Rate:',
            disabled=True   
        )
        self.wg_transcript = widgets.Text(
            value='---',
            placeholder='---',
            description='Transcript:',
            disabled=True   
        )
        self.wg_rate.layout.width = '20%'
        self.wg_transcript.layout.width='50%'
        self.signal = self.names[0]
        self.audio = widgets.Output()
        self.out = widgets.Output(layout=box_layout())
        self.UI = widgets.HBox( [self.wg_signals, self.wg_rate,self.wg_transcript],layout=box_layout())

        self.update()
        plt.close()
        self.children = [ self.UI, self.out, self.audio]
        
    def update(self):
        name = self.dir + self.signal
        y,self.sample_rate = Sp.load_data(name+".wav")
        self.fig = Spd.PlotWaveform(y,sample_rate=self.sample_rate)
        
        # try to add segmentations
        # The TIMIT segmentation files in the demo dir are slightly different from the original ones
        # Sample level segmentations were converted to time based segmentation
        # and the phonetic alphabet was collapsed to the CMU set (+closure)
        segwrd = None
        transcript = None
        # first find a word segmentation
        segwrd = Sp.load_data(self.dir+self.signal+".wrd",dt=None)
        if segwrd is not None:
            self.fig.add_seg_plot(segwrd,iax=0,ypos=0.95,color="red",size=12,Lines=True)
            transcript = " ".join(segwrd.seg)
        
        # then add grapheme or phoneme segmentation
        seg = None
        seg = Sp.load_data(self.dir+self.signal+".gra")
        if seg is None:
            seg = Sp.load_data(self.dir+self.signal+".phn")          
        if seg is not None:
            self.fig.add_seg_plot(seg,iax=0,ypos=0.05,color="blue",size=12,Lines=True)
        if transcript is None:
            try:
                transcript = " ".join(seg.seg)
            except AttributeError:   # seg is None: no segmentation was found
                transcript = ""
        self.wg_transcript.value = transcript 
        self.wg_rate.value = self.sample_rate
        with self.out:
            clear_output(wait=True)
            display(self.fig)
        with self.audio:
            clear_output(wait=True)
            display(Audio(data=y,rate=self.sample_rate,normalize=False,autoplay=False))
                
    def signals_observe(self,change):
        self.signal = change.new
        self.update()
        
Signals(dir="demo/")
['bad_bead_booed.phn', 'bad_bead_booed.wav', 'bad_bead_booed.wrd', 'beed.wav', 'b_8k.wav', 'd15zz6.wav', 'd15zz6.wrd', 'expansionist.gra', 'expansionist.phn', 'expansionist.wav', 'expansionist.wrd', 'expansionist_8k.wav', 'female1.wav', 'female2.wav', 'friendly.gra', 'friendly.ogg', 'friendly.phn', 'friendly.syl', 'friendly.wav', 'friendly.wrd', 'horse.wav', 'male1.gra', 'male1.syl', 'male1.wav', 'male1.wrd', 'male1_recognize.wav', 'male1_speech.wav', 'mini_corpus.lst', 'mini_corpus.txt', 'misinterpret.wav', 'splat.wav', 'timit_f1_sa1.phn', 'timit_f1_sa1.wav', 'timit_f1_sa1.wrd', 'timit_f1_sa2.phn', 'timit_f1_sa2.wav', 'timit_f1_sa2.wrd', 'timit_f1_si1027.phn', 'timit_f1_si1027.wav', 'timit_f1_si1027.wrd', 'timit_f2_sa2.phn', 'timit_f2_sa2.wav', 'timit_f2_sa2.wrd', 'timit_m1_sa1.phn', 'timit_m1_sa1.wav', 'timit_m1_sa1.wrd', 'timit_m1_sa2.phn', 'timit_m1_sa2.wav', 'timit_m1_sa2.wrd', 'train.wav', 'voice_processing.wav']
['bad_bead_booed', 'beed', 'b_8k', 'd15zz6', 'expansionist', 'expansionist_8k', 'female1', 'female2', 'friendly', 'horse', 'male1', 'male1_recognize', 'male1_speech', 'misinterpret', 'splat', 'timit_f1_sa1', 'timit_f1_sa2', 'timit_f1_si1027', 'timit_f2_sa2', 'timit_m1_sa1', 'timit_m1_sa2', 'train', 'voice_processing']
Out[6]:

Working with data on a remote URL resource and spectrogram plot¶

This shows how to load data from a remote resource. The signal waveform is complemented with a spectrogram and multiple tiers of segmentations.

In [7]:
dir = "https://homes.esat.kuleuven.be/~spchlab/data/"
name = "demo/friendly"

seg = Sp.load_data(name+".gra",root=dir)  
segwrd = Sp.load_data(name+".wrd",root=dir)  
wavdata, sr = Sp.load_data(name+".wav",root=dir)
shift=0.01
spg = Sps.spectrogram(wavdata,sample_rate=sr,f_shift=shift)
# this shows the spectrogram with two extra tiers of segmentations given in segdata
fig = Spd.PlotSpgFtrs(wavdata=wavdata,spgdata=spg,segdata=[seg,segwrd],sample_rate=sr,dy=None)
# the next 2 lines overlay segmentations in the waveform and spectrogram pane
fig.add_seg_plot(seg,iax=0,ypos=0.85,color="#444",size=12,Lines=True)
fig.add_seg_plot(seg,iax=1,ypos=None,color="#222")
fig.suptitle("SPECTROGRAM with graphemic and word level segmentations")
display(fig)
[Figure: spectrogram with graphemic and word-level segmentation overlays]
In [8]:
#! jupyter nbconvert Segmentations.ipynb --to html
In [ ]: