%pylab inline

Populating the interactive namespace from numpy and matplotlib

import struct

!cd /tmp/; wget http://razik.univ-tln.fr/misc/I322/I322_tp.tgz ; tar xzvf /tmp/I322_tp.tgz

--2020-11-23 10:20:35--  http://razik.univ-tln.fr/misc/I322/I322_tp.tgz
Résolution de razik.univ-tln.fr (razik.univ-tln.fr)… 193.49.96.234
Connexion à razik.univ-tln.fr (razik.univ-tln.fr)|193.49.96.234|:80… connecté.
requête HTTP transmise, en attente de la réponse… 200 OK
Taille : 331711 (324K) [application/x-gzip]
Sauvegarde en : « I322_tp.tgz »

I322_tp.tgz         100%[===================>] 323,94K  1,56MB/s    ds 0,2s    

2020-11-23 10:20:35 (1,56 MB/s) — « I322_tp.tgz » sauvegardé [331711/331711]

I322/
I322/RAW/
I322/RAW/b.raw
I322/RAW/t.raw
I322/RAW/p.raw
I322/RAW/1.raw
I322/RAW/0.raw
I322/RAW/f.raw
I322/RAW/i.raw
I322/RAW/9.raw
I322/RAW/j.raw
I322/RAW/y.raw
I322/RAW/c.raw
I322/RAW/5.raw
I322/RAW/m.raw
I322/RAW/g.raw
I322/RAW/o.raw
I322/RAW/a.raw
I322/RAW/l.raw
I322/RAW/4.raw
I322/RAW/7.raw
I322/RAW/d.raw
I322/RAW/3.raw
I322/RAW/v.raw
I322/RAW/w.raw
I322/RAW/z.raw
I322/RAW/6.raw
I322/RAW/8.raw
I322/RAW/r.raw
I322/RAW/2.raw
I322/RAW/e.raw
I322/RAW/n.raw
I322/RAW/x.raw
I322/RAW/u.raw
I322/RAW/k.raw
I322/RAW/h.raw
I322/RAW/q.raw
I322/RAW/s.raw

# f_name = "/home/partage/I322/RAW/a.raw"  # alternative location (presumably a shared directory)
# The archive fetched above is unpacked from /tmp, so the samples end up in
# /tmp/I322/RAW/ (same directory as the 0.raw file used further down).
f_name = "/tmp/I322/RAW/a.raw"

def lire_son(f_name):
    """Read a raw sound file made of signed 16-bit samples.

    The file is read in one go and decoded as a sequence of native-endian
    ``short`` values (``struct`` format ``'h'``).

    Parameters
    ----------
    f_name : str
        Path of the raw file to read.

    Returns
    -------
    numpy.ndarray
        One entry per decoded sample, in file order (empty if the file
        holds no complete sample).
    """
    with open(f_name, 'rb') as fichier:
        donnees = fichier.read()
    # A truncated file may end with a lone byte; decoding it would raise
    # struct.error, so only whole samples are kept.
    taille = struct.calcsize('h')
    nb_octets_utiles = len(donnees) - len(donnees) % taille
    valeurs = [v for (v,) in struct.iter_unpack('h', donnees[:nb_octets_utiles])]
    return array(valeurs)

valeurs = lire_son(f_name)

# figsize() only changes the default size used for figures created afterwards,
# so it has to be called before subplots() for this figure to be 12x5.
figsize(12, 5)
f, ax = subplots()
ax.set_axis_off()  # hide the axes: only the waveform shape matters here
plot(valeurs)

[<matplotlib.lines.Line2D at 0x7f5a91aae490>]

def zcr(fenetre):
    """Count the zero crossings in a window of samples.

    A crossing is counted each time two consecutive samples have a strictly
    negative product, i.e. strictly opposite signs. A sample equal to zero
    never produces a crossing with either neighbour.

    Parameters
    ----------
    fenetre : sequence of numbers
        The samples of the window (list, tuple or array supporting slicing).

    Returns
    -------
    int
        Number of sign changes; 0 for an empty or single-sample window.
    """
    # Pairing each sample with its successor avoids indexing fenetre[0],
    # which would fail on an empty window.
    return sum(1 for precedent, courant in zip(fenetre, fenetre[1:])
               if precedent * courant < 0)

zcr(valeurs)

3268

len(valeurs)

14400

range(220, len(valeurs), 220)

range(220, 14400, 220)

# Zero-crossing count of each consecutive, non-overlapping 220-sample window
# (the last window is shorter when len(valeurs) is not a multiple of 220).
les_zcr = [zcr(valeurs[deb:deb+220]) for deb in range(0, len(valeurs), 220)]

plot(les_zcr)

[<matplotlib.lines.Line2D at 0x7f07add49b20>]

plot(les_zcr)

[<matplotlib.lines.Line2D at 0x7f07adca9ac0>]

hist(les_zcr)

(array([ 1.,  1.,  2., 11., 16.,  5., 10.,  3.,  4., 13.]),
 array([ 0. ,  8.3, 16.6, 24.9, 33.2, 41.5, 49.8, 58.1, 66.4, 74.7, 83. ]),
 <BarContainer object of 10 artists>)

hist(les_zcr)

(array([ 1.,  1.,  2., 11., 16.,  5., 10.,  3.,  4., 13.]),
 array([ 0. ,  8.3, 16.6, 24.9, 33.2, 41.5, 49.8, 58.1, 66.4, 74.7, 83. ]),
 <BarContainer object of 10 artists>)

mean(les_zcr)

49.303030303030305

std(les_zcr)

20.222227267681184

def gauss(x, mu, sigma):
    """Evaluate the normal probability density at ``x``.

    Parameters
    ----------
    x : number
        Point where the density is evaluated.
    mu : number
        Mean of the distribution.
    sigma : number
        Standard deviation of the distribution (not the variance).

    Returns
    -------
    float
        Value of the density N(mu, sigma**2) at ``x``.
    """
    normalisation = sqrt(2*pi) * sigma
    ecart = x - mu
    exposant = -0.5 * ecart**2 / sigma**2
    return 1/normalisation * exp(exposant)

Y = [gauss(x, 49.3, 20.22) for x in range(101)]

plot(Y)
plot(les_zcr, [0]*len(les_zcr), 'ro')

[<matplotlib.lines.Line2D at 0x7f07adb747c0>]

from sklearn import mixture

g = mixture.GaussianMixture(1, covariance_type='diag')

g.fit(array(les_zcr).reshape(-1,1))

GaussianMixture(covariance_type='diag')

g.means_

array([[49.3030303]])

g.covariances_

array([[408.93847667]])

g.weights_

array([1.])

Z = [exp(g.score(x.reshape(-1,1))) for x in arange(101)]

plot(Z)

[<matplotlib.lines.Line2D at 0x7f07926bae20>]

a_g2 = mixture.GaussianMixture(2, covariance_type='diag')

a_g2.fit(array(les_zcr).reshape(-1,1))

GaussianMixture(covariance_type='diag', n_components=2)

a_g2.means_

array([[79.11111498],
       [40.90125872]])

a_g2.covariances_

array([[ 10.77008664],
       [200.13660043]])

a_g2.weights_

array([0.21988493, 0.78011507])

Z = [exp(a_g2.score(x.reshape(-1,1))) for x in arange(101)]

plot(Z)

[<matplotlib.lines.Line2D at 0x7f079053cfd0>]

test_f_name = "/tmp/I322/RAW/0.raw"

test_valeurs = lire_son(test_f_name)

# Same windowing as for the training signal: one zero-crossing count per
# consecutive 220-sample window of the test signal.
test_les_zcr = [zcr(test_valeurs[deb:deb+220]) for deb in range(0, len(test_valeurs), 220)]

plot(test_les_zcr)

[<matplotlib.lines.Line2D at 0x7f079051a6d0>]

len(test_les_zcr)

31

hist(test_les_zcr)

(array([ 3.,  1.,  1.,  0.,  9., 11.,  3.,  2.,  0.,  1.]),
 array([ 0. ,  6.2, 12.4, 18.6, 24.8, 31. , 37.2, 43.4, 49.6, 55.8, 62. ]),
 <BarContainer object of 10 artists>)

a_g2.score(array([test_les_zcr[0]]).reshape(-1,1))

-7.996180299159372

test_les_zcr[0]

0

def vraisemblance(x):
    """Return the likelihood of ``x`` under a fixed two-component Gaussian mixture.

    The weights, means and variances are hard-coded; they match the
    parameters printed for the fitted ``a_g2`` model. Each component is
    weight * gauss(x, mean, sqrt(variance)) and the two are summed.
    """
    poids_1, mu_1, var_1 = 0.21988493, 79.11111498, 10.77008664
    poids_2, mu_2, var_2 = 0.78011507, 40.90125872, 200.13660043
    composante_1 = poids_1 * gauss(x, mu_1, sqrt(var_1))
    composante_2 = poids_2 * gauss(x, mu_2, sqrt(var_2))
    return composante_1 + composante_2

# vraisemblance pour la première valeur des zcr
# c_g1*gauss(x, mu_g1, sigma_g1) + c_g2*gauss(x, mu_g2, sigma_g2)

# v = 0.21988493*gauss(0, 79.11111498 , sqrt(10.77008664)) + 0.78011507*gauss(0, 40.90125872, sqrt(200.13660043))
v = vraisemblance(test_les_zcr[0])
print(v)
print(log(v))

0.0003367464450031686
-7.996180299512988

P = prod(array([vraisemblance(x) for x in test_les_zcr]))
print(P)

2.2866752681968918e-61

log(P)

-139.63059175797204

P_log = sum(array([log(vraisemblance(x)) for x in test_les_zcr]))
print(P_log)

-139.630591757972

a_g2.score(array(test_les_zcr).reshape(-1,1))

-4.504212637677535

P_a = prod(array([vraisemblance(x) for x in les_zcr]))
print(log(P_a))

-278.7023749118592

# Two-component diagonal GMM for the "0" class. It must be trained on the
# zero-crossing counts of 0.raw (test_les_zcr), not on those of a.raw
# (les_zcr), otherwise it is just a second copy of the "a" model.
zero_g2 = mixture.GaussianMixture(2, covariance_type='diag')

zero_g2.fit(array(test_les_zcr).reshape(-1,1))

GaussianMixture(covariance_type='diag', n_components=2)

zero_g2.means_

array([[31.21117743],
       [29.43841612]])

zero_g2.covariances_

array([[  6.64596133],
       [344.80709667]])

zero_g2.weights_

array([0.53514291, 0.46485709])

Z = [exp(zero_g2.score(x.reshape(-1,1))) for x in arange(101)]

plot(Z)

[<matplotlib.lines.Line2D at 0x7f078ee90af0>]

def vraisemblance_0(x):
    """Return the likelihood of ``x`` under the fixed two-component "0" mixture.

    The weights, means and variances are hard-coded; they match the
    parameters printed for the fitted ``zero_g2`` model. Each component is
    weight * gauss(x, mean, sqrt(variance)) and the two are summed.
    """
    poids_1, mu_1, var_1 = 0.53514291, 31.21117743, 6.64596133
    poids_2, mu_2, var_2 = 0.46485709, 29.43841612, 344.80709667
    composante_1 = poids_1 * gauss(x, mu_1, sqrt(var_1))
    composante_2 = poids_2 * gauss(x, mu_2, sqrt(var_2))
    return composante_1 + composante_2

P_0 = prod(array([vraisemblance_0(x) for x in test_les_zcr]))
print(log(P_0))

-114.11049941907352

P_0 = prod(array([vraisemblance_0(x) for x in les_zcr]))
print(log(P_0))

-346.219561095101

# ce qui reste à faire
# 1. faire un modèle pour chaque classe (a ... z, 0 ... 9)
# 2. tester chaque fichier son sur l'ensemble des modèles (prise de décision)
# 3. construire la matrice de confusion (à partir des résultats précédents)

Joseph Razik - UTLN/LIS

Travaux pratiques : apprentissage et ZCR