# python-Kmeans/em_mog.py (master branch, tA-bot-git/python-Kmeans on GitHub)

import numpy as np
from scipy.stats import multivariate_normal as mvn
from numpy.linalg import inv
from sklearn.cluster import KMeans
import time


def em_mog(X, k, max_iter=20):
    """
    Learn a Mixture of Gaussians model using the EM-algorithm.

    The means are initialised from a KMeans clustering of X, the covariances
    from identity matrices and the mixing weights uniformly. EM then runs
    until the log-likelihood changes by less than 0.1% between consecutive
    iterations or until max_iter iterations have been performed.

    Args:
        X: The data used for training [n, num_features]
        k: The number of gaussians to be used
        max_iter: Maximum number of EM iterations

    Returns:
        phi: A vector of probabilities for the latent vars z of shape [k]
        mu: A matrix of mean vectors of shape [k, num_features]
        sigma: The k covariance matrices, each of shape
            [num_features, num_features] (a list of identity matrices if no
            M-step was run, otherwise whatever m_step returned)
        w: The weights of the k gaussians per example as returned by e_step
            (result of the final E-step)

    """

    # Initialize variables
    sigma = [np.eye(X.shape[1]) for _ in range(k)]
    phi = np.ones([k,]) / k
    ll_prev = None  # no previous log-likelihood before the first iteration
    n_iter = 0      # stays 0 when max_iter == 0 so the stats line still works
    start = time.time()

    # Perform KMeans to get the centers of the clusters
    kmeans = KMeans(n_clusters=k, random_state=0, max_iter=20).fit(X)
    mu = kmeans.cluster_centers_

    for n_iter in range(1, max_iter + 1):
        # E-Step: compute the probabilities p(z==j|x; mu, sigma, phi)
        w = e_step(X, mu, sigma, phi)

        # M-step: Update the parameters mu, sigma and phi
        phi, mu, sigma = m_step(w, X, mu, sigma, phi, k)

        # Check convergence on the relative change of the log-likelihood.
        # Comparing |ll - ll_prev| against |ll_prev| is sign-independent; a
        # plain ratio ll/ll_prev is >= 1 for any improving positive
        # log-likelihood and would stop the loop prematurely.
        ll = log_likelihood(X, mu, sigma, phi)
        print('Iter: {}/{}, LL: {}'.format(n_iter, max_iter, ll))
        if ll_prev is not None and abs(ll - ll_prev) < 1e-3 * abs(ll_prev):
            print('EM has converged...')
            break
        ll_prev = ll

    # Get stats
    exec_time = time.time() - start
    print('Number of iterations: {}, Execution time: {}s'.format(n_iter, exec_time))

    # Computes final assignment
    w = e_step(X, mu, sigma, phi)

    return phi, mu, sigma, w


def log_likelihood(X, mu, sigma, phi):
    """
    Returns the log-likelihood of the data under the current parameters of the MoG model.

    Computes sum_i log( sum_j phi[j] * N(X[i]; mu[j], sigma[j]) ).

    Args:
        X: The data of shape [n, num_features]
        mu: The k mean vectors, indexable as mu[j]
        sigma: The k covariance matrices, indexable as sigma[j]
        phi: The k mixing weights

    Returns:
        The scalar log-likelihood summed over all n examples.

    """
    n = X.shape[0]
    k = len(phi)

    # Build each component's distribution once and evaluate it on all points
    # in a single call instead of re-creating it for every (point, component).
    log_pdf = np.empty((k, n))
    for j in range(k):
        log_pdf[j] = mvn(mu[j], sigma[j]).logpdf(X)

    # Work in log-space: subtracting the per-point maximum before
    # exponentiating keeps the largest term at exp(0) == 1, so points far from
    # every mean no longer underflow to a density of 0 (and a log of -inf).
    shift = log_pdf.max(axis=0)
    weights = np.asarray(phi, dtype=float).reshape(k, 1)
    mixture = (weights * np.exp(log_pdf - shift)).sum(axis=0)

    return (shift + np.log(mixture)).sum()


def e_step(X, mu, sigma, phi):
    """
    Computes the E-step of the EM algorithm.

    Args:
        X: The data of shape [n, num_features]
        mu: The k mean vectors, indexable as mu[j]
        sigma: The k covariance matrices, indexable as sigma[j]
        phi: The k mixing weights

    Returns:
        w:  An array of probabilities p(z==j|x; mu, sigma, phi) of shape
            [k, n]: row j holds the weight of gaussian j for every example,
            and each column sums to 1.
    """
    n = X.shape[0]
    k = len(phi)

    # Build each component's distribution once and evaluate it on all points
    # in a single call instead of re-creating it for every (point, component).
    log_pdf = np.empty((k, n))
    for j in range(k):
        log_pdf[j] = mvn(mu[j], sigma[j]).logpdf(X)

    # The per-point shift cancels in the normalisation below but keeps the
    # dominant component at exp(0) == 1, so a point far from every mean gets
    # valid weights instead of 0/0 == NaN.
    log_pdf -= log_pdf.max(axis=0)
    w = np.asarray(phi, dtype=float).reshape(k, 1) * np.exp(log_pdf)
    w /= w.sum(0)

    return w


def m_step(w, X, mu, sigma, phi, k):
    """
    Computes the M-step of the EM algorithm.

    Re-estimates all parameters from the responsibilities; the incoming
    mu, sigma and phi are not used and are accepted only to keep the
    call signature stable.

    Args:
        w: The responsibilities of shape [k, n] (row j = gaussian j)
        X: The data of shape [n, num_features]
        mu: Unused (previous means)
        sigma: Unused (previous covariances)
        phi: Unused (previous mixing weights)
        k: The number of gaussians

    Returns:
        phi: The mixing weights of shape [k]
        mu: The mean vectors of shape [k, num_features]
        sigma: The covariance matrices of shape [k, num_features, num_features]
    """
    n, p = X.shape
    w = np.asarray(w, dtype=float)

    # Total responsibility mass of each gaussian.
    resp_sum = w.sum(axis=1)

    # Mixing weights: normalise once, after all sums are complete. Dividing
    # the whole vector inside the per-component loop would scale earlier
    # entries by 1/n several times.
    phi = resp_sum / n

    # Responsibility-weighted means.
    mu = np.dot(w, X) / resp_sum[:, np.newaxis]

    # Responsibility-weighted covariances, for any number of features p.
    sigma = np.zeros((k, p, p))
    for j in range(k):
        centered = X - mu[j]
        weighted = w[j][:, np.newaxis] * centered
        sigma[j] = np.dot(weighted.T, centered) / resp_sum[j]

    return phi, mu, sigma