qm-dsp: hmm/hmm.c comparison

comparison hmm/hmm.c @ 483:fdaa63607c15

Untabify, indent, tidy

author	Chris Cannam <cannam@all-day-breakfast.com>
date	Fri, 31 May 2019 11:54:32 +0100
parents	7e8d1f26b098
children	d48276a3ae24

comparison

Legend: equal | deleted | inserted | replaced

-:cbe668c7d724
+:fdaa63607c15
 #include <stdio.h>
 #include <math.h>
 #include <stdlib.h>
 #include <float.h>
-#include <time.h>				/* to seed random number generator */
+#include <time.h>               /* to seed random number generator */
-#include <clapack.h>		/* LAPACK for matrix inversion */
+#include <clapack.h>            /* LAPACK for matrix inversion */
 #include "maths/nan-inf.h"
 #ifdef ATLAS_ORDER
 #define HAVE_ATLAS 1
 #endif
 #ifdef _MAC_OS_X
 #include <vecLib/cblas.h>
 #else
-#include <cblas.h>		/* BLAS for matrix multiplication */
+#include <cblas.h>              /* BLAS for matrix multiplication */
 #endif
 #include "hmm.h"
 model_t* hmm_init(double** x, int T, int L, int N)
 {
-	int i, j, d, e, t;
+int i, j, d, e, t;
-	double s, ss;
+double s, ss;
-	model_t* model;
+model_t* model;
-	model = (model_t*) malloc(sizeof(model_t));
+model = (model_t*) malloc(sizeof(model_t));
-	model->N = N;
+model->N = N;
-	model->L = L;
+model->L = L;
-	model->p0 = (double*) malloc(N*sizeof(double));
+model->p0 = (double*) malloc(N*sizeof(double));
-	model->a = (double**) malloc(N*sizeof(double*));
+model->a = (double**) malloc(N*sizeof(double*));
-	model->mu = (double**) malloc(N*sizeof(double*));
+model->mu = (double**) malloc(N*sizeof(double*));
-	for (i = 0; i < N; i++)
+for (i = 0; i < N; i++) {
-	{
+model->a[i] = (double*) malloc(N*sizeof(double));
-		model->a[i] = (double*) malloc(N*sizeof(double));
+model->mu[i] = (double*) malloc(L*sizeof(double));
-		model->mu[i] = (double*) malloc(L*sizeof(double));
+}
-	}
+model->cov = (double**) malloc(L*sizeof(double*));
-	model->cov = (double**) malloc(L*sizeof(double*));
+for (i = 0; i < L; i++) {
-	for (i = 0; i < L; i++)
+model->cov[i] = (double*) malloc(L*sizeof(double));
-		model->cov[i] = (double*) malloc(L*sizeof(double));
+}
-	srand(time(0));
+srand(time(0));
-	double* global_mean = (double*) malloc(L*sizeof(double));
+double* global_mean = (double*) malloc(L*sizeof(double));
-	/* find global mean */
+/* find global mean */
-	for (d = 0; d < L; d++)
+for (d = 0; d < L; d++) {
-	{
+global_mean[d] = 0;
-		global_mean[d] = 0;
+for (t = 0; t < T; t++) {
-		for (t = 0; t < T; t++)
+global_mean[d] += x[t][d];
-			global_mean[d] += x[t][d];
+}
-		global_mean[d] /= T;
+global_mean[d] /= T;
-	}
+}
-	/* calculate global diagonal covariance */
+/* calculate global diagonal covariance */
-	for (d = 0; d < L; d++)
+for (d = 0; d < L; d++) {
-	{
+for (e = 0; e < L; e++) {
-		for (e = 0; e < L; e++)
+model->cov[d][e] = 0;
-			model->cov[d][e] = 0;
+}
-		for (t = 0; t < T; t++)
+for (t = 0; t < T; t++) {
-			model->cov[d][d] += (x[t][d] - global_mean[d]) * (x[t][d] - global_mean[d]);
+model->cov[d][d] +=
-		model->cov[d][d] /= T-1;
+(x[t][d] - global_mean[d]) * (x[t][d] - global_mean[d]);
-	}
+}
+model->cov[d][d] /= T-1;
-	/* set all means close to global mean */
+}
-	for (i = 0; i < N; i++)
-	{
+/* set all means close to global mean */
-		for (d = 0; d < L; d++)
+for (i = 0; i < N; i++) {
-		{
+for (d = 0; d < L; d++) {
-			/* add some random noise related to covariance */
+/* add some random noise related to covariance */
-			/* ideally the random number would be Gaussian(0,1), as a hack we make it uniform on [-0.25,0.25] */
+/* ideally the random number would be Gaussian(0,1),
-			model->mu[i][d] = global_mean[d] + (0.5 * rand() / (double) RAND_MAX - 0.25) * sqrt(model->cov[d][d]);
+as a hack we make it uniform on [-0.25,0.25] */
-		}
+model->mu[i][d] = global_mean[d] +
-	}
+(0.5 * rand() / (double) RAND_MAX - 0.25)
+* sqrt(model->cov[d][d]);
-	/* random intial and transition probs */
+}
-	s = 0;
+}
-	for (i = 0; i < N; i++)
-	{
+/* random initial and transition probs */
-		model->p0[i] = 1 + rand() / (double) RAND_MAX;
+s = 0;
-		s += model->p0[i];
+for (i = 0; i < N; i++) {
-		ss = 0;
+model->p0[i] = 1 + rand() / (double) RAND_MAX;
-		for (j = 0; j < N; j++)
+s += model->p0[i];
-		{
+ss = 0;
-			model->a[i][j] = 1 + rand() / (double) RAND_MAX;
+for (j = 0; j < N; j++) {
-			ss += model->a[i][j];
+model->a[i][j] = 1 + rand() / (double) RAND_MAX;
-		}
+ss += model->a[i][j];
-		for (j = 0; j < N; j++)
+}
-		{
+for (j = 0; j < N; j++) {
-			model->a[i][j] /= ss;
+model->a[i][j] /= ss;
-		}
+}
-	}
+}
-	for (i = 0; i < N; i++)
+for (i = 0; i < N; i++) {
-		model->p0[i] /= s;
+model->p0[i] /= s;
+}
-	free(global_mean);
+free(global_mean);
-	return model;
+return model;
 }
 void hmm_close(model_t* model)
 {
-	int i;
+int i;
-	for (i = 0; i < model->N; i++)
+for (i = 0; i < model->N; i++) {
-	{
+free(model->a[i]);
-		free(model->a[i]);
+free(model->mu[i]);
-		free(model->mu[i]);
+}
-	}
+free(model->a);
-	free(model->a);
+free(model->mu);
-	free(model->mu);
+for (i = 0; i < model->L; i++) {
-	for (i = 0; i < model->L; i++)
+free(model->cov[i]);
-		free(model->cov[i]);
+}
-	free(model->cov);
+free(model->cov);
-	free(model);
+free(model);
 }
 void hmm_train(double** x, int T, model_t* model)
 {
-	int i, t;
+int i, t;
-	double loglik;	/* overall log-likelihood at each iteration */
+double loglik;  /* overall log-likelihood at each iteration */
-	int N = model->N;
+int N = model->N;
-	int L = model->L;
+int L = model->L;
-	double* p0 = model->p0;
+double* p0 = model->p0;
-	double** a = model->a;
+double** a = model->a;
-	double** mu = model->mu;
+double** mu = model->mu;
-	double** cov = model->cov;
+double** cov = model->cov;
-	/* allocate memory */
+/* allocate memory */
-	double** gamma = (double**) malloc(T*sizeof(double*));
+double** gamma = (double**) malloc(T*sizeof(double*));
-	double*** xi = (double***) malloc(T*sizeof(double**));
+double*** xi = (double***) malloc(T*sizeof(double**));
-	for (t = 0; t < T; t++)
+for (t = 0; t < T; t++) {
-	{
+gamma[t] = (double*) malloc(N*sizeof(double));
-		gamma[t] = (double*) malloc(N*sizeof(double));
+xi[t] = (double**) malloc(N*sizeof(double*));
-		xi[t] = (double**) malloc(N*sizeof(double*));
+for (i = 0; i < N; i++) {
-		for (i = 0; i < N; i++)
+xi[t][i] = (double*) malloc(N*sizeof(double));
-			xi[t][i] = (double*) malloc(N*sizeof(double));
+}
-	}
+}
-	/* temporary memory */
+/* temporary memory */
-	double* gauss_y = (double*) malloc(L*sizeof(double));
+double* gauss_y = (double*) malloc(L*sizeof(double));
-	double* gauss_z = (double*) malloc(L*sizeof(double));
+double* gauss_z = (double*) malloc(L*sizeof(double));
-	/* obs probs P(j|{x}) */
+/* obs probs P(j|{x}) */
-	double** b = (double**) malloc(T*sizeof(double*));
+double** b = (double**) malloc(T*sizeof(double*));
-	for (t = 0; t < T; t++)
+for (t = 0; t < T; t++) {
-		b[t] = (double*) malloc(N*sizeof(double));
+b[t] = (double*) malloc(N*sizeof(double));
+}
-	/* inverse covariance and its determinant */
-	double** icov = (double**) malloc(L*sizeof(double*));
+/* inverse covariance and its determinant */
-	for (i = 0; i < L; i++)
+double** icov = (double**) malloc(L*sizeof(double*));
-		icov[i] = (double*) malloc(L*sizeof(double));
+for (i = 0; i < L; i++) {
-	double detcov;
+icov[i] = (double*) malloc(L*sizeof(double));
+}
-	double thresh = 0.0001;
+double detcov;
-	int niter = 50;
-	int iter = 0;
+double thresh = 0.0001;
-	double loglik1, loglik2;
+int niter = 50;
-	int foundnan = 0;
+int iter = 0;
+double loglik1, loglik2;
-	while (iter < niter && !foundnan && !(iter > 1 && (loglik - loglik1) < thresh * (loglik1 - loglik2)))
+int foundnan = 0;
-	{
-		++iter;
+while (iter < niter && !foundnan &&
-/*
+!(iter > 1 && (loglik - loglik1) < thresh * (loglik1 - loglik2))) {
-		fprintf(stderr, "calculating obsprobs...\n");
-		fflush(stderr);
+++iter;
-*/
-		/* precalculate obs probs */
+/* precalculate obs probs */
-		invert(cov, L, icov, &detcov);
+invert(cov, L, icov, &detcov);
-		for (t = 0; t < T; t++)
+for (t = 0; t < T; t++) {
-		{
+for (i = 0; i < N; i++) {
-			//int allzero = 1;
+b[t][i] = exp(loggauss(x[t], L, mu[i], icov, detcov, gauss_y, gauss_z));
-			for (i = 0; i < N; i++)
+}
-			{
+}
-				b[t][i] = exp(loggauss(x[t], L, mu[i], icov, detcov, gauss_y, gauss_z));
+forward_backwards(xi, gamma, &loglik, &loglik1, &loglik2,
+iter, N, T, p0, a, b);
-				//if (b[t][i] != 0)
+if (ISNAN(loglik)) {
-				//	allzero = 0;
+foundnan = 1;
-			}
+continue;
-			/*
+}
-			if (allzero)
-			{
+baum_welch(p0, a, mu, cov, N, T, L, x, xi, gamma);
-				printf("all the b[t][i] were zero for t = %d, correcting...\n", t);
+}
-				for (i = 0; i < N; i++)
-				{
+/* deallocate memory */
-					b[t][i] = 0.00001;
+for (t = 0; t < T; t++) {
-				}
+free(gamma[t]);
-			}
+free(b[t]);
-			*/
+for (i = 0; i < N; i++) {
-		}
+free(xi[t][i]);
-/*
+}
-		fprintf(stderr, "forwards-backwards...\n");
+free(xi[t]);
-		fflush(stderr);
+}
-*/
+free(gamma);
-		forward_backwards(xi, gamma, &loglik, &loglik1, &loglik2, iter, N, T, p0, a, b);
+free(xi);
-/*
+free(b);
-		fprintf(stderr, "iteration %d: loglik = %f\n", iter, loglik);
-		fprintf(stderr, "re-estimation...\n");
+for (i = 0; i < L; i++) {
-		fflush(stderr);
+free(icov[i]);
-*/
+}
-		if (ISNAN(loglik)) {
+free(icov);
-		    foundnan = 1;
-		    continue;
+free(gauss_y);
-		}
+free(gauss_z);
+}
-		baum_welch(p0, a, mu, cov, N, T, L, x, xi, gamma);
+void baum_welch(double* p0, double** a, double** mu, double** cov,
-		/*
+int N, int T, int L, double** x, double*** xi, double** gamma)
-		printf("a:\n");
+{
-		for (i = 0; i < model->N; i++)
+int i, j, t;
-		{
-			for (j = 0; j < model->N; j++)
+double* sum_gamma = (double*) malloc(N*sizeof(double));
-				printf("%f ", model->a[i][j]);
-			printf("\n");
+/* temporary memory */
-		}
+double* u = (double*) malloc(L*L*sizeof(double));
-		printf("\n\n");
+double* yy = (double*) malloc(T*L*sizeof(double));
-		 */
+double* yy2 = (double*) malloc(T*L*sizeof(double));
-		//hmm_print(model);
-	}
+/* re-estimate transition probs */
+for (i = 0; i < N; i++) {
-	/* deallocate memory */
+sum_gamma[i] = 0;
-	for (t = 0; t < T; t++)
+for (t = 0; t < T-1; t++) {
-	{
+sum_gamma[i] += gamma[t][i];
-		free(gamma[t]);
+}
-		free(b[t]);
+}
-		for (i = 0; i < N; i++)
-			free(xi[t][i]);
+for (i = 0; i < N; i++) {
-		free(xi[t]);
+for (j = 0; j < N; j++) {
-	}
+a[i][j] = 0;
-	free(gamma);
+if (sum_gamma[i] == 0.) {
-	free(xi);
+continue;
-	free(b);
+}
+for (t = 0; t < T-1; t++) {
-	for (i = 0; i < L; i++)
+a[i][j] += xi[t][i][j];
-		free(icov[i]);
+}
-	free(icov);
+a[i][j] /= sum_gamma[i];
+}
-	free(gauss_y);
+}
-	free(gauss_z);
-}
+/* NB: now we need to sum gamma over all t */
+for (i = 0; i < N; i++) {
-void baum_welch(double* p0, double** a, double** mu, double** cov, int N, int T, int L, double** x, double*** xi, double** gamma)
+sum_gamma[i] += gamma[T-1][i];
-{
+}
-	int i, j, t;
+/* re-estimate initial probs */
-	double* sum_gamma = (double*) malloc(N*sizeof(double));
+for (i = 0; i < N; i++) {
+p0[i] = gamma[0][i];
-	/* temporary memory */
+}
-	double* u = (double*) malloc(L*L*sizeof(double));
-	double* yy = (double*) malloc(T*L*sizeof(double));
+/* re-estimate covariance */
-	double* yy2 = (double*) malloc(T*L*sizeof(double));
+int d, e;
+double sum_sum_gamma = 0;
-	/* re-estimate transition probs */
+for (i = 0; i < N; i++) {
-	for (i = 0; i < N; i++)
+sum_sum_gamma += sum_gamma[i];
-	{
+}
-		sum_gamma[i] = 0;
-		for (t = 0; t < T-1; t++)
+/* using BLAS */
-			sum_gamma[i] += gamma[t][i];
+for (d = 0; d < L; d++) {
-	}
+for (e = 0; e < L; e++) {
+cov[d][e] = 0;
-	for (i = 0; i < N; i++)
+}
-	{
+}
-		if (sum_gamma[i] == 0)
-		{
+for (j = 0; j < N; j++) {
-/*			fprintf(stderr, "sum_gamma[%d] was zero...\n", i); */
-		}
+for (d = 0; d < L; d++) {
-		//double s = 0;
+for (t = 0; t < T; t++) {
-		for (j = 0; j < N; j++)
+yy[d*T+t] = x[t][d] - mu[j][d];
-		{
+yy2[d*T+t] = gamma[t][j] * (x[t][d] - mu[j][d]);
-			a[i][j] = 0;
+}
-			if (sum_gamma[i] == 0.) continue;
+}
-			for (t = 0; t < T-1; t++)
-				a[i][j] += xi[t][i][j];
+cblas_dgemm(CblasColMajor, CblasTrans, CblasNoTrans,
-			//s += a[i][j];
+L, L, T, 1.0, yy, T, yy2, T, 0, u, L);
-			a[i][j] /= sum_gamma[i];
-		}
+for (e = 0; e < L; e++) {
-		/*
+for (d = 0; d < L; d++) {
-		 for (j = 0; j < N; j++)
+cov[d][e] += u[e*L+d];
-		 {
+}
-			 a[i][j] /= s;
+}
-		 }
+}
-		 */
-	}
+for (d = 0; d < L; d++) {
+for (e = 0; e < L; e++) {
-	/* NB: now we need to sum gamma over all t */
+cov[d][e] /= T; /* sum_sum_gamma; */
-	for (i = 0; i < N; i++)
+}
-		sum_gamma[i] += gamma[T-1][i];
+}
-	/* re-estimate initial probs */
+//printf("sum_sum_gamma = %f\n", sum_sum_gamma); /* fine, = T IS THIS ALWAYS TRUE with pooled cov?? */
-	for (i = 0; i < N; i++)
-		p0[i] = gamma[0][i];
+/* re-estimate means */
+for (j = 0; j < N; j++) {
-	/* re-estimate covariance */
+for (d = 0; d < L; d++) {
-	int d, e;
+mu[j][d] = 0;
-	double sum_sum_gamma = 0;
+for (t = 0; t < T; t++)
-	for (i = 0; i < N; i++)
+mu[j][d] += gamma[t][j] * x[t][d];
-		sum_sum_gamma += sum_gamma[i];
+mu[j][d] /= sum_gamma[j];
+}
-	/*
+}
-	 for (d = 0; d < L; d++)
-	 {
+/* deallocate memory */
-		 for (e = d; e < L; e++)
+free(sum_gamma);
-		 {
+free(yy);
-			 cov[d][e] = 0;
+free(yy2);
-			 for (t = 0; t < T; t++)
+free(u);
-				 for (j = 0; j < N; j++)
+}
-					 cov[d][e] += gamma[t][j] * (x[t][d] - mu[j][d]) * (x[t][e] - mu[j][e]);
+void forward_backwards(double*** xi, double** gamma,
-			 cov[d][e] /= sum_sum_gamma;
+double* loglik, double* loglik1, double* loglik2,
+int iter, int N, int T,
-			 if (ISNAN(cov[d][e]))
+double* p0, double** a, double** b)
-			 {
+{
-				 printf("cov[%d][%d] was nan\n", d, e);
+/* forwards-backwards with scaling */
-				 for (j = 0; j < N; j++)
+int i, j, t;
-					 for (i = 0; i < L; i++)
-						 if (ISNAN(mu[j][i]))
+double** alpha = (double**) malloc(T*sizeof(double*));
-							 printf("mu[%d][%d] was nan\n", j, i);
+double** beta = (double**) malloc(T*sizeof(double*));
-				 for (t = 0; t < T; t++)
+for (t = 0; t < T; t++) {
-					 for (j = 0; j < N; j++)
+alpha[t] = (double*) malloc(N*sizeof(double));
-						 if (ISNAN(gamma[t][j]))
+beta[t] = (double*) malloc(N*sizeof(double));
-							 printf("gamma[%d][%d] was nan\n", t, j);
+}
-				 exit(-1);
-			 }
+/* scaling coefficients */
-		 }
+double* c = (double*) malloc(T*sizeof(double));
-	 }
-	 for (d = 0; d < L; d++)
+/* calculate forward probs and scale coefficients */
-	 for (e = 0; e < d; e++)
+c[0] = 0;
-	 cov[d][e] = cov[e][d];
+for (i = 0; i < N; i++) {
-	 */
+alpha[0][i] = p0[i] * b[0][i];
+c[0] += alpha[0][i];
-	/* using BLAS */
+}
-	for (d = 0; d < L; d++)
+c[0] = 1 / c[0];
-		for (e = 0; e < L; e++)
+for (i = 0; i < N; i++) {
-			cov[d][e] = 0;
+alpha[0][i] *= c[0];
+}
-	for (j = 0; j < N; j++)
-	{
+*loglik1 = *loglik;
-		for (d = 0; d < L; d++)
+*loglik = -log(c[0]);
-			for (t = 0; t < T; t++)
+if (iter == 2) {
-			{
+*loglik2 = *loglik;
-				yy[d*T+t] = x[t][d] - mu[j][d];
+}
-				yy2[d*T+t] = gamma[t][j] * (x[t][d] - mu[j][d]);
-			}
+for (t = 1; t < T; t++) {
-				cblas_dgemm(CblasColMajor, CblasTrans, CblasNoTrans, L, L, T, 1.0, yy, T, yy2, T, 0, u, L);
+c[t] = 0;
-		for (e = 0; e < L; e++)
+for (j = 0; j < N; j++) {
-			for (d = 0; d < L; d++)
+alpha[t][j] = 0;
-				cov[d][e] += u[e*L+d];
+for (i = 0; i < N; i++) {
-	}
+alpha[t][j] += alpha[t-1][i] * a[i][j];
+}
-	for (d = 0; d < L; d++)
+alpha[t][j] *= b[t][j];
-		for (e = 0; e < L; e++)
-			cov[d][e] /= T; /* sum_sum_gamma; */
+c[t] += alpha[t][j];
+}
-	//printf("sum_sum_gamma = %f\n", sum_sum_gamma); /* fine, = T IS THIS ALWAYS TRUE with pooled cov?? */
+c[t] = 1 / c[t];
-	/* re-estimate means */
+for (j = 0; j < N; j++) {
-	for (j = 0; j < N; j++)
+alpha[t][j] *= c[t];
-	{
+}
-		for (d = 0; d < L; d++)
-		{
+*loglik -= log(c[t]);
-			mu[j][d] = 0;
+}
-			for (t = 0; t < T; t++)
-				mu[j][d] += gamma[t][j] * x[t][d];
+/* calculate backwards probs using same coefficients */
-			mu[j][d] /= sum_gamma[j];
+for (i = 0; i < N; i++) {
-		}
+beta[T-1][i] = 1;
-	}
+}
+t = T - 1;
-	/* deallocate memory */
-	free(sum_gamma);
+while (1) {
-	free(yy);
+for (i = 0; i < N; i++) {
-	free(yy2);
+beta[t][i] *= c[t];
-	free(u);
+}
-}
+if (t == 0) {
-void forward_backwards(double*** xi, double** gamma, double* loglik, double* loglik1, double* loglik2, int iter, int N, int T, double* p0, double** a, double** b)
+break;
-{
+}
-	/* forwards-backwards with scaling */
-	int i, j, t;
+for (i = 0; i < N; i++) {
+beta[t-1][i] = 0;
-	double** alpha = (double**) malloc(T*sizeof(double*));
+for (j = 0; j < N; j++) {
-	double** beta = (double**) malloc(T*sizeof(double*));
+beta[t-1][i] += a[i][j] * b[t][j] * beta[t][j];
-	for (t = 0; t < T; t++)
+}
-	{
+}
-		alpha[t] = (double*) malloc(N*sizeof(double));
-		beta[t] = (double*) malloc(N*sizeof(double));
+t--;
-	}
+}
-	/* scaling coefficients */
+/* calculate posterior probs */
-	double* c = (double*) malloc(T*sizeof(double));
+double tot;
+for (t = 0; t < T; t++) {
-	/* calculate forward probs and scale coefficients */
+tot = 0;
-	c[0] = 0;
+for (i = 0; i < N; i++) {
-	for (i = 0; i < N; i++)
+gamma[t][i] = alpha[t][i] * beta[t][i];
-	{
+tot += gamma[t][i];
-		alpha[0][i] = p0[i] * b[0][i];
+}
-		c[0] += alpha[0][i];
+for (i = 0; i < N; i++) {
+gamma[t][i] /= tot;
-		//printf("p0[%d] = %f, b[0][%d] = %f\n", i, p0[i], i, b[0][i]);
+}
-	}
+}
-	c[0] = 1 / c[0];
-	for (i = 0; i < N; i++)
+for (t = 0; t < T-1; t++) {
-	{
+tot = 0;
-		alpha[0][i] *= c[0];
+for (i = 0; i < N; i++) {
+for (j = 0; j < N; j++) {
-		//printf("alpha[0][%d] = %f\n", i, alpha[0][i]);	/* OK agrees with Matlab */
+xi[t][i][j] = alpha[t][i] * a[i][j] * b[t+1][j] * beta[t+1][j];
-	}
+tot += xi[t][i][j];
+}
-	*loglik1 = *loglik;
+}
-	*loglik = -log(c[0]);
+for (i = 0; i < N; i++) {
-	if (iter == 2)
+for (j = 0; j < N; j++) {
-		*loglik2 = *loglik;
+xi[t][i][j] /= tot;
+}
-	for (t = 1; t < T; t++)
+}
-	{
+}
-		c[t] = 0;
-		for (j = 0; j < N; j++)
+for (t = 0; t < T; t++) {
-		{
+free(alpha[t]);
-			alpha[t][j] = 0;
+free(beta[t]);
-			for (i = 0; i < N; i++)
+}
-				alpha[t][j] += alpha[t-1][i] * a[i][j];
+free(alpha);
-			alpha[t][j] *= b[t][j];
+free(beta);
+free(c);
-			c[t] += alpha[t][j];
-		}
-		/*
-		 if (c[t] == 0)
-		 {
-			 printf("c[%d] = 0, going to blow up so exiting\n", t);
-			 for (i = 0; i < N; i++)
-				 if (b[t][i] == 0)
-					 fprintf(stderr, "b[%d][%d] was zero\n", t, i);
-			 fprintf(stderr, "x[t] was \n");
-			 for (i = 0; i < L; i++)
-				 fprintf(stderr, "%f ", x[t][i]);
-			 fprintf(stderr, "\n\n");
-			 exit(-1);
-		 }
-		 */
-		c[t] = 1 / c[t];
-		for (j = 0; j < N; j++)
-			alpha[t][j] *= c[t];
-		//printf("c[%d] = %e\n", t, c[t]);
-		*loglik -= log(c[t]);
-	}
-	/* calculate backwards probs using same coefficients */
-	for (i = 0; i < N; i++)
-		beta[T-1][i] = 1;
-	t = T - 1;
-	while (1)
-	{
-		for (i = 0; i < N; i++)
-			beta[t][i] *= c[t];
-		if (t == 0)
-			break;
-		for (i = 0; i < N; i++)
-		{
-			beta[t-1][i] = 0;
-			for (j = 0; j < N; j++)
-				beta[t-1][i] += a[i][j] * b[t][j] * beta[t][j];
-		}
-		t--;
-	}
-	/*
-	 printf("alpha:\n");
-	 for (t = 0; t < T; t++)
-	 {
-		 for (i = 0; i < N; i++)
-			 printf("%4.4e\t\t", alpha[t][i]);
-		 printf("\n");
-	 }
-	 printf("\n\n");printf("beta:\n");
-	 for (t = 0; t < T; t++)
-	 {
-		 for (i = 0; i < N; i++)
-			 printf("%4.4e\t\t", beta[t][i]);
-		 printf("\n");
-	 }
-	 printf("\n\n");
-	 */
-	/* calculate posterior probs */
-	double tot;
-	for (t = 0; t < T; t++)
-	{
-		tot = 0;
-		for (i = 0; i < N; i++)
-		{
-			gamma[t][i] = alpha[t][i] * beta[t][i];
-			tot += gamma[t][i];
-		}
-		for (i = 0; i < N; i++)
-		{
-			gamma[t][i] /= tot;
-			//printf("gamma[%d][%d] = %f\n", t, i, gamma[t][i]);
-		}
-	}
-	for (t = 0; t < T-1; t++)
-	{
-		tot = 0;
-		for (i = 0; i < N; i++)
-		{
-			for (j = 0; j < N; j++)
-			{
-				xi[t][i][j] = alpha[t][i] * a[i][j] * b[t+1][j] * beta[t+1][j];
-				tot += xi[t][i][j];
-			}
-		}
-		for (i = 0; i < N; i++)
-			for (j = 0; j < N; j++)
-				xi[t][i][j] /= tot;
-	}
-	/*
-	 // CHECK - fine
-	 // gamma[t][i] = \sum_j{xi[t][i][j]}
-	 tot = 0;
-	 for (j = 0; j < N; j++)
-	 tot += xi[3][1][j];
-	 printf("gamma[3][1] = %f, sum_j(xi[3][1][j]) = %f\n", gamma[3][1], tot);
-	 */
-	for (t = 0; t < T; t++)
-	{
-		free(alpha[t]);
-		free(beta[t]);
-	}
-	free(alpha);
-	free(beta);
-	free(c);
 }
 void viterbi_decode(double** x, int T, model_t* model, int* q)
 {
-	int i, j, t;
+int i, j, t;
-	double max;
+double max;
-	int havemax;
+int havemax;
-	int N = model->N;
+int N = model->N;
-	int L = model->L;
+int L = model->L;
-	double* p0 = model->p0;
+double* p0 = model->p0;
-	double** a = model->a;
+double** a = model->a;
-	double** mu = model->mu;
+double** mu = model->mu;
-	double** cov = model->cov;
+double** cov = model->cov;
-	/* inverse covariance and its determinant */
+/* inverse covariance and its determinant */
-	double** icov = (double**) malloc(L*sizeof(double*));
+double** icov = (double**) malloc(L*sizeof(double*));
-	for (i = 0; i < L; i++)
+for (i = 0; i < L; i++) {
-		icov[i] = (double*) malloc(L*sizeof(double));
+icov[i] = (double*) malloc(L*sizeof(double));
-	double detcov;
+}
+double detcov;
-	double** logb = (double**) malloc(T*sizeof(double*));
-	double** phi = (double**) malloc(T*sizeof(double*));
+double** logb = (double**) malloc(T*sizeof(double*));
-	int** psi = (int**) malloc(T*sizeof(int*));
+double** phi = (double**) malloc(T*sizeof(double*));
-	for (t = 0; t < T; t++)
+int** psi = (int**) malloc(T*sizeof(int*));
-	{
-		logb[t] = (double*) malloc(N*sizeof(double));
+for (t = 0; t < T; t++) {
-		phi[t] = (double*) malloc(N*sizeof(double));
+logb[t] = (double*) malloc(N*sizeof(double));
-		psi[t] = (int*) malloc(N*sizeof(int));
+phi[t] = (double*) malloc(N*sizeof(double));
-	}
+psi[t] = (int*) malloc(N*sizeof(int));
+}
-	/* temporary memory */
-	double* gauss_y = (double*) malloc(L*sizeof(double));
+/* temporary memory */
-	double* gauss_z = (double*) malloc(L*sizeof(double));
+double* gauss_y = (double*) malloc(L*sizeof(double));
+double* gauss_z = (double*) malloc(L*sizeof(double));
-	/* calculate observation logprobs */
-	invert(cov, L, icov, &detcov);
+/* calculate observation logprobs */
-	for (t = 0; t < T; t++)
+invert(cov, L, icov, &detcov);
-		for (i = 0; i < N; i++)
+for (t = 0; t < T; t++) {
-			logb[t][i] = loggauss(x[t], L, mu[i], icov, detcov, gauss_y, gauss_z);
+for (i = 0; i < N; i++) {
+logb[t][i] = loggauss
-	/* initialise */
+(x[t], L, mu[i], icov, detcov, gauss_y, gauss_z);
-	for (i = 0; i < N; i++)
+}
-	{
+}
-		phi[0][i] = log(p0[i]) + logb[0][i];
-		psi[0][i] = 0;
+/* initialise */
-	}
+for (i = 0; i < N; i++) {
+phi[0][i] = log(p0[i]) + logb[0][i];
-	for (t = 1; t < T; t++)
+psi[0][i] = 0;
-	{
+}
-		for (j = 0; j < N; j++)
-		{
+for (t = 1; t < T; t++) {
-			max = -1000000;
+for (j = 0; j < N; j++) {
-			havemax = 0;
+max = -1000000;
+havemax = 0;
-			psi[t][j] = 0;
-			for (i = 0; i < N; i++)
+psi[t][j] = 0;
-			{
+for (i = 0; i < N; i++) {
-				if (phi[t-1][i] + log(a[i][j]) > max || !havemax)
+if (phi[t-1][i] + log(a[i][j]) > max || !havemax) {
-				{
+max = phi[t-1][i] + log(a[i][j]);
-					max = phi[t-1][i] + log(a[i][j]);
+phi[t][j] = max + logb[t][j];
-					phi[t][j] = max + logb[t][j];
+psi[t][j] = i;
-					psi[t][j] = i;
+havemax = 1;
-					havemax = 1;
+}
-				}
+}
-			}
+}
-		}
+}
-	}
+/* find maximising state at time T-1 */
-	/* find maximising state at time T-1 */
+max = phi[T-1][0];
-	max = phi[T-1][0];
+q[T-1] = 0;
-	q[T-1] = 0;
+for (i = 1; i < N; i++) {
-	for (i = 1; i < N; i++)
+if (phi[T-1][i] > max) {
-	{
+max = phi[T-1][i];
-		if (phi[T-1][i] > max)
+q[T-1] = i;
-		{
+}
-			max = phi[T-1][i];
+}
-			q[T-1] = i;
-		}
+/* track back */
-	}
+t = T - 2;
+while (t >= 0) {
+q[t] = psi[t+1][q[t+1]];
-	/* track back */
+t--;
-	t = T - 2;
+}
-	while (t >= 0)
-	{
+/* de-allocate memory */
-		q[t] = psi[t+1][q[t+1]];
+for (i = 0; i < L; i++) {
-		t--;
+free(icov[i]);
-	}
+}
+free(icov);
-	/* de-allocate memory */
+for (t = 0; t < T; t++) {
-	for (i = 0; i < L; i++)
+free(logb[t]);
-		free(icov[i]);
+free(phi[t]);
-	free(icov);
+free(psi[t]);
-	for (t = 0; t < T; t++)
+}
-	{
+free(logb);
-		free(logb[t]);
+free(phi);
-		free(phi[t]);
+free(psi);
-		free(psi[t]);
-	}
+free(gauss_y);
-	free(logb);
+free(gauss_z);
-	free(phi);
-	free(psi);
-	free(gauss_y);
-	free(gauss_z);
 }
 /* invert matrix and calculate determinant using LAPACK */
 void invert(double** cov, int L, double** icov, double* detcov)
 {
-	/* copy square matrix into a vector in column-major order */
+/* copy square matrix into a vector in column-major order */
-	double* a = (double*) malloc(L*L*sizeof(double));
+double* a = (double*) malloc(L*L*sizeof(double));
-	int i, j;
+int i, j;
-	for(j=0; j < L; j++)
+for (j=0; j < L; j++) {
-		for (i=0; i < L; i++)
+for (i=0; i < L; i++) {
-			a[j*L+i] = cov[i][j];
+a[j*L+i] = cov[i][j];
+}
-	int M = (int) L;
+}
-	int* ipiv = (int *) malloc(L*L*sizeof(int));
-	int ret;
+int M = (int) L;
+int* ipiv = (int *) malloc(L*L*sizeof(int));
-	/* LU decomposition */
+int ret;
-	ret = dgetrf_(&M, &M, a, &M, ipiv, &ret);	/* ret should be zero, negative if cov is singular */
-	if (ret < 0)
+/* LU decomposition */
-	{
+ret = dgetrf_(&M, &M, a, &M, ipiv, &ret);	/* ret should be zero, negative if cov is singular */
-		fprintf(stderr, "Covariance matrix was singular, couldn't invert\n");
+if (ret < 0) {
-		exit(-1);
+fprintf(stderr, "Covariance matrix was singular, couldn't invert\n");
-	}
+exit(-1);
+}
-	/* find determinant */
-	double det = 1;
+/* find determinant */
-	for(i = 0; i < L; i++)
+double det = 1;
-		det *= a[i*L+i];
+for (i = 0; i < L; i++) {
-	// TODO: get this to work!!! If detcov < 0 then cov is bad anyway...
+det *= a[i*L+i];
-	/*
+}
-	int sign = 1;
-	for (i = 0; i < L; i++)
+// TODO: get this to work!!! If detcov < 0 then cov is bad anyway...
-		if (ipiv[i] != i)
+if (det < 0) {
-			sign = -sign;
+det = -det;
-	det *= sign;
+}
-	 */
+*detcov = det;
-	if (det < 0)
-		det = -det;
+/* allocate required working storage */
-	*detcov = det;
-	/* allocate required working storage */
 #ifndef HAVE_ATLAS
-	int lwork = -1;
+int lwork = -1;
-	double lwbest = 0.0;
+double lwbest = 0.0;
-	dgetri_(&M, a, &M, ipiv, &lwbest, &lwork, &ret);
+dgetri_(&M, a, &M, ipiv, &lwbest, &lwork, &ret);
-	lwork = (int) lwbest;
+lwork = (int) lwbest;
-	double* work  = (double*) malloc(lwork*sizeof(double));
+double* work  = (double*) malloc(lwork*sizeof(double));
 #endif
-	/* find inverse */
+/* find inverse */
-	dgetri_(&M, a, &M, ipiv, work, &lwork, &ret);
+dgetri_(&M, a, &M, ipiv, work, &lwork, &ret);
-	for(j=0; j < L; j++)
+for (j=0; j < L; j++) {
-		for (i=0; i < L; i++)
+for (i=0; i < L; i++) {
-			icov[i][j] = a[j*L+i];
+icov[i][j] = a[j*L+i];
+}
+}
 #ifndef HAVE_ATLAS
-	free(work);
+free(work);
 #endif
-	free(a);
+free(a);
 }
 /* probability of multivariate Gaussian given mean, inverse and determinant of covariance */
 double gauss(double* x, int L, double* mu, double** icov, double detcov, double* y, double* z)
 {
-	int i;
+int i;
-	double s = 0;
+double s = 0;
-	for (i = 0; i < L; i++)
-		y[i] = x[i] - mu[i];
+for (i = 0; i < L; i++) {
-	for (i = 0; i < L; i++)
+y[i] = x[i] - mu[i];
-	{
+}
-		//z[i] = 0;
-		//for (j = 0; j < L; j++)
+for (i = 0; i < L; i++) {
-		//	z[i] += icov[i][j] *  y[j];
+z[i] = cblas_ddot(L, &icov[i][0], 1, y, 1);
-		z[i] = cblas_ddot(L, &icov[i][0], 1, y, 1);
+}
-	}
-	s = cblas_ddot(L, z, 1, y, 1);
+s = cblas_ddot(L, z, 1, y, 1);
-	//for (i = 0; i < L; i++)
-	//	s += z[i] * y[i];
+return exp(-s/2.0) / (pow(2*PI, L/2.0) * sqrt(detcov));
-	return exp(-s/2.0) / (pow(2*PI, L/2.0) * sqrt(detcov));
 }
 /* log probability of multivariate Gaussian given mean, inverse and determinant of covariance */
 double loggauss(double* x, int L, double* mu, double** icov, double detcov, double* y, double* z)
 {
-	int i;
+int i;
-	double s = 0;
+double s = 0;
-	double ret;
+double ret;
-	for (i = 0; i < L; i++)
-		y[i] = x[i] - mu[i];
+for (i = 0; i < L; i++) {
-	for (i = 0; i < L; i++)
+y[i] = x[i] - mu[i];
-	{
+}
-		//z[i] = 0;
-		//for (j = 0; j < L; j++)
+for (i = 0; i < L; i++) {
-		//	z[i] += icov[i][j] *  y[j];
+z[i] = cblas_ddot(L, &icov[i][0], 1, y, 1);
-		z[i] = cblas_ddot(L, &icov[i][0], 1, y, 1);
+}
-	}
-	s = cblas_ddot(L, z, 1, y, 1);
+s = cblas_ddot(L, z, 1, y, 1);
-	//for (i = 0; i < L; i++)
-	//	s += z[i] * y[i];
+ret = -0.5 * (s + L * log(2*PI) + log(detcov));
-	ret = -0.5 * (s + L * log(2*PI) + log(detcov));
+return ret;
-	/*
-	// TEST
-	if (ISINF(ret) > 0)
-		printf("loggauss returning infinity\n");
-	if (ISINF(ret) < 0)
-		printf("loggauss returning -infinity\n");
-	if (ISNAN(ret))
-		printf("loggauss returning nan\n");
-	*/
-	return ret;
 }
 void hmm_print(model_t* model)
 {
-	int i, j;
+int i, j;
-	printf("p0:\n");
+printf("p0:\n");
-	for (i = 0; i < model->N; i++)
+for (i = 0; i < model->N; i++) {
-		printf("%f ", model->p0[i]);
+printf("%f ", model->p0[i]);
-	printf("\n\n");
+}
-	printf("a:\n");
+printf("\n\n");
-	for (i = 0; i < model->N; i++)
+printf("a:\n");
-	{
+for (i = 0; i < model->N; i++) {
-		for (j = 0; j < model->N; j++)
+for (j = 0; j < model->N; j++) {
-			printf("%f ", model->a[i][j]);
+printf("%f ", model->a[i][j]);
-		printf("\n");
+}
-	}
+printf("\n");
-	printf("\n\n");
+}
-	printf("mu:\n");
+printf("\n\n");
-	for (i = 0; i < model->N; i++)
+printf("mu:\n");
-	{
+for (i = 0; i < model->N; i++) {
-		for (j = 0; j < model->L; j++)
+for (j = 0; j < model->L; j++) {
-			printf("%f ", model->mu[i][j]);
+printf("%f ", model->mu[i][j]);
-		printf("\n");
+}
-	}
+printf("\n");
-	printf("\n\n");
+}
-	printf("cov:\n");
+printf("\n\n");
-	for (i = 0; i < model->L; i++)
+printf("cov:\n");
-	{
+for (i = 0; i < model->L; i++) {
-		for (j = 0; j < model->L; j++)
+for (j = 0; j < model->L; j++) {
-			printf("%f ", model->cov[i][j]);
+printf("%f ", model->cov[i][j]);
-		printf("\n");
+}
-	}
+printf("\n");
-	printf("\n\n");
+}
-}
+printf("\n\n");
+}

Mercurial > hg > qm-dsp

comparison hmm/hmm.c @ 483:fdaa63607c15