summaryrefslogtreecommitdiffstats
path: root/media/pocketsphinx/src/ps_mllr.c
diff options
context:
space:
mode:
Diffstat (limited to 'media/pocketsphinx/src/ps_mllr.c')
-rw-r--r--media/pocketsphinx/src/ps_mllr.c169
1 files changed, 169 insertions, 0 deletions
diff --git a/media/pocketsphinx/src/ps_mllr.c b/media/pocketsphinx/src/ps_mllr.c
new file mode 100644
index 000000000..b43f6fbdb
--- /dev/null
+++ b/media/pocketsphinx/src/ps_mllr.c
@@ -0,0 +1,169 @@
+/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
+/* ====================================================================
+ * Copyright (c) 2009 Carnegie Mellon University. All rights
+ * reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ *
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in
+ * the documentation and/or other materials provided with the
+ * distribution.
+ *
+ * This work was supported in part by funding from the Defense Advanced
+ * Research Projects Agency and the National Science Foundation of the
+ * United States of America, and the CMU Sphinx Speech Consortium.
+ *
+ * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
+ * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
+ * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
+ * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+ * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+ * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ *
+ * ====================================================================
+ *
+ */
+
+/**
+ * @file ps_mllr.c Model-space linear transforms for speaker adaptation
+ */
+
+/* System headers. */
+#include <stdio.h>
+
+/* SphinxBase headers. */
+#include <sphinxbase/ckd_alloc.h>
+
+/* Local headers. */
+#include "acmod.h"
+
+ps_mllr_t *
+ps_mllr_read(char const *regmatfile)
+{
+ ps_mllr_t *mllr;
+ FILE *fp;
+ int n, i, m, j, k;
+
+ mllr = ckd_calloc(1, sizeof(*mllr));
+ mllr->refcnt = 1;
+
+ if ((fp = fopen(regmatfile, "r")) == NULL) {
+ E_ERROR_SYSTEM("Failed to open MLLR file '%s' for reading", regmatfile);
+ goto error_out;
+ }
+ else
+ E_INFO("Reading MLLR transformation file '%s'\n", regmatfile);
+
+ if ((fscanf(fp, "%d", &n) != 1) || (n < 1)) {
+ E_ERROR("Failed to read number of MLLR classes\n");
+ goto error_out;
+ }
+ mllr->n_class = n;
+
+ if ((fscanf(fp, "%d", &n) != 1)) {
+ E_ERROR("Failed to read number of feature streams\n");
+ goto error_out;
+ }
+ mllr->n_feat = n;
+ mllr->veclen = ckd_calloc(mllr->n_feat, sizeof(*mllr->veclen));
+
+ mllr->A = (float32 ****) ckd_calloc(mllr->n_feat, sizeof(float32 **));
+ mllr->b = (float32 ***) ckd_calloc(mllr->n_feat, sizeof(float32 *));
+ mllr->h = (float32 ***) ckd_calloc(mllr->n_feat, sizeof(float32 *));
+
+ for (i = 0; i < mllr->n_feat; ++i) {
+ if (fscanf(fp, "%d", &n) != 1) {
+ E_ERROR("Failed to read stream length for feature %d\n", i);
+ goto error_out;
+ }
+ mllr->veclen[i] = n;
+ mllr->A[i] =
+ (float32 ***) ckd_calloc_3d(mllr->n_class, mllr->veclen[i],
+ mllr->veclen[i], sizeof(float32));
+ mllr->b[i] =
+ (float32 **) ckd_calloc_2d(mllr->n_class, mllr->veclen[i],
+ sizeof(float32));
+ mllr->h[i] =
+ (float32 **) ckd_calloc_2d(mllr->n_class, mllr->veclen[i],
+ sizeof(float32));
+
+ for (m = 0; m < mllr->n_class; ++m) {
+ for (j = 0; j < mllr->veclen[i]; ++j) {
+ for (k = 0; k < mllr->veclen[i]; ++k) {
+ if (fscanf(fp, "%f ", &mllr->A[i][m][j][k]) != 1) {
+ E_ERROR("Failed reading MLLR rotation (%d,%d,%d,%d)\n",
+ i, m, j, k);
+ goto error_out;
+ }
+ }
+ }
+ for (j = 0; j < mllr->veclen[i]; ++j) {
+ if (fscanf(fp, "%f ", &mllr->b[i][m][j]) != 1) {
+ E_ERROR("Failed reading MLLR bias (%d,%d,%d)\n",
+ i, m, j);
+ goto error_out;
+ }
+ }
+ for (j = 0; j < mllr->veclen[i]; ++j) {
+ if (fscanf(fp, "%f ", &mllr->h[i][m][j]) != 1) {
+ E_ERROR("Failed reading MLLR variance scale (%d,%d,%d)\n",
+ i, m, j);
+ goto error_out;
+ }
+ }
+ }
+ }
+ fclose(fp);
+ return mllr;
+
+error_out:
+ if (fp)
+ fclose(fp);
+ ps_mllr_free(mllr);
+ return NULL;
+}
+
+ps_mllr_t *
+ps_mllr_retain(ps_mllr_t *mllr)
+{
+ ++mllr->refcnt;
+ return mllr;
+}
+
+int
+ps_mllr_free(ps_mllr_t *mllr)
+{
+ int i;
+
+ if (mllr == NULL)
+ return 0;
+ if (--mllr->refcnt > 0)
+ return mllr->refcnt;
+
+ for (i = 0; i < mllr->n_feat; ++i) {
+ if (mllr->A)
+ ckd_free_3d(mllr->A[i]);
+ if (mllr->b)
+ ckd_free_2d(mllr->b[i]);
+ if (mllr->h)
+ ckd_free_2d(mllr->h[i]);
+ }
+ ckd_free(mllr->veclen);
+ ckd_free(mllr->A);
+ ckd_free(mllr->b);
+ ckd_free(mllr->h);
+ ckd_free(mllr);
+
+ return 0;
+}