summaryrefslogtreecommitdiffstats
path: root/media/sphinxbase/src/libsphinxbase/fe
diff options
context:
space:
mode:
Diffstat (limited to 'media/sphinxbase/src/libsphinxbase/fe')
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_interface.c776
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_internal.h216
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_noise.c425
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_noise.h66
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.c182
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.h79
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_sigproc.c1377
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_type.h65
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp.c252
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp.h90
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.c181
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.h76
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.c178
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.h77
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.c223
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.h77
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/fixlog.c229
-rw-r--r--media/sphinxbase/src/libsphinxbase/fe/yin.c412
18 files changed, 0 insertions, 4981 deletions
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_interface.c b/media/sphinxbase/src/libsphinxbase/fe/fe_interface.c
deleted file mode 100644
index cd2e1e2db..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_interface.c
+++ /dev/null
@@ -1,776 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 1996-2004 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-#include <stdio.h>
-#include <string.h>
-#include <math.h>
-#include <stdlib.h>
-#include <assert.h>
-#ifdef _WIN32_WCE
-#include <windows.h>
-#else
-#include <time.h>
-#endif
-
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-
-#include "sphinxbase/prim_type.h"
-#include "sphinxbase/byteorder.h"
-#include "sphinxbase/fixpoint.h"
-#include "sphinxbase/genrand.h"
-#include "sphinxbase/err.h"
-#include "sphinxbase/cmd_ln.h"
-#include "sphinxbase/ckd_alloc.h"
-
-#include "fe_internal.h"
-#include "fe_warp.h"
-
-static const arg_t fe_args[] = {
- waveform_to_cepstral_command_line_macro(),
- { NULL, 0, NULL, NULL }
-};
-
-int
-fe_parse_general_params(cmd_ln_t *config, fe_t * fe)
-{
- int j, frate;
-
- fe->config = config;
- fe->sampling_rate = cmd_ln_float32_r(config, "-samprate");
- frate = cmd_ln_int32_r(config, "-frate");
- if (frate > MAX_INT16 || frate > fe->sampling_rate || frate < 1) {
- E_ERROR
- ("Frame rate %d can not be bigger than sample rate %.02f\n",
- frate, fe->sampling_rate);
- return -1;
- }
-
- fe->frame_rate = (int16)frate;
- if (cmd_ln_boolean_r(config, "-dither")) {
- fe->dither = 1;
- fe->seed = cmd_ln_int32_r(config, "-seed");
- }
-#ifdef WORDS_BIGENDIAN
- fe->swap = strcmp("big", cmd_ln_str_r(config, "-input_endian")) == 0 ? 0 : 1;
-#else
- fe->swap = strcmp("little", cmd_ln_str_r(config, "-input_endian")) == 0 ? 0 : 1;
-#endif
- fe->window_length = cmd_ln_float32_r(config, "-wlen");
- fe->pre_emphasis_alpha = cmd_ln_float32_r(config, "-alpha");
-
- fe->num_cepstra = (uint8)cmd_ln_int32_r(config, "-ncep");
- fe->fft_size = (int16)cmd_ln_int32_r(config, "-nfft");
-
- /* Check FFT size, compute FFT order (log_2(n)) */
- for (j = fe->fft_size, fe->fft_order = 0; j > 1; j >>= 1, fe->fft_order++) {
- if (((j % 2) != 0) || (fe->fft_size <= 0)) {
- E_ERROR("fft: number of points must be a power of 2 (is %d)\n",
- fe->fft_size);
- return -1;
- }
- }
- /* Verify that FFT size is greater or equal to window length. */
- if (fe->fft_size < (int)(fe->window_length * fe->sampling_rate)) {
- E_ERROR("FFT: Number of points must be greater or equal to frame size (%d samples)\n",
- (int)(fe->window_length * fe->sampling_rate));
- return -1;
- }
-
- fe->prespch_len = (int16)cmd_ln_int32_r(config, "-vad_prespeech");
- fe->postspch_len = (int16)cmd_ln_int32_r(config, "-vad_postspeech");
- fe->vad_threshold = cmd_ln_float32_r(config, "-vad_threshold");
-
- fe->remove_dc = cmd_ln_boolean_r(config, "-remove_dc");
- fe->remove_noise = cmd_ln_boolean_r(config, "-remove_noise");
- fe->remove_silence = cmd_ln_boolean_r(config, "-remove_silence");
-
- if (0 == strcmp(cmd_ln_str_r(config, "-transform"), "dct"))
- fe->transform = DCT_II;
- else if (0 == strcmp(cmd_ln_str_r(config, "-transform"), "legacy"))
- fe->transform = LEGACY_DCT;
- else if (0 == strcmp(cmd_ln_str_r(config, "-transform"), "htk"))
- fe->transform = DCT_HTK;
- else {
- E_ERROR("Invalid transform type (values are 'dct', 'legacy', 'htk')\n");
- return -1;
- }
-
- if (cmd_ln_boolean_r(config, "-logspec"))
- fe->log_spec = RAW_LOG_SPEC;
- if (cmd_ln_boolean_r(config, "-smoothspec"))
- fe->log_spec = SMOOTH_LOG_SPEC;
-
- return 0;
-}
-
-static int
-fe_parse_melfb_params(cmd_ln_t *config, fe_t *fe, melfb_t * mel)
-{
- mel->sampling_rate = fe->sampling_rate;
- mel->fft_size = fe->fft_size;
- mel->num_cepstra = fe->num_cepstra;
- mel->num_filters = cmd_ln_int32_r(config, "-nfilt");
-
- if (fe->log_spec)
- fe->feature_dimension = mel->num_filters;
- else
- fe->feature_dimension = fe->num_cepstra;
-
- mel->upper_filt_freq = cmd_ln_float32_r(config, "-upperf");
- mel->lower_filt_freq = cmd_ln_float32_r(config, "-lowerf");
-
- mel->doublewide = cmd_ln_boolean_r(config, "-doublebw");
-
- mel->warp_type = cmd_ln_str_r(config, "-warp_type");
- mel->warp_params = cmd_ln_str_r(config, "-warp_params");
- mel->lifter_val = cmd_ln_int32_r(config, "-lifter");
-
- mel->unit_area = cmd_ln_boolean_r(config, "-unit_area");
- mel->round_filters = cmd_ln_boolean_r(config, "-round_filters");
-
- if (fe_warp_set(mel, mel->warp_type) != FE_SUCCESS) {
- E_ERROR("Failed to initialize the warping function.\n");
- return -1;
- }
- fe_warp_set_parameters(mel, mel->warp_params, mel->sampling_rate);
- return 0;
-}
-
-void
-fe_print_current(fe_t const *fe)
-{
- E_INFO("Current FE Parameters:\n");
- E_INFO("\tSampling Rate: %f\n", fe->sampling_rate);
- E_INFO("\tFrame Size: %d\n", fe->frame_size);
- E_INFO("\tFrame Shift: %d\n", fe->frame_shift);
- E_INFO("\tFFT Size: %d\n", fe->fft_size);
- E_INFO("\tLower Frequency: %g\n",
- fe->mel_fb->lower_filt_freq);
- E_INFO("\tUpper Frequency: %g\n",
- fe->mel_fb->upper_filt_freq);
- E_INFO("\tNumber of filters: %d\n", fe->mel_fb->num_filters);
- E_INFO("\tNumber of Overflow Samps: %d\n", fe->num_overflow_samps);
- E_INFO("\tStart Utt Status: %d\n", fe->start_flag);
- E_INFO("Will %sremove DC offset at frame level\n",
- fe->remove_dc ? "" : "not ");
- if (fe->dither) {
- E_INFO("Will add dither to audio\n");
- E_INFO("Dither seeded with %d\n", fe->seed);
- }
- else {
- E_INFO("Will not add dither to audio\n");
- }
- if (fe->mel_fb->lifter_val) {
- E_INFO("Will apply sine-curve liftering, period %d\n",
- fe->mel_fb->lifter_val);
- }
- E_INFO("Will %snormalize filters to unit area\n",
- fe->mel_fb->unit_area ? "" : "not ");
- E_INFO("Will %sround filter frequencies to DFT points\n",
- fe->mel_fb->round_filters ? "" : "not ");
- E_INFO("Will %suse double bandwidth in mel filter\n",
- fe->mel_fb->doublewide ? "" : "not ");
-}
-
-fe_t *
-fe_init_auto()
-{
- return fe_init_auto_r(cmd_ln_get());
-}
-
-fe_t *
-fe_init_auto_r(cmd_ln_t *config)
-{
- fe_t *fe;
- int prespch_frame_len;
-
- fe = (fe_t*)ckd_calloc(1, sizeof(*fe));
- fe->refcount = 1;
-
- /* transfer params to front end */
- if (fe_parse_general_params(cmd_ln_retain(config), fe) < 0) {
- fe_free(fe);
- return NULL;
- }
-
- /* compute remaining fe parameters */
- /* We add 0.5 so approximate the float with the closest
- * integer. E.g., 2.3 is truncate to 2, whereas 3.7 becomes 4
- */
- fe->frame_shift = (int32) (fe->sampling_rate / fe->frame_rate + 0.5);
- fe->frame_size = (int32) (fe->window_length * fe->sampling_rate + 0.5);
- fe->prior = 0;
-
- fe_start_stream(fe);
-
- assert (fe->frame_shift > 1);
-
- if (fe->frame_size > (fe->fft_size)) {
- E_ERROR
- ("Number of FFT points has to be a power of 2 higher than %d, it is %d\n",
- fe->frame_size, fe->fft_size);
- fe_free(fe);
- return NULL;
- }
-
- if (fe->dither)
- fe_init_dither(fe->seed);
-
- /* establish buffers for overflow samps and hamming window */
- fe->overflow_samps = ckd_calloc(fe->frame_size, sizeof(int16));
- fe->hamming_window = ckd_calloc(fe->frame_size/2, sizeof(window_t));
-
- /* create hamming window */
- fe_create_hamming(fe->hamming_window, fe->frame_size);
-
- /* init and fill appropriate filter structure */
- fe->mel_fb = ckd_calloc(1, sizeof(*fe->mel_fb));
-
- /* transfer params to mel fb */
- fe_parse_melfb_params(config, fe, fe->mel_fb);
-
- if (fe->mel_fb->upper_filt_freq > fe->sampling_rate / 2 + 1.0) {
- E_ERROR("Upper frequency %.1f is higher than samprate/2 (%.1f)\n",
- fe->mel_fb->upper_filt_freq, fe->sampling_rate / 2);
- fe_free(fe);
- return NULL;
- }
-
- fe_build_melfilters(fe->mel_fb);
-
- fe_compute_melcosine(fe->mel_fb);
- if (fe->remove_noise || fe->remove_silence)
- fe->noise_stats = fe_init_noisestats(fe->mel_fb->num_filters);
-
- fe->vad_data = (vad_data_t*)ckd_calloc(1, sizeof(*fe->vad_data));
- prespch_frame_len = fe->log_spec != RAW_LOG_SPEC ? fe->num_cepstra : fe->mel_fb->num_filters;
- fe->vad_data->prespch_buf = fe_prespch_init(fe->prespch_len + 1, prespch_frame_len, fe->frame_shift);
-
- /* Create temporary FFT, spectrum and mel-spectrum buffers. */
- /* FIXME: Gosh there are a lot of these. */
- fe->spch = ckd_calloc(fe->frame_size, sizeof(*fe->spch));
- fe->frame = ckd_calloc(fe->fft_size, sizeof(*fe->frame));
- fe->spec = ckd_calloc(fe->fft_size, sizeof(*fe->spec));
- fe->mfspec = ckd_calloc(fe->mel_fb->num_filters, sizeof(*fe->mfspec));
-
- /* create twiddle factors */
- fe->ccc = ckd_calloc(fe->fft_size / 4, sizeof(*fe->ccc));
- fe->sss = ckd_calloc(fe->fft_size / 4, sizeof(*fe->sss));
- fe_create_twiddle(fe);
-
- if (cmd_ln_boolean_r(config, "-verbose")) {
- fe_print_current(fe);
- }
-
- /*** Initialize the overflow buffers ***/
- fe_start_utt(fe);
- return fe;
-}
-
-arg_t const *
-fe_get_args(void)
-{
- return fe_args;
-}
-
-const cmd_ln_t *
-fe_get_config(fe_t *fe)
-{
- return fe->config;
-}
-
-void
-fe_init_dither(int32 seed)
-{
- if (seed < 0) {
- E_INFO("You are using the internal mechanism to generate the seed.\n");
-#ifdef _WIN32_WCE
- s3_rand_seed(GetTickCount());
-#else
- s3_rand_seed((long) time(0));
-#endif
- } else {
- E_INFO("You are using %d as the seed.\n", seed);
- s3_rand_seed(seed);
- }
-}
-
-static void
-fe_reset_vad_data(vad_data_t * vad_data)
-{
- vad_data->global_state = 0;
- vad_data->state_changed = 0;
- vad_data->prespch_num = 0;
- vad_data->postspch_num = 0;
- fe_prespch_reset_cep(vad_data->prespch_buf);
-}
-
-int32
-fe_start_utt(fe_t * fe)
-{
- fe->num_overflow_samps = 0;
- memset(fe->overflow_samps, 0, fe->frame_size * sizeof(int16));
- fe->start_flag = 1;
- fe->prior = 0;
- fe_reset_vad_data(fe->vad_data);
- return 0;
-}
-
-void
-fe_start_stream(fe_t *fe)
-{
- fe->sample_counter = 0;
- fe_reset_noisestats(fe->noise_stats);
-}
-
-int
-fe_get_output_size(fe_t *fe)
-{
- return (int)fe->feature_dimension;
-}
-
-void
-fe_get_input_size(fe_t *fe, int *out_frame_shift,
- int *out_frame_size)
-{
- if (out_frame_shift)
- *out_frame_shift = fe->frame_shift;
- if (out_frame_size)
- *out_frame_size = fe->frame_size;
-}
-
-uint8
-fe_get_vad_state(fe_t *fe)
-{
- return fe->vad_data->global_state;
-}
-
-int
-fe_process_frames(fe_t *fe,
- int16 const **inout_spch,
- size_t *inout_nsamps,
- mfcc_t **buf_cep,
- int32 *inout_nframes,
- int32 *out_frameidx)
-{
- int outidx, n_overflow, orig_n_overflow;
- int16 const *orig_spch;
- size_t orig_nsamps;
-
- /* In the special case where there is no output buffer, return the
- * maximum number of frames which would be generated. */
- if (buf_cep == NULL) {
- if (*inout_nsamps + fe->num_overflow_samps < (size_t)fe->frame_size)
- *inout_nframes = 0;
- else
- *inout_nframes = 1
- + ((*inout_nsamps + fe->num_overflow_samps - fe->frame_size)
- / fe->frame_shift);
- if (fe->vad_data->global_state)
- *inout_nframes += fe_prespch_ncep(fe->vad_data->prespch_buf);
- return *inout_nframes;
- }
-
- if (out_frameidx)
- *out_frameidx = 0;
-
- /* Are there not enough samples to make at least 1 frame? */
- if (*inout_nsamps + fe->num_overflow_samps < (size_t)fe->frame_size) {
- if (*inout_nsamps > 0) {
- /* Append them to the overflow buffer. */
- memcpy(fe->overflow_samps + fe->num_overflow_samps,
- *inout_spch, *inout_nsamps * (sizeof(int16)));
- fe->num_overflow_samps += *inout_nsamps;
- /* Update input-output pointers and counters. */
- *inout_spch += *inout_nsamps;
- *inout_nsamps = 0;
- }
- /* We produced no frames of output, sorry! */
- *inout_nframes = 0;
- return 0;
- }
-
- /* Can't write a frame? Then do nothing! */
- if (*inout_nframes < 1) {
- *inout_nframes = 0;
- return 0;
- }
-
- /* Index of output frame. */
- outidx = 0;
-
- /* Try to read from prespeech buffer */
- if (fe->vad_data->global_state) {
- while ((*inout_nframes) > 0 && fe_prespch_read_cep(fe->vad_data->prespch_buf, buf_cep[outidx]) > 0) {
- outidx++;
- (*inout_nframes)--;
- }
- if ((*inout_nframes) < 1) {
- /* mfcc buffer is filled from prespeech buffer */
- *inout_nframes = outidx;
- return 0;
- }
-
- /* Sets the start frame for the returned data so that caller can update timings */
- if (out_frameidx && fe->vad_data->state_changed) {
- *out_frameidx = fe->sample_counter / fe->frame_shift - fe->prespch_len;
- }
- }
-
- /* Keep track of the original start of the buffer. */
- orig_spch = *inout_spch;
- orig_nsamps = *inout_nsamps;
- orig_n_overflow = fe->num_overflow_samps;
-
- /* Start processing, taking care of any incoming overflow. */
- if (fe->num_overflow_samps) {
- int offset = fe->frame_size - fe->num_overflow_samps;
-
- /* Append start of spch to overflow samples to make a full frame. */
- memcpy(fe->overflow_samps + fe->num_overflow_samps,
- *inout_spch, offset * sizeof(**inout_spch));
- fe_read_frame(fe, fe->overflow_samps, fe->frame_size);
- /* Update input-output pointers and counters. */
- *inout_spch += offset;
- *inout_nsamps -= offset;
- fe->num_overflow_samps -= fe->frame_shift;
- } else {
- fe_read_frame(fe, *inout_spch, fe->frame_size);
- /* Update input-output pointers and counters. */
- *inout_spch += fe->frame_size;
- *inout_nsamps -= fe->frame_size;
- }
-
- fe_write_frame(fe, buf_cep[outidx]);
-
- if (!fe->vad_data->state_changed && fe->vad_data->global_state) {
- outidx++;
- (*inout_nframes)--;
- }
- if (fe->vad_data->state_changed && fe->vad_data->global_state) {
- /* previous frame triggered vad into speech state
- * dumping prespeech buffer */
- while ((*inout_nframes) > 0 && fe_prespch_read_cep(fe->vad_data->prespch_buf, buf_cep[outidx]) > 0) {
- outidx++;
- (*inout_nframes)--;
- }
-
- /* Sets the start frame for the returned data so that caller can update timings */
- if (out_frameidx) {
- *out_frameidx = (fe->sample_counter + orig_nsamps - *inout_nsamps) / fe->frame_shift - fe->prespch_len;
- }
- }
-
- /* Process all remaining frames. */
- while (*inout_nframes > 0 && *inout_nsamps >= (size_t)fe->frame_shift) {
- fe_shift_frame(fe, *inout_spch, fe->frame_shift);
- fe_write_frame(fe, buf_cep[outidx]);
- if (!fe->vad_data->state_changed && fe->vad_data->global_state) {
- (*inout_nframes)--;
- outidx++;
- }
- /* Update input-output pointers and counters. */
- *inout_spch += fe->frame_shift;
- *inout_nsamps -= fe->frame_shift;
- /* Amount of data behind the original input which is still needed. */
- if (fe->num_overflow_samps > 0)
- fe->num_overflow_samps -= fe->frame_shift;
-
- if (fe->vad_data->state_changed && fe->vad_data->global_state) {
- /* previous frame triggered vad into speech state */
- while (*inout_nframes > 0 && fe_prespch_read_cep(fe->vad_data->prespch_buf, buf_cep[outidx]) != 0) {
- (*inout_nframes)--;
- outidx++;
- }
- }
- }
-
- /* How many relevant overflow samples are there left? */
- if (fe->num_overflow_samps <= 0) {
- /* Maximum number of overflow samples past *inout_spch to save. */
- n_overflow = *inout_nsamps;
- if (n_overflow > fe->frame_shift)
- n_overflow = fe->frame_shift;
- fe->num_overflow_samps = fe->frame_size - fe->frame_shift;
- /* Make sure this isn't an illegal read! */
- if (fe->num_overflow_samps > *inout_spch - orig_spch)
- fe->num_overflow_samps = *inout_spch - orig_spch;
- fe->num_overflow_samps += n_overflow;
- if (fe->num_overflow_samps > 0) {
- memcpy(fe->overflow_samps,
- *inout_spch - (fe->frame_size - fe->frame_shift),
- fe->num_overflow_samps * sizeof(**inout_spch));
- /* Update the input pointer to cover this stuff. */
- *inout_spch += n_overflow;
- *inout_nsamps -= n_overflow;
- }
- } else {
- /* There is still some relevant data left in the overflow buffer. */
- /* Shift existing data to the beginning. */
- memmove(fe->overflow_samps,
- fe->overflow_samps + orig_n_overflow - fe->num_overflow_samps,
- fe->num_overflow_samps * sizeof(*fe->overflow_samps));
- /* Copy in whatever we had in the original speech buffer. */
- n_overflow = *inout_spch - orig_spch + *inout_nsamps;
- if (n_overflow > fe->frame_size - fe->num_overflow_samps)
- n_overflow = fe->frame_size - fe->num_overflow_samps;
- memcpy(fe->overflow_samps + fe->num_overflow_samps,
- orig_spch, n_overflow * sizeof(*orig_spch));
- fe->num_overflow_samps += n_overflow;
- /* Advance the input pointers. */
- if (n_overflow > *inout_spch - orig_spch) {
- n_overflow -= (*inout_spch - orig_spch);
- *inout_spch += n_overflow;
- *inout_nsamps -= n_overflow;
- }
- }
-
- /* Finally update the frame counter with the number of frames
- * and global sample counter with number of samples we procesed*/
- *inout_nframes = outidx; /* FIXME: Not sure why I wrote it this way... */
- fe->sample_counter += orig_nsamps - *inout_nsamps;
- return 0;
-}
-
-int
-fe_process_frames_ext(fe_t *fe,
- int16 const **inout_spch,
- size_t *inout_nsamps,
- mfcc_t **buf_cep,
- int32 *inout_nframes,
- int16 **voiced_spch,
- int32 *voiced_spch_nsamps,
- int32 *out_frameidx)
-{
- int proc_result;
-
- fe_prespch_extend_pcm(fe->vad_data->prespch_buf, *inout_nframes);
-
- fe->vad_data->store_pcm = TRUE;
- proc_result = fe_process_frames(fe, inout_spch, inout_nsamps, buf_cep, inout_nframes, out_frameidx);
- fe->vad_data->store_pcm = FALSE;
-
- if (fe->vad_data->global_state)
- fe_prespch_read_pcm(fe->vad_data->prespch_buf, voiced_spch, voiced_spch_nsamps);
- else
- *voiced_spch_nsamps = 0;
-
- return proc_result;
-}
-
-int
-fe_process_utt(fe_t * fe, int16 const * spch, size_t nsamps,
- mfcc_t *** cep_block, int32 * nframes)
-{
- mfcc_t **cep;
- int rv;
-
- /* Figure out how many frames we will need. */
- fe_process_frames(fe, NULL, &nsamps, NULL, nframes, NULL);
- /* Create the output buffer (it has to exist, even if there are no output frames). */
- if (*nframes)
- cep = (mfcc_t **)ckd_calloc_2d(*nframes, fe->feature_dimension, sizeof(**cep));
- else
- cep = (mfcc_t **)ckd_calloc_2d(1, fe->feature_dimension, sizeof(**cep));
- /* Now just call fe_process_frames() with the allocated buffer. */
- rv = fe_process_frames(fe, &spch, &nsamps, cep, nframes, NULL);
- *cep_block = cep;
-
- return rv;
-}
-
-
-int32
-fe_end_utt(fe_t * fe, mfcc_t * cepvector, int32 * nframes)
-{
- /* Process any remaining data. */
- *nframes = 0;
- if (fe->num_overflow_samps > 0) {
- fe_read_frame(fe, fe->overflow_samps, fe->num_overflow_samps);
- fe_write_frame(fe, cepvector);
- if (!fe->vad_data->state_changed && fe->vad_data->global_state)
- (*nframes)++;
- }
-
- /* reset overflow buffers... */
- fe->num_overflow_samps = 0;
- fe->start_flag = 0;
-
- return 0;
-}
-
-fe_t *
-fe_retain(fe_t *fe)
-{
- ++fe->refcount;
- return fe;
-}
-
-int
-fe_free(fe_t * fe)
-{
- if (fe == NULL)
- return 0;
- if (--fe->refcount > 0)
- return fe->refcount;
-
- /* kill FE instance - free everything... */
- if (fe->mel_fb) {
- if (fe->mel_fb->mel_cosine)
- fe_free_2d((void *) fe->mel_fb->mel_cosine);
- ckd_free(fe->mel_fb->lifter);
- ckd_free(fe->mel_fb->spec_start);
- ckd_free(fe->mel_fb->filt_start);
- ckd_free(fe->mel_fb->filt_width);
- ckd_free(fe->mel_fb->filt_coeffs);
- ckd_free(fe->mel_fb);
- }
- ckd_free(fe->spch);
- ckd_free(fe->frame);
- ckd_free(fe->ccc);
- ckd_free(fe->sss);
- ckd_free(fe->spec);
- ckd_free(fe->mfspec);
- ckd_free(fe->overflow_samps);
- ckd_free(fe->hamming_window);
-
- if (fe->noise_stats)
- fe_free_noisestats(fe->noise_stats);
-
- if (fe->vad_data) {
- fe_prespch_free(fe->vad_data->prespch_buf);
- ckd_free(fe->vad_data);
- }
-
- cmd_ln_free_r(fe->config);
- ckd_free(fe);
-
- return 0;
-}
-
-/**
- * Convert a block of mfcc_t to float32 (can be done in-place)
- **/
-int32
-fe_mfcc_to_float(fe_t * fe,
- mfcc_t ** input, float32 ** output, int32 nframes)
-{
- int32 i;
-
-#ifndef FIXED_POINT
- if ((void *) input == (void *) output)
- return nframes * fe->feature_dimension;
-#endif
- for (i = 0; i < nframes * fe->feature_dimension; ++i)
- output[0][i] = MFCC2FLOAT(input[0][i]);
-
- return i;
-}
-
-/**
- * Convert a block of float32 to mfcc_t (can be done in-place)
- **/
-int32
-fe_float_to_mfcc(fe_t * fe,
- float32 ** input, mfcc_t ** output, int32 nframes)
-{
- int32 i;
-
-#ifndef FIXED_POINT
- if ((void *) input == (void *) output)
- return nframes * fe->feature_dimension;
-#endif
- for (i = 0; i < nframes * fe->feature_dimension; ++i)
- output[0][i] = FLOAT2MFCC(input[0][i]);
-
- return i;
-}
-
-int32
-fe_logspec_to_mfcc(fe_t * fe, const mfcc_t * fr_spec, mfcc_t * fr_cep)
-{
-#ifdef FIXED_POINT
- fe_spec2cep(fe, fr_spec, fr_cep);
-#else /* ! FIXED_POINT */
- powspec_t *powspec;
- int32 i;
-
- powspec = ckd_malloc(fe->mel_fb->num_filters * sizeof(powspec_t));
- for (i = 0; i < fe->mel_fb->num_filters; ++i)
- powspec[i] = (powspec_t) fr_spec[i];
- fe_spec2cep(fe, powspec, fr_cep);
- ckd_free(powspec);
-#endif /* ! FIXED_POINT */
- return 0;
-}
-
-int32
-fe_logspec_dct2(fe_t * fe, const mfcc_t * fr_spec, mfcc_t * fr_cep)
-{
-#ifdef FIXED_POINT
- fe_dct2(fe, fr_spec, fr_cep, 0);
-#else /* ! FIXED_POINT */
- powspec_t *powspec;
- int32 i;
-
- powspec = ckd_malloc(fe->mel_fb->num_filters * sizeof(powspec_t));
- for (i = 0; i < fe->mel_fb->num_filters; ++i)
- powspec[i] = (powspec_t) fr_spec[i];
- fe_dct2(fe, powspec, fr_cep, 0);
- ckd_free(powspec);
-#endif /* ! FIXED_POINT */
- return 0;
-}
-
-int32
-fe_mfcc_dct3(fe_t * fe, const mfcc_t * fr_cep, mfcc_t * fr_spec)
-{
-#ifdef FIXED_POINT
- fe_dct3(fe, fr_cep, fr_spec);
-#else /* ! FIXED_POINT */
- powspec_t *powspec;
- int32 i;
-
- powspec = ckd_malloc(fe->mel_fb->num_filters * sizeof(powspec_t));
- fe_dct3(fe, fr_cep, powspec);
- for (i = 0; i < fe->mel_fb->num_filters; ++i)
- fr_spec[i] = (mfcc_t) powspec[i];
- ckd_free(powspec);
-#endif /* ! FIXED_POINT */
- return 0;
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_internal.h b/media/sphinxbase/src/libsphinxbase/fe/fe_internal.h
deleted file mode 100644
index f6c943c72..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_internal.h
+++ /dev/null
@@ -1,216 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 1996-2004 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-#ifndef __FE_INTERNAL_H__
-#define __FE_INTERNAL_H__
-
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-
-#include "sphinxbase/fe.h"
-#include "sphinxbase/fixpoint.h"
-
-#include "fe_noise.h"
-#include "fe_prespch_buf.h"
-#include "fe_type.h"
-
-#ifdef __cplusplus
-extern "C" {
-#endif
-#if 0
-/* Fool Emacs. */
-}
-#endif
-
-/* Values for the 'logspec' field. */
-enum {
- RAW_LOG_SPEC = 1,
- SMOOTH_LOG_SPEC = 2
-};
-
-/* Values for the 'transform' field. */
-enum {
- LEGACY_DCT = 0,
- DCT_II = 1,
- DCT_HTK = 2
-};
-
-typedef struct melfb_s melfb_t;
-/** Base Struct to hold all structure for MFCC computation. */
-struct melfb_s {
- float32 sampling_rate;
- int32 num_cepstra;
- int32 num_filters;
- int32 fft_size;
- float32 lower_filt_freq;
- float32 upper_filt_freq;
- /* DCT coefficients. */
- mfcc_t **mel_cosine;
- /* Filter coefficients. */
- mfcc_t *filt_coeffs;
- int16 *spec_start;
- int16 *filt_start;
- int16 *filt_width;
- /* Luxury mobile home. */
- int32 doublewide;
- char const *warp_type;
- char const *warp_params;
- uint32 warp_id;
- /* Precomputed normalization constants for unitary DCT-II/DCT-III */
- mfcc_t sqrt_inv_n, sqrt_inv_2n;
- /* Value and coefficients for HTK-style liftering */
- int32 lifter_val;
- mfcc_t *lifter;
- /* Normalize filters to unit area */
- int32 unit_area;
- /* Round filter frequencies to DFT points (hurts accuracy, but is
- useful for legacy purposes) */
- int32 round_filters;
-};
-
-typedef struct ringbuf_s {
- powspec_t** bufs;
- int16 buf_num;
- int32 buf_len;
- int16 start;
- int16 end;
- int32 recs;
-} ringbuf_t;
-
-/* sqrt(1/2), also used for unitary DCT-II/DCT-III */
-#define SQRT_HALF FLOAT2MFCC(0.707106781186548)
-
-typedef struct vad_data_s {
- uint8 global_state;
- uint8 state_changed;
- uint8 store_pcm;
- int16 prespch_num;
- int16 postspch_num;
- prespch_buf_t* prespch_buf;
-} vad_data_t;
-
-/** Structure for the front-end computation. */
-struct fe_s {
- cmd_ln_t *config;
- int refcount;
-
- int16 prespch_len;
- int16 postspch_len;
- float32 vad_threshold;
-
- float32 sampling_rate;
- int16 frame_rate;
- int16 frame_shift;
-
- float32 window_length;
- int16 frame_size;
- int16 fft_size;
-
- uint8 fft_order;
- uint8 feature_dimension;
- uint8 num_cepstra;
- uint8 remove_dc;
- uint8 log_spec;
- uint8 swap;
- uint8 dither;
- uint8 transform;
- uint8 remove_noise;
- uint8 remove_silence;
-
- float32 pre_emphasis_alpha;
- int32 seed;
-
- size_t sample_counter;
- uint8 start_flag;
- uint8 reserved;
-
- /* Twiddle factors for FFT. */
- frame_t *ccc, *sss;
- /* Mel filter parameters. */
- melfb_t *mel_fb;
- /* Half of a Hamming Window. */
- window_t *hamming_window;
- /* Storage for noise removal */
- noise_stats_t *noise_stats;
-
- /* Storage for VAD variables */
- vad_data_t *vad_data;
-
- /* Temporary buffers for processing. */
- /* FIXME: too many of these. */
- int16 *spch;
- frame_t *frame;
- powspec_t *spec, *mfspec;
- int16 *overflow_samps;
- int16 num_overflow_samps;
- int16 prior;
-};
-
-void fe_init_dither(int32 seed);
-
-/* Apply 1/2 bit noise to a buffer of audio. */
-int32 fe_dither(int16 *buffer, int32 nsamps);
-
-/* Load a frame of data into the fe. */
-int fe_read_frame(fe_t *fe, int16 const *in, int32 len);
-
-/* Shift the input buffer back and read more data. */
-int fe_shift_frame(fe_t *fe, int16 const *in, int32 len);
-
-/* Process a frame of data into features. */
-void fe_write_frame(fe_t *fe, mfcc_t *fea);
-
-/* Initialization functions. */
-int32 fe_build_melfilters(melfb_t *MEL_FB);
-int32 fe_compute_melcosine(melfb_t *MEL_FB);
-void fe_create_hamming(window_t *in, int32 in_len);
-void fe_create_twiddle(fe_t *fe);
-
-fixed32 fe_log_add(fixed32 x, fixed32 y);
-fixed32 fe_log_sub(fixed32 x, fixed32 y);
-
-/* Miscellaneous processing functions. */
-void fe_spec2cep(fe_t * fe, const powspec_t * mflogspec, mfcc_t * mfcep);
-void fe_dct2(fe_t *fe, const powspec_t *mflogspec, mfcc_t *mfcep, int htk);
-void fe_dct3(fe_t *fe, const mfcc_t *mfcep, powspec_t *mflogspec);
-
-#ifdef __cplusplus
-}
-#endif
-
-#endif /* __FE_INTERNAL_H__ */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_noise.c b/media/sphinxbase/src/libsphinxbase/fe/fe_noise.c
deleted file mode 100644
index 4fb6d21a9..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_noise.c
+++ /dev/null
@@ -1,425 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2013 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-/* This noise removal algorithm is inspired by the following papers
- * Computationally Efficient Speech Enchancement by Spectral Minina Tracking
- * by G. Doblinger
- *
- * Power-Normalized Cepstral Coefficients (PNCC) for Robust Speech Recognition
- * by C. Kim.
- *
- * For the recent research and state of art see papers about IMRCA and
- * A Minimum-Mean-Square-Error Noise Reduction Algorithm On Mel-Frequency
- * Cepstra For Robust Speech Recognition by Dong Yu and others
- */
-
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-
-#include <math.h>
-
-#include "sphinxbase/prim_type.h"
-#include "sphinxbase/ckd_alloc.h"
-#include "sphinxbase/strfuncs.h"
-#include "sphinxbase/err.h"
-
-#include "fe_noise.h"
-#include "fe_internal.h"
-
-/* Noise supression constants */
-#define SMOOTH_WINDOW 4
-#define LAMBDA_POWER 0.7
-#define LAMBDA_A 0.995
-#define LAMBDA_B 0.5
-#define LAMBDA_T 0.85
-#define MU_T 0.2
-#define MAX_GAIN 20
-
-struct noise_stats_s {
- /* Smoothed power */
- powspec_t *power;
- /* Noise estimate */
- powspec_t *noise;
- /* Signal floor estimate */
- powspec_t *floor;
- /* Peak for temporal masking */
- powspec_t *peak;
-
- /* Initialize it next time */
- uint8 undefined;
- /* Number of items to process */
- uint32 num_filters;
-
- /* Precomputed constants */
- powspec_t lambda_power;
- powspec_t comp_lambda_power;
- powspec_t lambda_a;
- powspec_t comp_lambda_a;
- powspec_t lambda_b;
- powspec_t comp_lambda_b;
- powspec_t lambda_t;
- powspec_t mu_t;
- powspec_t max_gain;
- powspec_t inv_max_gain;
-
- powspec_t smooth_scaling[2 * SMOOTH_WINDOW + 3];
-};
-
-static void
-fe_lower_envelope(noise_stats_t *noise_stats, powspec_t * buf, powspec_t * floor_buf, int32 num_filt)
-{
- int i;
-
- for (i = 0; i < num_filt; i++) {
-#ifndef FIXED_POINT
- if (buf[i] >= floor_buf[i]) {
- floor_buf[i] =
- noise_stats->lambda_a * floor_buf[i] + noise_stats->comp_lambda_a * buf[i];
- }
- else {
- floor_buf[i] =
- noise_stats->lambda_b * floor_buf[i] + noise_stats->comp_lambda_b * buf[i];
- }
-#else
- if (buf[i] >= floor_buf[i]) {
- floor_buf[i] = fe_log_add(noise_stats->lambda_a + floor_buf[i],
- noise_stats->comp_lambda_a + buf[i]);
- }
- else {
- floor_buf[i] = fe_log_add(noise_stats->lambda_b + floor_buf[i],
- noise_stats->comp_lambda_b + buf[i]);
- }
-#endif
- }
-}
-
-/* temporal masking */
-static void
-fe_temp_masking(noise_stats_t *noise_stats, powspec_t * buf, powspec_t * peak, int32 num_filt)
-{
- powspec_t cur_in;
- int i;
-
- for (i = 0; i < num_filt; i++) {
- cur_in = buf[i];
-
-#ifndef FIXED_POINT
- peak[i] *= noise_stats->lambda_t;
- if (buf[i] < noise_stats->lambda_t * peak[i])
- buf[i] = peak[i] * noise_stats->mu_t;
-#else
- peak[i] += noise_stats->lambda_t;
- if (buf[i] < noise_stats->lambda_t + peak[i])
- buf[i] = peak[i] + noise_stats->mu_t;
-#endif
-
- if (cur_in > peak[i])
- peak[i] = cur_in;
- }
-}
-
-/* spectral weight smoothing */
-static void
-fe_weight_smooth(noise_stats_t *noise_stats, powspec_t * buf, powspec_t * coefs, int32 num_filt)
-{
- int i, j;
- int l1, l2;
- powspec_t coef;
-
- for (i = 0; i < num_filt; i++) {
- l1 = ((i - SMOOTH_WINDOW) > 0) ? (i - SMOOTH_WINDOW) : 0;
- l2 = ((i + SMOOTH_WINDOW) <
- (num_filt - 1)) ? (i + SMOOTH_WINDOW) : (num_filt - 1);
-
-#ifndef FIXED_POINT
- coef = 0;
- for (j = l1; j <= l2; j++) {
- coef += coefs[j];
- }
- buf[i] = buf[i] * (coef / (l2 - l1 + 1));
-#else
- coef = MIN_FIXLOG;
- for (j = l1; j <= l2; j++) {
- coef = fe_log_add(coef, coefs[j]);
- }
- buf[i] = buf[i] + coef - noise_stats->smooth_scaling[l2 - l1 + 1];
-#endif
-
- }
-}
-
-noise_stats_t *
-fe_init_noisestats(int num_filters)
-{
- int i;
- noise_stats_t *noise_stats;
-
- noise_stats = (noise_stats_t *) ckd_calloc(1, sizeof(noise_stats_t));
-
- noise_stats->power =
- (powspec_t *) ckd_calloc(num_filters, sizeof(powspec_t));
- noise_stats->noise =
- (powspec_t *) ckd_calloc(num_filters, sizeof(powspec_t));
- noise_stats->floor =
- (powspec_t *) ckd_calloc(num_filters, sizeof(powspec_t));
- noise_stats->peak =
- (powspec_t *) ckd_calloc(num_filters, sizeof(powspec_t));
-
- noise_stats->undefined = TRUE;
- noise_stats->num_filters = num_filters;
-
-#ifndef FIXED_POINT
- noise_stats->lambda_power = LAMBDA_POWER;
- noise_stats->comp_lambda_power = 1 - LAMBDA_POWER;
- noise_stats->lambda_a = LAMBDA_A;
- noise_stats->comp_lambda_a = 1 - LAMBDA_A;
- noise_stats->lambda_b = LAMBDA_B;
- noise_stats->comp_lambda_b = 1 - LAMBDA_B;
- noise_stats->lambda_t = LAMBDA_T;
- noise_stats->mu_t = MU_T;
- noise_stats->max_gain = MAX_GAIN;
- noise_stats->inv_max_gain = 1.0 / MAX_GAIN;
-
- for (i = 1; i < 2 * SMOOTH_WINDOW + 1; i++) {
- noise_stats->smooth_scaling[i] = 1.0 / i;
- }
-#else
- noise_stats->lambda_power = FLOAT2FIX(log(LAMBDA_POWER));
- noise_stats->comp_lambda_power = FLOAT2FIX(log(1 - LAMBDA_POWER));
- noise_stats->lambda_a = FLOAT2FIX(log(LAMBDA_A));
- noise_stats->comp_lambda_a = FLOAT2FIX(log(1 - LAMBDA_A));
- noise_stats->lambda_b = FLOAT2FIX(log(LAMBDA_B));
- noise_stats->comp_lambda_b = FLOAT2FIX(log(1 - LAMBDA_B));
- noise_stats->lambda_t = FLOAT2FIX(log(LAMBDA_T));
- noise_stats->mu_t = FLOAT2FIX(log(MU_T));
- noise_stats->max_gain = FLOAT2FIX(log(MAX_GAIN));
- noise_stats->inv_max_gain = FLOAT2FIX(log(1.0 / MAX_GAIN));
-
- for (i = 1; i < 2 * SMOOTH_WINDOW + 3; i++) {
- noise_stats->smooth_scaling[i] = FLOAT2FIX(log(i));
- }
-#endif
-
- return noise_stats;
-}
-
-void
-fe_reset_noisestats(noise_stats_t * noise_stats)
-{
- if (noise_stats)
- noise_stats->undefined = TRUE;
-}
-
-void
-fe_free_noisestats(noise_stats_t * noise_stats)
-{
- ckd_free(noise_stats->power);
- ckd_free(noise_stats->noise);
- ckd_free(noise_stats->floor);
- ckd_free(noise_stats->peak);
- ckd_free(noise_stats);
-}
-
-/**
- * For fixed point we are doing the computation in a fixlog domain,
- * so we have to add many processing cases.
- */
-void
-fe_track_snr(fe_t * fe, int32 *in_speech)
-{
- powspec_t *signal;
- powspec_t *gain;
- noise_stats_t *noise_stats;
- powspec_t *mfspec;
- int32 i, num_filts;
- powspec_t lrt, snr, max_signal, log_signal;
-
- if (!(fe->remove_noise || fe->remove_silence)) {
- *in_speech = TRUE;
- return;
- }
-
- noise_stats = fe->noise_stats;
- mfspec = fe->mfspec;
- num_filts = noise_stats->num_filters;
-
- signal = (powspec_t *) ckd_calloc(num_filts, sizeof(powspec_t));
-
- if (noise_stats->undefined) {
- for (i = 0; i < num_filts; i++) {
- noise_stats->power[i] = mfspec[i];
- noise_stats->noise[i] = mfspec[i];
-#ifndef FIXED_POINT
- noise_stats->floor[i] = mfspec[i] / noise_stats->max_gain;
- noise_stats->peak[i] = 0.0;
-#else
- noise_stats->floor[i] = mfspec[i] - noise_stats->max_gain;
- noise_stats->peak[i] = MIN_FIXLOG;
-#endif
- }
- noise_stats->undefined = FALSE;
- }
-
- /* Calculate smoothed power */
- for (i = 0; i < num_filts; i++) {
-#ifndef FIXED_POINT
- noise_stats->power[i] =
- noise_stats->lambda_power * noise_stats->power[i] + noise_stats->comp_lambda_power * mfspec[i];
-#else
- noise_stats->power[i] = fe_log_add(noise_stats->lambda_power + noise_stats->power[i],
- noise_stats->comp_lambda_power + mfspec[i]);
-#endif
- }
-
- /* Noise estimation and vad decision */
- fe_lower_envelope(noise_stats, noise_stats->power, noise_stats->noise, num_filts);
-
- lrt = FLOAT2FIX(0.0f);
- max_signal = FLOAT2FIX(0.0f);
- for (i = 0; i < num_filts; i++) {
-#ifndef FIXED_POINT
- signal[i] = noise_stats->power[i] - noise_stats->noise[i];
- if (signal[i] < 1.0)
- signal[i] = 1.0;
- snr = log(noise_stats->power[i] / noise_stats->noise[i]);
- log_signal = log(signal[i]);
-#else
- signal[i] = fe_log_sub(noise_stats->power[i], noise_stats->noise[i]);
- snr = noise_stats->power[i] - noise_stats->noise[i];
- log_signal = signal[i];
-#endif
- if (snr > lrt) {
- lrt = snr;
- if (log_signal > max_signal) {
- max_signal = log_signal;
- }
- }
- }
-
-#ifndef FIXED_POINT
- if (fe->remove_silence && (lrt < fe->vad_threshold || max_signal < fe->vad_threshold)) {
-#else
- if (fe->remove_silence && (lrt < FLOAT2FIX(fe->vad_threshold) || max_signal < FLOAT2FIX(fe->vad_threshold))) {
-#endif
- *in_speech = FALSE;
- } else {
- *in_speech = TRUE;
- }
-
- fe_lower_envelope(noise_stats, signal, noise_stats->floor, num_filts);
-
- fe_temp_masking(noise_stats, signal, noise_stats->peak, num_filts);
-
- if (!fe->remove_noise) {
- //no need for further calculations if noise cancellation disabled
- ckd_free(signal);
- return;
- }
-
- for (i = 0; i < num_filts; i++) {
- if (signal[i] < noise_stats->floor[i])
- signal[i] = noise_stats->floor[i];
- }
-
- gain = (powspec_t *) ckd_calloc(num_filts, sizeof(powspec_t));
-#ifndef FIXED_POINT
- for (i = 0; i < num_filts; i++) {
- if (signal[i] < noise_stats->max_gain * noise_stats->power[i])
- gain[i] = signal[i] / noise_stats->power[i];
- else
- gain[i] = noise_stats->max_gain;
- if (gain[i] < noise_stats->inv_max_gain)
- gain[i] = noise_stats->inv_max_gain;
- }
-#else
- for (i = 0; i < num_filts; i++) {
- gain[i] = signal[i] - noise_stats->power[i];
- if (gain[i] > noise_stats->max_gain)
- gain[i] = noise_stats->max_gain;
- if (gain[i] < noise_stats->inv_max_gain)
- gain[i] = noise_stats->inv_max_gain;
- }
-#endif
-
- /* Weight smoothing and time frequency normalization */
- fe_weight_smooth(noise_stats, mfspec, gain, num_filts);
-
- ckd_free(gain);
- ckd_free(signal);
-}
-
-void
-fe_vad_hangover(fe_t * fe, mfcc_t * fea, int32 is_speech)
-{
- /* track vad state and deal with cepstrum prespeech buffer */
- fe->vad_data->state_changed = 0;
- if (is_speech) {
- fe->vad_data->postspch_num = 0;
- if (!fe->vad_data->global_state) {
- fe->vad_data->prespch_num++;
- fe_prespch_write_cep(fe->vad_data->prespch_buf, fea);
- /* check for transition sil->speech */
- if (fe->vad_data->prespch_num >= fe->prespch_len) {
- fe->vad_data->prespch_num = 0;
- fe->vad_data->global_state = 1;
- /* transition silence->speech occurred */
- fe->vad_data->state_changed = 1;
- }
- }
- } else {
- fe->vad_data->prespch_num = 0;
- fe_prespch_reset_cep(fe->vad_data->prespch_buf);
- if (fe->vad_data->global_state) {
- fe->vad_data->postspch_num++;
- /* check for transition speech->sil */
- if (fe->vad_data->postspch_num >= fe->postspch_len) {
- fe->vad_data->postspch_num = 0;
- fe->vad_data->global_state = 0;
- /* transition speech->silence occurred */
- fe->vad_data->state_changed = 1;
- }
- }
- }
-
- if (fe->vad_data->store_pcm) {
- if (is_speech || fe->vad_data->global_state)
- fe_prespch_write_pcm(fe->vad_data->prespch_buf, fe->spch);
- if (!is_speech && !fe->vad_data->global_state)
- fe_prespch_reset_pcm(fe->vad_data->prespch_buf);
- }
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_noise.h b/media/sphinxbase/src/libsphinxbase/fe/fe_noise.h
deleted file mode 100644
index b633a4cec..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_noise.h
+++ /dev/null
@@ -1,66 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2013 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-#ifndef FE_NOISE_H
-#define FE_NOISE_H
-
-#include "sphinxbase/fe.h"
-#include "sphinxbase/fixpoint.h"
-#include "fe_type.h"
-
-typedef struct noise_stats_s noise_stats_t;
-
-/* Creates noisestats object */
-noise_stats_t *fe_init_noisestats(int num_filters);
-
-/* Resets collected noise statistics */
-void fe_reset_noisestats(noise_stats_t * noise_stats);
-
-/* Frees allocated data */
-void fe_free_noisestats(noise_stats_t * noise_stats);
-
-/**
- * Process frame, update noise statistics, remove noise components if needed,
- * and return local vad decision.
- */
-void fe_track_snr(fe_t *fe, int32 *in_speech);
-
-/**
- * Updates global state based on local VAD state smoothing the estimate.
- */
-void fe_vad_hangover(fe_t *fe, mfcc_t *fea, int32 is_speech);
-
-#endif /* FE_NOISE_H */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.c b/media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.c
deleted file mode 100644
index 028c09ac5..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.c
+++ /dev/null
@@ -1,182 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
-* Copyright (c) 2013 Carnegie Mellon University. All rights
-* reserved.
-*
-* Redistribution and use in source and binary forms, with or without
-* modification, are permitted provided that the following conditions
-* are met:
-*
-* 1. Redistributions of source code must retain the above copyright
-* notice, this list of conditions and the following disclaimer.
-*
-* 2. Redistributions in binary form must reproduce the above copyright
-* notice, this list of conditions and the following disclaimer in
-* the documentation and/or other materials provided with the
-* distribution.
-*
-* This work was supported in part by funding from the Defense Advanced
-* Research Projects Agency and the National Science Foundation of the
-* United States of America, and the CMU Sphinx Speech Consortium.
-*
-* THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
-* ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
-* THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
-* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
-* NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
-* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
-* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
-* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
-* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
-* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
-* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-*
-* ====================================================================
-*
-*/
-
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-
-#include <stdio.h>
-#include <string.h>
-#include <assert.h>
-
-#include "sphinxbase/ckd_alloc.h"
-#include "sphinxbase/err.h"
-
-#include "fe_prespch_buf.h"
-
-struct prespch_buf_s {
- /* saved mfcc frames */
- mfcc_t **cep_buf;
- /* saved pcm audio */
- int16 *pcm_buf;
- /* flag for pcm buffer initialization */
- int16 cep_write_ptr;
- /* read pointer for cep buffer */
- int16 cep_read_ptr;
- /* write pointer for pcm buffer */
- int16 pcm_write_ptr;
- /* frames amount in cep buffer */
- int16 num_frames_cep;
- /* frames amount in pcm buffer */
- int16 num_frames_pcm;
- /* filters amount */
- int16 num_cepstra;
- /* amount of fresh samples in frame */
- int16 num_samples;
-};
-
-prespch_buf_t *
-fe_prespch_init(int num_frames, int num_cepstra, int num_samples)
-{
- prespch_buf_t *prespch_buf;
-
- prespch_buf = (prespch_buf_t *) ckd_calloc(1, sizeof(prespch_buf_t));
-
- prespch_buf->num_cepstra = num_cepstra;
- prespch_buf->num_frames_cep = num_frames;
- prespch_buf->num_samples = num_samples;
- prespch_buf->num_frames_pcm = 0;
- prespch_buf->cep_write_ptr = 0;
- prespch_buf->cep_read_ptr = 0;
- prespch_buf->pcm_write_ptr = 0;
-
- prespch_buf->cep_buf = (mfcc_t **)
- ckd_calloc_2d(num_frames, num_cepstra,
- sizeof(**prespch_buf->cep_buf));
-
- return prespch_buf;
-}
-
-void
-fe_prespch_extend_pcm(prespch_buf_t* prespch_buf, int num_frames_pcm)
-{
- num_frames_pcm += prespch_buf->num_frames_cep + 1;
- if (num_frames_pcm > prespch_buf->num_frames_pcm) {
- prespch_buf->num_frames_pcm = num_frames_pcm;
- prespch_buf->pcm_buf = (int16 *) ckd_realloc(prespch_buf->pcm_buf, prespch_buf->num_frames_pcm * prespch_buf->num_samples * sizeof(int16));
- }
-}
-
-int
-fe_prespch_read_cep(prespch_buf_t * prespch_buf, mfcc_t * fea)
-{
- if (prespch_buf->cep_read_ptr >= prespch_buf->num_frames_cep)
- return 0;
- if (prespch_buf->cep_read_ptr >= prespch_buf->cep_write_ptr)
- return 0;
- memcpy(fea, prespch_buf->cep_buf[prespch_buf->cep_read_ptr],
- sizeof(mfcc_t) * prespch_buf->num_cepstra);
- prespch_buf->cep_read_ptr++;
- return 1;
-}
-
-void
-fe_prespch_write_cep(prespch_buf_t * prespch_buf, mfcc_t * fea)
-{
- assert(prespch_buf->cep_write_ptr < prespch_buf->num_frames_cep);
- memcpy(prespch_buf->cep_buf[prespch_buf->cep_write_ptr], fea,
- sizeof(mfcc_t) * prespch_buf->num_cepstra);
- prespch_buf->cep_write_ptr++;
-}
-
-void
-fe_prespch_read_pcm(prespch_buf_t * prespch_buf, int16 ** samples,
- int32 * samples_num)
-{
- if (!prespch_buf->pcm_buf) {
- /* pcm prespch buffer isn't initialized yet */
- samples = NULL;
- *samples_num = 0;
- return;
- }
- *samples = prespch_buf->pcm_buf;
- *samples_num = prespch_buf->pcm_write_ptr * prespch_buf->num_samples;
- prespch_buf->pcm_write_ptr = 0;
-}
-
-void
-fe_prespch_write_pcm(prespch_buf_t * prespch_buf, int16 * samples)
-{
- int32 sample_ptr;
-
- assert(prespch_buf->pcm_write_ptr < prespch_buf->num_frames_pcm);
- sample_ptr = prespch_buf->pcm_write_ptr * prespch_buf->num_samples;
- memcpy(&prespch_buf->pcm_buf[sample_ptr], samples,
- prespch_buf->num_samples * sizeof(int16));
- prespch_buf->pcm_write_ptr++;
-}
-
-void
-fe_prespch_reset_cep(prespch_buf_t * prespch_buf)
-{
- prespch_buf->cep_read_ptr = 0;
- prespch_buf->cep_write_ptr = 0;
-}
-
-void
-fe_prespch_reset_pcm(prespch_buf_t * prespch_buf)
-{
- prespch_buf->pcm_write_ptr = 0;
-}
-
-void
-fe_prespch_free(prespch_buf_t * prespch_buf)
-{
- if (!prespch_buf)
- return;
- if (prespch_buf->cep_buf)
- ckd_free_2d((void **) prespch_buf->cep_buf);
- if (prespch_buf->pcm_buf)
- ckd_free(prespch_buf->pcm_buf);
- ckd_free(prespch_buf);
-}
-
-int32
-fe_prespch_ncep(prespch_buf_t * prespch_buf)
-{
- return prespch_buf->cep_write_ptr - prespch_buf->cep_read_ptr;
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.h b/media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.h
deleted file mode 100644
index d349ddfdb..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_prespch_buf.h
+++ /dev/null
@@ -1,79 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2013 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-/* Buffer that maintains both features and raw audio for the VAD implementation */
-
-#ifndef FE_INTERNAL_H
-#define FE_INTERNAL_H
-
-#include "sphinxbase/fe.h"
-
-typedef struct prespch_buf_s prespch_buf_t;
-
-/* Creates prespeech buffer */
-prespch_buf_t *fe_prespch_init(int num_frames, int num_cepstra,
- int num_samples);
-
-/* Extends pcm prespeech buffer with specified amount of frames */
-void fe_prespch_extend_pcm(prespch_buf_t* prespch_buf, int num_frames_pcm);
-
-/* Reads mfcc frame from prespeech buffer */
-int fe_prespch_read_cep(prespch_buf_t * prespch_buf, mfcc_t * fea);
-
-/* Writes mfcc frame to prespeech buffer */
-void fe_prespch_write_cep(prespch_buf_t * prespch_buf, mfcc_t * fea);
-
-/* Reads pcm frame from prespeech buffer */
-void fe_prespch_read_pcm(prespch_buf_t * prespch_buf, int16 ** samples,
- int32 * samples_num);
-
-/* Writes pcm frame to prespeech buffer */
-void fe_prespch_write_pcm(prespch_buf_t * prespch_buf, int16 * samples);
-
-/* Resets read/write pointers for cepstrum buffer */
-void fe_prespch_reset_cep(prespch_buf_t * prespch_buf);
-
-/* Resets read/write pointer for pcm audio buffer */
-void fe_prespch_reset_pcm(prespch_buf_t * prespch_buf);
-
-/* Releases prespeech buffer */
-void fe_prespch_free(prespch_buf_t * prespch_buf);
-
-/* Returns number of accumulated frames */
-int32 fe_prespch_ncep(prespch_buf_t * prespch_buf);
-
-#endif /* FE_INTERNAL_H */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_sigproc.c b/media/sphinxbase/src/libsphinxbase/fe/fe_sigproc.c
deleted file mode 100644
index 577640f62..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_sigproc.c
+++ /dev/null
@@ -1,1377 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 1996-2004 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-#include <stdio.h>
-#include <math.h>
-#include <string.h>
-#include <stdlib.h>
-#include <assert.h>
-
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-
-#ifdef _MSC_VER
-#pragma warning (disable: 4244)
-#endif
-
-/**
- * Windows math.h does not contain M_PI
- */
-#ifndef M_PI
-#define M_PI 3.14159265358979323846
-#endif
-
-#include "sphinxbase/prim_type.h"
-#include "sphinxbase/ckd_alloc.h"
-#include "sphinxbase/byteorder.h"
-#include "sphinxbase/fixpoint.h"
-#include "sphinxbase/fe.h"
-#include "sphinxbase/genrand.h"
-#include "sphinxbase/err.h"
-
-#include "fe_internal.h"
-#include "fe_warp.h"
-
-/* Use extra precision for cosines, Hamming window, pre-emphasis
- * coefficient, twiddle factors. */
-#ifdef FIXED_POINT
-#define FLOAT2COS(x) FLOAT2FIX_ANY(x,30)
-#define COSMUL(x,y) FIXMUL_ANY(x,y,30)
-#else
-#define FLOAT2COS(x) (x)
-#define COSMUL(x,y) ((x)*(y))
-#endif
-
-#ifdef FIXED_POINT
-
-/* Internal log-addition table for natural log with radix point at 8
- * bits. Each entry is 256 * log(1 + e^{-n/256}). This is used in the
- * log-add computation:
- *
- * e^z = e^x + e^y
- * e^z = e^x(1 + e^{y-x}) = e^y(1 + e^{x-y})
- * z = x + log(1 + e^{y-x}) = y + log(1 + e^{x-y})
- *
- * So when y > x, z = y + logadd_table[-(x-y)]
- * when x > y, z = x + logadd_table[-(y-x)]
- */
-static const unsigned char fe_logadd_table[] = {
- 177, 177, 176, 176, 175, 175, 174, 174, 173, 173,
- 172, 172, 172, 171, 171, 170, 170, 169, 169, 168,
- 168, 167, 167, 166, 166, 165, 165, 164, 164, 163,
- 163, 162, 162, 161, 161, 161, 160, 160, 159, 159,
- 158, 158, 157, 157, 156, 156, 155, 155, 155, 154,
- 154, 153, 153, 152, 152, 151, 151, 151, 150, 150,
- 149, 149, 148, 148, 147, 147, 147, 146, 146, 145,
- 145, 144, 144, 144, 143, 143, 142, 142, 141, 141,
- 141, 140, 140, 139, 139, 138, 138, 138, 137, 137,
- 136, 136, 136, 135, 135, 134, 134, 134, 133, 133,
- 132, 132, 131, 131, 131, 130, 130, 129, 129, 129,
- 128, 128, 128, 127, 127, 126, 126, 126, 125, 125,
- 124, 124, 124, 123, 123, 123, 122, 122, 121, 121,
- 121, 120, 120, 119, 119, 119, 118, 118, 118, 117,
- 117, 117, 116, 116, 115, 115, 115, 114, 114, 114,
- 113, 113, 113, 112, 112, 112, 111, 111, 110, 110,
- 110, 109, 109, 109, 108, 108, 108, 107, 107, 107,
- 106, 106, 106, 105, 105, 105, 104, 104, 104, 103,
- 103, 103, 102, 102, 102, 101, 101, 101, 100, 100,
- 100, 99, 99, 99, 98, 98, 98, 97, 97, 97,
- 96, 96, 96, 96, 95, 95, 95, 94, 94, 94,
- 93, 93, 93, 92, 92, 92, 92, 91, 91, 91,
- 90, 90, 90, 89, 89, 89, 89, 88, 88, 88,
- 87, 87, 87, 87, 86, 86, 86, 85, 85, 85,
- 85, 84, 84, 84, 83, 83, 83, 83, 82, 82,
- 82, 82, 81, 81, 81, 80, 80, 80, 80, 79,
- 79, 79, 79, 78, 78, 78, 78, 77, 77, 77,
- 77, 76, 76, 76, 75, 75, 75, 75, 74, 74,
- 74, 74, 73, 73, 73, 73, 72, 72, 72, 72,
- 71, 71, 71, 71, 71, 70, 70, 70, 70, 69,
- 69, 69, 69, 68, 68, 68, 68, 67, 67, 67,
- 67, 67, 66, 66, 66, 66, 65, 65, 65, 65,
- 64, 64, 64, 64, 64, 63, 63, 63, 63, 63,
- 62, 62, 62, 62, 61, 61, 61, 61, 61, 60,
- 60, 60, 60, 60, 59, 59, 59, 59, 59, 58,
- 58, 58, 58, 58, 57, 57, 57, 57, 57, 56,
- 56, 56, 56, 56, 55, 55, 55, 55, 55, 54,
- 54, 54, 54, 54, 53, 53, 53, 53, 53, 52,
- 52, 52, 52, 52, 52, 51, 51, 51, 51, 51,
- 50, 50, 50, 50, 50, 50, 49, 49, 49, 49,
- 49, 49, 48, 48, 48, 48, 48, 48, 47, 47,
- 47, 47, 47, 47, 46, 46, 46, 46, 46, 46,
- 45, 45, 45, 45, 45, 45, 44, 44, 44, 44,
- 44, 44, 43, 43, 43, 43, 43, 43, 43, 42,
- 42, 42, 42, 42, 42, 41, 41, 41, 41, 41,
- 41, 41, 40, 40, 40, 40, 40, 40, 40, 39,
- 39, 39, 39, 39, 39, 39, 38, 38, 38, 38,
- 38, 38, 38, 37, 37, 37, 37, 37, 37, 37,
- 37, 36, 36, 36, 36, 36, 36, 36, 35, 35,
- 35, 35, 35, 35, 35, 35, 34, 34, 34, 34,
- 34, 34, 34, 34, 33, 33, 33, 33, 33, 33,
- 33, 33, 32, 32, 32, 32, 32, 32, 32, 32,
- 32, 31, 31, 31, 31, 31, 31, 31, 31, 31,
- 30, 30, 30, 30, 30, 30, 30, 30, 30, 29,
- 29, 29, 29, 29, 29, 29, 29, 29, 28, 28,
- 28, 28, 28, 28, 28, 28, 28, 28, 27, 27,
- 27, 27, 27, 27, 27, 27, 27, 27, 26, 26,
- 26, 26, 26, 26, 26, 26, 26, 26, 25, 25,
- 25, 25, 25, 25, 25, 25, 25, 25, 25, 24,
- 24, 24, 24, 24, 24, 24, 24, 24, 24, 24,
- 23, 23, 23, 23, 23, 23, 23, 23, 23, 23,
- 23, 23, 22, 22, 22, 22, 22, 22, 22, 22,
- 22, 22, 22, 22, 21, 21, 21, 21, 21, 21,
- 21, 21, 21, 21, 21, 21, 21, 20, 20, 20,
- 20, 20, 20, 20, 20, 20, 20, 20, 20, 20,
- 19, 19, 19, 19, 19, 19, 19, 19, 19, 19,
- 19, 19, 19, 19, 18, 18, 18, 18, 18, 18,
- 18, 18, 18, 18, 18, 18, 18, 18, 18, 17,
- 17, 17, 17, 17, 17, 17, 17, 17, 17, 17,
- 17, 17, 17, 17, 16, 16, 16, 16, 16, 16,
- 16, 16, 16, 16, 16, 16, 16, 16, 16, 16,
- 16, 15, 15, 15, 15, 15, 15, 15, 15, 15,
- 15, 15, 15, 15, 15, 15, 15, 15, 14, 14,
- 14, 14, 14, 14, 14, 14, 14, 14, 14, 14,
- 14, 14, 14, 14, 14, 14, 14, 13, 13, 13,
- 13, 13, 13, 13, 13, 13, 13, 13, 13, 13,
- 13, 13, 13, 13, 13, 13, 13, 12, 12, 12,
- 12, 12, 12, 12, 12, 12, 12, 12, 12, 12,
- 12, 12, 12, 12, 12, 12, 12, 12, 12, 11,
- 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
- 11, 11, 11, 11, 11, 11, 11, 11, 11, 11,
- 11, 11, 11, 10, 10, 10, 10, 10, 10, 10,
- 10, 10, 10, 10, 10, 10, 10, 10, 10, 10,
- 10, 10, 10, 10, 10, 10, 10, 10, 10, 9,
- 9, 9, 9, 9, 9, 9, 9, 9, 9, 9,
- 9, 9, 9, 9, 9, 9, 9, 9, 9, 9,
- 9, 9, 9, 9, 9, 9, 9, 9, 8, 8,
- 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
- 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
- 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
- 7, 7, 7, 7, 7, 7, 7, 7, 7, 7,
- 7, 7, 7, 7, 7, 7, 7, 7, 7, 7,
- 7, 7, 7, 7, 7, 7, 7, 7, 7, 7,
- 7, 7, 7, 7, 7, 7, 7, 7, 6, 6,
- 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
- 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
- 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
- 6, 6, 6, 6, 6, 6, 6, 6, 6, 6,
- 6, 5, 5, 5, 5, 5, 5, 5, 5, 5,
- 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
- 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
- 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
- 5, 5, 5, 5, 5, 5, 5, 5, 5, 5,
- 5, 5, 5, 4, 4, 4, 4, 4, 4, 4,
- 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
- 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
- 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
- 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
- 4, 4, 4, 4, 4, 4, 4, 4, 4, 4,
- 4, 4, 4, 4, 4, 4, 4, 4, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
- 3, 3, 3, 3, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
- 2, 2, 2, 2, 2, 2, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
- 1, 1, 1, 1, 1, 1, 1, 0
-};
-
-static const int fe_logadd_table_size =
- sizeof(fe_logadd_table) / sizeof(fe_logadd_table[0]);
-
-fixed32
-fe_log_add(fixed32 x, fixed32 y)
-{
- fixed32 d, r;
-
- if (x > y) {
- d = (x - y) >> (DEFAULT_RADIX - 8);
- r = x;
- }
- else {
- d = (y - x) >> (DEFAULT_RADIX - 8);
- r = y;
- }
-
- if (r <= MIN_FIXLOG)
- return MIN_FIXLOG;
- else if (d > fe_logadd_table_size - 1)
- return r;
- else {
- r += ((fixed32) fe_logadd_table[d] << (DEFAULT_RADIX - 8));
-/* printf("%d - %d = %d | %f - %f = %f | %f - %f = %f\n",
- x, y, r, FIX2FLOAT(x), FIX2FLOAT(y), FIX2FLOAT(r),
- exp(FIX2FLOAT(x)), exp(FIX2FLOAT(y)), exp(FIX2FLOAT(r)));
-*/
- return r;
- }
-}
-
-/*
- * log_sub for spectral subtraction, similar to logadd but we had
- * to smooth function around zero with fixlog in order to improve
- * table interpolation properties
- *
- * The table is created with the file included into distribution
- *
- * e^z = e^x - e^y
- * e^z = e^x (1 - e^(-(x - y)))
- * z = x + log(1 - e^(-(x - y)))
- * z = x + fixlog(a) + (log(1 - e^(- a)) - log(a))
- *
- * Input radix is 8 output radix is 10
- */
-static const uint16 fe_logsub_table[] = {
-1, 3, 5, 7, 9, 11, 13, 15, 17, 19,
-21, 23, 25, 27, 29, 31, 33, 35, 37, 39,
-41, 43, 45, 47, 49, 51, 53, 55, 56, 58,
-60, 62, 64, 66, 68, 70, 72, 74, 76, 78,
-80, 82, 84, 86, 88, 90, 92, 94, 95, 97,
-99, 101, 103, 105, 107, 109, 111, 113, 115, 117,
-119, 121, 122, 124, 126, 128, 130, 132, 134, 136,
-138, 140, 142, 143, 145, 147, 149, 151, 153, 155,
-157, 159, 161, 162, 164, 166, 168, 170, 172, 174,
-176, 178, 179, 181, 183, 185, 187, 189, 191, 193,
-194, 196, 198, 200, 202, 204, 206, 207, 209, 211,
-213, 215, 217, 219, 220, 222, 224, 226, 228, 230,
-232, 233, 235, 237, 239, 241, 243, 244, 246, 248,
-250, 252, 254, 255, 257, 259, 261, 263, 265, 266,
-268, 270, 272, 274, 275, 277, 279, 281, 283, 284,
-286, 288, 290, 292, 294, 295, 297, 299, 301, 302,
-304, 306, 308, 310, 311, 313, 315, 317, 319, 320,
-322, 324, 326, 327, 329, 331, 333, 335, 336, 338,
-340, 342, 343, 345, 347, 349, 350, 352, 354, 356,
-357, 359, 361, 363, 364, 366, 368, 370, 371, 373,
-375, 377, 378, 380, 382, 384, 385, 387, 389, 391,
-392, 394, 396, 397, 399, 401, 403, 404, 406, 408,
-410, 411, 413, 415, 416, 418, 420, 422, 423, 425,
-427, 428, 430, 432, 433, 435, 437, 439, 440, 442,
-444, 445, 447, 449, 450, 452, 454, 455, 457, 459,
-460, 462, 464, 465, 467, 469, 471, 472, 474, 476,
-477, 479, 481, 482, 484, 486, 487, 489, 490, 492,
-494, 495, 497, 499, 500, 502, 504, 505, 507, 509,
-510, 512, 514, 515, 517, 518, 520, 522, 523, 525,
-527, 528, 530, 532, 533, 535, 536, 538, 540, 541,
-543, 544, 546, 548, 549, 551, 553, 554, 556, 557,
-559, 561, 562, 564, 565, 567, 569, 570, 572, 573,
-575, 577, 578, 580, 581, 583, 585, 586, 588, 589,
-591, 592, 594, 596, 597, 599, 600, 602, 603, 605,
-607, 608, 610, 611, 613, 614, 616, 618, 619, 621,
-622, 624, 625, 627, 628, 630, 632, 633, 635, 636,
-638, 639, 641, 642, 644, 645, 647, 649, 650, 652,
-653, 655, 656, 658, 659, 661, 662, 664, 665, 667,
-668, 670, 671, 673, 674, 676, 678, 679, 681, 682,
-684, 685, 687, 688, 690, 691, 693, 694, 696, 697,
-699, 700, 702, 703, 705, 706, 708, 709, 711, 712,
-714, 715, 717, 718, 719, 721, 722, 724, 725, 727,
-728, 730, 731, 733, 734, 736, 737, 739, 740, 742,
-743, 745, 746, 747, 749, 750, 752, 753, 755, 756,
-758, 759, 761, 762, 763, 765, 766, 768, 769, 771,
-772, 774, 775, 776, 778, 779, 781, 782, 784, 785,
-786, 788, 789, 791, 792, 794, 795, 796, 798, 799,
-801, 802, 804, 805, 806, 808, 809, 811, 812, 813,
-815, 816, 818, 819, 820, 822, 823, 825, 826, 827,
-829, 830, 832, 833, 834, 836, 837, 839, 840, 841,
-843, 844, 846, 847, 848, 850, 851, 852, 854, 855,
-857, 858, 859, 861, 862, 863, 865, 866, 868, 869,
-870, 872, 873, 874, 876, 877, 878, 880, 881, 883,
-884, 885, 887, 888, 889, 891, 892, 893, 895, 896,
-897, 899, 900, 901, 903, 904, 905, 907, 908, 909,
-911, 912, 913, 915, 916, 917, 919, 920, 921, 923,
-924, 925, 927, 928, 929, 931, 932, 933, 935, 936,
-937, 939, 940, 941, 942, 944, 945, 946, 948, 949,
-950, 952, 953, 954, 956, 957, 958, 959, 961, 962,
-963, 965, 966, 967, 968, 970, 971, 972, 974, 975,
-976, 977, 979, 980, 981, 983, 984, 985, 986, 988,
-989, 990, 991, 993, 994, 995, 997, 998, 999, 1000,
-1002, 1003, 1004, 1005, 1007, 1008, 1009, 1010, 1012, 1013,
-1014, 1015, 1017, 1018, 1019, 1020, 1022, 1023, 1024, 1025,
-1027, 1028, 1029, 1030, 1032, 1033, 1034, 1035, 1037, 1038,
-1039, 1040, 1041, 1043, 1044, 1045, 1046, 1048, 1049, 1050,
-1051, 1052, 1054, 1055, 1056, 1057, 1059, 1060, 1061, 1062,
-1063, 1065, 1066, 1067, 1068, 1069, 1071, 1072, 1073, 1074,
-1076, 1077, 1078, 1079, 1080, 1082, 1083, 1084, 1085, 1086,
-1087, 1089, 1090, 1091, 1092, 1093, 1095, 1096, 1097, 1098,
-1099, 1101, 1102, 1103, 1104, 1105, 1106, 1108, 1109, 1110,
-1111, 1112, 1114, 1115, 1116, 1117, 1118, 1119, 1121, 1122,
-1123, 1124, 1125, 1126, 1128, 1129, 1130, 1131, 1132, 1133,
-1135, 1136, 1137, 1138, 1139, 1140, 1141, 1143, 1144, 1145,
-1146, 1147, 1148, 1149, 1151, 1152, 1153, 1154, 1155, 1156,
-1157, 1159, 1160, 1161, 1162, 1163, 1164, 1165, 1167, 1168,
-1169, 1170, 1171, 1172, 1173, 1174, 1176, 1177, 1178, 1179,
-1180, 1181, 1182, 1183, 1185, 1186, 1187, 1188, 1189, 1190,
-1191, 1192, 1193, 1195, 1196, 1197, 1198, 1199, 1200, 1201,
-1202, 1203, 1205, 1206, 1207, 1208, 1209, 1210, 1211, 1212,
-1213, 1214, 1216, 1217, 1218, 1219, 1220, 1221, 1222, 1223,
-1224, 1225, 1226, 1228, 1229, 1230, 1231, 1232, 1233, 1234,
-1235, 1236, 1237, 1238, 1239, 1240, 1242, 1243, 1244, 1245,
-1246, 1247, 1248, 1249, 1250, 1251, 1252, 1253, 1254, 1255,
-1256, 1258, 1259, 1260, 1261, 1262, 1263, 1264, 1265, 1266,
-1267, 1268, 1269, 1270, 1271, 1272, 1273, 1274, 1275, 1277,
-1278, 1279, 1280, 1281, 1282, 1283, 1284, 1285, 1286, 1287,
-1288, 1289, 1290, 1291, 1292, 1293, 1294, 1295, 1296, 1297,
-1298, 1299, 1300, 1301, 1302, 1303, 1305, 1306, 1307, 1308,
-1309, 1310, 1311, 1312, 1313, 1314, 1315, 1316, 1317, 1318,
-1319, 1320, 1321, 1322, 1323, 1324, 1325, 1326, 1327, 1328,
-1329, 1330, 1331, 1332, 1333, 1334, 1335, 1336, 1337, 1338,
-1339, 1340, 1341, 1342, 1343, 1344, 1345, 1346, 1347, 1348,
-1349, 1350, 1351, 1352, 1353, 1354, 1355, 1356, 1357, 1358,
-1359, 1360, 1361, 1362, 1363, 1364, 1365, 1366, 1367, 1368,
-1369, 1370, 1371, 1372, 1372, 1373, 1374, 1375, 1376, 1377,
-1378, 1379, 1380, 1381, 1382, 1383, 1384, 1385, 1386, 1387,
-1388, 1389, 1390, 1391, 1392, 1393, 1394, 1395, 1396, 1397,
-1398, 1399, 1399, 1400, 1401, 1402, 1403, 1404, 1405, 1406,
-1407, 1408, 1409, 1410, 1411, 1412, 1413, 1414, 1415, 1416,
-1417, 1418, 1418, 1419, 1420, 1421, 1422, 1423, 1424, 1425,
-1426, 1427, 1428, 1429, 1430, 1431, 1432, 1432, 1433, 1434,
-1435, 1436, 1437, 1438, 1439, 1440, 1441, 1442, 1443, 1444,
-1444, 1445, 1446, 1447, 1448, 1449, 1450, 1451, 1452, 1453,
-1454, 1455, 1455, 1456, 1457, 1458, 1459, 1460, 1461, 1462,
-1463, 1464, 1465, 1466, 1466, 1467, 1468, 1469, 1470, 1471,
-1472, 1473, 1474, 1475, 1475, 1476, 1477, 1478, 1479, 1480,
-1481, 1482, 1483, 1483, 1484, 1485, 1486, 1487, 1488, 1489,
-1490, 1491, 1491, 1492, 1493, 1494, 1495, 1496, 1497, 1498,
-1499, 1499, 1500, 1501, 1502, 1503, 1504, 1505, 1506, 1506,
-1507, 1508, 1509, 1510, 1511, 1512, 1513, 1513, 1514, 1515,
-1516, 1517, 1518, 1519, 1520, 1520, 1521, 1522, 1523, 1524,
-1525, 1526, 1526, 1527, 1528, 1529, 1530, 1531, 1532, 1532,
-1533, 1534, 1535, 1536, 1537, 1538, 1538, 1539, 1540, 1541,
-1542, 1543, 1544, 1544, 1545, 1546, 1547, 1548, 1549, 1550,
-1550, 1551, 1552, 1553, 1554, 1555, 1555, 1556, 1557, 1558,
-1559, 1560, 1560, 1561, 1562, 1563, 1564, 1565, 1565, 1566,
-1567, 1568, 1569, 1570, 1570, 1571, 1572, 1573, 1574, 1575,
-1575, 1576, 1577, 1578, 1579, 1580, 1580, 1581, 1582, 1583,
-1584, 1584, 1585, 1586, 1587, 1588, 1589, 1589, 1590, 1591,
-1592, 1593, 1593, 1594, 1595, 1596, 1597, 1598, 1598, 1599,
-1600, 1601, 1602, 1602, 1603, 1604, 1605, 1606, 1606, 1607,
-1608, 1609, 1610, 1610, 1611, 1612, 1613, 1614, 1614, 1615,
-1616, 1617, 1618, 1618, 1619, 1620, 1621, 1622, 1622, 1623,
-1624, 1625, 1626, 1626, 1627, 1628, 1629, 1630, 1630, 1631,
-1632, 1633, 1634, 1634, 1635, 1636, 1637, 1637, 1638, 1639,
-1640, 1641, 1641, 1642, 1643, 1644, 1645, 1645, 1646, 1647,
-1648, 1648, 1649, 1650, 1651, 1652, 1652, 1653, 1654, 1655,
-1655, 1656, 1657, 1658, 1658, 1659, 1660, 1661, 1662, 1662,
-1663, 1664, 1665, 1665, 1666, 1667, 1668, 1668, 1669, 1670,
-1671, 1671, 1672, 1673, 1674, 1675, 1675, 1676, 1677, 1678,
-1678, 1679, 1680, 1681, 1681, 1682, 1683, 1684, 1684, 1685,
-1686, 1687, 1687, 1688, 1689, 1690, 1690, 1691, 1692, 1693,
-1693, 1694, 1695, 1696, 1696, 1697, 1698, 1699, 1699, 1700,
-1701, 1702, 1702, 1703, 1704, 1705, 1705, 1706, 1707, 1707,
-1708, 1709, 1710, 1710, 1711, 1712, 1713, 1713, 1714, 1715,
-1716, 1716, 1717, 1718, 1718, 1719, 1720, 1721, 1721, 1722,
-1723, 1724, 1724, 1725, 1726, 1727, 1727, 1728, 1729, 1729,
-1730, 1731, 1732, 1732, 1733, 1734, 1734, 1735, 1736, 1737,
-1737, 1738, 1739, 1740, 1740, 1741, 1742, 1742, 1743, 1744,
-1745, 1745, 1746, 1747, 1747, 1748, 1749, 1749, 1750, 1751,
-1752, 1752, 1753, 1754, 1754, 1755, 1756, 1757, 1757, 1758,
-1759, 1759, 1760, 1761, 1762, 1762, 1763, 1764, 1764, 1765,
-1766, 1766, 1767, 1768, 1769, 1769, 1770, 1771, 1771, 1772,
-1773, 1773, 1774, 1775, 1776, 1776, 1777, 1778, 1778, 1779,
-1780, 1780, 1781, 1782, 1782, 1783, 1784, 1784, 1785, 1786,
-1787, 1787, 1788, 1789, 1789, 1790, 1791, 1791, 1792, 1793,
-1793, 1794, 1795, 1795, 1796, 1797, 1798, 1798, 1799, 1800,
-1800, 1801, 1802, 1802, 1803, 1804, 1804, 1805, 1806, 1806,
-1807, 1808, 1808, 1809, 1810, 1810, 1811, 1812, 1812, 1813,
-1814, 1814, 1815, 1816, 1816, 1817, 1818, 1818, 1819, 1820,
-1820, 1821, 1822, 1822, 1823, 1824, 1824, 1825, 1826, 1826,
-1827, 1828, 1828, 1829, 1830, 1830, 1831, 1832, 1832, 1833,
-1834, 1834, 1835, 1836, 1836, 1837, 1838, 1838, 1839, 1840,
-1840, 1841, 1842, 1842, 1843, 1844, 1844, 1845, 1845, 1846,
-1847, 1847, 1848, 1849, 1849, 1850, 1851, 1851, 1852, 1853,
-1853, 1854, 1855, 1855, 1856, 1857, 1857, 1858, 1858, 1859,
-1860, 1860, 1861, 1862, 1862, 1863, 1864, 1864, 1865, 1866,
-1866, 1867, 1867, 1868, 1869, 1869, 1870, 1871, 1871, 1872,
-1873, 1873, 1874, 1874, 1875, 1876, 1876, 1877, 1878, 1878,
-1879, 1879, 1880, 1881, 1881, 1882, 1883, 1883, 1884, 1885,
-1885, 1886, 1886, 1887, 1888, 1888, 1889, 1890, 1890, 1891,
-1891, 1892, 1893, 1893, 1894, 1895, 1895, 1896, 1896, 1897,
-1898, 1898, 1899, 1900, 1900, 1901, 1901, 1902, 1903, 1903,
-1904, 1904, 1905, 1906, 1906, 1907, 1908, 1908, 1909, 1909,
-1910, 1911, 1911, 1912, 1912, 1913, 1914, 1914, 1915, 1916,
-1916, 1917, 1917, 1918, 1919, 1919, 1920, 1920, 1921, 1922,
-1922, 1923, 1923, 1924, 1925, 1925, 1926, 1926, 1927, 1928,
-1928, 1929, 1929, 1930, 1931, 1931, 1932, 1932, 1933, 1934,
-1934, 1935, 1935, 1936, 1937, 1937, 1938, 1938, 1939, 1940,
-1940, 1941, 1941, 1942, 1943, 1943, 1944, 1944, 1945, 1946,
-1946, 1947, 1947, 1948, 1949, 1949, 1950, 1950, 1951, 1952,
-1952, 1953, 1953, 1954, 1955, 1955, 1956, 1956, 1957, 1957,
-1958, 1959, 1959, 1960, 1960, 1961, 1962, 1962, 1963, 1963,
-1964, 1964, 1965, 1966, 1966, 1967, 1967, 1968, 1969, 1969,
-1970, 1970, 1971, 1971, 1972, 1973, 1973, 1974, 1974, 1975,
-1976, 1976, 1977, 1977, 1978, 1978, 1979, 1980, 1980, 1981,
-1981, 1982, 1982, 1983, 1984, 1984, 1985, 1985, 1986, 1986,
-1987, 1988, 1988, 1989, 1989, 1990, 1990, 1991, 1992, 1992,
-1993, 1993, 1994, 1994, 1995, 1996, 1996, 1997, 1997, 1998,
-1998, 1999, 1999, 2000, 2001, 2001, 2002, 2002, 2003, 2003,
-2004, 2005, 2005, 2006, 2006, 2007, 2007, 2008, 2008, 2009,
-2010, 2010, 2011, 2011, 2012, 2012, 2013, 2014, 2014, 2015,
-2015, 2016, 2016, 2017, 2017, 2018, 2019, 2019, 2020, 2020,
-2021, 2021, 2022, 2022, 2023, 2023, 2024, 2025, 2025, 2026,
-2026, 2027, 2027, 2028, 2028, 2029, 2030, 2030, 2031, 2031,
-2032, 2032, 2033, 2033, 2034, 2034, 2035, 2036, 2036, 2037,
-2037, 2038, 2038, 2039, 2039, 2040, 2040, 2041, 2042, 2042,
-2043, 2043, 2044, 2044, 2045, 2045, 2046, 2046, 2047, 2048,
-2048, 2049, 2049, 2050, 2050, 2051, 2051, 2052, 2052, 2053,
-2053, 2054, 2054, 2055, 2056, 2056, 2057, 2057, 2058, 2058,
-2059, 2059, 2060, 2060, 2061, 2061, 2062, 2062, 2063, 2064,
-2064, 2065, 2065, 2066, 2066, 2067, 2067, 2068, 2068, 2069,
-2069, 2070, 2070, 2071, 2072, 2072, 2073, 2073, 2074, 2074,
-2075, 2075, 2076, 2076, 2077, 2077, 2078, 2078, 2079, 2079,
-2080, 2080, 2081
-};
-
-static const int fe_logsub_table_size =
- sizeof(fe_logsub_table) / sizeof(fe_logsub_table[0]);
-
-fixed32
-fe_log_sub(fixed32 x, fixed32 y)
-{
- fixed32 d, r;
-
- if (x < MIN_FIXLOG || y >= x)
- return MIN_FIXLOG;
-
- d = (x - y) >> (DEFAULT_RADIX - 8);
-
- if (d > fe_logsub_table_size - 1)
- return x;
-
- r = fe_logsub_table[d] << (DEFAULT_RADIX - 10);
-/*
- printf("diff=%d\n",
- x + FIXLN(x-y) - r -
- (x + FLOAT2FIX(logf(-expm1f(FIX2FLOAT(y - x))))));
-*/
- return x + FIXLN(x-y) - r;
-}
-
-static fixed32
-fe_log(float32 x)
-{
- if (x <= 0) {
- return MIN_FIXLOG;
- }
- else {
- return FLOAT2FIX(log(x));
- }
-}
-#endif
-
-static float32
-fe_mel(melfb_t * mel, float32 x)
-{
- float32 warped = fe_warp_unwarped_to_warped(mel, x);
-
- return (float32) (2595.0 * log10(1.0 + warped / 700.0));
-}
-
-static float32
-fe_melinv(melfb_t * mel, float32 x)
-{
- float32 warped = (float32) (700.0 * (pow(10.0, x / 2595.0) - 1.0));
- return fe_warp_warped_to_unwarped(mel, warped);
-}
-
-int32
-fe_build_melfilters(melfb_t * mel_fb)
-{
- float32 melmin, melmax, melbw, fftfreq;
- int n_coeffs, i, j;
-
-
- /* Filter coefficient matrix, in flattened form. */
- mel_fb->spec_start =
- ckd_calloc(mel_fb->num_filters, sizeof(*mel_fb->spec_start));
- mel_fb->filt_start =
- ckd_calloc(mel_fb->num_filters, sizeof(*mel_fb->filt_start));
- mel_fb->filt_width =
- ckd_calloc(mel_fb->num_filters, sizeof(*mel_fb->filt_width));
-
- /* First calculate the widths of each filter. */
- /* Minimum and maximum frequencies in mel scale. */
- melmin = fe_mel(mel_fb, mel_fb->lower_filt_freq);
- melmax = fe_mel(mel_fb, mel_fb->upper_filt_freq);
-
- /* Width of filters in mel scale */
- melbw = (melmax - melmin) / (mel_fb->num_filters + 1);
- if (mel_fb->doublewide) {
- melmin -= melbw;
- melmax += melbw;
- if ((fe_melinv(mel_fb, melmin) < 0) ||
- (fe_melinv(mel_fb, melmax) > mel_fb->sampling_rate / 2)) {
- E_WARN
- ("Out of Range: low filter edge = %f (%f)\n",
- fe_melinv(mel_fb, melmin), 0.0);
- E_WARN
- (" high filter edge = %f (%f)\n",
- fe_melinv(mel_fb, melmax), mel_fb->sampling_rate / 2);
- return FE_INVALID_PARAM_ERROR;
- }
- }
-
- /* DFT point spacing */
- fftfreq = mel_fb->sampling_rate / (float32) mel_fb->fft_size;
-
- /* Count and place filter coefficients. */
- n_coeffs = 0;
- for (i = 0; i < mel_fb->num_filters; ++i) {
- float32 freqs[3];
-
- /* Left, center, right frequencies in Hertz */
- for (j = 0; j < 3; ++j) {
- if (mel_fb->doublewide)
- freqs[j] = fe_melinv(mel_fb, (i + j * 2) * melbw + melmin);
- else
- freqs[j] = fe_melinv(mel_fb, (i + j) * melbw + melmin);
- /* Round them to DFT points if requested */
- if (mel_fb->round_filters)
- freqs[j] = ((int) (freqs[j] / fftfreq + 0.5)) * fftfreq;
- }
-
- /* spec_start is the start of this filter in the power spectrum. */
- mel_fb->spec_start[i] = -1;
- /* There must be a better way... */
- for (j = 0; j < mel_fb->fft_size / 2 + 1; ++j) {
- float32 hz = j * fftfreq;
- if (hz < freqs[0])
- continue;
- else if (hz > freqs[2] || j == mel_fb->fft_size / 2) {
- /* filt_width is the width in DFT points of this filter. */
- mel_fb->filt_width[i] = j - mel_fb->spec_start[i];
- /* filt_start is the start of this filter in the filt_coeffs array. */
- mel_fb->filt_start[i] = n_coeffs;
- n_coeffs += mel_fb->filt_width[i];
- break;
- }
- if (mel_fb->spec_start[i] == -1)
- mel_fb->spec_start[i] = j;
- }
- }
-
- /* Now go back and allocate the coefficient array. */
- mel_fb->filt_coeffs =
- ckd_malloc(n_coeffs * sizeof(*mel_fb->filt_coeffs));
-
- /* And now generate the coefficients. */
- n_coeffs = 0;
- for (i = 0; i < mel_fb->num_filters; ++i) {
- float32 freqs[3];
-
- /* Left, center, right frequencies in Hertz */
- for (j = 0; j < 3; ++j) {
- if (mel_fb->doublewide)
- freqs[j] = fe_melinv(mel_fb, (i + j * 2) * melbw + melmin);
- else
- freqs[j] = fe_melinv(mel_fb, (i + j) * melbw + melmin);
- /* Round them to DFT points if requested */
- if (mel_fb->round_filters)
- freqs[j] = ((int) (freqs[j] / fftfreq + 0.5)) * fftfreq;
- }
-
- for (j = 0; j < mel_fb->filt_width[i]; ++j) {
- float32 hz, loslope, hislope;
-
- hz = (mel_fb->spec_start[i] + j) * fftfreq;
- if (hz < freqs[0] || hz > freqs[2]) {
- E_FATAL
- ("Failed to create filterbank, frequency range does not match. "
- "Sample rate %f, FFT size %d, lowerf %f < freq %f > upperf %f.\n",
- mel_fb->sampling_rate, mel_fb->fft_size, freqs[0], hz,
- freqs[2]);
- }
- loslope = (hz - freqs[0]) / (freqs[1] - freqs[0]);
- hislope = (freqs[2] - hz) / (freqs[2] - freqs[1]);
- if (mel_fb->unit_area) {
- loslope *= 2 / (freqs[2] - freqs[0]);
- hislope *= 2 / (freqs[2] - freqs[0]);
- }
- if (loslope < hislope) {
-#ifdef FIXED_POINT
- mel_fb->filt_coeffs[n_coeffs] = fe_log(loslope);
-#else
- mel_fb->filt_coeffs[n_coeffs] = loslope;
-#endif
- }
- else {
-#ifdef FIXED_POINT
- mel_fb->filt_coeffs[n_coeffs] = fe_log(hislope);
-#else
- mel_fb->filt_coeffs[n_coeffs] = hislope;
-#endif
- }
- ++n_coeffs;
- }
- }
-
- return FE_SUCCESS;
-}
-
-int32
-fe_compute_melcosine(melfb_t * mel_fb)
-{
-
- float64 freqstep;
- int32 i, j;
-
- mel_fb->mel_cosine =
- (mfcc_t **) ckd_calloc_2d(mel_fb->num_cepstra,
- mel_fb->num_filters, sizeof(mfcc_t));
-
- freqstep = M_PI / mel_fb->num_filters;
- /* NOTE: The first row vector is actually unnecessary but we leave
- * it in to avoid confusion. */
- for (i = 0; i < mel_fb->num_cepstra; i++) {
- for (j = 0; j < mel_fb->num_filters; j++) {
- float64 cosine;
-
- cosine = cos(freqstep * i * (j + 0.5));
- mel_fb->mel_cosine[i][j] = FLOAT2COS(cosine);
- }
- }
-
- /* Also precompute normalization constants for unitary DCT. */
- mel_fb->sqrt_inv_n = FLOAT2COS(sqrt(1.0 / mel_fb->num_filters));
- mel_fb->sqrt_inv_2n = FLOAT2COS(sqrt(2.0 / mel_fb->num_filters));
-
- /* And liftering weights */
- if (mel_fb->lifter_val) {
- mel_fb->lifter =
- calloc(mel_fb->num_cepstra, sizeof(*mel_fb->lifter));
- for (i = 0; i < mel_fb->num_cepstra; ++i) {
- mel_fb->lifter[i] = FLOAT2MFCC(1 + mel_fb->lifter_val / 2
- * sin(i * M_PI /
- mel_fb->lifter_val));
- }
- }
-
- return (0);
-}
-
-static void
-fe_pre_emphasis(int16 const *in, frame_t * out, int32 len,
- float32 factor, int16 prior)
-{
- int i;
-
-#if defined(FIXED16)
- int16 fxd_alpha = (int16) (factor * 0x8000);
- int32 tmp1, tmp2;
-
- tmp1 = (int32) in[0] << 15;
- tmp2 = (int32) prior *fxd_alpha;
- out[0] = (int16) ((tmp1 - tmp2) >> 15);
- for (i = 1; i < len; ++i) {
- tmp1 = (int32) in[i] << 15;
- tmp2 = (int32) in[i - 1] * fxd_alpha;
- out[i] = (int16) ((tmp1 - tmp2) >> 15);
- }
-#elif defined(FIXED_POINT)
- fixed32 fxd_alpha = FLOAT2FIX(factor);
- out[0] = ((fixed32) in[0] << DEFAULT_RADIX) - (prior * fxd_alpha);
- for (i = 1; i < len; ++i)
- out[i] = ((fixed32) in[i] << DEFAULT_RADIX)
- - (fixed32) in[i - 1] * fxd_alpha;
-#else
- out[0] = (frame_t) in[0] - (frame_t) prior *factor;
- for (i = 1; i < len; i++)
- out[i] = (frame_t) in[i] - (frame_t) in[i - 1] * factor;
-#endif
-}
-
-static void
-fe_short_to_frame(int16 const *in, frame_t * out, int32 len)
-{
- int i;
-
-#if defined(FIXED16)
- memcpy(out, in, len * sizeof(*out));
-#elif defined(FIXED_POINT)
- for (i = 0; i < len; i++)
- out[i] = (int32) in[i] << DEFAULT_RADIX;
-#else /* FIXED_POINT */
- for (i = 0; i < len; i++)
- out[i] = (frame_t) in[i];
-#endif /* FIXED_POINT */
-}
-
-void
-fe_create_hamming(window_t * in, int32 in_len)
-{
- int i;
-
- /* Symmetric, so we only create the first half of it. */
- for (i = 0; i < in_len / 2; i++) {
- float64 hamm;
- hamm = (0.54 - 0.46 * cos(2 * M_PI * i /
- ((float64) in_len - 1.0)));
-#ifdef FIXED16
- in[i] = (int16) (hamm * 0x8000);
-#else
- in[i] = FLOAT2COS(hamm);
-#endif
- }
-}
-
-static void
-fe_hamming_window(frame_t * in, window_t * window, int32 in_len,
- int32 remove_dc)
-{
- int i;
-
- if (remove_dc) {
-#ifdef FIXED16
- int32 mean = 0; /* Use int32 to avoid possibility of overflow */
-#else
- frame_t mean = 0;
-#endif
-
- for (i = 0; i < in_len; i++)
- mean += in[i];
- mean /= in_len;
- for (i = 0; i < in_len; i++)
- in[i] -= (frame_t) mean;
- }
-
-#ifdef FIXED16
- for (i = 0; i < in_len / 2; i++) {
- int32 tmp1, tmp2;
-
- tmp1 = (int32) in[i] * window[i];
- tmp2 = (int32) in[in_len - 1 - i] * window[i];
- in[i] = (int16) (tmp1 >> 15);
- in[in_len - 1 - i] = (int16) (tmp2 >> 15);
- }
-#else
- for (i = 0; i < in_len / 2; i++) {
- in[i] = COSMUL(in[i], window[i]);
- in[in_len - 1 - i] = COSMUL(in[in_len - 1 - i], window[i]);
- }
-#endif
-}
-
-static int
-fe_spch_to_frame(fe_t * fe, int len)
-{
- /* Copy to the frame buffer. */
- if (fe->pre_emphasis_alpha != 0.0) {
- fe_pre_emphasis(fe->spch, fe->frame, len,
- fe->pre_emphasis_alpha, fe->prior);
- if (len >= fe->frame_shift)
- fe->prior = fe->spch[fe->frame_shift - 1];
- else
- fe->prior = fe->spch[len - 1];
- }
- else
- fe_short_to_frame(fe->spch, fe->frame, len);
-
- /* Zero pad up to FFT size. */
- memset(fe->frame + len, 0, (fe->fft_size - len) * sizeof(*fe->frame));
-
- /* Window. */
- fe_hamming_window(fe->frame, fe->hamming_window, fe->frame_size,
- fe->remove_dc);
-
- return len;
-}
-
-int
-fe_read_frame(fe_t * fe, int16 const *in, int32 len)
-{
- int i;
-
- if (len > fe->frame_size)
- len = fe->frame_size;
-
- /* Read it into the raw speech buffer. */
- memcpy(fe->spch, in, len * sizeof(*in));
- /* Swap and dither if necessary. */
- if (fe->swap)
- for (i = 0; i < len; ++i)
- SWAP_INT16(&fe->spch[i]);
- if (fe->dither)
- for (i = 0; i < len; ++i)
- fe->spch[i] += (int16) ((!(s3_rand_int31() % 4)) ? 1 : 0);
-
- return fe_spch_to_frame(fe, len);
-}
-
-int
-fe_shift_frame(fe_t * fe, int16 const *in, int32 len)
-{
- int offset, i;
-
- if (len > fe->frame_shift)
- len = fe->frame_shift;
- offset = fe->frame_size - fe->frame_shift;
-
- /* Shift data into the raw speech buffer. */
- memmove(fe->spch, fe->spch + fe->frame_shift,
- offset * sizeof(*fe->spch));
- memcpy(fe->spch + offset, in, len * sizeof(*fe->spch));
- /* Swap and dither if necessary. */
- if (fe->swap)
- for (i = 0; i < len; ++i)
- SWAP_INT16(&fe->spch[offset + i]);
- if (fe->dither)
- for (i = 0; i < len; ++i)
- fe->spch[offset + i]
- += (int16) ((!(s3_rand_int31() % 4)) ? 1 : 0);
-
- return fe_spch_to_frame(fe, offset + len);
-}
-
-/**
- * Create arrays of twiddle factors.
- */
-void
-fe_create_twiddle(fe_t * fe)
-{
- int i;
-
- for (i = 0; i < fe->fft_size / 4; ++i) {
- float64 a = 2 * M_PI * i / fe->fft_size;
-#ifdef FIXED16
- fe->ccc[i] = (int16) (cos(a) * 0x8000);
- fe->sss[i] = (int16) (sin(a) * 0x8000);
-#elif defined(FIXED_POINT)
- fe->ccc[i] = FLOAT2COS(cos(a));
- fe->sss[i] = FLOAT2COS(sin(a));
-#else
- fe->ccc[i] = cos(a);
- fe->sss[i] = sin(a);
-#endif
- }
-}
-
-
-/* Translated from the FORTRAN (obviously) from "Real-Valued Fast
- * Fourier Transform Algorithms" by Henrik V. Sorensen et al., IEEE
- * Transactions on Acoustics, Speech, and Signal Processing, vol. 35,
- * no.6. The 16-bit version does a version of "block floating
- * point" in order to avoid rounding errors.
- */
-#if defined(FIXED16)
-static int
-fe_fft_real(fe_t * fe)
-{
- int i, j, k, m, n, lz;
- frame_t *x, xt, max;
-
- x = fe->frame;
- m = fe->fft_order;
- n = fe->fft_size;
-
- /* Bit-reverse the input. */
- j = 0;
- for (i = 0; i < n - 1; ++i) {
- if (i < j) {
- xt = x[j];
- x[j] = x[i];
- x[i] = xt;
- }
- k = n / 2;
- while (k <= j) {
- j -= k;
- k /= 2;
- }
- j += k;
- }
- /* Determine how many bits of dynamic range are in the input. */
- max = 0;
- for (i = 0; i < n; ++i)
- if (abs(x[i]) > max)
- max = abs(x[i]);
- /* The FFT has a gain of M bits, so we need to attenuate the input
- * by M bits minus the number of leading zeroes in the input's
- * range in order to avoid overflows. */
- for (lz = 0; lz < m; ++lz)
- if (max & (1 << (15 - lz)))
- break;
-
- /* Basic butterflies (2-point FFT, real twiddle factors):
- * x[i] = x[i] + 1 * x[i+1]
- * x[i+1] = x[i] + -1 * x[i+1]
- */
- /* The quantization error introduced by attenuating the input at
- * any given stage of the FFT has a cascading effect, so we hold
- * off on it until it's absolutely necessary. */
- for (i = 0; i < n; i += 2) {
- int atten = (lz == 0);
- xt = x[i] >> atten;
- x[i] = xt + (x[i + 1] >> atten);
- x[i + 1] = xt - (x[i + 1] >> atten);
- }
-
- /* The rest of the butterflies, in stages from 1..m */
- for (k = 1; k < m; ++k) {
- int n1, n2, n4;
- /* Start attenuating once we hit the number of leading zeros. */
- int atten = (k >= lz);
-
- n4 = k - 1;
- n2 = k;
- n1 = k + 1;
- /* Stride over each (1 << (k+1)) points */
- for (i = 0; i < n; i += (1 << n1)) {
- /* Basic butterfly with real twiddle factors:
- * x[i] = x[i] + 1 * x[i + (1<<k)]
- * x[i + (1<<k)] = x[i] + -1 * x[i + (1<<k)]
- */
- xt = x[i] >> atten;
- x[i] = xt + (x[i + (1 << n2)] >> atten);
- x[i + (1 << n2)] = xt - (x[i + (1 << n2)] >> atten);
-
- /* The other ones with real twiddle factors:
- * x[i + (1<<k) + (1<<(k-1))]
- * = 0 * x[i + (1<<k-1)] + -1 * x[i + (1<<k) + (1<<k-1)]
- * x[i + (1<<(k-1))]
- * = 1 * x[i + (1<<k-1)] + 0 * x[i + (1<<k) + (1<<k-1)]
- */
- x[i + (1 << n2) + (1 << n4)] =
- -x[i + (1 << n2) + (1 << n4)] >> atten;
- x[i + (1 << n4)] = x[i + (1 << n4)] >> atten;
-
- /* Butterflies with complex twiddle factors.
- * There are (1<<k-1) of them.
- */
- for (j = 1; j < (1 << n4); ++j) {
- frame_t cc, ss, t1, t2;
- int i1, i2, i3, i4;
-
- i1 = i + j;
- i2 = i + (1 << n2) - j;
- i3 = i + (1 << n2) + j;
- i4 = i + (1 << n2) + (1 << n2) - j;
-
- /*
- * cc = real(W[j * n / (1<<(k+1))])
- * ss = imag(W[j * n / (1<<(k+1))])
- */
- cc = fe->ccc[j << (m - n1)];
- ss = fe->sss[j << (m - n1)];
-
- /* There are some symmetry properties which allow us
- * to get away with only four multiplications here. */
- {
- int32 tmp1, tmp2;
- tmp1 = (int32) x[i3] * cc + (int32) x[i4] * ss;
- tmp2 = (int32) x[i3] * ss - (int32) x[i4] * cc;
- t1 = (int16) (tmp1 >> 15) >> atten;
- t2 = (int16) (tmp2 >> 15) >> atten;
- }
-
- x[i4] = (x[i2] >> atten) - t2;
- x[i3] = (-x[i2] >> atten) - t2;
- x[i2] = (x[i1] >> atten) - t1;
- x[i1] = (x[i1] >> atten) + t1;
- }
- }
- }
-
- /* Return the residual scaling factor. */
- return lz;
-}
-#else /* !FIXED16 */
-static int
-fe_fft_real(fe_t * fe)
-{
- int i, j, k, m, n;
- frame_t *x, xt;
-
- x = fe->frame;
- m = fe->fft_order;
- n = fe->fft_size;
-
- /* Bit-reverse the input. */
- j = 0;
- for (i = 0; i < n - 1; ++i) {
- if (i < j) {
- xt = x[j];
- x[j] = x[i];
- x[i] = xt;
- }
- k = n / 2;
- while (k <= j) {
- j -= k;
- k /= 2;
- }
- j += k;
- }
-
- /* Basic butterflies (2-point FFT, real twiddle factors):
- * x[i] = x[i] + 1 * x[i+1]
- * x[i+1] = x[i] + -1 * x[i+1]
- */
- for (i = 0; i < n; i += 2) {
- xt = x[i];
- x[i] = (xt + x[i + 1]);
- x[i + 1] = (xt - x[i + 1]);
- }
-
- /* The rest of the butterflies, in stages from 1..m */
- for (k = 1; k < m; ++k) {
- int n1, n2, n4;
-
- n4 = k - 1;
- n2 = k;
- n1 = k + 1;
- /* Stride over each (1 << (k+1)) points */
- for (i = 0; i < n; i += (1 << n1)) {
- /* Basic butterfly with real twiddle factors:
- * x[i] = x[i] + 1 * x[i + (1<<k)]
- * x[i + (1<<k)] = x[i] + -1 * x[i + (1<<k)]
- */
- xt = x[i];
- x[i] = (xt + x[i + (1 << n2)]);
- x[i + (1 << n2)] = (xt - x[i + (1 << n2)]);
-
- /* The other ones with real twiddle factors:
- * x[i + (1<<k) + (1<<(k-1))]
- * = 0 * x[i + (1<<k-1)] + -1 * x[i + (1<<k) + (1<<k-1)]
- * x[i + (1<<(k-1))]
- * = 1 * x[i + (1<<k-1)] + 0 * x[i + (1<<k) + (1<<k-1)]
- */
- x[i + (1 << n2) + (1 << n4)] = -x[i + (1 << n2) + (1 << n4)];
- x[i + (1 << n4)] = x[i + (1 << n4)];
-
- /* Butterflies with complex twiddle factors.
- * There are (1<<k-1) of them.
- */
- for (j = 1; j < (1 << n4); ++j) {
- frame_t cc, ss, t1, t2;
- int i1, i2, i3, i4;
-
- i1 = i + j;
- i2 = i + (1 << n2) - j;
- i3 = i + (1 << n2) + j;
- i4 = i + (1 << n2) + (1 << n2) - j;
-
- /*
- * cc = real(W[j * n / (1<<(k+1))])
- * ss = imag(W[j * n / (1<<(k+1))])
- */
- cc = fe->ccc[j << (m - n1)];
- ss = fe->sss[j << (m - n1)];
-
- /* There are some symmetry properties which allow us
- * to get away with only four multiplications here. */
- t1 = COSMUL(x[i3], cc) + COSMUL(x[i4], ss);
- t2 = COSMUL(x[i3], ss) - COSMUL(x[i4], cc);
-
- x[i4] = (x[i2] - t2);
- x[i3] = (-x[i2] - t2);
- x[i2] = (x[i1] - t1);
- x[i1] = (x[i1] + t1);
- }
- }
- }
-
- /* This isn't used, but return it for completeness. */
- return m;
-}
-#endif /* !FIXED16 */
-
-static void
-fe_spec_magnitude(fe_t * fe)
-{
- frame_t *fft;
- powspec_t *spec;
- int32 j, scale, fftsize;
-
- /* Do FFT and get the scaling factor back (only actually used in
- * fixed-point). Note the scaling factor is expressed in bits. */
- scale = fe_fft_real(fe);
-
- /* Convenience pointers to make things less awkward below. */
- fft = fe->frame;
- spec = fe->spec;
- fftsize = fe->fft_size;
-
- /* We need to scale things up the rest of the way to N. */
- scale = fe->fft_order - scale;
-
- /* The first point (DC coefficient) has no imaginary part */
- {
-#ifdef FIXED16
- spec[0] = fixlog(abs(fft[0]) << scale) * 2;
-#elif defined(FIXED_POINT)
- spec[0] = FIXLN(abs(fft[0]) << scale) * 2;
-#else
- spec[0] = fft[0] * fft[0];
-#endif
- }
-
- for (j = 1; j <= fftsize / 2; j++) {
-#ifdef FIXED16
- int32 rr = fixlog(abs(fft[j]) << scale) * 2;
- int32 ii = fixlog(abs(fft[fftsize - j]) << scale) * 2;
- spec[j] = fe_log_add(rr, ii);
-#elif defined(FIXED_POINT)
- int32 rr = FIXLN(abs(fft[j]) << scale) * 2;
- int32 ii = FIXLN(abs(fft[fftsize - j]) << scale) * 2;
- spec[j] = fe_log_add(rr, ii);
-#else
- spec[j] = fft[j] * fft[j] + fft[fftsize - j] * fft[fftsize - j];
-#endif
- }
-}
-
-static void
-fe_mel_spec(fe_t * fe)
-{
- int whichfilt;
- powspec_t *spec, *mfspec;
-
- /* Convenience poitners. */
- spec = fe->spec;
- mfspec = fe->mfspec;
- for (whichfilt = 0; whichfilt < fe->mel_fb->num_filters; whichfilt++) {
- int spec_start, filt_start, i;
-
- spec_start = fe->mel_fb->spec_start[whichfilt];
- filt_start = fe->mel_fb->filt_start[whichfilt];
-
-#ifdef FIXED_POINT
- mfspec[whichfilt] =
- spec[spec_start] + fe->mel_fb->filt_coeffs[filt_start];
- for (i = 1; i < fe->mel_fb->filt_width[whichfilt]; i++) {
- mfspec[whichfilt] = fe_log_add(mfspec[whichfilt],
- spec[spec_start + i] +
- fe->mel_fb->
- filt_coeffs[filt_start + i]);
- }
-#else /* !FIXED_POINT */
- mfspec[whichfilt] = 0;
- for (i = 0; i < fe->mel_fb->filt_width[whichfilt]; i++)
- mfspec[whichfilt] +=
- spec[spec_start + i] * fe->mel_fb->filt_coeffs[filt_start +
- i];
-#endif /* !FIXED_POINT */
- }
-
-}
-
-#define LOG_FLOOR 1e-4
-
-static void
-fe_mel_cep(fe_t * fe, mfcc_t * mfcep)
-{
- int32 i;
- powspec_t *mfspec;
-
- /* Convenience pointer. */
- mfspec = fe->mfspec;
-
- for (i = 0; i < fe->mel_fb->num_filters; ++i) {
-#ifndef FIXED_POINT /* It's already in log domain for fixed point */
- mfspec[i] = log(mfspec[i] + LOG_FLOOR);
-#endif /* !FIXED_POINT */
- }
-
- /* If we are doing LOG_SPEC, then do nothing. */
- if (fe->log_spec == RAW_LOG_SPEC) {
- for (i = 0; i < fe->feature_dimension; i++) {
- mfcep[i] = (mfcc_t) mfspec[i];
- }
- }
- /* For smoothed spectrum, do DCT-II followed by (its inverse) DCT-III */
- else if (fe->log_spec == SMOOTH_LOG_SPEC) {
- /* FIXME: This is probably broken for fixed-point. */
- fe_dct2(fe, mfspec, mfcep, 0);
- fe_dct3(fe, mfcep, mfspec);
- for (i = 0; i < fe->feature_dimension; i++) {
- mfcep[i] = (mfcc_t) mfspec[i];
- }
- }
- else if (fe->transform == DCT_II)
- fe_dct2(fe, mfspec, mfcep, FALSE);
- else if (fe->transform == DCT_HTK)
- fe_dct2(fe, mfspec, mfcep, TRUE);
- else
- fe_spec2cep(fe, mfspec, mfcep);
-
- return;
-}
-
-void
-fe_spec2cep(fe_t * fe, const powspec_t * mflogspec, mfcc_t * mfcep)
-{
- int32 i, j, beta;
-
- /* Compute C0 separately (its basis vector is 1) to avoid
- * costly multiplications. */
- mfcep[0] = mflogspec[0] / 2; /* beta = 0.5 */
- for (j = 1; j < fe->mel_fb->num_filters; j++)
- mfcep[0] += mflogspec[j]; /* beta = 1.0 */
- mfcep[0] /= (frame_t) fe->mel_fb->num_filters;
-
- for (i = 1; i < fe->num_cepstra; ++i) {
- mfcep[i] = 0;
- for (j = 0; j < fe->mel_fb->num_filters; j++) {
- if (j == 0)
- beta = 1; /* 0.5 */
- else
- beta = 2; /* 1.0 */
- mfcep[i] += COSMUL(mflogspec[j],
- fe->mel_fb->mel_cosine[i][j]) * beta;
- }
- /* Note that this actually normalizes by num_filters, like the
- * original Sphinx front-end, due to the doubled 'beta' factor
- * above. */
- mfcep[i] /= (frame_t) fe->mel_fb->num_filters * 2;
- }
-}
-
-void
-fe_dct2(fe_t * fe, const powspec_t * mflogspec, mfcc_t * mfcep, int htk)
-{
- int32 i, j;
-
- /* Compute C0 separately (its basis vector is 1) to avoid
- * costly multiplications. */
- mfcep[0] = mflogspec[0];
- for (j = 1; j < fe->mel_fb->num_filters; j++)
- mfcep[0] += mflogspec[j];
- if (htk)
- mfcep[0] = COSMUL(mfcep[0], fe->mel_fb->sqrt_inv_2n);
- else /* sqrt(1/N) = sqrt(2/N) * 1/sqrt(2) */
- mfcep[0] = COSMUL(mfcep[0], fe->mel_fb->sqrt_inv_n);
-
- for (i = 1; i < fe->num_cepstra; ++i) {
- mfcep[i] = 0;
- for (j = 0; j < fe->mel_fb->num_filters; j++) {
- mfcep[i] += COSMUL(mflogspec[j], fe->mel_fb->mel_cosine[i][j]);
- }
- mfcep[i] = COSMUL(mfcep[i], fe->mel_fb->sqrt_inv_2n);
- }
-}
-
-void
-fe_lifter(fe_t * fe, mfcc_t * mfcep)
-{
- int32 i;
-
- if (fe->mel_fb->lifter_val == 0)
- return;
-
- for (i = 0; i < fe->num_cepstra; ++i) {
- mfcep[i] = MFCCMUL(mfcep[i], fe->mel_fb->lifter[i]);
- }
-}
-
-void
-fe_dct3(fe_t * fe, const mfcc_t * mfcep, powspec_t * mflogspec)
-{
- int32 i, j;
-
- for (i = 0; i < fe->mel_fb->num_filters; ++i) {
- mflogspec[i] = COSMUL(mfcep[0], SQRT_HALF);
- for (j = 1; j < fe->num_cepstra; j++) {
- mflogspec[i] += COSMUL(mfcep[j], fe->mel_fb->mel_cosine[j][i]);
- }
- mflogspec[i] = COSMUL(mflogspec[i], fe->mel_fb->sqrt_inv_2n);
- }
-}
-
-void
-fe_write_frame(fe_t * fe, mfcc_t * fea)
-{
- int32 is_speech;
-
- fe_spec_magnitude(fe);
- fe_mel_spec(fe);
- fe_track_snr(fe, &is_speech);
- fe_mel_cep(fe, fea);
- fe_lifter(fe, fea);
- fe_vad_hangover(fe, fea, is_speech);
-}
-
-
-void *
-fe_create_2d(int32 d1, int32 d2, int32 elem_size)
-{
- return (void *) ckd_calloc_2d(d1, d2, elem_size);
-}
-
-void
-fe_free_2d(void *arr)
-{
- ckd_free_2d((void **) arr);
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_type.h b/media/sphinxbase/src/libsphinxbase/fe/fe_type.h
deleted file mode 100644
index 160ed8ff8..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_type.h
+++ /dev/null
@@ -1,65 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2013 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-#ifndef FE_TYPE_H
-#define FE_TYPE_H
-
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-
-#include "sphinxbase/fe.h"
-#include "sphinxbase/fixpoint.h"
-
-#ifdef FIXED16
-/* Q15 format */
-typedef int16 frame_t;
-typedef int16 window_t;
-typedef int32 powspec_t;
-typedef struct { int16 r, i; } complex;
-#elif defined(FIXED_POINT)
-typedef fixed32 frame_t;
-typedef int32 powspec_t;
-typedef fixed32 window_t;
-typedef struct { fixed32 r, i; } complex;
-#else /* FIXED_POINT */
-typedef float64 frame_t;
-typedef float64 powspec_t;
-typedef float64 window_t;
-typedef struct { float64 r, i; } complex;
-#endif /* FIXED_POINT */
-
-#endif /* FE_TYPE_H */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp.c b/media/sphinxbase/src/libsphinxbase/fe/fe_warp.c
deleted file mode 100644
index e409bea76..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp.c
+++ /dev/null
@@ -1,252 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-/*********************************************************************
- *
- * File: fe_warp.c
- *
- * Description:
- * Allows a caller to choose a warping function.
- *********************************************************************/
-
-/* static char rcsid[] = "@(#)$Id: fe_warp.c,v 1.2 2006/02/17 00:31:34 egouvea Exp $";*/
-
-#include "fe_warp_inverse_linear.h"
-#include "fe_warp_affine.h"
-#include "fe_warp_piecewise_linear.h"
-#include "fe_warp.h"
-
-#include "sphinxbase/err.h"
-
-#include <stdio.h>
-#include <string.h>
-#include <assert.h>
-#include <stdlib.h>
-
-/* This is for aliases for each of the entries below. Currently not
- used.
-*/
-static char *__name2id[] = {
- "inverse",
- "linear",
- "piecewise",
- NULL
-};
-
-static char *name2id[] = {
- "inverse_linear",
- "affine",
- "piecewise_linear",
- NULL
-};
-
-static fe_warp_conf_t fe_warp_conf[FE_WARP_ID_MAX + 1] = {
- {fe_warp_inverse_linear_set_parameters,
- fe_warp_inverse_linear_doc,
- fe_warp_inverse_linear_id,
- fe_warp_inverse_linear_n_param,
- fe_warp_inverse_linear_warped_to_unwarped,
- fe_warp_inverse_linear_unwarped_to_warped,
- fe_warp_inverse_linear_print}, /* Inverse linear warping */
- {fe_warp_affine_set_parameters,
- fe_warp_affine_doc,
- fe_warp_affine_id,
- fe_warp_affine_n_param,
- fe_warp_affine_warped_to_unwarped,
- fe_warp_affine_unwarped_to_warped,
- fe_warp_affine_print}, /* Affine warping */
- {fe_warp_piecewise_linear_set_parameters,
- fe_warp_piecewise_linear_doc,
- fe_warp_piecewise_linear_id,
- fe_warp_piecewise_linear_n_param,
- fe_warp_piecewise_linear_warped_to_unwarped,
- fe_warp_piecewise_linear_unwarped_to_warped,
- fe_warp_piecewise_linear_print}, /* Piecewise_Linear warping */
-};
-
-int
-fe_warp_set(melfb_t *mel, const char *id_name)
-{
- uint32 i;
-
- for (i = 0; name2id[i]; i++) {
- if (strcmp(id_name, name2id[i]) == 0) {
- mel->warp_id = i;
- break;
- }
- }
-
- if (name2id[i] == NULL) {
- for (i = 0; __name2id[i]; i++) {
- if (strcmp(id_name, __name2id[i]) == 0) {
- mel->warp_id = i;
- break;
- }
- }
- if (__name2id[i] == NULL) {
- E_ERROR("Unimplemented warping function %s\n", id_name);
- E_ERROR("Implemented functions are:\n");
- for (i = 0; name2id[i]; i++) {
- fprintf(stderr, "\t%s\n", name2id[i]);
- }
- mel->warp_id = FE_WARP_ID_NONE;
-
- return FE_START_ERROR;
- }
- }
-
- return FE_SUCCESS;
-}
-
-void
-fe_warp_set_parameters(melfb_t *mel, char const *param_str, float sampling_rate)
-{
- if (mel->warp_id <= FE_WARP_ID_MAX) {
- fe_warp_conf[mel->warp_id].set_parameters(param_str, sampling_rate);
- }
- else if (mel->warp_id == FE_WARP_ID_NONE) {
- E_FATAL("feat module must be configured w/ a valid ID\n");
- }
- else {
- E_FATAL
- ("fe_warp module misconfigured with invalid fe_warp_id %u\n",
- mel->warp_id);
- }
-}
-
-const char *
-fe_warp_doc(melfb_t *mel)
-{
- if (mel->warp_id <= FE_WARP_ID_MAX) {
- return fe_warp_conf[mel->warp_id].doc();
- }
- else if (mel->warp_id == FE_WARP_ID_NONE) {
- E_FATAL("fe_warp module must be configured w/ a valid ID\n");
- }
- else {
- E_FATAL
- ("fe_warp module misconfigured with invalid fe_warp_id %u\n",
- mel->warp_id);
- }
-
- return NULL;
-}
-
-uint32
-fe_warp_id(melfb_t *mel)
-{
- if (mel->warp_id <= FE_WARP_ID_MAX) {
- assert(mel->warp_id == fe_warp_conf[mel->warp_id].id());
- return mel->warp_id;
- }
- else if (mel->warp_id != FE_WARP_ID_NONE) {
- E_FATAL
- ("fe_warp module misconfigured with invalid fe_warp_id %u\n",
- mel->warp_id);
- }
-
- return FE_WARP_ID_NONE;
-}
-
-uint32
-fe_warp_n_param(melfb_t *mel)
-{
- if (mel->warp_id <= FE_WARP_ID_MAX) {
- return fe_warp_conf[mel->warp_id].n_param();
- }
- else if (mel->warp_id == FE_WARP_ID_NONE) {
- E_FATAL("fe_warp module must be configured w/ a valid ID\n");
- }
- else {
- E_FATAL
- ("fe_warp module misconfigured with invalid fe_warp_id %u\n",
- mel->warp_id);
- }
-
- return 0;
-}
-
-float
-fe_warp_warped_to_unwarped(melfb_t *mel, float nonlinear)
-{
- if (mel->warp_id <= FE_WARP_ID_MAX) {
- return fe_warp_conf[mel->warp_id].warped_to_unwarped(nonlinear);
- }
- else if (mel->warp_id == FE_WARP_ID_NONE) {
- E_FATAL("fe_warp module must be configured w/ a valid ID\n");
- }
- else {
- E_FATAL
- ("fe_warp module misconfigured with invalid fe_warp_id %u\n",
- mel->warp_id);
- }
-
- return 0;
-}
-
-float
-fe_warp_unwarped_to_warped(melfb_t *mel,float linear)
-{
- if (mel->warp_id <= FE_WARP_ID_MAX) {
- return fe_warp_conf[mel->warp_id].unwarped_to_warped(linear);
- }
- else if (mel->warp_id == FE_WARP_ID_NONE) {
- E_FATAL("fe_warp module must be configured w/ a valid ID\n");
- }
- else {
- E_FATAL
- ("fe_warp module misconfigured with invalid fe_warp_id %u\n",
- mel->warp_id);
- }
-
- return 0;
-}
-
-void
-fe_warp_print(melfb_t *mel, const char *label)
-{
- if (mel->warp_id <= FE_WARP_ID_MAX) {
- fe_warp_conf[mel->warp_id].print(label);
- }
- else if (mel->warp_id == FE_WARP_ID_NONE) {
- E_FATAL("fe_warp module must be configured w/ a valid ID\n");
- }
- else {
- E_FATAL
- ("fe_warp module misconfigured with invalid fe_warp_id %u\n",
- mel->warp_id);
- }
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp.h b/media/sphinxbase/src/libsphinxbase/fe/fe_warp.h
deleted file mode 100644
index f2fd14550..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp.h
+++ /dev/null
@@ -1,90 +0,0 @@
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-#ifndef FE_WARP_H
-#define FE_WARP_H
-
-#include "fe_internal.h"
-
-#ifdef __cplusplus
-extern "C" {
-#endif
-#if 0
-/* Fool Emacs. */
-}
-#endif
-
-#define FE_WARP_ID_INVERSE_LINEAR 0
-#define FE_WARP_ID_AFFINE 1
-#define FE_WARP_ID_PIECEWISE_LINEAR 2
-#define FE_WARP_ID_EIDE_GISH 3
-#define FE_WARP_ID_MAX 2
-#define FE_WARP_ID_NONE 0xffffffff
-
-typedef struct {
- void (*set_parameters)(char const *param_str, float sampling_rate);
- const char * (*doc)(void);
- uint32 (*id)(void);
- uint32 (*n_param)(void);
- float (*warped_to_unwarped)(float nonlinear);
- float (*unwarped_to_warped)(float linear);
- void (*print)(const char *label);
-} fe_warp_conf_t;
-
-int fe_warp_set(melfb_t *mel, const char *id_name);
-
-uint32 fe_warp_id(melfb_t *mel);
-
-const char * fe_warp_doc(melfb_t *mel);
-
-void fe_warp_set_parameters(melfb_t *mel, char const *param_str, float sampling_rate);
-
-uint32 fe_warp_n_param(melfb_t *mel);
-
-float fe_warp_warped_to_unwarped(melfb_t *mel, float nonlinear);
-
-float fe_warp_unwarped_to_warped(melfb_t *mel, float linear);
-
-void fe_warp_print(melfb_t *mel, const char *label);
-
-#define FE_WARP_NO_SIZE 0xffffffff
-
-#ifdef __cplusplus
-}
-#endif
-
-
-#endif /* FE_WARP_H */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.c b/media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.c
deleted file mode 100644
index 398611917..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.c
+++ /dev/null
@@ -1,181 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-/*********************************************************************
- *
- * File: fe_warp_affine.c
- *
- * Description:
- * Warp the frequency axis according to an affine function, i.e.:
- *
- * w' = a * w + b
- *
- *********************************************************************/
-
-/* static char rcsid[] = "@(#)$Id: fe_warp_affine.c,v 1.2 2006/02/17 00:31:34 egouvea Exp $"; */
-
-#include <stdio.h>
-#include <stdlib.h>
-#include <math.h>
-#include <string.h>
-
-#ifdef _MSC_VER
-#pragma warning (disable: 4996)
-#endif
-
-#include "sphinxbase/strfuncs.h"
-#include "sphinxbase/err.h"
-
-#include "fe_warp.h"
-#include "fe_warp_affine.h"
-
-#define N_PARAM 2
-#define YES 1
-#define NO 0
-
-/*
- * params[0] : a
- * params[1] : b
- */
-static float params[N_PARAM] = { 1.0f, 0.0f };
-static int32 is_neutral = YES;
-static char p_str[256] = "";
-static float nyquist_frequency = 0.0f;
-
-
-const char *
-fe_warp_affine_doc()
-{
- return "affine :== < w' = a * x + b >";
-}
-
-uint32
-fe_warp_affine_id()
-{
- return FE_WARP_ID_AFFINE;
-}
-
-uint32
-fe_warp_affine_n_param()
-{
- return N_PARAM;
-}
-
-void
-fe_warp_affine_set_parameters(char const *param_str, float sampling_rate)
-{
- char *tok;
- char *seps = " \t";
- char temp_param_str[256];
- int param_index = 0;
-
- nyquist_frequency = sampling_rate / 2;
- if (param_str == NULL) {
- is_neutral = YES;
- return;
- }
- /* The new parameters are the same as the current ones, so do nothing. */
- if (strcmp(param_str, p_str) == 0) {
- return;
- }
- is_neutral = NO;
- strcpy(temp_param_str, param_str);
- memset(params, 0, N_PARAM * sizeof(float));
- strcpy(p_str, param_str);
- /* FIXME: strtok() is not re-entrant... */
- tok = strtok(temp_param_str, seps);
- while (tok != NULL) {
- params[param_index++] = (float) atof_c(tok);
- tok = strtok(NULL, seps);
- if (param_index >= N_PARAM) {
- break;
- }
- }
- if (tok != NULL) {
- E_INFO
- ("Affine warping takes up to two arguments, %s ignored.\n",
- tok);
- }
- if (params[0] == 0) {
- is_neutral = YES;
- E_INFO
- ("Affine warping cannot have slope zero, warping not applied.\n");
- }
-}
-
-float
-fe_warp_affine_warped_to_unwarped(float nonlinear)
-{
- if (is_neutral) {
- return nonlinear;
- }
- else {
- /* linear = (nonlinear - b) / a */
- float temp = nonlinear - params[1];
- temp /= params[0];
- if (temp > nyquist_frequency) {
- E_WARN
- ("Warp factor %g results in frequency (%.1f) higher than Nyquist (%.1f)\n",
- params[0], temp, nyquist_frequency);
- }
- return temp;
- }
-}
-
-float
-fe_warp_affine_unwarped_to_warped(float linear)
-{
- if (is_neutral) {
- return linear;
- }
- else {
- /* nonlinear = a * linear - b */
- float temp = linear * params[0];
- temp += params[1];
- return temp;
- }
-}
-
-void
-fe_warp_affine_print(const char *label)
-{
- uint32 i;
-
- for (i = 0; i < N_PARAM; i++) {
- printf("%s[%04u]: %6.3f ", label, i, params[i]);
- }
- printf("\n");
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.h b/media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.h
deleted file mode 100644
index 44027d97a..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_affine.h
+++ /dev/null
@@ -1,76 +0,0 @@
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-#ifndef FE_WARP_AFFINE_H
-#define FE_WARP_AFFINE_H
-
-#include "sphinxbase/fe.h"
-
-
-#ifdef __cplusplus
-extern "C" {
-#endif
-#if 0
-/* Fool Emacs. */
-}
-#endif
-
-const char *
-fe_warp_affine_doc(void);
-
-uint32
-fe_warp_affine_id(void);
-
-uint32
-fe_warp_affine_n_param(void);
-
-void
-fe_warp_affine_set_parameters(char const *param_str, float sampling_rate);
-
-float
-fe_warp_affine_warped_to_unwarped(float nonlinear);
-
-float
-fe_warp_affine_unwarped_to_warped(float linear);
-
-void
-fe_warp_affine_print(const char *label);
-
-#ifdef __cplusplus
-}
-#endif
-
-#endif /* FE_WARP_AFFINE_H */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.c b/media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.c
deleted file mode 100644
index 85e42986b..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.c
+++ /dev/null
@@ -1,178 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-/*********************************************************************
- *
- * File: fe_warp_inverse_linear.c
- *
- * Description:
- * Warp the frequency axis according to an inverse_linear function, i.e.:
- *
- * w' = w / a
- *
- *********************************************************************/
-
-/* static char rcsid[] = "@(#)$Id: fe_warp_inverse_linear.c,v 1.3 2006/02/23 19:40:11 eht Exp $"; */
-
-#include <stdio.h>
-#include <stdlib.h>
-#include <math.h>
-#include <string.h>
-
-#ifdef _MSC_VER
-#pragma warning (disable: 4996)
-#endif
-
-#include "sphinxbase/strfuncs.h"
-#include "sphinxbase/err.h"
-
-#include "fe_warp.h"
-#include "fe_warp_inverse_linear.h"
-
-#define N_PARAM 1
-#define YES 1
-#define NO 0
-
-/*
- * params[0] : a
- */
-static float params[N_PARAM] = { 1.0f };
-static int32 is_neutral = YES;
-static char p_str[256] = "";
-static float nyquist_frequency = 0.0f;
-
-
-const char *
-fe_warp_inverse_linear_doc()
-{
- return "inverse_linear :== < w' = x / a >";
-}
-
-uint32
-fe_warp_inverse_linear_id()
-{
- return FE_WARP_ID_INVERSE_LINEAR;
-}
-
-uint32
-fe_warp_inverse_linear_n_param()
-{
- return N_PARAM;
-}
-
-void
-fe_warp_inverse_linear_set_parameters(char const *param_str, float sampling_rate)
-{
- char *tok;
- char *seps = " \t";
- char temp_param_str[256];
- int param_index = 0;
-
- nyquist_frequency = sampling_rate / 2;
- if (param_str == NULL) {
- is_neutral = YES;
- return;
- }
- /* The new parameters are the same as the current ones, so do nothing. */
- if (strcmp(param_str, p_str) == 0) {
- return;
- }
- is_neutral = NO;
- strcpy(temp_param_str, param_str);
- memset(params, 0, N_PARAM * sizeof(float));
- strcpy(p_str, param_str);
- /* FIXME: strtok() is not re-entrant... */
- tok = strtok(temp_param_str, seps);
- while (tok != NULL) {
- params[param_index++] = (float) atof_c(tok);
- tok = strtok(NULL, seps);
- if (param_index >= N_PARAM) {
- break;
- }
- }
- if (tok != NULL) {
- E_INFO
- ("Inverse linear warping takes only one argument, %s ignored.\n",
- tok);
- }
- if (params[0] == 0) {
- is_neutral = YES;
- E_INFO
- ("Inverse linear warping cannot have slope zero, warping not applied.\n");
- }
-}
-
-float
-fe_warp_inverse_linear_warped_to_unwarped(float nonlinear)
-{
- if (is_neutral) {
- return nonlinear;
- }
- else {
- /* linear = nonlinear * a */
- float temp = nonlinear * params[0];
- if (temp > nyquist_frequency) {
- E_WARN
- ("Warp factor %g results in frequency (%.1f) higher than Nyquist (%.1f)\n",
- params[0], temp, nyquist_frequency);
- }
- return temp;
- }
-}
-
-float
-fe_warp_inverse_linear_unwarped_to_warped(float linear)
-{
- if (is_neutral) {
- return linear;
- }
- else {
- /* nonlinear = a / linear */
- float temp = linear / params[0];
- return temp;
- }
-}
-
-void
-fe_warp_inverse_linear_print(const char *label)
-{
- uint32 i;
-
- for (i = 0; i < N_PARAM; i++) {
- printf("%s[%04u]: %6.3f ", label, i, params[i]);
- }
- printf("\n");
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.h b/media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.h
deleted file mode 100644
index 8d4a76725..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_inverse_linear.h
+++ /dev/null
@@ -1,77 +0,0 @@
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-#ifndef FE_WARP_inverse_linear_H
-#define FE_WARP_inverse_linear_H
-
-#include "sphinxbase/fe.h"
-
-
-#ifdef __cplusplus
-extern "C" {
-#endif
-#if 0
-/* Fool Emacs. */
-}
-#endif
-
-const char *
-fe_warp_inverse_linear_doc(void);
-
-uint32
-fe_warp_inverse_linear_id(void);
-
-uint32
-fe_warp_inverse_linear_n_param(void);
-
-void
-fe_warp_inverse_linear_set_parameters(char const *param_str, float sampling_rate);
-
-float
-fe_warp_inverse_linear_warped_to_unwarped(float nonlinear);
-
-float
-fe_warp_inverse_linear_unwarped_to_warped(float linear);
-
-void
-fe_warp_inverse_linear_print(const char *label);
-
-#ifdef __cplusplus
-}
-#endif
-
-
-#endif /* FE_WARP_inverse_linear_H */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.c b/media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.c
deleted file mode 100644
index 34570120f..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.c
+++ /dev/null
@@ -1,223 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-/*********************************************************************
- *
- * File: fe_warp_piecewise_linear.c
- *
- * Description:
- *
- * Warp the frequency axis according to an piecewise linear
- * function. The function is linear up to a frequency F, where
- * the slope changes so that the Nyquist frequency in the warped
- * axis maps to the Nyquist frequency in the unwarped.
- *
- * w' = a * w, w < F
- * w' = a' * w + b, W > F
- * w'(0) = 0
- * w'(F) = F
- * w'(Nyq) = Nyq
- *
- *********************************************************************/
-
-/* static char rcsid[] = "@(#)$Id: fe_warp_piecewise_linear.c,v 1.2 2006/02/17 00:31:34 egouvea Exp $"; */
-
-#include <stdio.h>
-#include <stdlib.h>
-#include <math.h>
-#include <string.h>
-
-#ifdef _MSC_VER
-#pragma warning (disable: 4996)
-#endif
-
-#include "sphinxbase/strfuncs.h"
-#include "sphinxbase/err.h"
-
-#include "fe_warp.h"
-#include "fe_warp_piecewise_linear.h"
-
-#define N_PARAM 2
-#define YES 1
-#define NO 0
-
-/*
- * params[0] : a
- * params[1] : F (the non-differentiable point)
- */
-static float params[N_PARAM] = { 1.0f, 6800.0f };
-static float final_piece[2];
-static int32 is_neutral = YES;
-static char p_str[256] = "";
-static float nyquist_frequency = 0.0f;
-
-
-const char *
-fe_warp_piecewise_linear_doc()
-{
- return "piecewise_linear :== < w' = a * w, w < F >";
-}
-
-uint32
-fe_warp_piecewise_linear_id()
-{
- return FE_WARP_ID_PIECEWISE_LINEAR;
-}
-
-uint32
-fe_warp_piecewise_linear_n_param()
-{
- return N_PARAM;
-}
-
-void
-fe_warp_piecewise_linear_set_parameters(char const *param_str,
- float sampling_rate)
-{
- char *tok;
- char *seps = " \t";
- char temp_param_str[256];
- int param_index = 0;
-
- nyquist_frequency = sampling_rate / 2;
- if (param_str == NULL) {
- is_neutral = YES;
- return;
- }
- /* The new parameters are the same as the current ones, so do nothing. */
- if (strcmp(param_str, p_str) == 0) {
- return;
- }
- is_neutral = NO;
- strcpy(temp_param_str, param_str);
- memset(params, 0, N_PARAM * sizeof(float));
- memset(final_piece, 0, 2 * sizeof(float));
- strcpy(p_str, param_str);
- /* FIXME: strtok() is not re-entrant... */
- tok = strtok(temp_param_str, seps);
- while (tok != NULL) {
- params[param_index++] = (float) atof_c(tok);
- tok = strtok(NULL, seps);
- if (param_index >= N_PARAM) {
- break;
- }
- }
- if (tok != NULL) {
- E_INFO
- ("Piecewise linear warping takes up to two arguments, %s ignored.\n",
- tok);
- }
- if (params[1] < sampling_rate) {
- /* Precompute these. These are the coefficients of a
- * straight line that contains the points (F, aF) and (N,
- * N), where a = params[0], F = params[1], N = Nyquist
- * frequency.
- */
- if (params[1] == 0) {
- params[1] = sampling_rate * 0.85f;
- }
- final_piece[0] =
- (nyquist_frequency -
- params[0] * params[1]) / (nyquist_frequency - params[1]);
- final_piece[1] =
- nyquist_frequency * params[1] * (params[0] -
- 1.0f) / (nyquist_frequency -
- params[1]);
- }
- else {
- memset(final_piece, 0, 2 * sizeof(float));
- }
- if (params[0] == 0) {
- is_neutral = YES;
- E_INFO
- ("Piecewise linear warping cannot have slope zero, warping not applied.\n");
- }
-}
-
-float
-fe_warp_piecewise_linear_warped_to_unwarped(float nonlinear)
-{
- if (is_neutral) {
- return nonlinear;
- }
- else {
- /* linear = (nonlinear - b) / a */
- float temp;
- if (nonlinear < params[0] * params[1]) {
- temp = nonlinear / params[0];
- }
- else {
- temp = nonlinear - final_piece[1];
- temp /= final_piece[0];
- }
- if (temp > nyquist_frequency) {
- E_WARN
- ("Warp factor %g results in frequency (%.1f) higher than Nyquist (%.1f)\n",
- params[0], temp, nyquist_frequency);
- }
- return temp;
- }
-}
-
-float
-fe_warp_piecewise_linear_unwarped_to_warped(float linear)
-{
- if (is_neutral) {
- return linear;
- }
- else {
- float temp;
- /* nonlinear = a * linear - b */
- if (linear < params[1]) {
- temp = linear * params[0];
- }
- else {
- temp = final_piece[0] * linear + final_piece[1];
- }
- return temp;
- }
-}
-
-void
-fe_warp_piecewise_linear_print(const char *label)
-{
- uint32 i;
-
- for (i = 0; i < N_PARAM; i++) {
- printf("%s[%04u]: %6.3f ", label, i, params[i]);
- }
- printf("\n");
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.h b/media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.h
deleted file mode 100644
index f15cb251e..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fe_warp_piecewise_linear.h
+++ /dev/null
@@ -1,77 +0,0 @@
-/* ====================================================================
- * Copyright (c) 2006 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- */
-
-#ifndef FE_WARP_PIECEWIDE_LINEAR_H
-#define FE_WARP_PIECEWIDE_LINEAR_H
-
-#include "sphinxbase/fe.h"
-
-
-#ifdef __cplusplus
-extern "C" {
-#endif
-#if 0
-/* Fool Emacs. */
-}
-#endif
-
-const char *
-fe_warp_piecewise_linear_doc(void);
-
-uint32
-fe_warp_piecewise_linear_id(void);
-
-uint32
-fe_warp_piecewise_linear_n_param(void);
-
-void
-fe_warp_piecewise_linear_set_parameters(char const *param_str, float sampling_rate);
-
-float
-fe_warp_piecewise_linear_warped_to_unwarped(float nonlinear);
-
-float
-fe_warp_piecewise_linear_unwarped_to_warped(float linear);
-
-void
-fe_warp_piecewise_linear_print(const char *label);
-
-#ifdef __cplusplus
-}
-#endif
-
-
-#endif /* FE_WARP_PIECEWIDE_LINEAR_H */
diff --git a/media/sphinxbase/src/libsphinxbase/fe/fixlog.c b/media/sphinxbase/src/libsphinxbase/fe/fixlog.c
deleted file mode 100644
index 459c9ffd6..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/fixlog.c
+++ /dev/null
@@ -1,229 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/* ====================================================================
- * Copyright (c) 2005 Carnegie Mellon University. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * This work was supported in part by funding from the Defense Advanced
- * Research Projects Agency and the National Science Foundation of the
- * United States of America, and the CMU Sphinx Speech Consortium.
- *
- * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND
- * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
- * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY
- * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- *
- * ====================================================================
- *
- * File: fixlog.c
- *
- * Description: Fast approximate fixed-point logarithms
- *
- * Author: David Huggins-Daines <dhuggins@cs.cmu.edu>
- *
- */
-
-#ifdef HAVE_CONFIG_H
-#include <config.h>
-#endif
-
-#include "sphinxbase/prim_type.h"
-#include "sphinxbase/fixpoint.h"
-
-#include "fe_internal.h"
-
-/* Table of log2(x/128)*(1<<DEFAULT_RADIX) */
-/* perl -e 'for (0..128) {my $x = 1 + $_/128; $y = 1 + ($_ + 1.) / 128;
- print " (uint32)(", (log($x) + log($y))/2/log(2)," *(1<<DEFAULT_RADIX)),\n"}' */
-static uint32 logtable[] = {
- (uint32)(0.00561362771162706*(1<<DEFAULT_RADIX)),
- (uint32)(0.0167975342258543*(1<<DEFAULT_RADIX)),
- (uint32)(0.0278954072829524*(1<<DEFAULT_RADIX)),
- (uint32)(0.0389085604479519*(1<<DEFAULT_RADIX)),
- (uint32)(0.0498382774298215*(1<<DEFAULT_RADIX)),
- (uint32)(0.060685812979481*(1<<DEFAULT_RADIX)),
- (uint32)(0.0714523937543017*(1<<DEFAULT_RADIX)),
- (uint32)(0.0821392191505851*(1<<DEFAULT_RADIX)),
- (uint32)(0.0927474621054331*(1<<DEFAULT_RADIX)),
- (uint32)(0.103278269869348*(1<<DEFAULT_RADIX)),
- (uint32)(0.113732764750838*(1<<DEFAULT_RADIX)),
- (uint32)(0.124112044834237*(1<<DEFAULT_RADIX)),
- (uint32)(0.13441718467188*(1<<DEFAULT_RADIX)),
- (uint32)(0.144649235951738*(1<<DEFAULT_RADIX)),
- (uint32)(0.154809228141536*(1<<DEFAULT_RADIX)),
- (uint32)(0.164898169110351*(1<<DEFAULT_RADIX)),
- (uint32)(0.174917045728623*(1<<DEFAULT_RADIX)),
- (uint32)(0.184866824447476*(1<<DEFAULT_RADIX)),
- (uint32)(0.194748451858191*(1<<DEFAULT_RADIX)),
- (uint32)(0.204562855232657*(1<<DEFAULT_RADIX)),
- (uint32)(0.214310943045556*(1<<DEFAULT_RADIX)),
- (uint32)(0.223993605479021*(1<<DEFAULT_RADIX)),
- (uint32)(0.23361171491048*(1<<DEFAULT_RADIX)),
- (uint32)(0.243166126384332*(1<<DEFAULT_RADIX)),
- (uint32)(0.252657678068119*(1<<DEFAULT_RADIX)),
- (uint32)(0.262087191693777*(1<<DEFAULT_RADIX)),
- (uint32)(0.271455472984569*(1<<DEFAULT_RADIX)),
- (uint32)(0.280763312068243*(1<<DEFAULT_RADIX)),
- (uint32)(0.290011483876938*(1<<DEFAULT_RADIX)),
- (uint32)(0.299200748534365*(1<<DEFAULT_RADIX)),
- (uint32)(0.308331851730729*(1<<DEFAULT_RADIX)),
- (uint32)(0.317405525085859*(1<<DEFAULT_RADIX)),
- (uint32)(0.32642248650099*(1<<DEFAULT_RADIX)),
- (uint32)(0.335383440499621*(1<<DEFAULT_RADIX)),
- (uint32)(0.344289078557851*(1<<DEFAULT_RADIX)),
- (uint32)(0.353140079424581*(1<<DEFAULT_RADIX)),
- (uint32)(0.36193710943195*(1<<DEFAULT_RADIX)),
- (uint32)(0.37068082279637*(1<<DEFAULT_RADIX)),
- (uint32)(0.379371861910488*(1<<DEFAULT_RADIX)),
- (uint32)(0.388010857626406*(1<<DEFAULT_RADIX)),
- (uint32)(0.396598429530472*(1<<DEFAULT_RADIX)),
- (uint32)(0.405135186209943*(1<<DEFAULT_RADIX)),
- (uint32)(0.4136217255118*(1<<DEFAULT_RADIX)),
- (uint32)(0.422058634793998*(1<<DEFAULT_RADIX)),
- (uint32)(0.430446491169411*(1<<DEFAULT_RADIX)),
- (uint32)(0.438785861742727*(1<<DEFAULT_RADIX)),
- (uint32)(0.447077303840529*(1<<DEFAULT_RADIX)),
- (uint32)(0.455321365234813*(1<<DEFAULT_RADIX)),
- (uint32)(0.463518584360147*(1<<DEFAULT_RADIX)),
- (uint32)(0.471669490524698*(1<<DEFAULT_RADIX)),
- (uint32)(0.479774604115327*(1<<DEFAULT_RADIX)),
- (uint32)(0.487834436796966*(1<<DEFAULT_RADIX)),
- (uint32)(0.49584949170644*(1<<DEFAULT_RADIX)),
- (uint32)(0.503820263640951*(1<<DEFAULT_RADIX)),
- (uint32)(0.511747239241369*(1<<DEFAULT_RADIX)),
- (uint32)(0.519630897170528*(1<<DEFAULT_RADIX)),
- (uint32)(0.527471708286662*(1<<DEFAULT_RADIX)),
- (uint32)(0.535270135812172*(1<<DEFAULT_RADIX)),
- (uint32)(0.543026635497834*(1<<DEFAULT_RADIX)),
- (uint32)(0.550741655782637*(1<<DEFAULT_RADIX)),
- (uint32)(0.558415637949355*(1<<DEFAULT_RADIX)),
- (uint32)(0.56604901627601*(1<<DEFAULT_RADIX)),
- (uint32)(0.573642218183348*(1<<DEFAULT_RADIX)),
- (uint32)(0.581195664378452*(1<<DEFAULT_RADIX)),
- (uint32)(0.588709768994618*(1<<DEFAULT_RADIX)),
- (uint32)(0.596184939727604*(1<<DEFAULT_RADIX)),
- (uint32)(0.603621577968369*(1<<DEFAULT_RADIX)),
- (uint32)(0.61102007893241*(1<<DEFAULT_RADIX)),
- (uint32)(0.618380831785792*(1<<DEFAULT_RADIX)),
- (uint32)(0.625704219767993*(1<<DEFAULT_RADIX)),
- (uint32)(0.632990620311629*(1<<DEFAULT_RADIX)),
- (uint32)(0.640240405159187*(1<<DEFAULT_RADIX)),
- (uint32)(0.647453940476827*(1<<DEFAULT_RADIX)),
- (uint32)(0.654631586965362*(1<<DEFAULT_RADIX)),
- (uint32)(0.661773699968486*(1<<DEFAULT_RADIX)),
- (uint32)(0.668880629578336*(1<<DEFAULT_RADIX)),
- (uint32)(0.675952720738471*(1<<DEFAULT_RADIX)),
- (uint32)(0.682990313344332*(1<<DEFAULT_RADIX)),
- (uint32)(0.689993742341272*(1<<DEFAULT_RADIX)),
- (uint32)(0.696963337820209*(1<<DEFAULT_RADIX)),
- (uint32)(0.703899425110987*(1<<DEFAULT_RADIX)),
- (uint32)(0.710802324873503*(1<<DEFAULT_RADIX)),
- (uint32)(0.717672353186654*(1<<DEFAULT_RADIX)),
- (uint32)(0.724509821635192*(1<<DEFAULT_RADIX)),
- (uint32)(0.731315037394519*(1<<DEFAULT_RADIX)),
- (uint32)(0.738088303313493*(1<<DEFAULT_RADIX)),
- (uint32)(0.744829917995304*(1<<DEFAULT_RADIX)),
- (uint32)(0.751540175876464*(1<<DEFAULT_RADIX)),
- (uint32)(0.758219367303974*(1<<DEFAULT_RADIX)),
- (uint32)(0.764867778610703*(1<<DEFAULT_RADIX)),
- (uint32)(0.77148569218905*(1<<DEFAULT_RADIX)),
- (uint32)(0.778073386562917*(1<<DEFAULT_RADIX)),
- (uint32)(0.784631136458046*(1<<DEFAULT_RADIX)),
- (uint32)(0.791159212870769*(1<<DEFAULT_RADIX)),
- (uint32)(0.797657883135205*(1<<DEFAULT_RADIX)),
- (uint32)(0.804127410988954*(1<<DEFAULT_RADIX)),
- (uint32)(0.810568056637321*(1<<DEFAULT_RADIX)),
- (uint32)(0.816980076816112*(1<<DEFAULT_RADIX)),
- (uint32)(0.823363724853051*(1<<DEFAULT_RADIX)),
- (uint32)(0.829719250727828*(1<<DEFAULT_RADIX)),
- (uint32)(0.836046901130843*(1<<DEFAULT_RADIX)),
- (uint32)(0.84234691952066*(1<<DEFAULT_RADIX)),
- (uint32)(0.848619546180216*(1<<DEFAULT_RADIX)),
- (uint32)(0.854865018271815*(1<<DEFAULT_RADIX)),
- (uint32)(0.861083569890926*(1<<DEFAULT_RADIX)),
- (uint32)(0.867275432118842*(1<<DEFAULT_RADIX)),
- (uint32)(0.873440833074202*(1<<DEFAULT_RADIX)),
- (uint32)(0.879579997963421*(1<<DEFAULT_RADIX)),
- (uint32)(0.88569314913005*(1<<DEFAULT_RADIX)),
- (uint32)(0.891780506103101*(1<<DEFAULT_RADIX)),
- (uint32)(0.897842285644346*(1<<DEFAULT_RADIX)),
- (uint32)(0.903878701794633*(1<<DEFAULT_RADIX)),
- (uint32)(0.90988996591924*(1<<DEFAULT_RADIX)),
- (uint32)(0.915876286752278*(1<<DEFAULT_RADIX)),
- (uint32)(0.921837870440188*(1<<DEFAULT_RADIX)),
- (uint32)(0.927774920584334*(1<<DEFAULT_RADIX)),
- (uint32)(0.933687638282728*(1<<DEFAULT_RADIX)),
- (uint32)(0.939576222170905*(1<<DEFAULT_RADIX)),
- (uint32)(0.945440868461959*(1<<DEFAULT_RADIX)),
- (uint32)(0.951281770985776*(1<<DEFAULT_RADIX)),
- (uint32)(0.957099121227478*(1<<DEFAULT_RADIX)),
- (uint32)(0.962893108365084*(1<<DEFAULT_RADIX)),
- (uint32)(0.968663919306429*(1<<DEFAULT_RADIX)),
- (uint32)(0.974411738725344*(1<<DEFAULT_RADIX)),
- (uint32)(0.980136749097113*(1<<DEFAULT_RADIX)),
- (uint32)(0.985839130733238*(1<<DEFAULT_RADIX)),
- (uint32)(0.991519061815512*(1<<DEFAULT_RADIX)),
- (uint32)(0.997176718429429*(1<<DEFAULT_RADIX)),
- (uint32)(1.00281227459694*(1<<DEFAULT_RADIX)),
-};
-
-int32
-fixlog2(uint32 x)
-{
- uint32 y;
-
- if (x == 0)
- return MIN_FIXLOG2;
-
- /* Get the exponent. */
-#if ((defined(__ARM_ARCH_5__) || defined(__ARM_ARCH_5T__) || \
- defined(__ARM_ARCH_5TE__) || defined(__ARM_ARCH_7A__)) && !defined(__thumb__))
- __asm__("clz %0, %1\n": "=r"(y):"r"(x));
- x <<= y;
- y = 31 - y;
-#elif defined(__ppc__)
- __asm__("cntlzw %0, %1\n": "=r"(y):"r"(x));
- x <<= y;
- y = 31 - y;
-#elif __GNUC__ >= 4
- y = __builtin_clz(x);
- x <<= y;
- y = (31 - y);
-#else
- for (y = 31; y > 0; --y) {
- if (x & 0x80000000)
- break;
- x <<= 1;
- }
-#endif
- y <<= DEFAULT_RADIX;
- /* Do a table lookup for the MSB of the mantissa. */
- x = (x >> 24) & 0x7f;
- return y + logtable[x];
-}
-
-int
-fixlog(uint32 x)
-{
- int32 y;
- y = fixlog2(x);
- return FIXMUL(y, FIXLN_2);
-}
diff --git a/media/sphinxbase/src/libsphinxbase/fe/yin.c b/media/sphinxbase/src/libsphinxbase/fe/yin.c
deleted file mode 100644
index a63fb30a9..000000000
--- a/media/sphinxbase/src/libsphinxbase/fe/yin.c
+++ /dev/null
@@ -1,412 +0,0 @@
-/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */
-/*
- * Copyright (c) 2008 Beyond Access, Inc. All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * THIS SOFTWARE IS PROVIDED BY BEYOND ACCESS, INC. ``AS IS'' AND ANY
- * EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
- * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
- * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL BEYOND ACCESS, INC. NOR
- * ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
- * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
- * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
- * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
- * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
- * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
- * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- */
-
-/**
- * @file yin.c Implementation of pitch extraction.
- * @author David Huggins-Daines <dhuggins@cs.cmu.edu>
- */
-
-/* This implements part of the YIN algorithm:
- *
- * "YIN, a fundamental frequency estimator for speech and music".
- * Alain de Cheveigné and Hideki Kawahara. Journal of the Acoustical
- * Society of America, 111 (4), April 2002.
- */
-
-#include "sphinxbase/prim_type.h"
-#include "sphinxbase/ckd_alloc.h"
-#include "sphinxbase/fixpoint.h"
-
-#include "sphinxbase/yin.h"
-
-#include <stdio.h>
-#include <string.h>
-
-struct yin_s {
- uint16 frame_size; /** Size of analysis frame. */
-#ifndef FIXED_POINT
- float search_threshold; /**< Threshold for finding period */
- float search_range; /**< Range around best local estimate to search */
-#else
- uint16 search_threshold; /**< Threshold for finding period, in Q15 */
- uint16 search_range; /**< Range around best local estimate to search, in Q15 */
-#endif
- uint16 nfr; /**< Number of frames read so far. */
-
- unsigned char wsize; /**< Size of smoothing window. */
- unsigned char wstart; /**< First frame in window. */
- unsigned char wcur; /**< Current frame of analysis. */
- unsigned char endut; /**< Hoch Hech! Are we at the utterance end? */
-
-#ifndef FIXED_POINT
- float **diff_window; /**< Window of difference function outputs. */
-#else
- fixed32 **diff_window; /**< Window of difference function outputs. */
-#endif
- uint16 *period_window; /**< Window of best period estimates. */
- int16 *frame; /**< Storage for frame */
-};
-
-/**
- * The core of YIN: cumulative mean normalized difference function.
- */
-#ifndef FIXED_POINT
-static void
-cmn_diff(int16 const *signal, float *out_diff, int ndiff)
-{
- double cum;
- int t, j;
-
- cum = 0.0f;
- out_diff[0] = 1.0f;
-
- for (t = 1; t < ndiff; ++t) {
- float dd;
- dd = 0.0f;
- for (j = 0; j < ndiff; ++j) {
- int diff = signal[j] - signal[t + j];
- dd += (diff * diff);
- }
- cum += dd;
- out_diff[t] = (float)(dd * t / cum);
- }
-}
-#else
-static void
-cmn_diff(int16 const *signal, int32 *out_diff, int ndiff)
-{
- uint32 cum, cshift;
- int32 t, tscale;
-
- out_diff[0] = 32768;
- cum = 0;
- cshift = 0;
-
- /* Determine how many bits we can scale t up by below. */
- for (tscale = 0; tscale < 32; ++tscale)
- if (ndiff & (1<<(31-tscale)))
- break;
- --tscale; /* Avoid teh overflowz. */
- /* printf("tscale is %d (ndiff - 1) << tscale is %d\n",
- tscale, (ndiff-1) << tscale); */
-
- /* Somewhat elaborate block floating point implementation.
- * The fp implementation of this is really a lot simpler. */
- for (t = 1; t < ndiff; ++t) {
- uint32 dd, dshift, norm;
- int j;
-
- dd = 0;
- dshift = 0;
- for (j = 0; j < ndiff; ++j) {
- int diff = signal[j] - signal[t + j];
- /* Guard against overflows. */
- if (dd > (1UL<<tscale)) {
- dd >>= 1;
- ++dshift;
- }
- dd += (diff * diff) >> dshift;
- }
- /* Make sure the diffs and cum are shifted to the same
- * scaling factor (usually dshift will be zero) */
- if (dshift > cshift) {
- cum += dd << (dshift-cshift);
- }
- else {
- cum += dd >> (cshift-dshift);
- }
-
- /* Guard against overflows and also ensure that (t<<tscale) > cum. */
- while (cum > (1UL<<tscale)) {
- cum >>= 1;
- ++cshift;
- }
- /* Avoid divide-by-zero! */
- if (cum == 0) cum = 1;
- /* Calculate the normalizer in high precision. */
- norm = (t << tscale) / cum;
- /* Do a long multiply and shift down to Q15. */
- out_diff[t] = (int32)(((long long)dd * norm)
- >> (tscale - 15 + cshift - dshift));
- /* printf("dd %d cshift %d dshift %d scaledt %d cum %d norm %d cmn %d\n",
- dd, cshift, dshift, (t<<tscale), cum, norm, out_diff[t]); */
- }
-}
-#endif
-
-yin_t *
-yin_init(int frame_size, float search_threshold,
- float search_range, int smooth_window)
-{
- yin_t *pe;
-
- pe = ckd_calloc(1, sizeof(*pe));
- pe->frame_size = frame_size;
-#ifndef FIXED_POINT
- pe->search_threshold = search_threshold;
- pe->search_range = search_range;
-#else
- pe->search_threshold = (uint16)(search_threshold * 32768);
- pe->search_range = (uint16)(search_range * 32768);
-#endif
- pe->wsize = smooth_window * 2 + 1;
- pe->diff_window = ckd_calloc_2d(pe->wsize,
- pe->frame_size / 2,
- sizeof(**pe->diff_window));
- pe->period_window = ckd_calloc(pe->wsize,
- sizeof(*pe->period_window));
- pe->frame = ckd_calloc(pe->frame_size, sizeof(*pe->frame));
- return pe;
-}
-
-void
-yin_free(yin_t *pe)
-{
- ckd_free_2d(pe->diff_window);
- ckd_free(pe->period_window);
- ckd_free(pe);
-}
-
-void
-yin_start(yin_t *pe)
-{
- /* Reset the circular window pointers. */
- pe->wstart = pe->endut = 0;
- pe->nfr = 0;
-}
-
-void
-yin_end(yin_t *pe)
-{
- pe->endut = 1;
-}
-
-int
-#ifndef FIXED_POINT
-thresholded_search(float *diff_window, float threshold, int start, int end)
-#else
-thresholded_search(int32 *diff_window, fixed32 threshold, int start, int end)
-#endif
-{
- int i, argmin;
-#ifndef FIXED_POINT
- float min;
-#else
- int min;
-#endif
-
- min = diff_window[start];
- argmin = start;
- for (i = start + 1; i < end; ++i) {
-#ifndef FIXED_POINT
- float diff = diff_window[i];
-#else
- int diff = diff_window[i];
-#endif
-
- if (diff < threshold) {
- min = diff;
- argmin = i;
- break;
- }
- if (diff < min) {
- min = diff;
- argmin = i;
- }
- }
- return argmin;
-}
-
-void
-yin_store(yin_t *pe, int16 const *frame)
-{
- memcpy(pe->frame, frame, pe->frame_size * sizeof(*pe->frame));
-}
-
-void
-yin_write(yin_t *pe, int16 const *frame)
-{
- int outptr, difflen;
-
- /* Rotate the window one frame forward. */
- ++pe->wstart;
- /* Fill in the frame before wstart. */
- outptr = pe->wstart - 1;
- /* Wrap around the window pointer. */
- if (pe->wstart == pe->wsize)
- pe->wstart = 0;
-
- /* Now calculate normalized difference function. */
- difflen = pe->frame_size / 2;
- cmn_diff(frame, pe->diff_window[outptr], difflen);
-
- /* Find the first point under threshold. If not found, then
- * use the absolute minimum. */
- pe->period_window[outptr]
- = thresholded_search(pe->diff_window[outptr],
- pe->search_threshold, 0, difflen);
-
- /* Increment total number of frames. */
- ++pe->nfr;
-}
-
-void
-yin_write_stored(yin_t *pe)
-{
- yin_write(pe, pe->frame);
-}
-
-int
-yin_read(yin_t *pe, uint16 *out_period, float *out_bestdiff)
-{
- int wstart, wlen, half_wsize, i;
- int best, search_width, low_period, high_period;
-#ifndef FIXED_POINT
- float best_diff;
-#else
- int best_diff;
-#endif
-
- half_wsize = (pe->wsize-1)/2;
- /* Without any smoothing, just return the current value (don't
- * need to do anything to the current poitner either). */
- if (half_wsize == 0) {
- if (pe->endut)
- return 0;
- *out_period = pe->period_window[0];
-#ifndef FIXED_POINT
- *out_bestdiff = pe->diff_window[0][pe->period_window[0]];
-#else
- *out_bestdiff = pe->diff_window[0][pe->period_window[0]] / 32768.0f;
-#endif
- return 1;
- }
-
- /* We can't do anything unless we have at least (wsize-1)/2 + 1
- * frames, unless we're at the end of the utterance. */
- if (pe->endut == 0 && pe->nfr < half_wsize + 1) {
- /* Don't increment the current pointer either. */
- return 0;
- }
-
- /* Establish the smoothing window. */
- /* End of utterance. */
- if (pe->endut) {
- /* We are done (no more data) when pe->wcur = pe->wstart. */
- if (pe->wcur == pe->wstart)
- return 0;
- /* I.e. pe->wcur (circular minus) half_wsize. */
- wstart = (pe->wcur + pe->wsize - half_wsize) % pe->wsize;
- /* Number of frames from wstart up to pe->wstart. */
- wlen = pe->wstart - wstart;
- if (wlen < 0) wlen += pe->wsize;
- /*printf("ENDUT! ");*/
- }
- /* Beginning of utterance. */
- else if (pe->nfr < pe->wsize) {
- wstart = 0;
- wlen = pe->nfr;
- }
- /* Normal case, it is what it is. */
- else {
- wstart = pe->wstart;
- wlen = pe->wsize;
- }
-
- /* Now (finally) look for the best local estimate. */
- /* printf("Searching for local estimate in %d frames around %d\n",
- wlen, pe->nfr + 1 - wlen); */
- best = pe->period_window[pe->wcur];
- best_diff = pe->diff_window[pe->wcur][best];
- for (i = 0; i < wlen; ++i) {
- int j = wstart + i;
-#ifndef FIXED_POINT
- float diff;
-#else
- int diff;
-#endif
-
- j %= pe->wsize;
- diff = pe->diff_window[j][pe->period_window[j]];
- /* printf("%.2f,%.2f ", 1.0 - (double)diff/32768,
- pe->period_window[j] ? 8000.0/pe->period_window[j] : 8000.0); */
- if (diff < best_diff) {
- best_diff = diff;
- best = pe->period_window[j];
- }
- }
- /* printf("best: %.2f, %.2f\n", 1.0 - (double)best_diff/32768,
- best ? 8000.0/best : 8000.0); */
- /* If it's the same as the current one then return it. */
- if (best == pe->period_window[pe->wcur]) {
- /* Increment the current pointer. */
- if (++pe->wcur == pe->wsize)
- pe->wcur = 0;
- *out_period = best;
-#ifndef FIXED_POINT
- *out_bestdiff = best_diff;
-#else
- *out_bestdiff = best_diff / 32768.0f;
-#endif
- return 1;
- }
- /* Otherwise, redo the search inside a narrower range. */
-#ifndef FIXED_POINT
- search_width = (int)(best * pe->search_range);
-#else
- search_width = best * pe->search_range / 32768;
-#endif
- /* printf("Search width = %d * %.2f = %d\n",
- best, (double)pe->search_range/32768, search_width); */
- if (search_width == 0) search_width = 1;
- low_period = best - search_width;
- high_period = best + search_width;
- if (low_period < 0) low_period = 0;
- if (high_period > pe->frame_size / 2) high_period = pe->frame_size / 2;
- /* printf("Searching from %d to %d\n", low_period, high_period); */
- best = thresholded_search(pe->diff_window[pe->wcur],
- pe->search_threshold,
- low_period, high_period);
- best_diff = pe->diff_window[pe->wcur][best];
-
- if (out_period)
- *out_period = (best > 65535) ? 65535 : best;
- if (out_bestdiff) {
-#ifndef FIXED_POINT
- *out_bestdiff = (best_diff > 1.0f) ? 1.0f : best_diff;
-#else
- *out_bestdiff = (best_diff > 32768) ? 1.0f : best_diff / 32768.0f;
-#endif
- }
-
- /* Increment the current pointer. */
- if (++pe->wcur == pe->wsize)
- pe->wcur = 0;
- return 1;
-}