<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> <html xmlns="http://www.w3.org/1999/xhtml"> <head> <meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/> <title>SphinxBase: src/libsphinxbase/feat/lda.c Source File</title> <link href="tabs.css" rel="stylesheet" type="text/css"/> <link href="navtree.css" rel="stylesheet" type="text/css"/> <script type="text/javascript" src="jquery.js"></script> <script type="text/javascript" src="navtree.js"></script> <script type="text/javascript" src="resize.js"></script> <script type="text/javascript"> $(document).ready(initResizable); </script> <link href="doxygen.css" rel="stylesheet" type="text/css"/> </head> <body> <!-- Generated by Doxygen 1.7.3 --> <div id="top"> <div id="titlearea"> <table cellspacing="0" cellpadding="0"> <tbody> <tr style="height: 56px;"> <td style="padding-left: 0.5em;"> <div id="projectname">SphinxBase <span id="projectnumber">0.6</span></div> </td> </tr> </tbody> </table> </div> <div id="navrow1" class="tabs"> <ul class="tablist"> <li><a href="index.html"><span>Main Page</span></a></li> <li><a href="pages.html"><span>Related Pages</span></a></li> <li><a href="annotated.html"><span>Data Structures</span></a></li> <li class="current"><a href="files.html"><span>Files</span></a></li> </ul> </div> <div id="navrow2" class="tabs2"> <ul class="tablist"> <li><a href="files.html"><span>File List</span></a></li> <li><a href="globals.html"><span>Globals</span></a></li> </ul> </div> </div> <div id="side-nav" class="ui-resizable side-nav-resizable"> <div id="nav-tree"> <div id="nav-tree-contents"> </div> </div> <div id="splitbar" style="-moz-user-select:none;" class="ui-resizable-handle"> </div> </div> <script type="text/javascript"> initNavTree('lda_8c.html',''); </script> <div id="doc-content"> <div class="header"> <div class="headertitle"> <h1>src/libsphinxbase/feat/lda.c</h1> </div> </div> <div class="contents"> <div 
class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">/* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */</span> <a name="l00002"></a>00002 <span class="comment">/* ====================================================================</span> <a name="l00003"></a>00003 <span class="comment"> * Copyright (c) 2006 Carnegie Mellon University. All rights</span> <a name="l00004"></a>00004 <span class="comment"> * reserved.</span> <a name="l00005"></a>00005 <span class="comment"> *</span> <a name="l00006"></a>00006 <span class="comment"> * Redistribution and use in source and binary forms, with or without</span> <a name="l00007"></a>00007 <span class="comment"> * modification, are permitted provided that the following conditions</span> <a name="l00008"></a>00008 <span class="comment"> * are met:</span> <a name="l00009"></a>00009 <span class="comment"> *</span> <a name="l00010"></a>00010 <span class="comment"> * 1. Redistributions of source code must retain the above copyright</span> <a name="l00011"></a>00011 <span class="comment"> * notice, this list of conditions and the following disclaimer. </span> <a name="l00012"></a>00012 <span class="comment"> *</span> <a name="l00013"></a>00013 <span class="comment"> * 2. 
Redistributions in binary form must reproduce the above copyright</span> <a name="l00014"></a>00014 <span class="comment"> * notice, this list of conditions and the following disclaimer in</span> <a name="l00015"></a>00015 <span class="comment"> * the documentation and/or other materials provided with the</span> <a name="l00016"></a>00016 <span class="comment"> * distribution.</span> <a name="l00017"></a>00017 <span class="comment"> *</span> <a name="l00018"></a>00018 <span class="comment"> * This work was supported in part by funding from the Defense Advanced </span> <a name="l00019"></a>00019 <span class="comment"> * Research Projects Agency and the National Science Foundation of the </span> <a name="l00020"></a>00020 <span class="comment"> * United States of America, and the CMU Sphinx Speech Consortium.</span> <a name="l00021"></a>00021 <span class="comment"> *</span> <a name="l00022"></a>00022 <span class="comment"> * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND </span> <a name="l00023"></a>00023 <span class="comment"> * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, </span> <a name="l00024"></a>00024 <span class="comment"> * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR</span> <a name="l00025"></a>00025 <span class="comment"> * PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY</span> <a name="l00026"></a>00026 <span class="comment"> * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,</span> <a name="l00027"></a>00027 <span class="comment"> * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT </span> <a name="l00028"></a>00028 <span class="comment"> * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, </span> <a name="l00029"></a>00029 <span class="comment"> * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY </span> <a name="l00030"></a>00030 <span class="comment"> * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT </span> <a name="l00031"></a>00031 <span class="comment"> * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE </span> <a name="l00032"></a>00032 <span class="comment"> * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.</span> <a name="l00033"></a>00033 <span class="comment"> *</span> <a name="l00034"></a>00034 <span class="comment"> * ====================================================================</span> <a name="l00035"></a>00035 <span class="comment"> *</span> <a name="l00036"></a>00036 <span class="comment"> */</span> <a name="l00037"></a>00037 <span class="comment">/*</span> <a name="l00038"></a>00038 <span class="comment"> * lda.c -- Read and apply LDA matrices to features.</span> <a name="l00039"></a>00039 <span class="comment"> *</span> <a name="l00040"></a>00040 <span class="comment"> * Author: David Huggins-Daines &lt;dhuggins@cs.cmu.edu&gt;</span> <a name="l00041"></a>00041 <span class="comment"> */</span> <a name="l00042"></a>00042 <a name="l00043"></a>00043 <span class="preprocessor">#include &lt;assert.h&gt;</span> <a name="l00044"></a>00044 <span class="preprocessor">#include &lt;string.h&gt;</span> <a name="l00045"></a>00045 <span class="preprocessor">#ifdef HAVE_CONFIG_H</span> <a name="l00046"></a>00046 <span class="preprocessor"></span><span 
class="preprocessor">#include &lt;config.h&gt;</span> <a name="l00047"></a>00047 <span class="preprocessor">#endif</span> <a name="l00048"></a>00048 <span class="preprocessor"></span> <a name="l00049"></a>00049 <span class="preprocessor">#ifdef _MSC_VER</span> <a name="l00050"></a>00050 <span class="preprocessor"></span><span class="preprocessor">#pragma warning (disable: 4018)</span> <a name="l00051"></a>00051 <span class="preprocessor"></span><span class="preprocessor">#endif</span> <a name="l00052"></a>00052 <span class="preprocessor"></span> <a name="l00053"></a>00053 <span class="preprocessor">#include "sphinxbase/feat.h"</span> <a name="l00054"></a>00054 <span class="preprocessor">#include "sphinxbase/ckd_alloc.h"</span> <a name="l00055"></a>00055 <span class="preprocessor">#include "sphinxbase/bio.h"</span> <a name="l00056"></a>00056 <span class="preprocessor">#include "sphinxbase/err.h"</span> <a name="l00057"></a>00057 <a name="l00058"></a>00058 <span class="preprocessor">#define MATRIX_FILE_VERSION "0.1"</span> <a name="l00059"></a>00059 <span class="preprocessor"></span> <a name="l00060"></a>00060 int32 <a name="l00061"></a><a class="code" href="feat_8h.html#a7639fbc34e3328d7e3259e61372c64b8">00061</a> <a class="code" href="feat_8h.html#a7639fbc34e3328d7e3259e61372c64b8" title="Add an LDA transformation to the feature module from a file.">feat_read_lda</a>(<a class="code" href="structfeat__t.html" title="Structure for describing a speech feature type Structure for describing a speech feature type (no...">feat_t</a> *feat, <span class="keyword">const</span> <span class="keywordtype">char</span> *ldafile, int32 dim) <a name="l00062"></a>00062 { <a name="l00063"></a>00063 FILE *fh; <a name="l00064"></a>00064 int32 byteswap, chksum_present; <a name="l00065"></a>00065 uint32 chksum, i, m, n; <a name="l00066"></a>00066 <span class="keywordtype">char</span> **argname, **argval; <a name="l00067"></a>00067 <a name="l00068"></a>00068 assert(feat); <a 
name="l00069"></a>00069 <span class="keywordflow">if</span> (feat-&gt;n_stream != 1) { <a name="l00070"></a>00070 <a class="code" href="err_8h.html#a5f7b2f58f5a663a6bdd51f197ae21993" title="Print error message to standard error stream.">E_ERROR</a>(<span class="stringliteral">"LDA incompatible with multi-stream features (n_stream = %d)\n"</span>, <a name="l00071"></a>00071 feat-&gt;n_stream); <a name="l00072"></a>00072 <span class="keywordflow">return</span> -1; <a name="l00073"></a>00073 } <a name="l00074"></a>00074 <a name="l00075"></a>00075 <span class="keywordflow">if</span> ((fh = fopen(ldafile, <span class="stringliteral">"rb"</span>)) == NULL) { <a name="l00076"></a>00076 <a class="code" href="err_8h.html#a54ffbfe898d74595c586a1f48f32ef03" title="Print error text; Call perror(&quot;&quot;);.">E_ERROR_SYSTEM</a>(<span class="stringliteral">"Failed to open transform file '%s' for reading: %s\n"</span>, ldafile, strerror(errno)); <a name="l00077"></a>00077 <span class="keywordflow">return</span> -1; <a name="l00078"></a>00078 } <a name="l00079"></a>00079 <a name="l00080"></a>00080 <span class="keywordflow">if</span> (<a class="code" href="bio_8h.html#a7a155ff51740f1d9a31f7bb7b6e4bc3a" title="Read binary file format header: has the following format.">bio_readhdr</a>(fh, &amp;argname, &amp;argval, &amp;byteswap) &lt; 0) { <a name="l00081"></a>00081 <a class="code" href="err_8h.html#a5f7b2f58f5a663a6bdd51f197ae21993" title="Print error message to standard error stream.">E_ERROR</a>(<span class="stringliteral">"Failed to read header from transform file '%s'\n"</span>, ldafile); <a name="l00082"></a>00082 fclose(fh); <a name="l00083"></a>00083 <span class="keywordflow">return</span> -1; <a name="l00084"></a>00084 } <a name="l00085"></a>00085 <a name="l00086"></a>00086 chksum_present = 0; <a name="l00087"></a>00087 <span class="keywordflow">for</span> (i = 0; argname[i]; i++) { <a name="l00088"></a>00088 <span class="keywordflow">if</span> (strcmp(argname[i], <span 
class="stringliteral">"version"</span>) == 0) { <a name="l00089"></a>00089 <span class="keywordflow">if</span> (strcmp(argval[i], MATRIX_FILE_VERSION) != 0) <a name="l00090"></a>00090 <a class="code" href="err_8h.html#a6a794bec721b555ac1f2167f9e12f662" title="Print warning information to standard error stream.">E_WARN</a>(<span class="stringliteral">"%s: Version mismatch: %s, expecting %s\n"</span>, <a name="l00091"></a>00091 ldafile, argval[i], MATRIX_FILE_VERSION); <a name="l00092"></a>00092 } <a name="l00093"></a>00093 <span class="keywordflow">else</span> <span class="keywordflow">if</span> (strcmp(argname[i], <span class="stringliteral">"chksum0"</span>) == 0) { <a name="l00094"></a>00094 chksum_present = 1; <span class="comment">/* Ignore the associated value */</span> <a name="l00095"></a>00095 } <a name="l00096"></a>00096 } <a name="l00097"></a>00097 <a name="l00098"></a>00098 <a class="code" href="bio_8h.html#adb3c858a50381aeff022ccd4271af2d9" title="Free name and value strings previously allocated and returned by bio_readhdr.">bio_hdrarg_free</a>(argname, argval); <a name="l00099"></a>00099 argname = argval = NULL; <a name="l00100"></a>00100 <a name="l00101"></a>00101 chksum = 0; <a name="l00102"></a>00102 <a name="l00103"></a>00103 <span class="keywordflow">if</span> (feat->lda) <a name="l00104"></a>00104 <a class="code" href="ckd__alloc_8h.html#a443accde4663a4a07c6d147088614d57" title="Free a 3-D array (ptr) previously allocated by ckd_calloc_3d.">ckd_free_3d</a>((<span class="keywordtype">void</span> ***)feat->lda); <a name="l00105"></a>00105 <a name="l00106"></a>00106 { <a name="l00107"></a>00107 <span class="comment">/* Use a temporary variable to avoid strict-aliasing problems. 
*/</span> <a name="l00108"></a>00108 <span class="keywordtype">void</span> ***outlda; <a name="l00109"></a>00109 <a name="l00110"></a>00110 <span class="keywordflow">if</span> (<a class="code" href="bio_8h.html#aca6a6b71d02b9e5ca6b136a28640e0c1" title="Read a 3-d array (set of matrices)">bio_fread_3d</a>(&amp;outlda, <span class="keyword">sizeof</span>(float32), <a name="l00111"></a>00111 &amp;feat-&gt;n_lda, &amp;m, &amp;n, <a name="l00112"></a>00112 fh, byteswap, &amp;chksum) &lt; 0) { <a name="l00113"></a>00113 <a class="code" href="err_8h.html#a54ffbfe898d74595c586a1f48f32ef03" title="Print error text; Call perror(&quot;&quot;);.">E_ERROR_SYSTEM</a>(<span class="stringliteral">"%s: bio_fread_3d(lda) failed\n"</span>, ldafile); <a name="l00114"></a>00114 fclose(fh); <a name="l00115"></a>00115 <span class="keywordflow">return</span> -1; <a name="l00116"></a>00116 } <a name="l00117"></a>00117 feat-&gt;lda = (<span class="keywordtype">void</span> *)outlda; <a name="l00118"></a>00118 } <a name="l00119"></a>00119 fclose(fh); <a name="l00120"></a>00120 <a name="l00121"></a>00121 <span class="preprocessor">#ifdef FIXED_POINT</span> <a name="l00122"></a>00122 <span class="preprocessor"></span> <span class="comment">/* FIXME: This is a fragile hack that depends on mfcc_t and</span> <a name="l00123"></a>00123 <span class="comment"> * float32 being the same size (which they are, but...) */</span> <a name="l00124"></a>00124 <span class="keywordflow">for</span> (i = 0; i &lt; feat-&gt;n_lda * m * n; ++i) { <a name="l00125"></a>00125 feat-&gt;lda[0][0][i] = FLOAT2MFCC(((<span class="keywordtype">float</span> *)feat-&gt;lda[0][0])[i]); <a name="l00126"></a>00126 } <a name="l00127"></a>00127 <span class="preprocessor">#endif</span> <a name="l00128"></a>00128 <span class="preprocessor"></span> <a name="l00129"></a>00129 <span class="comment">/* Note that SphinxTrain stores the eigenvectors as row vectors. 
*/</span> <a name="l00130"></a>00130 <span class="keywordflow">if</span> (n != feat-&gt;stream_len[0]) <a name="l00131"></a>00131 <a class="code" href="err_8h.html#a1a4495946ab2449d61108fe829a94613" title="Exit with non-zero status after error message.">E_FATAL</a>(<span class="stringliteral">"LDA matrix dimension %d doesn't match feature stream size %d\n"</span>, n, feat-&gt;stream_len[0]); <a name="l00132"></a>00132 <a name="l00133"></a>00133 <span class="comment">/* Override dim from file if it is 0 or greater than m. */</span> <a name="l00134"></a>00134 <span class="keywordflow">if</span> (dim &gt; m || dim &lt;= 0) { <a name="l00135"></a>00135 dim = m; <a name="l00136"></a>00136 } <a name="l00137"></a>00137 feat-&gt;out_dim = dim; <a name="l00138"></a>00138 <a name="l00139"></a>00139 <span class="keywordflow">return</span> 0; <a name="l00140"></a>00140 } <a name="l00141"></a>00141 <a name="l00142"></a>00142 <span class="keywordtype">void</span> <a name="l00143"></a><a class="code" href="feat_8h.html#a7452702cb435ea9244c7e1f61bbf5da1">00143</a> <a class="code" href="feat_8h.html#a7452702cb435ea9244c7e1f61bbf5da1" title="Transform a block of features using the feature module&#39;s LDA transform.">feat_lda_transform</a>(<a class="code" href="structfeat__t.html" title="Structure for describing a speech feature type Structure for describing a speech feature type (no...">feat_t</a> *fcb, mfcc_t ***inout_feat, uint32 nfr) <a name="l00144"></a>00144 { <a name="l00145"></a>00145 mfcc_t *tmp; <a name="l00146"></a>00146 uint32 i, j, k; <a name="l00147"></a>00147 <a name="l00148"></a>00148 tmp = <a class="code" href="ckd__alloc_8h.html#aa00ef21903bc4f8a972488417adc8d2e" title="Macros to simplify the use of above functions.">ckd_calloc</a>(fcb-&gt;stream_len[0], <span class="keyword">sizeof</span>(mfcc_t)); <a name="l00149"></a>00149 <span class="keywordflow">for</span> (i = 0; i &lt; nfr; ++i) { <a name="l00150"></a>00150 <span class="comment">/* Do the matrix multiplication inline here since 
fcb-&gt;lda</span> <a name="l00151"></a>00151 <span class="comment"> * is transposed (eigenvectors in rows not columns). */</span> <a name="l00152"></a>00152 <span class="comment">/* FIXME: In the future we ought to use the BLAS. */</span> <a name="l00153"></a>00153 memset(tmp, 0, <span class="keyword">sizeof</span>(mfcc_t) * fcb-&gt;stream_len[0]); <a name="l00154"></a>00154 <span class="keywordflow">for</span> (j = 0; j &lt; <a class="code" href="feat_8h.html#a66dc16aeea4307bf36ec4e08e05d0c7c" title="Total dimensionality of feature output.">feat_dimension</a>(fcb); ++j) { <a name="l00155"></a>00155 <span class="keywordflow">for</span> (k = 0; k &lt; fcb-&gt;stream_len[0]; ++k) { <a name="l00156"></a>00156 tmp[j] += MFCCMUL(inout_feat[i][0][k], fcb-&gt;lda[0][j][k]); <a name="l00157"></a>00157 } <a name="l00158"></a>00158 } <a name="l00159"></a>00159 memcpy(inout_feat[i][0], tmp, fcb-&gt;stream_len[0] * <span class="keyword">sizeof</span>(mfcc_t)); <a name="l00160"></a>00160 } <a name="l00161"></a>00161 <a class="code" href="ckd__alloc_8h.html#a31c6b405558620ac37599737b5722fbf" title="Test and free a 1-D array.">ckd_free</a>(tmp); <a name="l00162"></a>00162 } </pre></div></div> </div> <div id="nav-path" class="navpath"> <ul> <li class="navelem"><b>lda.c</b> </li> <li class="footer">Generated on Tue Apr 19 2011 for SphinxBase by&#160; <a href="http://www.doxygen.org/index.html"> <img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.7.3 </li> </ul> </div> </body> </html>