<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" lang="en" xml:lang="en">
<head>
<!--
  Doxygen 1.8.3 source-listing page for volk_32fc_32f_dot_prod_32fc_a.h
  (GNU Radio 3.6.4.1 C++ API).
  The listing below is display text: the characters "less than", "greater than"
  and "ampersand" inside it are written as character references so that C
  operators and #include brackets are shown instead of being parsed as markup.
-->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.3"/>
<title>GNU Radio 3.6.4.1 C++ API: volk_32fc_32f_dot_prod_32fc_a.h Source File</title>
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="navtree.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="resize.js"></script>
<script type="text/javascript" src="navtree.js"></script>
<!-- initResizable and resizeHeight are not defined in this page; presumably provided by resize.js (confirm). -->
<script type="text/javascript">
  $(document).ready(initResizable);
  $(window).load(resizeHeight);
</script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<!-- Page header: project title banner. -->
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
 <tbody>
 <tr style="height: 56px;">
  <td style="padding-left: 0.5em;">
   <div id="projectname">GNU Radio 3.6.4.1 C++ API </div>
  </td>
 </tr>
 </tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.3 -->
</div><!-- top -->
<!-- Side navigation tree container; it is empty here and is set up by the initNavTree call below. -->
<div id="side-nav" class="ui-resizable side-nav-resizable">
  <div id="nav-tree">
    <div id="nav-tree-contents">
      <div id="nav-sync" class="sync"></div>
    </div>
  </div>
  <div id="splitbar" style="-moz-user-select:none;" class="ui-resizable-handle"> </div>
</div>
<!-- initNavTree is not defined in this page; presumably provided by navtree.js (confirm). -->
<script type="text/javascript">
  $(document).ready(function(){initNavTree('volk__32fc__32f__dot__prod__32fc__a_8h_source.html','');});
</script>
<!-- Main content: page title followed by the numbered, syntax-highlighted source listing. -->
<div id="doc-content">
<div class="header">
  <div class="headertitle">
<div class="title">volk_32fc_32f_dot_prod_32fc_a.h</div>
  </div>
</div><!--header-->
<div class="contents">
<a href="volk__32fc__32f__dot__prod__32fc__a_8h.html">Go to the documentation of this file.</a>
<!-- One div.line per source line; each carries a named anchor lNNNNN. Keep the content of every div.line on a single line. -->
<div class="fragment">
<div class="line"><a name="l00001"></a><span class="lineno"> 1</span> <span class="preprocessor">#ifndef INCLUDED_volk_32fc_32f_dot_prod_32fc_a_H</span></div>
<div class="line"><a name="l00002"></a><span class="lineno"> 2</span> <span class="preprocessor"></span><span class="preprocessor">#define INCLUDED_volk_32fc_32f_dot_prod_32fc_a_H</span></div>
<div class="line"><a name="l00003"></a><span class="lineno"> 3</span> <span class="preprocessor"></span></div>
<div class="line"><a name="l00004"></a><span class="lineno"> 4</span> <span class="preprocessor">#include &lt;<a class="code" href="volk__common_8h.html">volk/volk_common.h</a>&gt;</span></div>
<div class="line"><a name="l00005"></a><span class="lineno"> 5</span> <span class="preprocessor">#include&lt;stdio.h&gt;</span></div>
<div class="line"><a name="l00006"></a><span class="lineno"> 6</span> </div>
<div class="line"><a name="l00007"></a><span class="lineno"> 7</span> </div>
<div class="line"><a name="l00008"></a><span class="lineno"> 8</span> <span class="preprocessor">#ifdef LV_HAVE_GENERIC</span></div>
<div class="line"><a name="l00009"></a><span class="lineno"> 9</span> <span class="preprocessor"></span></div>
<div class="line"><a name="l00010"></a><span class="lineno"> 10</span> </div>
<div class="line"><a name="l00011"></a><span class="lineno"> 11</span> <span class="keyword">static</span> <span class="keyword">inline</span> <span class="keywordtype">void</span> volk_32fc_32f_dot_prod_32fc_a_generic(<a class="code" href="volk__complex_8h.html#ace50e1c8ef539cdeee04bc86f0e99169">lv_32fc_t</a>* result, <span class="keyword">const</span> <a class="code" href="volk__complex_8h.html#ace50e1c8ef539cdeee04bc86f0e99169">lv_32fc_t</a>* input, <span class="keyword">const</span> <span class="keywordtype">float</span> * <a class="code" href="gnuradio-core_2src_2lib_2filter_2interpolator__taps_8h.html#a30bf032e13c2a9fc4a98e14e390cd65a">taps</a>, <span class="keywordtype">unsigned</span> <span class="keywordtype">int</span> num_points) {</div>
<div class="line"><a name="l00012"></a><span class="lineno"> 12</span> </div>
<div class="line"><a name="l00013"></a><span class="lineno"> 13</span>  <span class="keywordtype">float</span> res[2];</div>
<div class="line"><a name="l00014"></a><span class="lineno"> 14</span>  <span class="keywordtype">float</span> *realpt = &amp;res[0], *imagpt = &amp;res[1];</div>
<div class="line"><a name="l00015"></a><span class="lineno"> 15</span>  <span class="keyword">const</span> <span class="keywordtype">float</span>* aPtr = (<span class="keywordtype">float</span>*)input;</div>
<div class="line"><a name="l00016"></a><span class="lineno"> 16</span>  <span class="keyword">const</span> <span class="keywordtype">float</span>* bPtr= <a class="code" href="gnuradio-core_2src_2lib_2filter_2interpolator__taps_8h.html#a30bf032e13c2a9fc4a98e14e390cd65a">taps</a>;</div>
<div class="line"><a name="l00017"></a><span class="lineno"> 17</span>  <span class="keywordtype">unsigned</span> <span class="keywordtype">int</span> number = 0;</div>
<div class="line"><a name="l00018"></a><span class="lineno"> 18</span> </div>
<div class="line"><a name="l00019"></a><span class="lineno"> 19</span>  *realpt = 0;</div>
<div class="line"><a name="l00020"></a><span class="lineno"> 20</span>  *imagpt = 0;</div>
<div class="line"><a name="l00021"></a><span class="lineno"> 21</span> </div>
<div class="line"><a name="l00022"></a><span class="lineno"> 22</span>  <span class="keywordflow">for</span>(number = 0; number &lt; num_points; number++){</div>
<div class="line"><a name="l00023"></a><span class="lineno"> 23</span>  *realpt += ((*aPtr++) * (*bPtr));</div>
<div class="line"><a name="l00024"></a><span class="lineno"> 24</span>  *imagpt += ((*aPtr++) * (*bPtr++));</div>
<div class="line"><a name="l00025"></a><span class="lineno"> 25</span>  }</div>
<div class="line"><a name="l00026"></a><span class="lineno"> 26</span> </div>
<div class="line"><a name="l00027"></a><span class="lineno"> 27</span>  *result = *(<a class="code" href="volk__complex_8h.html#ace50e1c8ef539cdeee04bc86f0e99169">lv_32fc_t</a>*)(&amp;res[0]);</div>
<div class="line"><a name="l00028"></a><span class="lineno"> 28</span> }</div>
<div class="line"><a name="l00029"></a><span class="lineno"> 29</span> </div>
<div class="line"><a name="l00030"></a><span class="lineno"> 30</span> <span class="preprocessor">#endif </span><span class="comment">/*LV_HAVE_GENERIC*/</span><span class="preprocessor"></span></div>
<div class="line"><a name="l00031"></a><span class="lineno"> 31</span> <span class="preprocessor"></span></div>
<div class="line"><a name="l00032"></a><span class="lineno"> 32</span> </div>
<div class="line"><a name="l00033"></a><span class="lineno"> 33</span> <span class="preprocessor">#ifdef LV_HAVE_SSE</span></div>
<div class="line"><a name="l00034"></a><span class="lineno"> 34</span> <span class="preprocessor"></span></div>
<div class="line"><a name="l00035"></a><span class="lineno"> 35</span> </div>
<div class="line"><a name="l00036"></a><span class="lineno"> 36</span> <span class="keyword">static</span> <span class="keyword">inline</span> <span class="keywordtype">void</span> volk_32fc_32f_dot_prod_32fc_a_sse( <a class="code" href="volk__complex_8h.html#ace50e1c8ef539cdeee04bc86f0e99169">lv_32fc_t</a>* result, <span class="keyword">const</span> <a class="code" href="volk__complex_8h.html#ace50e1c8ef539cdeee04bc86f0e99169">lv_32fc_t</a>* input, <span class="keyword">const</span> <span class="keywordtype">float</span>* taps, <span class="keywordtype">unsigned</span> <span class="keywordtype">int</span> num_points) {</div>
<div class="line"><a name="l00037"></a><span class="lineno"> 37</span> </div>
<div class="line"><a name="l00038"></a><span class="lineno"> 38</span>  <span class="keywordtype">unsigned</span> <span class="keywordtype">int</span> number = 0;</div>
<div class="line"><a name="l00039"></a><span class="lineno"> 39</span>  <span class="keyword">const</span> <span class="keywordtype">unsigned</span> <span class="keywordtype">int</span> sixteenthPoints = num_points / 8;</div>
<div class="line"><a name="l00040"></a><span class="lineno"> 40</span> </div>
<div class="line"><a name="l00041"></a><span class="lineno"> 41</span>  <span class="keywordtype">float</span> res[2];</div>
<div class="line"><a name="l00042"></a><span class="lineno"> 42</span>  <span class="keywordtype">float</span> *realpt = &amp;res[0], *imagpt = &amp;res[1];</div>
<div class="line"><a name="l00043"></a><span class="lineno"> 43</span>  <span class="keyword">const</span> <span class="keywordtype">float</span>* aPtr = (<span class="keywordtype">float</span>*)input;</div>
<div class="line"><a name="l00044"></a><span class="lineno"> 44</span>  <span class="keyword">const</span> <span class="keywordtype">float</span>* bPtr = <a class="code" href="gnuradio-core_2src_2lib_2filter_2interpolator__taps_8h.html#a30bf032e13c2a9fc4a98e14e390cd65a">taps</a>;</div>
<div class="line"><a name="l00045"></a><span class="lineno"> 45</span> </div>
<div class="line"><a name="l00046"></a><span class="lineno"> 46</span>  __m128 a0Val, a1Val, a2Val, a3Val;</div>
<div class="line"><a name="l00047"></a><span class="lineno"> 47</span>  __m128 b0Val, b1Val, b2Val, b3Val;</div>
<div class="line"><a name="l00048"></a><span class="lineno"> 48</span>  __m128 x0Val, x1Val, x2Val, x3Val;</div>
<div class="line"><a name="l00049"></a><span class="lineno"> 49</span>  __m128 c0Val, c1Val, c2Val, c3Val;</div>
<div class="line"><a name="l00050"></a><span class="lineno"> 50</span> </div>
<div class="line"><a name="l00051"></a><span class="lineno"> 51</span>  __m128 dotProdVal0 = _mm_setzero_ps();</div>
<div class="line"><a name="l00052"></a><span class="lineno"> 52</span>  __m128 dotProdVal1 = _mm_setzero_ps();</div>
<div class="line"><a name="l00053"></a><span class="lineno"> 53</span>  __m128 dotProdVal2 = _mm_setzero_ps();</div>
<div class="line"><a name="l00054"></a><span class="lineno"> 54</span>  __m128 dotProdVal3 = _mm_setzero_ps();</div>
<div class="line"><a name="l00055"></a><span class="lineno"> 55</span> </div>
<div class="line"><a name="l00056"></a><span class="lineno"> 56</span>  <span class="keywordflow">for</span>(;number &lt; sixteenthPoints; number++){</div>
<div class="line"><a name="l00057"></a><span class="lineno"> 57</span> </div>
<div class="line"><a name="l00058"></a><span class="lineno"> 58</span>  a0Val = _mm_load_ps(aPtr);</div>
<div class="line"><a name="l00059"></a><span class="lineno"> 59</span>  a1Val = _mm_load_ps(aPtr+4);</div>
<div class="line"><a name="l00060"></a><span class="lineno"> 60</span>  a2Val = _mm_load_ps(aPtr+8);</div>
<div class="line"><a name="l00061"></a><span class="lineno"> 61</span>  a3Val = _mm_load_ps(aPtr+12);</div>
<div class="line"><a name="l00062"></a><span class="lineno"> 62</span> </div>
<div class="line"><a name="l00063"></a><span class="lineno"> 63</span>  x0Val = _mm_load_ps(bPtr);</div>
<div class="line"><a name="l00064"></a><span class="lineno"> 64</span>  x1Val = _mm_load_ps(bPtr);</div>
<div class="line"><a name="l00065"></a><span class="lineno"> 65</span>  x2Val = _mm_load_ps(bPtr+4);</div>
<div class="line"><a name="l00066"></a><span class="lineno"> 66</span>  x3Val = _mm_load_ps(bPtr+4);</div>
<div class="line"><a name="l00067"></a><span class="lineno"> 67</span>  b0Val = _mm_unpacklo_ps(x0Val, x1Val);</div>
<div class="line"><a name="l00068"></a><span class="lineno"> 68</span>  b1Val = _mm_unpackhi_ps(x0Val, x1Val);</div>
<div class="line"><a name="l00069"></a><span class="lineno"> 69</span>  b2Val = _mm_unpacklo_ps(x2Val, x3Val);</div>
<div class="line"><a name="l00070"></a><span class="lineno"> 70</span>  b3Val = _mm_unpackhi_ps(x2Val, x3Val);</div>
<div class="line"><a name="l00071"></a><span class="lineno"> 71</span> </div>
<div class="line"><a name="l00072"></a><span class="lineno"> 72</span>  c0Val = _mm_mul_ps(a0Val, b0Val);</div>
<div class="line"><a name="l00073"></a><span class="lineno"> 73</span>  c1Val = _mm_mul_ps(a1Val, b1Val);</div>
<div class="line"><a name="l00074"></a><span class="lineno"> 74</span>  c2Val = _mm_mul_ps(a2Val, b2Val);</div>
<div class="line"><a name="l00075"></a><span class="lineno"> 75</span>  c3Val = _mm_mul_ps(a3Val, b3Val);</div>
<div class="line"><a name="l00076"></a><span class="lineno"> 76</span> </div>
<div class="line"><a name="l00077"></a><span class="lineno"> 77</span>  dotProdVal0 = _mm_add_ps(c0Val, dotProdVal0);</div>
<div class="line"><a name="l00078"></a><span class="lineno"> 78</span>  dotProdVal1 = _mm_add_ps(c1Val, dotProdVal1);</div>
<div class="line"><a name="l00079"></a><span class="lineno"> 79</span>  dotProdVal2 = _mm_add_ps(c2Val, dotProdVal2);</div>
<div class="line"><a name="l00080"></a><span class="lineno"> 80</span>  dotProdVal3 = _mm_add_ps(c3Val, dotProdVal3);</div>
<div class="line"><a name="l00081"></a><span class="lineno"> 81</span> </div>
<div class="line"><a name="l00082"></a><span class="lineno"> 82</span>  aPtr += 16;</div>
<div class="line"><a name="l00083"></a><span class="lineno"> 83</span>  bPtr += 8;</div>
<div class="line"><a name="l00084"></a><span class="lineno"> 84</span>  }</div>
<div class="line"><a name="l00085"></a><span class="lineno"> 85</span> </div>
<div class="line"><a name="l00086"></a><span class="lineno"> 86</span>  dotProdVal0 = _mm_add_ps(dotProdVal0, dotProdVal1);</div>
<div class="line"><a name="l00087"></a><span class="lineno"> 87</span>  dotProdVal0 = _mm_add_ps(dotProdVal0, dotProdVal2);</div>
<div class="line"><a name="l00088"></a><span class="lineno"> 88</span>  dotProdVal0 = _mm_add_ps(dotProdVal0, dotProdVal3);</div>
<div class="line"><a name="l00089"></a><span class="lineno"> 89</span> </div>
<div class="line"><a name="l00090"></a><span class="lineno"> 90</span>  <a class="code" href="volk__common_8h.html#af8ae70079c1927f7c46b6d1880473d17">__VOLK_ATTR_ALIGNED</a>(16) float dotProductVector[4];</div>
<div class="line"><a name="l00091"></a><span class="lineno"> 91</span> </div>
<div class="line"><a name="l00092"></a><span class="lineno"> 92</span>  _mm_store_ps(dotProductVector,dotProdVal0); <span class="comment">// Store the results back into the dot product vector</span></div>
<div class="line"><a name="l00093"></a><span class="lineno"> 93</span> </div>
<div class="line"><a name="l00094"></a><span class="lineno"> 94</span>  *realpt = dotProductVector[0];</div>
<div class="line"><a name="l00095"></a><span class="lineno"> 95</span>  *imagpt = dotProductVector[1];</div>
<div class="line"><a name="l00096"></a><span class="lineno"> 96</span>  *realpt += dotProductVector[2];</div>
<div class="line"><a name="l00097"></a><span class="lineno"> 97</span>  *imagpt += dotProductVector[3];</div>
<div class="line"><a name="l00098"></a><span class="lineno"> 98</span> </div>
<div class="line"><a name="l00099"></a><span class="lineno"> 99</span>  number = sixteenthPoints*8;</div>
<div class="line"><a name="l00100"></a><span class="lineno"> 100</span>  for(;number &lt; num_points; number++){</div>
<div class="line"><a name="l00101"></a><span class="lineno"> 101</span>  *realpt += ((*aPtr++) * (*bPtr));</div>
<div class="line"><a name="l00102"></a><span class="lineno"> 102</span>  *imagpt += ((*aPtr++) * (*bPtr++));</div>
<div class="line"><a name="l00103"></a><span class="lineno"> 103</span>  }</div>
<div class="line"><a name="l00104"></a><span class="lineno"> 104</span> </div>
<div class="line"><a name="l00105"></a><span class="lineno"> 105</span>  *result = *(<a class="code" href="volk__complex_8h.html#ace50e1c8ef539cdeee04bc86f0e99169">lv_32fc_t</a>*)(&amp;res[0]);</div>
<div class="line"><a name="l00106"></a><span class="lineno"> 106</span> }</div>
<div class="line"><a name="l00107"></a><span class="lineno"> 107</span> </div>
<div class="line"><a name="l00108"></a><span class="lineno"> 108</span> <span class="preprocessor">#endif </span><span class="comment">/*LV_HAVE_SSE*/</span><span class="preprocessor"></span></div>
<div class="line"><a name="l00109"></a><span class="lineno"> 109</span> <span class="preprocessor"></span></div>
<div class="line"><a name="l00110"></a><span class="lineno"> 110</span> </div>
<div class="line"><a name="l00111"></a><span class="lineno"> 111</span> <span class="preprocessor">#endif </span><span class="comment">/*INCLUDED_volk_32fc_32f_dot_prod_32fc_a_H*/</span><span class="preprocessor"></span></div>
</div><!-- fragment -->
</div><!-- contents -->
</div><!-- doc-content -->
<!-- start footer part -->
<!-- Breadcrumb path to this file, followed by the generator footer entry. -->
<div id="nav-path" class="navpath"><!-- id is needed for treeview function! -->
  <ul>
    <li class="navelem"><a class="el" href="dir_ae2bed2ec5a7e8cc3c6fe8189aba5582.html">volk</a></li><li class="navelem"><a class="el" href="dir_65faefda812cb3f8ac5b182df74eac77.html">include</a></li><li class="navelem"><a class="el" href="dir_35412c2d6cdb849e27c8bd8fabbcf131.html">volk</a></li><li class="navelem"><a class="el" href="volk__32fc__32f__dot__prod__32fc__a_8h.html">volk_32fc_32f_dot_prod_32fc_a.h</a></li>
    <li class="footer">Generated on Fri Apr 19 2013 16:20:34 for GNU Radio 3.6.4.1 C++ API by <a href="http://www.doxygen.org/index.html"> <img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.8.3 </li>
  </ul>
</div>
</body>
</html>