<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
  <meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
  <title>Crypto++: cpu.cpp Source File</title>
  <link href="tabs.css" rel="stylesheet" type="text/css"/>
  <link href="doxygen.css" rel="stylesheet" type="text/css"/>
</head>
<body>
<!-- Generated by Doxygen 1.6.1 -->
<!--
  Page layout: two rows of navigation tabs, then the cpu.cpp source listing,
  then the generator footer. Everything up to the end of the listing lives
  inside the "navigation" container, as in the generated original.
-->
<div class="navigation" id="top">
  <!-- Primary tabs; "Files" is marked as the current section. -->
  <div class="tabs">
    <ul>
      <li><a href="index.html"><span>Main Page</span></a></li>
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
      <li><a href="annotated.html"><span>Classes</span></a></li>
      <li class="current"><a href="files.html"><span>Files</span></a></li>
    </ul>
  </div>
  <!-- Secondary tabs for the Files section. -->
  <div class="tabs">
    <ul>
      <li><a href="files.html"><span>File List</span></a></li>
      <li><a href="globals.html"><span>File Members</span></a></li>
    </ul>
  </div>
<!--
  Source listing. Whitespace inside the pre element is rendered verbatim, so
  the listing lines below start at column 0 and must not be re-indented.
  Every listing line starts with an anchor named l plus the five-digit line
  number, so other pages can link to individual lines. The characters
  less-than, greater-than and ampersand in the code are written as character
  references so that header names and operators are displayed instead of
  being parsed as markup.
-->
<h1>cpu.cpp</h1><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">// cpu.cpp - written and placed in the public domain by Wei Dai</span>
<a name="l00002"></a>00002
<a name="l00003"></a>00003 <span class="preprocessor">#include "pch.h"</span>
<a name="l00004"></a>00004
<a name="l00005"></a>00005 <span class="preprocessor">#ifndef CRYPTOPP_IMPORTS</span>
<a name="l00006"></a>00006 <span class="preprocessor"></span>
<a name="l00007"></a>00007 <span class="preprocessor">#include "cpu.h"</span>
<a name="l00008"></a>00008 <span class="preprocessor">#include "misc.h"</span>
<a name="l00009"></a>00009 <span class="preprocessor">#include &lt;algorithm&gt;</span>
<a name="l00010"></a>00010
<a name="l00011"></a>00011 <span class="preprocessor">#ifdef __GNUC__</span>
<a name="l00012"></a>00012 <span class="preprocessor"></span><span class="preprocessor">#include &lt;signal.h&gt;</span>
<a name="l00013"></a>00013 <span class="preprocessor">#include &lt;setjmp.h&gt;</span>
<a name="l00014"></a>00014 <span class="preprocessor">#endif</span>
<a name="l00015"></a>00015 <span class="preprocessor"></span>
<a name="l00016"></a>00016 <span class="preprocessor">#ifdef CRYPTOPP_MSVC6PP_OR_LATER</span>
<a name="l00017"></a>00017 <span class="preprocessor"></span><span class="preprocessor">#include &lt;emmintrin.h&gt;</span>
<a name="l00018"></a>00018 <span class="preprocessor">#endif</span>
<a name="l00019"></a>00019 <span class="preprocessor"></span>
<a name="l00020"></a>00020 NAMESPACE_BEGIN(CryptoPP)
<a name="l00021"></a>00021
<a name="l00022"></a>00022 <span class="preprocessor">#ifdef CRYPTOPP_X86_ASM_AVAILABLE</span>
<a name="l00023"></a>00023 <span class="preprocessor"></span>
<a name="l00024"></a>00024 <span class="preprocessor">#ifndef _MSC_VER</span>
<a name="l00025"></a>00025 <span class="preprocessor"></span><span class="keyword">typedef</span> void (*SigHandler)(int);
<a name="l00026"></a>00026
<a name="l00027"></a>00027 <span class="keyword">static</span> jmp_buf s_jmpNoCPUID;
<a name="l00028"></a>00028 <span class="keyword">static</span> <span class="keywordtype">void</span> SigIllHandlerCPUID(<span class="keywordtype">int</span>)
<a name="l00029"></a>00029 {
<a name="l00030"></a>00030     longjmp(s_jmpNoCPUID, 1);
<a name="l00031"></a>00031 }
<a name="l00032"></a>00032 <span class="preprocessor">#endif</span>
<a name="l00033"></a>00033 <span class="preprocessor"></span>
<a name="l00034"></a>00034 <span class="keywordtype">bool</span> CpuId(word32 input, word32 *output)
<a name="l00035"></a>00035 {
<a name="l00036"></a>00036 <span class="preprocessor">#ifdef _MSC_VER</span>
<a name="l00037"></a>00037 <span class="preprocessor"></span>    __try
<a name="l00038"></a>00038     {
<a name="l00039"></a>00039         __asm
<a name="l00040"></a>00040         {
<a name="l00041"></a>00041             mov eax, input
<a name="l00042"></a>00042             cpuid
<a name="l00043"></a>00043             mov edi, output
<a name="l00044"></a>00044             mov [edi], eax
<a name="l00045"></a>00045             mov [edi+4], ebx
<a name="l00046"></a>00046             mov [edi+8], ecx
<a name="l00047"></a>00047             mov [edi+12], edx
<a name="l00048"></a>00048         }
<a name="l00049"></a>00049     }
<a name="l00050"></a>00050     __except (1)
<a name="l00051"></a>00051     {
<a name="l00052"></a>00052         <span class="keywordflow">return</span> <span class="keyword">false</span>;
<a name="l00053"></a>00053     }
<a name="l00054"></a>00054     <span class="keywordflow">return</span> <span class="keyword">true</span>;
<a name="l00055"></a>00055 <span class="preprocessor">#else</span>
<a name="l00056"></a>00056 <span class="preprocessor"></span>    SigHandler oldHandler = signal(SIGILL, SigIllHandlerCPUID);
<a name="l00057"></a>00057     <span class="keywordflow">if</span> (oldHandler == SIG_ERR)
<a name="l00058"></a>00058         <span class="keywordflow">return</span> <span class="keyword">false</span>;
<a name="l00059"></a>00059
<a name="l00060"></a>00060     <span class="keywordtype">bool</span> result = <span class="keyword">true</span>;
<a name="l00061"></a>00061     <span class="keywordflow">if</span> (setjmp(s_jmpNoCPUID))
<a name="l00062"></a>00062         result = <span class="keyword">false</span>;
<a name="l00063"></a>00063     <span class="keywordflow">else</span>
<a name="l00064"></a>00064     {
<a name="l00065"></a>00065         __asm__
<a name="l00066"></a>00066         (
<a name="l00067"></a>00067             <span class="comment">// save ebx in case -fPIC is being used</span>
<a name="l00068"></a>00068 #<span class="keywordflow">if</span> CRYPTOPP_BOOL_X86
<a name="l00069"></a>00069             <span class="stringliteral">"push %%ebx; cpuid; mov %%ebx, %%edi; pop %%ebx"</span>
<a name="l00070"></a>00070 #<span class="keywordflow">else</span>
<a name="l00071"></a>00071             <span class="stringliteral">"pushq %%rbx; cpuid; mov %%ebx, %%edi; popq %%rbx"</span>
<a name="l00072"></a>00072 #endif
<a name="l00073"></a>00073             : <span class="stringliteral">"=a"</span> (output[0]), <span class="stringliteral">"=D"</span> (output[1]), <span class="stringliteral">"=c"</span> (output[2]), <span class="stringliteral">"=d"</span> (output[3])
<a name="l00074"></a>00074             : <span class="stringliteral">"a"</span> (input)
<a name="l00075"></a>00075         );
<a name="l00076"></a>00076     }
<a name="l00077"></a>00077
<a name="l00078"></a>00078     signal(SIGILL, oldHandler);
<a name="l00079"></a>00079     <span class="keywordflow">return</span> result;
<a name="l00080"></a>00080 <span class="preprocessor">#endif</span>
<a name="l00081"></a>00081 <span class="preprocessor"></span>}
<a name="l00082"></a>00082
<a name="l00083"></a>00083 <span class="preprocessor">#ifndef _MSC_VER</span>
<a name="l00084"></a>00084 <span class="preprocessor"></span><span class="keyword">static</span> jmp_buf s_jmpNoSSE2;
<a name="l00085"></a>00085 <span class="keyword">static</span> <span class="keywordtype">void</span> SigIllHandlerSSE2(<span class="keywordtype">int</span>)
<a name="l00086"></a>00086 {
<a name="l00087"></a>00087     longjmp(s_jmpNoSSE2, 1);
<a name="l00088"></a>00088 }
<a name="l00089"></a>00089 <span class="preprocessor">#endif</span>
<a name="l00090"></a>00090 <span class="preprocessor"></span>
<a name="l00091"></a>00091 <span class="preprocessor">#elif _MSC_VER &gt;= 1400 &amp;&amp; CRYPTOPP_BOOL_X64</span>
<a name="l00092"></a>00092 <span class="preprocessor"></span>
<a name="l00093"></a>00093 <span class="keywordtype">bool</span> CpuId(word32 input, word32 *output)
<a name="l00094"></a>00094 {
<a name="l00095"></a>00095     __cpuid((<span class="keywordtype">int</span> *)output, input);
<a name="l00096"></a>00096     <span class="keywordflow">return</span> <span class="keyword">true</span>;
<a name="l00097"></a>00097 }
<a name="l00098"></a>00098
<a name="l00099"></a>00099 <span class="preprocessor">#endif</span>
<a name="l00100"></a>00100 <span class="preprocessor"></span>
<a name="l00101"></a>00101 <span class="preprocessor">#ifdef CRYPTOPP_CPUID_AVAILABLE</span>
<a name="l00102"></a>00102 <span class="preprocessor"></span>
<a name="l00103"></a>00103 <span class="keyword">static</span> <span class="keywordtype">bool</span> TrySSE2()
<a name="l00104"></a>00104 {
<a name="l00105"></a>00105 <span class="preprocessor">#if CRYPTOPP_BOOL_X64</span>
<a name="l00106"></a>00106 <span class="preprocessor"></span>    <span class="keywordflow">return</span> <span class="keyword">true</span>;
<a name="l00107"></a>00107 <span class="preprocessor">#elif defined(_MSC_VER)</span>
<a name="l00108"></a>00108 <span class="preprocessor"></span>    __try
<a name="l00109"></a>00109     {
<a name="l00110"></a>00110 <span class="preprocessor">#if CRYPTOPP_BOOL_SSE2_ASM_AVAILABLE</span>
<a name="l00111"></a>00111 <span class="preprocessor"></span>        AS2(por xmm0, xmm0) <span class="comment">// executing SSE2 instruction</span>
<a name="l00112"></a>00112 <span class="preprocessor">#elif CRYPTOPP_BOOL_SSE2_INTRINSICS_AVAILABLE</span>
<a name="l00113"></a>00113 <span class="preprocessor"></span>        __mm128i x = _mm_setzero_si128();
<a name="l00114"></a>00114         <span class="keywordflow">return</span> _mm_cvtsi128_si32(x) == 0;
<a name="l00115"></a>00115 <span class="preprocessor">#endif</span>
<a name="l00116"></a>00116 <span class="preprocessor"></span>    }
<a name="l00117"></a>00117     __except (1)
<a name="l00118"></a>00118     {
<a name="l00119"></a>00119         <span class="keywordflow">return</span> <span class="keyword">false</span>;
<a name="l00120"></a>00120     }
<a name="l00121"></a>00121     <span class="keywordflow">return</span> <span class="keyword">true</span>;
<a name="l00122"></a>00122 <span class="preprocessor">#elif defined(__GNUC__)</span>
<a name="l00123"></a>00123 <span class="preprocessor"></span>    SigHandler oldHandler = signal(SIGILL, SigIllHandlerSSE2);
<a name="l00124"></a>00124     <span class="keywordflow">if</span> (oldHandler == SIG_ERR)
<a name="l00125"></a>00125         <span class="keywordflow">return</span> <span class="keyword">false</span>;
<a name="l00126"></a>00126
<a name="l00127"></a>00127     <span class="keywordtype">bool</span> result = <span class="keyword">true</span>;
<a name="l00128"></a>00128     <span class="keywordflow">if</span> (setjmp(s_jmpNoSSE2))
<a name="l00129"></a>00129         result = <span class="keyword">false</span>;
<a name="l00130"></a>00130     <span class="keywordflow">else</span>
<a name="l00131"></a>00131     {
<a name="l00132"></a>00132 <span class="preprocessor">#if CRYPTOPP_BOOL_SSE2_ASM_AVAILABLE</span>
<a name="l00133"></a>00133 <span class="preprocessor"></span>        __asm __volatile (<span class="stringliteral">"por %xmm0, %xmm0"</span>);
<a name="l00134"></a>00134 <span class="preprocessor">#elif CRYPTOPP_BOOL_SSE2_INTRINSICS_AVAILABLE</span>
<a name="l00135"></a>00135 <span class="preprocessor"></span>        __mm128i x = _mm_setzero_si128();
<a name="l00136"></a>00136         result = _mm_cvtsi128_si32(x) == 0;
<a name="l00137"></a>00137 <span class="preprocessor">#endif</span>
<a name="l00138"></a>00138 <span class="preprocessor"></span>    }
<a name="l00139"></a>00139
<a name="l00140"></a>00140     signal(SIGILL, oldHandler);
<a name="l00141"></a>00141     <span class="keywordflow">return</span> result;
<a name="l00142"></a>00142 <span class="preprocessor">#else</span>
<a name="l00143"></a>00143 <span class="preprocessor"></span>    <span class="keywordflow">return</span> <span class="keyword">false</span>;
<a name="l00144"></a>00144 <span class="preprocessor">#endif</span>
<a name="l00145"></a>00145 <span class="preprocessor"></span>}
<a name="l00146"></a>00146
<a name="l00147"></a>00147 <span class="keywordtype">bool</span> g_x86DetectionDone = <span class="keyword">false</span>;
<a name="l00148"></a>00148 <span class="keywordtype">bool</span> g_hasISSE = <span class="keyword">false</span>, g_hasSSE2 = <span class="keyword">false</span>, g_hasSSSE3 = <span class="keyword">false</span>, g_hasMMX = <span class="keyword">false</span>, g_isP4 = <span class="keyword">false</span>;
<a name="l00149"></a>00149 word32 g_cacheLineSize = CRYPTOPP_L1_CACHE_LINE_SIZE;
<a name="l00150"></a>00150
<a name="l00151"></a>00151 <span class="keywordtype">void</span> DetectX86Features()
<a name="l00152"></a>00152 {
<a name="l00153"></a>00153     word32 cpuid[4], cpuid1[4];
<a name="l00154"></a>00154     <span class="keywordflow">if</span> (!CpuId(0, cpuid))
<a name="l00155"></a>00155         <span class="keywordflow">return</span>;
<a name="l00156"></a>00156     <span class="keywordflow">if</span> (!CpuId(1, cpuid1))
<a name="l00157"></a>00157         <span class="keywordflow">return</span>;
<a name="l00158"></a>00158
<a name="l00159"></a>00159     g_hasMMX = (cpuid1[3] &amp; (1 &lt;&lt; 23)) != 0;
<a name="l00160"></a>00160     <span class="keywordflow">if</span> ((cpuid1[3] &amp; (1 &lt;&lt; 26)) != 0)
<a name="l00161"></a>00161         g_hasSSE2 = TrySSE2();
<a name="l00162"></a>00162     g_hasSSSE3 = g_hasSSE2 &amp;&amp; (cpuid1[2] &amp; (1&lt;&lt;9));
<a name="l00163"></a>00163
<a name="l00164"></a>00164     <span class="keywordflow">if</span> ((cpuid1[3] &amp; (1 &lt;&lt; 25)) != 0)
<a name="l00165"></a>00165         g_hasISSE = <span class="keyword">true</span>;
<a name="l00166"></a>00166     <span class="keywordflow">else</span>
<a name="l00167"></a>00167     {
<a name="l00168"></a>00168         word32 cpuid2[4];
<a name="l00169"></a>00169         CpuId(0x080000000, cpuid2);
<a name="l00170"></a>00170         <span class="keywordflow">if</span> (cpuid2[0] &gt;= 0x080000001)
<a name="l00171"></a>00171         {
<a name="l00172"></a>00172             CpuId(0x080000001, cpuid2);
<a name="l00173"></a>00173             g_hasISSE = (cpuid2[3] &amp; (1 &lt;&lt; 22)) != 0;
<a name="l00174"></a>00174         }
<a name="l00175"></a>00175     }
<a name="l00176"></a>00176
<a name="l00177"></a>00177     std::swap(cpuid[2], cpuid[3]);
<a name="l00178"></a>00178     <span class="keywordflow">if</span> (memcmp(cpuid+1, <span class="stringliteral">"GenuineIntel"</span>, 12) == 0)
<a name="l00179"></a>00179     {
<a name="l00180"></a>00180         g_isP4 = ((cpuid1[0] &gt;&gt; 8) &amp; 0xf) == 0xf;
<a name="l00181"></a>00181         g_cacheLineSize = 8 * GETBYTE(cpuid1[1], 1);
<a name="l00182"></a>00182     }
<a name="l00183"></a>00183     <span class="keywordflow">else</span> <span class="keywordflow">if</span> (memcmp(cpuid+1, <span class="stringliteral">"AuthenticAMD"</span>, 12) == 0)
<a name="l00184"></a>00184     {
<a name="l00185"></a>00185         CpuId(0x80000005, cpuid);
<a name="l00186"></a>00186         g_cacheLineSize = GETBYTE(cpuid[2], 0);
<a name="l00187"></a>00187     }
<a name="l00188"></a>00188
<a name="l00189"></a>00189     <span class="keywordflow">if</span> (!g_cacheLineSize)
<a name="l00190"></a>00190         g_cacheLineSize = CRYPTOPP_L1_CACHE_LINE_SIZE;
<a name="l00191"></a>00191
<a name="l00192"></a>00192     g_x86DetectionDone = <span class="keyword">true</span>;
<a name="l00193"></a>00193 }
<a name="l00194"></a>00194
<a name="l00195"></a>00195 <span class="preprocessor">#endif</span>
<a name="l00196"></a>00196 <span class="preprocessor"></span>
<a name="l00197"></a>00197 NAMESPACE_END
<a name="l00198"></a>00198
<a name="l00199"></a>00199 <span class="preprocessor">#endif</span>
</pre></div></div>
<!-- Generator footer: build date, project name and a link to the Doxygen site. -->
<hr size="1"/><address style="text-align: right;"><small>Generated on 9 Dec 2009 for Crypto++ by
<a href="http://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.6.1 </small></address>
</body>
</html>