📄 rijndael_8cpp-source.html
字号:
<a name="l00156"></a>00156 <span class="keyword">const</span> word32 *kLoopEnd = k + m_rounds*4;<a name="l00157"></a>00157 <span class="preprocessor"> #if CRYPTOPP_BOOL_X64</span><a name="l00158"></a>00158 <span class="preprocessor"></span><span class="preprocessor"> #define K_REG r8</span><a name="l00159"></a>00159 <span class="preprocessor"></span><span class="preprocessor"> #define K_END_REG r9</span><a name="l00160"></a>00160 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_K</span><a name="l00161"></a>00161 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_K</span><a name="l00162"></a>00162 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_K_END</span><a name="l00163"></a>00163 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_0(x) AS2(mov r10d, x)</span><a name="l00164"></a>00164 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_1(x) AS2(mov r11d, x)</span><a name="l00165"></a>00165 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_2(x) AS2(mov r12d, x)</span><a name="l00166"></a>00166 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_0(x) AS2(mov x, r10d)</span><a name="l00167"></a>00167 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_1(x) AS2(mov x, r11d)</span><a name="l00168"></a>00168 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_2(x) AS2(mov x, r12d)</span><a name="l00169"></a>00169 <span class="preprocessor"></span><span class="preprocessor"> #else</span><a name="l00170"></a>00170 <span class="preprocessor"></span><span class="preprocessor"> #define K_REG esi</span><a name="l00171"></a>00171 <span class="preprocessor"></span><span class="preprocessor"> #define K_END_REG edi</span><a name="l00172"></a>00172 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_K AS2(movd mm4, esi)</span><a name="l00173"></a>00173 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_K AS2(movd esi, mm4)</span><a name="l00174"></a>00174 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_K_END AS2(movd edi, mm5)</span><a name="l00175"></a>00175 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_0(x) AS2(movd mm0, x)</span><a name="l00176"></a>00176 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_1(x) AS2(movd mm1, x)</span><a name="l00177"></a>00177 <span class="preprocessor"></span><span class="preprocessor"> #define SAVE_2(x) AS2(movd mm2, x)</span><a name="l00178"></a>00178 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_0(x) AS2(movd x, mm0)</span><a name="l00179"></a>00179 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_1(x) AS2(movd x, mm1)</span><a name="l00180"></a>00180 <span class="preprocessor"></span><span class="preprocessor"> #define RESTORE_2(x) AS2(movd x, mm2)</span><a name="l00181"></a>00181 <span class="preprocessor"></span><span class="preprocessor"> #endif</span><a name="l00182"></a>00182 <span class="preprocessor"></span><span class="preprocessor">#ifdef __GNUC__</span><a name="l00183"></a>00183 <span class="preprocessor"></span> word32 t0, t1, t2, t3;<a name="l00184"></a>00184 __asm__ __volatile__<a name="l00185"></a>00185 (<a name="l00186"></a>00186 <span class="stringliteral">".intel_syntax noprefix;"</span><a name="l00187"></a>00187 AS_PUSH( bx)<a name="l00188"></a>00188 AS_PUSH( bp)<a name="l00189"></a>00189 AS2( mov WORD_REG(bp), WORD_REG(ax))<a name="l00190"></a>00190 #<span class="keywordflow">if</span> CRYPTOPP_BOOL_X64<a name="l00191"></a>00191 <span class="comment">// save these manually. clobber list doesn't seem to work as of GCC 4.1.0</span><a name="l00192"></a>00192 AS1( pushq K_REG)<a name="l00193"></a>00193 AS1( pushq K_END_REG)<a name="l00194"></a>00194 AS1( pushq r10)<a name="l00195"></a>00195 AS1( pushq r11)<a name="l00196"></a>00196 AS1( pushq r12)<a name="l00197"></a>00197 AS2( mov K_REG, rsi)<a name="l00198"></a>00198 AS2( mov K_END_REG, rcx)<a name="l00199"></a>00199 #<span class="keywordflow">else</span><a name="l00200"></a>00200 AS2( movd mm5, ecx)<a name="l00201"></a>00201 #endif<a name="l00202"></a>00202 #<span class="keywordflow">else</span><a name="l00203"></a>00203 #<span class="keywordflow">if</span> _MSC_VER < 1300<a name="l00204"></a>00204 <span class="keyword">const</span> word32 *t = Te;<a name="l00205"></a>00205 AS2( mov eax, t)<a name="l00206"></a>00206 <span class="preprocessor">#endif</span><a name="l00207"></a>00207 <span class="preprocessor"></span> AS2( mov edx, g_cacheLineSize)<a name="l00208"></a>00208 AS2( mov WORD_REG(di), inBlock)<a name="l00209"></a>00209 AS2( mov K_REG, k)<a name="l00210"></a>00210 AS2( movd mm5, kLoopEnd)<a name="l00211"></a>00211 <span class="preprocessor">#if _MSC_VER < 1300</span><a name="l00212"></a>00212 <span class="preprocessor"></span> AS_PUSH( bx)<a name="l00213"></a>00213 AS_PUSH( bp)<a name="l00214"></a>00214 AS2( mov ebp, eax)<a name="l00215"></a>00215 <span class="preprocessor">#else</span><a name="l00216"></a>00216 <span class="preprocessor"></span> AS_PUSH( bp)<a name="l00217"></a>00217 AS2( lea ebp, Te)<a name="l00218"></a>00218 <span class="preprocessor">#endif</span><a name="l00219"></a>00219 <span class="preprocessor"></span><span class="preprocessor">#endif</span><a name="l00220"></a>00220 <span class="preprocessor"></span> AS2( mov eax, [K_REG+0*4]) <span class="comment">// s0</span><a name="l00221"></a>00221 AS2( xor eax, [WORD_REG(di)+0*4])<a name="l00222"></a>00222 SAVE_0(eax)<a name="l00223"></a>00223 AS2( mov ebx, [K_REG+1*4])<a name="l00224"></a>00224 AS2( xor ebx, [WORD_REG(di)+1*4])<a name="l00225"></a>00225 SAVE_1(ebx)<a name="l00226"></a>00226 AS2( and ebx, eax)<a name="l00227"></a>00227 AS2( mov eax, [K_REG+2*4])<a name="l00228"></a>00228 AS2( xor eax, [WORD_REG(di)+2*4])<a name="l00229"></a>00229 SAVE_2(eax)<a name="l00230"></a>00230 AS2( and ebx, eax)<a name="l00231"></a>00231 AS2( mov ecx, [K_REG+3*4])<a name="l00232"></a>00232 AS2( xor ecx, [WORD_REG(di)+3*4])<a name="l00233"></a>00233 AS2( and ebx, ecx)<a name="l00234"></a>00234 <a name="l00235"></a>00235 <span class="comment">// read Te0 into L1 cache. this code could be simplifed by using lfence, but that is an SSE2 instruction</span><a name="l00236"></a>00236 AS2( and ebx, 0)<a name="l00237"></a>00237 AS2( mov edi, ebx) <span class="comment">// make index depend on previous loads to simulate lfence</span><a name="l00238"></a>00238 ASL(2)<a name="l00239"></a>00239 AS2( and ebx, [WORD_REG(bp)+WORD_REG(di)])<a name="l00240"></a>00240 AS2( add edi, edx)<a name="l00241"></a>00241 AS2( and ebx, [WORD_REG(bp)+WORD_REG(di)])<a name="l00242"></a>00242 AS2( add edi, edx)<a name="l00243"></a>00243 AS2( and ebx, [WORD_REG(bp)+WORD_REG(di)])<a name="l00244"></a>00244 AS2( add edi, edx)<a name="l00245"></a>00245 AS2( and ebx, [WORD_REG(bp)+WORD_REG(di)])<a name="l00246"></a>00246 AS2( add edi, edx)<a name="l00247"></a>00247 AS2( cmp edi, 1024)<a name="l00248"></a>00248 ASJ( jl, 2, b)<a name="l00249"></a>00249 AS2( and ebx, [WORD_REG(bp)+1020])<a name="l00250"></a>00250 <span class="preprocessor">#if CRYPTOPP_BOOL_X64</span><a name="l00251"></a>00251 <span class="preprocessor"></span> AS2( xor r10d, ebx)<a name="l00252"></a>00252 AS2( xor r11d, ebx)<a name="l00253"></a>00253 AS2( xor r12d, ebx)<a name="l00254"></a>00254 <span class="preprocessor">#else</span><a name="l00255"></a>00255 <span class="preprocessor"></span> AS2( movd mm6, ebx)<a name="l00256"></a>00256 AS2( pxor mm2, mm6)<a name="l00257"></a>00257 AS2( pxor mm1, mm6)<a name="l00258"></a>00258 AS2( pxor mm0, mm6)<a name="l00259"></a>00259 <span class="preprocessor">#endif</span><a name="l00260"></a>00260 <span class="preprocessor"></span> AS2( xor ecx, ebx)<a name="l00261"></a>00261 <a name="l00262"></a>00262 AS2( mov edi, [K_REG+4*4]) <span class="comment">// t0</span><a name="l00263"></a>00263 AS2( mov eax, [K_REG+5*4])<a name="l00264"></a>00264 AS2( mov ebx, [K_REG+6*4])<a name="l00265"></a>00265 AS2( mov edx, [K_REG+7*4])<a name="l00266"></a>00266 AS2( add K_REG, 8*4)<a name="l00267"></a>00267 SAVE_K<a name="l00268"></a>00268 <a name="l00269"></a>00269 <span class="preprocessor">#define QUARTER_ROUND(t, a, b, c, d) \</span><a name="l00270"></a>00270 <span class="preprocessor"> AS2(movzx esi, t##l)\</span><a name="l00271"></a>00271 <span class="preprocessor"> AS2(d, [WORD_REG(bp)+0*1024+4*WORD_REG(si)])\</span><a name="l00272"></a>00272 <span class="preprocessor"> AS2(movzx esi, t##h)\</span><a name="l00273"></a>00273 <span class="preprocessor"> AS2(c, [WORD_REG(bp)+1*1024+4*WORD_REG(si)])\</span><a name="l00274"></a>00274 <span class="preprocessor"> AS2(shr e##t##x, 16)\</span><a name="l00275"></a>00275 <span class="preprocessor"> AS2(movzx esi, t##l)\</span><a name="l00276"></a>00276 <span class="preprocessor"> AS2(b, [WORD_REG(bp)+2*1024+4*WORD_REG(si)])\</span><a name="l00277"></a>00277 <span class="preprocessor"> AS2(movzx esi, t##h)\</span><a name="l00278"></a>00278 <span class="preprocessor"> AS2(a, [WORD_REG(bp)+3*1024+4*WORD_REG(si)])</span><a name="l00279"></a>00279 <span class="preprocessor"></span><a name="l00280"></a>00280 <span class="preprocessor">#define s0 xor edi</span><a name="l00281"></a>00281 <span class="preprocessor"></span><span class="preprocessor">#define s1 xor eax</span><a name="l00282"></a>00282 <span class="preprocessor"></span><span class="preprocessor">#define s2 xor ebx</span><a name="l00283"></a>00283 <span class="preprocessor"></span><span class="preprocessor">#define s3 xor ecx</span><a name="l00284"></a>00284 <span class="preprocessor"></span><span class="preprocessor">#define t0 xor edi</span><a name="l00285"></a>00285 <span class="preprocessor"></span><span class="preprocessor">#define t1 xor eax</span><a name="l00286"></a>00286 <span class="preprocessor"></span><span class="preprocessor">#define t2 xor ebx</span><a name="l00287"></a>00287 <span class="preprocessor"></span><span class="preprocessor">#define t3 xor edx</span><a name="l00288"></a>00288 <span class="preprocessor"></span><a name="l00289"></a>00289 QUARTER_ROUND(c, t0, t1, t2, t3)<a name="l00290"></a>00290 RESTORE_2(ecx)<a name="l00291"></a>00291 QUARTER_ROUND(c, t3, t0, t1, t2)<a name="l00292"></a>00292 RESTORE_1(ecx)<a name="l00293"></a>00293 QUARTER_ROUND(c, t2, t3, t0, t1)<a name="l00294"></a>00294 RESTORE_0(ecx)<a name="l00295"></a>00295 QUARTER_ROUND(c, t1, t2, t3, t0)<a name="l00296"></a>00296 SAVE_2(ebx)<a name="l00297"></a>00297 SAVE_1(eax)<a name="l00298"></a>00298 SAVE_0(edi)<a name="l00299"></a>00299 <span class="preprocessor">#undef QUARTER_ROUND</span><a name="l00300"></a>00300 <span class="preprocessor"></span><a name="l00301"></a>00301 RESTORE_K<a name="l00302"></a>00302 <a name="l00303"></a>00303 ASL(0)<a name="l00304"></a>00304 AS2( mov edi, [K_REG+0*4])<a name="l00305"></a>00305 AS2( mov eax, [K_REG+1*4])<a name="l00306"></a>00306 AS2( mov ebx, [K_REG+2*4])<a name="l00307"></a>00307 AS2( mov ecx, [K_REG+3*4])<a name="l00308"></a>00308 <a name="l00309"></a>00309 <span class="preprocessor">#define QUARTER_ROUND(t, a, b, c, d) \</span><a name="l00310"></a>00310 <span class="preprocessor"> AS2(movzx esi, t##l)\</span><a name="l00311"></a>00311 <span class="preprocessor"> AS2(a, [WORD_REG(bp)+3*1024+4*WORD_REG(si)])\</span><a name="l00312"></a>00312 <span class="preprocessor"> AS2(movzx esi, t##h)\</span><a name="l00313"></a>00313 <span class="preprocessor"> AS2(b, [WORD_REG(bp)+2*1024+4*WORD_REG(si)])\</span><a name="l00314"></a>00314 <span class="preprocessor"> AS2(shr e##t##x, 16)\</span><a name="l00315"></a>00315 <span class="preprocessor"> AS2(movzx esi, t##l)\</span><a name="l00316"></a>00316 <span class="preprocessor"> AS2(c, [WORD_REG(bp)+1*1024+4*WORD_REG(si)])\</span><a name="l00317"></a>00317 <span class="preprocessor"> AS2(movzx esi, t##h)\</span><a name="l00318"></a>00318 <span class="preprocessor"> AS2(d, [WORD_REG(bp)+0*1024+4*WORD_REG(si)])</span><a name="l00319"></a>00319 <span class="preprocessor"></span><a name="l00320"></a>00320 QUARTER_ROUND(d, s0, s1, s2, s3)<a name="l00321"></a>00321 RESTORE_2(edx)<a name="l00322"></a>00322 QUARTER_ROUND(d, s3, s0, s1, s2)<a name="l00323"></a>00323 RESTORE_1(edx)<a name="l00324"></a>00324 QUARTER_ROUND(d, s2, s3, s0, s1)<a name="l00325"></a>00325 RESTORE_0(edx)<a name="l00326"></a>00326 QUARTER_ROUND(d, s1, s2, s3, s0)<a name="l00327"></a>00327 RESTORE_K<a name="l00328"></a>00328 SAVE_2(ebx)<a name="l00329"></a>00329 SAVE_1(eax)<a name="l00330"></a>00330 SAVE_0(edi)<a name="l00331"></a>00331
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -