📄 s_erfl.s
字号:
};;{ .mfi add rAddr1 = rDataPtr, rOffset // Get address for // interval data nop.f 0 shl rTailAddOffset = rInterval, 5 // Offset to interval // "tail" data }{ .mib add rAddr2 = rShiftedDataPtr, rOffset // Get second // address for interval data (p7) cmp.leu p11, p0 = rSaturation, rArgSig // if arg is // in [6.53;8] interval(p11) br.cond.spnt _saturation // Branch to Saturation path};;{ .mmi ldfe fA3 = [rAddr1], 0x90 // Load A3 ldfpd fA2H, fA2L = [rAddr2], 16 // Load A2High, A2Low add rTailOffset = rTailOffset, rTailAddOffset // "Tail" offset};;{ .mmi ldfe fA20 = [rAddr1], 16 // Load A20 ldfpd fA1H, fA1L = [rAddr2], 16 // Load A1High, A1Low(p8) adds rTailOffset = 0x140, rTailOffset // Additional offset // for [3.24;4] interval};;{ .mmi ldfe fA19 = [rAddr1], 16 // Load A19 ldfpd fA0H, fA0L = [rAddr2], 16 // Load A0High, A0Low add rTailAddr1 = rTailDataPtr, rTailOffset // First tail // data address};;.pred.rel "mutex",p8,p10{ .mfi ldfe fA18 = [rAddr1], 16 // Load A18(p8) fms.s1 fArgAbsNorm = fArgAbsNorm, f1, f2p0 // Add 2.0 // to normalized arg (for [3.24;4] interval) adds rTailAddr2 = 0x10, rTailAddr1 // First tail // data address}{ .mfi ldfe fA25 = [rAddr2], 16 // Load A25 (p10) fms.s1 fArgAbsNorm = fArgAbsNorm, f1, f1p5 // Add 1.5 // to normalized arg nop.i 0};;{ .mmi ldfe fA17 = [rAddr1], 16 // Load A17 ldfe fA24 = [rAddr2], 16 // Load A24 nop.i 0};;{ .mmi ldfe fA16 = [rAddr1], 16 // Load A16 ldfe fA23 = [rAddr2], 16 // Load A23 nop.i 0};;{ .mmi ldfe fA15 = [rAddr1], 16 // Load A15 ldfe fA22 = [rAddr2], 16 // Load A22 nop.i 0};;{ .mmi ldfe fA14 = [rAddr1], 16 // Load A14 ldfe fA21 = [rAddr2], 16 // Load A21 nop.i 0};;{ .mfi ldfe fA13 = [rTailAddr1], 32 // Load A13 fms.s1 fArgAbsNorm2 = fArgAbsNorm, fArgAbsNorm, f0 // x^2 nop.i 0}{ .mfi ldfe fA12 = [rTailAddr2], 32 // Load A12 nop.f 0 nop.i 0};;{ .mfi ldfe fA11 = [rTailAddr1], 32 // Load A11 fma.s1 fRes3H = fA3, fArgAbsNorm, fA2H // (A3*x+A2)*x^2 nop.i 0}{ .mfi ldfe fA10 = [rTailAddr2], 32 // Load A10 fma.s1 fTH = fA3, fArgAbsNorm, f0 // (A3*x+A2)*x^2 nop.i 0};;{ .mfi ldfe fA9 = [rTailAddr1], 32 // Load A9 fma.s1 fTT2 = fA1L, fArgAbsNorm, f0 // A1*x+A0 nop.i 0}{ .mfi ldfe fA8 = [rTailAddr2], 32 // Load A8 nop.f 0 nop.i 0};;{ .mmi ldfe fA7 = [rTailAddr1], 32 // Load A7 ldfe fA6 = [rTailAddr2], 32 // Load A6 nop.i 0};;{ .mmi ldfe fA5 = [rTailAddr1], 32 // Load A5 ldfe fA4 = [rTailAddr2], 32 // Load A4 nop.i 0};;{ .mfi nop.m 0 fms.s1 fArgAbsNorm2L = fArgAbsNorm, fArgAbsNorm, fArgAbsNorm2 // Low part of x^2 (delta) nop.i 0}{ .mfi nop.m 0 fms.s1 fArgAbsNorm4 = fArgAbsNorm2, fArgAbsNorm2, f0 // x^4 nop.i 0};;{ .mfi nop.m 0 fms.s1 fRes3L = fA2H, f1, fRes3H // // (A3*x+A2)*x^2 nop.i 0};;{ .mfi nop.m 0 fms.s1 fArgAbsNorm3 = fArgAbsNorm2, fArgAbsNorm, f0 // x^3 nop.i 0}{ .mfi nop.m 0 fma.s1 fTH2 = fA1H, fArgAbsNorm, fTT2 // A1*x+A0 nop.i 0};;{ .mfi nop.m 0 fma.s1 fA23 = fA24, fArgAbsNorm, fA23 // Polynomial tail nop.i 0}{ .mfi nop.m 0 fma.s1 fA21 = fA22, fArgAbsNorm, fA21 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fA12 = fA13, fArgAbsNorm, fA12 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fRes3L = fRes3L, f1, fTH // (A3*x+A2)*x^2 nop.i 0}{ .mfi nop.m 0 fma.s1 fA19 = fA20, fArgAbsNorm, fA19 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fRes1H = fTH2, f1, fA0H // A1*x+A0 nop.i 0}{ .mfi nop.m 0 fms.s1 fTL2 = fA1H, fArgAbsNorm, fTH2 // A1*x+A0 nop.i 0};;{ .mfi nop.m 0 fma.s1 fA8 = fA9, fArgAbsNorm, fA8 // Polynomial tail nop.i 0}{ .mfi nop.m 0 fma.s1 fA10 = fA11, fArgAbsNorm, fA10 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fA15 = fA16, fArgAbsNorm, fA15 // Polynomial tail nop.i 0}{ .mfi nop.m 0 fma.s1 fA17 = fA18, fArgAbsNorm, fA17 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fms.s1 fArgAbsNorm11 = fArgAbsNorm4, fArgAbsNorm4, f0 // x^8 nop.i 0}{ .mfi nop.m 0 fma.s1 fA4 = fA5, fArgAbsNorm, fA4 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fRes3L = fRes3L, f1, fA2L // (A3*x+A2)*x^2 nop.i 0}{ .mfi nop.m 0 fma.s1 fA6 = fA7, fArgAbsNorm, fA6 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fTL2 = fTL2, f1, fTT2 // A1*x+A0 nop.i 0}{ .mfi nop.m 0 fms.s1 fRes1L = fA0H, f1, fRes1H // A1*x+A0 nop.i 0};;{ .mfi nop.m 0 fma.s1 fA23 = fA25, fArgAbsNorm2, fA23 // Polynomial tail nop.i 0}{ .mfi nop.m 0 fma.s1 fA12 = fA14, fArgAbsNorm2, fA12 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fA19 = fA21, fArgAbsNorm2, fA19 // Polynomial tail nop.i 0}{ .mfi nop.m 0 fma.s1 fA8 = fA10, fArgAbsNorm2, fA8 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fA15 = fA17, fArgAbsNorm2, fA15 // Polynomial tail nop.i 0}{ .mfi nop.m 0 fms.s1 fArgAbsNorm11 = fArgAbsNorm11, fArgAbsNorm3, f0 // x^11 nop.i 0};;{ .mfi nop.m 0 fma.s1 fTT = fRes3L, fArgAbsNorm2, f0 // (A3*x+A2)*x^2 nop.i 0}{ .mfi nop.m 0 fma.s1 fA4 = fA6, fArgAbsNorm2, fA4 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fRes1L = fRes1L, f1, fTH2 // A1*x+A0 nop.i 0};;{ .mfi nop.m 0 fma.s1 fA19 = fA23, fArgAbsNorm4, fA19 // Polynomial tail nop.i 0}{ .mfi nop.m 0 fma.s1 fA8 = fA12, fArgAbsNorm4, fA8 // Polynomial tail nop.i 0};;{ .mfi nop.m 0 fma.s1 fTT = fRes3H, fArgAbsNorm2L, fTT // (A3*x+A2)*x^2 nop.i 0};;{ .mfi
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -