⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 atl_dmm4x1x90_x87.c

📁 基于 BLAS、CLAPACK 的。用过的人知道是干啥的
💻 C
📖 第 1 页 / 共 5 页
字号:
	/*
	 * Unrolled k-steps of a 4x1 double-precision multiply-accumulate on the
	 * x87 stack (GAS AT&T syntax, run through the C preprocessor).
	 *
	 * Every "#if KB > k" section performs the same work for one k index:
	 *   - fldl  loads one 64-bit B value (rB0) from pB0 / pBE,
	 *   - four 64-bit A values are read from pA0 / pAE at index 0, lda,
	 *     lda*2 and lda3, each multiplied by rB0,
	 *   - the four products are added into the accumulators rC0..rC3 that
	 *     stay resident on the x87 stack.
	 *
	 * Trailing comments show the x87 stack after the instruction, st(0)
	 * first; a '+' marks an accumulator already updated in this k-step.
	 *
	 * NOTE(review): this view starts inside the k-step that uses byte offset
	 * 152 (its "#if" opener is not visible here) and stops inside the
	 * "KB > 37" step; both partial steps are reproduced exactly as far as
	 * they are visible.
	 * NOTE(review): lda3 is presumably a register holding 3*lda, and the
	 * "-128" bias presumably keeps displacements in signed 8-bit range
	 * with pA0/pB0 pre-advanced by 128 bytes -- confirm against the
	 * prologue, which is outside this view.
	 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	152-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	152-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	152-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 20
	fldl	160-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	160-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	160-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	160-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	160-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 21
	fldl	168-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	168-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	168-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	168-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	168-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 22
	fldl	176-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	176-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	176-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	176-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	176-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 23
	fldl	184-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	184-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	184-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	184-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	184-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 24
	fldl	192-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	192-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	192-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	192-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	192-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 25
	fldl	200-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	200-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	200-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	200-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	200-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 26
	fldl	208-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	208-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	208-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	208-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	208-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 27
	fldl	216-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	216-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	216-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	216-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	216-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 28
	fldl	224-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	224-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	224-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	224-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	224-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 29
	fldl	232-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	232-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	232-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	232-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	232-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 30
	fldl	240-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	240-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	240-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	240-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	240-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 31
	fldl	248-128(pB0)	/* st = rB0, rC3, rC1, rC0, rC2 */
#if KB > 32 && defined(ATL_GAS_x8632)
	/*
	 * Last pB0-relative load is done: advance pB0 by KB*8-128 bytes.
	 * NOTE(review): presumably pBE aliases pB0 on this target, so the
	 * later 8*(k-KB)(pBE) loads resolve to the same elements -- confirm.
	 */
	addl	$KB*8-128, pB0
#endif
	fldl	248-128(pA0)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	248-128(pA0,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	248-128(pA0,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	248-128(pA0,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
#if KB > 32 && defined(ATL_GAS_x8632)
	/*
	 * Last pA0-relative access is done: advance pA0 by KB*8-128 bytes.
	 * NOTE(review): presumably pAE aliases pA0 on this target -- confirm.
	 */
	addl	$KB*8-128, pA0
#endif
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if (KB > 32)
   /*
    * From k = 32 on, operands are addressed as 8*(k-KB) bytes relative to
    * pBE / pAE (a negative displacement, since k < KB inside each guard).
    * NOTE(review): the extracted text read "ATL_GAS_x8632ALIGN8"; it is split
    * here on the assumption that ALIGN8 is a separate alignment macro line --
    * confirm against the upstream file.
    */
   #ifdef ATL_GAS_x8632
ALIGN8
   #endif
	fldl	8*(32-KB)(pBE)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	8*(32-KB)(pAE)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	8*(32-KB)(pAE,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	8*(32-KB)(pAE,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	8*(32-KB)(pAE,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 33
	fldl	8*(33-KB)(pBE)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	8*(33-KB)(pAE)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	8*(33-KB)(pAE,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	8*(33-KB)(pAE,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	8*(33-KB)(pAE,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 34
	fldl	8*(34-KB)(pBE)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	8*(34-KB)(pAE)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	8*(34-KB)(pAE,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	8*(34-KB)(pAE,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	8*(34-KB)(pAE,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 35
	fldl	8*(35-KB)(pBE)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	8*(35-KB)(pAE)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	8*(35-KB)(pAE,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	8*(35-KB)(pAE,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	8*(35-KB)(pAE,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 36
	fldl	8*(36-KB)(pBE)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	8*(36-KB)(pAE)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	8*(36-KB)(pAE,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */
	fldl	8*(36-KB)(pAE,lda,2)	/* st = rA2, rB0, rC3, rC1+, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA2*rB0, rB0, rC3, rC1+, rC0+, rC2 */
	faddp	%st, %st(5)	/* st = rB0, rC3, rC1+, rC0+, rC2+ */
	fmull	8*(36-KB)(pAE,lda3)	/* st = rA3*rB0, rC3, rC1+, rC0+, rC2+ */
	faddp	%st, %st(1)	/* st = rC3+, rC1+, rC0+, rC2+ */
#endif
#if KB > 37
	fldl	8*(37-KB)(pBE)	/* st = rB0, rC3, rC1, rC0, rC2 */
	fldl	8*(37-KB)(pAE)	/* st = rA0, rB0, rC3, rC1, rC0, rC2 */
	fmul	%st(1), %st	/* st = rA0*rB0, rB0, rC3, rC1, rC0, rC2 */
	faddp	%st, %st(4)	/* st = rB0, rC3, rC1, rC0+, rC2 */
	fldl	8*(37-KB)(pAE,lda)	/* st = rA1, rB0, rC3, rC1, rC0+, rC2 */
	fmul	%st(1), %st	/* st = rA1*rB0, rB0, rC3, rC1, rC0+, rC2 */
	faddp	%st, %st(3)	/* st = rB0, rC3, rC1+, rC0+, rC2 */

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -