📄 mc_mmx.asm
字号:
mov ebx, [esp+20+16]
mov ecx, [esp+20+20]
;-------------------------------------------------------------------
;儖乕僾僷儔儊乕僞嶌惉
pxor mm7, mm7
;-------------------------------------------------------------------
; loop
prediction_w16_ff_2nd_loop:
dec ecx
;-------------------------------------------------------------------
; core
movd mm0, [esi]
movd mm1, [esi+4]
movd mm2, [esi+8]
movd mm3, [esi+12]
movd mm4, [edi]
movd mm5, [edi+4]
punpcklbw mm0, mm7
punpcklbw mm1, mm7
punpcklbw mm2, mm7
punpcklbw mm3, mm7
punpcklbw mm4, mm7
punpcklbw mm5, mm7
paddw mm0, mm4
paddw mm1, mm5
paddw mm0, adjust_1
paddw mm1, adjust_1
psrlw mm0, 1
psrlw mm1, 1
packuswb mm0, mm1
movq [edi], mm0
movd mm4, [edi+8]
movd mm5, [edi+12]
punpcklbw mm4, mm7
punpcklbw mm5, mm7
paddw mm2, mm4
paddw mm3, mm5
paddw mm2, adjust_1
paddw mm3, adjust_1
psrlw mm2, 1
psrlw mm3, 1
packuswb mm2, mm3
movq [edi+8], mm2
lea esi, [esi+eax]
lea edi, [edi+ebx]
;-------------------------------------------------------------------
; 儖乕僾廔抂僠僃僢僋
test ecx, ecx
jnz prediction_w16_ff_2nd_loop
;-------------------------------------------------------------------
; 儗僕僗僞暅尦側偳屻巒枛
pop eax
pop ebx
pop ecx
pop edi
pop esi
ret 20
_prediction_w16_ff_2nd_mmx@20 ENDP
;-------------------------------------------------------------------
; End
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
; Motion compensation (width 8, Half/Half, 1st)
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
; Basic approach
; 4-way parallel computation at 16-bit precision
;
;-------------------------------------------------------------------
PUBLIC C _prediction_w8_hh_1st_mmx@20
;-------------------------------------------------------------------
; void __stdcall prediction_w8_hh_1st_mmx(
;   [esp+ 4] unsigned char *in,
;   [esp+ 8] unsigned char *out,
;   [esp+12] int in_step,
;   [esp+16] int out_step,
;   [esp+20] int height
; )
;
; Width-8, half/half-pel prediction (first pass: the result simply
; overwrites the destination).  For x = 0..7 each output byte is
;   out[y][x] = (in[y][x] + in[y][x+1] + in[y+1][x] + in[y+1][x+1]
;                + adjust_2) >> 2
; computed as four 16-bit lanes at a time.
; NOTE(review): adjust_2 is defined outside this block; presumably
; four words of 2 (round-to-nearest) - confirm at its definition.
;
; Rows are handled two per loop iteration (height is halved with
; shr), so an odd height produces height-1 output rows.  One input
; row is loaded before the loop and two more per iteration.  Each
; row load fetches 12 bytes ([in], [in+4], [in+8]) although only
; bytes 0..8 contribute to the result.
;
; If height < 2 the procedure now returns without touching memory
; or MMX state; previously the loop counter wrapped around to
; 0FFFFFFFFh and the loop ran far past the end of both buffers.
;
; All general-purpose registers used are saved and restored.
; mm0-mm7 are overwritten and no EMMS is executed here.
;-------------------------------------------------------------------
_prediction_w8_hh_1st_mmx@20 PROC
;-------------------------------------------------------------------
; Registers used
;   esi - input pointer
;   edi - output pointer
;   ecx - loop counter (row pairs remaining)
;   eax - input step
;   ebx - output step
;-------------------------------------------------------------------
; Local variables used
;   none
;-------------------------------------------------------------------
; Fixed-purpose MMX registers
;   mm7 - 0
;-------------------------------------------------------------------
; Save registers
        push    esi
        push    edi
        push    ecx
        push    ebx
        push    eax
;-------------------------------------------------------------------
; Fetch the arguments (the 5 pushes above account for the +20)
        mov     esi, [esp+20+ 4]
        mov     edi, [esp+20+ 8]
        mov     eax, [esp+20+12]
        mov     ebx, [esp+20+16]
        mov     ecx, [esp+20+20]
;-------------------------------------------------------------------
; Preparation
        shr     ecx, 1                          ; ecx = number of row pairs
        jz      prediction_w8_hh_1st_end        ; height < 2: nothing to do
        pxor    mm7, mm7
        movd    mm0, [esi]                      ; row bytes 0..3
        movd    mm1, [esi+4]                    ; row bytes 4..7
        movd    mm2, [esi+8]                    ; row bytes 8..11
        psllq   mm2, 32
        por     mm2, mm1
        psrlq   mm2, 8                          ; mm2 = packed bytes 5..11
        psllq   mm1, 32
        por     mm1, mm0
        psrlq   mm1, 8                          ; mm1 = packed bytes 1..7
        punpcklbw mm0, mm7                      ; mm0 = words 0..3
        punpcklbw mm2, mm7                      ; mm2 = words 5..8
        lea     esi, [esi+eax]
; Loop-entry state for the row just loaded ("previous" row):
;   mm0, 00030002_00010000   (bytes 0..3 as words)
;   mm1, 00070605_04030201   (bytes 1..7 packed)
;   mm2, 00080007_00060005   (bytes 5..8 as words)
;-------------------------------------------------------------------
; loop
prediction_w8_hh_1st_loop:
;-------------------------------------------------------------------
; core, first row of the pair: previous row in mm0/mm1/mm2,
; current row loaded into mm3/mm4/mm5 with the same layout
        movd    mm3, [esi]
        movd    mm4, [esi+4]
        movd    mm5, [esi+8]
        psllq   mm5, 32
        por     mm5, mm4
        psrlq   mm5, 8                          ; mm5 = cur bytes 5..11
        psllq   mm4, 32
        por     mm4, mm3
        psrlq   mm4, 8                          ; mm4 = cur bytes 1..7
        movq    mm6, mm1
        punpcklbw mm3, mm7                      ; mm3 = cur words 0..3
        punpcklbw mm5, mm7                      ; mm5 = cur words 5..8
        punpcklbw mm6, mm7                      ; mm6 = prev words 1..4
        paddw   mm0, mm3
        paddw   mm0, mm6
        movq    mm6, mm4
        punpcklbw mm6, mm7                      ; mm6 = cur words 1..4
        paddw   mm0, mm6
        paddw   mm0, adjust_2
        psrlw   mm0, 2                          ; output pixels 0..3
        movq    mm6, mm4
        psrlq   mm1, 24                         ; prev bytes 4..7
        psrlq   mm6, 24                         ; cur bytes 4..7
        punpcklbw mm1, mm7
        punpcklbw mm6, mm7
        paddw   mm1, mm2
        paddw   mm1, mm5
        paddw   mm1, mm6
        paddw   mm1, adjust_2
        psrlw   mm1, 2                          ; output pixels 4..7
        packuswb mm0, mm1
        movq    [edi], mm0
        lea     edi, [edi+ebx]
        lea     esi, [esi+eax]
; second row of the pair: roles swapped - the row in mm3/mm4/mm5 is
; now the upper row and the next row is loaded into mm0/mm1/mm2,
; which also re-establishes the loop-entry state
        movd    mm0, [esi]
        movd    mm1, [esi+4]
        movd    mm2, [esi+8]
        psllq   mm2, 32
        por     mm2, mm1
        psrlq   mm2, 8
        psllq   mm1, 32
        por     mm1, mm0
        psrlq   mm1, 8
        movq    mm6, mm4
        punpcklbw mm0, mm7
        punpcklbw mm2, mm7
        punpcklbw mm6, mm7
        paddw   mm3, mm0
        paddw   mm3, mm6
        movq    mm6, mm1
        punpcklbw mm6, mm7
        paddw   mm3, mm6
        paddw   mm3, adjust_2
        psrlw   mm3, 2                          ; output pixels 0..3
        movq    mm6, mm1
        psrlq   mm4, 24
        psrlq   mm6, 24
        punpcklbw mm4, mm7
        punpcklbw mm6, mm7
        paddw   mm4, mm2
        paddw   mm4, mm5
        paddw   mm4, mm6
        paddw   mm4, adjust_2
        psrlw   mm4, 2                          ; output pixels 4..7
        packuswb mm3, mm4
        movq    [edi], mm3
        lea     edi, [edi+ebx]
        lea     esi, [esi+eax]
;-------------------------------------------------------------------
; Loop termination check (lea and the MMX ops above leave the flags
; alone, so dec's ZF feeds jnz directly)
        dec     ecx
        jnz     prediction_w8_hh_1st_loop
;-------------------------------------------------------------------
; Restore registers and clean up
prediction_w8_hh_1st_end:
        pop     eax
        pop     ebx
        pop     ecx
        pop     edi
        pop     esi
        ret     20                              ; stdcall: drop 5 dword args
_prediction_w8_hh_1st_mmx@20 ENDP
;-------------------------------------------------------------------
; End
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
; Motion compensation (width 8, Half/Half, 2nd)
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
; Basic approach
; 4-way parallel computation at 16-bit precision
;
;-------------------------------------------------------------------
PUBLIC C _prediction_w8_hh_2nd_mmx@20
;-------------------------------------------------------------------
; void __stdcall prediction_w8_hh_2nd_mmx(
;   [esp+ 4] unsigned char *in,
;   [esp+ 8] unsigned char *out,
;   [esp+12] int in_step,
;   [esp+16] int out_step,
;   [esp+20] int height
; )
;
; Width-8, half/half-pel prediction (second pass: the interpolated
; value is averaged with the bytes already stored at out).  For
; x = 0..7:
;   s         = in[y][x] + in[y][x+1] + in[y+1][x] + in[y+1][x+1]
;   out[y][x] = (((s + adjust_6) >> 2) + out[y][x]) >> 1
; computed as four 16-bit lanes at a time.
; NOTE(review): adjust_6 is defined outside this block; presumably
; four words of 6, i.e. the +2 rounding of the 4-tap average plus
; 4 (= +1 after the >>2) to round the final >>1 - confirm at its
; definition.
;
; Rows are handled two per loop iteration (height is halved with
; shr), so an odd height produces height-1 output rows.  One input
; row is loaded before the loop and two more per iteration.  Each
; row load fetches 12 bytes ([in], [in+4], [in+8]) although only
; bytes 0..8 contribute to the result.
;
; If height < 2 the procedure now returns without touching memory
; or MMX state; previously the loop counter wrapped around to
; 0FFFFFFFFh and the loop ran far past the end of both buffers.
;
; All general-purpose registers used are saved and restored.
; mm0-mm7 are overwritten and no EMMS is executed here.
;-------------------------------------------------------------------
_prediction_w8_hh_2nd_mmx@20 PROC
;-------------------------------------------------------------------
; Registers used
;   esi - input pointer
;   edi - output pointer
;   ecx - loop counter (row pairs remaining)
;   eax - input step
;   ebx - output step
;-------------------------------------------------------------------
; Local variables used
;   none
;-------------------------------------------------------------------
; Fixed-purpose MMX registers
;   mm7 - 0
;-------------------------------------------------------------------
; Save registers
        push    esi
        push    edi
        push    ecx
        push    ebx
        push    eax
;-------------------------------------------------------------------
; Fetch the arguments (the 5 pushes above account for the +20)
        mov     esi, [esp+20+ 4]
        mov     edi, [esp+20+ 8]
        mov     eax, [esp+20+12]
        mov     ebx, [esp+20+16]
        mov     ecx, [esp+20+20]
;-------------------------------------------------------------------
; Preparation
        shr     ecx, 1                          ; ecx = number of row pairs
        jz      prediction_w8_hh_2nd_end        ; height < 2: nothing to do
        pxor    mm7, mm7
        movd    mm0, [esi]                      ; row bytes 0..3
        movd    mm1, [esi+4]                    ; row bytes 4..7
        movd    mm2, [esi+8]                    ; row bytes 8..11
        psllq   mm2, 32
        por     mm2, mm1
        psrlq   mm2, 8                          ; mm2 = packed bytes 5..11
        psllq   mm1, 32
        por     mm1, mm0
        psrlq   mm1, 8                          ; mm1 = packed bytes 1..7
        punpcklbw mm0, mm7                      ; mm0 = words 0..3
        punpcklbw mm2, mm7                      ; mm2 = words 5..8
        lea     esi, [esi+eax]
; Loop-entry state for the row just loaded ("previous" row):
;   mm0 = bytes 0..3 as words
;   mm1 = bytes 1..7 packed
;   mm2 = bytes 5..8 as words
;-------------------------------------------------------------------
; loop
prediction_w8_hh_2nd_loop:
;-------------------------------------------------------------------
; core, first row of the pair: previous row in mm0/mm1/mm2,
; current row loaded into mm3/mm4/mm5 with the same layout
        movd    mm3, [esi]
        movd    mm4, [esi+4]
        movd    mm5, [esi+8]
        psllq   mm5, 32
        por     mm5, mm4
        psrlq   mm5, 8                          ; mm5 = cur bytes 5..11
        psllq   mm4, 32
        por     mm4, mm3
        psrlq   mm4, 8                          ; mm4 = cur bytes 1..7
        movq    mm6, mm1
        punpcklbw mm3, mm7                      ; mm3 = cur words 0..3
        punpcklbw mm5, mm7                      ; mm5 = cur words 5..8
        punpcklbw mm6, mm7                      ; mm6 = prev words 1..4
        paddw   mm0, mm3
        paddw   mm0, mm6
        movq    mm6, mm4
        punpcklbw mm6, mm7                      ; mm6 = cur words 1..4
        paddw   mm0, mm6
        paddw   mm0, adjust_6
        psrlw   mm0, 2
        movd    mm6, [edi]                      ; existing output bytes 0..3
        punpcklbw mm6, mm7
        paddw   mm0, mm6
        psrlw   mm0, 1                          ; output pixels 0..3
        movq    mm6, mm4
        psrlq   mm1, 24                         ; prev bytes 4..7
        psrlq   mm6, 24                         ; cur bytes 4..7
        punpcklbw mm1, mm7
        punpcklbw mm6, mm7
        paddw   mm1, mm2
        paddw   mm1, mm5
        paddw   mm1, mm6
        paddw   mm1, adjust_6
        psrlw   mm1, 2
        movd    mm6, [edi+4]                    ; existing output bytes 4..7
        punpcklbw mm6, mm7
        paddw   mm1, mm6
        psrlw   mm1, 1                          ; output pixels 4..7
        packuswb mm0, mm1
        movq    [edi], mm0
        lea     edi, [edi+ebx]
        lea     esi, [esi+eax]
; second row of the pair: roles swapped - the row in mm3/mm4/mm5 is
; now the upper row and the next row is loaded into mm0/mm1/mm2,
; which also re-establishes the loop-entry state
        movd    mm0, [esi]
        movd    mm1, [esi+4]
        movd    mm2, [esi+8]
        psllq   mm2, 32
        por     mm2, mm1
        psrlq   mm2, 8
        psllq   mm1, 32
        por     mm1, mm0
        psrlq   mm1, 8
        movq    mm6, mm4
        punpcklbw mm0, mm7
        punpcklbw mm2, mm7
        punpcklbw mm6, mm7
        paddw   mm3, mm0
        paddw   mm3, mm6
        movq    mm6, mm1
        punpcklbw mm6, mm7
        paddw   mm3, mm6
        paddw   mm3, adjust_6
        psrlw   mm3, 2
        movd    mm6, [edi]                      ; existing output bytes 0..3
        punpcklbw mm6, mm7
        paddw   mm3, mm6
        psrlw   mm3, 1                          ; output pixels 0..3
        movq    mm6, mm1
        psrlq   mm4, 24
        psrlq   mm6, 24
        punpcklbw mm4, mm7
        punpcklbw mm6, mm7
        paddw   mm4, mm2
        paddw   mm4, mm5
        paddw   mm4, mm6
        paddw   mm4, adjust_6
        psrlw   mm4, 2
        movd    mm6, [edi+4]                    ; existing output bytes 4..7
        punpcklbw mm6, mm7
        paddw   mm4, mm6
        psrlw   mm4, 1                          ; output pixels 4..7
        packuswb mm3, mm4
        movq    [edi], mm3
        lea     edi, [edi+ebx]
        lea     esi, [esi+eax]
;-------------------------------------------------------------------
; Loop termination check (lea and the MMX ops above leave the flags
; alone, so dec's ZF feeds jnz directly)
        dec     ecx
        jnz     prediction_w8_hh_2nd_loop
;-------------------------------------------------------------------
; Restore registers and clean up
prediction_w8_hh_2nd_end:
        pop     eax
        pop     ebx
        pop     ecx
        pop     edi
        pop     esi
        ret     20                              ; stdcall: drop 5 dword args
_prediction_w8_hh_2nd_mmx@20 ENDP
;-------------------------------------------------------------------
; End
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
; Motion compensation (width 8, Full/Half, 1st) horizontal Full, vertical Half
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
; Basic approach
; 4-way parallel computation at 16-bit precision
;
;-------------------------------------------------------------------
PUBLIC C _prediction_w8_fh_1st_mmx@20
; void __stdcall prediction_w8_fh_1st_mmx(
; [esp+ 4] unsigned char *in,
; [esp+ 8] unsigned char *out,
; [esp+12] int in_step,
; [esp+16] int out_step,
; [esp+20] int height
; )
_prediction_w8_fh_1st_mmx@20 PROC
;-------------------------------------------------------------------
; 巊梡偡傞儗僕僗僞
; esi - 擖椡
; edi - 弌椡
; ecx - 儖乕僾僇僂儞僞
; eax - 擖椡僗僥僢僾
; ebx - 弌椡僗僥僢僾
;-------------------------------------------------------------------
; 巊梡偡傞儘乕僇儖曄悢
; 側偟
;-------------------------------------------------------------------
; 梡搑屌掕 MMX 儗僕僗僞
; mm7 - 0
;-------------------------------------------------------------------
; 儗僕僗僞偺戅旔
push esi
push edi
push ecx
push ebx
push eax
;-------------------------------------------------------------------
; 堷悢偐傜僨乕僞傪庴偗庢偭偰偍偔
mov esi, [esp+20+ 4]
mov edi, [esp+20+ 8]
mov eax, [esp+20+12]
mov ebx, [esp+20+16]
mov ecx, [esp+20+20]
;-------------------------------------------------------------------
; 壓弨旛
shr ecx, 1
pxor mm7, mm7
movd mm0, [esi]
movd mm1, [esi+4]
punpcklbw mm0, mm7
punpcklbw mm1, mm7
lea esi, [esi+eax]
;-------------------------------------------------------------------
; loop
prediction_w8_fh_1st_loop:
dec ecx
;-------------------------------------------------------------------
; core
movd mm2, [esi]
movd mm3, [esi+4]
punpcklbw mm2, mm7
punpcklbw mm3, mm7
paddw mm0, mm2
paddw mm1, mm3
paddw mm0, adjust_1
paddw mm1, adjust_1
psrlw mm0, 1
psrlw mm1, 1
packuswb mm0, mm1
movq [edi], mm0
lea edi, [edi+ebx]
lea esi, [esi+eax]
movd mm0, [esi]
movd mm1, [esi+4]
punpcklbw mm0, mm7
punpcklbw mm1, mm7
paddw mm2, mm0
paddw mm3, mm1
paddw mm2, adjust_1
paddw mm3, adjust_1
psrlw mm2, 1
psrlw mm3, 1
packuswb mm2, mm3
movq [edi], mm2
lea edi, [edi+ebx]
lea esi, [esi+eax]
;-------------------------------------------------------------------
; 儖乕僾廔抂僠僃僢僋
test ecx, ecx
jnz prediction_w8_fh_1st_loop
;-------------------------------------------------------------------
; 儗僕僗僞暅尦側偳屻巒枛
pop eax
pop ebx
pop ecx
pop edi
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -