⭐ 欢迎来到虫虫下载站! | 📦 资源下载 📁 资源专辑 ℹ️ 关于我们
⭐ 虫虫下载站

📄 blit_arm_stretch.c

📁 大名鼎鼎的CE下播放软件,TCPPMP的源代码!!!2410下可以流畅的解QVGA的H264,MPEG4等格式.
💻 C
📖 第 1 页 / 共 2 页
字号:
/*****************************************************************************
 *
 * This program is free software ; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
 *
 * $Id: blit_arm_stretch.c 543 2006-01-07 22:06:24Z picard $
 *
 * The Core Pocket Media Player
 * Copyright (c) 2004-2005 Gabor Kovacs
 *
 ****************************************************************************/

// TODO: allow ReUse together with the OnlyDiff condition; optimize IncPtr (change to pre-increment)

#include "../common.h"
#include "../dyncode/dyncode.h"
#include "blit_soft.h"

#if defined(ARM)

// Stack layout of the generated routine, addressed as OFS(stack,field)
// relative to SP. Stretch_RGB_UV lowers SP by OFS(stack,StackFrame) on entry,
// so every field above StackFrame is a local slot of the generated code.
// The field order and sizes define the SP-relative offsets: do not reorder.
typedef struct stack
{
	int InvertMask; // copy of the p->InvertMask constant (stored by Stretch_RGB_UV only when Invert!=0)
	int DiffMask; // copy of the p->DiffMask constant 0xFCFCFCFC (stored only when p->OnlyDiff)
	int PalPtr; // NOTE(review): not written in the visible part of the file
	int EndOfLine; // NOTE(review): not written in the visible part of the file
	int EndOfRect; // Dst plus the extent of the rectangle, computed in Stretch_RGB_UV
	int DstPitch; // DstPitch argument (R3) saved on entry
	int DstNext; // DstPitch - DirX*Width<<DstBPP2, or DstStepX - Width*DstPitch when SwapXY
	int Y; // Src[0] plane pointer saved on entry
	int U; // Src[1] plane pointer saved on entry
	int V; // Src[2] plane pointer saved on entry
	int Pos; // NOTE(review): not used in the visible part of the file
	int SaveR7; //onlydifference && dither
	int SaveR8; //onlydifference && dither

	// NOTE(review): presumably the area filled by CodeBegin() (saved
	// registers); STACKFRAME is defined outside this file - confirm in dyncode.
	int StackFrame[STACKFRAME];

	// Arguments of the generated routine. The first four are listed with
	// their registers and occupy no slot here:
	//void* this   R0
	//char* Dst    R1
	//char* Src    R2
	//int DstPitch R3
	// The remaining ones are read from the stack by Stretch_RGB_UV
	// (presumably pushed by the caller - confirm against the call site).
	int SrcPitch; // loaded into R7
	int Width; // loaded into R4
	int Height; // loaded into R0
	int Src2SrcLast;
} stack;

// palette
// 

// Register usage:
// R0      result RGB
// R1..R3  R,G,B accumulators
// R4..R6  temporaries

// R9   Dst
// R7   U+UVNextRow (when SwapXY)
// R8   V+UVNextRow (when SwapXY)
// R10  U
// R11  V
// R12  Y
// R14  Y+YNextRow (when SwapXY)

// Issues the ADD instructions that advance the source pointer registers.
//
// The primary register set is R12 (Y), R10 (U), R11 (V). When p->SwapXY is
// set and p->Upper equals (p->DirX>0), the "next row" set R14 (Y), R7 (U),
// R8 (V) is advanced instead.
//
//  dY   constant added to the Y register; nothing is issued when zero
//  dUV  constant added to both the U and V registers; nothing is issued when zero
static NOINLINE void Inc_RGB_UV_Pixel(blit_soft* p, int dY, int dUV)
{
	reg RegY = (reg)R12;
	reg RegU = (reg)R10;
	reg RegV = (reg)R11;

	if (p->SwapXY && (p->Upper == (p->DirX>0)))
	{
		// operate on the next-row pointers
		RegY = (reg)R14;
		RegU = (reg)R7;
		RegV = (reg)R8;
	}

	if (dY)
	{
		I2C(ADD,RegY,RegY,dY);
	}

	if (dUV)
	{
		I2C(ADD,RegU,RegU,dUV);
		I2C(ADD,RegV,RegV,dUV);
	}
}

// Issues the loads of one source pixel (Y, V, U bytes) and, for non-palette
// destinations, the multiply-accumulates that add its weighted colour
// contribution to the R,G,B accumulators R1..R3.
//
//  Amount  weight of this pixel; each coefficient is (p->_xxMul >> 8) * Amount.
//          Nothing at all is issued when Amount is 0.
//  dY,dUV  constant operand of the Y load and of the U/V loads
//  IncPtr  non-zero selects LDR_POST instead of LDR for all three loads
//          (requires Amount>0, see the assert)
//
// Palette destinations (p->DstPalette): only the loads are issued, leaving
// Y in R4, U in R5 and V in R6.
// Source registers follow the same primary / next-row selection as
// Inc_RGB_UV_Pixel.
static NOINLINE void Add_RGB_UV_Pixel(blit_soft* p, int Amount, int dY, int dUV, bool_t IncPtr)
{
	int LoadOp;
	reg SrcY,SrcU,SrcV;

	assert(Amount>0 || !IncPtr);

	if (!Amount)
		return;

	LoadOp = IncPtr ? LDR_POST : LDR;

	if (p->SwapXY && (p->Upper == (p->DirX>0)))
	{
		SrcY = (reg)R14;
		SrcV = (reg)R8;
		SrcU = (reg)R7;
	}
	else
	{
		SrcY = (reg)R12;
		SrcV = (reg)R11;
		SrcU = (reg)R10;
	}

	// the luma load comes first for both destination kinds
	Byte(); I2C(LoadOp,R4,SrcY,dY); //y

	if (p->DstPalette)
	{
		Byte(); I2C(LoadOp,R6,SrcV,dUV); //v
		Byte(); I2C(LoadOp,R5,SrcU,dUV); //u
		return;
	}

	// luma contribution to all three channels, interleaved with the V load
	IConst(R5,(p->_YMul >> 8) * Amount);
	Byte(); I2C(LoadOp,R6,SrcV,dUV); //v
	I4(MLA,R1,R5,R4,R1);
	I4(MLA,R2,R5,R4,R2);
	I4(MLA,R3,R5,R4,R3);

	// R4 is free again: reuse it for U
	Byte(); I2C(LoadOp,R4,SrcU,dUV); //u

	// V contribution to G and R
	IConst(R5,(p->_GVMul >> 8) * Amount);
	I4(MLA,R2,R5,R6,R2);
	IConst(R5,(p->_RVMul >> 8) * Amount);
	I4(MLA,R1,R5,R6,R1);

	// U contribution to G and B
	IConst(R5,(p->_GUMul >> 8) * Amount);
	I4(MLA,R2,R5,R4,R2);
	IConst(R5,(p->_BUMul >> 8) * Amount);
	I4(MLA,R3,R5,R4,R3);
}

// Issues the instruction sequence that converts one source pixel (or, with
// ArithStretch, a weighted pair of horizontally adjacent pixels) and merges
// the result into R0.
//
//  p     blit state. p->Pos is read and updated here: it tracks the bit
//        position of the last channel merged into R0.
//        NOTE(review): a negative p->Pos appears to mean "R0 holds nothing
//        yet" - confirm with the code that resets it.
//  Col   destination column; only used with ArithStretch, where
//        Col * p->RScaleX gives the source position with 4 fractional bits
//  dY    constant operand for the Y load (see Add_RGB_UV_Pixel)
//  dUV   constant operand for the U/V loads
//
// Register roles follow the register-usage comment near the top of the file:
// R0 result, R1..R3 accumulators, R4..R6 temporaries.
static NOINLINE void Stretch_RGB_UV_Pixel(blit_soft* p, int Col, int dY, int dUV)
{
	// Bit above which an accumulator counts as overflowed: 32 when the
	// QDADD path is used, 24 when the TST/MVN/MOV clamp below is used.
	int SatBit = p->QAdd ? 32 : 24;
	int RPos = p->DstPos[0];
	int GPos = p->DstPos[1];
	int BPos = p->DstPos[2];

	// Upper pixel of a <=16bpp destination: move all channel positions up by
	// one pixel width (presumably two pixels are packed into one 32-bit word).
	if (p->Upper && p->DstBPP<=16)
	{
		RPos += p->DstBPP;
		GPos += p->DstBPP;
		BPos += p->DstBPP;
	}

	if (!p->DstPalette)
	{
		// Seed the R,G,B accumulators with the additive constants.
		if (p->Dither)
		{
			// Add back what is left in R1..R3 from the previous pixel: the
			// LSR here undoes the LSL applied at the end of this function,
			// so only the bits that were not output are carried over.
			IConst(R4,p->_RAdd);
			IConst(R5,p->_GAdd);
			IConst(R6,p->_BAdd);
			I3S(ADD,R1,R4,R1,LSR,32-SatBit+p->DstSize[0]);
			I3S(ADD,R2,R5,R2,LSR,32-SatBit+p->DstSize[1]);
			I3S(ADD,R3,R6,R3,LSR,32-SatBit+p->DstSize[2]);
		}
		else
		{
			IConst(R1,p->_RAdd);
			IConst(R2,p->_GAdd);
			IConst(R3,p->_BAdd);
		}
	}

	if (p->ArithStretch)
	{
		// Low 4 bits of x are the fractional position between two source
		// pixels; the two weights below always sum to 256.
		int x = Col * p->RScaleX;

		Add_RGB_UV_Pixel(p,16*(16-(x & 15)),dY,dUV,!p->OnlyDiff);

		// When the first load used LDR_POST the pointer registers presumably
		// already moved by dY/dUV, so the neighbour is addressed relative to
		// the new pointer value.
		if (!p->OnlyDiff)
		{
			dY = -dY;
			dUV = -dUV;
		}

		// Neighbour is one luma sample further; chroma advances only when
		// bit 4 of x is set or p->SrcUVX2 is 0.
		++dY;
		if (((x >> 4)&1) || p->SrcUVX2==0) //need UV increment?
			++dUV;

		Add_RGB_UV_Pixel(p,16*(x & 15),dY,dUV,0);
	}
	else
		Add_RGB_UV_Pixel(p,256,dY,dUV,!p->OnlyDiff);

	if (p->DstPalette)
	{
		// Palette output: Add_RGB_UV_Pixel left Y in R4, U in R5, V in R6.
		// A lookup address is formed from R3 plus 4 bits of each component
		// (mask 0x1E0), giving a 4-byte stride per entry.
		// NOTE(review): R3 is presumably the lookup table base (PalPtr) set
		// up by the caller - confirm in Stretch_RGB_UV.
		if (p->Dither)
		{
			// Accumulate the new components onto the running values:
			// Y in R1, U in the low half of R2, V in the high half of R2.
			I3S(ADD,R1,R1,R4,ROR,0);
			I3S(ADD,R2,R2,R5,ROR,0);
			I3S(ADD,R2,R2,R6,ROR,16);

			I2C(AND,R4,R1,0x1E0);
			I2C(AND,R5,R2,0x1E0);
			I2C(AND,R6,R2,0x1E00000);

			I3S(ADD,R0,R3,R4,LSL,5);
			I3S(ADD,R0,R0,R5,LSL,1);
			I3S(ADD,R0,R0,R6,LSR,3+16);

			// Bytes 1..3 of the entry are subtracted from the running values
			// below; byte 0 becomes the result in R0. R0 is loaded last
			// because it is also the base register of the other loads.
			Byte(); I2C(LDR,R4,R0,1);
			Byte(); I2C(LDR,R5,R0,2);
			Byte(); I2C(LDR,R6,R0,3);
			Byte(); I2C(LDR,R0,R0,0);

			I3S(SUB,R1,R1,R4,ROR,0);
			I3S(SUB,R2,R2,R5,ROR,0);
			I3S(SUB,R2,R2,R6,ROR,16);
		}
		else
		{
			I2C(AND,R4,R4,0x1E0);
			I2C(AND,R5,R5,0x1E0);
			I2C(AND,R6,R6,0x1E0);

			I3S(ADD,R0,R3,R4,LSL,5);
			I3S(ADD,R0,R0,R5,LSL,1);
			I3S(ADD,R0,R0,R6,LSR,3);

			Byte(); I2C(LDR,R0,R0,0);
		}
		p->Pos = 0;
	}
	else
	{
		// RGB output: saturate the three accumulators first.
		if (p->QAdd)
		{
			I3(QDADD,R1,R1,R1);
			I3(QDADD,R2,R2,R2);
			I3(QDADD,R3,R3,R3);
		}
		else
		{
			// Manual clamp per channel: if any of the top 8 bits is set the
			// value becomes 0x00FFFFFF (MVN of 0xFF000000), and if the sign
			// bit is set (MI) it becomes 0 instead.
			I2C(TST,NONE,R1,0xFF000000);
			C(NE);I2C(MVN,R1,NONE,0xFF000000);
			C(MI);I2C(MOV,R1,NONE,0x00000000);
			I2C(TST,NONE,R2,0xFF000000);
			C(NE);I2C(MVN,R2,NONE,0xFF000000);
			C(MI);I2C(MOV,R2,NONE,0x00000000);
			I2C(TST,NONE,R3,0xFF000000);
			C(NE);I2C(MVN,R3,NONE,0xFF000000);
			C(MI);I2C(MOV,R3,NONE,0x00000000);
		}

		// With an invert mask and nothing tracked in R0 yet, start from the
		// mask stored on the stack so the channels are EORed onto it.
		if (p->InvertMask && p->Pos<0)
		{
			p->Pos = RPos;
			MB(); I2C(LDR,R0,SP,OFS(stack,InvertMask));
		}
		// Rotate the existing contents of R0 to the red position if needed.
		if (p->Pos!=RPos && p->Pos>=0) I3S(MOV,R0,NONE,R0,ROR,RPos-p->Pos);
		// Merge the top DstSize[] bits of each channel: red is MOVed into R0
		// when no position is tracked and EORed otherwise; green goes through
		// R4; R0 is rotated between steps and ends up at the blue position.
		I3S(p->Pos<0?MOV:EOR,R0,(reg)(p->Pos<0?NONE:R0),R1,LSR,SatBit-p->DstSize[0]);
		I3S(MOV,R4,NONE,R2,LSR,SatBit-p->DstSize[1]);
		I3S(MOV,R0,NONE,R0,ROR,BPos-RPos);
		I3S(EOR,R0,R0,R4,ROR,BPos-GPos);
		I3S(EOR,R0,R0,R3,LSR,SatBit-p->DstSize[2]);
		p->Pos = BPos;

		if (p->Dither)
		{
			// Shift out the bits that were just written, keeping the
			// remainder in the top of R1..R3 for the next pixel (picked up
			// by the LSR at the start of this function).
			MB(); I3S(MOV,R1,NONE,R1,LSL,32-SatBit+p->DstSize[0]);
			MB(); I3S(MOV,R2,NONE,R2,LSL,32-SatBit+p->DstSize[1]);
			MB(); I3S(MOV,R3,NONE,R3,LSL,32-SatBit+p->DstSize[2]);
		}
	}
}

void Stretch_RGB_UV(blit_soft* p)
{
	bool_t Special;
	dyninst* LoopX;
	dyninst* LoopY;
	dyninst* EndOfLine;
	int i,Col,ColCount,RowStep;
	int Mask = 0;
	int Invert = 0;
	bool_t ReUse;
	bool_t NoInc;
	bool_t RegDirty; //R4,R5

	p->Dither = (boolmem_t)((p->DstBPP<=16) && (p->FX.Flags & BLITFX_DITHER)!=0);
	p->DstStepX = p->DirX * ((p->DstBPP*2) >> 3);
	p->PalPtr = NULL;
	p->DiffMask = NULL;
	p->InvertMask = NULL;

	if (p->Dst.Flags & PF_INVERTED)
		Invert = -1;

	CodeBegin();
	I2C(SUB,SP,SP,OFS(stack,StackFrame));

	I2C(LDR,R9,R1,0);  //Dst[0] RGB
	I2C(LDR,R10,R2,4); //Src[1] U
	I2C(LDR,R11,R2,8); //Src[2] V
	I2C(LDR,R12,R2,0); //Src[0] Y

	I2C(STR,R10,SP,OFS(stack,U));
	I2C(STR,R11,SP,OFS(stack,V));
	I2C(STR,R12,SP,OFS(stack,Y));

	ReUse = p->RScaleX<16 && !Invert && !p->OnlyDiff && (!p->OnlyDiff || !p->SwapXY) && (!p->DstPalette || !p->SwapXY) && !p->ArithStretch; //R0 is saved in loop and not ArithStretch

	if (p->QAdd && ReUse && !p->SwapXY)
	{
		p->QAdd = 0; // invert not supported with ReUse
		CalcColor(p);
	}

	if (p->QAdd)
	{
		int Mask2,Shift,i;

		for (i=0;i<3;++i)
			Mask |= 1 << (p->DstPos[i] + p->DstSize[i] - 1);

		Mask2 = Mask;
		Shift = 0;
		if (p->DstBPP <= 16)
		{
			if (p->DirX<0) Shift = p->DstBPP;
			Mask2 |= Mask << p->DstBPP;
		}

		Invert ^= RotateRight(Mask2,Shift+p->DstPos[0]);
	}

	if (Invert)
	{
		p->InvertMask = InstCreate32(Invert,NONE,NONE,NONE,0,0);
		MB(); I1P(LDR,R5,p->InvertMask,0);
		I2C(STR,R5,SP,OFS(stack,InvertMask));
	}

	if (p->OnlyDiff)
	{
		p->DiffMask = InstCreate32(0xFCFCFCFC,NONE,NONE,NONE,0,0);
		MB(); I1P(LDR,R4,p->DiffMask,0);
		I2C(STR,R4,SP,OFS(stack,DiffMask));
	}

	I2C(STR,R3,SP,OFS(stack,DstPitch));

	I3(MOV,R6,NONE,R3); //DstPitch
	I2C(LDR,R7,SP,OFS(stack,SrcPitch));
	I2C(LDR,R0,SP,OFS(stack,Height));
	I2C(LDR,R4,SP,OFS(stack,Width));

	if (p->DirX<0 && p->DstBPP==16) //adjust reversed destination for block size
		I2C(SUB,R9,R9,-p->DstStepX-(p->DstBPP >> 3));
	if ((p->DstPalette || p->DstBPP==32) && p->SwapXY)
		I2C(ADD,R9,R9,p->DstStepX/2);

	if (p->SwapXY)
	{
		I2C(MOV,R1,NONE,p->DstBPP * p->DirX);
		I3(MUL,R0,R1,R0);
		I3S(ADD,R0,R9,R0,ASR,3);
		I2C(STR,R0,SP,OFS(stack,EndOfRect));

		//DstNext = DstStepX - Width*DstPitch;
		MB(); I3(MUL,R2,R6,R4);
		I2C(MOV,R0,NONE,p->DstStepX);
		I3(SUB,R0,R0,R2); 
		I2C(STR,R0,SP,OFS(stack,DstNext));
	}
	else
	{
		I3(MUL,R0,R6,R0); //DstPitch * Height
		I3(ADD,R0,R9,R0);
		I2C(STR,R0,SP,OFS(stack,EndOfRect));

		//DstNext = DstPitch - DirX * Width << DstBPP2;
		I3S(p->DirX>0?SUB:ADD,R2,R6,R4,LSL,p->DstBPP2); 
		I2C(STR,R2,SP,OFS(stack,DstNext));
	}

	if (p->Dst.Flags & PF_PALETTE)
	{

⌨️ 快捷键说明

复制代码 Ctrl + C
搜索代码 Ctrl + F
全屏模式 F11
切换主题 Ctrl + Shift + D
显示快捷键 ?
增大字号 Ctrl + =
减小字号 Ctrl + -