97 lines
2.4 KiB
C++
97 lines
2.4 KiB
C++
|
// Copyright (c) 2017- PPSSPP Project.
|
||
|
|
||
|
// This program is free software: you can redistribute it and/or modify
|
||
|
// it under the terms of the GNU General Public License as published by
|
||
|
// the Free Software Foundation, version 2.0 or later versions.
|
||
|
|
||
|
// This program is distributed in the hope that it will be useful,
|
||
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
// GNU General Public License 2.0 for more details.
|
||
|
|
||
|
// A copy of the GPL 2.0 should have been included with the program.
|
||
|
// If not, see http://www.gnu.org/licenses/
|
||
|
|
||
|
// Official git repository and contact information can be found at
|
||
|
// https://github.com/hrydgard/ppsspp and http://www.ppsspp.org/.
|
||
|
|
||
|
#include "ppsspp_config.h"
|
||
|
#if PPSSPP_ARCH(X86) || PPSSPP_ARCH(AMD64)
|
||
|
|
||
|
#include <emmintrin.h>
|
||
|
#include "Common/x64Emitter.h"
|
||
|
#include "GPU/Software/Sampler.h"
|
||
|
#include "GPU/ge_constants.h"
|
||
|
|
||
|
using namespace Gen;
|
||
|
|
||
|
namespace Sampler {
|
||
|
|
||
|
#ifdef _WIN32
|
||
|
static const X64Reg resultReg = RAX;
|
||
|
static const X64Reg tempReg1 = R10;
|
||
|
static const X64Reg tempReg2 = R11;
|
||
|
static const X64Reg uReg = RCX;
|
||
|
static const X64Reg vReg = RDX;
|
||
|
static const X64Reg srcReg = R8;
|
||
|
static const X64Reg bufwReg = R9;
|
||
|
// TODO: levelReg on stack
|
||
|
#else
|
||
|
static const X64Reg resultReg = RAX;
|
||
|
static const X64Reg tempReg1 = R9;
|
||
|
static const X64Reg tempReg2 = R10;
|
||
|
static const X64Reg uReg = RDI;
|
||
|
static const X64Reg vReg = RSI
|
||
|
static const X64Reg srcReg = RDX;
|
||
|
static const X64Reg bufwReg = RCX;
|
||
|
static const X64Reg levelReg = R8;
|
||
|
#endif
|
||
|
|
||
|
NearestFunc SamplerJitCache::Compile(const SamplerID &id) {
|
||
|
BeginWrite();
|
||
|
const u8 *start = this->AlignCode16();
|
||
|
|
||
|
SUB(PTRBITS, R(ESP), Imm8(64));
|
||
|
MOVUPS(MDisp(ESP, 0), XMM4);
|
||
|
MOVUPS(MDisp(ESP, 16), XMM5);
|
||
|
MOVUPS(MDisp(ESP, 32), XMM6);
|
||
|
MOVUPS(MDisp(ESP, 48), XMM7);
|
||
|
|
||
|
// Early exit on !srcPtr.
|
||
|
CMP(PTRBITS, R(srcReg), Imm32(0));
|
||
|
FixupBranch nonZeroSrc = J_CC(CC_NZ);
|
||
|
XOR(32, R(RAX), R(RAX));
|
||
|
FixupBranch zeroSrc = J(true);
|
||
|
SetJumpTarget(nonZeroSrc);
|
||
|
|
||
|
GETextureFormat fmt = (GETextureFormat)id.texfmt;
|
||
|
bool success = true;
|
||
|
switch (fmt) {
|
||
|
default:
|
||
|
success = false;
|
||
|
}
|
||
|
|
||
|
if (!success) {
|
||
|
EndWrite();
|
||
|
SetCodePtr(const_cast<u8 *>(start));
|
||
|
return nullptr;
|
||
|
}
|
||
|
|
||
|
SetJumpTarget(zeroSrc);
|
||
|
|
||
|
MOVUPS(XMM4, MDisp(ESP, 0));
|
||
|
MOVUPS(XMM5, MDisp(ESP, 16));
|
||
|
MOVUPS(XMM6, MDisp(ESP, 32));
|
||
|
MOVUPS(XMM7, MDisp(ESP, 48));
|
||
|
ADD(PTRBITS, R(ESP), Imm8(64));
|
||
|
|
||
|
RET();
|
||
|
|
||
|
EndWrite();
|
||
|
return (NearestFunc)start;
|
||
|
}
|
||
|
|
||
|
};
|
||
|
|
||
|
#endif
|