mirror of
https://github.com/libretro/ppsspp.git
synced 2024-11-25 01:00:01 +00:00
dc09875eca
It's pretty much all done the same way. Note that normals have always been a little inconsistent between 127/128 and 32767/32768. But it's probably not causing a major impact...
273 lines
6.2 KiB
C++
273 lines
6.2 KiB
C++
// Copyright (c) 2012- PPSSPP Project.
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU General Public License as published by
|
|
// the Free Software Foundation, version 2.0 or later versions.
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU General Public License 2.0 for more details.
|
|
|
|
// A copy of the GPL 2.0 should have been included with the program.
|
|
// If not, see http://www.gnu.org/licenses/
|
|
|
|
// Official git repository and contact information can be found at
|
|
// https://github.com/hrydgard/ppsspp and http://www.ppsspp.org/.
|
|
|
|
#pragma once
|
|
|
|
#include "base/basictypes.h"
|
|
|
|
#ifdef ARM
|
|
#include "Common/ArmEmitter.h"
|
|
#else
|
|
#include "Common/x64Emitter.h"
|
|
#endif
|
|
|
|
#include "Globals.h"
|
|
#include "GPU/Common/VertexDecoderCommon.h"
|
|
|
|
class VertexDecoder;
|
|
class VertexDecoderJitCache;
|
|
|
|
typedef void (VertexDecoder::*StepFunction)() const;
|
|
typedef void (VertexDecoderJitCache::*JitStepFunction)();
|
|
|
|
struct JitLookup {
|
|
StepFunction func;
|
|
JitStepFunction jitFunc;
|
|
};
|
|
|
|
typedef void (*JittedVertexDecoder)(const u8 *src, u8 *dst, int count);
|
|
|
|
// Right now
|
|
// - compiles into list of called functions
|
|
// Future TODO
|
|
// - will compile into lighting fast specialized x86 and ARM
|
|
class VertexDecoder
|
|
{
|
|
public:
|
|
VertexDecoder();
|
|
|
|
// A jit cache is not mandatory, we don't use it in the sw renderer
|
|
void SetVertexType(u32 vtype, VertexDecoderJitCache *jitCache = 0);
|
|
|
|
u32 VertexType() const { return fmt_; }
|
|
|
|
const DecVtxFormat &GetDecVtxFmt() { return decFmt; }
|
|
|
|
void DecodeVerts(u8 *decoded, const void *verts, int indexLowerBound, int indexUpperBound) const;
|
|
|
|
bool hasColor() const { return col != 0; }
|
|
bool hasTexcoord() const { return tc != 0; }
|
|
int VertexSize() const { return size; } // PSP format size
|
|
|
|
void Step_WeightsU8() const;
|
|
void Step_WeightsU16() const;
|
|
void Step_WeightsFloat() const;
|
|
|
|
void Step_WeightsU8Skin() const;
|
|
void Step_WeightsU16Skin() const;
|
|
void Step_WeightsFloatSkin() const;
|
|
|
|
void Step_TcU8() const;
|
|
void Step_TcU16() const;
|
|
void Step_TcFloat() const;
|
|
|
|
void Step_TcU8Prescale() const;
|
|
void Step_TcU16Prescale() const;
|
|
void Step_TcFloatPrescale() const;
|
|
|
|
void Step_TcU16Double() const;
|
|
void Step_TcU16Through() const;
|
|
void Step_TcU16ThroughDouble() const;
|
|
void Step_TcFloatThrough() const;
|
|
|
|
void Step_Color4444() const;
|
|
void Step_Color565() const;
|
|
void Step_Color5551() const;
|
|
void Step_Color8888() const;
|
|
|
|
void Step_Color4444Morph() const;
|
|
void Step_Color565Morph() const;
|
|
void Step_Color5551Morph() const;
|
|
void Step_Color8888Morph() const;
|
|
|
|
void Step_NormalS8() const;
|
|
void Step_NormalS16() const;
|
|
void Step_NormalFloat() const;
|
|
|
|
void Step_NormalS8Skin() const;
|
|
void Step_NormalS16Skin() const;
|
|
void Step_NormalFloatSkin() const;
|
|
|
|
void Step_NormalS8Morph() const;
|
|
void Step_NormalS16Morph() const;
|
|
void Step_NormalFloatMorph() const;
|
|
|
|
void Step_PosS8() const;
|
|
void Step_PosS16() const;
|
|
void Step_PosFloat() const;
|
|
|
|
void Step_PosS8Skin() const;
|
|
void Step_PosS16Skin() const;
|
|
void Step_PosFloatSkin() const;
|
|
|
|
void Step_PosS8Morph() const;
|
|
void Step_PosS16Morph() const;
|
|
void Step_PosFloatMorph() const;
|
|
|
|
void Step_PosS8Through() const;
|
|
void Step_PosS16Through() const;
|
|
void Step_PosFloatThrough() const;
|
|
|
|
void ResetStats() {
|
|
memset(stats_, 0, sizeof(stats_));
|
|
}
|
|
|
|
void IncrementStat(int stat, int amount) {
|
|
stats_[stat] += amount;
|
|
}
|
|
|
|
// output must be big for safety.
|
|
// Returns number of chars written.
|
|
// Ugly for speed.
|
|
int ToString(char *output) const;
|
|
|
|
// Mutable decoder state
|
|
mutable u8 *decoded_;
|
|
mutable const u8 *ptr_;
|
|
|
|
// "Immutable" state, set at startup
|
|
|
|
// The decoding steps
|
|
StepFunction steps_[5];
|
|
int numSteps_;
|
|
|
|
u32 fmt_;
|
|
DecVtxFormat decFmt;
|
|
|
|
bool throughmode;
|
|
int biggest;
|
|
int size;
|
|
int onesize_;
|
|
|
|
int weightoff;
|
|
int tcoff;
|
|
int coloff;
|
|
int nrmoff;
|
|
int posoff;
|
|
|
|
int tc;
|
|
int col;
|
|
int nrm;
|
|
int pos;
|
|
int weighttype;
|
|
int idx;
|
|
int morphcount;
|
|
int nweights;
|
|
|
|
int stats_[NUM_VERTEX_DECODER_STATS];
|
|
|
|
JittedVertexDecoder jitted_;
|
|
|
|
friend class VertexDecoderJitCache;
|
|
};
|
|
|
|
|
|
// A compiled vertex decoder takes the following arguments (C calling convention):
|
|
// u8 *src, u8 *dst, int count
|
|
//
|
|
// x86:
|
|
// src is placed in esi and dst in edi
|
|
// for every vertex, we step esi and edi forwards by the two vertex sizes
|
|
// all movs are done relative to esi and edi
|
|
//
|
|
// that's it!
|
|
|
|
|
|
#ifdef ARM
|
|
class VertexDecoderJitCache : public ArmGen::ARMXCodeBlock {
|
|
#else
|
|
class VertexDecoderJitCache : public Gen::XCodeBlock {
|
|
#endif
|
|
public:
|
|
VertexDecoderJitCache();
|
|
|
|
// Returns a pointer to the code to run.
|
|
JittedVertexDecoder Compile(const VertexDecoder &dec);
|
|
void Clear();
|
|
|
|
void Jit_WeightsU8();
|
|
void Jit_WeightsU16();
|
|
void Jit_WeightsFloat();
|
|
|
|
void Jit_WeightsU8Skin();
|
|
void Jit_WeightsU16Skin();
|
|
void Jit_WeightsFloatSkin();
|
|
|
|
void Jit_TcU8();
|
|
void Jit_TcU16();
|
|
void Jit_TcFloat();
|
|
|
|
void Jit_TcU8Prescale();
|
|
void Jit_TcU16Prescale();
|
|
void Jit_TcFloatPrescale();
|
|
|
|
void Jit_TcU16Double();
|
|
void Jit_TcU16ThroughDouble();
|
|
|
|
void Jit_TcU16Through();
|
|
void Jit_TcFloatThrough();
|
|
|
|
void Jit_Color8888();
|
|
void Jit_Color4444();
|
|
void Jit_Color565();
|
|
void Jit_Color5551();
|
|
|
|
void Jit_NormalS8();
|
|
void Jit_NormalS16();
|
|
void Jit_NormalFloat();
|
|
|
|
void Jit_NormalS8Skin();
|
|
void Jit_NormalS16Skin();
|
|
void Jit_NormalFloatSkin();
|
|
|
|
void Jit_PosS8();
|
|
void Jit_PosS16();
|
|
void Jit_PosFloat();
|
|
void Jit_PosS8Through();
|
|
void Jit_PosS16Through();
|
|
|
|
void Jit_PosS8Skin();
|
|
void Jit_PosS16Skin();
|
|
void Jit_PosFloatSkin();
|
|
|
|
void Jit_NormalS8Morph();
|
|
void Jit_NormalS16Morph();
|
|
void Jit_NormalFloatMorph();
|
|
|
|
void Jit_PosS8Morph();
|
|
void Jit_PosS16Morph();
|
|
void Jit_PosFloatMorph();
|
|
|
|
void Jit_Color8888Morph();
|
|
void Jit_Color4444Morph();
|
|
void Jit_Color565Morph();
|
|
void Jit_Color5551Morph();
|
|
|
|
private:
|
|
bool CompileStep(const VertexDecoder &dec, int i);
|
|
void Jit_ApplyWeights();
|
|
void Jit_WriteMatrixMul(int outOff, bool pos);
|
|
void Jit_WriteMorphColor(int outOff, bool checkAlpha = true);
|
|
void Jit_AnyS8ToFloat(int srcoff);
|
|
void Jit_AnyS16ToFloat(int srcoff);
|
|
void Jit_AnyS8Morph(int srcoff, int dstoff);
|
|
void Jit_AnyS16Morph(int srcoff, int dstoff);
|
|
void Jit_AnyFloatMorph(int srcoff, int dstoff);
|
|
|
|
const VertexDecoder *dec_;
|
|
};
|